# Environment settings: one KEY=VALUE assignment per line, no spaces around "=".
# Comments are full-line only (a trailing "# ..." may be read as part of the value).

# Auth is handled by the claude CLI (claude setup-token) — no API key needed here.
# Uncomment only if switching to the SDK:
# ANTHROPIC_API_KEY=only_needed_if_switching_to_sdk

# Path to the inara/ identity directory — relative to cortex/ or absolute.
INARA_DIR=../inara

# Path for persistent JSON session files.
SESSIONS_DIR=./data/sessions

# LLM defaults.
DEFAULT_MODEL=claude-sonnet-4-6
DEFAULT_TIER=2

# Session rolling window — number of messages to keep (user + assistant pairs).
# 40 messages = 20 turns.
MAX_HISTORY_MESSAGES=40

# Per-backend timeouts (seconds).
# Gemini's limit is generous — it frequently takes 30-60s under load.
# Local models may need time to load into VRAM before the first response.
TIMEOUT_CLAUDE=60
TIMEOUT_GEMINI=120
TIMEOUT_LOCAL=300

# Google Chat — must respond within 30s or Chat shows an error to the user.
# Value is in seconds.
GOOGLE_CHAT_TIMEOUT=25

# Backend pinned for Google Chat (claude recommended — more reliable within 25s).
GOOGLE_CHAT_BACKEND=claude

# TODO: add GOOGLE_CHAT_TOKEN for request verification once the endpoint is public.

# Server
PORT=8000
HOST=0.0.0.0