feat: audit log, usage tracking UI, OpenAI orchestrator compaction, onboarding + docs

Tool audit log:
- Every orchestrator tool call logged to home/{user}/tool_audit/YYYY-MM-DD.jsonl
- Files panel sidebar: audit log group (collapsed), date-linked read-only table
- Admin endpoints: /api/audit/files, /api/audit/day, /api/audit/recent, /api/audit/stats
- Engine and model name recorded per entry

OpenAI orchestrator improvements:
- Context budget enforcement: 75% of model context_k (min 16k)
- Message compaction: truncates old tool results when approaching budget
- max_rounds respected per model config (intersected with server cap)

OpenRouter onboarding (setup.html, onboarding.py, app.js, settings.html):
- Step 3 of 3: /setup/model with curated model picker
- Chat banner for users on server-default model (informational, not alarmist)
- Settings quick-link card; /setup/model works standalone for existing users

Model registry + session store:
- set_role_config / get_role_config for per-role tool lists and system_append
- session_store: session rename, session name backfill endpoint

UI updates (app.js, index.html, style.css, local_llm.html):
- Role toggle in context panel
- Off-the-record mode
- Agent notes read-only viewer
- OPERATIONS.md loaded at T2+ in context

Documentation:
- HELP.md: full tool table, per-role tool sets, Agent Notes, usage tracking
- TOOLS.md: Agent Notes section, count corrected to 44
- ARCH__SYSTEM.md, ARCH__BACKENDS.md, MASTER.md updated to match reality
- CLAUDE.md: onboarding flow, documentation philosophy sections
- README.md: stack in practice, DeepSeek TUI mention, architecture diagram updated
- TODO__Agents.md: onboarding task completed with deviation notes

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-05-08 21:26:43 -04:00
parent c02d2462b0
commit f8f7cd75da
25 changed files with 1088 additions and 151 deletions
--- a/cortex/routers/local_llm.py
+++ b/cortex/routers/local_llm.py
@@ -159,7 +159,8 @@ def _render(username: str, success: str = "", error: str = "") -> str:
        else:
            secondary = default_secondary

-        ctx      = f'<span class="ctx-badge">{m.get("context_k",0)}k</span>' if m.get("context_k") else ""
+        ctx       = f'<span class="ctx-badge">{m.get("context_k",0)}k</span>' if m.get("context_k") else ""
+        no_tools  = '' if m.get("tools", True) else '<span class="pbadge pb-notools">no tools</span>'
        tags_html = " ".join(f'<span class="tag">{t}</span>' for t in (m.get("tags") or []))
        sec      = f'<span class="model-host">{secondary}</span>' if secondary else ""

@@ -201,13 +202,15 @@ def _render(username: str, success: str = "", error: str = "") -> str:
        cur_label      = m.get("label", "")
        cur_model_name = m.get("model_name", "")
        cur_ctx        = m.get("context_k", 0) or 0
+        cur_max_rounds = m.get("max_rounds") or 0
+        cur_tools      = m.get("tools", True)
        cur_tags       = ", ".join(m.get("tags") or [])

        model_rows += f'''
        <div class="model-row" id="model-{m["id"]}">
          <div class="model-row-header">
            <div class="model-info">
-              <div>{badge}<span class="model-label">{m.get("label") or m.get("model_name","")}</span>{ctx}</div>
+              <div>{badge}<span class="model-label">{m.get("label") or m.get("model_name","")}</span>{ctx}{no_tools}</div>
              <span class="model-name">{m.get("model_name","")}</span>
              {sec}
              <div class="tag-row">{tags_html}</div>
@@ -239,8 +242,22 @@ def _render(username: str, success: str = "", error: str = "") -> str:
            {extra_fields}
            <div class="field-row">
              <div class="field" style="flex:0 0 auto">
-                <label>Context (k)</label>
-                <input type="number" name="context_k" value="{cur_ctx}" min="0">
+                <label title="Context window size in thousands of tokens. 0 = assume 32k.">Context (k)</label>
+                <input type="number" name="context_k" value="{cur_ctx}" min="0"
+                       title="Context window size in thousands of tokens. 0 = assume 32k (compaction budget ~24k tokens).">
+              </div>
+              <div class="field" style="flex:0 0 auto">
+                <label title="Per-model tool loop cap. 0 = use the global default (orchestrator_max_rounds).">Max rounds</label>
+                <input type="number" name="max_rounds" value="{cur_max_rounds}" min="0"
+                       title="Per-model tool loop cap. 0 = use the global default (orchestrator_max_rounds).">
+              </div>
+              <div class="field" style="flex:0 0 auto">
+                <label title="Whether this model supports tool calling. If not supported, requests skip the tool loop entirely.">Tool calling</label>
+                <select name="tools"
+                        title="Whether this model supports tool calling. If not supported, requests skip the tool loop entirely.">
+                  <option value="1" {'selected' if cur_tools else ''}>Supported</option>
+                  <option value="0" {'' if cur_tools else 'selected'}>Not supported</option>
+                </select>
              </div>
              <div class="field">
                <label>Tags</label>
@@ -426,6 +443,8 @@ async def add_model(
    provider:         str = Form("local"),
    label:            str = Form(""),
    context_k:        int = Form(0),
+    max_rounds:       int = Form(0),
+    tools:            int = Form(1),
    tags:             str = Form(""),
    # local-only fields
    host_id:          str = Form(""),
@@ -439,14 +458,17 @@ async def add_model(
    if not username:
        return RedirectResponse("/login", status_code=302)

-    tag_list = [t.strip() for t in tags.split(",") if t.strip()]
+    tag_list   = [t.strip() for t in tags.split(",") if t.strip()]
+    max_rounds_ = max_rounds or None
+    tools_bool  = tools != 0

    if provider == "local":
        if not model_name.strip():
            return HTMLResponse(_render(username, error="Model name is required."))
        if not host_id.strip():
            return HTMLResponse(_render(username, error="Select a host."))
-        reg.save_model(username, None, host_id, label, model_name, context_k, tag_list)
+        reg.save_model(username, None, host_id, label, model_name, context_k, tag_list,
+                       max_rounds=max_rounds_, tools=tools_bool)
        display = label or model_name

    elif provider in ("google", "anthropic"):
@@ -459,6 +481,7 @@ async def add_model(
            account_id=account_id or None,
            credential_id=credential_id or None,
            context_k=context_k, tags=tag_list,
+            max_rounds=max_rounds_, tools=tools_bool,
        )
        display = label or cloud_model_name
    else:
@@ -476,6 +499,8 @@ async def edit_model(
    label:         str = Form(""),
    model_name:    str = Form(""),
    context_k:     int = Form(0),
+    max_rounds:    int = Form(0),
+    tools:         int = Form(1),
    tags:          str = Form(""),
    host_id:       str = Form(""),
    account_id:    str = Form(""),
@@ -486,17 +511,22 @@ async def edit_model(
        return RedirectResponse("/login", status_code=302)
    if not model_name.strip():
        return HTMLResponse(_render(username, error="Model name is required."))
-    tag_list = [t.strip() for t in tags.split(",") if t.strip()]
+    tag_list    = [t.strip() for t in tags.split(",") if t.strip()]
+    max_rounds_ = max_rounds or None
+    tools_bool  = tools != 0
    if mtype == "local_openai":
        if not host_id.strip():
            return HTMLResponse(_render(username, error="Select a host for this model."))
-        reg.save_model(username, model_id, host_id, label, model_name, context_k, tag_list)
+        reg.save_model(username, model_id, host_id, label, model_name, context_k, tag_list,
+                       max_rounds=max_rounds_, tools=tools_bool)
    elif mtype == "gemini_api":
        reg.save_cloud_model(username, model_id, "google", model_name, label,
-                             account_id=account_id or None, context_k=context_k, tags=tag_list)
+                             account_id=account_id or None, context_k=context_k, tags=tag_list,
+                             max_rounds=max_rounds_, tools=tools_bool)
    elif mtype == "claude_cli":
        reg.save_cloud_model(username, model_id, "anthropic", model_name, label,
-                             credential_id=credential_id or "cli", context_k=context_k, tags=tag_list)
+                             credential_id=credential_id or "cli", context_k=context_k, tags=tag_list,
+                             max_rounds=max_rounds_, tools=tools_bool)
    else:
        return HTMLResponse(_render(username, error=f"Unknown model type: {mtype}"))
    display = label.strip() or model_name.strip()