diff --git a/cortex/routers/local_llm.py b/cortex/routers/local_llm.py index 3d853e0..bf25807 100644 --- a/cortex/routers/local_llm.py +++ b/cortex/routers/local_llm.py @@ -211,6 +211,11 @@ def _render(username: str, success: str = "", error: str = "") -> str: cur_tools = m.get("tools", True) cur_tags = ", ".join(m.get("tags") or []) cur_reasoning_budget = m.get("reasoning_budget_tokens") or 0 + _rb_levels = [(0, "Off — Non-think"), (1024, "Light"), (4096, "Moderate"), (8192, "High"), (32768, "Max")] + reasoning_opts = "".join( + f'' + for v, lbl in _rb_levels + ) model_rows += f'''
@@ -258,9 +263,11 @@ def _render(username: str, success: str = "", error: str = "") -> str: title="Per-model tool loop cap. 0 = use the global default (orchestrator_max_rounds).">
- - + +
diff --git a/cortex/static/local_llm.html b/cortex/static/local_llm.html index f553d70..bc64fd6 100644 --- a/cortex/static/local_llm.html +++ b/cortex/static/local_llm.html @@ -503,6 +503,17 @@
+
+ + +