feat(model): /model command overhaul — Phases 2, 3, 5

* feat(model): persist base_url on /model switch, auto-detect for bare /model custom

  Phase 2+3 of the /model command overhaul:

  Phase 2 — Persist base_url on model switch:
  - CLI: save model.base_url when switching to a non-OpenRouter endpoint; clear it when switching away from custom to prevent stale URLs leaking into the new provider's resolution
  - Gateway: same logic using direct YAML write

  Phase 3 — Better feedback and edge cases:
  - Bare '/model custom' now auto-detects the model from the endpoint using _auto_detect_local_model() and saves all three config values (model, provider, base_url) atomically
  - Shows endpoint URL in success messages when switching to/from custom providers (both CLI and gateway)
  - Clear error messages when no custom endpoint is configured
  - Updated test assertions for the additional save_config_value call

  Fixes #2562 (Phase 2+3)

* feat(model): support custom:name:model triple syntax for named custom providers

  Phase 5 of the /model command overhaul. Extends parse_model_input() to handle the triple syntax:

    /model custom:local-server:qwen → provider='custom:local-server', model='qwen'
    /model custom:my-model → provider='custom', model='my-model' (unchanged)

  The 'custom:local-server' provider string is already supported by _get_named_custom_provider() in runtime_provider.py, which matches it against the custom_providers list in config.yaml. This just wires the parsing so users can do it from the /model slash command.

  Added 4 tests covering single, triple, whitespace, and empty model cases.
2026-03-24 06:58:04 -07:00 · 2026-03-24 06:58:04 -07:00 · b641ee88f4
commit b641ee88f4
parent 2f1c4fb01f
5 changed files with 166 additions and 15 deletions
--- a/gateway/run.py
+++ b/gateway/run.py
@ -2851,6 +2851,56 @@ class GatewayRunner:
            lines.append("Switch provider: `/model provider-name` or `/model provider:model-name`")
            return "\n".join(lines)

+        # Handle bare "/model custom" — switch to custom provider
+        # and auto-detect the model from the endpoint.
+        if args.strip().lower() == "custom":
+            from hermes_cli.runtime_provider import (
+                resolve_runtime_provider as _rtp_custom,
+                _auto_detect_local_model,
+            )
+            try:
+                runtime = _rtp_custom(requested="custom")
+                cust_base = runtime.get("base_url", "")
+                if not cust_base or "openrouter.ai" in cust_base:
+                    return (
+                        "⚠️ No custom endpoint configured.\n"
+                        "Set `model.base_url` in config.yaml, or `OPENAI_BASE_URL` in .env,\n"
+                        "or run: `hermes setup` → Custom OpenAI-compatible endpoint"
+                    )
+                detected_model = _auto_detect_local_model(cust_base)
+                if detected_model:
+                    try:
+                        user_config = {}
+                        if config_path.exists():
+                            with open(config_path, encoding="utf-8") as f:
+                                user_config = yaml.safe_load(f) or {}
+                        if "model" not in user_config or not isinstance(user_config["model"], dict):
+                            user_config["model"] = {}
+                        user_config["model"]["default"] = detected_model
+                        user_config["model"]["provider"] = "custom"
+                        user_config["model"]["base_url"] = cust_base
+                        with open(config_path, 'w', encoding="utf-8") as f:
+                            yaml.dump(user_config, f, default_flow_style=False, sort_keys=False)
+                    except Exception as e:
+                        return f"⚠️ Failed to save model change: {e}"
+                    os.environ["HERMES_MODEL"] = detected_model
+                    os.environ["HERMES_INFERENCE_PROVIDER"] = "custom"
+                    self._effective_model = None
+                    self._effective_provider = None
+                    return (
+                        f"🤖 Model changed to `{detected_model}` (saved to config)\n"
+                        f"**Provider:** Custom\n"
+                        f"**Endpoint:** `{cust_base}`\n"
+                        f"_Model auto-detected from endpoint. Takes effect on next message._"
+                    )
+                else:
+                    return (
+                        f"⚠️ Custom endpoint at `{cust_base}` is reachable but no single model was auto-detected.\n"
+                        f"Specify the model explicitly: `/model custom:<model-name>`"
+                    )
+            except Exception as e:
+                return f"⚠️ Could not resolve custom endpoint: {e}"
+
        # Parse provider:model syntax
        target_provider, new_model = parse_model_input(args, current_provider)

@ -2925,6 +2975,13 @@ class GatewayRunner:
                user_config["model"]["default"] = new_model
                if provider_changed:
                    user_config["model"]["provider"] = target_provider
+                    # Persist base_url for custom endpoints so it survives
+                    # restart; clear it when switching away from custom to
+                    # prevent stale URLs leaking (#2562 Phase 2).
+                    if base_url and "openrouter.ai" not in (base_url or ""):
+                        user_config["model"]["base_url"] = base_url
+                    else:
+                        user_config["model"].pop("base_url", None)
                with open(config_path, 'w', encoding="utf-8") as f:
                    yaml.dump(user_config, f, default_flow_style=False, sort_keys=False)
            except Exception as e:
@ -2950,15 +3007,20 @@ class GatewayRunner:
        self._effective_model = None
        self._effective_provider = None

-        # Helpful hint when staying on a custom/local endpoint
+        # Show endpoint info for custom providers
+        _target_is_custom = target_provider == "custom" or (
+            base_url and "openrouter.ai" not in (base_url or "")
+            and ("localhost" in (base_url or "") or "127.0.0.1" in (base_url or ""))
+        )
        custom_hint = ""
-        if is_custom and not provider_changed:
-            endpoint = _resolved_base or "custom endpoint"
-            custom_hint = (
-                f"\n**Endpoint:** `{endpoint}`"
-                "\n_To switch providers, use_ `/model provider:model`"
-                "\n_e.g._ `/model openrouter:anthropic/claude-sonnet-4`"
-            )
+        if _target_is_custom or (is_custom and not provider_changed):
+            endpoint = base_url or _resolved_base or "custom endpoint"
+            custom_hint = f"\n**Endpoint:** `{endpoint}`"
+            if not provider_changed:
+                custom_hint += (
+                    "\n_To switch providers, use_ `/model provider:model`"
+                    "\n_e.g._ `/model openrouter:anthropic/claude-sonnet-4`"
+                )

        return f"🤖 Model changed to `{new_model}` ({persist_note}){provider_note}{warning}{custom_hint}\n_(takes effect on next message)_"