Merge pull request #740 from NousResearch/hermes/hermes-3cd7c62d

feat: simple fallback model for provider resilience (#737)
This commit is contained in:
Teknium 2026-03-08 21:16:58 -07:00 committed by GitHub
commit 315f3ea429
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
6 changed files with 442 additions and 0 deletions

View file

@@ -103,6 +103,27 @@ DEFAULT_CONFIG = {
},
},
# Fallback model — used when the primary model/provider fails after retries.
# When the primary hits rate limits (429), overload (529), or service errors (503),
# Hermes will automatically switch to this model for the remainder of the session.
# Set "fallback_model" to None, or omit the key entirely, to disable fallback.
#
# Supported providers (base_url is resolved automatically; the API key is read
# from the environment variable shown in parentheses):
# openrouter (OPENROUTER_API_KEY) — routes to any model
# zai (ZAI_API_KEY) — Z.AI / GLM
# kimi-coding (KIMI_API_KEY) — Kimi / Moonshot
# minimax (MINIMAX_API_KEY) — MiniMax
# minimax-cn (MINIMAX_CN_API_KEY) — MiniMax (China)
#
# For any other OpenAI-compatible endpoint, set the optional "base_url" and
# "api_key_env" overrides shown in the entry below.
"fallback_model": {
"provider": "", # provider name from the list above
"model": "", # model slug, e.g. "anthropic/claude-sonnet-4"
# Optional overrides (usually auto-resolved from provider):
# "base_url": "", # custom endpoint URL
# "api_key_env": "", # env var name for API key (e.g. "MY_CUSTOM_KEY")
},
"display": {
"compact": False,
"personality": "kawaii",