Extends the single fallback_model mechanism into an ordered chain.
When the primary model fails, Hermes tries each fallback provider in
sequence until one succeeds or the chain is exhausted.
Config format (new):
fallback_providers:
- provider: openrouter
model: anthropic/claude-sonnet-4
- provider: openai
model: gpt-4o
Legacy single-dict fallback_model format still works unchanged.
Key fix vs original PR: the call sites in the retry loop now use
_fallback_index < len(_fallback_chain) instead of the old one-shot
_fallback_activated guard, so the chain actually advances through
all configured providers.
Changes:
- run_agent.py: _fallback_chain list + _fallback_index replaces
one-shot _fallback_model; _try_activate_fallback() advances
through chain; failed provider resolution skips to next entry;
call sites updated to allow chain advancement
- cli.py: reads fallback_providers with legacy fallback_model compat
- gateway/run.py: same
- hermes_cli/config.py: fallback_providers: [] in DEFAULT_CONFIG
- tests: 12 new chain tests + 6 existing test fixtures updated
Co-authored-by: uzaylisak <uzaylisak@users.noreply.github.com>
This commit is contained in:
@@ -25,6 +25,8 @@ def _make_agent_with_compressor() -> AIAgent:
|
||||
"provider": "openai",
|
||||
"model": "gpt-4o",
|
||||
}
|
||||
agent._fallback_chain = [agent._fallback_model]
|
||||
agent._fallback_index = 0
|
||||
|
||||
# Context compressor with primary model values
|
||||
compressor = ContextCompressor(
|
||||
|
||||
156
tests/test_provider_fallback.py
Normal file
156
tests/test_provider_fallback.py
Normal file
@@ -0,0 +1,156 @@
|
||||
"""Tests for ordered provider fallback chain (salvage of PR #1761).
|
||||
|
||||
Extends the single-fallback tests in test_fallback_model.py to cover
|
||||
the new list-based ``fallback_providers`` config format and chain
|
||||
advancement through multiple providers.
|
||||
"""
|
||||
|
||||
from unittest.mock import MagicMock, patch
|
||||
|
||||
from run_agent import AIAgent
|
||||
|
||||
|
||||
def _make_agent(fallback_model=None):
|
||||
"""Create a minimal AIAgent with optional fallback config."""
|
||||
with (
|
||||
patch("run_agent.get_tool_definitions", return_value=[]),
|
||||
patch("run_agent.check_toolset_requirements", return_value={}),
|
||||
patch("run_agent.OpenAI"),
|
||||
):
|
||||
agent = AIAgent(
|
||||
api_key="test-key",
|
||||
quiet_mode=True,
|
||||
skip_context_files=True,
|
||||
skip_memory=True,
|
||||
fallback_model=fallback_model,
|
||||
)
|
||||
agent.client = MagicMock()
|
||||
return agent
|
||||
|
||||
|
||||
def _mock_client(base_url="https://openrouter.ai/api/v1", api_key="fb-key"):
|
||||
mock = MagicMock()
|
||||
mock.base_url = base_url
|
||||
mock.api_key = api_key
|
||||
return mock
|
||||
|
||||
|
||||
# ── Chain initialisation ──────────────────────────────────────────────────
|
||||
|
||||
|
||||
class TestFallbackChainInit:
|
||||
def test_no_fallback(self):
|
||||
agent = _make_agent(fallback_model=None)
|
||||
assert agent._fallback_chain == []
|
||||
assert agent._fallback_index == 0
|
||||
assert agent._fallback_model is None
|
||||
|
||||
def test_single_dict_backwards_compat(self):
|
||||
fb = {"provider": "openai", "model": "gpt-4o"}
|
||||
agent = _make_agent(fallback_model=fb)
|
||||
assert agent._fallback_chain == [fb]
|
||||
assert agent._fallback_model == fb
|
||||
|
||||
def test_list_of_providers(self):
|
||||
fbs = [
|
||||
{"provider": "openai", "model": "gpt-4o"},
|
||||
{"provider": "zai", "model": "glm-4.7"},
|
||||
]
|
||||
agent = _make_agent(fallback_model=fbs)
|
||||
assert len(agent._fallback_chain) == 2
|
||||
assert agent._fallback_model == fbs[0]
|
||||
|
||||
def test_invalid_entries_filtered(self):
|
||||
fbs = [
|
||||
{"provider": "openai", "model": "gpt-4o"},
|
||||
{"provider": "", "model": "glm-4.7"},
|
||||
{"provider": "zai"},
|
||||
"not-a-dict",
|
||||
]
|
||||
agent = _make_agent(fallback_model=fbs)
|
||||
assert len(agent._fallback_chain) == 1
|
||||
assert agent._fallback_chain[0]["provider"] == "openai"
|
||||
|
||||
def test_empty_list(self):
|
||||
agent = _make_agent(fallback_model=[])
|
||||
assert agent._fallback_chain == []
|
||||
assert agent._fallback_model is None
|
||||
|
||||
def test_invalid_dict_no_provider(self):
|
||||
agent = _make_agent(fallback_model={"model": "gpt-4o"})
|
||||
assert agent._fallback_chain == []
|
||||
|
||||
|
||||
# ── Chain advancement ─────────────────────────────────────────────────────
|
||||
|
||||
|
||||
class TestFallbackChainAdvancement:
|
||||
def test_exhausted_returns_false(self):
|
||||
agent = _make_agent(fallback_model=None)
|
||||
assert agent._try_activate_fallback() is False
|
||||
|
||||
def test_advances_index(self):
|
||||
fbs = [
|
||||
{"provider": "openai", "model": "gpt-4o"},
|
||||
{"provider": "zai", "model": "glm-4.7"},
|
||||
]
|
||||
agent = _make_agent(fallback_model=fbs)
|
||||
with patch("agent.auxiliary_client.resolve_provider_client",
|
||||
return_value=(_mock_client(), "gpt-4o")):
|
||||
assert agent._try_activate_fallback() is True
|
||||
assert agent._fallback_index == 1
|
||||
assert agent.model == "gpt-4o"
|
||||
assert agent._fallback_activated is True
|
||||
|
||||
def test_second_fallback_works(self):
|
||||
fbs = [
|
||||
{"provider": "openai", "model": "gpt-4o"},
|
||||
{"provider": "zai", "model": "glm-4.7"},
|
||||
]
|
||||
agent = _make_agent(fallback_model=fbs)
|
||||
with patch("agent.auxiliary_client.resolve_provider_client",
|
||||
return_value=(_mock_client(), "resolved")):
|
||||
assert agent._try_activate_fallback() is True
|
||||
assert agent.model == "gpt-4o"
|
||||
assert agent._try_activate_fallback() is True
|
||||
assert agent.model == "glm-4.7"
|
||||
assert agent._fallback_index == 2
|
||||
|
||||
def test_all_exhausted_returns_false(self):
|
||||
fbs = [{"provider": "openai", "model": "gpt-4o"}]
|
||||
agent = _make_agent(fallback_model=fbs)
|
||||
with patch("agent.auxiliary_client.resolve_provider_client",
|
||||
return_value=(_mock_client(), "gpt-4o")):
|
||||
assert agent._try_activate_fallback() is True
|
||||
assert agent._try_activate_fallback() is False
|
||||
|
||||
def test_skips_unconfigured_provider_to_next(self):
|
||||
"""If resolve_provider_client returns None, skip to next in chain."""
|
||||
fbs = [
|
||||
{"provider": "broken", "model": "nope"},
|
||||
{"provider": "openai", "model": "gpt-4o"},
|
||||
]
|
||||
agent = _make_agent(fallback_model=fbs)
|
||||
with patch("agent.auxiliary_client.resolve_provider_client") as mock_rpc:
|
||||
mock_rpc.side_effect = [
|
||||
(None, None), # broken provider
|
||||
(_mock_client(), "gpt-4o"), # fallback succeeds
|
||||
]
|
||||
assert agent._try_activate_fallback() is True
|
||||
assert agent.model == "gpt-4o"
|
||||
assert agent._fallback_index == 2
|
||||
|
||||
def test_skips_provider_that_raises_to_next(self):
|
||||
"""If resolve_provider_client raises, skip to next in chain."""
|
||||
fbs = [
|
||||
{"provider": "broken", "model": "nope"},
|
||||
{"provider": "openai", "model": "gpt-4o"},
|
||||
]
|
||||
agent = _make_agent(fallback_model=fbs)
|
||||
with patch("agent.auxiliary_client.resolve_provider_client") as mock_rpc:
|
||||
mock_rpc.side_effect = [
|
||||
RuntimeError("auth failed"),
|
||||
(_mock_client(), "gpt-4o"),
|
||||
]
|
||||
assert agent._try_activate_fallback() is True
|
||||
assert agent.model == "gpt-4o"
|
||||
@@ -2507,6 +2507,8 @@ class TestFallbackAnthropicProvider:
|
||||
def test_fallback_to_anthropic_sets_api_mode(self, agent):
|
||||
agent._fallback_activated = False
|
||||
agent._fallback_model = {"provider": "anthropic", "model": "claude-sonnet-4-20250514"}
|
||||
agent._fallback_chain = [agent._fallback_model]
|
||||
agent._fallback_index = 0
|
||||
|
||||
mock_client = MagicMock()
|
||||
mock_client.base_url = "https://api.anthropic.com/v1"
|
||||
@@ -2528,6 +2530,8 @@ class TestFallbackAnthropicProvider:
|
||||
def test_fallback_to_anthropic_enables_prompt_caching(self, agent):
|
||||
agent._fallback_activated = False
|
||||
agent._fallback_model = {"provider": "anthropic", "model": "claude-sonnet-4-20250514"}
|
||||
agent._fallback_chain = [agent._fallback_model]
|
||||
agent._fallback_index = 0
|
||||
|
||||
mock_client = MagicMock()
|
||||
mock_client.base_url = "https://api.anthropic.com/v1"
|
||||
@@ -2545,6 +2549,8 @@ class TestFallbackAnthropicProvider:
|
||||
def test_fallback_to_openrouter_uses_openai_client(self, agent):
|
||||
agent._fallback_activated = False
|
||||
agent._fallback_model = {"provider": "openrouter", "model": "anthropic/claude-sonnet-4"}
|
||||
agent._fallback_chain = [agent._fallback_model]
|
||||
agent._fallback_index = 0
|
||||
|
||||
mock_client = MagicMock()
|
||||
mock_client.base_url = "https://openrouter.ai/api/v1"
|
||||
@@ -3238,6 +3244,8 @@ class TestFallbackSetsOAuthFlag:
|
||||
def test_fallback_to_anthropic_oauth_sets_flag(self, agent):
|
||||
agent._fallback_activated = False
|
||||
agent._fallback_model = {"provider": "anthropic", "model": "claude-sonnet-4-6"}
|
||||
agent._fallback_chain = [agent._fallback_model]
|
||||
agent._fallback_index = 0
|
||||
|
||||
mock_client = MagicMock()
|
||||
mock_client.base_url = "https://api.anthropic.com/v1"
|
||||
@@ -3259,6 +3267,8 @@ class TestFallbackSetsOAuthFlag:
|
||||
def test_fallback_to_anthropic_api_key_clears_flag(self, agent):
|
||||
agent._fallback_activated = False
|
||||
agent._fallback_model = {"provider": "anthropic", "model": "claude-sonnet-4-6"}
|
||||
agent._fallback_chain = [agent._fallback_model]
|
||||
agent._fallback_index = 0
|
||||
|
||||
mock_client = MagicMock()
|
||||
mock_client.base_url = "https://api.anthropic.com/v1"
|
||||
|
||||
Reference in New Issue
Block a user