All checks were successful
Forge CI / smoke-and-build (pull_request) Successful in 36s
- model_metadata.py
- fallback-config.yaml
- hermes_cli/auth.py, main.py, models.py
- test_api_key_providers.py
- docs/integrations/providers.md
- ezra quarterly report
54 lines
1.0 KiB
YAML
54 lines
1.0 KiB
YAML
# Hermes Agent Fallback Configuration
# Deploy this to Timmy and Ezra for automatic kimi-coding fallback

# Model to use first, written as <provider>/<model>.
model: anthropic/claude-opus-4.6

# Fallback chain: Anthropic -> Kimi -> Ollama (local)
# Entries are listed in the same order as the chain above.
# NOTE(review): timeout units are not stated in this file (presumably
# seconds) — confirm against the consumer.
fallback_providers:
  - provider: kimi-coding
    model: kimi-k2.5
    timeout: 60
    reason: "Primary fallback when Anthropic quota limited"

  - provider: ollama
    model: qwen2.5:7b
    # Ollama is addressed on the local machine.
    base_url: http://localhost:11434
    timeout: 120
    reason: "Local fallback for offline operation"

# Provider settings
# One mapping per provider name.
# NOTE(review): timeout units are not stated in this file (presumably
# seconds) — confirm against the consumer.
providers:
  anthropic:
    timeout: 30
    retry_on_quota: true
    max_retries: 2

  kimi-coding:
    timeout: 60
    max_retries: 3

  ollama:
    timeout: 120
    keep_alive: true

# Toolsets
# Names of the toolsets to enable, one per list item.
toolsets:
  - hermes-cli
  - github
  - web

# Agent settings
agent:
  max_turns: 90
  tool_use_enforcement: auto
  # Error identifiers listed for fallback handling.
  # NOTE(review): this key is placed under `agent` because no blank line or
  # section comment separates it from the agent settings; confirm the nesting
  # against the consumer's schema.
  fallback_on_errors:
    - rate_limit_exceeded
    - quota_exceeded
    - timeout
    - service_unavailable

# Display settings
# Both notification flags are enabled.
display:
  show_fallback_notifications: true
  show_provider_switches: true