# hermes-agent/config/fallback-config.yaml

# Hermes Agent Fallback Configuration
# Deploy this to Timmy and Ezra for automatic kimi-coding fallback

# Primary model; the fallback chain configured in this file starts from it.
# Quoted so the dotted version suffix always stays part of a single string.
model: 'anthropic/claude-opus-4.6'

# Fallback chain: Anthropic (primary model) -> Kimi -> Ollama (local).
# The entries below are listed in the same order as the chain.
# NOTE(review): timeout units are not stated — presumably seconds; confirm.
fallback_providers:
  # First fallback: hosted Kimi model.
  - provider: kimi-coding
    model: 'kimi-k2.5'
    timeout: 60
    reason: 'Primary fallback when Anthropic quota limited'

  # Second fallback: Ollama server at the base_url given here.
  - provider: ollama
    model: 'qwen2.5:7b'
    base_url: 'http://localhost:11434'
    timeout: 120
    reason: 'Local fallback for offline operation'

# Provider settings: per-provider options, keyed by provider name.
# NOTE(review): timeout units are not stated — presumably seconds; confirm.
# NOTE(review): the kimi-coding and ollama timeouts repeat the values given in
# fallback_providers; confirm which of the two places actually takes effect.
providers:
  anthropic:
    # NOTE(review): `timeout` is one of agent.fallback_on_errors, so exceeding
    # this limit presumably causes a provider switch — confirm 30 is long
    # enough for the primary model's responses.
    timeout: 30
    # NOTE(review): quota_exceeded is also in agent.fallback_on_errors; confirm
    # whether these retries are exhausted before the fallback chain is used.
    retry_on_quota: true
    max_retries: 2

  kimi-coding:
    timeout: 60
    max_retries: 3

  ollama:
    timeout: 120
    # NOTE(review): Ollama's own API takes keep_alive as a duration/number,
    # not a boolean — confirm the agent accepts or translates `true` here.
    keep_alive: true

# Toolsets: names of the toolsets listed for this agent.
# NOTE(review): presumably these are the toolsets enabled at startup; verify
# the accepted names against the consuming loader.
toolsets:
  - hermes-cli
  - github
  - web

# Agent settings
agent:
  # Turn limit, going by the key name; its exact scope (per task, per session)
  # is not shown in this file.
  max_turns: 90
  # NOTE(review): `auto` is passed through as a plain string; the set of
  # accepted values is defined by the consumer, not here.
  tool_use_enforcement: auto
  # Error kinds that presumably trigger a move to the next provider in
  # fallback_providers — confirm the exact names against the consumer.
  fallback_on_errors:
    - rate_limit_exceeded
    - quota_exceeded
    - timeout
    - service_unavailable

# Display settings: both notification flags are switched on.
# NOTE(review): presumably these control user-visible messages when a fallback
# happens and when the active provider changes; confirm against the consumer.
display:
  show_fallback_notifications: true
  show_provider_switches: true