diff --git a/hermes_cli/main.py b/hermes_cli/main.py index 4bd110140..9ab040a7a 100644 --- a/hermes_cli/main.py +++ b/hermes_cli/main.py @@ -2126,9 +2126,8 @@ def _model_flow_kimi(config, current_model=""): # Step 3: Model selection — show appropriate models for the endpoint if is_coding_plan: - # Coding Plan models (kimi-for-coding first) + # Coding Plan models (kimi-k2.5 first — kimi-for-coding retired due to 403) model_list = [ - "kimi-for-coding", "kimi-k2.5", "kimi-k2-thinking", "kimi-k2-thinking-turbo", diff --git a/hermes_cli/models.py b/hermes_cli/models.py index 18a35711b..edec2b12b 100644 --- a/hermes_cli/models.py +++ b/hermes_cli/models.py @@ -130,7 +130,6 @@ _PROVIDER_MODELS: dict[str, list[str]] = { "glm-4.5-flash", ], "kimi-coding": [ - "kimi-for-coding", "kimi-k2.5", "kimi-k2-thinking", "kimi-k2-thinking-turbo", diff --git a/reports/ezra-quarterly-report-april-2026.md b/reports/ezra-quarterly-report-april-2026.md index 725c8950e..c5f7f299b 100644 --- a/reports/ezra-quarterly-report-april-2026.md +++ b/reports/ezra-quarterly-report-april-2026.md @@ -235,7 +235,7 @@ The Hermes Agent framework serves as both the delivery platform and the portfoli | House | Host | Model / Provider | Gateway Status | |-------|------|------------------|----------------| -| Ezra | Hermes VPS | `kimi-for-coding` (Kimi K2.5) | API `8658`, webhook `8648` — Active | +| Ezra | Hermes VPS | `kimi-k2.5` (Kimi K2.5) | API `8658`, webhook `8648` — Active | | Bezalel | Hermes VPS | Claude Opus 4.6 (Anthropic) | Port `8645` — Active | | Allegro-Primus | Hermes VPS | Kimi K2.5 | Port `8644` — Requires restart | | Bilbo | External | Gemma 4B (local) | Telegram dual-mode — Active | diff --git a/tests/test_api_key_providers.py b/tests/test_api_key_providers.py index ee86507a1..be38ffe81 100644 --- a/tests/test_api_key_providers.py +++ b/tests/test_api_key_providers.py @@ -895,7 +895,7 @@ class TestKimiMoonshotModelListIsolation: def test_moonshot_list_excludes_coding_plan_only_models(self): from hermes_cli.main import _PROVIDER_MODELS moonshot_models = _PROVIDER_MODELS["moonshot"] - coding_plan_only = {"kimi-for-coding", "kimi-k2-thinking-turbo"} + coding_plan_only = {"kimi-k2-thinking-turbo"} leaked = set(moonshot_models) & coding_plan_only assert not leaked, f"Moonshot list contains Coding Plan-only models: {leaked}" @@ -908,7 +908,7 @@ class TestKimiMoonshotModelListIsolation: def test_coding_plan_list_contains_plan_specific_models(self): from hermes_cli.main import _PROVIDER_MODELS coding_models = _PROVIDER_MODELS["kimi-coding"] - assert "kimi-for-coding" in coding_models + assert "kimi-k2.5" in coding_models assert "kimi-k2-thinking-turbo" in coding_models diff --git a/website/docs/integrations/providers.md b/website/docs/integrations/providers.md index ca6a0c511..6d609b4c8 100644 --- a/website/docs/integrations/providers.md +++ b/website/docs/integrations/providers.md @@ -142,7 +142,7 @@ hermes chat --provider zai --model glm-5 # Requires: GLM_API_KEY in ~/.hermes/.env # Kimi / Moonshot AI -hermes chat --provider kimi-coding --model kimi-for-coding +hermes chat --provider kimi-coding --model kimi-k2.5 # Requires: KIMI_API_KEY in ~/.hermes/.env # MiniMax (global endpoint)