[claude] Load fine-tuned Timmy model into Hermes harness (#1104) (#1122)

2026-03-23 18:21:32 +00:00
parent e8b3d59041
commit a29e615f76
4 changed files with 1108 additions and 0 deletions
--- a/config/providers.yaml
+++ b/config/providers.yaml
@@ -63,6 +63,15 @@ providers:
        capabilities: [text, tools, json, streaming, reasoning]
        description: "NousResearch Hermes 4 14B — AutoLoRA base (Q5_K_M, ~11 GB)"

+      # AutoLoRA fine-tuned: Timmy — Hermes 4 14B + Timmy LoRA adapter (Project Bannerlord #1104)
+      # Build via: ./scripts/fuse_and_load.sh (fuses the adapter, converts to GGUF, imports the model)
+      # Then switch the harness to it: hermes model timmy
+      # Validate: python scripts/test_timmy_skills.py
+      - name: timmy
+        context_window: 32768
+        capabilities: [text, tools, json, streaming, reasoning]
+        description: "Timmy — Hermes 4 14B fine-tuned on Timmy skill set (LoRA-fused, Q5_K_M, ~11 GB)"
+
      # AutoLoRA stretch goal: Hermes 4.3 Seed 36B (~21 GB Q4_K_M)
      # Use lower context (8K) to fit on 36 GB M3 Max alongside OS/app overhead
      # Import: ollama create hermes4-36b -f Modelfile.hermes4-36b (TBD)
@@ -156,6 +165,7 @@ fallback_chains:
  
  # Tool-calling models (for function calling)
  tools:
+    - timmy                # Fine-tuned Timmy (Hermes 4 14B + LoRA) — primary agent model
    - hermes4-14b          # Native tool calling + structured JSON (AutoLoRA base)
    - llama3.1:8b-instruct # Reliable tool use
    - qwen2.5:7b           # Reliable tools