[claude] Load fine-tuned Timmy model into Hermes harness (#1104) (#1122)
Some checks failed
Tests / lint (push) Has been cancelled
Tests / test (push) Has been cancelled

This commit was merged in pull request #1122.
This commit is contained in:
2026-03-23 18:21:32 +00:00
parent e8b3d59041
commit a29e615f76
4 changed files with 1108 additions and 0 deletions

View File

@@ -63,6 +63,15 @@ providers:
capabilities: [text, tools, json, streaming, reasoning]
description: "NousResearch Hermes 4 14B — AutoLoRA base (Q5_K_M, ~11 GB)"
# AutoLoRA fine-tuned: Timmy — Hermes 4 14B + Timmy LoRA adapter (Project Bannerlord #1104)
# Build via: ./scripts/fuse_and_load.sh (fuses adapter, converts to GGUF, imports)
# Then switch harness: hermes model timmy
# Validate: python scripts/test_timmy_skills.py
- name: timmy
context_window: 32768
capabilities: [text, tools, json, streaming, reasoning]
description: "Timmy — Hermes 4 14B fine-tuned on Timmy skill set (LoRA-fused, Q5_K_M, ~11 GB)"
# AutoLoRA stretch goal: Hermes 4.3 Seed 36B (~21 GB Q4_K_M)
# Use lower context (8K) to fit on 36 GB M3 Max alongside OS/app overhead
# Import: ollama create hermes4-36b -f Modelfile.hermes4-36b (TBD)
@@ -156,6 +165,7 @@ fallback_chains:
# Tool-calling models (for function calling)
tools:
- timmy # Fine-tuned Timmy (Hermes 4 14B + LoRA) — primary agent model
- hermes4-14b # Native tool calling + structured JSON (AutoLoRA base)
- llama3.1:8b-instruct # Reliable tool use
- qwen2.5:7b # Reliable tools