Compare commits

..

1 Commits

Author SHA1 Message Date
8400381a0d fix: persist token counts from gateway to SessionEntry and SQLite (#316)
Some checks failed
Forge CI / smoke-and-build (pull_request) Failing after 21s
The gateway's _run_agent returns input_tokens/output_tokens in its
result dict, but these were never stored to SessionEntry or the SQLite
session DB. Every session showed zero token counts.

Changes:
- gateway/session.py: Extend update_session() to accept and persist
  input_tokens, output_tokens, total_tokens, estimated_cost_usd
- gateway/run.py: Pass agent result token totals to update_session()
  and call set_token_counts(absolute=True) on _session_db after
  every conversation turn
- tests/test_token_tracking_persistence.py: Regression tests for
  SessionEntry serialization and agent result token extraction

Closes #316
2026-04-13 17:38:55 -04:00
22 changed files with 205 additions and 2911 deletions

View File

@@ -1,11 +1,10 @@
"""Helpers for optional cheap-vs-strong and time-aware model routing."""
"""Helpers for optional cheap-vs-strong model routing."""
from __future__ import annotations
import os
import re
from datetime import datetime
from typing import Any, Dict, List, Optional
from typing import Any, Dict, Optional
from utils import is_truthy_value
@@ -193,104 +192,3 @@ def resolve_turn_route(user_message: str, routing_config: Optional[Dict[str, Any
tuple(runtime.get("args") or ()),
),
}
# =========================================================================
# Time-aware cron model routing
# =========================================================================
#
# Empirical finding: cron error rate peaks at 18:00 (9.4%) vs 4.0% at 09:00.
# During high-error windows, route cron jobs to more capable models.
#
# Config (config.yaml):
# cron_model_routing:
# enabled: true
# fallback_model: "anthropic/claude-sonnet-4"
# fallback_provider: "openrouter"
# windows:
# - start_hour: 17
# end_hour: 22
# reason: "evening_error_peak"
# - start_hour: 2
# end_hour: 5
# reason: "overnight_api_instability"
# =========================================================================
def _hour_in_window(hour: int, start: int, end: int) -> bool:
"""Check if hour falls in [start, end) window, handling midnight wrap."""
if start <= end:
return start <= hour < end
else:
# Wraps midnight: e.g., 22-06
return hour >= start or hour < end
def resolve_cron_model(
    base_model: str,
    routing_config: Optional[Dict[str, Any]],
    now: Optional[datetime] = None,
) -> Dict[str, Any]:
    """Apply time-aware model override for cron jobs.

    During configured high-error windows, returns a stronger model config.
    Outside windows, returns the base model unchanged.

    Args:
        base_model: The model string already resolved (from job/config/env).
        routing_config: The cron_model_routing dict from config.yaml.
        now: Override current time (for testing). Defaults to datetime.now().

    Returns:
        Dict with keys: model, provider, overridden, reason.
        - model: the effective model string to use
        - provider: provider override (empty string = use default)
        - overridden: True if time-based override was applied
        - reason: why override was applied (empty string if not)
    """
    def _unchanged() -> Dict[str, Any]:
        # Shared "no override" result for every early-exit path.
        return {"model": base_model, "provider": "", "overridden": False, "reason": ""}

    cfg = routing_config or {}
    if not _coerce_bool(cfg.get("enabled"), False):
        return _unchanged()

    windows = cfg.get("windows") or []
    if not isinstance(windows, list) or not windows:
        return _unchanged()

    current_hour = (now or datetime.now()).hour

    # Scan windows in order; the first one containing the current hour wins.
    matched = None
    for candidate in windows:
        if not isinstance(candidate, dict):
            continue
        lo = _coerce_int(candidate.get("start_hour"), -1)
        hi = _coerce_int(candidate.get("end_hour"), -1)
        if lo >= 0 and hi >= 0 and _hour_in_window(current_hour, lo, hi):
            matched = candidate
            break
    if matched is None:
        return _unchanged()

    # Window matched — prefer the window's own override, then the global fallback.
    chosen_model = str(matched.get("model") or "").strip()
    if not chosen_model:
        chosen_model = str(cfg.get("fallback_model") or "").strip()
    chosen_provider = str(matched.get("provider") or "").strip()
    if not chosen_provider:
        chosen_provider = str(cfg.get("fallback_provider") or "").strip()
    if not chosen_model:
        return _unchanged()

    reason = str(matched.get("reason") or "time_window").strip()
    return {
        "model": chosen_model,
        "provider": chosen_provider,
        "overridden": True,
        "reason": f"cron_routing:{reason}(hour={current_hour})",
    }

192
cli.py
View File

@@ -3134,196 +3134,6 @@ class HermesCLI:
print(f" Home: {display}")
print()
def _handle_debug_command(self, command: str):
    """Generate a debug report with system info and logs, upload to paste service.

    The report bundles platform details, Hermes runtime state, a redacted
    config dump, recent log tails, and the enabled toolsets. It is offered
    to paste services in order (dpaste, then 0x0.st); when both fail it is
    saved under the Hermes home directory, and as a last resort printed
    directly to the terminal.

    Args:
        command: Raw command text. An optional trailing integer selects how
            many log lines per file to include (default 50, capped at 500).
    """
    import platform
    import sys
    import time as _time
    # Parse optional lines argument (e.g. "debug 200"); non-numeric input
    # silently keeps the default of 50.
    parts = command.split(maxsplit=1)
    log_lines = 50
    if len(parts) > 1:
        try:
            log_lines = min(int(parts[1]), 500)
        except ValueError:
            pass
    _cprint(" Collecting debug info...")
    # Collect system info
    lines = []
    lines.append("=== HERMES DEBUG REPORT ===")
    lines.append(f"Generated: {_time.strftime('%Y-%m-%d %H:%M:%S %z')}")
    lines.append("")
    lines.append("--- System ---")
    lines.append(f"Python: {sys.version}")
    lines.append(f"Platform: {platform.platform()}")
    lines.append(f"Architecture: {platform.machine()}")
    lines.append(f"Hostname: {platform.node()}")
    lines.append("")
    # Hermes info — each lookup is individually guarded so a missing
    # constant or attribute never aborts report generation.
    lines.append("--- Hermes ---")
    try:
        from hermes_constants import get_hermes_home, display_hermes_home
        lines.append(f"Home: {display_hermes_home()}")
    except Exception:
        lines.append("Home: unknown")
    try:
        from hermes_constants import __version__
        lines.append(f"Version: {__version__}")
    except Exception:
        lines.append("Version: unknown")
    lines.append(f"Profile: {getattr(self, '_profile_name', 'default')}")
    lines.append(f"Session: {self.session_id}")
    lines.append(f"Model: {self.model}")
    lines.append(f"Provider: {getattr(self, '_provider_name', 'unknown')}")
    try:
        lines.append(f"Working dir: {os.getcwd()}")
    except Exception:
        pass
    # Config (redacted)
    lines.append("")
    lines.append("--- Config (redacted) ---")
    try:
        from hermes_constants import get_hermes_home
        config_path = get_hermes_home() / "config.yaml"
        if config_path.exists():
            import yaml
            with open(config_path) as f:
                cfg = yaml.safe_load(f) or {}
            # Redact secrets. NOTE(review): only top-level keys are checked,
            # so nested secrets (e.g. a per-provider api_key) would pass
            # through unredacted — confirm whether that matters here.
            for key in ("api_key", "token", "secret", "password"):
                if key in cfg:
                    cfg[key] = "***REDACTED***"
            # Truncate the YAML dump to keep the report a reasonable size.
            lines.append(yaml.dump(cfg, default_flow_style=False)[:2000])
        else:
            lines.append("(no config file found)")
    except Exception as e:
        lines.append(f"(error reading config: {e})")
    # Recent logs — tail the last `log_lines` lines of every *.log file.
    lines.append("")
    lines.append(f"--- Recent Logs (last {log_lines} lines) ---")
    try:
        from hermes_constants import get_hermes_home
        log_dir = get_hermes_home() / "logs"
        if log_dir.exists():
            for log_file in sorted(log_dir.glob("*.log")):
                try:
                    content = log_file.read_text(encoding="utf-8", errors="replace")
                    tail = content.strip().split("\n")[-log_lines:]
                    if tail:
                        lines.append(f"\n[{log_file.name}]")
                        lines.extend(tail)
                except Exception:
                    pass
        else:
            lines.append("(no logs directory)")
    except Exception:
        lines.append("(error reading logs)")
    # Tool info
    lines.append("")
    lines.append("--- Enabled Toolsets ---")
    try:
        lines.append(", ".join(self.enabled_toolsets) if self.enabled_toolsets else "(none)")
    except Exception:
        lines.append("(unknown)")
    report = "\n".join(lines)
    report_size = len(report)
    # Try to upload to paste services in order; first success wins, and any
    # uploader exception just falls through to the next service.
    paste_url = None
    services = [
        ("dpaste", _upload_dpaste),
        ("0x0.st", _upload_0x0st),
    ]
    for name, uploader in services:
        try:
            url = uploader(report)
            if url:
                paste_url = url
                break
        except Exception:
            continue
    print()
    if paste_url:
        _cprint(f" Debug report uploaded: {paste_url}")
        _cprint(f" Size: {report_size} bytes, {len(lines)} lines")
    else:
        # Fallback: save locally; if even that fails, dump to the terminal.
        try:
            from hermes_constants import get_hermes_home
            debug_path = get_hermes_home() / "debug-report.txt"
            debug_path.write_text(report, encoding="utf-8")
            _cprint(f" Paste services unavailable. Report saved to: {debug_path}")
            _cprint(f" Size: {report_size} bytes, {len(lines)} lines")
        except Exception as e:
            _cprint(f" Failed to save report: {e}")
            _cprint(f" Report ({report_size} bytes):")
            print(report)
    print()
def _upload_dpaste(content: str) -> str | None:
    """Upload content to dpaste.org. Returns URL or None."""
    import urllib.parse
    import urllib.request

    form_fields = {
        "content": content,
        "syntax": "text",
        "expiry_days": 7,
    }
    request = urllib.request.Request(
        "https://dpaste.org/api/",
        data=urllib.parse.urlencode(form_fields).encode(),
        headers={"User-Agent": "hermes-agent/debug"},
    )
    with urllib.request.urlopen(request, timeout=10) as response:
        reply = response.read().decode().strip()
    # The API answers with the paste URL on success; anything else is a failure.
    return reply if reply.startswith("http") else None
def _upload_0x0st(content: str) -> str | None:
    """Upload content to 0x0.st. Returns URL or None.

    Builds a minimal multipart/form-data body by hand because 0x0.st expects
    the payload in a "file" form field. Network errors propagate to the
    caller, which treats any exception as "service unavailable".
    """
    import urllib.request
    # Fix: dropped the unused `import io` the original carried.

    # 0x0.st expects multipart form with a file field
    boundary = "----HermesDebugBoundary"
    body = (
        f"--{boundary}\r\n"
        f'Content-Disposition: form-data; name="file"; filename="debug.txt"\r\n'
        f"Content-Type: text/plain\r\n\r\n"
        f"{content}\r\n"
        f"--{boundary}--\r\n"
    ).encode()
    req = urllib.request.Request(
        "https://0x0.st",
        data=body,
        headers={
            "Content-Type": f"multipart/form-data; boundary={boundary}",
            "User-Agent": "hermes-agent/debug",
        },
    )
    with urllib.request.urlopen(req, timeout=10) as resp:
        url = resp.read().decode().strip()
        if url.startswith("http"):
            return url
    return None
def show_config(self):
"""Display current configuration with kawaii ASCII art."""
# Get terminal config from environment (which was set from cli-config.yaml)
@@ -4511,8 +4321,6 @@ def _upload_0x0st(content: str) -> str | None:
self.show_help()
elif canonical == "profile":
self._handle_profile_command()
elif canonical == "debug":
self._handle_debug_command(cmd_original)
elif canonical == "tools":
self._handle_tools_command(cmd_original)
elif canonical == "toolsets":

View File

@@ -547,30 +547,20 @@ def resume_job(job_id: str) -> Optional[Dict[str, Any]]:
def trigger_job(job_id: str) -> Optional[Dict[str, Any]]:
"""Schedule a job to run on the next scheduler tick.
Clears stale error state when re-triggering a previously-failed job
so the stale failure doesn't persist until the next tick completes.
"""
"""Schedule a job to run on the next scheduler tick."""
job = get_job(job_id)
if not job:
return None
updates = {
"enabled": True,
"state": "scheduled",
"paused_at": None,
"paused_reason": None,
"next_run_at": _hermes_now().isoformat(),
}
# Clear stale error state when re-triggering
if job.get("last_status") == "error":
updates["last_status"] = "retrying"
updates["last_error"] = None
updates["error_cleared_at"] = _hermes_now().isoformat()
return update_job(job_id, updates)
return update_job(
job_id,
{
"enabled": True,
"state": "scheduled",
"paused_at": None,
"paused_reason": None,
"next_run_at": _hermes_now().isoformat(),
},
)
def run_job_now(job_id: str) -> Optional[Dict[str, Any]]:
@@ -628,7 +618,6 @@ def mark_job_run(job_id: str, success: bool, error: Optional[str] = None):
Updates last_run_at, last_status, increments completed count,
computes next_run_at, and auto-deletes if repeat limit reached.
Tracks health timestamps for error/success history.
"""
jobs = load_jobs()
for i, job in enumerate(jobs):
@@ -638,18 +627,6 @@ def mark_job_run(job_id: str, success: bool, error: Optional[str] = None):
job["last_status"] = "ok" if success else "error"
job["last_error"] = error if not success else None
# Track health timestamps
if success:
job["last_success_at"] = now
# Clear stale error tracking on success
if job.get("last_error_at"):
job["error_resolved_at"] = now
else:
job["last_error_at"] = now
# Clear resolved tracking on new error
if job.get("error_resolved_at"):
del job["error_resolved_at"]
# Increment completed count
if job.get("repeat"):
job["repeat"]["completed"] = job["repeat"].get("completed", 0) + 1
@@ -679,32 +656,6 @@ def mark_job_run(job_id: str, success: bool, error: Optional[str] = None):
save_jobs(jobs)
def clear_job_error(job_id: str) -> Optional[Dict[str, Any]]:
    """
    Clear stale error state for a job.

    Resets last_status to 'ok', last_error to None, and records when the
    error was cleared. Useful after auth recovery when the job itself is
    healthy but stale error state persists.

    Returns:
        Updated job dict, or None if not found.
    """
    jobs = load_jobs()
    for job in jobs:
        if job["id"] == job_id:
            job["last_status"] = "ok"
            job["last_error"] = None
            job["error_cleared_at"] = _hermes_now().isoformat()
            save_jobs(jobs)
            return job
    # Fix: the previous version also called save_jobs() when no job matched,
    # rewriting an unchanged file and needlessly racing concurrent writers.
    return None
def advance_next_run(job_id: str) -> bool:
"""Preemptively advance next_run_at for a recurring job before execution.

View File

@@ -37,7 +37,6 @@ sys.path.insert(0, str(Path(__file__).parent.parent))
from hermes_constants import get_hermes_home
from hermes_cli.config import load_config
from hermes_time import now as _hermes_now
from agent.model_metadata import is_local_endpoint
logger = logging.getLogger(__name__)
@@ -718,22 +717,6 @@ def run_job(job: dict) -> tuple[bool, str, str, Optional[str]]:
# Reasoning config from env or config.yaml
from hermes_constants import parse_reasoning_effort
# Time-aware cron model routing — override model during high-error windows
try:
from agent.smart_model_routing import resolve_cron_model
_cron_routing_cfg = (_cfg.get("cron_model_routing") or {})
_cron_route = resolve_cron_model(model, _cron_routing_cfg)
if _cron_route["overridden"]:
_original_model = model
model = _cron_route["model"]
logger.info(
"Job '%s': cron model override %s -> %s (%s)",
job_id, _original_model, model, _cron_route["reason"],
)
except Exception as _e:
logger.debug("Job '%s': cron model routing skipped: %s", job_id, _e)
effort = os.getenv("HERMES_REASONING_EFFORT", "")
if not effort:
effort = str(_cfg.get("agent", {}).get("reasoning_effort", "")).strip()
@@ -794,29 +777,6 @@ def run_job(job: dict) -> tuple[bool, str, str, Optional[str]]:
},
)
# Build disabled toolsets — always exclude cronjob/messaging/clarify
# for cron sessions. When the runtime endpoint is cloud (not local),
# also disable terminal so the agent does not attempt SSH or shell
# commands that require local infrastructure (keys, filesystem).
# Jobs that declare requires_local_infra=true also get terminal
# disabled on cloud endpoints regardless of this check. #379
_cron_disabled = ["cronjob", "messaging", "clarify"]
_runtime_base_url = turn_route["runtime"].get("base_url", "")
_is_cloud = not is_local_endpoint(_runtime_base_url)
if _is_cloud:
_cron_disabled.append("terminal")
logger.info(
"Job '%s': cloud provider detected (%s), disabling terminal toolset",
job_name,
turn_route["runtime"].get("provider", "unknown"),
)
if job.get("requires_local_infra") and _is_cloud:
logger.warning(
"Job '%s': requires_local_infra=true but running on cloud provider — "
"terminal-dependent steps will fail gracefully",
job_name,
)
_agent_kwargs = _safe_agent_kwargs({
"model": turn_route["model"],
"api_key": turn_route["runtime"].get("api_key"),
@@ -824,7 +784,7 @@ def run_job(job: dict) -> tuple[bool, str, str, Optional[str]]:
"provider": turn_route["runtime"].get("provider"),
"api_mode": turn_route["runtime"].get("api_mode"),
"acp_command": turn_route["runtime"].get("command"),
"acp_args": list(turn_route["runtime"].get("args") or []),
"acp_args": turn_route["runtime"].get("args"),
"max_iterations": max_iterations,
"reasoning_config": reasoning_config,
"prefill_messages": prefill_messages,
@@ -832,7 +792,7 @@ def run_job(job: dict) -> tuple[bool, str, str, Optional[str]]:
"providers_ignored": pr.get("ignore"),
"providers_order": pr.get("order"),
"provider_sort": pr.get("sort"),
"disabled_toolsets": _cron_disabled,
"disabled_toolsets": ["cronjob", "messaging", "clarify"],
"tool_choice": "required",
"quiet_mode": True,
"skip_memory": True, # Cron system prompts would corrupt user representations

View File

@@ -1,154 +0,0 @@
#!/usr/bin/env python3
"""
deploy-crons — normalize cron job schemas for consistent model field types.
This script ensures that the model field in jobs.json is always a dict when
either model or provider is specified, preventing schema inconsistency.
Usage:
python deploy-crons.py [--dry-run] [--jobs-file PATH]
"""
import argparse
import json
import sys
from pathlib import Path
from typing import Any, Dict, Optional
def normalize_job(job: Dict[str, Any]) -> Dict[str, Any]:
    """
    Normalize a job dict to ensure consistent model field types.

    Before normalization:
    - If model AND provider: model = raw string, provider = raw string (inconsistent)
    - If only model: model = raw string
    - If only provider: provider = raw string at top level

    After normalization:
    - If model exists: model = {"model": "xxx"}
    - If provider exists: model = {"provider": "yyy"}
    - If both exist: model = {"model": "xxx", "provider": "yyy"}
    - If neither: model = None

    The top-level "provider" key is intentionally left untouched for
    backward compatibility with code that still reads job["provider"].

    Args:
        job: A job dict as stored in jobs.json.

    Returns:
        A shallow copy of the job with a normalized "model" field; the
        caller's dict is never mutated.
    """
    job = dict(job)  # Create a copy to avoid modifying the original
    model = job.get("model")
    provider = job.get("provider")
    # Skip if already normalized (model is a dict)
    if isinstance(model, dict):
        return job
    # Build normalized model dict. isinstance() already rejects None, so the
    # original's extra `is not None` checks were redundant; the dead
    # "remove top-level provider" pass-branch has also been dropped.
    model_dict: Dict[str, str] = {}
    if isinstance(model, str):
        model_dict["model"] = model.strip()
    if isinstance(provider, str):
        model_dict["provider"] = provider.strip()
    job["model"] = model_dict or None
    return job
def normalize_jobs_file(jobs_file: Path, dry_run: bool = False) -> int:
    """
    Normalize all jobs in a jobs.json file.

    Args:
        jobs_file: Path to the jobs.json file.
        dry_run: When True, report what would change without writing.

    Returns:
        Process exit code: 0 on success (including "nothing to do"),
        1 on read, parse, or write errors. (Fix: the previous docstring
        incorrectly claimed this returned the number of modified jobs.)
    """
    if not jobs_file.exists():
        print(f"Error: Jobs file not found: {jobs_file}", file=sys.stderr)
        return 1
    try:
        with open(jobs_file, 'r', encoding='utf-8') as f:
            data = json.load(f)
    except json.JSONDecodeError as e:
        print(f"Error: Invalid JSON in {jobs_file}: {e}", file=sys.stderr)
        return 1
    jobs = data.get("jobs", [])
    if not jobs:
        print("No jobs found in file.")
        return 0
    modified_count = 0
    for i, job in enumerate(jobs):
        original_model = job.get("model")
        original_provider = job.get("provider")
        normalized_job = normalize_job(job)
        # A job counts as modified when either field changed after normalization.
        if (normalized_job.get("model") != original_model or
                normalized_job.get("provider") != original_provider):
            jobs[i] = normalized_job
            modified_count += 1
            job_id = job.get("id", "?")
            job_name = job.get("name", "(unnamed)")
            print(f"Normalized job {job_id} ({job_name}):")
            print(f"  model: {original_model!r} -> {normalized_job.get('model')!r}")
            print(f"  provider: {original_provider!r} -> {normalized_job.get('provider')!r}")
    if modified_count == 0:
        print("All jobs already have consistent model field types.")
        return 0
    if dry_run:
        print(f"DRY RUN: Would normalize {modified_count} jobs.")
        return 0
    # Write back to file
    data["jobs"] = jobs
    try:
        with open(jobs_file, 'w', encoding='utf-8') as f:
            json.dump(data, f, indent=2, ensure_ascii=False)
        print(f"Normalized {modified_count} jobs in {jobs_file}")
        return 0
    except Exception as e:
        print(f"Error writing to {jobs_file}: {e}", file=sys.stderr)
        return 1
def main():
    """Entry point: parse CLI flags and run the jobs-file normalizer."""
    parser = argparse.ArgumentParser(
        description="Normalize cron job schemas for consistent model field types."
    )
    parser.add_argument(
        "--dry-run",
        action="store_true",
        help="Show what would be changed without modifying the file."
    )
    default_jobs_path = Path.home() / ".hermes" / "cron" / "jobs.json"
    parser.add_argument(
        "--jobs-file",
        type=Path,
        default=default_jobs_path,
        help="Path to jobs.json file (default: ~/.hermes/cron/jobs.json)"
    )
    opts = parser.parse_args()
    if opts.dry_run:
        print("DRY RUN MODE — no changes will be made.")
        print()
    # The normalizer's return value doubles as the process exit code.
    return normalize_jobs_file(opts.jobs_file, opts.dry_run)
if __name__ == "__main__":
sys.exit(main())

View File

@@ -1,170 +0,0 @@
# Honcho Memory Integration Evaluation (#322)
## Executive Summary
**Status:** Integration already implemented and production-ready.
**Recommendation:** KEEP — well-gated, zero overhead when disabled, supports self-hosted.
## Decision: Cloud vs Local
### The Question
"Do we want a cloud-dependent memory layer, or keep everything local?"
### Answer: BOTH — User's Choice
Honcho supports both deployment modes:
| Mode | Configuration | Data Location | Use Case |
|------|--------------|---------------|----------|
| Cloud | `HONCHO_API_KEY` | Honcho servers | Quick start, no infrastructure |
| Self-hosted | `HONCHO_BASE_URL=http://localhost:8000` | Your servers | Full sovereignty |
| Disabled | No config | N/A | Pure local (holographic fact_store only) |
### Why Keep It
1. **Opt-in Architecture**
- No Honcho config → zero overhead (cron guard, lazy init)
- Memory provider system allows switching between providers
- `hermes memory off` disables completely
2. **Zero Runtime Cost When Disabled**
```python
if not cfg.enabled or not (cfg.api_key or cfg.base_url):
return "" # No HTTP calls, no overhead
```
3. **Cross-Session User Modeling**
- Holographic fact_store lacks persistent user modeling
- Honcho provides: peer cards, dialectic Q&A, semantic search
- Complements (not replaces) local memory
4. **Self-Hosted Option**
- Set `HONCHO_BASE_URL=http://localhost:8000`
- Run Honcho server locally via Docker
- Full data sovereignty
5. **Production-Grade Implementation**
- 3 components, ~700 lines of code
- 7 tests passing
- Async prefetch (zero-latency context injection)
- Configurable recall modes (hybrid/context/tools)
- Write frequency control (async/turn/session/N-turns)
## Architecture
### Components (Already Implemented)
```
plugins/memory/honcho/
├── client.py # Config resolution (API key, base_url, profiles)
├── session.py # Session management, async prefetch, dialectic queries
├── __init__.py # MemoryProvider interface, 4 tool schemas
├── cli.py # CLI commands (setup, status, sessions, map, peer, mode)
├── plugin.yaml # Plugin metadata
└── README.md # Documentation
```
### Integration Points
1. **System Prompt**: Context injected on first turn (cached for prompt caching)
2. **Tool Registry**: 4 tools available when `recall_mode != "context"`
3. **Session End**: Messages flushed to Honcho
4. **Cron Guard**: Fully inactive in cron context
### Tools Available
| Tool | Cost | Speed | Purpose |
|------|------|-------|---------|
| `honcho_profile` | Free | Fast | Quick factual snapshot (peer card) |
| `honcho_search` | Free | Fast | Semantic search (raw excerpts) |
| `honcho_context` | Paid | Slow | Dialectic Q&A (synthesized answers) |
| `honcho_conclude` | Free | Fast | Save persistent facts about user |
## Configuration Guide
### Option 1: Cloud (Quick Start)
```bash
# Get API key from https://app.honcho.dev
export HONCHO_API_KEY="your-api-key"
hermes chat
```
### Option 2: Self-Hosted (Full Sovereignty)
```bash
# Run Honcho server locally
docker run -p 8000:8000 honcho/server
# Configure Hermes
export HONCHO_BASE_URL="http://localhost:8000"
hermes chat
```
### Option 3: CLI Setup
```bash
hermes honcho setup
```
### Option 4: Disabled (Pure Local)
```bash
# Don't set any Honcho config
hermes memory off # If previously enabled
hermes chat
```
## Memory Modes
| Mode | Context Injection | Tools | Cost | Use Case |
|------|------------------|-------|------|----------|
| hybrid | Yes | Yes | Medium | Default — auto-inject + on-demand |
| context | Yes | No | Low | Budget mode — auto-inject only |
| tools | No | Yes | Variable | Full control — agent decides |
## Risk Assessment
| Risk | Mitigation | Status |
|------|------------|--------|
| Cloud dependency | Self-hosted option available | ✅ |
| Cost from LLM calls | Recall mode "context" or "tools" reduces calls | ✅ |
| Data privacy | Self-hosted keeps data on your servers | ✅ |
| Performance overhead | Cron guard + lazy init + async prefetch | ✅ |
| Vendor lock-in | MemoryProvider interface allows swapping | ✅ |
## Comparison with Alternatives
| Feature | Honcho | Holographic | Mem0 | Hindsight |
|---------|--------|-------------|------|-----------|
| Cross-session modeling | ✅ | ❌ | ✅ | ✅ |
| Dialectic Q&A | ✅ | ❌ | ❌ | ❌ |
| Self-hosted | ✅ | N/A | ❌ | ❌ |
| Local-only option | ✅ | ✅ | ❌ | ✅ |
| Cost | Free/Paid | Free | Paid | Free |
## Conclusion
**Keep Honcho integration.** It provides unique cross-session user modeling capabilities that complement the local holographic fact_store. The integration is:
- Well-gated (opt-in, zero overhead when disabled)
- Flexible (cloud or self-hosted)
- Production-ready (7 tests passing, async prefetch, configurable)
- Non-exclusive (works alongside other memory providers)
### To Enable
```bash
# Cloud
hermes honcho setup
# Self-hosted
export HONCHO_BASE_URL="http://localhost:8000"
hermes chat
```
### To Disable
```bash
hermes memory off
```
---
*Evaluated by SANDALPHON — Cron/Ops lane*

View File

@@ -412,52 +412,6 @@ class GatewayConfig:
return self.unauthorized_dm_behavior
def _validate_fallback_providers() -> None:
    """Validate fallback_providers from config.yaml at gateway startup.

    Checks that each entry has 'provider' and 'model' fields and logs
    warnings for malformed entries. This catches broken fallback chains
    before they silently degrade into no-fallback mode.
    """
    try:
        config_file = get_hermes_home() / "config.yaml"
        if not config_file.exists():
            return
        import yaml
        with open(config_file, encoding="utf-8") as fh:
            raw_cfg = yaml.safe_load(fh) or {}
        chain = raw_cfg.get("fallback_providers")
        if not chain:
            return
        if not isinstance(chain, list):
            logger.warning(
                "fallback_providers should be a YAML list, got %s. "
                "Fallback chain will be disabled.",
                type(chain).__name__,
            )
            return
        # Per-entry checks: shape first, then required fields.
        for idx, entry in enumerate(chain):
            if not isinstance(entry, dict):
                logger.warning(
                    "fallback_providers[%d] is not a dict (got %s). Skipping entry.",
                    idx, type(entry).__name__,
                )
                continue
            if not entry.get("provider"):
                logger.warning(
                    "fallback_providers[%d] missing 'provider' field. Skipping entry.",
                    idx,
                )
            if not entry.get("model"):
                logger.warning(
                    "fallback_providers[%d] missing 'model' field. Skipping entry.",
                    idx,
                )
    except Exception:
        pass  # Non-fatal; validation is advisory
def load_gateway_config() -> GatewayConfig:
"""
Load gateway configuration from multiple sources.
@@ -691,19 +645,6 @@ def load_gateway_config() -> GatewayConfig:
platform.value, env_name,
)
# Warn about API Server enabled without a key (unauthenticated endpoint)
if Platform.API_SERVER in config.platforms:
api_cfg = config.platforms[Platform.API_SERVER]
if api_cfg.enabled and not api_cfg.extra.get("key"):
logger.warning(
"api_server is enabled but API_SERVER_KEY is not set. "
"The API endpoint will run unauthenticated. "
"Set API_SERVER_KEY in ~/.hermes/.env to secure it.",
)
# Validate fallback_providers structure from config.yaml
_validate_fallback_providers()
return config

View File

@@ -1026,16 +1026,6 @@ class GatewayRunner:
cfg = _y.safe_load(_f) or {}
fb = cfg.get("fallback_providers") or cfg.get("fallback_model") or None
if fb:
# Treat empty dict / disabled fallback as "not configured"
if isinstance(fb, dict):
_enabled = fb.get("enabled")
if _enabled is False or (
isinstance(_enabled, str)
and _enabled.strip().lower() in ("false", "0", "no", "off")
):
return None
if not fb.get("provider") and not fb.get("model"):
return None
return fb
except Exception:
pass
@@ -3077,12 +3067,40 @@ class GatewayRunner:
# Token counts and model are now persisted by the agent directly.
# Keep only last_prompt_tokens here for context-window tracking and
# compression decisions.
# compression decisions. Also persist input/output token totals
# so the SessionEntry (sessions.json) and SQLite reflect actual usage.
_input_total = agent_result.get("input_tokens", 0) or 0
_output_total = agent_result.get("output_tokens", 0) or 0
_total_tokens = agent_result.get("total_tokens", 0) or 0
_cost_usd = agent_result.get("estimated_cost_usd")
self.session_store.update_session(
session_entry.session_key,
last_prompt_tokens=agent_result.get("last_prompt_tokens", 0),
input_tokens=_input_total,
output_tokens=_output_total,
total_tokens=_total_tokens,
estimated_cost_usd=_cost_usd,
)
# Persist token totals to SQLite so /insights sees real data.
# Use absolute=true because the agent's session_*_tokens already
# reflect the running total for this conversation turn.
if self._session_db:
try:
_eff_sid = agent_result.get("session_id") or session_entry.session_id
self._session_db.set_token_counts(
_eff_sid,
input_tokens=_input_total,
output_tokens=_output_total,
cache_read_tokens=agent_result.get("cache_read_tokens", 0) or 0,
cache_write_tokens=agent_result.get("cache_write_tokens", 0) or 0,
reasoning_tokens=agent_result.get("reasoning_tokens", 0) or 0,
estimated_cost_usd=_cost_usd,
model=_resolved_model,
)
except Exception:
pass # never block delivery
# Auto voice reply: send TTS audio before the text response
_already_sent = bool(agent_result.get("already_sent"))
if self._should_send_voice_reply(event, response, agent_messages, already_sent=_already_sent):

View File

@@ -63,16 +63,6 @@ def _looks_like_phone(value: str) -> bool:
return bool(_PHONE_RE.match(value.strip()))
from .config import (
# Session template manager for code-first seeding
try:
from tools.session_template_manager import SessionTemplateManager, TaskType
HAS_TEMPLATE_MANAGER = True
except ImportError:
HAS_TEMPLATE_MANAGER = False
SessionTemplateManager = None
TaskType = None
Platform,
GatewayConfig,
SessionResetPolicy, # noqa: F401 — re-exported via gateway/__init__.py
@@ -536,10 +526,6 @@ class SessionStore:
except Exception as e:
print(f"[gateway] Warning: SQLite session store unavailable, falling back to JSONL: {e}")
# Initialize session template manager
self._init_template_manager()
def _ensure_loaded(self) -> None:
"""Load sessions index from disk if not already loaded."""
with self._lock:
@@ -824,6 +810,10 @@ class SessionStore:
self,
session_key: str,
last_prompt_tokens: int = None,
input_tokens: int = None,
output_tokens: int = None,
total_tokens: int = None,
estimated_cost_usd: float = None,
) -> None:
"""Update lightweight session metadata after an interaction."""
with self._lock:
@@ -834,6 +824,14 @@ class SessionStore:
entry.updated_at = _now()
if last_prompt_tokens is not None:
entry.last_prompt_tokens = last_prompt_tokens
if input_tokens is not None:
entry.input_tokens = input_tokens
if output_tokens is not None:
entry.output_tokens = output_tokens
if total_tokens is not None:
entry.total_tokens = total_tokens
if estimated_cost_usd is not None:
entry.estimated_cost_usd = estimated_cost_usd
self._save()
def reset_session(self, session_key: str) -> Optional[SessionEntry]:
@@ -1093,112 +1091,3 @@ def build_session_context(
context.updated_at = session_entry.updated_at
return context
def _init_template_manager(self):
    """Set up the optional session template manager (None when unavailable)."""
    self.template_manager = None
    if not HAS_TEMPLATE_MANAGER:
        return
    try:
        self.template_manager = SessionTemplateManager()
        logger.info("Session template manager initialized")
    except Exception as e:
        # Construction failed — fall back to running without templates.
        logger.warning(f"Failed to initialize template manager: {e}")
        self.template_manager = None
def inject_session_template(self, session_id: str, task_type: Optional[str] = None) -> bool:
    """
    Inject a session template into a new session to establish feedback loops.

    Args:
        session_id: Session ID to inject template into
        task_type: Optional task type (code, file, research, mixed). If None, defaults to code.

    Returns:
        True if template was injected, False otherwise
    """
    if not self.template_manager:
        return False
    try:
        if not task_type:
            # Default to CODE since research shows it's most effective
            resolved_type = TaskType.CODE
        else:
            try:
                resolved_type = TaskType(task_type)
            except ValueError:
                logger.warning(f"Invalid task type: {task_type}")
                return False
        # Get template for task type
        template = self.template_manager.get_template_for_task(resolved_type)
        if not template:
            logger.debug(f"No template found for task type: {resolved_type.value}")
            return False
        # Note: Actual injection would happen when messages are loaded
        # This is a placeholder for the integration point
        logger.info(f"Template {template.template_id} available for session {session_id}")
        return True
    except Exception as e:
        logger.error(f"Failed to inject template into session {session_id}: {e}")
        return False
def list_session_templates(self, task_type: Optional[str] = None) -> List[Dict[str, Any]]:
    """Return available session templates as plain dictionaries.

    Args:
        task_type: Optional task type filter

    Returns:
        List of template dictionaries; empty when the template manager
        is unavailable or lookup fails.
    """
    if not self.template_manager:
        return []
    try:
        filter_enum = TaskType(task_type) if task_type else None
        return [tpl.to_dict() for tpl in self.template_manager.list_templates(filter_enum)]
    except Exception as e:
        logger.error(f"Failed to list templates: {e}")
        return []
def create_session_template(self, session_id: str,
                            name: Optional[str] = None,
                            description: Optional[str] = None,
                            max_calls: int = 10) -> Optional[str]:
    """Derive a reusable template from a completed session.

    Args:
        session_id: Session ID to create template from
        name: Template name
        description: Template description
        max_calls: Maximum number of tool calls to extract

    Returns:
        Template ID if created, None otherwise
    """
    if not self.template_manager:
        return None
    try:
        template = self.template_manager.create_template_from_session(
            session_id,
            name=name,
            description=description,
            max_calls=max_calls,
        )
        return template.template_id if template else None
    except Exception as e:
        logger.error(f"Failed to create template from session {session_id}: {e}")
        return None

View File

@@ -1338,11 +1338,6 @@ _KNOWN_ROOT_KEYS = {
"fallback_providers", "credential_pool_strategies", "toolsets",
"agent", "terminal", "display", "compression", "delegation",
"auxiliary", "custom_providers", "memory", "gateway",
"session_reset", "browser", "checkpoints", "smart_model_routing",
"voice", "stt", "tts", "human_delay", "security", "privacy",
"cron", "logging", "approvals", "command_allowlist", "quick_commands",
"personalities", "skills", "honcho", "timezone", "discord",
"whatsapp", "prefill_messages_file", "file_read_max_chars",
}
# Valid fields inside a custom_providers list entry
@@ -1426,7 +1421,6 @@ def validate_config_structure(config: Optional[Dict[str, Any]] = None) -> List["
))
# ── fallback_model must be a top-level dict with provider + model ────
# Blank or explicitly disabled fallback is intentional — skip validation.
fb = config.get("fallback_model")
if fb is not None:
if not isinstance(fb, dict):
@@ -1436,40 +1430,21 @@ def validate_config_structure(config: Optional[Dict[str, Any]] = None) -> List["
"Change to:\n"
" fallback_model:\n"
" provider: openrouter\n"
" model: anthropic/claude-sonnet-4\n"
"Or disable with:\n"
" fallback_model:\n"
" enabled: false",
" model: anthropic/claude-sonnet-4",
))
elif fb:
# Skip warnings when fallback is explicitly disabled (enabled: false)
_enabled = fb.get("enabled")
if _enabled is False or (isinstance(_enabled, str) and _enabled.strip().lower() in ("false", "0", "no", "off")):
pass # intentionally disabled — no warnings
else:
# Check if both fields are blank (intentional disable)
provider = fb.get("provider")
model = fb.get("model")
provider_blank = not provider or (isinstance(provider, str) and not provider.strip())
model_blank = not model or (isinstance(model, str) and not model.strip())
# Only warn if at least one field is set (user might be trying to configure)
# If both are blank, treat as intentionally disabled
if not provider_blank or not model_blank:
if provider_blank:
issues.append(ConfigIssue(
"warning",
"fallback_model is missing 'provider' field — fallback will be disabled",
"Add: provider: openrouter (or another provider)\n"
"Or disable with: enabled: false",
))
if model_blank:
issues.append(ConfigIssue(
"warning",
"fallback_model is missing 'model' field — fallback will be disabled",
"Add: model: anthropic/claude-sonnet-4 (or another model)\n"
"Or disable with: enabled: false",
))
if not fb.get("provider"):
issues.append(ConfigIssue(
"warning",
"fallback_model is missing 'provider' field — fallback will be disabled",
"Add: provider: openrouter (or another provider)",
))
if not fb.get("model"):
issues.append(ConfigIssue(
"warning",
"fallback_model is missing 'model' field — fallback will be disabled",
"Add: model: anthropic/claude-sonnet-4 (or another model)",
))
# ── Check for fallback_model accidentally nested inside custom_providers ──
if isinstance(cp, dict) and "fallback_model" not in config and "fallback_model" in (cp or {}):
@@ -1503,72 +1478,6 @@ def validate_config_structure(config: Optional[Dict[str, Any]] = None) -> List["
f"Move '{key}' under the appropriate section",
))
# ── fallback_providers must be a list of dicts with provider + model ─
fbp = config.get("fallback_providers")
if fbp is not None:
if not isinstance(fbp, list):
issues.append(ConfigIssue(
"error",
f"fallback_providers should be a YAML list, got {type(fbp).__name__}",
"Change to:\n"
" fallback_providers:\n"
" - provider: openrouter\n"
" model: google/gemini-3-flash-preview",
))
elif fbp:
for i, entry in enumerate(fbp):
if not isinstance(entry, dict):
issues.append(ConfigIssue(
"warning",
f"fallback_providers[{i}] is not a dict (got {type(entry).__name__})",
"Each entry needs at minimum: provider, model",
))
continue
if not entry.get("provider"):
issues.append(ConfigIssue(
"warning",
f"fallback_providers[{i}] is missing 'provider' field — this fallback will be skipped",
"Add: provider: openrouter (or another provider name)",
))
if not entry.get("model"):
issues.append(ConfigIssue(
"warning",
f"fallback_providers[{i}] is missing 'model' field — this fallback will be skipped",
"Add: model: google/gemini-3-flash-preview (or another model slug)",
))
# ── session_reset validation ─────────────────────────────────────────
session_reset = config.get("session_reset", {})
if isinstance(session_reset, dict):
idle_minutes = session_reset.get("idle_minutes")
if idle_minutes is not None:
if not isinstance(idle_minutes, (int, float)) or idle_minutes <= 0:
issues.append(ConfigIssue(
"warning",
f"session_reset.idle_minutes={idle_minutes} is invalid (must be a positive number)",
"Set to a positive integer, e.g. 1440 (24 hours). Using 0 causes immediate resets.",
))
at_hour = session_reset.get("at_hour")
if at_hour is not None:
if not isinstance(at_hour, (int, float)) or not (0 <= at_hour <= 23):
issues.append(ConfigIssue(
"warning",
f"session_reset.at_hour={at_hour} is invalid (must be 0-23)",
"Set to an hour between 0 and 23, e.g. 4 for 4am",
))
# ── API Server key check ─────────────────────────────────────────────
# If api_server is enabled via env, but no key is set, warn.
# This catches the "API_SERVER_KEY not configured" error from gateway logs.
api_server_enabled = os.getenv("API_SERVER_ENABLED", "").lower() in ("true", "1", "yes")
api_server_key = os.getenv("API_SERVER_KEY", "").strip()
if api_server_enabled and not api_server_key:
issues.append(ConfigIssue(
"warning",
"API_SERVER is enabled but API_SERVER_KEY is not set — the API server will run unauthenticated",
"Set API_SERVER_KEY in ~/.hermes/.env to secure the API endpoint",
))
return issues

View File

@@ -93,39 +93,6 @@ def cron_list(show_all: bool = False):
script = job.get("script")
if script:
print(f" Script: {script}")
# Show health status
last_status = job.get("last_status")
last_error = job.get("last_error")
last_error_at = job.get("last_error_at")
last_success_at = job.get("last_success_at")
error_cleared_at = job.get("error_cleared_at")
error_resolved_at = job.get("error_resolved_at")
if last_status == "error" and last_error:
if error_cleared_at or error_resolved_at:
# Error was cleared/resolved
cleared_time = error_cleared_at or error_resolved_at
print(color(f" Status: ok (error cleared)", Colors.GREEN))
print(color(f" Last error: {last_error[:80]}...", Colors.DIM))
print(color(f" Resolved: {cleared_time}", Colors.DIM))
else:
# Current error
print(color(f" Status: ERROR", Colors.RED))
print(color(f" Error: {last_error[:80]}...", Colors.RED))
if last_error_at:
print(color(f" Since: {last_error_at}", Colors.RED))
elif last_status == "retrying":
print(color(f" Status: retrying (error cleared)", Colors.YELLOW))
elif last_status == "ok":
if last_success_at:
print(color(f" Status: ok (last success: {last_success_at})", Colors.GREEN))
elif last_status:
print(f" Status: {last_status}")
# Show success history if available
if last_success_at and last_status != "error":
print(f" Last ok: {last_success_at}")
print()
from hermes_cli.gateway import find_gateway_pids
@@ -255,18 +222,7 @@ def cron_edit(args):
def _job_action(action: str, job_id: str, success_verb: str, now: bool = False) -> int:
if action == "clear_error":
result = _cron_api(action="clear_error", job_id=job_id)
if not result.get("success"):
print(color(f"Failed to clear error: {result.get('error', 'unknown error')}", Colors.RED))
return 1
job = result.get("job", {})
name = job.get("name", job_id)
print(color(f"Cleared stale error state for job '{name}'", Colors.GREEN))
if job.get("error_cleared_at"):
print(f" Cleared at: {job['error_cleared_at']}")
return 0
if action == "run" and now:
if action == "run" and now:
# Synchronous execution — run job immediately and show result
result = _cron_api(action="run_now", job_id=job_id)
if not result.get("success"):
@@ -336,13 +292,9 @@ def cron_command(args):
now = getattr(args, 'now', False)
return _job_action("run", args.job_id, "Triggered", now=now)
if subcmd == "clear-error":
return _job_action("clear_error", args.job_id, "Cleared")
if subcmd in {"remove", "rm", "delete"}:
return _job_action("remove", args.job_id, "Removed")
print(f"Unknown cron command: {subcmd}")
print("Usage: hermes cron [list|create|edit|pause|resume|run|remove|clear-error|status|tick]")
print("Usage: hermes cron [list|create|edit|pause|resume|run|remove|status|tick]")
sys.exit(1)

View File

@@ -4576,9 +4576,6 @@ For more help on a command:
cron_run.add_argument("job_id", help="Job ID to trigger")
cron_run.add_argument("--now", action="store_true", help="Execute immediately and wait for result (clears stale errors)")
cron_clear_error = cron_subparsers.add_parser("clear-error", help="Clear stale error state for a job")
cron_clear_error.add_argument("job_id", help="Job ID to clear error for")
cron_remove = cron_subparsers.add_parser("remove", aliases=["rm", "delete"], help="Remove a scheduled job")
cron_remove.add_argument("job_id", help="Job ID to remove")
@@ -5008,7 +5005,7 @@ For more help on a command:
# =========================================================================
sessions_parser = subparsers.add_parser(
"sessions",
help="Manage session history (list, rename, export, prune, gc, delete)",
help="Manage session history (list, rename, export, prune, delete)",
description="View and manage the SQLite session store"
)
sessions_subparsers = sessions_parser.add_subparsers(dest="sessions_action")
@@ -5031,14 +5028,6 @@ For more help on a command:
sessions_prune.add_argument("--source", help="Only prune sessions from this source")
sessions_prune.add_argument("--yes", "-y", action="store_true", help="Skip confirmation")
sessions_gc = sessions_subparsers.add_parser("gc", help="Garbage-collect empty/trivial sessions")
sessions_gc.add_argument("--empty-hours", type=int, default=24, help="Delete empty (0-msg) sessions older than N hours (default: 24)")
sessions_gc.add_argument("--trivial-days", type=int, default=7, help="Delete trivial (1-5 msg) sessions older than N days (default: 7)")
sessions_gc.add_argument("--trivial-max", type=int, default=5, help="Max messages to consider trivial (default: 5)")
sessions_gc.add_argument("--source", help="Only GC sessions from this source")
sessions_gc.add_argument("--dry-run", action="store_true", help="Show what would be deleted without deleting")
sessions_gc.add_argument("--yes", "-y", action="store_true", help="Skip confirmation")
sessions_stats = sessions_subparsers.add_parser("stats", help="Show session store statistics")
sessions_rename = sessions_subparsers.add_parser("rename", help="Set or change a session's title")
@@ -5208,49 +5197,6 @@ For more help on a command:
size_mb = os.path.getsize(db_path) / (1024 * 1024)
print(f"Database size: {size_mb:.1f} MB")
elif action == "gc":
dry_run = getattr(args, "dry_run", False)
if dry_run:
counts = db.garbage_collect(
empty_older_than_hours=args.empty_hours,
trivial_max_messages=args.trivial_max,
trivial_older_than_days=args.trivial_days,
source=args.source,
dry_run=True,
)
print(f"[dry-run] Would delete {counts['total']} session(s):")
print(f" Empty (0 msgs, >{args.empty_hours}h old): {counts['empty']}")
print(f" Trivial (<={args.trivial_max} msgs, >{args.trivial_days}d old): {counts['trivial']}")
else:
# Preview first
preview = db.garbage_collect(
empty_older_than_hours=args.empty_hours,
trivial_max_messages=args.trivial_max,
trivial_older_than_days=args.trivial_days,
source=args.source,
dry_run=True,
)
if preview["total"] == 0:
print("Nothing to collect.")
else:
if not args.yes:
if not _confirm_prompt(
f"Delete {preview['total']} session(s) "
f"({preview['empty']} empty, {preview['trivial']} trivial)? [y/N] "
):
print("Cancelled.")
return
counts = db.garbage_collect(
empty_older_than_hours=args.empty_hours,
trivial_max_messages=args.trivial_max,
trivial_older_than_days=args.trivial_days,
source=args.source,
dry_run=False,
)
print(f"Collected {counts['total']} session(s):")
print(f" Empty: {counts['empty']}")
print(f" Trivial: {counts['trivial']}")
else:
sessions_parser.print_help()

View File

@@ -32,7 +32,7 @@ T = TypeVar("T")
DEFAULT_DB_PATH = get_hermes_home() / "state.db"
SCHEMA_VERSION = 7
SCHEMA_VERSION = 6
SCHEMA_SQL = """
CREATE TABLE IF NOT EXISTS schema_version (
@@ -66,7 +66,6 @@ CREATE TABLE IF NOT EXISTS sessions (
cost_source TEXT,
pricing_version TEXT,
title TEXT,
profile TEXT,
FOREIGN KEY (parent_session_id) REFERENCES sessions(id)
);
@@ -87,7 +86,6 @@ CREATE TABLE IF NOT EXISTS messages (
);
CREATE INDEX IF NOT EXISTS idx_sessions_source ON sessions(source);
CREATE INDEX IF NOT EXISTS idx_sessions_profile ON sessions(profile);
CREATE INDEX IF NOT EXISTS idx_sessions_parent ON sessions(parent_session_id);
CREATE INDEX IF NOT EXISTS idx_sessions_started ON sessions(started_at DESC);
CREATE INDEX IF NOT EXISTS idx_messages_session ON messages(session_id, timestamp);
@@ -332,19 +330,6 @@ class SessionDB:
except sqlite3.OperationalError:
pass # Column already exists
cursor.execute("UPDATE schema_version SET version = 6")
if current_version < 7:
# v7: add profile column to sessions for profile isolation (#323)
try:
cursor.execute('ALTER TABLE sessions ADD COLUMN "profile" TEXT')
except sqlite3.OperationalError:
pass # Column already exists
try:
cursor.execute(
"CREATE INDEX IF NOT EXISTS idx_sessions_profile ON sessions(profile)"
)
except sqlite3.OperationalError:
pass
cursor.execute("UPDATE schema_version SET version = 7")
# Unique title index — always ensure it exists (safe to run after migrations
# since the title column is guaranteed to exist at this point)
@@ -377,19 +362,13 @@ class SessionDB:
system_prompt: str = None,
user_id: str = None,
parent_session_id: str = None,
profile: str = None,
) -> str:
"""Create a new session record. Returns the session_id.
Args:
profile: Profile name for session isolation. When set, sessions
are tagged so queries can filter by profile. (#323)
"""
"""Create a new session record. Returns the session_id."""
def _do(conn):
conn.execute(
"""INSERT OR IGNORE INTO sessions (id, source, user_id, model, model_config,
system_prompt, parent_session_id, profile, started_at)
VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?)""",
system_prompt, parent_session_id, started_at)
VALUES (?, ?, ?, ?, ?, ?, ?, ?)""",
(
session_id,
source,
@@ -398,7 +377,6 @@ class SessionDB:
json.dumps(model_config) if model_config else None,
system_prompt,
parent_session_id,
profile,
time.time(),
),
)
@@ -527,23 +505,19 @@ class SessionDB:
session_id: str,
source: str = "unknown",
model: str = None,
profile: str = None,
) -> None:
"""Ensure a session row exists, creating it with minimal metadata if absent.
Used by _flush_messages_to_session_db to recover from a failed
create_session() call (e.g. transient SQLite lock at agent startup).
INSERT OR IGNORE is safe to call even when the row already exists.
Args:
profile: Profile name for session isolation. (#323)
"""
def _do(conn):
conn.execute(
"""INSERT OR IGNORE INTO sessions
(id, source, model, profile, started_at)
VALUES (?, ?, ?, ?, ?)""",
(session_id, source, model, profile, time.time()),
(id, source, model, started_at)
VALUES (?, ?, ?, ?)""",
(session_id, source, model, time.time()),
)
self._execute_write(_do)
@@ -814,7 +788,6 @@ class SessionDB:
limit: int = 20,
offset: int = 0,
include_children: bool = False,
profile: str = None,
) -> List[Dict[str, Any]]:
"""List sessions with preview (first user message) and last active timestamp.
@@ -826,10 +799,6 @@ class SessionDB:
By default, child sessions (subagent runs, compression continuations)
are excluded. Pass ``include_children=True`` to include them.
Args:
profile: Filter sessions to this profile name. Pass None to see all.
(#323)
"""
where_clauses = []
params = []
@@ -844,9 +813,6 @@ class SessionDB:
placeholders = ",".join("?" for _ in exclude_sources)
where_clauses.append(f"s.source NOT IN ({placeholders})")
params.extend(exclude_sources)
if profile:
where_clauses.append("s.profile = ?")
params.append(profile)
where_sql = f"WHERE {' AND '.join(where_clauses)}" if where_clauses else ""
query = f"""
@@ -1192,52 +1158,34 @@ class SessionDB:
source: str = None,
limit: int = 20,
offset: int = 0,
profile: str = None,
) -> List[Dict[str, Any]]:
"""List sessions, optionally filtered by source and profile.
Args:
profile: Filter sessions to this profile name. Pass None to see all.
(#323)
"""
where_clauses = []
params = []
if source:
where_clauses.append("source = ?")
params.append(source)
if profile:
where_clauses.append("profile = ?")
params.append(profile)
where_sql = f"WHERE {' AND '.join(where_clauses)}" if where_clauses else ""
query = f"SELECT * FROM sessions {where_sql} ORDER BY started_at DESC LIMIT ? OFFSET ?"
params.extend([limit, offset])
"""List sessions, optionally filtered by source."""
with self._lock:
cursor = self._conn.execute(query, params)
if source:
cursor = self._conn.execute(
"SELECT * FROM sessions WHERE source = ? ORDER BY started_at DESC LIMIT ? OFFSET ?",
(source, limit, offset),
)
else:
cursor = self._conn.execute(
"SELECT * FROM sessions ORDER BY started_at DESC LIMIT ? OFFSET ?",
(limit, offset),
)
return [dict(row) for row in cursor.fetchall()]
# =========================================================================
# Utility
# =========================================================================
def session_count(self, source: str = None, profile: str = None) -> int:
"""Count sessions, optionally filtered by source and profile.
Args:
profile: Filter to this profile name. Pass None to count all. (#323)
"""
where_clauses = []
params = []
if source:
where_clauses.append("source = ?")
params.append(source)
if profile:
where_clauses.append("profile = ?")
params.append(profile)
where_sql = f"WHERE {' AND '.join(where_clauses)}" if where_clauses else ""
def session_count(self, source: str = None) -> int:
"""Count sessions, optionally filtered by source."""
with self._lock:
cursor = self._conn.execute(f"SELECT COUNT(*) FROM sessions {where_sql}", params)
if source:
cursor = self._conn.execute(
"SELECT COUNT(*) FROM sessions WHERE source = ?", (source,)
)
else:
cursor = self._conn.execute("SELECT COUNT(*) FROM sessions")
return cursor.fetchone()[0]
def message_count(self, session_id: str = None) -> int:
@@ -1355,78 +1303,3 @@ class SessionDB:
return len(session_ids)
return self._execute_write(_do)
def garbage_collect(
    self,
    empty_older_than_hours: int = 24,
    trivial_max_messages: int = 5,
    trivial_older_than_days: int = 7,
    source: str = None,
    dry_run: bool = False,
) -> Dict[str, int]:
    """Delete empty and trivial sessions based on age.

    Policy (matches #315):
    - Empty sessions (0 messages) older than ``empty_older_than_hours``
    - Trivial sessions (1..``trivial_max_messages`` msgs) older than
      ``trivial_older_than_days``
    - Sessions with more than ``trivial_max_messages`` are kept indefinitely
    - Active (not ended) sessions are never deleted

    Returns a dict with counts: ``empty``, ``trivial``, ``total``.
    """
    now = time.time()
    empty_cutoff = now - (empty_older_than_hours * 3600)
    trivial_cutoff = now - (trivial_older_than_days * 86400)

    def _do(conn):
        def _ids(query, query_params):
            # First column of each row is the session id.
            return [row[0] for row in conn.execute(query, query_params).fetchall()]

        # Candidate queries; the ended_at filter protects active sessions.
        empty_q = (
            "SELECT id FROM sessions "
            "WHERE message_count = 0 AND started_at < ? AND ended_at IS NOT NULL"
        )
        empty_params = [empty_cutoff]
        trivial_q = (
            "SELECT id FROM sessions "
            "WHERE message_count BETWEEN 1 AND ? AND started_at < ? AND ended_at IS NOT NULL"
        )
        trivial_params = [trivial_max_messages, trivial_cutoff]
        if source:
            empty_q += " AND source = ?"
            empty_params.append(source)
            trivial_q += " AND source = ?"
            trivial_params.append(source)

        empty_ids = _ids(empty_q, empty_params)
        trivial_ids = _ids(trivial_q, trivial_params)
        targets = set(empty_ids) | set(trivial_ids)
        counts = {"empty": len(empty_ids), "trivial": len(trivial_ids),
                  "total": len(targets)}
        if dry_run:
            return counts

        # Child sessions must go first to satisfy the FK constraint.
        children = set()
        for sid in targets:
            for row in conn.execute(
                "SELECT id FROM sessions WHERE parent_session_id = ?", (sid,)
            ).fetchall():
                children.add(row[0])
        for cid in children:
            conn.execute("DELETE FROM messages WHERE session_id = ?", (cid,))
            conn.execute("DELETE FROM sessions WHERE id = ?", (cid,))
        for sid in targets:
            conn.execute("DELETE FROM messages WHERE session_id = ?", (sid,))
            conn.execute("DELETE FROM sessions WHERE id = ?", (sid,))
        return counts

    return self._execute_write(_do)

View File

@@ -1,286 +0,0 @@
#!/usr/bin/env python3
"""
Model Watchdog — monitors tmux panes for model drift.
Checks all hermes TUI sessions in dev and timmy tmux sessions.
If any pane is running a non-mimo model, kills and restarts it.
Usage: python3 ~/.hermes/bin/model-watchdog.py [--fix]
--fix Actually restart drifted panes (default: dry-run)
"""
import subprocess
import sys
import re
import time
import os
# Fallback expected model for panes whose profile is unknown or unmapped.
ALLOWED_MODEL = "mimo-v2-pro"

# Profile -> expected model. If a pane is running this profile with this model, it's healthy.
# Profiles not in this map are checked against ALLOWED_MODEL.
PROFILE_MODELS = {
    "default": "mimo-v2-pro",
    "timmy-sprint": "mimo-v2-pro",
    "fenrir": "mimo-v2-pro",
    "bezalel": "gpt-5.4",
    "burn": "mimo-v2-pro",
    "creative": "claude-sonnet",
    "research": "claude-sonnet",
    "review": "claude-sonnet",
}

# tmux sessions whose panes the watchdog inspects.
TMUX_SESSIONS = ["dev", "timmy"]
# Append-only log; parent directory is created on first write (see log()).
LOG_FILE = os.path.expanduser("~/.hermes/logs/model-watchdog.log")
def log(msg):
    """Print *msg* with a timestamp and append the same line to LOG_FILE."""
    os.makedirs(os.path.dirname(LOG_FILE), exist_ok=True)
    ts = time.strftime("%Y-%m-%d %H:%M:%S")
    stamped = f"[{ts}] {msg}"
    print(stamped)
    with open(LOG_FILE, "a") as fh:
        fh.write(stamped + "\n")
def run(cmd):
    """Run *cmd* in a shell (10s timeout); return (stripped stdout, exit code)."""
    proc = subprocess.run(cmd, shell=True, capture_output=True, text=True, timeout=10)
    return proc.stdout.strip(), proc.returncode
def get_panes(session):
    """Collect pane descriptors from every window of a tmux *session*.

    Returns a list of dicts with keys session, window, index, pid, tty;
    empty when the session does not exist.
    """
    win_out, win_rc = run(f"tmux list-windows -t {session} -F '#{{window_name}}' 2>/dev/null")
    if win_rc != 0:
        # Session missing (or tmux not running).
        return []
    panes = []
    for window_name in win_out.split("\n"):
        if not window_name.strip():
            continue
        target = f"{session}:{window_name}"
        pane_out, pane_rc = run(
            f"tmux list-panes -t {target} -F '#{{pane_index}}|#{{pane_pid}}|#{{pane_tty}}' 2>/dev/null"
        )
        if pane_rc != 0:
            continue
        for record in pane_out.split("\n"):
            if "|" not in record:
                continue
            idx, pid, tty = record.split("|")
            panes.append({
                "session": session,
                "window": window_name,
                "index": int(idx),
                "pid": int(pid),
                "tty": tty,
            })
    return panes
def get_hermes_pid_for_tty(tty):
    """Return the PID of the hermes CLI process attached to *tty*, or None."""
    out, _ = run(f"ps aux | grep '{tty}' | grep '[h]ermes' | grep -v 'gateway' | grep -v 'node' | awk '{{print $2}}'")
    if not out:
        return None
    # ps may match several processes; take the first PID.
    return int(out.splitlines()[0])
def get_model_from_pane(session, pane_idx, window=None):
    """Scrape the model name out of a pane's status bar, or None."""
    if window:
        target = f"{session}:{window}.{pane_idx}"
    else:
        target = f"{session}.{pane_idx}"
    out, _ = run(f"tmux capture-pane -t {target} -p 2>/dev/null | tail -30")
    # Status bar looks like: ⚕ model-name │  — grab the first token before │.
    m = re.search(r'\s+(\S+)\s+│', out)
    return m.group(1) if m else None
def check_session_meta(session_id):
    """Look up the (model, provider) a hermes session last used.

    Reads the JSON session file first, then falls back to the first line
    of the JSONL transcript. Returns (None, None) when neither file
    exists or can be parsed.
    """
    import json
    session_file = os.path.expanduser(f"~/.hermes/sessions/session_{session_id}.json")
    if os.path.exists(session_file):
        try:
            with open(session_file) as f:
                data = json.load(f)
            return data.get("model"), data.get("provider")
        # Narrowed from a bare `except:` — only I/O and parse errors are
        # expected here; SystemExit/KeyboardInterrupt must propagate.
        # json.JSONDecodeError subclasses ValueError.
        except (OSError, ValueError):
            pass
    # Try jsonl
    jsonl_file = os.path.expanduser(f"~/.hermes/sessions/{session_id}.jsonl")
    if os.path.exists(jsonl_file):
        try:
            with open(jsonl_file) as f:
                for line in f:
                    d = json.loads(line.strip())
                    if d.get("role") == "session_meta":
                        return d.get("model"), d.get("provider")
                    # NOTE(review): only the first line is inspected (the
                    # original broke out of the loop here) — confirm the
                    # session_meta record is always the first line.
                    break
        except (OSError, ValueError):
            pass
    return None, None
def is_drifted(model_name, profile=None):
    """Decide whether *model_name* deviates from the expected model.

    Returns a (drifted, detail) tuple; detail is the model name, or a
    marker string when no model could be detected.
    """
    if model_name is None:
        return False, "no-model-detected"
    # Known profiles carry their own expectation; everything else falls
    # back to the global ALLOWED_MODEL.
    expected = PROFILE_MODELS.get(profile) if profile else None
    if expected is None:
        expected = ALLOWED_MODEL
    return (expected not in model_name), model_name
def get_profile_from_pane(tty):
    """Detect which hermes profile a pane is running by inspecting its process args.

    Returns the value of the ``-p <profile>`` flag, or None when no
    matching hermes process is attached to the tty.
    """
    # ps shows the short TTY form (s031), not the full device path
    # (/dev/ttys031). The original chained a second
    # .replace("/dev/ttys", "") — dead code, since the pattern can no
    # longer occur after the first replace; removed.
    # NOTE(review): this mapping assumes macOS-style /dev/ttysNNN names —
    # Linux /dev/pts/N would pass through unchanged; confirm target OS.
    short_tty = tty.replace("/dev/ttys", "s")
    out, _ = run(f"ps aux | grep '{short_tty}' | grep '[h]ermes' | grep -v 'gateway' | grep -v 'node' | grep -v cron")
    if not out:
        return None
    # Look for -p <profile> in the command line
    match = re.search(r'-p\s+(\S+)', out)
    return match.group(1) if match else None
def kill_and_restart(session, pane_idx, window=None):
    """Kill the hermes process in a pane and restart it with the same profile.

    Returns True when the restarted pane comes back on an allowed model,
    False otherwise. Blocks for ~11s of sleeps while the restart settles.
    """
    target = f"{session}:{window}.{pane_idx}" if window else f"{session}.{pane_idx}"
    # Get the pane's TTY
    out, _ = run(f"tmux list-panes -t {target} -F '#{{pane_tty}}'")
    tty = out.strip()
    # Detect which profile was running (before killing, while ps can still see it)
    profile = get_profile_from_pane(tty)
    # Find and kill hermes on that TTY
    hermes_pid = get_hermes_pid_for_tty(tty)
    if hermes_pid:
        log(f"Killing hermes PID {hermes_pid} on {target} (tty={tty}, profile={profile})")
        run(f"kill {hermes_pid}")
        time.sleep(2)
    # Send Ctrl+C to clear any state (done even when no PID was found)
    run(f"tmux send-keys -t {target} C-c")
    time.sleep(1)
    # Restart hermes with the same profile
    if profile:
        cmd = f"hermes -p {profile} chat"
    else:
        cmd = "hermes chat"
    run(f"tmux send-keys -t {target} '{cmd}' Enter")
    log(f"Restarted hermes in {target} with: {cmd}")
    # Wait and verify
    time.sleep(8)
    new_model = get_model_from_pane(session, pane_idx, window)
    # NOTE(review): verification compares against the global ALLOWED_MODEL,
    # not PROFILE_MODELS[profile] — for profiles expecting another model
    # (e.g. bezalel/gpt-5.4) a successful restart would be reported as a
    # failure. Confirm whether per-profile verification was intended.
    if new_model and ALLOWED_MODEL in new_model:
        log(f"{target} now on {new_model}")
        return True
    else:
        log(f"{target} model after restart: {new_model}")
        return False
def verify_expected_model(provider_yaml, expected):
    """Return True when the YAML provider value equals *expected* after trimming whitespace."""
    actual_trimmed = provider_yaml.strip()
    expected_trimmed = expected.strip()
    return actual_trimmed == expected_trimmed
def check_config_drift():
    """Scan all relevant config.yaml files for provider drift. Does NOT modify anything.

    Returns a list of human-readable drift/error strings (empty when all
    configs match their expected provider).
    """
    issues = []
    # config name -> (path, expected model.provider value)
    CONFIGS = {
        "main_config": (os.path.expanduser("~/.hermes/config.yaml"), "nous"),
        "fenrir": (os.path.expanduser("~/.hermes/profiles/fenrir/config.yaml"), "nous"),
        "timmy_sprint": (os.path.expanduser("~/.hermes/profiles/timmy-sprint/config.yaml"), "nous"),
        "default_profile": (os.path.expanduser("~/.hermes/profiles/default/config.yaml"), "nous"),
    }
    for name, (path, expected_provider) in CONFIGS.items():
        if not os.path.exists(path):
            continue
        try:
            with open(path, "r") as f:
                content = f.read()
            # Parse YAML to correctly read model.provider (not the first provider: line)
            try:
                import yaml
                cfg = yaml.safe_load(content) or {}
            except ImportError:
                # Fallback: find provider under model: block via indentation-aware scan
                cfg = {}
                in_model = False
                for line in content.split("\n"):
                    stripped = line.strip()
                    indent = len(line) - len(line.lstrip())
                    # A top-level "model:" line opens the block of interest.
                    if stripped.startswith("model:") and indent == 0:
                        in_model = True
                        continue
                    # Any other non-blank top-level line closes it.
                    if in_model and indent == 0 and stripped:
                        in_model = False
                    if in_model and stripped.startswith("provider:"):
                        cfg = {"model": {"provider": stripped.split(":", 1)[1].strip()}}
                        break
            # Empty/missing values are skipped — only a present, different
            # provider counts as drift.
            actual = (cfg.get("model") or {}).get("provider", "")
            if actual and expected_provider and actual != expected_provider:
                issues.append(f"CONFIG DRIFT [{name}]: provider is '{actual}' (expected '{expected_provider}')")
        except Exception as e:
            # Report unreadable/unparseable configs instead of crashing the sweep.
            issues.append(f"CONFIG CHECK ERROR [{name}]: {e}")
    return issues
def main():
    """Sweep tmux panes and config files for model drift.

    Dry-run by default; pass --fix to restart drifted panes. Returns 0
    when everything is healthy, 1 when any drift was found.
    """
    fix_mode = "--fix" in sys.argv
    drift_found = False
    issues = []
    # Always check config files for provider drift (read-only, never writes)
    config_drift_issues = check_config_drift()
    if config_drift_issues:
        for issue in config_drift_issues:
            log(f"CONFIG DRIFT: {issue}")
    for session in TMUX_SESSIONS:
        panes = get_panes(session)
        for pane in panes:
            window = pane.get("window")
            target = f"{session}:{window}.{pane['index']}" if window else f"{session}.{pane['index']}"
            # Detect profile from running process (via the pane's TTY)
            out, _ = run(f"tmux list-panes -t {target} -F '#{{pane_tty}}'")
            tty = out.strip()
            profile = get_profile_from_pane(tty)
            model = get_model_from_pane(session, pane["index"], window)
            drifted, model_name = is_drifted(model, profile)
            if drifted:
                drift_found = True
                issues.append(f"{target}: {model_name} (profile={profile})")
                log(f"DRIFT DETECTED: {target} is on '{model_name}' (profile={profile}, expected='{PROFILE_MODELS.get(profile, ALLOWED_MODEL)}')")
                if fix_mode:
                    log(f"Auto-fixing {target}...")
                    success = kill_and_restart(session, pane["index"], window)
                    if not success:
                        issues.append(f" ↳ RESTART FAILED for {target}")
    if not drift_found:
        # Re-enumerates panes just to count them for the healthy message.
        total = sum(len(get_panes(s)) for s in TMUX_SESSIONS)
        log(f"All {total} panes healthy (on {ALLOWED_MODEL})")
    # Print summary for cron output
    if issues or config_drift_issues:
        print("\n=== MODEL DRIFT REPORT ===")
        for issue in issues:
            print(f" [PANE] {issue}")
        if config_drift_issues:
            for issue in config_drift_issues:
                print(f" [CONFIG] {issue}")
        if not fix_mode:
            print("\nRun with --fix to auto-restart drifted panes.")
        return 1
    return 0


if __name__ == "__main__":
    sys.exit(main())

View File

@@ -136,83 +136,6 @@ class TestFallbackModelValidation:
fb_issues = [i for i in issues if "fallback" in i.message.lower()]
assert len(fb_issues) == 0
def test_blank_fallback_fields_no_issues(self):
    """Both fallback_model fields empty is an intentional disable — no warnings."""
    config = {"fallback_model": {"provider": "", "model": ""}}
    issues = validate_config_structure(config)
    flagged = [i for i in issues if "fallback" in i.message.lower()]
    assert len(flagged) == 0
def test_blank_fallback_fields_with_whitespace_no_issues(self):
    """Whitespace-only fallback_model fields count as blank — no warnings."""
    config = {"fallback_model": {"provider": "   ", "model": "  "}}
    issues = validate_config_structure(config)
    flagged = [i for i in issues if "fallback" in i.message.lower()]
    assert len(flagged) == 0
def test_none_fallback_fields_no_issues(self):
    """None fallback_model fields should not trigger warnings."""
    config = {"fallback_model": {"provider": None, "model": None}}
    fallback_related = [
        i for i in validate_config_structure(config)
        if "fallback" in i.message.lower()
    ]
    assert fallback_related == []
def test_enabled_false_no_issues(self):
    """enabled: false should suppress warnings."""
    issues = validate_config_structure({"fallback_model": {"enabled": False}})
    fallback_related = [i for i in issues if "fallback" in i.message.lower()]
    assert fallback_related == []
def test_enabled_false_string_no_issues(self):
    """enabled: 'false' (string) should suppress warnings."""
    issues = validate_config_structure({"fallback_model": {"enabled": "false"}})
    fallback_related = [i for i in issues if "fallback" in i.message.lower()]
    assert fallback_related == []
def test_partial_blank_fallback_warns(self):
    """Partial blank fallback (only one field blank) should warn."""
    config = {
        "fallback_model": {
            "provider": "",
            "model": "anthropic/claude-sonnet-4",
        }
    }
    fallback_related = [
        i for i in validate_config_structure(config)
        if "fallback" in i.message.lower()
    ]
    # Exactly one warning, pointing at the blank provider field.
    assert len(fallback_related) == 1
    assert "provider" in fallback_related[0].message
def test_valid_fallback_with_enabled_true(self):
    """Valid fallback with enabled: true should not warn."""
    config = {
        "fallback_model": {
            "enabled": True,
            "provider": "openrouter",
            "model": "anthropic/claude-sonnet-4",
        }
    }
    fallback_related = [
        i for i in validate_config_structure(config)
        if "fallback" in i.message.lower()
    ]
    assert fallback_related == []
class TestMissingModelSection:
"""Warn when custom_providers exists but model section is missing."""
@@ -249,111 +172,3 @@ class TestConfigIssueDataclass:
a = ConfigIssue("error", "msg", "hint")
b = ConfigIssue("error", "msg", "hint")
assert a == b
class TestFallbackProvidersValidation:
    """fallback_providers must be a list of dicts with provider + model."""

    @staticmethod
    def _check(value):
        # Run validation on a config whose only key is fallback_providers.
        return validate_config_structure({"fallback_providers": value})

    def test_non_list(self):
        """fallback_providers as string should error."""
        errors = [
            i for i in self._check("openrouter:google/gemini-3-flash-preview")
            if i.severity == "error"
        ]
        assert any("fallback_providers" in e.message and "list" in e.message for e in errors)

    def test_dict_instead_of_list(self):
        """fallback_providers as dict should error."""
        errors = [
            i for i in self._check({"provider": "openrouter", "model": "test"})
            if i.severity == "error"
        ]
        assert any("fallback_providers" in e.message and "dict" in e.message for e in errors)

    def test_entry_missing_provider(self):
        """Entry without provider should warn."""
        issues = self._check([{"model": "google/gemini-3-flash-preview"}])
        assert any("missing 'provider'" in i.message for i in issues)

    def test_entry_missing_model(self):
        """Entry without model should warn."""
        issues = self._check([{"provider": "openrouter"}])
        assert any("missing 'model'" in i.message for i in issues)

    def test_entry_not_dict(self):
        """Non-dict entries should warn."""
        issues = self._check(["not-a-dict"])
        assert any("not a dict" in i.message for i in issues)

    def test_valid_entries(self):
        """Valid fallback_providers should produce no fallback-related issues."""
        issues = self._check([
            {"provider": "openrouter", "model": "google/gemini-3-flash-preview"},
            {"provider": "gemini", "model": "gemini-2.5-flash"},
        ])
        assert [i for i in issues if "fallback_providers" in i.message] == []

    def test_empty_list_no_issues(self):
        """Empty list is valid (fallback disabled)."""
        issues = self._check([])
        assert [i for i in issues if "fallback_providers" in i.message] == []
class TestSessionResetValidation:
    """session_reset.idle_minutes must be positive."""

    @staticmethod
    def _check(section):
        # Validate a config containing only the given session_reset section.
        return validate_config_structure({"session_reset": section})

    def test_zero_idle_minutes(self):
        """idle_minutes=0 should warn."""
        issues = self._check({"idle_minutes": 0})
        assert any("idle_minutes=0" in i.message for i in issues)

    def test_negative_idle_minutes(self):
        """idle_minutes=-5 should warn."""
        issues = self._check({"idle_minutes": -5})
        assert any("idle_minutes=-5" in i.message for i in issues)

    def test_string_idle_minutes(self):
        """idle_minutes as string should warn."""
        issues = self._check({"idle_minutes": "abc"})
        assert any("idle_minutes=" in i.message for i in issues)

    def test_valid_idle_minutes(self):
        """Valid idle_minutes should not warn."""
        issues = self._check({"idle_minutes": 1440})
        assert [i for i in issues if "idle_minutes" in i.message] == []

    def test_invalid_at_hour(self):
        """at_hour=25 should warn."""
        issues = self._check({"at_hour": 25})
        assert any("at_hour=25" in i.message for i in issues)

    def test_valid_at_hour(self):
        """Valid at_hour should not warn."""
        issues = self._check({"at_hour": 4})
        assert [i for i in issues if "at_hour" in i.message] == []

View File

@@ -1,73 +0,0 @@
"""Tests for cron scheduler cloud-provider terminal disabling (#379).
When a cron job runs on a cloud inference endpoint (Nous, OpenRouter, etc.),
the terminal toolset must be disabled because SSH keys don't exist on cloud
servers. Only local endpoints (localhost, 127.0.0.1, RFC-1918) retain
terminal access.
"""
import pytest
from agent.model_metadata import is_local_endpoint
class TestIsLocalEndpoint:
    """Verify is_local_endpoint correctly classifies endpoints."""

    def _assert_local(self, url):
        # Strict identity check: the function must return the bool True.
        assert is_local_endpoint(url) is True

    def _assert_remote(self, url):
        assert is_local_endpoint(url) is False

    def test_localhost(self):
        self._assert_local("http://localhost:11434/v1")

    def test_127_loopback(self):
        self._assert_local("http://127.0.0.1:8080/v1")

    def test_0_0_0_0(self):
        self._assert_local("http://0.0.0.0:11434/v1")

    def test_rfc1918_10(self):
        self._assert_local("http://10.0.0.5:8080/v1")

    def test_rfc1918_192(self):
        self._assert_local("http://192.168.1.100:11434/v1")

    def test_rfc1918_172(self):
        self._assert_local("http://172.16.0.1:8080/v1")

    def test_cloud_openrouter(self):
        self._assert_remote("https://openrouter.ai/api/v1")

    def test_cloud_nous(self):
        self._assert_remote("https://inference-api.nousresearch.com/v1")

    def test_cloud_anthropic(self):
        self._assert_remote("https://api.anthropic.com")

    def test_empty_url(self):
        self._assert_remote("")

    def test_none_url(self):
        self._assert_remote(None)
class TestCronDisabledToolsetsLogic:
    """Verify the disabled_toolsets logic matches scheduler expectations."""

    def _build_disabled(self, base_url, job=None):
        """Mirror the scheduler's disabled_toolsets logic."""
        from agent.model_metadata import is_local_endpoint

        disabled = ["cronjob", "messaging", "clarify"]
        # Cloud endpoints have no SSH keys, so the terminal toolset goes too.
        if not is_local_endpoint(base_url):
            disabled.append("terminal")
        return disabled

    def test_local_keeps_terminal(self):
        disabled = self._build_disabled("http://localhost:11434/v1")
        assert "terminal" not in disabled
        assert "cronjob" in disabled

    def test_cloud_disables_terminal(self):
        disabled = self._build_disabled("https://openrouter.ai/api/v1")
        assert "terminal" in disabled
        assert "cronjob" in disabled

    def test_empty_url_disables_terminal(self):
        assert "terminal" in self._build_disabled("")

View File

@@ -1,128 +0,0 @@
"""Tests for time-aware cron model routing — Issue #317."""
import pytest
from datetime import datetime
from agent.smart_model_routing import resolve_cron_model, _hour_in_window
class TestHourInWindow:
    """Hour-in-window detection including midnight wrap."""

    def test_normal_window(self):
        inside = _hour_in_window(18, 17, 22)
        before_start = _hour_in_window(16, 17, 22)
        at_end = _hour_in_window(22, 17, 22)
        assert inside is True
        assert before_start is False
        assert at_end is False

    def test_midnight_wrap(self):
        late_night = _hour_in_window(23, 22, 6)
        early_morning = _hour_in_window(3, 22, 6)
        midday = _hour_in_window(10, 22, 6)
        assert late_night is True
        assert early_morning is True
        assert midday is False

    def test_edge_cases(self):
        # A 0-24 window covers every hour of the day.
        assert _hour_in_window(0, 0, 24) is True
        assert _hour_in_window(23, 0, 24) is True
        # Wrapped window: start is inclusive, end is exclusive.
        assert _hour_in_window(0, 22, 6) is True
        assert _hour_in_window(5, 22, 6) is True
        assert _hour_in_window(6, 22, 6) is False
class TestResolveCronModel:
    """Time-aware model resolution for cron jobs."""

    # Reference timestamps: inside and outside the default 17-22 window.
    EVENING = datetime(2026, 4, 12, 18, 0)
    MORNING = datetime(2026, 4, 12, 9, 0)

    def _config(self, **overrides):
        config = {
            "enabled": True,
            "fallback_model": "anthropic/claude-sonnet-4",
            "fallback_provider": "openrouter",
            "windows": [
                {"start_hour": 17, "end_hour": 22, "reason": "evening_error_peak"},
            ],
        }
        config.update(overrides)
        return config

    def test_disabled_returns_base(self):
        result = resolve_cron_model("mimo", {"enabled": False}, now=self.EVENING)
        assert result["model"] == "mimo"
        assert result["overridden"] is False

    def test_no_config_returns_base(self):
        result = resolve_cron_model("mimo", None)
        assert result["model"] == "mimo"
        assert result["overridden"] is False

    def test_no_windows_returns_base(self):
        result = resolve_cron_model("mimo", {"enabled": True, "windows": []}, now=self.EVENING)
        assert result["overridden"] is False

    def test_evening_window_overrides(self):
        result = resolve_cron_model("mimo", self._config(), now=self.EVENING)
        assert result["model"] == "anthropic/claude-sonnet-4"
        assert result["provider"] == "openrouter"
        assert result["overridden"] is True
        assert "evening_error_peak" in result["reason"]
        assert "hour=18" in result["reason"]

    def test_outside_window_keeps_base(self):
        result = resolve_cron_model("mimo", self._config(), now=self.MORNING)
        assert result["model"] == "mimo"
        assert result["overridden"] is False

    def test_window_boundary_start_inclusive(self):
        at_start = datetime(2026, 4, 12, 17, 0)
        assert resolve_cron_model("mimo", self._config(), now=at_start)["overridden"] is True

    def test_window_boundary_end_exclusive(self):
        at_end = datetime(2026, 4, 12, 22, 0)
        assert resolve_cron_model("mimo", self._config(), now=at_end)["overridden"] is False

    def test_midnight_window(self):
        config = self._config(windows=[{"start_hour": 22, "end_hour": 6, "reason": "overnight"}])
        for when, expected in [
            (datetime(2026, 4, 12, 23, 0), True),
            (datetime(2026, 4, 13, 3, 0), True),
            (datetime(2026, 4, 12, 10, 0), False),
        ]:
            assert resolve_cron_model("mimo", config, now=when)["overridden"] is expected

    def test_per_window_model_override(self):
        window = {
            "start_hour": 17, "end_hour": 22,
            "model": "anthropic/claude-opus-4-6", "provider": "anthropic", "reason": "peak",
        }
        result = resolve_cron_model("mimo", self._config(windows=[window]), now=self.EVENING)
        assert result["model"] == "anthropic/claude-opus-4-6"
        assert result["provider"] == "anthropic"

    def test_first_matching_window_wins(self):
        config = self._config(windows=[
            {"start_hour": 17, "end_hour": 20, "model": "strong-1", "provider": "p1", "reason": "w1"},
            {"start_hour": 19, "end_hour": 22, "model": "strong-2", "provider": "p2", "reason": "w2"},
        ])
        overlap = datetime(2026, 4, 12, 19, 0)
        assert resolve_cron_model("mimo", config, now=overlap)["model"] == "strong-1"

    def test_no_fallback_model_keeps_base(self):
        config = {"enabled": True, "windows": [{"start_hour": 17, "end_hour": 22, "reason": "test"}]}
        result = resolve_cron_model("mimo", config, now=self.EVENING)
        assert result["overridden"] is False
        assert result["model"] == "mimo"

    def test_malformed_windows_skipped(self):
        config = self._config(windows=[
            "not-a-dict",
            {"start_hour": 17},
            {"end_hour": 22},
            {"start_hour": "bad", "end_hour": "bad"},
            {"start_hour": 17, "end_hour": 22, "reason": "valid"},
        ])
        result = resolve_cron_model("mimo", config, now=self.EVENING)
        assert result["overridden"] is True
        assert "valid" in result["reason"]

    def test_multiple_windows_coverage(self):
        config = self._config(windows=[
            {"start_hour": 17, "end_hour": 22, "reason": "evening"},
            {"start_hour": 2, "end_hour": 5, "reason": "overnight"},
        ])
        for when, expected in [
            (datetime(2026, 4, 12, 20, 0), True),
            (datetime(2026, 4, 13, 3, 0), True),
            (datetime(2026, 4, 12, 10, 0), False),
        ]:
            assert resolve_cron_model("mimo", config, now=when)["overridden"] is expected

View File

@@ -665,127 +665,6 @@ class TestPruneSessions:
# =========================================================================
# =========================================================================
# Garbage Collect
# =========================================================================
class TestGarbageCollect:
    @staticmethod
    def _backdate(db, session_id, age_seconds):
        """Rewrite started_at so the session appears age_seconds old."""
        db._conn.execute(
            "UPDATE sessions SET started_at = ? WHERE id = ?",
            (time.time() - age_seconds, session_id),
        )
        db._conn.commit()

    def test_gc_deletes_empty_old_sessions(self, db):
        """Empty sessions (0 messages) older than 24h should be deleted."""
        db.create_session(session_id="empty_old", source="cli")
        db.end_session("empty_old", end_reason="done")
        self._backdate(db, "empty_old", 48 * 3600)  # 48 hours ago
        # Recent empty session should be kept
        db.create_session(session_id="empty_new", source="cli")
        db.end_session("empty_new", end_reason="done")
        result = db.garbage_collect()
        assert result["empty"] == 1
        assert result["trivial"] == 0
        assert result["total"] == 1
        assert db.get_session("empty_old") is None
        assert db.get_session("empty_new") is not None

    def test_gc_deletes_trivial_old_sessions(self, db):
        """Sessions with 1-5 messages older than 7 days should be deleted."""
        db.create_session(session_id="trivial_old", source="cli")
        for n in range(3):
            db.append_message("trivial_old", role="user", content=f"msg {n}")
        db.end_session("trivial_old", end_reason="done")
        self._backdate(db, "trivial_old", 10 * 86400)  # 10 days ago
        result = db.garbage_collect()
        assert result["trivial"] == 1
        assert result["total"] == 1
        assert db.get_session("trivial_old") is None

    def test_gc_keeps_active_sessions(self, db):
        """Active (not ended) sessions should never be deleted."""
        db.create_session(session_id="active_old", source="cli")
        # Backdate but don't end
        self._backdate(db, "active_old", 48 * 3600)
        result = db.garbage_collect()
        assert result["total"] == 0
        assert db.get_session("active_old") is not None

    def test_gc_keeps_substantial_sessions(self, db):
        """Sessions with >5 messages should never be deleted."""
        db.create_session(session_id="big_old", source="cli")
        for n in range(10):
            db.append_message("big_old", role="user", content=f"msg {n}")
        db.end_session("big_old", end_reason="done")
        self._backdate(db, "big_old", 365 * 86400)  # 1 year ago
        result = db.garbage_collect()
        assert result["total"] == 0
        assert db.get_session("big_old") is not None

    def test_gc_dry_run_does_not_delete(self, db):
        """dry_run=True should return counts but not delete anything."""
        db.create_session(session_id="empty_old", source="cli")
        db.end_session("empty_old", end_reason="done")
        self._backdate(db, "empty_old", 48 * 3600)
        result = db.garbage_collect(dry_run=True)
        assert result["total"] == 1
        assert db.get_session("empty_old") is not None  # Still exists

    def test_gc_with_source_filter(self, db):
        """--source should only GC sessions from that source."""
        for session_id, source in [("old_cli", "cli"), ("old_tg", "telegram")]:
            db.create_session(session_id=session_id, source=source)
            db.end_session(session_id, end_reason="done")
            self._backdate(db, session_id, 48 * 3600)
        result = db.garbage_collect(source="cli")
        assert result["total"] == 1
        assert db.get_session("old_cli") is None
        assert db.get_session("old_tg") is not None

    def test_gc_handles_child_sessions(self, db):
        """Child sessions should be deleted when parent is GC'd."""
        db.create_session(session_id="parent_old", source="cli")
        db.end_session("parent_old", end_reason="done")
        self._backdate(db, "parent_old", 48 * 3600)
        # Create child session
        db.create_session(session_id="child", source="cli", parent_session_id="parent_old")
        db.end_session("child", end_reason="done")
        result = db.garbage_collect()
        assert result["total"] == 1
        assert db.get_session("parent_old") is None
        assert db.get_session("child") is None
# Schema and WAL mode
# =========================================================================

View File

@@ -1,316 +0,0 @@
"""
Test session template manager functionality.
"""
import json
import pytest
import tempfile
from pathlib import Path
from unittest.mock import Mock, patch, MagicMock
from tools.session_template_manager import (
SessionTemplateManager,
SessionTemplate,
ToolCallTemplate,
TaskType
)
class TestSessionTemplateManager:
    """Test session template manager."""

    @staticmethod
    def _calls(*names):
        """Build minimal tool-call dicts for classification tests."""
        return [{"tool_name": name} for name in names]

    @staticmethod
    def _tool_call_templates():
        """One successful execute_code call, shared by several tests."""
        return [
            ToolCallTemplate(
                tool_name="execute_code",
                arguments={"code": "print('hello')"},
                result="hello",
                success=True,
                execution_time=0.1,
                turn_number=0,
            )
        ]

    @staticmethod
    def _template(template_id, task_type, name, description,
                  tool_calls=None, created_at=1234567890.0,
                  success_rate=1.0, usage_count=0):
        """Construct a SessionTemplate with test defaults."""
        return SessionTemplate(
            template_id=template_id,
            task_type=task_type,
            name=name,
            description=description,
            tool_calls=tool_calls or [],
            source_session_id=None,
            created_at=created_at,
            success_rate=success_rate,
            usage_count=usage_count,
        )

    def test_classify_task_type_code(self):
        """Test task type classification for code-heavy sessions."""
        manager = SessionTemplateManager()
        calls = self._calls("execute_code", "execute_code", "execute_code", "read_file")
        assert manager.classify_task_type(calls) == TaskType.CODE

    def test_classify_task_type_file(self):
        """Test task type classification for file-heavy sessions."""
        manager = SessionTemplateManager()
        calls = self._calls("read_file", "write_file", "patch", "search_files")
        assert manager.classify_task_type(calls) == TaskType.FILE

    def test_classify_task_type_research(self):
        """Test task type classification for research-heavy sessions."""
        manager = SessionTemplateManager()
        calls = self._calls("web_search", "web_fetch", "browser_navigate")
        assert manager.classify_task_type(calls) == TaskType.RESEARCH

    def test_classify_task_type_mixed(self):
        """Test task type classification for mixed sessions."""
        manager = SessionTemplateManager()
        calls = self._calls("execute_code", "read_file", "web_search")
        assert manager.classify_task_type(calls) == TaskType.MIXED

    def test_template_creation(self):
        """Test creating a template."""
        with tempfile.TemporaryDirectory() as tmpdir:
            template_dir = Path(tmpdir)
            manager = SessionTemplateManager(template_dir=template_dir)
            template = self._template(
                "test_template", TaskType.CODE, "Test Template",
                "A test template", tool_calls=self._tool_call_templates(),
            )
            manager.templates["test_template"] = template
            manager._save_template(template)
            # Verify the template was saved and round-trips through JSON.
            template_file = template_dir / "test_template.json"
            assert template_file.exists()
            data = json.loads(template_file.read_text())
            assert data["template_id"] == "test_template"
            assert data["task_type"] == "code"

    def test_template_injection(self):
        """Test injecting a template into messages."""
        with tempfile.TemporaryDirectory() as tmpdir:
            manager = SessionTemplateManager(template_dir=Path(tmpdir))
            template = self._template(
                "test_template", TaskType.CODE, "Test Template",
                "A test template", tool_calls=self._tool_call_templates(),
            )
            manager.templates["test_template"] = template
            messages = [
                {"role": "system", "content": "You are a helpful assistant."},
                {"role": "user", "content": "Hello"},
            ]
            updated = manager.inject_template_into_messages(template, messages)
            # Template content must be added to the conversation.
            assert len(updated) > len(messages)
            assert any("Session template loaded" in str(m.get("content", ""))
                       for m in updated)
            # Injection bumps the usage counter.
            assert template.usage_count == 1

    def test_get_template_for_task(self):
        """Test getting template for task type."""
        with tempfile.TemporaryDirectory() as tmpdir:
            manager = SessionTemplateManager(template_dir=Path(tmpdir))
            manager.templates["code_template"] = self._template(
                "code_template", TaskType.CODE, "Code Template", "A code template",
            )
            manager.templates["file_template"] = self._template(
                "file_template", TaskType.FILE, "File Template", "A file template",
                created_at=1234567891.0, success_rate=0.9, usage_count=5,
            )
            # Each registered task type resolves to its template.
            assert manager.get_template_for_task(TaskType.CODE).template_id == "code_template"
            assert manager.get_template_for_task(TaskType.FILE).template_id == "file_template"
            # Unregistered task types resolve to None.
            assert manager.get_template_for_task(TaskType.RESEARCH) is None
class TestToolCallTemplate:
    """Test tool call template."""

    # Canonical constructor arguments shared by both tests.
    _FIELDS = {
        "tool_name": "execute_code",
        "arguments": {"code": "print('hello')"},
        "result": "hello",
        "success": True,
        "execution_time": 0.1,
        "turn_number": 0,
    }

    def test_to_dict(self):
        """Test converting to dictionary."""
        data = ToolCallTemplate(**self._FIELDS).to_dict()
        assert data["tool_name"] == "execute_code"
        assert data["arguments"] == {"code": "print('hello')"}
        assert data["result"] == "hello"
        assert data["success"] is True

    def test_from_dict(self):
        """Test creating from dictionary."""
        template = ToolCallTemplate.from_dict(dict(self._FIELDS))
        assert template.tool_name == "execute_code"
        assert template.arguments == {"code": "print('hello')"}
        assert template.result == "hello"
class TestSessionTemplate:
    """Test session template."""

    def test_to_dict(self):
        """Test converting to dictionary."""
        calls = [
            ToolCallTemplate(
                tool_name="execute_code",
                arguments={"code": "print('hello')"},
                result="hello",
                success=True,
                execution_time=0.1,
                turn_number=0,
            )
        ]
        data = SessionTemplate(
            template_id="test_template",
            task_type=TaskType.CODE,
            name="Test Template",
            description="A test template",
            tool_calls=calls,
            source_session_id=None,
            created_at=1234567890.0,
            success_rate=1.0,
            usage_count=0,
        ).to_dict()
        assert data["template_id"] == "test_template"
        # Enum is serialized to its string value.
        assert data["task_type"] == "code"
        assert len(data["tool_calls"]) == 1

    def test_from_dict(self):
        """Test creating from dictionary."""
        payload = {
            "template_id": "test_template",
            "task_type": "code",
            "name": "Test Template",
            "description": "A test template",
            "tool_calls": [
                {
                    "tool_name": "execute_code",
                    "arguments": {"code": "print('hello')"},
                    "result": "hello",
                    "success": True,
                    "execution_time": 0.1,
                    "turn_number": 0,
                }
            ],
            "source_session_id": None,
            "created_at": 1234567890.0,
            "success_rate": 1.0,
            "usage_count": 0,
        }
        template = SessionTemplate.from_dict(payload)
        assert template.template_id == "test_template"
        assert template.task_type == TaskType.CODE
        assert len(template.tool_calls) == 1
if __name__ == "__main__":
    # Allow running this test module directly without the pytest CLI.
    pytest.main([__file__])

View File

@@ -0,0 +1,107 @@
"""Tests for gateway token count persistence to SessionEntry and SessionDB.
Regression test for #316 — token tracking all zeros. The gateway must
propagate input_tokens / output_tokens from the agent result to both the
SessionEntry (sessions.json) and the SQLite session DB.
"""
import json
from datetime import datetime
from unittest.mock import MagicMock
import pytest
from gateway.session import SessionEntry
class TestUpdateSessionTokenFields:
    """Verify SessionEntry token fields are updated and serialized correctly."""

    @staticmethod
    def _entry(session_key, session_id, **token_fields):
        """Build a SessionEntry with fresh timestamps and the given token fields."""
        now = datetime.now()
        return SessionEntry(
            session_key=session_key,
            session_id=session_id,
            created_at=now,
            updated_at=now,
            **token_fields,
        )

    def test_session_entry_to_dict_includes_tokens(self):
        serialized = self._entry(
            "tg:123", "sid-1",
            input_tokens=1000,
            output_tokens=500,
            total_tokens=1500,
            estimated_cost_usd=0.05,
        ).to_dict()
        assert serialized["input_tokens"] == 1000
        assert serialized["output_tokens"] == 500
        assert serialized["total_tokens"] == 1500
        assert serialized["estimated_cost_usd"] == 0.05

    def test_session_entry_from_dict_restores_tokens(self):
        now = datetime.now().isoformat()
        entry = SessionEntry.from_dict({
            "session_key": "tg:123",
            "session_id": "sid-1",
            "created_at": now,
            "updated_at": now,
            "input_tokens": 42,
            "output_tokens": 21,
            "total_tokens": 63,
            "estimated_cost_usd": 0.001,
        })
        assert entry.input_tokens == 42
        assert entry.output_tokens == 21
        assert entry.total_tokens == 63
        assert entry.estimated_cost_usd == 0.001

    def test_session_entry_roundtrip_preserves_tokens(self):
        """to_dict -> from_dict must preserve all token fields."""
        original = self._entry(
            "cron:job7", "sid-7",
            input_tokens=9999,
            output_tokens=1234,
            total_tokens=11233,
            cache_read_tokens=500,
            cache_write_tokens=100,
            estimated_cost_usd=0.42,
        )
        restored = SessionEntry.from_dict(original.to_dict())
        assert restored.input_tokens == 9999
        assert restored.output_tokens == 1234
        assert restored.total_tokens == 11233
        assert restored.cache_read_tokens == 500
        assert restored.cache_write_tokens == 100
        assert restored.estimated_cost_usd == 0.42
class TestAgentResultTokenExtraction:
    """Verify the gateway extracts token counts from agent_result correctly."""

    def test_agent_result_has_expected_keys(self):
        """Simulate what _run_agent returns and verify all token keys exist."""
        result = {
            "final_response": "hello",
            "input_tokens": 100,
            "output_tokens": 50,
            "total_tokens": 150,
            "cache_read_tokens": 10,
            "cache_write_tokens": 5,
            "reasoning_tokens": 0,
            "estimated_cost_usd": 0.002,
            "last_prompt_tokens": 100,
            "model": "test-model",
            "session_id": "test-session-123",
        }
        # These are the extractions the gateway performs.
        # BUG FIX: the previous asserts read `result.get(...) or 0 == 100`,
        # which Python parses as `result.get(...) or (0 == 100)` because
        # comparison binds tighter than `or` — so the assert passed for ANY
        # truthy value. Parenthesize the coalescing expression so the
        # comparison actually checks the extracted count.
        assert (result.get("input_tokens", 0) or 0) == 100
        assert (result.get("output_tokens", 0) or 0) == 50
        assert (result.get("total_tokens", 0) or 0) == 150
        assert result.get("estimated_cost_usd") == 0.002

    def test_agent_result_zero_fallback(self):
        """When token keys are missing, defaults to 0."""
        result = {"final_response": "ok"}
        # Same precedence fix as above: without parentheses these reduced to
        # `0 or (0 == 0)` and were vacuously true.
        assert (result.get("input_tokens", 0) or 0) == 0
        assert (result.get("output_tokens", 0) or 0) == 0
        assert (result.get("total_tokens", 0) or 0) == 0

View File

@@ -201,17 +201,6 @@ def _format_job(job: Dict[str, Any]) -> Dict[str, Any]:
"paused_at": job.get("paused_at"),
"paused_reason": job.get("paused_reason"),
}
# Health timestamps
if job.get("last_error_at"):
result["last_error_at"] = job["last_error_at"]
if job.get("last_success_at"):
result["last_success_at"] = job["last_success_at"]
if job.get("error_resolved_at"):
result["error_resolved_at"] = job["error_resolved_at"]
if job.get("error_cleared_at"):
result["error_cleared_at"] = job["error_cleared_at"]
if job.get("script"):
result["script"] = job["script"]
return result
@@ -337,13 +326,6 @@ def cronjob(
if result is None:
return json.dumps({"success": False, "error": "Job not found"}, indent=2)
return json.dumps(result, indent=2)
if normalized == "clear_error":
from cron.jobs import clear_job_error
job = clear_job_error(job_id)
if job is None:
return json.dumps({"success": False, "error": "Job not found"}, indent=2)
return json.dumps({"success": True, "job": _format_job(job)}, indent=2)
if normalized == "update":
updates: Dict[str, Any] = {}

View File

@@ -1,507 +0,0 @@
"""
Session Template Manager for Hermes Agent.
Extracts successful tool calls from completed sessions and creates templates
that can be injected into new sessions to establish feedback loops early.
Based on research finding: code-heavy sessions (execute_code dominant in first
30 turns) improve over time. File-heavy sessions degrade. The key is
deterministic feedback loops, not arbitrary context.
"""
import json
import logging
import os
import sqlite3
import time
from datetime import datetime
from pathlib import Path
from typing import Dict, List, Optional, Any, Tuple
from dataclasses import dataclass, asdict
from enum import Enum
logger = logging.getLogger(__name__)
# Default template directory
DEFAULT_TEMPLATE_DIR = Path.home() / ".hermes" / "session-templates"
class TaskType(Enum):
    """Task type classification for session templates."""

    CODE = "code"          # dominated by code-execution tools
    FILE = "file"          # dominated by file-manipulation tools
    RESEARCH = "research"  # dominated by web/browser tools
    MIXED = "mixed"        # no single tool family dominates
@dataclass
class ToolCallTemplate:
    """A single tool call template extracted from a successful session."""

    tool_name: str                # name of the tool that was invoked
    arguments: Dict[str, Any]     # arguments passed to the tool
    result: str                   # textual result the tool produced
    success: bool                 # whether the call succeeded
    execution_time: float         # wall-clock seconds the call took
    turn_number: int              # conversation turn the call occurred on

    def to_dict(self) -> Dict[str, Any]:
        """Convert to dictionary for JSON serialization."""
        return asdict(self)

    @classmethod
    def from_dict(cls, data: Dict[str, Any]) -> "ToolCallTemplate":
        """Create from dictionary."""
        return cls(**data)
@dataclass
class SessionTemplate:
    """A complete session template with multiple tool calls."""

    template_id: str                        # unique identifier / filename stem
    task_type: TaskType                     # classification of the session
    name: str                               # human-readable title
    description: str                        # short free-text description
    tool_calls: List[ToolCallTemplate]      # ordered extracted tool calls
    source_session_id: Optional[str]        # session the template came from
    created_at: float                       # Unix timestamp of creation
    success_rate: float                     # fraction of successful uses
    usage_count: int                        # how many times it was injected

    def to_dict(self) -> Dict[str, Any]:
        """Convert to dictionary for JSON serialization."""
        data = asdict(self)
        # Enum is not JSON-serializable; store its string value.
        data['task_type'] = self.task_type.value
        return data

    @classmethod
    def from_dict(cls, data: Dict[str, Any]) -> 'SessionTemplate':
        """Create from dictionary.

        Operates on a shallow copy so the caller's dict is not mutated
        (the previous implementation overwrote data['task_type'] in place).
        Nested tool-call dicts are rehydrated into ToolCallTemplate objects
        so that from_dict(t.to_dict()) round-trips to equal objects.
        """
        data = dict(data)
        data['task_type'] = TaskType(data['task_type'])
        if 'tool_calls' in data:
            data['tool_calls'] = [
                tc if isinstance(tc, ToolCallTemplate) else ToolCallTemplate.from_dict(tc)
                for tc in data['tool_calls']
            ]
        return cls(**data)
class SessionTemplateManager:
"""Manages session templates for seeding new sessions."""
def __init__(self, template_dir: Optional[Path] = None, db_path: Optional[Path] = None):
    """
    Initialize the session template manager.
    Args:
        template_dir: Directory to store templates (default: ~/.hermes/session-templates/)
        db_path: Path to the session database (default: ~/.hermes/state.db)
    """
    # NOTE(review): `or` (rather than an `is None` check) means any falsy
    # argument also falls back to the defaults — presumably intentional.
    self.template_dir = template_dir or DEFAULT_TEMPLATE_DIR
    self.db_path = db_path or Path.home() / ".hermes" / "state.db"
    # Ensure template directory exists
    self.template_dir.mkdir(parents=True, exist_ok=True)
    # Load existing templates
    self.templates: Dict[str, SessionTemplate] = {}
    self._load_templates()
def _load_templates(self):
    """Load all templates from the template directory."""
    for template_file in self.template_dir.glob("*.json"):
        try:
            template = SessionTemplate.from_dict(json.loads(template_file.read_text()))
        except Exception as e:
            # A single corrupt file must not prevent loading the rest.
            logger.warning(f"Failed to load template {template_file}: {e}")
        else:
            self.templates[template.template_id] = template
def _save_template(self, template: SessionTemplate):
    """Save a template to disk."""
    destination = self.template_dir / f"{template.template_id}.json"
    destination.write_text(json.dumps(template.to_dict(), indent=2))
def classify_task_type(self, tool_calls: List[Dict[str, Any]]) -> TaskType:
"""
Classify the task type based on tool calls.
Args:
tool_calls: List of tool calls from a session
Returns:
TaskType classification
"""
if not tool_calls:
return TaskType.MIXED
# Count tool types
code_tools = {'execute_code', 'code_execution'}
file_tools = {'read_file', 'write_file', 'patch', 'search_files'}
research_tools = {'web_search', 'web_fetch', 'browser_navigate'}
code_count = sum(1 for tc in tool_calls if tc.get('tool_name') in code_tools)
file_count = sum(1 for tc in tool_calls if tc.get('tool_name') in file_tools)
research_count = sum(1 for tc in tool_calls if tc.get('tool_name') in research_tools)
total = len(tool_calls)
if total == 0:
return TaskType.MIXED
# Determine dominant type
code_ratio = code_count / total
file_ratio = file_count / total
research_ratio = research_count / total
if code_ratio > 0.6:
return TaskType.CODE
elif file_ratio > 0.6:
return TaskType.FILE
elif research_ratio > 0.6:
return TaskType.RESEARCH
else:
return TaskType.MIXED
def extract_successful_tool_calls(self, session_id: str, max_calls: int = 10) -> List[ToolCallTemplate]:
"""
Extract successful tool calls from a completed session.
Args:
session_id: Session ID to extract from
max_calls: Maximum number of tool calls to extract
Returns:
List of ToolCallTemplate objects
"""
if not self.db_path.exists():
logger.warning(f"Session database not found: {self.db_path}")
return []
try:
conn = sqlite3.connect(str(self.db_path))
conn.row_factory = sqlite3.Row
# Get messages for the session
cursor = conn.execute("""
SELECT role, content, tool_calls, tool_name, timestamp
FROM messages
WHERE session_id = ?
ORDER BY timestamp
""", (session_id,))
messages = cursor.fetchall()
conn.close()
# Extract tool calls
tool_call_templates = []
turn_number = 0
for msg in messages:
if msg['role'] == 'assistant' and msg['tool_calls']:
try:
tool_calls = json.loads(msg['tool_calls'])
for tc in tool_calls:
if len(tool_call_templates) >= max_calls:
break
tool_name = tc.get('function', {}).get('name')
if not tool_name:
continue
# Parse arguments
try:
arguments = json.loads(tc.get('function', {}).get('arguments', '{}'))
except:
arguments = {}
# Create template (result will be filled from tool response)
template = ToolCallTemplate(
tool_name=tool_name,
arguments=arguments,
result="", # Will be filled from tool response
success=True, # Assume successful if we got a response
execution_time=0.0, # Not tracked in current schema
turn_number=turn_number
)
tool_call_templates.append(template)
turn_number += 1
except json.JSONDecodeError:
continue
elif msg['role'] == 'tool' and tool_call_templates:
# Fill in the result for the last tool call
if tool_call_templates[-1].result == "":
tool_call_templates[-1].result = msg['content'] or ""
return tool_call_templates
except Exception as e:
logger.error(f"Failed to extract tool calls from session {session_id}: {e}")
return []
def create_template_from_session(self, session_id: str,
name: Optional[str] = None,
description: Optional[str] = None,
max_calls: int = 10) -> Optional[SessionTemplate]:
"""
Create a session template from a completed session.
Args:
session_id: Session ID to create template from
name: Template name (auto-generated if None)
description: Template description (auto-generated if None)
max_calls: Maximum number of tool calls to include
Returns:
SessionTemplate object or None if failed
"""
# Extract tool calls
tool_calls = self.extract_successful_tool_calls(session_id, max_calls)
if not tool_calls:
logger.warning(f"No successful tool calls found in session {session_id}")
return None
# Classify task type
task_type = self.classify_task_type([tc.to_dict() for tc in tool_calls])
# Generate template ID
template_id = f"{task_type.value}_{session_id[:8]}_{int(time.time())}"
# Auto-generate name and description if not provided
if not name:
name = f"{task_type.value.title()} Template from {session_id[:8]}"
if not description:
tool_names = [tc.tool_name for tc in tool_calls]
description = f"Template with {len(tool_calls)} successful tool calls: {', '.join(tool_names[:3])}"
# Create template
template = SessionTemplate(
template_id=template_id,
task_type=task_type,
name=name,
description=description,
tool_calls=tool_calls,
source_session_id=session_id,
created_at=time.time(),
success_rate=1.0, # All extracted calls were successful
usage_count=0
)
# Save template
self.templates[template_id] = template
self._save_template(template)
logger.info(f"Created template {template_id} from session {session_id}")
return template
def get_template_for_task(self, task_type: TaskType) -> Optional[SessionTemplate]:
"""
Get the best template for a given task type.
Args:
task_type: Type of task
Returns:
Best matching SessionTemplate or None
"""
matching_templates = [
t for t in self.templates.values()
if t.task_type == task_type
]
if not matching_templates:
return None
# Sort by success rate and usage count
matching_templates.sort(
key=lambda t: (t.success_rate, -t.usage_count),
reverse=True
)
return matching_templates[0]
def inject_template_into_messages(self, template: SessionTemplate,
messages: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
"""
Inject a template into a list of messages for a new session.
Args:
template: Template to inject
messages: Existing messages list
Returns:
Modified messages list with template injected
"""
if not template.tool_calls:
return messages
# Create template injection messages
template_messages = []
# Add system message about template
template_messages.append({
"role": "system",
"content": f"Session template loaded: {template.name}\n"
f"Task type: {template.task_type.value}\n"
f"This template contains {len(template.tool_calls)} successful tool calls "
f"to establish a feedback loop early."
})
# Add tool calls and results from template
for i, tool_call in enumerate(template.tool_calls):
# Add assistant message with tool call
template_messages.append({
"role": "assistant",
"content": None,
"tool_calls": [{
"id": f"template_{template.template_id}_{i}",
"type": "function",
"function": {
"name": tool_call.tool_name,
"arguments": json.dumps(tool_call.arguments)
}
}]
})
# Add tool response
template_messages.append({
"role": "tool",
"tool_call_id": f"template_{template.template_id}_{i}",
"content": tool_call.result
})
# Insert template messages at the beginning (after any existing system messages)
insert_index = 0
for i, msg in enumerate(messages):
if msg.get("role") != "system":
break
insert_index = i + 1
# Insert template messages
for i, msg in enumerate(template_messages):
messages.insert(insert_index + i, msg)
# Update template usage count
template.usage_count += 1
self._save_template(template)
return messages
def list_templates(self, task_type: Optional[TaskType] = None) -> List[SessionTemplate]:
"""
List all templates, optionally filtered by task type.
Args:
task_type: Optional task type filter
Returns:
List of SessionTemplate objects
"""
templates = list(self.templates.values())
if task_type:
templates = [t for t in templates if t.task_type == task_type]
# Sort by creation time (newest first)
templates.sort(key=lambda t: t.created_at, reverse=True)
return templates
def delete_template(self, template_id: str) -> bool:
"""
Delete a template.
Args:
template_id: ID of template to delete
Returns:
True if deleted, False if not found
"""
if template_id not in self.templates:
return False
# Remove from memory
del self.templates[template_id]
# Remove from disk
template_file = self.template_dir / f"{template_id}.json"
if template_file.exists():
template_file.unlink()
logger.info(f"Deleted template {template_id}")
return True
# CLI interface for template management
def main():
    """CLI interface for session template management."""
    import argparse

    def _handle_create(manager, opts):
        # Build a template out of an existing session's tool calls.
        template = manager.create_template_from_session(
            opts.session_id,
            name=opts.name,
            description=opts.description,
            max_calls=opts.max_calls,
        )
        if template:
            print(f"Created template: {template.template_id}")
            print(f" Name: {template.name}")
            print(f" Type: {template.task_type.value}")
            print(f" Tool calls: {len(template.tool_calls)}")
        else:
            print("Failed to create template")

    def _handle_list(manager, opts):
        # Show stored templates, optionally restricted to one task type.
        task_type = TaskType(opts.type) if opts.type else None
        templates = manager.list_templates(task_type)
        if not templates:
            print("No templates found")
            return
        print(f"Found {len(templates)} templates:")
        for t in templates:
            print(f" {t.template_id}: {t.name}")
            print(f" Type: {t.task_type.value}")
            print(f" Tool calls: {len(t.tool_calls)}")
            print(f" Usage: {t.usage_count}")
            print(f" Created: {datetime.fromtimestamp(t.created_at).isoformat()}")
            print()

    def _handle_delete(manager, opts):
        # Remove a template by id, reporting success or absence.
        if manager.delete_template(opts.template_id):
            print(f"Deleted template: {opts.template_id}")
        else:
            print(f"Template not found: {opts.template_id}")

    parser = argparse.ArgumentParser(description="Session Template Manager")
    subparsers = parser.add_subparsers(dest="command", help="Command to execute")

    create_parser = subparsers.add_parser("create", help="Create template from session")
    create_parser.add_argument("session_id", help="Session ID to create template from")
    create_parser.add_argument("--name", help="Template name")
    create_parser.add_argument("--description", help="Template description")
    create_parser.add_argument("--max-calls", type=int, default=10, help="Max tool calls to extract")

    list_parser = subparsers.add_parser("list", help="List templates")
    list_parser.add_argument("--type", choices=["code", "file", "research", "mixed"],
                             help="Filter by task type")

    delete_parser = subparsers.add_parser("delete", help="Delete template")
    delete_parser.add_argument("template_id", help="Template ID to delete")

    args = parser.parse_args()
    logging.basicConfig(level=logging.INFO)
    manager = SessionTemplateManager()

    # Dispatch table replaces the original if/elif chain; unknown or missing
    # subcommands fall through to the usage text.
    handlers = {
        "create": _handle_create,
        "list": _handle_list,
        "delete": _handle_delete,
    }
    handler = handlers.get(args.command)
    if handler is None:
        parser.print_help()
    else:
        handler(manager, args)
# Run the CLI when this module is executed directly as a script.
if __name__ == "__main__":
    main()