Compare commits
2 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
| ac2bb0f773 | |||
| 1aa4a3d3c8 |
274
orchestration.py
274
orchestration.py
@@ -1,6 +1,274 @@
|
|||||||
"""Sovereign orchestration — Huey replaces 3,843 lines of homebrew."""
|
"""Sovereign orchestration — Huey replaces 3,843 lines of homebrew.
|
||||||
|
|
||||||
from huey import SqliteHuey, crontab
|
Pipeline tasks automatically track token usage via token_budget.py.
|
||||||
|
After each task completes, the Huey signal records usage for the pipeline.
|
||||||
|
"""
|
||||||
|
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
import subprocess
|
||||||
|
import sys
|
||||||
|
from datetime import datetime, timezone
|
||||||
from pathlib import Path
|
from pathlib import Path
|
||||||
|
|
||||||
huey = SqliteHuey(filename=str(Path.home() / ".hermes" / "orchestration.db"))
|
from huey import SqliteHuey, crontab, signals
|
||||||
|
|
||||||
|
# --- Setup ---
# All orchestration state lives under ~/.hermes (queue DB, logs, state files).
HERMES_HOME = Path.home() / ".hermes"
# Huey's task queue is backed by a SQLite file — no broker process needed.
huey = SqliteHuey(filename=str(HERMES_HOME / "orchestration.db"))

# Token budget integration: token_budget.py lives next to this file, so make
# its directory importable before attempting the import.
sys.path.insert(0, str(Path(__file__).parent))
try:
    from token_budget import record_usage, get_remaining, can_afford, get_report
    HAS_BUDGET = True
except ImportError:
    # Budget tracking is optional; pipelines still run without it.
    HAS_BUDGET = False
|
||||||
|
|
||||||
|
|
||||||
|
# --- Pipeline definitions ---
# Each entry names the shell script to run (relative to ~/timmy-config), the
# per-run token ceiling passed to the script as --max-tokens, and the
# pipelines that must already be running/complete before it may start.
# NOTE: dict order matters — the scheduler starts the first eligible
# pipeline in iteration order.
PIPELINES = {
    "playground-factory": {
        "script": "scripts/pipeline_playground_factory.sh",
        "max_tokens": 100_000,
        "dependencies": [],
    },
    "training-factory": {
        "script": "scripts/pipeline_training_factory.sh",
        "max_tokens": 150_000,
        "dependencies": [],
    },
    "knowledge-mine": {
        "script": "scripts/pipeline_knowledge_mine.sh",
        "max_tokens": 80_000,
        "dependencies": ["training-factory"],
    },
    "adversary": {
        "script": "scripts/pipeline_adversary.sh",
        "max_tokens": 50_000,
        "dependencies": ["knowledge-mine"],
    },
    "codebase-genome": {
        "script": "scripts/pipeline_codebase_genome.sh",
        "max_tokens": 120_000,
        "dependencies": [],
    },
}
|
||||||
|
|
||||||
|
|
||||||
|
# --- Token tracking signal ---
@huey.signal()
def track_tokens(signal, task, task_value=None, **kwargs):
    """Automatically log token usage after each pipeline task completes.

    Registered for all Huey signals, but acts only on SIGNAL_COMPLETE —
    the one signal that delivers the task's return value (``task_value``).
    The result dict produced by ``pipeline_task`` carries ``input_tokens``
    and ``output_tokens``, which are forwarded to token_budget.record_usage.
    """
    if not HAS_BUDGET:
        return

    # Only COMPLETE carries the task result; EXECUTING/ERROR/etc. have
    # nothing to record (task_value would be None anyway).
    if signal != signals.SIGNAL_COMPLETE:
        return

    # Only track pipeline tasks.  Huey names a task after its function
    # ("pipeline_task"); the original "pipeline." prefix check could never
    # match that, so budget tracking silently never fired.  The prefix is
    # kept for compatibility with any custom-named pipeline tasks.
    task_name = getattr(task, "name", "") or ""
    if task_name != "pipeline_task" and not task_name.startswith("pipeline."):
        return

    result = task_value if isinstance(task_value, dict) else {}

    # Prefer the pipeline name reported in the result dict; fall back to the
    # task's first positional argument, then to the task-name suffix.
    pipeline = result.get("pipeline")
    if not pipeline:
        args = getattr(task, "args", ()) or ()
        pipeline = args[0] if args else task_name.replace("pipeline.", "")

    input_tokens = result.get("input_tokens", 0)
    output_tokens = result.get("output_tokens", 0)
    if input_tokens or output_tokens:
        record_usage(pipeline, input_tokens, output_tokens)
|
||||||
|
|
||||||
|
|
||||||
|
# --- Pipeline tasks ---
def _parse_token_count(stdout: str, key: str) -> int:
    """Extract the integer following *key* (e.g. "input_tokens=") from script
    output.  Scans every line; the last parseable match wins.  Returns 0 when
    the key is absent or its value is malformed."""
    value = 0
    for line in stdout.splitlines():
        if key in line:
            try:
                value = int(line.split(key)[1].split()[0])
            except (ValueError, IndexError):
                pass
    return value


def _append_pipeline_log(log_path, result) -> None:
    """Append a timestamped record of the script's stdout/stderr to the log."""
    with open(log_path, "a") as f:
        f.write(f"\n--- {datetime.now(timezone.utc).isoformat()} ---\n")
        f.write(result.stdout)
        if result.stderr:
            f.write(f"\nSTDERR:\n{result.stderr}")


@huey.task()
def pipeline_task(name: str, max_tokens: int = None):
    """Run a single pipeline and return token usage stats.

    Always returns a dict containing ``input_tokens`` and ``output_tokens``
    (consumed by the token-tracking signal handler), plus either ``status``
    ("complete"/"failed"/"timeout"/"error") or an ``error`` message for
    pre-flight failures.
    """
    spec = PIPELINES.get(name)
    if not spec:
        return {"error": f"Unknown pipeline: {name}", "input_tokens": 0, "output_tokens": 0}

    script = spec["script"]
    budget = max_tokens or spec["max_tokens"]

    # Refuse to start if today's remaining budget cannot cover the ceiling.
    if HAS_BUDGET and not can_afford(budget):
        return {
            "error": f"Insufficient budget for {name} (need {budget}, have {get_remaining()})",
            "input_tokens": 0,
            "output_tokens": 0,
        }

    # Dependencies must be running or complete before we start.
    # NOTE(review): "running" counts as satisfied — confirm that is intended.
    for dep in spec.get("dependencies", []):
        dep_state = _get_pipeline_state(dep)
        if dep_state not in ("running", "complete"):
            return {
                "error": f"Dependency {dep} not met (state: {dep_state})",
                "input_tokens": 0,
                "output_tokens": 0,
            }

    # Run the pipeline script.
    script_path = Path.home() / "timmy-config" / script
    if not script_path.exists():
        return {"error": f"Script not found: {script_path}", "input_tokens": 0, "output_tokens": 0}

    _set_pipeline_state(name, "running")
    log_path = HERMES_HOME / "logs" / f"pipeline-{name}.log"
    log_path.parent.mkdir(parents=True, exist_ok=True)

    try:
        result = subprocess.run(
            ["bash", str(script_path), "--max-tokens", str(budget)],
            capture_output=True,
            text=True,
            timeout=3600,  # 1 hour max
        )

        # Token counts the script reported on stdout ("input_tokens=N").
        input_tokens = _parse_token_count(result.stdout, "input_tokens=")
        output_tokens = _parse_token_count(result.stdout, "output_tokens=")

        # If the script didn't report tokens, estimate ~4 chars per token.
        if not input_tokens and not output_tokens:
            output_tokens = len(result.stdout) // 4

        _append_pipeline_log(log_path, result)

        if result.returncode == 0:
            _set_pipeline_state(name, "complete")
            return {
                "pipeline": name,
                "status": "complete",
                "input_tokens": input_tokens,
                "output_tokens": output_tokens,
            }
        else:
            _set_pipeline_state(name, "failed")
            return {
                "pipeline": name,
                "status": "failed",
                "error": result.stderr[:500],
                "input_tokens": input_tokens,
                "output_tokens": output_tokens,
            }

    except subprocess.TimeoutExpired:
        _set_pipeline_state(name, "failed")
        return {"pipeline": name, "status": "timeout", "input_tokens": 0, "output_tokens": 0}
    except Exception as e:
        _set_pipeline_state(name, "failed")
        return {"pipeline": name, "status": "error", "error": str(e), "input_tokens": 0, "output_tokens": 0}
|
||||||
|
|
||||||
|
|
||||||
|
@huey.periodic_task(crontab(hour="*/6"))
def pipeline_scheduler():
    """Every six hours: enqueue the first pipeline whose dependencies are
    satisfied, reporting what was skipped and why."""
    report = ["=== Pipeline Scheduler ==="]

    # Bail out early if the daily token budget is spent.
    if HAS_BUDGET:
        remaining = get_remaining()
        report.append(f"Budget remaining: {remaining:,} tokens")
        if remaining <= 0:
            report.append("Budget exhausted. Skipping.")
            return "\n".join(report)

    def first_unmet_dependency(spec):
        # First dependency that is neither running nor complete, else None.
        for dep in spec.get("dependencies", []):
            if _get_pipeline_state(dep) not in ("running", "complete"):
                return dep
        return None

    launched = None
    for name, spec in PIPELINES.items():
        state = _get_pipeline_state(name)

        if state in ("running", "complete"):
            report.append(f"SKIP {name}: {state}")
            continue

        blocker = first_unmet_dependency(spec)
        if blocker is not None:
            report.append(f"SKIP {name}: dependency {blocker} not met")
            continue

        # Eligible — enqueue it and stop; one pipeline per scheduler tick.
        report.append(f"START {name}")
        pipeline_task(name)
        launched = name
        break

    if launched is None:
        report.append("No pipelines to start")

    return "\n".join(report)
|
||||||
|
|
||||||
|
|
||||||
|
# --- State management ---
# Per-pipeline state ("not_started"/"running"/"complete"/"failed") plus a
# last-updated timestamp, persisted as JSON under ~/.hermes.
STATE_FILE = HERMES_HOME / "pipeline_state.json"
|
||||||
|
|
||||||
|
|
||||||
|
def _get_pipeline_state(name: str) -> str:
    """Return the recorded state for *name*; "not_started" when unknown
    or when the state file is missing/unreadable."""
    if not STATE_FILE.exists():
        return "not_started"
    try:
        snapshot = json.loads(STATE_FILE.read_text())
    except (json.JSONDecodeError, OSError):
        return "not_started"
    entry = snapshot.get(name, {})
    return entry.get("state", "not_started")
|
||||||
|
|
||||||
|
|
||||||
|
def _set_pipeline_state(name: str, state: str):
    """Persist *state* for *name*, stamping the update time (UTC).
    A corrupt or unreadable state file is silently replaced."""
    existing = {}
    if STATE_FILE.exists():
        try:
            existing = json.loads(STATE_FILE.read_text())
        except (json.JSONDecodeError, OSError):
            existing = {}
    timestamp = datetime.now(timezone.utc).isoformat()
    existing[name] = {"state": state, "updated": timestamp}
    STATE_FILE.parent.mkdir(parents=True, exist_ok=True)
    STATE_FILE.write_text(json.dumps(existing, indent=2))
|
||||||
|
|
||||||
|
|
||||||
|
# --- CLI ---
# Minimal ad-hoc argument handling: query the budget, show pipeline states,
# or enqueue one pipeline by name.
if __name__ == "__main__":
    if "--budget" in sys.argv or "--report" in sys.argv:
        if HAS_BUDGET:
            print(get_report())
        else:
            print("token_budget module not available")
    elif "--status" in sys.argv:
        for name in PIPELINES:
            state = _get_pipeline_state(name)
            print(f" {name}: {state}")
    elif "--run" in sys.argv:
        idx = sys.argv.index("--run")
        # Guard: "--run" with no pipeline name used to raise IndexError.
        if idx + 1 >= len(sys.argv):
            print("Usage: orchestration.py [--budget|--status|--run PIPELINE]")
        else:
            name = sys.argv[idx + 1]
            print(f"Enqueuing pipeline: {name}")
            pipeline_task(name)  # enqueues via Huey; result handle unused
            print("Task enqueued")
    else:
        print("Usage: orchestration.py [--budget|--status|--run PIPELINE]")
|
||||||
|
|||||||
142
scripts/token_budget.py
Normal file
142
scripts/token_budget.py
Normal file
@@ -0,0 +1,142 @@
|
|||||||
|
#!/usr/bin/env python3
"""
token_budget.py — Daily token budget tracker for pipeline orchestration.

Tracks token usage per pipeline per day, enforces daily limits,
and provides a query interface for the orchestrator.

Data: ~/.hermes/pipeline_budget.json
"""

import json
import os  # NOTE(review): unused in this module — candidate for removal
from datetime import datetime, timezone
from pathlib import Path

# On-disk store for all budget data (daily buckets + lifetime totals).
BUDGET_FILE = Path.home() / ".hermes" / "pipeline_budget.json"
# Default cap on tokens spent per UTC day across all pipelines.
DEFAULT_DAILY_LIMIT = 500_000
|
||||||
|
|
||||||
|
|
||||||
|
def _load() -> dict:
    """Read the budget store; a missing or unreadable file yields {}."""
    if not BUDGET_FILE.exists():
        return {}
    try:
        return json.loads(BUDGET_FILE.read_text())
    except (json.JSONDecodeError, OSError):
        return {}
|
||||||
|
|
||||||
|
|
||||||
|
def _save(data: dict):
    """Persist the budget store, creating ~/.hermes if needed."""
    parent = BUDGET_FILE.parent
    parent.mkdir(parents=True, exist_ok=True)
    serialized = json.dumps(data, indent=2)
    BUDGET_FILE.write_text(serialized)
|
||||||
|
|
||||||
|
|
||||||
|
def today_key() -> str:
    """Key for today's budget bucket: the current UTC date as YYYY-MM-DD."""
    return datetime.now(timezone.utc).date().isoformat()
|
||||||
|
|
||||||
|
|
||||||
|
def get_daily_usage(pipeline: str = None) -> dict:
    """Return today's token usage.

    Without *pipeline*, returns the raw day bucket.  With *pipeline*,
    returns that pipeline's spend alongside the daily total.
    """
    store = _load()
    empty_day = {"tokens_used": 0, "pipelines": {}}
    day = store.get("daily", {}).get(today_key(), empty_day)
    if not pipeline:
        return day
    per_pipeline = day.get("pipelines", {})
    return {
        "pipeline": pipeline,
        "tokens_used": per_pipeline.get(pipeline, 0),
        "daily_total": day.get("tokens_used", 0),
    }
|
||||||
|
|
||||||
|
|
||||||
|
def get_remaining(limit: int = DEFAULT_DAILY_LIMIT) -> int:
    """Tokens still spendable today under *limit*; never negative."""
    spent = get_daily_usage().get("tokens_used", 0)
    remaining = limit - spent
    return remaining if remaining > 0 else 0
|
||||||
|
|
||||||
|
|
||||||
|
def can_afford(tokens: int, limit: int = DEFAULT_DAILY_LIMIT) -> bool:
    """True when today's remaining budget covers a spend of *tokens*."""
    return tokens <= get_remaining(limit)
|
||||||
|
|
||||||
|
|
||||||
|
def record_usage(pipeline: str, input_tokens: int, output_tokens: int) -> dict:
    """
    Record token usage for a pipeline task.

    Called automatically by the orchestrator after each pipeline task
    completes.  Updates the day bucket (total, per-pipeline tally,
    input/output/call breakdown) and the lifetime counters, persists
    the store, and returns a summary of the updated daily state.
    """
    total = input_tokens + output_tokens
    data = _load()
    today = today_key()

    daily = data.setdefault("daily", {})
    # Remember whether this is the first usage recorded today — needed
    # below to count the day in the lifetime stats.
    first_entry_today = today not in daily
    day = daily.setdefault(today, {"tokens_used": 0, "pipelines": {}})

    day["tokens_used"] = day.get("tokens_used", 0) + total
    pipes = day.setdefault("pipelines", {})
    pipes[pipeline] = pipes.get(pipeline, 0) + total

    # Per-pipeline input/output/call breakdown (consumed by get_report).
    breakdown = day.setdefault("breakdown", {})
    pb = breakdown.setdefault(pipeline, {"input": 0, "output": 0, "calls": 0})
    pb["input"] += input_tokens
    pb["output"] += output_tokens
    pb["calls"] += 1

    # Lifetime stats.  Fix: total_days was initialized but never
    # incremented; count each day on its first recorded usage.
    lifetime = data.setdefault("lifetime", {"total_tokens": 0, "total_days": 0})
    lifetime["total_tokens"] = lifetime.get("total_tokens", 0) + total
    if first_entry_today:
        lifetime["total_days"] = lifetime.get("total_days", 0) + 1

    _save(data)

    return {
        "pipeline": pipeline,
        "input_tokens": input_tokens,
        "output_tokens": output_tokens,
        "total": total,
        "daily_used": day["tokens_used"],
        "daily_remaining": get_remaining(),
    }
|
||||||
|
|
||||||
|
|
||||||
|
def get_report() -> str:
    """Generate a human-readable budget report."""
    store = _load()
    today = today_key()
    day = store.get("daily", {}).get(today, {"tokens_used": 0, "pipelines": {}})

    lines = [
        f"Token Budget — {today}",
        f" Daily usage: {day.get('tokens_used', 0):,} / {DEFAULT_DAILY_LIMIT:,}",
        f" Remaining: {get_remaining():,}",
        "",
        " Pipelines:",
    ]

    # Heaviest output-producers first (sort key intentionally matches the
    # original: output tokens only, not input + output).
    breakdown = day.get("breakdown", {})
    ordered = sorted(breakdown.items(), key=lambda item: item[1]["output"], reverse=True)
    for name, stats in ordered:
        combined = stats["input"] + stats["output"]
        lines.append(f" {name}: {combined:,} tokens ({stats['calls']} calls)")

    if not breakdown:
        lines.append(" (no pipelines run today)")

    lifetime = store.get("lifetime", {})
    lines.append("")
    lines.append(f" Lifetime: {lifetime.get('total_tokens', 0):,} total tokens")

    return "\n".join(lines)
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == "__main__":
|
||||||
|
import sys
|
||||||
|
if "--report" in sys.argv:
|
||||||
|
print(get_report())
|
||||||
|
elif "--remaining" in sys.argv:
|
||||||
|
print(get_remaining())
|
||||||
|
elif "--can-afford" in sys.argv:
|
||||||
|
idx = sys.argv.index("--can-afford")
|
||||||
|
tokens = int(sys.argv[idx + 1])
|
||||||
|
print("yes" if can_afford(tokens) else "no")
|
||||||
|
else:
|
||||||
|
print(get_report())
|
||||||
Reference in New Issue
Block a user