Compare commits

..

3 Commits

Author SHA1 Message Date
Alexander Whitestone
7bc6e39a93 refactor: break up MCPBridge.run() into focused helper methods
Some checks failed
Tests / lint (pull_request) Failing after 15s
Tests / test (pull_request) Has been skipped
Extract connection setup/message building, tool-call round processing,
and the multi-round loop into three private helpers:
- _build_initial_messages() — static, constructs prompt message list
- _process_round_tool_calls() — executes one round of tool calls
- _run_tool_loop() — drives the multi-round loop, returns result tuple

run() is now ~35 lines of logic (down from 129), with error recovery
consolidated in a single return at the end.

Fixes #1135

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-03-23 14:38:38 -04:00
4f8e86348c [claude] Build Timmy autonomous backlog triage loop (#1071) (#1141)
Some checks failed
Tests / lint (push) Has been cancelled
Tests / test (push) Has been cancelled
2026-03-23 18:32:27 +00:00
0c627f175b [gemini] refactor: Gracefully handle tool registration errors (#938) (#1132)
Some checks failed
Tests / lint (push) Has been cancelled
Tests / test (push) Has been cancelled
2026-03-23 18:26:40 +00:00
11 changed files with 1501 additions and 968 deletions

View File

@@ -289,14 +289,6 @@ class Settings(BaseSettings):
thinking_memory_check_every: int = 50 # check memory status every Nth thought
thinking_idle_timeout_minutes: int = 60 # pause thoughts after N minutes without user input
# ── Dreaming Mode ─────────────────────────────────────────────────
# When enabled, the agent replays past sessions during idle time to
# simulate alternative actions and propose behavioural rules.
dreaming_enabled: bool = True
dreaming_idle_threshold_minutes: int = 10 # idle minutes before dreaming starts
dreaming_cycle_seconds: int = 600 # seconds between dream attempts
dreaming_timeout_seconds: int = 60 # max LLM call time per dream cycle
# ── Gitea Integration ─────────────────────────────────────────────
# Local Gitea instance for issue tracking and self-improvement.
# These values are passed as env vars to the gitea-mcp server process.
@@ -312,6 +304,16 @@ class Settings(BaseSettings):
mcp_timeout: int = 15
mcp_bridge_timeout: int = 60 # HTTP timeout for MCP bridge Ollama calls (seconds)
# ── Backlog Triage Loop ────────────────────────────────────────────
# Autonomous loop: fetch open issues, score, assign to agents.
backlog_triage_enabled: bool = False
# Seconds between triage cycles (default: 15 minutes).
backlog_triage_interval_seconds: int = 900
# When True, score and summarize but don't write to Gitea.
backlog_triage_dry_run: bool = False
# Create a daily triage summary issue/comment.
backlog_triage_daily_summary: bool = True
# ── Loop QA (Self-Testing) ─────────────────────────────────────────
# Self-test orchestrator that probes capabilities alongside the thinking loop.
loop_qa_enabled: bool = True

View File

@@ -35,7 +35,6 @@ from dashboard.routes.chat_api_v1 import router as chat_api_v1_router
from dashboard.routes.daily_run import router as daily_run_router
from dashboard.routes.db_explorer import router as db_explorer_router
from dashboard.routes.discord import router as discord_router
from dashboard.routes.dreaming import router as dreaming_router
from dashboard.routes.experiments import router as experiments_router
from dashboard.routes.grok import router as grok_router
from dashboard.routes.health import router as health_router
@@ -220,36 +219,6 @@ async def _loop_qa_scheduler() -> None:
await asyncio.sleep(interval)
async def _dreaming_scheduler() -> None:
"""Background task: run idle-time dreaming cycles.
When the system has been idle for ``dreaming_idle_threshold_minutes``,
the dreaming engine replays a past session and simulates alternatives.
"""
from timmy.dreaming import dreaming_engine
await asyncio.sleep(15) # Stagger after loop QA scheduler
while True:
try:
if settings.dreaming_enabled:
await asyncio.wait_for(
dreaming_engine.dream_once(),
timeout=settings.dreaming_timeout_seconds + 10,
)
except TimeoutError:
logger.warning(
"Dreaming cycle timed out after %ds",
settings.dreaming_timeout_seconds,
)
except asyncio.CancelledError:
raise
except Exception as exc:
logger.error("Dreaming scheduler error: %s", exc)
await asyncio.sleep(settings.dreaming_cycle_seconds)
_PRESENCE_POLL_SECONDS = 30
_PRESENCE_INITIAL_DELAY = 3
@@ -410,7 +379,6 @@ def _startup_background_tasks() -> list[asyncio.Task]:
asyncio.create_task(_briefing_scheduler()),
asyncio.create_task(_thinking_scheduler()),
asyncio.create_task(_loop_qa_scheduler()),
asyncio.create_task(_dreaming_scheduler()),
asyncio.create_task(_presence_watcher()),
asyncio.create_task(_start_chat_integrations_background()),
]
@@ -673,7 +641,6 @@ app.include_router(daily_run_router)
app.include_router(quests_router)
app.include_router(scorecards_router)
app.include_router(sovereignty_metrics_router)
app.include_router(dreaming_router)
@app.websocket("/ws")

View File

@@ -1,85 +0,0 @@
"""Dreaming mode dashboard routes.
GET /dreaming/api/status — JSON status of the dreaming engine
GET /dreaming/api/recent — JSON list of recent dream records
POST /dreaming/api/trigger — Manually trigger a dream cycle (for testing)
GET /dreaming/partial — HTMX partial: dreaming status panel
"""
import logging
from fastapi import APIRouter, Request
from fastapi.responses import HTMLResponse, JSONResponse
from dashboard.templating import templates
from timmy.dreaming import dreaming_engine
logger = logging.getLogger(__name__)
router = APIRouter(prefix="/dreaming", tags=["dreaming"])
@router.get("/api/status", response_class=JSONResponse)
async def dreaming_status():
"""Return current dreaming engine status as JSON."""
return dreaming_engine.get_status()
@router.get("/api/recent", response_class=JSONResponse)
async def dreaming_recent(limit: int = 10):
"""Return recent dream records as JSON."""
dreams = dreaming_engine.get_recent_dreams(limit=limit)
return [
{
"id": d.id,
"session_excerpt": d.session_excerpt[:200],
"decision_point": d.decision_point[:200],
"simulation": d.simulation,
"proposed_rule": d.proposed_rule,
"created_at": d.created_at,
}
for d in dreams
]
@router.post("/api/trigger", response_class=JSONResponse)
async def dreaming_trigger():
"""Manually trigger a dream cycle (bypasses idle check).
Useful for testing and manual inspection. Forces idle state temporarily.
"""
from datetime import UTC, datetime, timedelta
from config import settings
# Temporarily back-date last activity to appear idle
original_time = dreaming_engine._last_activity_time
dreaming_engine._last_activity_time = datetime.now(UTC) - timedelta(
minutes=settings.dreaming_idle_threshold_minutes + 1
)
try:
dream = await dreaming_engine.dream_once()
finally:
dreaming_engine._last_activity_time = original_time
if dream:
return {
"status": "ok",
"dream_id": dream.id,
"proposed_rule": dream.proposed_rule,
"simulation": dream.simulation[:200],
}
return {"status": "skipped", "reason": "No dream produced (no sessions or LLM unavailable)"}
@router.get("/partial", response_class=HTMLResponse)
async def dreaming_partial(request: Request):
"""HTMX partial: dreaming status panel for the dashboard."""
status = dreaming_engine.get_status()
recent = dreaming_engine.get_recent_dreams(limit=5)
return templates.TemplateResponse(
request,
"partials/dreaming_status.html",
{"status": status, "recent_dreams": recent},
)

View File

@@ -1,32 +0,0 @@
{% if not status.enabled %}
<div class="dream-disabled text-muted small">Dreaming mode disabled</div>
{% elif status.dreaming %}
<div class="dream-active">
<span class="dream-pulse"></span>
<span class="dream-label">DREAMING</span>
<div class="dream-summary">{{ status.current_summary }}</div>
</div>
{% elif status.idle %}
<div class="dream-idle">
<span class="dream-dot dream-dot-idle"></span>
<span class="dream-label-idle">IDLE</span>
<span class="dream-idle-meta">{{ status.idle_minutes }}m — dream cycle pending</span>
</div>
{% else %}
<div class="dream-standby">
<span class="dream-dot dream-dot-standby"></span>
<span class="dream-label-standby">STANDBY</span>
<span class="dream-idle-meta">idle in {{ status.idle_threshold_minutes - status.idle_minutes }}m</span>
</div>
{% endif %}
{% if recent_dreams %}
<div class="dream-history mt-2">
{% for d in recent_dreams %}
<div class="dream-record">
<div class="dream-rule">{{ d.proposed_rule if d.proposed_rule else "No rule extracted" }}</div>
<div class="dream-meta">{{ d.created_at[:16] | replace("T", " ") }}</div>
</div>
{% endfor %}
</div>
{% endif %}

759
src/timmy/backlog_triage.py Normal file
View File

@@ -0,0 +1,759 @@
"""Autonomous backlog triage loop — Timmy scans Gitea and assigns work.
Continuously fetches open issues, scores/prioritizes them, and decides
what to work on next without waiting to be asked.
Loop flow::
while true:
1. Fetch all open issues from Gitea API
2. Score/prioritize by labels, age, type, blocked status
3. Identify unassigned high-priority items
4. Decide: assign to claude, dispatch to kimi, or flag for Alex
5. Execute the assignment (comment + assign)
6. Optionally post a daily triage summary
7. Sleep for configurable interval (default 15 min)
Priority tiers:
P0 — security, data loss, blocking bugs → immediate action
P1 — core functionality, ready issues → next sprint
P2 — improvements, low-score issues → backlog
P3 — philosophy, meta → someday/never (skip in triage)
Usage::
from timmy.backlog_triage import BacklogTriageLoop
loop = BacklogTriageLoop()
await loop.run_once() # single triage cycle
await loop.start() # background daemon loop
loop.stop() # graceful shutdown
"""
from __future__ import annotations
import asyncio
import logging
import re
from dataclasses import dataclass, field
from datetime import UTC, datetime, timedelta
from typing import Any
import httpx
from config import settings
logger = logging.getLogger(__name__)
# ── Constants ────────────────────────────────────────────────────────────────
# Minimum triage score to be considered "ready" for assignment
READY_THRESHOLD = 5
# Agent Gitea logins
AGENT_CLAUDE = "claude"
AGENT_KIMI = "kimi"
OWNER_LOGIN = "rockachopa" # Alex — human owner
# Labels
KIMI_READY_LABEL = "kimi-ready"
TRIAGE_DONE_LABEL = "triage-done"
# Tag sets (mirrors scripts/triage_score.py)
_BUG_TAGS = frozenset({"bug", "broken", "crash", "error", "fix", "regression", "hotfix"})
_FEATURE_TAGS = frozenset({"feature", "feat", "enhancement", "capability", "timmy-capability"})
_REFACTOR_TAGS = frozenset({"refactor", "cleanup", "tech-debt", "optimization", "perf"})
_META_TAGS = frozenset({"philosophy", "soul-gap", "discussion", "question", "rfc"})
_P0_TAGS = frozenset({"security", "data-loss", "blocking", "p0", "critical"})
_RESEARCH_TAGS = frozenset({"research", "kimi-ready", "investigation", "spike"})
_LOOP_TAG = "loop-generated"
# Regex patterns for scoring
_TAG_RE = re.compile(r"\[([^\]]+)\]")
_FILE_RE = re.compile(r"(?:src/|tests/|scripts/|\.py|\.html|\.js|\.yaml|\.toml|\.sh)", re.IGNORECASE)
_FUNC_RE = re.compile(r"(?:def |class |function |method |`\w+\(\)`)", re.IGNORECASE)
_ACCEPT_RE = re.compile(
r"(?:should|must|expect|verify|assert|test.?case|acceptance|criteria"
r"|pass(?:es|ing)|fail(?:s|ing)|return(?:s)?|raise(?:s)?)",
re.IGNORECASE,
)
_TEST_RE = re.compile(r"(?:tox|pytest|test_\w+|\.test\.|assert\s)", re.IGNORECASE)
_BLOCKED_RE = re.compile(r"\bblock(?:ed|s|ing)\b", re.IGNORECASE)
# ── Data types ───────────────────────────────────────────────────────────────
@dataclass
class ScoredIssue:
    """A Gitea issue enriched with triage scoring.

    ``scope``/``acceptance``/``alignment`` each range 0-3 (see the _score_*
    helpers); ``score`` is their sum and ``ready`` means the sum meets
    READY_THRESHOLD.
    """

    number: int  # Gitea issue number
    title: str  # title with [tag] brackets stripped (see score_issue)
    body: str  # raw issue body ("" when Gitea returns null)
    labels: list[str]  # Gitea label names, original casing
    tags: set[str]  # lowercased tags from [title] brackets + label names
    assignees: list[str]  # Gitea logins currently assigned
    created_at: datetime  # timezone-aware creation time (falls back to now)
    issue_type: str  # bug | feature | refactor | philosophy | research | unknown
    score: int = 0  # scope + acceptance + alignment
    scope: int = 0  # 0-3: how well-scoped the issue is
    acceptance: int = 0  # 0-3: clarity of acceptance criteria
    alignment: int = 0  # 0-3: alignment with project goals
    ready: bool = False  # score >= READY_THRESHOLD
    age_days: int = 0  # whole days since created_at
    is_p0: bool = False  # carries a P0 tag, or classified as a bug
    is_blocked: bool = False  # "blocked"-style wording found in title/body

    @property
    def is_unassigned(self) -> bool:
        """True when no Gitea user is assigned to the issue."""
        return len(self.assignees) == 0

    @property
    def needs_kimi(self) -> bool:
        """True for research-tagged or kimi-ready issues (routed to Kimi)."""
        return bool(self.tags & _RESEARCH_TAGS) or KIMI_READY_LABEL in self.labels
@dataclass
class TriageDecision:
    """The outcome of a triage decision for a single issue.

    Produced by decide(); execute_decision() later mutates ``executed`` and
    ``error`` in place after attempting the Gitea API calls.
    """

    issue_number: int  # Gitea issue number the decision applies to
    action: str  # "assign_claude" | "assign_kimi" | "flag_alex" | "skip"
    reason: str  # human-readable rationale, posted in the audit comment
    agent: str = ""  # the agent assigned (login); empty for skip
    executed: bool = False  # True once the action completed (skips/dry runs count)
    error: str = ""  # failure description when execution did not succeed
@dataclass
class TriageCycleResult:
    """Summary of one complete triage cycle."""

    timestamp: str  # ISO-8601 UTC timestamp taken at cycle start
    total_open: int  # open issues fetched from Gitea this cycle
    scored: int  # issues scored (equals total_open in run_once)
    ready: int  # scored issues meeting READY_THRESHOLD
    decisions: list[TriageDecision] = field(default_factory=list)  # one per issue, skips included
    # NOTE(review): nothing in the visible code appends to `errors` — confirm
    # whether callers populate it or it can be removed.
    errors: list[str] = field(default_factory=list)
    duration_ms: int = 0  # wall-clock cycle duration in milliseconds
# ── Scoring ──────────────────────────────────────────────────────────────────
def _extract_tags(title: str, labels: list[str]) -> set[str]:
    """Collect normalized tags from [bracket] title markers and label names."""
    bracket_tags = (m.group(1).lower().strip() for m in _TAG_RE.finditer(title))
    label_tags = (lbl.lower().strip() for lbl in labels)
    return set(bracket_tags) | set(label_tags)
def _score_scope(title: str, body: str, tags: set[str]) -> int:
    """Score 0-3: how well-scoped is this issue?

    +1 each for a concrete file reference, a function/class reference, and a
    short (<80 char) title once [tags] are stripped. Meta/philosophy issues
    lose 2 points; the result is clamped to at most 3.
    """
    text = f"{title}\n{body}"
    stripped_title = _TAG_RE.sub("", title).strip()
    pts = sum(
        (
            _FILE_RE.search(text) is not None,
            _FUNC_RE.search(text) is not None,
            len(stripped_title) < 80,
        )
    )
    if tags & _META_TAGS:
        pts = max(0, pts - 2)
    return min(3, pts)
def _score_acceptance(title: str, body: str, tags: set[str]) -> int:
    """Score 0-3: does this issue state clear acceptance criteria?

    Counts acceptance-style keywords (+2 for >=3 hits, +1 for >=1), adds +1
    for test references and +1 for structured "## problem/solution/…"
    sections; meta issues lose a point. Clamped to at most 3.
    """
    text = f"{title}\n{body}"
    keyword_hits = len(_ACCEPT_RE.findall(text))
    if keyword_hits >= 3:
        pts = 2
    elif keyword_hits >= 1:
        pts = 1
    else:
        pts = 0
    if _TEST_RE.search(text):
        pts += 1
    if re.search(r"##\s*(problem|solution|expected|actual|steps)", body, re.IGNORECASE):
        pts += 1
    if tags & _META_TAGS:
        pts = max(0, pts - 1)
    return min(3, pts)
def _score_alignment(title: str, body: str, tags: set[str]) -> int:
    """Score 0-3: how aligned is this issue with the north star?

    Bugs always score 3; meta/philosophy always scores 0 (it zeroes any
    additions in the original formulation). Otherwise refactor/feature tags
    add 2 each and loop-generated issues add 1, clamped to 3.
    """
    if tags & _BUG_TAGS:
        return 3
    if tags & _META_TAGS:
        return 0
    pts = 0
    if tags & _REFACTOR_TAGS:
        pts += 2
    if tags & _FEATURE_TAGS:
        pts += 2
    if _LOOP_TAG in tags:
        pts += 1
    return min(3, pts)
def score_issue(issue: dict[str, Any]) -> ScoredIssue:
    """Score and classify a raw Gitea issue dict into a ScoredIssue."""
    title = issue.get("title", "")
    body = issue.get("body") or ""
    label_names = [lbl["name"] for lbl in issue.get("labels", [])]
    tags = _extract_tags(title, label_names)
    assignees = [a["login"] for a in issue.get("assignees", [])]

    # Parse created_at; a malformed or missing timestamp counts as "just now"
    # (age 0), which keeps age-based prioritization conservative.
    raw_ts = issue.get("created_at", "")
    try:
        created_at = datetime.fromisoformat(raw_ts.replace("Z", "+00:00"))
    except (ValueError, AttributeError):
        created_at = datetime.now(UTC)

    # Component scores, each 0-3.
    scope = _score_scope(title, body, tags)
    acceptance = _score_acceptance(title, body, tags)
    alignment = _score_alignment(title, body, tags)
    total = scope + acceptance + alignment

    # Classify by the first matching tag set — order defines precedence
    # (bug beats research beats feature beats refactor beats philosophy).
    issue_type = next(
        (
            kind
            for kind, tag_set in (
                ("bug", _BUG_TAGS),
                ("research", _RESEARCH_TAGS),
                ("feature", _FEATURE_TAGS),
                ("refactor", _REFACTOR_TAGS),
                ("philosophy", _META_TAGS),
            )
            if tags & tag_set
        ),
        "unknown",
    )

    return ScoredIssue(
        number=issue["number"],
        title=_TAG_RE.sub("", title).strip(),
        body=body,
        labels=label_names,
        tags=tags,
        assignees=assignees,
        created_at=created_at,
        issue_type=issue_type,
        score=total,
        scope=scope,
        acceptance=acceptance,
        alignment=alignment,
        ready=total >= READY_THRESHOLD,
        age_days=(datetime.now(UTC) - created_at).days,
        is_p0=bool(tags & _P0_TAGS) or issue_type == "bug",
        is_blocked=bool(_BLOCKED_RE.search(title) or _BLOCKED_RE.search(body)),
    )
# ── Decision logic ───────────────────────────────────────────────────────────
def decide(issue: ScoredIssue) -> TriageDecision:
    """Decide what to do with an issue.

    Pure decision logic — nothing is executed here; call execute_decision()
    to act on the result. Guard order matters: philosophy and already-
    assigned issues are skipped before the score check, blocked issues are
    escalated before any assignment, and research work routes to Kimi ahead
    of the P0/default Claude paths.
    """
    num = issue.number

    def _skip(reason: str) -> TriageDecision:
        return TriageDecision(issue_number=num, action="skip", reason=reason)

    # Philosophy/meta issues are not dev-actionable.
    if issue.issue_type == "philosophy":
        return _skip("Philosophy/meta issue — not dev-actionable in the triage loop.")

    # Someone is already on it.
    if not issue.is_unassigned:
        return _skip(f"Already assigned to: {', '.join(issue.assignees)}.")

    # Under-specified issues need more detail first.
    if not issue.ready:
        return _skip(
            f"Score {issue.score} < {READY_THRESHOLD} threshold — needs more detail before assignment."
        )

    # Blocked work goes to the human owner.
    if issue.is_blocked:
        return TriageDecision(
            issue_number=num,
            action="flag_alex",
            agent=OWNER_LOGIN,
            reason=(
                "Issue appears blocked. Flagging for @rockachopa to unblock before autonomous assignment."
            ),
        )

    # Research/investigation work goes to Kimi.
    if issue.needs_kimi:
        return TriageDecision(
            issue_number=num,
            action="assign_kimi",
            agent=AGENT_KIMI,
            reason=(
                f"Issue type '{issue.issue_type}' with research/investigation scope. "
                f"Assigning kimi-ready label for Kimi agent to pick up."
            ),
        )

    # P0 bugs and blocking issues go to Claude immediately.
    if issue.is_p0:
        return TriageDecision(
            issue_number=num,
            action="assign_claude",
            agent=AGENT_CLAUDE,
            reason=(
                f"P0/{issue.issue_type} issue (score={issue.score}, age={issue.age_days}d). "
                f"Assigning to Claude Code for immediate attention."
            ),
        )

    # Default: any remaining ready, unassigned issue goes to Claude Code.
    return TriageDecision(
        issue_number=num,
        action="assign_claude",
        agent=AGENT_CLAUDE,
        reason=(
            f"Unassigned ready issue (type={issue.issue_type}, score={issue.score}, "
            f"age={issue.age_days}d). Assigning to Claude Code."
        ),
    )
# ── Gitea API client ─────────────────────────────────────────────────────────
def _api_headers() -> dict[str, str]:
    """Standard token-auth + JSON headers for every Gitea API request."""
    auth = f"token {settings.gitea_token}"
    return {
        "Authorization": auth,
        "Content-Type": "application/json",
        "Accept": "application/json",
    }
def _repo_url(path: str) -> str:
    """Build a full Gitea API URL under the configured owner/repo."""
    owner, repo = settings.gitea_repo.split("/", 1)
    base = f"{settings.gitea_url}/api/v1/repos/{owner}/{repo}"
    return f"{base}/{path}"
async def fetch_open_issues(client: httpx.AsyncClient) -> list[dict[str, Any]]:
    """Fetch every open issue from Gitea, 50 per page, until exhausted.

    Best-effort: on an HTTP error or connection failure the issues
    collected so far are returned instead of raising.
    """
    collected: list[dict[str, Any]] = []
    page = 1
    while True:
        url = _repo_url(f"issues?state=open&type=issues&limit=50&page={page}")
        try:
            resp = await client.get(url, headers=_api_headers())
        except (httpx.ConnectError, httpx.ReadError, httpx.TimeoutException) as exc:
            logger.warning("Gitea connection error fetching issues: %s", exc)
            return collected
        if resp.status_code != 200:
            logger.warning("Gitea issues fetch failed (HTTP %s)", resp.status_code)
            return collected
        batch: list[dict[str, Any]] = resp.json()
        collected.extend(batch)
        # A short (or empty) page means we've reached the end.
        if len(batch) < 50:
            return collected
        page += 1
async def post_comment(
    client: httpx.AsyncClient,
    issue_number: int,
    body: str,
) -> bool:
    """Post *body* as a comment on the given issue; True on HTTP 200/201."""
    try:
        resp = await client.post(
            _repo_url(f"issues/{issue_number}/comments"),
            headers=_api_headers(),
            json={"body": body},
        )
    except (httpx.ConnectError, httpx.ReadError, httpx.TimeoutException) as exc:
        logger.warning("Failed to post comment on #%d: %s", issue_number, exc)
        return False
    return resp.status_code in (200, 201)
async def assign_issue(
    client: httpx.AsyncClient,
    issue_number: int,
    assignee: str,
) -> bool:
    """Set *assignee* as the sole assignee of an issue; True on HTTP 200/201.

    NOTE: PATCHing ``assignees`` replaces the whole list on the issue.
    """
    try:
        resp = await client.patch(
            _repo_url(f"issues/{issue_number}"),
            headers=_api_headers(),
            json={"assignees": [assignee]},
        )
    except (httpx.ConnectError, httpx.ReadError, httpx.TimeoutException) as exc:
        logger.warning("Failed to assign #%d to %s: %s", issue_number, assignee, exc)
        return False
    return resp.status_code in (200, 201)
async def add_label(
    client: httpx.AsyncClient,
    issue_number: int,
    label_name: str,
) -> bool:
    """Add a label to a Gitea issue by name (auto-creates if missing). Returns True on success.

    Two-step flow: resolve the label name to its repo-level numeric id
    (creating the label with a fixed teal color when absent), then attach
    that id to the issue. Any network error or non-2xx response yields
    False; nothing is raised.
    """
    owner, repo = settings.gitea_repo.split("/", 1)
    labels_url = f"{settings.gitea_url}/api/v1/repos/{owner}/{repo}/labels"
    headers = _api_headers()
    try:
        # Fetch existing labels (repo-level catalogue, not per-issue)
        resp = await client.get(labels_url, headers=headers)
        if resp.status_code != 200:
            return False
        existing = {lbl["name"]: lbl["id"] for lbl in resp.json()}
        if label_name in existing:
            label_id = existing[label_name]
        else:
            # Auto-create the label
            create_resp = await client.post(
                labels_url,
                headers=headers,
                json={"name": label_name, "color": "#006b75"},
            )
            if create_resp.status_code not in (200, 201):
                return False
            label_id = create_resp.json()["id"]
        # Apply to the issue — Gitea expects numeric label ids here, not names
        apply_url = _repo_url(f"issues/{issue_number}/labels")
        apply_resp = await client.post(
            apply_url, headers=headers, json={"labels": [label_id]}
        )
        return apply_resp.status_code in (200, 201)
    except (httpx.ConnectError, httpx.ReadError, httpx.TimeoutException) as exc:
        logger.warning("Failed to add label %r to #%d: %s", label_name, issue_number, exc)
        return False
# ── Decision execution ───────────────────────────────────────────────────────
async def execute_decision(
    client: httpx.AsyncClient,
    decision: TriageDecision,
    dry_run: bool = False,
) -> TriageDecision:
    """Execute a triage decision — audit comment, then assign/label.

    Mutates and returns *decision*: ``executed`` becomes True on success
    (skips and dry runs count as success), ``error`` is filled on failure.
    When dry_run=True the decision is logged and no Gitea call is made.
    """
    num = decision.issue_number

    # Skips need no API traffic — mark executed and move on.
    if decision.action == "skip":
        logger.debug("Triage skip #%d: %s", num, decision.reason)
        decision.executed = True
        return decision

    audit_comment = _build_audit_comment(decision)

    if dry_run:
        # Fixed broken format string: "#%d%s" fused the issue number and
        # action ("#12assign_claude"); a separator was missing.
        logger.info(
            "[DRY RUN] #%d → %s (%s): %s",
            num,
            decision.action,
            decision.agent,
            decision.reason,
        )
        decision.executed = True
        return decision

    # Post the audit comment first (always, so Alex can see reasoning);
    # bail out without assigning when even the comment fails.
    if not await post_comment(client, num, audit_comment):
        decision.error = "Failed to post audit comment"
        logger.warning("Triage #%d: comment failed", num)
        return decision

    # Execute the assignment itself.
    if decision.action == "assign_claude":
        ok = await assign_issue(client, num, AGENT_CLAUDE)
    elif decision.action == "assign_kimi":
        ok = await add_label(client, num, KIMI_READY_LABEL)
    elif decision.action == "flag_alex":
        # The audit comment already @-mentions the owner — that's the flag.
        ok = True
    else:
        ok = False  # unknown action — treated as failure

    if ok:
        decision.executed = True
        # Same missing-separator fix as the dry-run log line above.
        logger.info("Triage #%d → %s OK", num, decision.action)
    else:
        decision.error = f"Action {decision.action!r} failed"
        logger.warning("Triage #%d: action %r failed", num, decision.action)
    return decision
def _build_audit_comment(decision: TriageDecision) -> str:
    """Render the Markdown audit-trail comment explaining a decision."""
    ts = datetime.now(UTC).strftime("%Y-%m-%d %H:%M UTC")
    descriptions = {
        "assign_claude": f"Assigning to @{AGENT_CLAUDE} for implementation.",
        "assign_kimi": f"Adding `{KIMI_READY_LABEL}` label — queuing for Kimi research agent.",
        "flag_alex": f"Flagging for @{OWNER_LOGIN} — issue appears blocked or needs human decision.",
    }
    # Unknown actions fall back to the raw action string.
    action_text = descriptions.get(decision.action, decision.action)
    sections = [
        f"**[Timmy Triage — {ts}]**",
        f"**Decision:** {action_text}",
        f"**Why:** {decision.reason}",
        "*Autonomous triage by Timmy. Reply to override.*",
    ]
    return "\n\n".join(sections)
# ── Daily summary ─────────────────────────────────────────────────────────────
def _build_daily_summary(result: TriageCycleResult, scored: list[ScoredIssue]) -> str:
    """Render the Markdown body for the daily triage summary issue."""
    now = datetime.now(UTC).strftime("%Y-%m-%d %H:%M UTC")
    assigned = [d for d in result.decisions if d.executed and d.action != "skip"]
    skipped = [d for d in result.decisions if d.action == "skip"]

    lines = [
        f"# Timmy Backlog Triage — {now}",
        "",
        f"**Open issues:** {result.total_open} | "
        f"**Scored:** {result.scored} | "
        f"**Ready:** {result.ready} | "
        f"**Assigned this cycle:** {len(assigned)}",
        "",
        "## Top 10 Ready Issues (by score)",
        "",
    ]

    # Highest score first; issue number breaks ties deterministically.
    ready_sorted = sorted((s for s in scored if s.ready), key=lambda s: (-s.score, s.number))
    for s in ready_sorted[:10]:
        # NOTE(review): the P0 branch yields "" just like the fallback — an
        # emoji/marker was likely lost from this expression; confirm intent.
        flag = "🐛" if s.issue_type == "bug" else "" if s.is_p0 else ""
        lines.append(
            f"- {flag} **#{s.number}** (score={s.score}, age={s.age_days}d) — {s.title[:80]}"
        )

    if assigned:
        lines += ["", "## Actions Taken", ""]
        lines += [
            f"- #{d.issue_number} → `{d.action}` ({d.agent}): {d.reason[:100]}"
            for d in assigned
        ]

    if skipped:
        lines += ["", f"## Skipped ({len(skipped)} issues)", ""]
        lines += [f"- #{d.issue_number}: {d.reason[:80]}" for d in skipped[:5]]
        if len(skipped) > 5:
            lines.append(f"- … and {len(skipped) - 5} more")

    lines += [
        "",
        "---",
        "*Auto-generated by Timmy's backlog triage loop. "
        "Override any decision by reassigning or commenting.*",
    ]
    return "\n".join(lines)
async def post_daily_summary(
    client: httpx.AsyncClient,
    result: TriageCycleResult,
    scored: list[ScoredIssue],
    dry_run: bool = False,
) -> bool:
    """Create a new Gitea issue holding the daily triage summary.

    Returns True on success; dry runs log the title and succeed without
    making any API call.
    """
    today = datetime.now(UTC).strftime("%Y-%m-%d")
    title = f"[Triage] Daily backlog summary — {today}"
    body = _build_daily_summary(result, scored)

    if dry_run:
        logger.info("[DRY RUN] Would post daily summary: %s", title)
        return True

    payload = {"title": title, "body": body, "labels": []}
    try:
        resp = await client.post(_repo_url("issues"), headers=_api_headers(), json=payload)
    except (httpx.ConnectError, httpx.ReadError, httpx.TimeoutException) as exc:
        logger.warning("Failed to post daily summary: %s", exc)
        return False

    if resp.status_code not in (200, 201):
        logger.warning("Daily summary post failed (HTTP %s)", resp.status_code)
        return False
    issue_num = resp.json().get("number", "?")
    logger.info("Daily triage summary posted as issue #%s", issue_num)
    return True
# ── Main loop class ───────────────────────────────────────────────────────────
class BacklogTriageLoop:
    """Autonomous backlog triage loop.

    Fetches, scores, and assigns Gitea issues on a configurable interval.

    Parameters
    ----------
    interval:
        Seconds between triage cycles. Default: settings.backlog_triage_interval_seconds.
    dry_run:
        When True, score and log decisions but don't write to Gitea.
    daily_summary:
        When True, post a daily triage summary issue after each cycle.
    """

    def __init__(
        self,
        *,
        interval: float | None = None,
        dry_run: bool | None = None,
        daily_summary: bool | None = None,
    ) -> None:
        # NOTE(review): `interval or default` treats an explicit interval=0
        # as "use the default" — confirm 0 is not a meaningful value here.
        self._interval = float(interval or settings.backlog_triage_interval_seconds)
        self._dry_run = dry_run if dry_run is not None else settings.backlog_triage_dry_run
        self._daily_summary = (
            daily_summary if daily_summary is not None else settings.backlog_triage_daily_summary
        )
        self._running = False
        # NOTE(review): _task is never assigned anywhere in this class —
        # either wire it up in start() or remove the attribute.
        self._task: asyncio.Task | None = None
        self._cycle_count = 0
        self._last_summary_date: str = ""  # "YYYY-MM-DD" of the last daily summary posted
        self.history: list[TriageCycleResult] = []  # every completed cycle, oldest first

    @property
    def is_running(self) -> bool:
        """True between start() and stop()."""
        return self._running

    @property
    def cycle_count(self) -> int:
        """Number of run_once() invocations so far (failed cycles included)."""
        return self._cycle_count

    async def run_once(self) -> TriageCycleResult:
        """Execute one full triage cycle.

        1. Fetch all open Gitea issues
        2. Score and prioritize
        3. Decide on each unassigned ready issue
        4. Execute decisions
        5. Optionally post daily summary

        Returns a TriageCycleResult, appended to ``history``. When Gitea is
        not configured the cycle is skipped and an empty result is returned
        WITHOUT being recorded in ``history``.
        """
        import time
        self._cycle_count += 1
        start = time.monotonic()
        ts = datetime.now(UTC).isoformat()
        result = TriageCycleResult(timestamp=ts, total_open=0, scored=0, ready=0)
        if not settings.gitea_enabled or not settings.gitea_token:
            logger.warning("Backlog triage: Gitea not configured — skipping cycle")
            return result
        async with httpx.AsyncClient(timeout=30) as client:
            # 1. Fetch
            raw_issues = await fetch_open_issues(client)
            result.total_open = len(raw_issues)
            logger.info("Triage cycle #%d: fetched %d open issues", self._cycle_count, len(raw_issues))
            # 2. Score
            scored = [score_issue(i) for i in raw_issues]
            result.scored = len(scored)
            result.ready = sum(1 for s in scored if s.ready)
            # 3 & 4. Decide and execute for each issue. Skips are recorded
            # without touching the network; real actions go through
            # execute_decision (comment first, then assign/label).
            for issue in scored:
                decision = decide(issue)
                if decision.action == "skip":
                    result.decisions.append(decision)
                    continue
                decision = await execute_decision(client, decision, dry_run=self._dry_run)
                result.decisions.append(decision)
                # Rate-limit: short pause between API writes to avoid hammering Gitea
                if not self._dry_run:
                    await asyncio.sleep(0.5)
            # 5. Daily summary (once per UTC day)
            today = datetime.now(UTC).strftime("%Y-%m-%d")
            if self._daily_summary and today != self._last_summary_date:
                await post_daily_summary(client, result, scored, dry_run=self._dry_run)
                self._last_summary_date = today
        result.duration_ms = int((time.monotonic() - start) * 1000)
        self.history.append(result)
        assigned_count = sum(1 for d in result.decisions if d.executed and d.action != "skip")
        logger.info(
            "Triage cycle #%d complete (%d ms): %d open, %d ready, %d assigned",
            self._cycle_count,
            result.duration_ms,
            result.total_open,
            result.ready,
            assigned_count,
        )
        return result

    async def start(self) -> None:
        """Run the triage loop until stop() is called.

        NOTE(review): despite the original "background task" wording, this
        awaits _loop() directly and therefore blocks the calling coroutine —
        callers wanting a true background loop should wrap this in
        ``asyncio.create_task(loop.start())``.
        """
        if self._running:
            logger.warning("BacklogTriageLoop already running")
            return
        self._running = True
        await self._loop()

    async def _loop(self) -> None:
        # Cycle forever: run, log any failure, sleep, repeat. stop() flips
        # _running so the loop exits after the current sleep completes.
        logger.info(
            "BacklogTriageLoop started (interval=%.0fs, dry_run=%s)",
            self._interval,
            self._dry_run,
        )
        while self._running:
            try:
                await self.run_once()
            except Exception:
                logger.exception("Backlog triage cycle failed")
            await asyncio.sleep(self._interval)

    def stop(self) -> None:
        """Signal the loop to stop after the current cycle."""
        self._running = False
        logger.info("BacklogTriageLoop stop requested")

View File

@@ -1,434 +0,0 @@
"""Dreaming Mode — idle-time session replay and counterfactual simulation.
When the dashboard has been idle for a configurable period, this engine
selects a past chat session, identifies key agent response points, and
asks the LLM to simulate alternative approaches. Insights are stored as
proposed rules that can feed the auto-crystallizer or memory system.
Usage::
from timmy.dreaming import dreaming_engine
# Run one dream cycle (called by the background scheduler)
await dreaming_engine.dream_once()
# Query recent dreams
dreams = dreaming_engine.get_recent_dreams(limit=10)
# Get current status dict for API/dashboard
status = dreaming_engine.get_status()
"""
import logging
import re
import sqlite3
import uuid
from collections.abc import Generator
from contextlib import closing, contextmanager
from dataclasses import dataclass
from datetime import UTC, datetime, timedelta
from pathlib import Path
from typing import Any
from config import settings
logger = logging.getLogger(__name__)
_DEFAULT_DB = Path("data/dreams.db")
# Strip <think> tags from reasoning model output
_THINK_TAG_RE = re.compile(r"<think>.*?</think>\s*", re.DOTALL)
# Minimum messages in a session to be worth replaying
_MIN_SESSION_MESSAGES = 3
# Gap in seconds between messages that signals a new session
_SESSION_GAP_SECONDS = 1800 # 30 minutes
@dataclass
class DreamRecord:
"""A single completed dream cycle."""
id: str
session_excerpt: str # Short excerpt from the replayed session
decision_point: str # The agent message that was re-simulated
simulation: str # The alternative response generated
proposed_rule: str # Rule extracted from the simulation
created_at: str
@contextmanager
def _get_conn(db_path: Path = _DEFAULT_DB) -> Generator[sqlite3.Connection, None, None]:
db_path.parent.mkdir(parents=True, exist_ok=True)
with closing(sqlite3.connect(str(db_path))) as conn:
conn.row_factory = sqlite3.Row
conn.execute("""
CREATE TABLE IF NOT EXISTS dreams (
id TEXT PRIMARY KEY,
session_excerpt TEXT NOT NULL,
decision_point TEXT NOT NULL,
simulation TEXT NOT NULL,
proposed_rule TEXT NOT NULL DEFAULT '',
created_at TEXT NOT NULL
)
""")
conn.execute("CREATE INDEX IF NOT EXISTS idx_dreams_time ON dreams(created_at)")
conn.commit()
yield conn
def _row_to_dream(row: sqlite3.Row) -> DreamRecord:
return DreamRecord(
id=row["id"],
session_excerpt=row["session_excerpt"],
decision_point=row["decision_point"],
simulation=row["simulation"],
proposed_rule=row["proposed_rule"],
created_at=row["created_at"],
)
class DreamingEngine:
    """Idle-time dreaming engine — replays sessions and simulates alternatives.

    Lifecycle: callers invoke ``record_activity()`` on every user/agent
    interaction to reset the idle timer; a scheduler calls ``dream_once()``
    periodically. A cycle selects a past chat session, asks the LLM for an
    alternative response at one decision point, distils a behaviour rule,
    persists the result, and broadcasts progress over WebSocket.
    """

    def __init__(self, db_path: Path = _DEFAULT_DB) -> None:
        # SQLite file holding persisted DreamRecords (schema created lazily).
        self._db_path = db_path
        # Timestamp of the most recent interaction (UTC-aware).
        self._last_activity_time: datetime = datetime.now(UTC)
        # True while a dream cycle is in progress — prevents overlap.
        self._is_dreaming: bool = False
        # Human-readable progress string surfaced through get_status().
        self._current_dream_summary: str = ""
        self._dreaming_agent = None  # Lazy-initialised on first _call_agent()

    # ── Public API ────────────────────────────────────────────────────────
    def record_activity(self) -> None:
        """Reset the idle timer — call this on every user/agent interaction."""
        self._last_activity_time = datetime.now(UTC)

    def is_idle(self) -> bool:
        """Return True if the system has been idle long enough to start dreaming."""
        threshold = settings.dreaming_idle_threshold_minutes
        # A non-positive threshold disables dreaming entirely.
        if threshold <= 0:
            return False
        return datetime.now(UTC) - self._last_activity_time > timedelta(minutes=threshold)

    def get_status(self) -> dict[str, Any]:
        """Return a status dict suitable for API/dashboard consumption."""
        return {
            "enabled": settings.dreaming_enabled,
            "dreaming": self._is_dreaming,
            "idle": self.is_idle(),
            "current_summary": self._current_dream_summary,
            # Whole minutes since the last recorded interaction.
            "idle_minutes": int(
                (datetime.now(UTC) - self._last_activity_time).total_seconds() / 60
            ),
            "idle_threshold_minutes": settings.dreaming_idle_threshold_minutes,
            "dream_count": self.count_dreams(),
        }

    async def dream_once(self) -> DreamRecord | None:
        """Execute one dream cycle.

        Returns the stored DreamRecord, or None if the cycle was skipped
        (not idle, dreaming disabled, no suitable session, or LLM error).
        """
        # Guard clauses: feature flag, idleness, and re-entrancy.
        if not settings.dreaming_enabled:
            return None
        if not self.is_idle():
            logger.debug(
                "Dreaming skipped — system active (idle for %d min, threshold %d min)",
                int((datetime.now(UTC) - self._last_activity_time).total_seconds() / 60),
                settings.dreaming_idle_threshold_minutes,
            )
            return None
        if self._is_dreaming:
            logger.debug("Dreaming skipped — cycle already in progress")
            return None
        self._is_dreaming = True
        self._current_dream_summary = "Selecting a past session…"
        await self._broadcast_status()
        try:
            return await self._run_dream_cycle()
        except Exception as exc:
            # Dreaming is best-effort background work — log and swallow.
            logger.warning("Dream cycle failed: %s", exc)
            return None
        finally:
            # Always clear the in-progress state and notify the dashboard,
            # whether the cycle succeeded, was skipped, or raised.
            self._is_dreaming = False
            self._current_dream_summary = ""
            await self._broadcast_status()

    def get_recent_dreams(self, limit: int = 20) -> list[DreamRecord]:
        """Retrieve the most recent dream records, newest first."""
        with _get_conn(self._db_path) as conn:
            rows = conn.execute(
                "SELECT * FROM dreams ORDER BY created_at DESC LIMIT ?",
                (limit,),
            ).fetchall()
            return [_row_to_dream(r) for r in rows]

    def count_dreams(self) -> int:
        """Return total number of stored dream records."""
        with _get_conn(self._db_path) as conn:
            row = conn.execute("SELECT COUNT(*) AS c FROM dreams").fetchone()
            return row["c"] if row else 0

    # ── Private helpers ───────────────────────────────────────────────────
    async def _run_dream_cycle(self) -> DreamRecord | None:
        """Core dream logic: select → simulate → store."""
        # 1. Select a past session from the chat log
        session = await self._select_session()
        if not session:
            logger.debug("No suitable chat session found for dreaming")
            self._current_dream_summary = "No past sessions to replay"
            return None
        decision_point, session_excerpt = session
        self._current_dream_summary = f"Simulating alternative for: {decision_point[:60]}"
        await self._broadcast_status()
        # 2. Simulate an alternative response
        simulation = await self._simulate_alternative(decision_point, session_excerpt)
        if not simulation:
            logger.debug("Dream simulation produced no output")
            return None
        # 3. Extract a proposed rule (may be empty — dream is stored anyway)
        proposed_rule = await self._extract_rule(decision_point, simulation)
        # 4. Store and broadcast
        dream = self._store_dream(
            session_excerpt=session_excerpt,
            decision_point=decision_point,
            simulation=simulation,
            proposed_rule=proposed_rule,
        )
        self._current_dream_summary = f"Dream complete: {proposed_rule[:80]}" if proposed_rule else "Dream complete"
        logger.info(
            "Dream [%s]: replayed session, proposed rule: %s",
            dream.id[:8],
            proposed_rule[:80] if proposed_rule else "(none)",
        )
        await self._broadcast_status()
        await self._broadcast_dream(dream)
        return dream

    async def _select_session(self) -> tuple[str, str] | None:
        """Select a past chat session and return (decision_point, session_excerpt).

        Uses the SQLite chat store. Groups messages into sessions by time
        gap. Picks a random session with enough messages, then selects one
        agent response as the decision point.

        Returns None (after logging) on any failure — selection is optional.
        """
        try:
            from infrastructure.chat_store import DB_PATH
            if not DB_PATH.exists():
                return None
            import asyncio
            # Blocking SQLite read is moved off the event loop.
            rows = await asyncio.to_thread(self._load_chat_rows)
            if not rows:
                return None
            sessions = self._group_into_sessions(rows)
            if not sessions:
                return None
            # Filter sessions with enough messages
            valid = [s for s in sessions if len(s) >= _MIN_SESSION_MESSAGES]
            if not valid:
                return None
            import random
            session = random.choice(valid)  # noqa: S311 (not cryptographic)
            # Build a short text excerpt (last N messages)
            excerpt_msgs = session[-6:]
            excerpt = "\n".join(
                f"{m['role'].upper()}: {m['content'][:200]}" for m in excerpt_msgs
            )
            # Find agent responses as candidate decision points
            agent_msgs = [m for m in session if m["role"] in ("agent", "assistant")]
            if not agent_msgs:
                return None
            decision = random.choice(agent_msgs)  # noqa: S311
            return decision["content"], excerpt
        except Exception as exc:
            logger.warning("Session selection failed: %s", exc)
            return None

    def _load_chat_rows(self) -> list[dict]:
        """Synchronously load chat messages from SQLite, oldest first."""
        from infrastructure.chat_store import DB_PATH
        with closing(sqlite3.connect(str(DB_PATH))) as conn:
            conn.row_factory = sqlite3.Row
            rows = conn.execute(
                "SELECT role, content, timestamp FROM chat_messages "
                "ORDER BY timestamp ASC"
            ).fetchall()
            return [dict(r) for r in rows]

    def _group_into_sessions(self, rows: list[dict]) -> list[list[dict]]:
        """Group chat rows into sessions based on time gaps.

        A gap greater than _SESSION_GAP_SECONDS between consecutive
        messages starts a new session. Rows must be in ascending
        timestamp order (as produced by _load_chat_rows).
        """
        if not rows:
            return []
        sessions: list[list[dict]] = []
        current: list[dict] = [rows[0]]
        for prev, curr in zip(rows, rows[1:], strict=False):
            try:
                t_prev = datetime.fromisoformat(prev["timestamp"].replace("Z", "+00:00"))
                t_curr = datetime.fromisoformat(curr["timestamp"].replace("Z", "+00:00"))
                gap = (t_curr - t_prev).total_seconds()
            except Exception:
                # Unparseable timestamp: treat as no gap, keep same session.
                gap = 0
            if gap > _SESSION_GAP_SECONDS:
                sessions.append(current)
                current = [curr]
            else:
                current.append(curr)
        sessions.append(current)
        return sessions

    async def _simulate_alternative(
        self, decision_point: str, session_excerpt: str
    ) -> str:
        """Ask the LLM to simulate an alternative response.

        Returns the response with <think> tags stripped, or "" on failure.
        """
        prompt = (
            "You are Timmy, a sovereign AI agent in a dreaming state.\n"
            "You are replaying a past conversation and exploring what you could "
            "have done differently at a key decision point.\n\n"
            "PAST SESSION EXCERPT:\n"
            f"{session_excerpt}\n\n"
            "KEY DECISION POINT (your past response):\n"
            f"{decision_point[:500]}\n\n"
            "TASK: In 2-3 sentences, describe ONE concrete alternative approach "
            "you could have taken at this decision point that would have been "
            "more helpful, more accurate, or more efficient.\n"
            "Be specific — reference the actual content of the conversation.\n"
            "Do NOT include meta-commentary about dreaming or this exercise.\n\n"
            "Alternative approach:"
        )
        raw = await self._call_agent(prompt)
        return _THINK_TAG_RE.sub("", raw).strip() if raw else ""

    async def _extract_rule(self, decision_point: str, simulation: str) -> str:
        """Extract a proposed behaviour rule from the simulation.

        Returns a single line of at most 200 characters (may be empty).
        """
        prompt = (
            "Given this pair of agent responses:\n\n"
            f"ORIGINAL: {decision_point[:300]}\n\n"
            f"IMPROVED ALTERNATIVE: {simulation[:400]}\n\n"
            "Extract ONE concise rule (max 20 words) that captures what to do "
            "differently next time. Format: 'When X, do Y instead of Z.'\n"
            "Rule:"
        )
        raw = await self._call_agent(prompt)
        rule = _THINK_TAG_RE.sub("", raw).strip() if raw else ""
        # Keep only the first sentence/line
        rule = rule.split("\n")[0].strip().rstrip(".")
        return rule[:200]  # Safety cap

    async def _call_agent(self, prompt: str) -> str:
        """Call the Timmy agent for a dreaming prompt (skip MCP, 60 s timeout).

        Returns the raw response text, or "" on timeout or any error.
        """
        import asyncio
        if self._dreaming_agent is None:
            from timmy.agent import create_timmy
            self._dreaming_agent = create_timmy(skip_mcp=True)
        try:
            async with asyncio.timeout(settings.dreaming_timeout_seconds):
                run = await self._dreaming_agent.arun(prompt, stream=False)
        except TimeoutError:
            logger.warning("Dreaming LLM call timed out after %ds", settings.dreaming_timeout_seconds)
            return ""
        except Exception as exc:
            logger.warning("Dreaming LLM call failed: %s", exc)
            return ""
        # Some agent backends return an object with .content; others a str.
        raw = run.content if hasattr(run, "content") else str(run)
        return raw or ""

    def _store_dream(
        self,
        *,
        session_excerpt: str,
        decision_point: str,
        simulation: str,
        proposed_rule: str,
    ) -> DreamRecord:
        # Persist a freshly-minted record and return it.
        dream = DreamRecord(
            id=str(uuid.uuid4()),
            session_excerpt=session_excerpt,
            decision_point=decision_point,
            simulation=simulation,
            proposed_rule=proposed_rule,
            created_at=datetime.now(UTC).isoformat(),
        )
        with _get_conn(self._db_path) as conn:
            conn.execute(
                """
                INSERT INTO dreams
                (id, session_excerpt, decision_point, simulation, proposed_rule, created_at)
                VALUES (?, ?, ?, ?, ?, ?)
                """,
                (
                    dream.id,
                    dream.session_excerpt,
                    dream.decision_point,
                    dream.simulation,
                    dream.proposed_rule,
                    dream.created_at,
                ),
            )
            conn.commit()
        return dream

    async def _broadcast_status(self) -> None:
        """Push current dreaming status via WebSocket (best-effort)."""
        try:
            from infrastructure.ws_manager.handler import ws_manager
            await ws_manager.broadcast("dreaming_state", self.get_status())
        except Exception as exc:
            # Broadcast failures must never break a dream cycle.
            logger.debug("Dreaming status broadcast failed: %s", exc)

    async def _broadcast_dream(self, dream: DreamRecord) -> None:
        """Push a completed dream record via WebSocket (best-effort)."""
        try:
            from infrastructure.ws_manager.handler import ws_manager
            await ws_manager.broadcast(
                "dreaming_complete",
                {
                    "id": dream.id,
                    "proposed_rule": dream.proposed_rule,
                    "simulation": dream.simulation[:200],
                    "created_at": dream.created_at,
                },
            )
        except Exception as exc:
            logger.debug("Dreaming complete broadcast failed: %s", exc)
# Module-level singleton — the shared engine instance used by the API and
# dashboard (e.g. `dreaming_engine.get_status()`); instantiated at import time.
dreaming_engine = DreamingEngine()

View File

@@ -399,6 +399,74 @@ class MCPBridge:
logger.warning("Tool '%s' execution failed: %s", name, exc)
return f"Error executing {name}: {exc}"
@staticmethod
def _build_initial_messages(
prompt: str, system_prompt: str | None
) -> list[dict]:
"""Build the initial message list for a run."""
messages: list[dict] = []
if system_prompt:
messages.append({"role": "system", "content": system_prompt})
messages.append({"role": "user", "content": prompt})
return messages
async def _process_round_tool_calls(
self,
messages: list[dict],
model_tool_calls: list[dict],
rounds: int,
tool_calls_made: list[dict],
) -> None:
"""Execute all tool calls in one round, appending results to messages."""
for tc in model_tool_calls:
func = tc.get("function", {})
tool_name = func.get("name", "unknown")
tool_args = func.get("arguments", {})
logger.info(
"Bridge tool call [round %d]: %s(%s)",
rounds,
tool_name,
tool_args,
)
result = await self._execute_tool_call(tc)
tool_calls_made.append(
{
"round": rounds,
"tool": tool_name,
"arguments": tool_args,
"result": result[:500], # Truncate for logging
}
)
messages.append({"role": "tool", "content": result})
async def _run_tool_loop(
self, messages: list[dict], tools: list[dict]
) -> tuple[str, list[dict], int, str]:
"""Run the tool-call loop until final response or max rounds reached.
Returns:
Tuple of (content, tool_calls_made, rounds, error).
"""
tool_calls_made: list[dict] = []
rounds = 0
for round_num in range(self.max_rounds):
rounds = round_num + 1
response = await self._chat(messages, tools)
msg = response.get("message", {})
model_tool_calls = msg.get("tool_calls", [])
if not model_tool_calls:
return msg.get("content", ""), tool_calls_made, rounds, ""
messages.append(msg)
await self._process_round_tool_calls(
messages, model_tool_calls, rounds, tool_calls_made
)
error = f"Exceeded maximum of {self.max_rounds} tool-call rounds"
return "(max tool-call rounds reached)", tool_calls_made, rounds, error
async def run(
self,
prompt: str,
@@ -419,115 +487,37 @@ class MCPBridge:
BridgeResult with the final response and tool call history.
"""
start = time.time()
messages: list[dict] = []
if system_prompt:
messages.append({"role": "system", "content": system_prompt})
messages.append({"role": "user", "content": prompt})
messages = self._build_initial_messages(prompt, system_prompt)
tools = self._build_ollama_tools()
tool_calls_made: list[dict] = []
rounds = 0
error_msg = ""
try:
for round_num in range(self.max_rounds):
rounds = round_num + 1
response = await self._chat(messages, tools)
msg = response.get("message", {})
# Check if model made tool calls
model_tool_calls = msg.get("tool_calls", [])
if not model_tool_calls:
# Final text response — done.
content = msg.get("content", "")
latency = (time.time() - start) * 1000
return BridgeResult(
content=content,
tool_calls_made=tool_calls_made,
rounds=rounds,
latency_ms=latency,
model=self.model,
)
# Append the assistant message (with tool_calls) to history
messages.append(msg)
# Execute each tool call and add results
for tc in model_tool_calls:
func = tc.get("function", {})
tool_name = func.get("name", "unknown")
tool_args = func.get("arguments", {})
logger.info(
"Bridge tool call [round %d]: %s(%s)",
rounds,
tool_name,
tool_args,
)
result = await self._execute_tool_call(tc)
tool_calls_made.append(
{
"round": rounds,
"tool": tool_name,
"arguments": tool_args,
"result": result[:500], # Truncate for logging
}
)
# Add tool result to message history
messages.append(
{
"role": "tool",
"content": result,
}
)
# Hit max rounds
latency = (time.time() - start) * 1000
return BridgeResult(
content="(max tool-call rounds reached)",
tool_calls_made=tool_calls_made,
rounds=rounds,
latency_ms=latency,
model=self.model,
error=f"Exceeded maximum of {self.max_rounds} tool-call rounds",
content, tool_calls_made, rounds, error_msg = await self._run_tool_loop(
messages, tools
)
except httpx.ConnectError as exc:
latency = (time.time() - start) * 1000
logger.warning("Ollama connection failed: %s", exc)
return BridgeResult(
content="",
tool_calls_made=tool_calls_made,
rounds=rounds,
latency_ms=latency,
model=self.model,
error=f"Ollama connection failed: {exc}",
)
error_msg = f"Ollama connection failed: {exc}"
content = ""
except httpx.HTTPStatusError as exc:
latency = (time.time() - start) * 1000
logger.warning("Ollama HTTP error: %s", exc)
return BridgeResult(
content="",
tool_calls_made=tool_calls_made,
rounds=rounds,
latency_ms=latency,
model=self.model,
error=f"Ollama HTTP error: {exc.response.status_code}",
)
error_msg = f"Ollama HTTP error: {exc.response.status_code}"
content = ""
except Exception as exc:
latency = (time.time() - start) * 1000
logger.error("MCPBridge run failed: %s", exc)
return BridgeResult(
content="",
tool_calls_made=tool_calls_made,
rounds=rounds,
latency_ms=latency,
model=self.model,
error=str(exc),
)
error_msg = str(exc)
content = ""
return BridgeResult(
content=content,
tool_calls_made=tool_calls_made,
rounds=rounds,
latency_ms=(time.time() - start) * 1000,
model=self.model,
error=error_msg,
)
def status(self) -> dict:
"""Return bridge status for the dashboard."""

View File

@@ -462,7 +462,8 @@ def consult_grok(query: str) -> str:
inv = ln.create_invoice(sats, f"Grok query: {query[:_INVOICE_MEMO_MAX_LEN]}")
invoice_info = f"\n[Lightning invoice: {sats} sats — {inv.payment_request[:40]}...]"
except (ImportError, OSError, ValueError) as exc:
logger.warning("Tool execution failed (Lightning invoice): %s", exc)
logger.error("Lightning invoice creation failed: %s", exc)
return "Error: Failed to create Lightning invoice. Please check logs."
result = backend.run(query)
@@ -533,7 +534,8 @@ def _register_web_fetch_tool(toolkit: Toolkit) -> None:
try:
toolkit.register(web_fetch, name="web_fetch")
except Exception as exc:
logger.warning("Tool execution failed (web_fetch registration): %s", exc)
logger.error("Failed to register web_fetch tool: %s", exc)
raise
def _register_core_tools(toolkit: Toolkit, base_path: Path) -> None:
@@ -565,8 +567,8 @@ def _register_grok_tool(toolkit: Toolkit) -> None:
toolkit.register(consult_grok, name="consult_grok")
logger.info("Grok consultation tool registered")
except (ImportError, AttributeError) as exc:
logger.warning("Tool execution failed (Grok registration): %s", exc)
logger.debug("Grok tool not available")
logger.error("Failed to register Grok tool: %s", exc)
raise
def _register_memory_tools(toolkit: Toolkit) -> None:
@@ -579,8 +581,8 @@ def _register_memory_tools(toolkit: Toolkit) -> None:
toolkit.register(memory_read, name="memory_read")
toolkit.register(memory_forget, name="memory_forget")
except (ImportError, AttributeError) as exc:
logger.warning("Tool execution failed (Memory tools registration): %s", exc)
logger.debug("Memory tools not available")
logger.error("Failed to register Memory tools: %s", exc)
raise
def _register_agentic_loop_tool(toolkit: Toolkit) -> None:
@@ -628,8 +630,8 @@ def _register_agentic_loop_tool(toolkit: Toolkit) -> None:
toolkit.register(plan_and_execute, name="plan_and_execute")
except (ImportError, AttributeError) as exc:
logger.warning("Tool execution failed (plan_and_execute registration): %s", exc)
logger.debug("plan_and_execute tool not available")
logger.error("Failed to register plan_and_execute tool: %s", exc)
raise
def _register_introspection_tools(toolkit: Toolkit) -> None:
@@ -647,15 +649,16 @@ def _register_introspection_tools(toolkit: Toolkit) -> None:
toolkit.register(get_memory_status, name="get_memory_status")
toolkit.register(run_self_tests, name="run_self_tests")
except (ImportError, AttributeError) as exc:
logger.warning("Tool execution failed (Introspection tools registration): %s", exc)
logger.debug("Introspection tools not available")
logger.error("Failed to register Introspection tools: %s", exc)
raise
try:
from timmy.mcp_tools import update_gitea_avatar
toolkit.register(update_gitea_avatar, name="update_gitea_avatar")
except (ImportError, AttributeError) as exc:
logger.debug("update_gitea_avatar tool not available: %s", exc)
logger.error("Failed to register update_gitea_avatar tool: %s", exc)
raise
try:
from timmy.session_logger import self_reflect, session_history
@@ -663,8 +666,8 @@ def _register_introspection_tools(toolkit: Toolkit) -> None:
toolkit.register(session_history, name="session_history")
toolkit.register(self_reflect, name="self_reflect")
except (ImportError, AttributeError) as exc:
logger.warning("Tool execution failed (session_history registration): %s", exc)
logger.debug("session_history tool not available")
logger.error("Failed to register session_history tool: %s", exc)
raise
def _register_delegation_tools(toolkit: Toolkit) -> None:
@@ -676,8 +679,8 @@ def _register_delegation_tools(toolkit: Toolkit) -> None:
toolkit.register(delegate_to_kimi, name="delegate_to_kimi")
toolkit.register(list_swarm_agents, name="list_swarm_agents")
except Exception as exc:
logger.warning("Tool execution failed (Delegation tools registration): %s", exc)
logger.debug("Delegation tools not available")
logger.error("Failed to register Delegation tools: %s", exc)
raise
def _register_gematria_tool(toolkit: Toolkit) -> None:
@@ -687,8 +690,8 @@ def _register_gematria_tool(toolkit: Toolkit) -> None:
toolkit.register(gematria, name="gematria")
except (ImportError, AttributeError) as exc:
logger.warning("Tool execution failed (Gematria registration): %s", exc)
logger.debug("Gematria tool not available")
logger.error("Failed to register Gematria tool: %s", exc)
raise
def _register_artifact_tools(toolkit: Toolkit) -> None:
@@ -699,8 +702,8 @@ def _register_artifact_tools(toolkit: Toolkit) -> None:
toolkit.register(jot_note, name="jot_note")
toolkit.register(log_decision, name="log_decision")
except (ImportError, AttributeError) as exc:
logger.warning("Tool execution failed (Artifact tools registration): %s", exc)
logger.debug("Artifact tools not available")
logger.error("Failed to register Artifact tools: %s", exc)
raise
def _register_thinking_tools(toolkit: Toolkit) -> None:
@@ -710,8 +713,8 @@ def _register_thinking_tools(toolkit: Toolkit) -> None:
toolkit.register(search_thoughts, name="thought_search")
except (ImportError, AttributeError) as exc:
logger.warning("Tool execution failed (Thinking tools registration): %s", exc)
logger.debug("Thinking tools not available")
logger.error("Failed to register Thinking tools: %s", exc)
raise
def create_full_toolkit(base_dir: str | Path | None = None):

View File

@@ -2547,44 +2547,3 @@
.tower-adv-title { font-size: 0.85rem; font-weight: 600; color: var(--text-bright); }
.tower-adv-detail { font-size: 0.8rem; color: var(--text); margin-top: 2px; }
.tower-adv-action { font-size: 0.75rem; color: var(--green); margin-top: 4px; font-style: italic; }
/* ═══════════════════════════════════════════════════════════════
Dreaming Mode
═══════════════════════════════════════════════════════════════ */
.dream-active {
display: flex; align-items: center; gap: 8px;
padding: 6px 0;
}
.dream-label { font-size: 0.75rem; font-weight: 700; color: var(--purple); letter-spacing: 0.12em; }
.dream-summary { font-size: 0.75rem; color: var(--text-dim); font-style: italic; flex: 1; }
.dream-pulse {
display: inline-block; width: 8px; height: 8px; border-radius: 50%;
background: var(--purple);
animation: dream-pulse 1.8s ease-in-out infinite;
}
@keyframes dream-pulse {
0%, 100% { opacity: 1; transform: scale(1); }
50% { opacity: 0.4; transform: scale(0.7); }
}
.dream-dot {
display: inline-block; width: 7px; height: 7px; border-radius: 50%;
}
.dream-dot-idle { background: var(--amber); }
.dream-dot-standby { background: var(--text-dim); }
.dream-idle, .dream-standby {
display: flex; align-items: center; gap: 6px; padding: 4px 0;
}
.dream-label-idle { font-size: 0.7rem; font-weight: 700; color: var(--amber); letter-spacing: 0.1em; }
.dream-label-standby { font-size: 0.7rem; font-weight: 700; color: var(--text-dim); letter-spacing: 0.1em; }
.dream-idle-meta { font-size: 0.7rem; color: var(--text-dim); }
.dream-history { border-top: 1px solid var(--border); padding-top: 6px; }
.dream-record { padding: 4px 0; border-bottom: 1px solid var(--border); }
.dream-record:last-child { border-bottom: none; }
.dream-rule { font-size: 0.75rem; color: var(--text); font-style: italic; }
.dream-meta { font-size: 0.65rem; color: var(--text-dim); margin-top: 2px; }

View File

@@ -0,0 +1,621 @@
"""Unit tests for timmy.backlog_triage — autonomous backlog triage loop."""
from datetime import UTC, datetime
from unittest.mock import AsyncMock, MagicMock, patch
import pytest
from timmy.backlog_triage import (
AGENT_CLAUDE,
AGENT_KIMI,
KIMI_READY_LABEL,
OWNER_LOGIN,
READY_THRESHOLD,
BacklogTriageLoop,
ScoredIssue,
TriageCycleResult,
TriageDecision,
_build_audit_comment,
_build_daily_summary,
_extract_tags,
_score_acceptance,
_score_alignment,
_score_scope,
decide,
score_issue,
)
# ── Fixtures ─────────────────────────────────────────────────────────────────
def _make_raw_issue(
    number: int = 1,
    title: str = "Fix the login bug",
    body: str = "## Problem\nLogin fails on empty password.\n\n## Steps\nassert response == 200",
    labels: list | None = None,
    assignees: list | None = None,
    created_at: str = "2026-03-20T10:00:00Z",
) -> dict:
    """Build a Gitea-style raw issue payload with test-friendly defaults."""
    # Wrap plain strings into the {"name": ...} / {"login": ...} objects
    # the triage code expects from the Gitea API.
    label_objs = [{"name": name} for name in (labels or [])]
    assignee_objs = [{"login": login} for login in (assignees or [])]
    return {
        "number": number,
        "title": title,
        "body": body,
        "labels": label_objs,
        "assignees": assignee_objs,
        "created_at": created_at,
    }
def _make_scored_issue(
    number: int = 1,
    title: str = "Fix login bug",
    issue_type: str = "bug",
    score: int = 7,
    ready: bool = True,
    is_p0: bool = True,
    is_blocked: bool = False,
    assignees: list | None = None,
    tags: set | None = None,
    labels: list | None = None,
    age_days: int = 3,
) -> ScoredIssue:
    """Build a ScoredIssue with sensible defaults for decide()/summary tests."""
    # Fixed sub-scores (scope/acceptance/alignment) keep the record consistent
    # regardless of the overall `score` a test chooses.
    fields = dict(
        number=number,
        title=title,
        body="",
        labels=labels or [],
        tags=tags or {"bug"},
        assignees=assignees or [],
        created_at=datetime.now(UTC),
        issue_type=issue_type,
        score=score,
        scope=2,
        acceptance=2,
        alignment=3,
        ready=ready,
        age_days=age_days,
        is_p0=is_p0,
        is_blocked=is_blocked,
    )
    return ScoredIssue(**fields)
# ── _extract_tags ─────────────────────────────────────────────────────────────
class TestExtractTags:
    """_extract_tags: bracketed title tags plus label names, all lowercased."""

    def test_bracket_tags_in_title(self):
        tags = _extract_tags("[Bug] Login fails", [])
        assert "bug" in tags

    def test_multiple_brackets(self):
        tags = _extract_tags("[Bug][P0] Crash on startup", [])
        assert "bug" in tags
        assert "p0" in tags

    def test_label_names(self):
        tags = _extract_tags("Fix thing", ["security", "hotfix"])
        assert "security" in tags
        assert "hotfix" in tags

    def test_labels_lowercased(self):
        tags = _extract_tags("Title", ["Bug", "FEATURE"])
        assert "bug" in tags
        assert "feature" in tags

    def test_empty_inputs(self):
        tags = _extract_tags("", [])
        assert tags == set()
# ── Scoring functions ─────────────────────────────────────────────────────────
class TestScoreScope:
    """_score_scope: file/function references and short titles add points;
    meta tags penalize; result is capped at 3."""

    def test_file_reference_adds_point(self):
        score = _score_scope("Fix auth", "Edit src/timmy/auth.py", set())
        assert score >= 1

    def test_function_reference_adds_point(self):
        score = _score_scope("Fix auth", "def validate_token()", set())
        assert score >= 1

    def test_short_title_adds_point(self):
        score = _score_scope("Short title", "", set())
        assert score >= 1

    def test_meta_tag_penalizes(self):
        score = _score_scope("Discussion about philosophy", "long body " * 5, {"philosophy"})
        assert score <= 1

    def test_max_score_3(self):
        score = _score_scope("Fix auth", "src/auth.py\ndef login()", set())
        assert score <= 3
class TestScoreAcceptance:
    """_score_acceptance: acceptance keywords, test references, and structured
    sections add points; meta tags penalize; empty body scores zero."""

    def test_acceptance_keywords(self):
        body = "should return 200\nmust pass tests\nexpect response"
        score = _score_acceptance("Title", body, set())
        assert score >= 2

    def test_test_reference_adds_point(self):
        score = _score_acceptance("Title", "Run tox -e unit", set())
        assert score >= 1

    def test_structured_sections(self):
        body = "## Problem\nX\n## Solution\nY"
        score = _score_acceptance("Title", body, set())
        assert score >= 1

    def test_meta_tag_penalizes(self):
        score = _score_acceptance("Title", "should do something", {"philosophy"})
        # still counts but penalized
        assert score <= 2

    def test_empty_body(self):
        score = _score_acceptance("Title", "", set())
        assert score == 0
class TestScoreAlignment:
    """_score_alignment: bug/hotfix tags max out at 3, refactor/feature score
    mid-range, meta tags zero out, loop-generated issues get a bonus."""

    def test_bug_tags_score_max(self):
        assert _score_alignment("", "", {"bug"}) == 3

    def test_hotfix_tag_max(self):
        assert _score_alignment("", "", {"hotfix"}) == 3

    def test_refactor_tag(self):
        score = _score_alignment("", "", {"refactor"})
        assert score >= 2

    def test_feature_tag(self):
        score = _score_alignment("", "", {"feature"})
        assert score >= 2

    def test_meta_tags_zero(self):
        assert _score_alignment("", "", {"philosophy"}) == 0

    def test_loop_generated_bonus(self):
        score = _score_alignment("", "", {"loop-generated"})
        assert score >= 1
# ── score_issue ───────────────────────────────────────────────────────────────
class TestScoreIssue:
    """score_issue: end-to-end scoring of a raw Gitea issue — classification,
    readiness, blocked/unassigned flags, age, and Kimi routing."""

    def test_bug_issue_classified_correctly(self):
        raw = _make_raw_issue(labels=["bug"], title="[Bug] Crash on startup")
        scored = score_issue(raw)
        assert scored.issue_type == "bug"
        assert scored.is_p0 is True

    def test_feature_issue_classified(self):
        raw = _make_raw_issue(labels=["feature"], title="Add voice support")
        scored = score_issue(raw)
        assert scored.issue_type == "feature"

    def test_philosophy_issue_classified(self):
        raw = _make_raw_issue(labels=["philosophy"], title="[Philosophy] Should Timmy sleep?")
        scored = score_issue(raw)
        assert scored.issue_type == "philosophy"

    def test_research_issue_classified(self):
        raw = _make_raw_issue(labels=["research"], title="Investigate model options")
        scored = score_issue(raw)
        assert scored.issue_type == "research"

    def test_ready_flag_set_when_score_high(self):
        # Body hits scope (file + function), acceptance (keywords + test
        # command + sections) and alignment (bug label) scorers at once.
        body = (
            "## Problem\nX breaks.\n## Solution\nFix src/timmy/agent.py def run()\n"
            "should return True\nmust pass tox -e unit"
        )
        raw = _make_raw_issue(labels=["bug"], body=body)
        scored = score_issue(raw)
        assert scored.score >= READY_THRESHOLD
        assert scored.ready is True

    def test_is_blocked_detected_in_body(self):
        raw = _make_raw_issue(body="This is blocked by issue #50")
        scored = score_issue(raw)
        assert scored.is_blocked is True

    def test_is_blocked_detected_in_title(self):
        raw = _make_raw_issue(title="[blocking] Cannot proceed")
        scored = score_issue(raw)
        # "blocking" in brackets becomes a tag
        assert scored.is_blocked is True

    def test_unassigned_when_no_assignees(self):
        raw = _make_raw_issue(assignees=[])
        scored = score_issue(raw)
        assert scored.is_unassigned is True

    def test_assigned_when_has_assignee(self):
        raw = _make_raw_issue(assignees=["claude"])
        scored = score_issue(raw)
        assert scored.is_unassigned is False

    def test_age_days_computed(self):
        old_ts = "2026-01-01T00:00:00Z"
        raw = _make_raw_issue(created_at=old_ts)
        scored = score_issue(raw)
        assert scored.age_days > 0

    def test_needs_kimi_for_research_label(self):
        # NOTE(review): despite the method name, this uses the kimi-ready
        # label rather than "research" — confirm which labels set needs_kimi.
        raw = _make_raw_issue(labels=["kimi-ready"])
        scored = score_issue(raw)
        assert scored.needs_kimi is True
# ── decide ────────────────────────────────────────────────────────────────────
class TestDecide:
    """decide(): routing of a ScoredIssue to skip / flag_alex / assign_kimi /
    assign_claude, with a human-readable reason attached."""

    def test_philosophy_skipped(self):
        issue = _make_scored_issue(issue_type="philosophy", tags={"philosophy"})
        d = decide(issue)
        assert d.action == "skip"
        assert "philosophy" in d.reason.lower()

    def test_assigned_issue_skipped(self):
        issue = _make_scored_issue(assignees=["perplexity"])
        d = decide(issue)
        assert d.action == "skip"
        assert "assigned" in d.reason.lower()

    def test_low_score_skipped(self):
        issue = _make_scored_issue(score=2, ready=False)
        d = decide(issue)
        assert d.action == "skip"
        assert "threshold" in d.reason.lower()

    def test_blocked_issue_flagged_for_alex(self):
        issue = _make_scored_issue(is_blocked=True)
        d = decide(issue)
        assert d.action == "flag_alex"
        assert d.agent == OWNER_LOGIN

    def test_research_issue_assigned_kimi(self):
        issue = _make_scored_issue(
            issue_type="research",
            tags={"research"},
            is_p0=False,
            is_blocked=False,
        )
        d = decide(issue)
        assert d.action == "assign_kimi"
        assert d.agent == AGENT_KIMI

    def test_kimi_ready_label_assigns_kimi(self):
        issue = _make_scored_issue(
            issue_type="unknown",
            tags={"kimi-ready"},
            labels=["kimi-ready"],
            is_p0=False,
            is_blocked=False,
        )
        d = decide(issue)
        assert d.action == "assign_kimi"

    def test_p0_bug_assigns_claude(self):
        issue = _make_scored_issue(issue_type="bug", is_p0=True, is_blocked=False)
        d = decide(issue)
        assert d.action == "assign_claude"
        assert d.agent == AGENT_CLAUDE

    def test_ready_feature_assigns_claude(self):
        issue = _make_scored_issue(
            issue_type="feature",
            is_p0=False,
            is_blocked=False,
            tags={"feature"},
        )
        d = decide(issue)
        assert d.action == "assign_claude"
        assert d.agent == AGENT_CLAUDE

    def test_decision_has_reason(self):
        issue = _make_scored_issue()
        d = decide(issue)
        assert len(d.reason) > 10
# ── _build_audit_comment ──────────────────────────────────────────────────────
class TestBuildAuditComment:
    """_build_audit_comment: the issue comment left after a triage decision
    names the header, reason, target agent/label/owner, and override note."""

    def test_contains_timmy_triage_header(self):
        d = TriageDecision(42, "assign_claude", "High priority bug", agent=AGENT_CLAUDE)
        comment = _build_audit_comment(d)
        assert "Timmy Triage" in comment

    def test_contains_issue_reason(self):
        d = TriageDecision(42, "assign_claude", "Urgent P0 bug", agent=AGENT_CLAUDE)
        comment = _build_audit_comment(d)
        assert "Urgent P0 bug" in comment

    def test_assign_claude_mentions_agent(self):
        d = TriageDecision(42, "assign_claude", "reason", agent=AGENT_CLAUDE)
        comment = _build_audit_comment(d)
        assert AGENT_CLAUDE in comment

    def test_assign_kimi_mentions_label(self):
        d = TriageDecision(42, "assign_kimi", "reason", agent=AGENT_KIMI)
        comment = _build_audit_comment(d)
        assert KIMI_READY_LABEL in comment

    def test_flag_alex_mentions_owner(self):
        d = TriageDecision(42, "flag_alex", "blocked", agent=OWNER_LOGIN)
        comment = _build_audit_comment(d)
        assert OWNER_LOGIN in comment

    def test_contains_override_note(self):
        d = TriageDecision(42, "assign_claude", "reason", agent=AGENT_CLAUDE)
        comment = _build_audit_comment(d)
        assert "override" in comment.lower()
# ── _build_daily_summary ──────────────────────────────────────────────────────
class TestBuildDailySummary:
    """_build_daily_summary: the daily report includes counts, an Actions
    Taken section, the top scored issues, and an auto-generated footer."""

    def _make_result(self, decisions=None) -> TriageCycleResult:
        # Fixed counts (10 open / 8 scored / 5 ready) so tests can assert
        # their presence in the rendered summary text.
        return TriageCycleResult(
            timestamp=datetime.now(UTC).isoformat(),
            total_open=10,
            scored=8,
            ready=5,
            decisions=decisions or [],
        )

    def test_contains_open_count(self):
        result = self._make_result()
        scored = [_make_scored_issue(number=i, ready=True, score=6) for i in range(1, 4)]
        summary = _build_daily_summary(result, scored)
        assert "10" in summary  # total_open

    def test_contains_ready_count(self):
        result = self._make_result()
        summary = _build_daily_summary(result, [])
        assert "5" in summary

    def test_actions_taken_section(self):
        decisions = [
            TriageDecision(1, "assign_claude", "P0 bug", agent="claude", executed=True),
        ]
        result = self._make_result(decisions=decisions)
        summary = _build_daily_summary(result, [])
        assert "Actions Taken" in summary
        assert "#1" in summary

    def test_top_issues_listed(self):
        scored = [_make_scored_issue(number=99, ready=True, score=8)]
        result = self._make_result()
        summary = _build_daily_summary(result, scored)
        assert "#99" in summary

    def test_footer_present(self):
        summary = _build_daily_summary(self._make_result(), [])
        assert "Auto-generated" in summary
# ── BacklogTriageLoop ─────────────────────────────────────────────────────────
class TestBacklogTriageLoop:
    """Construction, lifecycle, and run_once() behaviour of BacklogTriageLoop."""

    def test_default_interval_from_settings(self):
        # With no explicit interval, the loop reads the configured cycle length.
        loop = BacklogTriageLoop()
        from config import settings
        assert loop._interval == float(settings.backlog_triage_interval_seconds)

    def test_custom_interval(self):
        # An explicit interval overrides the settings default (stored as float).
        loop = BacklogTriageLoop(interval=300)
        assert loop._interval == 300.0

    def test_dry_run_default(self):
        # The dry_run constructor flag is stored verbatim on the instance.
        loop = BacklogTriageLoop(dry_run=True)
        assert loop._dry_run is True

    def test_not_running_initially(self):
        loop = BacklogTriageLoop()
        assert loop.is_running is False

    def test_stop_sets_running_false(self):
        # stop() must clear the running flag even when set manually.
        loop = BacklogTriageLoop()
        loop._running = True
        loop.stop()
        assert loop._running is False

    def test_cycle_count_starts_zero(self):
        loop = BacklogTriageLoop()
        assert loop.cycle_count == 0

    @pytest.mark.asyncio
    async def test_run_once_skips_when_no_gitea_token(self):
        # Gitea enabled but token empty → the cycle bails out early with an
        # empty result instead of attempting any API calls.
        loop = BacklogTriageLoop()
        mock_settings = MagicMock()
        mock_settings.gitea_enabled = True
        mock_settings.gitea_token = ""
        mock_settings.backlog_triage_interval_seconds = 900
        mock_settings.backlog_triage_dry_run = False
        mock_settings.backlog_triage_daily_summary = False
        with patch("timmy.backlog_triage.settings", mock_settings):
            result = await loop.run_once()
        assert result.total_open == 0

    @pytest.mark.asyncio
    async def test_run_once_dry_run_no_api_writes(self):
        """In dry_run mode, decisions are made but no Gitea API writes happen."""
        loop = BacklogTriageLoop(dry_run=True, daily_summary=False)
        # One unassigned bug whose body satisfies the readiness heuristics
        # (problem/solution sections, file + function reference, criteria).
        raw_issues = [
            _make_raw_issue(
                number=10,
                title="Fix crash",
                labels=["bug"],
                body=(
                    "## Problem\nCrash on login.\n## Solution\nFix src/auth.py "
                    "def login()\nshould return 200\nmust pass tox tests"
                ),
            )
        ]
        mock_settings = MagicMock()
        mock_settings.gitea_enabled = True
        mock_settings.gitea_token = "fake-token"
        mock_settings.gitea_repo = "owner/repo"
        mock_settings.gitea_url = "http://gitea.local"
        mock_settings.backlog_triage_interval_seconds = 900
        mock_settings.backlog_triage_dry_run = True
        mock_settings.backlog_triage_daily_summary = False
        # HTTP stub: GET returns the issue list above.
        mock_client = AsyncMock()
        mock_client.get.return_value = MagicMock(
            status_code=200, json=MagicMock(return_value=raw_issues)
        )
        # The loop presumably enters the client via `async with`, so the
        # context manager must hand back the stubbed client — TODO confirm.
        mock_ctx = AsyncMock()
        mock_ctx.__aenter__.return_value = mock_client
        mock_ctx.__aexit__.return_value = False
        with (
            patch("timmy.backlog_triage.settings", mock_settings),
            patch("httpx.AsyncClient", return_value=mock_ctx),
        ):
            result = await loop.run_once()
        # No POST/PATCH calls in dry run
        mock_client.post.assert_not_called()
        mock_client.patch.assert_not_called()
        assert result.total_open == 1
        assert loop.cycle_count == 1
        assert len(loop.history) == 1

    @pytest.mark.asyncio
    async def test_run_once_assigns_unassigned_bug(self):
        """Unassigned ready bug should be assigned to Claude with audit comment."""
        loop = BacklogTriageLoop(dry_run=False, daily_summary=False)
        body = (
            "## Problem\nCrash on login.\n## Solution\nFix src/auth.py "
            "def login()\nshould return 200\nmust pass tox tests"
        )
        raw_issues = [_make_raw_issue(number=5, title="Fix crash", labels=["bug"], body=body)]
        mock_settings = MagicMock()
        mock_settings.gitea_enabled = True
        mock_settings.gitea_token = "fake-token"
        mock_settings.gitea_repo = "owner/repo"
        mock_settings.gitea_url = "http://gitea.local"
        mock_settings.backlog_triage_interval_seconds = 900
        mock_settings.backlog_triage_dry_run = False
        mock_settings.backlog_triage_daily_summary = False
        # GET /issues returns our issue
        get_issues_resp = MagicMock(status_code=200)
        get_issues_resp.json.return_value = raw_issues
        # POST /comments returns success
        comment_resp = MagicMock(status_code=201)
        comment_resp.json.return_value = {"id": 1}
        # PATCH /issues/{n} (assign) returns success
        assign_resp = MagicMock(status_code=200)
        assign_resp.json.return_value = {"number": 5}
        mock_client = AsyncMock()
        mock_client.get.return_value = get_issues_resp
        mock_client.post.return_value = comment_resp
        mock_client.patch.return_value = assign_resp
        mock_ctx = AsyncMock()
        mock_ctx.__aenter__.return_value = mock_client
        mock_ctx.__aexit__.return_value = False
        # asyncio.sleep is patched so any internal pacing/backoff is instant.
        with (
            patch("timmy.backlog_triage.settings", mock_settings),
            patch("httpx.AsyncClient", return_value=mock_ctx),
            patch("asyncio.sleep", new_callable=AsyncMock),
        ):
            result = await loop.run_once()
        assert result.total_open == 1
        # Comment should have been posted
        mock_client.post.assert_called()
        # Assign should have been called (PATCH)
        mock_client.patch.assert_called()

    @pytest.mark.asyncio
    async def test_run_once_skips_already_assigned(self):
        """Issues already assigned should not be acted upon."""
        loop = BacklogTriageLoop(dry_run=False, daily_summary=False)
        raw_issues = [
            _make_raw_issue(
                number=3,
                labels=["bug"],
                assignees=["perplexity"],
                body="## Problem\nX\nmust pass tox\nshould return 200 at least 3 times",
            )
        ]
        mock_settings = MagicMock()
        mock_settings.gitea_enabled = True
        mock_settings.gitea_token = "tok"
        mock_settings.gitea_repo = "owner/repo"
        mock_settings.gitea_url = "http://gitea.local"
        mock_settings.backlog_triage_interval_seconds = 900
        mock_settings.backlog_triage_dry_run = False
        mock_settings.backlog_triage_daily_summary = False
        get_resp = MagicMock(status_code=200)
        get_resp.json.return_value = raw_issues
        mock_client = AsyncMock()
        mock_client.get.return_value = get_resp
        mock_ctx = AsyncMock()
        mock_ctx.__aenter__.return_value = mock_client
        mock_ctx.__aexit__.return_value = False
        with (
            patch("timmy.backlog_triage.settings", mock_settings),
            patch("httpx.AsyncClient", return_value=mock_ctx),
        ):
            result = await loop.run_once()
        # No writes for already-assigned issue
        mock_client.post.assert_not_called()
        mock_client.patch.assert_not_called()
        assert result.decisions[0].action == "skip"
# ── ScoredIssue properties ────────────────────────────────────────────────────
class TestScoredIssueProperties:
    """Derived-property checks on ScoredIssue."""

    def test_is_unassigned_true_when_no_assignees(self):
        assert _make_scored_issue(assignees=[]).is_unassigned is True

    def test_is_unassigned_false_when_assigned(self):
        assert _make_scored_issue(assignees=["claude"]).is_unassigned is False

    def test_needs_kimi_for_research_tag(self):
        assert _make_scored_issue(tags={"research"}).needs_kimi is True

    def test_needs_kimi_for_kimi_ready_label(self):
        assert _make_scored_issue(tags=set(), labels=["kimi-ready"]).needs_kimi is True

    def test_needs_kimi_false_for_bug(self):
        assert _make_scored_issue(labels=[], tags={"bug"}).needs_kimi is False

View File

@@ -1,217 +0,0 @@
"""Unit tests for the Dreaming mode engine."""
import sqlite3
from contextlib import closing
from datetime import UTC, datetime, timedelta
from unittest.mock import AsyncMock, patch
import pytest
from timmy.dreaming import _SESSION_GAP_SECONDS, DreamingEngine, DreamRecord
pytestmark = pytest.mark.unit
# ── Fixtures ──────────────────────────────────────────────────────────────────
@pytest.fixture()
def tmp_dreams_db(tmp_path):
    """Location for a throwaway dreams database under pytest's tmp dir."""
    db_file = tmp_path / "dreams.db"
    return db_file
@pytest.fixture()
def engine(tmp_dreams_db):
    """A fresh DreamingEngine wired to the temporary database."""
    dreaming_engine = DreamingEngine(db_path=tmp_dreams_db)
    return dreaming_engine
@pytest.fixture()
def chat_db(tmp_path):
    """Create a minimal chat database pre-populated with one short dialogue.

    All messages sit roughly two hours in the past, spaced a few seconds to a
    few minutes apart, so they form a single conversational session.
    """
    db_path = tmp_path / "chat.db"
    with closing(sqlite3.connect(str(db_path))) as conn:
        conn.execute("""
            CREATE TABLE IF NOT EXISTS chat_messages (
                id INTEGER PRIMARY KEY AUTOINCREMENT,
                role TEXT NOT NULL,
                content TEXT NOT NULL,
                timestamp TEXT NOT NULL,
                source TEXT NOT NULL DEFAULT 'browser'
            )
        """)
        # Anchor the dialogue two hours ago; each row is offset forward by a
        # fixed number of seconds so timestamps increase monotonically.
        base = datetime.now(UTC) - timedelta(hours=2)
        dialogue = [
            ("user", "Hello, can you help me?", 0),
            ("agent", "Of course! What do you need?", 5),
            ("user", "How does Python handle errors?", 60),
            ("agent", "Python uses try/except blocks.", 120),
            ("user", "Thanks!", 180),
        ]
        conn.executemany(
            "INSERT INTO chat_messages (role, content, timestamp) VALUES (?, ?, ?)",
            [
                (role, text, (base + timedelta(seconds=offset)).isoformat())
                for role, text, offset in dialogue
            ],
        )
        conn.commit()
    return db_path
# ── Idle detection ─────────────────────────────────────────────────────────────
class TestIdleDetection:
    """Idle-timer behaviour of the DreamingEngine."""

    def test_not_idle_immediately(self, engine):
        # A freshly constructed engine has just seen "activity".
        assert engine.is_idle() is False

    def test_idle_after_threshold(self, engine):
        engine._last_activity_time = datetime.now(UTC) - timedelta(minutes=20)
        with patch("timmy.dreaming.settings") as cfg:
            cfg.dreaming_idle_threshold_minutes = 10
            assert engine.is_idle() is True

    def test_not_idle_when_threshold_zero(self, engine):
        # A zero threshold disables idle detection entirely.
        engine._last_activity_time = datetime.now(UTC) - timedelta(hours=99)
        with patch("timmy.dreaming.settings") as cfg:
            cfg.dreaming_idle_threshold_minutes = 0
            assert engine.is_idle() is False

    def test_record_activity_resets_timer(self, engine):
        engine._last_activity_time = datetime.now(UTC) - timedelta(minutes=30)
        engine.record_activity()
        with patch("timmy.dreaming.settings") as cfg:
            cfg.dreaming_idle_threshold_minutes = 10
            assert engine.is_idle() is False
# ── Status dict ───────────────────────────────────────────────────────────────
class TestGetStatus:
    """Shape and defaults of DreamingEngine.get_status()."""

    def test_status_shape(self, engine):
        with patch("timmy.dreaming.settings") as cfg:
            cfg.dreaming_enabled = True
            cfg.dreaming_idle_threshold_minutes = 10
            status = engine.get_status()
        expected = {"enabled", "dreaming", "idle", "dream_count", "idle_minutes"}
        assert expected <= status.keys()

    def test_dream_count_starts_at_zero(self, engine):
        with patch("timmy.dreaming.settings") as cfg:
            cfg.dreaming_enabled = True
            cfg.dreaming_idle_threshold_minutes = 10
            assert engine.get_status()["dream_count"] == 0
# ── Session grouping ──────────────────────────────────────────────────────────
class TestGroupIntoSessions:
    """Splitting raw chat rows into conversation sessions by time gap."""

    @staticmethod
    def _two_rows(gap_seconds):
        # Two messages separated by the given number of seconds.
        start = datetime.now(UTC)
        return [
            {"role": "user", "content": "hi", "timestamp": start.isoformat()},
            {
                "role": "agent",
                "content": "hello",
                "timestamp": (start + timedelta(seconds=gap_seconds)).isoformat(),
            },
        ]

    def test_single_session(self, engine):
        sessions = engine._group_into_sessions(self._two_rows(10))
        assert len(sessions) == 1
        assert len(sessions[0]) == 2

    def test_splits_on_large_gap(self, engine):
        sessions = engine._group_into_sessions(self._two_rows(_SESSION_GAP_SECONDS + 100))
        assert len(sessions) == 2

    def test_empty_input(self, engine):
        assert engine._group_into_sessions([]) == []
# ── Dream storage ─────────────────────────────────────────────────────────────
class TestDreamStorage:
    """Persistence round-trip for stored dream records."""

    def test_store_and_retrieve(self, engine):
        stored = engine._store_dream(
            session_excerpt="User asked about Python.",
            decision_point="Python uses try/except blocks.",
            simulation="I could have given a code example.",
            proposed_rule="When explaining errors, include a code snippet.",
        )
        assert stored.id
        assert stored.proposed_rule == "When explaining errors, include a code snippet."
        fetched = engine.get_recent_dreams(limit=1)
        assert len(fetched) == 1
        assert fetched[0].id == stored.id

    def test_count_increments(self, engine):
        assert engine.count_dreams() == 0
        engine._store_dream(
            session_excerpt="test",
            decision_point="test",
            simulation="test",
            proposed_rule="test",
        )
        assert engine.count_dreams() == 1
# ── dream_once integration ─────────────────────────────────────────────────────
class TestDreamOnce:
    """Integration-style tests for DreamingEngine.dream_once()."""

    @pytest.mark.asyncio
    async def test_skips_when_disabled(self, engine):
        # Feature flag off → dream_once is a no-op and returns None.
        with patch("timmy.dreaming.settings") as mock_settings:
            mock_settings.dreaming_enabled = False
            result = await engine.dream_once()
            assert result is None

    @pytest.mark.asyncio
    async def test_skips_when_not_idle(self, engine):
        # Recent activity keeps the engine non-idle, so no dream runs.
        engine._last_activity_time = datetime.now(UTC)
        with patch("timmy.dreaming.settings") as mock_settings:
            mock_settings.dreaming_enabled = True
            mock_settings.dreaming_idle_threshold_minutes = 60
            result = await engine.dream_once()
            assert result is None

    @pytest.mark.asyncio
    async def test_skips_when_already_dreaming(self, engine):
        # With a cycle already flagged in flight, dream_once() must yield None.
        # (Threshold 0 also makes the engine non-idle — either guard suffices.)
        engine._is_dreaming = True
        with patch("timmy.dreaming.settings") as mock_settings:
            mock_settings.dreaming_enabled = True
            mock_settings.dreaming_idle_threshold_minutes = 0
            result = await engine.dream_once()
            # Reset for cleanliness
            engine._is_dreaming = False
            assert result is None

    @pytest.mark.asyncio
    async def test_dream_produces_record_when_idle(self, engine, chat_db):
        """Full cycle: idle + chat data + mocked LLM → produces DreamRecord."""
        engine._last_activity_time = datetime.now(UTC) - timedelta(hours=1)
        # chat_store.DB_PATH is patched so the engine reads the fixture's
        # chat history; _call_agent is stubbed in place of the real LLM.
        with (
            patch("timmy.dreaming.settings") as mock_settings,
            patch("timmy.dreaming.DreamingEngine._call_agent", new_callable=AsyncMock) as mock_agent,
            patch("infrastructure.chat_store.DB_PATH", chat_db),
        ):
            mock_settings.dreaming_enabled = True
            mock_settings.dreaming_idle_threshold_minutes = 10
            mock_settings.dreaming_timeout_seconds = 30
            # Two sequential agent calls are expected: the counterfactual
            # simulation first, then the distilled behavioural rule.
            mock_agent.side_effect = [
                "I could have provided a concrete try/except example.",  # simulation
                "When explaining errors, always include a runnable code snippet.",  # rule
            ]
            result = await engine.dream_once()
            assert result is not None
            assert isinstance(result, DreamRecord)
            assert result.simulation
            assert result.proposed_rule
            assert engine.count_dreams() == 1