fix: loop_guard GITEA_API default + queue.json validation guard (#951, #952)

2026-03-22 13:51:59 -04:00
18 changed files with 24 additions and 1208 deletions
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -50,7 +50,6 @@ sounddevice = { version = ">=0.4.6", optional = true }
 sentence-transformers = { version = ">=2.0.0", optional = true }
 numpy = { version = ">=1.24.0", optional = true }
 requests = { version = ">=2.31.0", optional = true }
-trafilatura = { version = ">=1.6.0", optional = true }
 GitPython = { version = ">=3.1.40", optional = true }
 pytest = { version = ">=8.0.0", optional = true }
 pytest-asyncio = { version = ">=0.24.0", optional = true }
@@ -68,7 +67,6 @@ voice = ["pyttsx3", "openai-whisper", "piper-tts", "sounddevice"]
 celery = ["celery"]
 embeddings = ["sentence-transformers", "numpy"]
 git = ["GitPython"]
-research = ["requests", "trafilatura"]
 dev = ["pytest", "pytest-asyncio", "pytest-cov", "pytest-timeout", "pytest-randomly", "pytest-xdist", "selenium"]

 [tool.poetry.group.dev.dependencies]
--- a/scripts/backfill_retro.py
+++ b/scripts/backfill_retro.py
@@ -17,23 +17,8 @@ REPO_ROOT = Path(__file__).resolve().parent.parent
 RETRO_FILE = REPO_ROOT / ".loop" / "retro" / "cycles.jsonl"
 SUMMARY_FILE = REPO_ROOT / ".loop" / "retro" / "summary.json"

-
-def _get_gitea_api() -> str:
-    """Read Gitea API URL from env var, then ~/.hermes/gitea_api file, then default."""
-    # Check env vars first (TIMMY_GITEA_API is preferred, GITEA_API for compatibility)
-    api_url = os.environ.get("TIMMY_GITEA_API") or os.environ.get("GITEA_API")
-    if api_url:
-        return api_url
-    # Check ~/.hermes/gitea_api file
-    api_file = Path.home() / ".hermes" / "gitea_api"
-    if api_file.exists():
-        return api_file.read_text().strip()
-    # Default fallback
-    return "http://localhost:3000/api/v1"
-
-
-GITEA_API = _get_gitea_api()
-REPO_SLUG = os.environ.get("REPO_SLUG", "rockachopa/Timmy-time-dashboard")
+GITEA_API = "http://localhost:3000/api/v1"
+REPO_SLUG = "rockachopa/Timmy-time-dashboard"
 TOKEN_FILE = Path.home() / ".hermes" / "gitea_token"

 TAG_RE = re.compile(r"\[([^\]]+)\]")
--- a/scripts/gitea_backup.sh
+++ b/scripts/gitea_backup.sh
@@ -1,83 +0,0 @@
-#!/bin/bash
-# Gitea backup script — run on the VPS before any hardening changes.
-# Usage: sudo bash scripts/gitea_backup.sh [off-site-dest]
-#
-# off-site-dest: optional rsync/scp destination for off-site copy
-#   e.g. user@backup-host:/backups/gitea/
-#
-# Refs: #971, #990
-
-set -euo pipefail
-
-BACKUP_DIR="/opt/gitea/backups"
-TIMESTAMP=$(date +"%Y%m%d_%H%M%S")
-GITEA_CONF="/etc/gitea/app.ini"
-GITEA_WORK_DIR="/var/lib/gitea"
-OFFSITE_DEST="${1:-}"
-
-echo "=== Gitea Backup — $TIMESTAMP ==="
-
-# Ensure backup directory exists
-mkdir -p "$BACKUP_DIR"
-cd "$BACKUP_DIR"
-
-# Run the dump
-echo "[1/4] Running gitea dump..."
-gitea dump -c "$GITEA_CONF"
-
-# Find the newest zip (gitea dump names it gitea-dump-*.zip)
-BACKUP_FILE=$(ls -t "$BACKUP_DIR"/gitea-dump-*.zip 2>/dev/null | head -1)
-
-if [ -z "$BACKUP_FILE" ]; then
-    echo "ERROR: No backup zip found in $BACKUP_DIR"
-    exit 1
-fi
-
-BACKUP_SIZE=$(stat -c%s "$BACKUP_FILE" 2>/dev/null || stat -f%z "$BACKUP_FILE")
-echo "[2/4] Backup created: $BACKUP_FILE ($BACKUP_SIZE bytes)"
-
-if [ "$BACKUP_SIZE" -eq 0 ]; then
-    echo "ERROR: Backup file is 0 bytes"
-    exit 1
-fi
-
-# Lock down permissions
-chmod 600 "$BACKUP_FILE"
-
-# Verify contents
-echo "[3/4] Verifying backup contents..."
-CONTENTS=$(unzip -l "$BACKUP_FILE" 2>/dev/null || true)
-
-check_component() {
-    if echo "$CONTENTS" | grep -q "$1"; then
-        echo "  OK: $2"
-    else
-        echo "  WARN: $2 not found in backup"
-    fi
-}
-
-check_component "gitea-db.sql"    "Database dump"
-check_component "gitea-repo"      "Repositories"
-check_component "custom"          "Custom config"
-check_component "app.ini"         "app.ini"
-
-# Off-site copy
-if [ -n "$OFFSITE_DEST" ]; then
-    echo "[4/4] Copying to off-site: $OFFSITE_DEST"
-    rsync -avz "$BACKUP_FILE" "$OFFSITE_DEST"
-    echo "  Off-site copy complete."
-else
-    echo "[4/4] No off-site destination provided. Skipping."
-    echo "  To copy later: scp $BACKUP_FILE user@backup-host:/backups/gitea/"
-fi
-
-echo ""
-echo "=== Backup complete ==="
-echo "File: $BACKUP_FILE"
-echo "Size: $BACKUP_SIZE bytes"
-echo ""
-echo "To verify restore on a clean instance:"
-echo "  1. Copy zip to test machine"
-echo "  2. unzip $BACKUP_FILE"
-echo "  3. gitea restore --from <extracted-dir> -c /etc/gitea/app.ini"
-echo "  4. Verify repos and DB are intact"
--- a/scripts/loop_guard.py
+++ b/scripts/loop_guard.py
@@ -30,22 +30,7 @@ IDLE_STATE_FILE = REPO_ROOT / ".loop" / "idle_state.json"
 CYCLE_RESULT_FILE = REPO_ROOT / ".loop" / "cycle_result.json"
 TOKEN_FILE = Path.home() / ".hermes" / "gitea_token"

-
-def _get_gitea_api() -> str:
-    """Read Gitea API URL from env var, then ~/.hermes/gitea_api file, then default."""
-    # Check env vars first (TIMMY_GITEA_API is preferred, GITEA_API for compatibility)
-    api_url = os.environ.get("TIMMY_GITEA_API") or os.environ.get("GITEA_API")
-    if api_url:
-        return api_url
-    # Check ~/.hermes/gitea_api file
-    api_file = Path.home() / ".hermes" / "gitea_api"
-    if api_file.exists():
-        return api_file.read_text().strip()
-    # Default fallback
-    return "http://localhost:3000/api/v1"
-
-
-GITEA_API = _get_gitea_api()
+GITEA_API = os.environ.get("GITEA_API", "http://143.198.27.163:3000/api/v1")
 REPO_SLUG = os.environ.get("REPO_SLUG", "rockachopa/Timmy-time-dashboard")

 # Default cycle duration in seconds (5 min); stale threshold = 2× this
@@ -202,11 +187,7 @@ def load_queue() -> list[dict]:
                # Persist the cleaned queue so stale entries don't recur
                _save_cleaned_queue(data, open_numbers)
        return ready
-    except json.JSONDecodeError as exc:
-        print(f"[loop-guard] WARNING: Corrupt queue.json ({exc}) — returning empty queue")
-        return []
-    except OSError as exc:
-        print(f"[loop-guard] WARNING: Cannot read queue.json ({exc}) — returning empty queue")
+    except (json.JSONDecodeError, OSError):
        return []


--- a/scripts/triage_score.py
+++ b/scripts/triage_score.py
@@ -20,28 +20,11 @@ from datetime import datetime, timezone
 from pathlib import Path

 # ── Config ──────────────────────────────────────────────────────────────
-
-
-def _get_gitea_api() -> str:
-    """Read Gitea API URL from env var, then ~/.hermes/gitea_api file, then default."""
-    # Check env vars first (TIMMY_GITEA_API is preferred, GITEA_API for compatibility)
-    api_url = os.environ.get("TIMMY_GITEA_API") or os.environ.get("GITEA_API")
-    if api_url:
-        return api_url
-    # Check ~/.hermes/gitea_api file
-    api_file = Path.home() / ".hermes" / "gitea_api"
-    if api_file.exists():
-        return api_file.read_text().strip()
-    # Default fallback
-    return "http://localhost:3000/api/v1"
-
-
-GITEA_API = _get_gitea_api()
+GITEA_API = os.environ.get("GITEA_API", "http://143.198.27.163:3000/api/v1")
 REPO_SLUG = os.environ.get("REPO_SLUG", "rockachopa/Timmy-time-dashboard")
 TOKEN_FILE = Path.home() / ".hermes" / "gitea_token"
 REPO_ROOT = Path(__file__).resolve().parent.parent
 QUEUE_FILE = REPO_ROOT / ".loop" / "queue.json"
-QUEUE_BACKUP_FILE = REPO_ROOT / ".loop" / "queue.json.bak"
 RETRO_FILE = REPO_ROOT / ".loop" / "retro" / "triage.jsonl"
 QUARANTINE_FILE = REPO_ROOT / ".loop" / "quarantine.json"
 CYCLE_RETRO_FILE = REPO_ROOT / ".loop" / "retro" / "cycles.jsonl"
@@ -343,36 +326,31 @@ def run_triage() -> list[dict]:
    ready = [s for s in scored if s["ready"]]
    not_ready = [s for s in scored if not s["ready"]]

-    # Save backup before writing (if current file exists and is valid)
+    QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
+    backup_file = QUEUE_FILE.with_suffix(".json.bak")
+
+    # Backup existing queue before overwriting
    if QUEUE_FILE.exists():
        try:
-            json.loads(QUEUE_FILE.read_text())  # Validate current file
-            QUEUE_BACKUP_FILE.write_text(QUEUE_FILE.read_text())
-        except (json.JSONDecodeError, OSError):
-            pass  # Current file is corrupt, don't overwrite backup
+            backup_file.write_text(QUEUE_FILE.read_text())
+        except OSError:
+            pass

-    # Write new queue file
-    QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    QUEUE_FILE.write_text(json.dumps(ready, indent=2) + "\n")
+    # Write and validate
+    queue_json = json.dumps(ready, indent=2) + "\n"
+    QUEUE_FILE.write_text(queue_json)

-    # Validate the write by re-reading and parsing
+    # Validate by re-reading — restore backup on corruption
    try:
-        json.loads(QUEUE_FILE.read_text())
-    except (json.JSONDecodeError, OSError) as exc:
-        print(f"[triage] ERROR: queue.json validation failed: {exc}", file=sys.stderr)
-        # Restore from backup if available
-        if QUEUE_BACKUP_FILE.exists():
-            try:
-                backup_data = QUEUE_BACKUP_FILE.read_text()
-                json.loads(backup_data)  # Validate backup
-                QUEUE_FILE.write_text(backup_data)
-                print(f"[triage] Restored queue.json from backup")
-            except (json.JSONDecodeError, OSError) as restore_exc:
-                print(f"[triage] ERROR: Backup restore failed: {restore_exc}", file=sys.stderr)
-                # Write empty list as last resort
-                QUEUE_FILE.write_text("[]\n")
+        validated = json.loads(QUEUE_FILE.read_text())
+        if not isinstance(validated, list):
+            raise ValueError("queue.json is not a list")
+    except (json.JSONDecodeError, ValueError) as e:
+        print(f"[triage] ERROR: queue.json validation failed: {e}", file=sys.stderr)
+        if backup_file.exists():
+            print("[triage] Restoring from backup", file=sys.stderr)
+            QUEUE_FILE.write_text(backup_file.read_text())
        else:
-            # No backup, write empty list
            QUEUE_FILE.write_text("[]\n")

    # Write retro entry
--- a/skills/research/architecture_spike.md
+++ b/skills/research/architecture_spike.md
@@ -1,67 +0,0 @@
---
-name: Architecture Spike
-type: research
-typical_query_count: 2-4
-expected_output_length: 600-1200 words
-cascade_tier: groq_preferred
-description: >
-  Investigate how to connect two systems or components. Produces an integration
-  architecture with sequence diagram, key decisions, and a proof-of-concept outline.
---
-
-# Architecture Spike: Connect {system_a} to {system_b}
-
-## Context
-
-We need to integrate **{system_a}** with **{system_b}** in the context of
-**{project_context}**. This spike answers: what is the best way to wire them
-together, and what are the trade-offs?
-
-## Constraints
-
- Prefer approaches that avoid adding new infrastructure dependencies.
- The integration should be **{sync_or_async}** (synchronous / asynchronous).
- Must work within: {environment_constraints}.
-
-## Research Steps
-
-1. Identify the APIs / protocols exposed by both systems.
-2. List all known integration patterns (direct API, message queue, webhook, SDK, etc.).
-3. Evaluate each pattern for complexity, reliability, and latency.
-4. Select the recommended approach and outline a proof-of-concept.
-
-## Output Format
-
-### Integration Options
-
-| Pattern | Complexity | Reliability | Latency | Notes |
-|---------|-----------|-------------|---------|-------|
-| ...     | ...       | ...         | ...     | ...   |
-
-### Recommended Approach
-
-**Pattern:** {pattern_name}
-
-**Why:** One paragraph explaining the choice.
-
-### Sequence Diagram
-
-```
-{system_a} -> {middleware} -> {system_b}
-```
-
-Describe the data flow step by step:
-
-1. {system_a} does X...
-2. {middleware} transforms / routes...
-3. {system_b} receives Y...
-
-### Proof-of-Concept Outline
-
- Files to create or modify
- Key libraries / dependencies needed
- Estimated effort: {effort_estimate}
-
-### Open Questions
-
-Bullet list of decisions that need human input before proceeding.
--- a/skills/research/competitive_scan.md
+++ b/skills/research/competitive_scan.md
@@ -1,74 +0,0 @@
---
-name: Competitive Scan
-type: research
-typical_query_count: 3-5
-expected_output_length: 800-1500 words
-cascade_tier: groq_preferred
-description: >
-  Compare a project against its alternatives. Produces a feature matrix,
-  strengths/weaknesses analysis, and positioning summary.
---
-
-# Competitive Scan: {project} vs Alternatives
-
-## Context
-
-Compare **{project}** against **{alternatives}** (comma-separated list of
-competitors). The goal is to understand where {project} stands and identify
-differentiation opportunities.
-
-## Constraints
-
- Comparison date: {date}.
- Focus areas: {focus_areas} (e.g., features, pricing, community, performance).
- Perspective: {perspective} (user, developer, business).
-
-## Research Steps
-
-1. Gather key facts about {project} (features, pricing, community size, release cadence).
-2. Gather the same data for each alternative in {alternatives}.
-3. Build a feature comparison matrix.
-4. Identify strengths and weaknesses for each entry.
-5. Summarize positioning and recommend next steps.
-
-## Output Format
-
-### Overview
-
-One paragraph: what space does {project} compete in, and who are the main players?
-
-### Feature Matrix
-
-| Feature / Attribute | {project} | {alt_1} | {alt_2} | {alt_3} |
-|--------------------|-----------|---------|---------|---------|
-| {feature_1}        | ...       | ...     | ...     | ...     |
-| {feature_2}        | ...       | ...     | ...     | ...     |
-| Pricing            | ...       | ...     | ...     | ...     |
-| License            | ...       | ...     | ...     | ...     |
-| Community Size     | ...       | ...     | ...     | ...     |
-| Last Major Release | ...       | ...     | ...     | ...     |
-
-### Strengths & Weaknesses
-
-#### {project}
- **Strengths:** ...
- **Weaknesses:** ...
-
-#### {alt_1}
- **Strengths:** ...
- **Weaknesses:** ...
-
-_(Repeat for each alternative)_
-
-### Positioning Map
-
-Describe where each project sits along the key dimensions (e.g., simplicity
-vs power, free vs paid, niche vs general).
-
-### Recommendations
-
-Bullet list of actions based on the competitive landscape:
-
- **Differentiate on:** {differentiator}
- **Watch out for:** {threat}
- **Consider adopting from {alt}:** {feature_or_approach}
--- a/skills/research/game_analysis.md
+++ b/skills/research/game_analysis.md
@@ -1,68 +0,0 @@
---
-name: Game Analysis
-type: research
-typical_query_count: 2-3
-expected_output_length: 600-1000 words
-cascade_tier: local_ok
-description: >
-  Evaluate a game for AI agent playability. Assesses API availability,
-  observation/action spaces, and existing bot ecosystems.
---
-
-# Game Analysis: {game}
-
-## Context
-
-Evaluate **{game}** to determine whether an AI agent can play it effectively.
-Focus on programmatic access, observation space, action space, and existing
-bot/AI ecosystems.
-
-## Constraints
-
- Platform: {platform} (PC, console, mobile, browser).
- Agent type: {agent_type} (reinforcement learning, rule-based, LLM-driven, hybrid).
- Budget for API/licenses: {budget}.
-
-## Research Steps
-
-1. Identify official APIs, modding support, or programmatic access methods for {game}.
-2. Characterize the observation space (screen pixels, game state JSON, memory reading, etc.).
-3. Characterize the action space (keyboard/mouse, API calls, controller inputs).
-4. Survey existing bots, AI projects, or research papers for {game}.
-5. Assess feasibility and difficulty for the target agent type.
-
-## Output Format
-
-### Game Profile
-
-| Property          | Value                  |
-|-------------------|------------------------|
-| Game              | {game}                 |
-| Genre             | {genre}                |
-| Platform          | {platform}             |
-| API Available     | Yes / No / Partial     |
-| Mod Support       | Yes / No / Limited     |
-| Existing AI Work  | Extensive / Some / None|
-
-### Observation Space
-
-Describe what data the agent can access and how (API, screen capture, memory hooks, etc.).
-
-### Action Space
-
-Describe how the agent can interact with the game (input methods, timing constraints, etc.).
-
-### Existing Ecosystem
-
-List known bots, frameworks, research papers, or communities working on AI for {game}.
-
-### Feasibility Assessment
-
- **Difficulty:** Easy / Medium / Hard / Impractical
- **Best approach:** {recommended_agent_type}
- **Key challenges:** Bullet list
- **Estimated time to MVP:** {time_estimate}
-
-### Recommendation
-
-One paragraph: should we proceed, and if so, what is the first step?
--- a/skills/research/integration_guide.md
+++ b/skills/research/integration_guide.md
@@ -1,79 +0,0 @@
---
-name: Integration Guide
-type: research
-typical_query_count: 3-5
-expected_output_length: 1000-2000 words
-cascade_tier: groq_preferred
-description: >
-  Step-by-step guide to wire a specific tool into an existing stack,
-  complete with code samples, configuration, and testing steps.
---
-
-# Integration Guide: Wire {tool} into {stack}
-
-## Context
-
-Integrate **{tool}** into our **{stack}** stack. The goal is to
-**{integration_goal}** (e.g., "add vector search to the dashboard",
-"send notifications via Telegram").
-
-## Constraints
-
- Must follow existing project conventions (see CLAUDE.md).
- No new cloud AI dependencies unless explicitly approved.
- Environment config via `pydantic-settings` / `config.py`.
-
-## Research Steps
-
-1. Review {tool}'s official documentation for installation and setup.
-2. Identify the minimal dependency set required.
-3. Map {tool}'s API to our existing patterns (singletons, graceful degradation).
-4. Write integration code with proper error handling.
-5. Define configuration variables and their defaults.
-
-## Output Format
-
-### Prerequisites
-
- Dependencies to install (with versions)
- External services or accounts required
- Environment variables to configure
-
-### Configuration
-
-```python
-# In config.py — add these fields to Settings:
-{config_fields}
-```
-
-### Implementation
-
-```python
-# {file_path}
-{implementation_code}
-```
-
-### Graceful Degradation
-
-Describe how the integration behaves when {tool} is unavailable:
-
-| Scenario              | Behavior           | Log Level |
-|-----------------------|--------------------|-----------|
-| {tool} not installed  | {fallback}         | WARNING   |
-| {tool} unreachable    | {fallback}         | WARNING   |
-| Invalid credentials   | {fallback}         | ERROR     |
-
-### Testing
-
-```python
-# tests/unit/test_{tool_snake}.py
-{test_code}
-```
-
-### Verification Checklist
-
- [ ] Dependency added to pyproject.toml
- [ ] Config fields added with sensible defaults
- [ ] Graceful degradation tested (service down)
- [ ] Unit tests pass (`tox -e unit`)
- [ ] No new linting errors (`tox -e lint`)
--- a/skills/research/state_of_art.md
+++ b/skills/research/state_of_art.md
@@ -1,67 +0,0 @@
---
-name: State of the Art
-type: research
-typical_query_count: 4-6
-expected_output_length: 1000-2000 words
-cascade_tier: groq_preferred
-description: >
-  Comprehensive survey of what currently exists in a given field or domain.
-  Produces a structured landscape overview with key players, trends, and gaps.
---
-
-# State of the Art: {field} (as of {date})
-
-## Context
-
-Survey the current landscape of **{field}**. Identify key players, recent
-developments, dominant approaches, and notable gaps. This is a point-in-time
-snapshot intended to inform decision-making.
-
-## Constraints
-
- Focus on developments from the last {timeframe} (e.g., 12 months, 2 years).
- Prioritize {priority} (open-source, commercial, academic, or all).
- Target audience: {audience} (technical team, leadership, general).
-
-## Research Steps
-
-1. Identify the major categories or sub-domains within {field}.
-2. For each category, list the leading projects, companies, or research groups.
-3. Note recent milestones, releases, or breakthroughs.
-4. Identify emerging trends and directions.
-5. Highlight gaps — things that don't exist yet but should.
-
-## Output Format
-
-### Executive Summary
-
-Two to three sentences: what is the state of {field} right now?
-
-### Landscape Map
-
-| Category       | Key Players              | Maturity    | Trend       |
-|---------------|--------------------------|-------------|-------------|
-| {category_1}  | {player_a}, {player_b}   | Early / GA  | Growing / Stable / Declining |
-| {category_2}  | {player_c}, {player_d}   | Early / GA  | Growing / Stable / Declining |
-
-### Recent Milestones
-
-Chronological list of notable events in the last {timeframe}:
-
- **{date_1}:** {event_description}
- **{date_2}:** {event_description}
-
-### Trends
-
-Numbered list of the top 3-5 trends shaping {field}:
-
-1. **{trend_name}** — {one-line description}
-2. **{trend_name}** — {one-line description}
-
-### Gaps & Opportunities
-
-Bullet list of things that are missing, underdeveloped, or ripe for innovation.
-
-### Implications for Us
-
-One paragraph: what does this mean for our project? What should we do next?
--- a/skills/research/tool_evaluation.md
+++ b/skills/research/tool_evaluation.md
@@ -1,52 +0,0 @@
---
-name: Tool Evaluation
-type: research
-typical_query_count: 3-5
-expected_output_length: 800-1500 words
-cascade_tier: groq_preferred
-description: >
-  Discover and evaluate all shipping tools/libraries/services in a given domain.
-  Produces a ranked comparison table with pros, cons, and recommendation.
---
-
-# Tool Evaluation: {domain}
-
-## Context
-
-You are researching tools, libraries, and services for **{domain}**.
-The goal is to find everything that is currently shipping (not vaporware)
-and produce a structured comparison.
-
-## Constraints
-
- Only include tools that have public releases or hosted services available today.
- If a tool is in beta/preview, note that clearly.
- Focus on {focus_criteria} when evaluating (e.g., cost, ease of integration, community size).
-
-## Research Steps
-
-1. Identify all actively-maintained tools in the **{domain}** space.
-2. For each tool, gather: name, URL, license/pricing, last release date, language/platform.
-3. Evaluate each tool against the focus criteria.
-4. Rank by overall fit for the use case: **{use_case}**.
-
-## Output Format
-
-### Summary
-
-One paragraph: what the landscape looks like and the top recommendation.
-
-### Comparison Table
-
-| Tool | License / Price | Last Release | Language | {focus_criteria} Score | Notes |
-|------|----------------|--------------|----------|----------------------|-------|
-| ...  | ...            | ...          | ...      | ...                  | ...   |
-
-### Top Pick
-
- **Recommended:** {tool_name} — {one-line reason}
- **Runner-up:** {tool_name} — {one-line reason}
-
-### Risks & Gaps
-
-Bullet list of things to watch out for (missing features, vendor lock-in, etc.).
--- a/src/dashboard/routes/system.py
+++ b/src/dashboard/routes/system.py
@@ -56,13 +56,11 @@ async def self_modify_queue(request: Request):

@router.get("/swarm/mission-control", response_class=HTMLResponse)
 async def mission_control(request: Request):
-    """Render the swarm mission control dashboard page."""
    return templates.TemplateResponse(request, "mission_control.html", {})


@router.get("/bugs", response_class=HTMLResponse)
 async def bugs_page(request: Request):
-    """Render the bug tracking page."""
    return templates.TemplateResponse(
        request,
        "bugs.html",
@@ -77,19 +75,16 @@ async def bugs_page(request: Request):

@router.get("/self-coding", response_class=HTMLResponse)
 async def self_coding(request: Request):
-    """Render the self-coding automation status page."""
    return templates.TemplateResponse(request, "self_coding.html", {"stats": {}})


@router.get("/hands", response_class=HTMLResponse)
 async def hands_page(request: Request):
-    """Render the hands (automation executions) page."""
    return templates.TemplateResponse(request, "hands.html", {"executions": []})


@router.get("/creative/ui", response_class=HTMLResponse)
 async def creative_ui(request: Request):
-    """Render the creative UI playground page."""
    return templates.TemplateResponse(request, "creative.html", {})


--- a/src/dashboard/routes/tasks.py
+++ b/src/dashboard/routes/tasks.py
@@ -145,7 +145,6 @@ async def tasks_page(request: Request):

@router.get("/tasks/pending", response_class=HTMLResponse)
 async def tasks_pending(request: Request):
-    """Return HTMX partial for pending approval tasks."""
    with _get_db() as db:
        rows = db.execute(
            "SELECT * FROM tasks WHERE status='pending_approval' ORDER BY created_at DESC"
@@ -165,7 +164,6 @@ async def tasks_pending(request: Request):

@router.get("/tasks/active", response_class=HTMLResponse)
 async def tasks_active(request: Request):
-    """Return HTMX partial for active (approved/running/paused) tasks."""
    with _get_db() as db:
        rows = db.execute(
            "SELECT * FROM tasks WHERE status IN ('approved','running','paused') ORDER BY created_at DESC"
@@ -185,7 +183,6 @@ async def tasks_active(request: Request):

@router.get("/tasks/completed", response_class=HTMLResponse)
 async def tasks_completed(request: Request):
-    """Return HTMX partial for completed/vetoed/failed tasks (last 50)."""
    with _get_db() as db:
        rows = db.execute(
            "SELECT * FROM tasks WHERE status IN ('completed','vetoed','failed') ORDER BY completed_at DESC LIMIT 50"
@@ -244,31 +241,26 @@ async def create_task_form(

@router.post("/tasks/{task_id}/approve", response_class=HTMLResponse)
 async def approve_task(request: Request, task_id: str):
-    """Approve a pending task and move it to active queue."""
    return await _set_status(request, task_id, "approved")


@router.post("/tasks/{task_id}/veto", response_class=HTMLResponse)
 async def veto_task(request: Request, task_id: str):
-    """Veto a task, marking it as rejected."""
    return await _set_status(request, task_id, "vetoed")


@router.post("/tasks/{task_id}/pause", response_class=HTMLResponse)
 async def pause_task(request: Request, task_id: str):
-    """Pause a running or approved task."""
    return await _set_status(request, task_id, "paused")


@router.post("/tasks/{task_id}/cancel", response_class=HTMLResponse)
 async def cancel_task(request: Request, task_id: str):
-    """Cancel a task (marks as vetoed)."""
    return await _set_status(request, task_id, "vetoed")


@router.post("/tasks/{task_id}/retry", response_class=HTMLResponse)
 async def retry_task(request: Request, task_id: str):
-    """Retry a failed/vetoed task by moving it back to approved."""
    return await _set_status(request, task_id, "approved")


@@ -279,7 +271,6 @@ async def modify_task(
    title: str = Form(...),
    description: str = Form(""),
 ):
-    """Update task title and description."""
    with _get_db() as db:
        db.execute(
            "UPDATE tasks SET title=?, description=? WHERE id=?",
--- a/src/timmy/tools.py
+++ b/src/timmy/tools.py
@@ -473,69 +473,6 @@ def consult_grok(query: str) -> str:
    return response


-def web_fetch(url: str, max_tokens: int = 4000) -> str:
-    """Fetch a web page and return its main text content.
-
-    Downloads the URL, extracts readable text using trafilatura, and
-    truncates to a token budget.  Use this to read full articles, docs,
-    or blog posts that web_search only returns snippets for.
-
-    Args:
-        url: The URL to fetch (must start with http:// or https://).
-        max_tokens: Maximum approximate token budget (default 4000).
-                    Text is truncated to max_tokens * 4 characters.
-
-    Returns:
-        Extracted text content, or an error message on failure.
-    """
-    if not url or not url.startswith(("http://", "https://")):
-        return f"Error: invalid URL — must start with http:// or https://: {url!r}"
-
-    try:
-        import requests as _requests
-    except ImportError:
-        return "Error: 'requests' package is not installed. Install with: pip install requests"
-
-    try:
-        import trafilatura
-    except ImportError:
-        return (
-            "Error: 'trafilatura' package is not installed. Install with: pip install trafilatura"
-        )
-
-    try:
-        resp = _requests.get(
-            url,
-            timeout=15,
-            headers={"User-Agent": "TimmyResearchBot/1.0"},
-        )
-        resp.raise_for_status()
-    except _requests.exceptions.Timeout:
-        return f"Error: request timed out after 15 seconds for {url}"
-    except _requests.exceptions.HTTPError as exc:
-        return f"Error: HTTP {exc.response.status_code} for {url}"
-    except _requests.exceptions.RequestException as exc:
-        return f"Error: failed to fetch {url} — {exc}"
-
-    text = trafilatura.extract(resp.text, include_tables=True, include_links=True)
-    if not text:
-        return f"Error: could not extract readable content from {url}"
-
-    char_budget = max_tokens * 4
-    if len(text) > char_budget:
-        text = text[:char_budget] + f"\n\n[…truncated to ~{max_tokens} tokens]"
-
-    return text
-
-
-def _register_web_fetch_tool(toolkit: Toolkit) -> None:
-    """Register the web_fetch tool for full-page content extraction."""
-    try:
-        toolkit.register(web_fetch, name="web_fetch")
-    except Exception as exc:
-        logger.warning("Tool execution failed (web_fetch registration): %s", exc)
-
-
 def _register_core_tools(toolkit: Toolkit, base_path: Path) -> None:
    """Register core execution and file tools."""
    # Python execution
@@ -735,7 +672,6 @@ def create_full_toolkit(base_dir: str | Path | None = None):
    base_path = Path(base_dir) if base_dir else Path(settings.repo_root)

    _register_core_tools(toolkit, base_path)
-    _register_web_fetch_tool(toolkit)
    _register_grok_tool(toolkit)
    _register_memory_tools(toolkit)
    _register_agentic_loop_tool(toolkit)
@@ -893,11 +829,6 @@ def _analysis_tool_catalog() -> dict:
            "description": "Evaluate mathematical expressions with exact results",
            "available_in": ["orchestrator"],
        },
-        "web_fetch": {
-            "name": "Web Fetch",
-            "description": "Fetch a web page and extract clean readable text (trafilatura)",
-            "available_in": ["orchestrator"],
-        },
    }


--- a/tests/infrastructure/test_db_pool.py
+++ b/tests/infrastructure/test_db_pool.py
@@ -242,145 +242,6 @@ class TestCloseAll:
            conn.execute("SELECT 1")


-class TestConnectionLeaks:
-    """Test that connections do not leak."""
-
-    def test_get_connection_after_close_returns_fresh_connection(self, tmp_path):
-        """After close, get_connection() returns a new working connection."""
-        pool = ConnectionPool(tmp_path / "test.db")
-        conn1 = pool.get_connection()
-        pool.close_connection()
-
-        conn2 = pool.get_connection()
-        assert conn2 is not conn1
-        # New connection must be usable
-        cursor = conn2.execute("SELECT 1")
-        assert cursor.fetchone()[0] == 1
-        pool.close_connection()
-
-    def test_context_manager_does_not_leak_connection(self, tmp_path):
-        """After context manager exit, thread-local conn is cleared."""
-        pool = ConnectionPool(tmp_path / "test.db")
-        with pool.connection():
-            pass
-        # Thread-local should be cleaned up
-        assert pool._local.conn is None
-
-    def test_context_manager_exception_does_not_leak_connection(self, tmp_path):
-        """Connection is cleaned up even when an exception occurs."""
-        pool = ConnectionPool(tmp_path / "test.db")
-        try:
-            with pool.connection():
-                raise RuntimeError("boom")
-        except RuntimeError:
-            pass
-        assert pool._local.conn is None
-
-    def test_threads_do_not_leak_into_each_other(self, tmp_path):
-        """A connection opened in one thread is invisible to another."""
-        pool = ConnectionPool(tmp_path / "test.db")
-        # Open a connection on main thread
-        pool.get_connection()
-
-        visible_from_other_thread = []
-
-        def check():
-            has_conn = hasattr(pool._local, "conn") and pool._local.conn is not None
-            visible_from_other_thread.append(has_conn)
-
-        t = threading.Thread(target=check)
-        t.start()
-        t.join()
-
-        assert visible_from_other_thread == [False]
-        pool.close_connection()
-
-    def test_repeated_open_close_cycles(self, tmp_path):
-        """Repeated open/close cycles do not accumulate leaked connections."""
-        pool = ConnectionPool(tmp_path / "test.db")
-        for _ in range(50):
-            with pool.connection() as conn:
-                conn.execute("SELECT 1")
-            # After each cycle, connection should be cleaned up
-            assert pool._local.conn is None
-
-
-class TestPragmaApplication:
-    """Test that SQLite pragmas can be applied and persist on pooled connections.
-
-    The codebase uses WAL journal mode and busy_timeout pragmas on connections
-    obtained from the pool. These tests verify that pattern works correctly.
-    """
-
-    def test_wal_journal_mode_persists(self, tmp_path):
-        """WAL journal mode set on a pooled connection persists for its lifetime."""
-        pool = ConnectionPool(tmp_path / "test.db")
-        conn = pool.get_connection()
-        conn.execute("PRAGMA journal_mode=WAL")
-        mode = conn.execute("PRAGMA journal_mode").fetchone()[0]
-        assert mode == "wal"
-
-        # Same connection should retain the pragma
-        same_conn = pool.get_connection()
-        mode2 = same_conn.execute("PRAGMA journal_mode").fetchone()[0]
-        assert mode2 == "wal"
-        pool.close_connection()
-
-    def test_busy_timeout_persists(self, tmp_path):
-        """busy_timeout pragma set on a pooled connection persists."""
-        pool = ConnectionPool(tmp_path / "test.db")
-        conn = pool.get_connection()
-        conn.execute("PRAGMA busy_timeout=5000")
-        timeout = conn.execute("PRAGMA busy_timeout").fetchone()[0]
-        assert timeout == 5000
-        pool.close_connection()
-
-    def test_pragmas_apply_per_connection(self, tmp_path):
-        """Pragmas set on one thread's connection are independent of another's."""
-        pool = ConnectionPool(tmp_path / "test.db")
-        conn_main = pool.get_connection()
-        conn_main.execute("PRAGMA cache_size=9999")
-
-        other_cache = []
-
-        def check_pragma():
-            conn = pool.get_connection()
-            # Don't set cache_size — should get the default, not 9999
-            val = conn.execute("PRAGMA cache_size").fetchone()[0]
-            other_cache.append(val)
-            pool.close_connection()
-
-        t = threading.Thread(target=check_pragma)
-        t.start()
-        t.join()
-
-        # Other thread's connection should NOT have our custom cache_size
-        assert other_cache[0] != 9999
-        pool.close_connection()
-
-    def test_session_pragma_resets_on_new_connection(self, tmp_path):
-        """Session-level pragmas (cache_size) reset on a new connection."""
-        pool = ConnectionPool(tmp_path / "test.db")
-        conn1 = pool.get_connection()
-        conn1.execute("PRAGMA cache_size=9999")
-        assert conn1.execute("PRAGMA cache_size").fetchone()[0] == 9999
-        pool.close_connection()
-
-        conn2 = pool.get_connection()
-        cache = conn2.execute("PRAGMA cache_size").fetchone()[0]
-        # New connection gets default cache_size, not the previous value
-        assert cache != 9999
-        pool.close_connection()
-
-    def test_wal_mode_via_context_manager(self, tmp_path):
-        """WAL mode can be set within a context manager block."""
-        pool = ConnectionPool(tmp_path / "test.db")
-        with pool.connection() as conn:
-            conn.execute("PRAGMA journal_mode=WAL")
-            mode = conn.execute("PRAGMA journal_mode").fetchone()[0]
-            assert mode == "wal"
-
-
 class TestIntegration:
    """Integration tests for real-world usage patterns."""

--- a/tests/loop/test_loop_guard_corrupt_queue.py
+++ b/tests/loop/test_loop_guard_corrupt_queue.py
@@ -1,97 +0,0 @@
-"""Tests for load_queue corrupt JSON handling in loop_guard.py."""
-
-from __future__ import annotations
-
-import json
-from pathlib import Path
-
-import pytest
-import scripts.loop_guard as lg
-
-
-@pytest.fixture(autouse=True)
-def _isolate(tmp_path, monkeypatch):
-    """Redirect loop_guard paths to tmp_path for isolation."""
-    monkeypatch.setattr(lg, "QUEUE_FILE", tmp_path / "queue.json")
-    monkeypatch.setattr(lg, "IDLE_STATE_FILE", tmp_path / "idle_state.json")
-    monkeypatch.setattr(lg, "CYCLE_RESULT_FILE", tmp_path / "cycle_result.json")
-    monkeypatch.setattr(lg, "GITEA_API", "http://test:3000/api/v1")
-    monkeypatch.setattr(lg, "REPO_SLUG", "owner/repo")
-
-
-def test_load_queue_missing_file(tmp_path):
-    """Missing queue file returns empty list."""
-    result = lg.load_queue()
-    assert result == []
-
-
-def test_load_queue_valid_data(tmp_path):
-    """Valid queue.json returns ready items."""
-    data = [
-        {"issue": 1, "title": "Ready issue", "ready": True},
-        {"issue": 2, "title": "Not ready", "ready": False},
-    ]
-    lg.QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    lg.QUEUE_FILE.write_text(json.dumps(data, indent=2))
-
-    result = lg.load_queue()
-    assert len(result) == 1
-    assert result[0]["issue"] == 1
-
-
-def test_load_queue_corrupt_json_logs_warning(tmp_path, capsys):
-    """Corrupt queue.json returns empty list and logs warning."""
-    lg.QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    lg.QUEUE_FILE.write_text("not valid json {{{")
-
-    result = lg.load_queue()
-    assert result == []
-
-    captured = capsys.readouterr()
-    assert "WARNING" in captured.out
-    assert "Corrupt queue.json" in captured.out
-
-
-def test_load_queue_not_a_list(tmp_path):
-    """Queue.json that is not a list returns empty list."""
-    lg.QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    lg.QUEUE_FILE.write_text(json.dumps({"not": "a list"}))
-
-    result = lg.load_queue()
-    assert result == []
-
-
-def test_load_queue_no_ready_items(tmp_path):
-    """Queue with no ready items returns empty list."""
-    data = [
-        {"issue": 1, "title": "Not ready 1", "ready": False},
-        {"issue": 2, "title": "Not ready 2", "ready": False},
-    ]
-    lg.QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    lg.QUEUE_FILE.write_text(json.dumps(data, indent=2))
-
-    result = lg.load_queue()
-    assert result == []
-
-
-def test_load_queue_oserror_logs_warning(tmp_path, monkeypatch, capsys):
-    """OSError when reading queue.json returns empty list and logs warning."""
-    lg.QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    lg.QUEUE_FILE.write_text("[]")
-
-    # Mock Path.read_text to raise OSError
-    original_read_text = Path.read_text
-
-    def mock_read_text(self, *args, **kwargs):
-        if self.name == "queue.json":
-            raise OSError("Permission denied")
-        return original_read_text(self, *args, **kwargs)
-
-    monkeypatch.setattr(Path, "read_text", mock_read_text)
-
-    result = lg.load_queue()
-    assert result == []
-
-    captured = capsys.readouterr()
-    assert "WARNING" in captured.out
-    assert "Cannot read queue.json" in captured.out
--- a/tests/scripts/test_triage_score_validation.py
+++ b/tests/scripts/test_triage_score_validation.py
@@ -1,159 +0,0 @@
-"""Tests for queue.json validation and backup in triage_score.py."""
-
-from __future__ import annotations
-
-import json
-
-import pytest
-import scripts.triage_score as ts
-
-
-@pytest.fixture(autouse=True)
-def _isolate(tmp_path, monkeypatch):
-    """Redirect triage_score paths to tmp_path for isolation."""
-    monkeypatch.setattr(ts, "QUEUE_FILE", tmp_path / "queue.json")
-    monkeypatch.setattr(ts, "QUEUE_BACKUP_FILE", tmp_path / "queue.json.bak")
-    monkeypatch.setattr(ts, "RETRO_FILE", tmp_path / "retro" / "triage.jsonl")
-    monkeypatch.setattr(ts, "QUARANTINE_FILE", tmp_path / "quarantine.json")
-    monkeypatch.setattr(ts, "CYCLE_RETRO_FILE", tmp_path / "retro" / "cycles.jsonl")
-
-
-def test_backup_created_on_write(tmp_path):
-    """When writing queue.json, a backup should be created from previous valid file."""
-    # Create initial valid queue file
-    initial_data = [{"issue": 1, "title": "Test", "ready": True}]
-    ts.QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    ts.QUEUE_FILE.write_text(json.dumps(initial_data))
-
-    # Write new data
-    new_data = [{"issue": 2, "title": "New", "ready": True}]
-    ts.QUEUE_FILE.write_text(json.dumps(new_data, indent=2) + "\n")
-
-    # Manually run the backup logic as run_triage would
-    if ts.QUEUE_FILE.exists():
-        try:
-            json.loads(ts.QUEUE_FILE.read_text())
-            ts.QUEUE_BACKUP_FILE.write_text(ts.QUEUE_FILE.read_text())
-        except (json.JSONDecodeError, OSError):
-            pass
-
-    # Both files should exist with same content
-    assert ts.QUEUE_BACKUP_FILE.exists()
-    assert json.loads(ts.QUEUE_BACKUP_FILE.read_text()) == new_data
-
-
-def test_corrupt_queue_restored_from_backup(tmp_path, capsys):
-    """If queue.json is corrupt, it should be restored from backup."""
-    # Create a valid backup
-    valid_data = [{"issue": 1, "title": "Backup", "ready": True}]
-    ts.QUEUE_BACKUP_FILE.parent.mkdir(parents=True, exist_ok=True)
-    ts.QUEUE_BACKUP_FILE.write_text(json.dumps(valid_data, indent=2) + "\n")
-
-    # Create a corrupt queue file
-    ts.QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    ts.QUEUE_FILE.write_text("not valid json {{{")
-
-    # Run validation and restore logic
-    try:
-        json.loads(ts.QUEUE_FILE.read_text())
-    except (json.JSONDecodeError, OSError):
-        if ts.QUEUE_BACKUP_FILE.exists():
-            try:
-                backup_data = ts.QUEUE_BACKUP_FILE.read_text()
-                json.loads(backup_data)  # Validate backup
-                ts.QUEUE_FILE.write_text(backup_data)
-                print("[triage] Restored queue.json from backup")
-            except (json.JSONDecodeError, OSError):
-                ts.QUEUE_FILE.write_text("[]\n")
-        else:
-            ts.QUEUE_FILE.write_text("[]\n")
-
-    # Queue should be restored from backup
-    assert json.loads(ts.QUEUE_FILE.read_text()) == valid_data
-    captured = capsys.readouterr()
-    assert "Restored queue.json from backup" in captured.out
-
-
-def test_corrupt_queue_no_backup_writes_empty_list(tmp_path):
-    """If queue.json is corrupt and no backup exists, write empty list."""
-    # Ensure no backup exists
-    assert not ts.QUEUE_BACKUP_FILE.exists()
-
-    # Create a corrupt queue file
-    ts.QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    ts.QUEUE_FILE.write_text("not valid json {{{")
-
-    # Run validation and restore logic
-    try:
-        json.loads(ts.QUEUE_FILE.read_text())
-    except (json.JSONDecodeError, OSError):
-        if ts.QUEUE_BACKUP_FILE.exists():
-            try:
-                backup_data = ts.QUEUE_BACKUP_FILE.read_text()
-                json.loads(backup_data)
-                ts.QUEUE_FILE.write_text(backup_data)
-            except (json.JSONDecodeError, OSError):
-                ts.QUEUE_FILE.write_text("[]\n")
-        else:
-            ts.QUEUE_FILE.write_text("[]\n")
-
-    # Should have empty list
-    assert json.loads(ts.QUEUE_FILE.read_text()) == []
-
-
-def test_corrupt_backup_writes_empty_list(tmp_path):
-    """If both queue.json and backup are corrupt, write empty list."""
-    # Create a corrupt backup
-    ts.QUEUE_BACKUP_FILE.parent.mkdir(parents=True, exist_ok=True)
-    ts.QUEUE_BACKUP_FILE.write_text("also corrupt backup")
-
-    # Create a corrupt queue file
-    ts.QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    ts.QUEUE_FILE.write_text("not valid json {{{")
-
-    # Run validation and restore logic
-    try:
-        json.loads(ts.QUEUE_FILE.read_text())
-    except (json.JSONDecodeError, OSError):
-        if ts.QUEUE_BACKUP_FILE.exists():
-            try:
-                backup_data = ts.QUEUE_BACKUP_FILE.read_text()
-                json.loads(backup_data)
-                ts.QUEUE_FILE.write_text(backup_data)
-            except (json.JSONDecodeError, OSError):
-                ts.QUEUE_FILE.write_text("[]\n")
-        else:
-            ts.QUEUE_FILE.write_text("[]\n")
-
-    # Should have empty list
-    assert json.loads(ts.QUEUE_FILE.read_text()) == []
-
-
-def test_valid_queue_not_corrupt_no_backup_overwrite(tmp_path):
-    """Don't overwrite backup if current queue.json is corrupt."""
-    # Create a valid backup
-    valid_backup = [{"issue": 99, "title": "Old Backup", "ready": True}]
-    ts.QUEUE_BACKUP_FILE.parent.mkdir(parents=True, exist_ok=True)
-    ts.QUEUE_BACKUP_FILE.write_text(json.dumps(valid_backup, indent=2) + "\n")
-
-    # Create a corrupt queue file
-    ts.QUEUE_FILE.parent.mkdir(parents=True, exist_ok=True)
-    ts.QUEUE_FILE.write_text("corrupt data")
-
-    # Try to save backup (should skip because current is corrupt)
-    if ts.QUEUE_FILE.exists():
-        try:
-            json.loads(ts.QUEUE_FILE.read_text())  # This will fail
-            ts.QUEUE_BACKUP_FILE.write_text(ts.QUEUE_FILE.read_text())
-        except (json.JSONDecodeError, OSError):
-            pass  # Should hit this branch
-
-    # Backup should still have original valid data
-    assert json.loads(ts.QUEUE_BACKUP_FILE.read_text()) == valid_backup
-
-
-def test_backup_path_configuration():
-    """Ensure backup file path is properly configured relative to queue file."""
-    assert ts.QUEUE_BACKUP_FILE.parent == ts.QUEUE_FILE.parent
-    assert ts.QUEUE_BACKUP_FILE.name == "queue.json.bak"
-    assert ts.QUEUE_FILE.name == "queue.json"
--- a/tests/timmy/test_tools_web_fetch.py
+++ b/tests/timmy/test_tools_web_fetch.py
@@ -1,158 +0,0 @@
-"""Unit tests for the web_fetch tool in timmy.tools."""
-
-from __future__ import annotations
-
-from unittest.mock import MagicMock, patch
-
-from timmy.tools import web_fetch
-
-
-class TestWebFetch:
-    """Tests for web_fetch function."""
-
-    def test_invalid_url_no_scheme(self):
-        """URLs without http(s) scheme are rejected."""
-        result = web_fetch("example.com")
-        assert "Error: invalid URL" in result
-
-    def test_invalid_url_empty(self):
-        """Empty URL is rejected."""
-        result = web_fetch("")
-        assert "Error: invalid URL" in result
-
-    def test_invalid_url_ftp(self):
-        """Non-HTTP schemes are rejected."""
-        result = web_fetch("ftp://example.com")
-        assert "Error: invalid URL" in result
-
-    @patch("timmy.tools.trafilatura", create=True)
-    @patch("timmy.tools._requests", create=True)
-    def test_successful_fetch(self, mock_requests, mock_trafilatura):
-        """Happy path: fetch + extract returns text."""
-        # We need to patch at import level inside the function
-        mock_resp = MagicMock()
-        mock_resp.text = "<html><body><p>Hello world</p></body></html>"
-
-        with patch.dict(
-            "sys.modules", {"requests": mock_requests, "trafilatura": mock_trafilatura}
-        ):
-            mock_requests.get.return_value = mock_resp
-            mock_requests.exceptions = _make_exceptions()
-            mock_trafilatura.extract.return_value = "Hello world"
-
-            result = web_fetch("https://example.com")
-
-        assert result == "Hello world"
-
-    @patch.dict("sys.modules", {"requests": MagicMock(), "trafilatura": MagicMock()})
-    def test_truncation(self):
-        """Long text is truncated to max_tokens * 4 chars."""
-        import sys
-
-        mock_trafilatura = sys.modules["trafilatura"]
-        mock_requests = sys.modules["requests"]
-
-        long_text = "a" * 20000
-        mock_resp = MagicMock()
-        mock_resp.text = "<html><body>" + long_text + "</body></html>"
-        mock_requests.get.return_value = mock_resp
-        mock_requests.exceptions = _make_exceptions()
-        mock_trafilatura.extract.return_value = long_text
-
-        result = web_fetch("https://example.com", max_tokens=100)
-
-        # 100 tokens * 4 chars = 400 chars max
-        assert len(result) < 500
-        assert "[…truncated" in result
-
-    @patch.dict("sys.modules", {"requests": MagicMock(), "trafilatura": MagicMock()})
-    def test_extraction_failure(self):
-        """Returns error when trafilatura can't extract text."""
-        import sys
-
-        mock_trafilatura = sys.modules["trafilatura"]
-        mock_requests = sys.modules["requests"]
-
-        mock_resp = MagicMock()
-        mock_resp.text = "<html></html>"
-        mock_requests.get.return_value = mock_resp
-        mock_requests.exceptions = _make_exceptions()
-        mock_trafilatura.extract.return_value = None
-
-        result = web_fetch("https://example.com")
-        assert "Error: could not extract" in result
-
-    @patch.dict("sys.modules", {"trafilatura": MagicMock()})
-    def test_timeout(self):
-        """Timeout errors are handled gracefully."""
-
-        mock_requests = MagicMock()
-        exc_mod = _make_exceptions()
-        mock_requests.exceptions = exc_mod
-        mock_requests.get.side_effect = exc_mod.Timeout("timed out")
-
-        with patch.dict("sys.modules", {"requests": mock_requests}):
-            result = web_fetch("https://example.com")
-
-        assert "timed out" in result
-
-    @patch.dict("sys.modules", {"trafilatura": MagicMock()})
-    def test_http_error(self):
-        """HTTP errors (404, 500, etc.) are handled gracefully."""
-
-        mock_requests = MagicMock()
-        exc_mod = _make_exceptions()
-        mock_requests.exceptions = exc_mod
-
-        mock_response = MagicMock()
-        mock_response.status_code = 404
-        mock_requests.get.return_value.raise_for_status.side_effect = exc_mod.HTTPError(
-            response=mock_response
-        )
-
-        with patch.dict("sys.modules", {"requests": mock_requests}):
-            result = web_fetch("https://example.com/nope")
-
-        assert "404" in result
-
-    def test_missing_requests(self):
-        """Graceful error when requests not installed."""
-        with patch.dict("sys.modules", {"requests": None}):
-            result = web_fetch("https://example.com")
-        assert "requests" in result and "not installed" in result
-
-    def test_missing_trafilatura(self):
-        """Graceful error when trafilatura not installed."""
-        mock_requests = MagicMock()
-        with patch.dict("sys.modules", {"requests": mock_requests, "trafilatura": None}):
-            result = web_fetch("https://example.com")
-        assert "trafilatura" in result and "not installed" in result
-
-    def test_catalog_entry_exists(self):
-        """web_fetch should appear in the tool catalog."""
-        from timmy.tools import get_all_available_tools
-
-        catalog = get_all_available_tools()
-        assert "web_fetch" in catalog
-        assert "orchestrator" in catalog["web_fetch"]["available_in"]
-
-
-def _make_exceptions():
-    """Create a mock exceptions module with real exception classes."""
-
-    class Timeout(Exception):
-        pass
-
-    class HTTPError(Exception):
-        def __init__(self, *args, response=None, **kwargs):
-            super().__init__(*args, **kwargs)
-            self.response = response
-
-    class RequestException(Exception):
-        pass
-
-    mod = MagicMock()
-    mod.Timeout = Timeout
-    mod.HTTPError = HTTPError
-    mod.RequestException = RequestException
-    return mod