src/spark/eidos.py

"""EIDOS cognitive loop — prediction, evaluation, and learning.

Implements the core Spark learning cycle:
1. PREDICT — Before a task is assigned, predict the outcome
2. OBSERVE — Watch what actually happens
3. EVALUATE — Compare prediction vs reality
4. LEARN — Update internal models based on accuracy

All predictions and evaluations are stored in SQLite for
transparency and audit.  The loop runs passively, recording
predictions when tasks are posted and evaluating them when
tasks complete.
"""

import json
import logging
import sqlite3
import uuid
from collections.abc import Generator
from contextlib import closing, contextmanager
from dataclasses import dataclass
from datetime import UTC, datetime
from pathlib import Path

logger = logging.getLogger(__name__)

DB_PATH = Path("data/spark.db")


@dataclass
class Prediction:
    """A prediction made by the EIDOS loop.

    Field names match the columns of the ``spark_predictions`` table, and
    ``get_predictions`` builds instances directly from query rows.  The
    ``actual_value``, ``accuracy`` and ``evaluated_at`` fields stay ``None``
    until ``evaluate_prediction`` has scored the row.
    """

    id: str  # primary key; predict_task_outcome stores a uuid4 string here
    task_id: str  # task the prediction was recorded for
    prediction_type: str  # outcome, best_agent, bid_range
    predicted_value: str  # JSON-encoded prediction
    actual_value: str | None  # JSON-encoded actual (filled on evaluation)
    accuracy: float | None  # 0.0–1.0 (filled on evaluation)
    created_at: str  # ISO-format UTC timestamp written when the row is inserted
    evaluated_at: str | None  # ISO-format UTC timestamp of evaluation; None while pending


@contextmanager
def _get_conn() -> Generator[sqlite3.Connection, None, None]:
    """Yield a SQLite connection to ``DB_PATH`` with the schema in place.

    Every call creates the parent directory if needed, opens a new
    connection, selects ``sqlite3.Row`` as the row factory, applies the WAL
    journal mode and busy-timeout pragmas, and makes sure the
    ``spark_predictions`` table and its two indexes exist.

    The connection is closed when the ``with`` block exits, whether it exits
    normally or through an exception.  Nothing is committed on exit, so
    callers must call ``commit()`` themselves after writing.
    """
    create_table_sql = """
            CREATE TABLE IF NOT EXISTS spark_predictions (
                id               TEXT PRIMARY KEY,
                task_id          TEXT NOT NULL,
                prediction_type  TEXT NOT NULL,
                predicted_value  TEXT NOT NULL,
                actual_value     TEXT,
                accuracy         REAL,
                created_at       TEXT NOT NULL,
                evaluated_at     TEXT
            )
            """
    # Executed in order on every new connection; all statements are idempotent.
    setup_statements = (
        "PRAGMA journal_mode=WAL",
        "PRAGMA busy_timeout=5000",
        create_table_sql,
        "CREATE INDEX IF NOT EXISTS idx_pred_task ON spark_predictions(task_id)",
        "CREATE INDEX IF NOT EXISTS idx_pred_type ON spark_predictions(prediction_type)",
    )

    DB_PATH.parent.mkdir(parents=True, exist_ok=True)
    db = sqlite3.connect(str(DB_PATH))
    try:
        db.row_factory = sqlite3.Row
        for statement in setup_statements:
            db.execute(statement)
        db.commit()
        yield db
    finally:
        # Always release the handle, even if setup or the caller's block raised.
        db.close()


# ── Prediction phase ────────────────────────────────────────────────────────


def predict_task_outcome(
    task_id: str,
    task_description: str,
    candidate_agents: list[str],
    agent_history: dict | None = None,
) -> dict:
    """Forecast a task's outcome and record the forecast in SQLite.

    Without history the forecast is a fixed baseline: the first candidate
    (or None), a 0.7 success probability and a 20–80 bid range.  When
    ``agent_history`` (agent id -> metrics dict) is given:

    - the candidate with the highest positive ``success_rate`` becomes the
      likely winner, and the success probability is set to
      ``min(1.0, 0.5 + rate * 0.4)`` rounded to two decimals
    - the bid range is rebuilt from every positive ``avg_winning_bid`` in
      the history (candidates or not): 80% of the smallest, floored at 1,
      up to 120% of the largest, both truncated to int

    ``task_description`` is accepted but not read by this function.

    The forecast is inserted into ``spark_predictions`` as an ``outcome``
    row before returning.

    Returns a prediction dict with:
    - likely_winner: agent_id most likely to win the auction
    - success_probability: 0.0–1.0 chance the task succeeds
    - estimated_bid_range: [low, high] sats range
    - reasoning: short human-readable explanation
    - prediction_id: id of the stored row (not part of the stored JSON)
    """
    # Baseline used whenever history is missing or has nothing usable.
    forecast = {
        "likely_winner": None if not candidate_agents else candidate_agents[0],
        "success_probability": 0.7,
        "estimated_bid_range": [20, 80],
        "reasoning": "baseline prediction (no history)",
    }

    if agent_history:
        # Pick the candidate with the strictly highest success rate above zero;
        # on ties the agent seen first in the history wins.
        top_agent, top_rate = None, 0.0
        for agent_id, stats in agent_history.items():
            if agent_id in candidate_agents:
                agent_rate = stats.get("success_rate", 0.0)
                if agent_rate > top_rate:
                    top_agent, top_rate = agent_id, agent_rate

        if top_agent:
            forecast["likely_winner"] = top_agent
            forecast["success_probability"] = round(min(1.0, 0.5 + top_rate * 0.4), 2)
            forecast["reasoning"] = f"agent {top_agent[:8]} has {top_rate:.0%} success rate"

        # Widen the observed winning-bid spread by 20% on each side.
        winning_bids = [
            bid
            for stats in agent_history.values()
            if (bid := stats.get("avg_winning_bid", 0)) > 0
        ]
        if winning_bids:
            lowest, highest = min(winning_bids), max(winning_bids)
            forecast["estimated_bid_range"] = [max(1, int(lowest * 0.8)), int(highest * 1.2)]

    # Persist the forecast so evaluate_prediction can score it later.
    prediction_id = str(uuid.uuid4())
    created_at = datetime.now(UTC).isoformat()
    with _get_conn() as conn:
        conn.execute(
            """
            INSERT INTO spark_predictions
                (id, task_id, prediction_type, predicted_value, created_at)
            VALUES (?, ?, ?, ?, ?)
            """,
            (prediction_id, task_id, "outcome", json.dumps(forecast), created_at),
        )
        conn.commit()

    # Added after serialisation, so the stored JSON does not carry the id.
    forecast["prediction_id"] = prediction_id
    return forecast


# ── Evaluation phase ────────────────────────────────────────────────────────


def evaluate_prediction(
    task_id: str,
    actual_winner: str | None,
    task_succeeded: bool,
    winning_bid: int | None = None,
) -> dict | None:
    """Score the pending outcome prediction for a task against reality.

    Looks up the most recently created ``outcome`` prediction for
    ``task_id`` that has not been evaluated yet, computes its accuracy with
    ``_compute_accuracy``, and writes the actual values, the accuracy and
    the evaluation timestamp back to the same row.

    Returns a dict with:
    - prediction_id: id of the evaluated row
    - predicted: the decoded stored prediction
    - actual: {"winner", "succeeded", "winning_bid"} as passed in
    - accuracy: score from 0.0–1.0

    Returns None if no unevaluated outcome prediction exists for the task.
    """
    with _get_conn() as conn:
        pending = conn.execute(
            """
            SELECT * FROM spark_predictions
            WHERE task_id = ? AND prediction_type = 'outcome' AND evaluated_at IS NULL
            ORDER BY created_at DESC LIMIT 1
            """,
            (task_id,),
        ).fetchone()

        # Nothing to score: either never predicted or already evaluated.
        if not pending:
            return None

        prediction_id = pending["id"]
        forecast = json.loads(pending["predicted_value"])
        outcome = {
            "winner": actual_winner,
            "succeeded": task_succeeded,
            "winning_bid": winning_bid,
        }

        score = _compute_accuracy(forecast, outcome)
        evaluated_at = datetime.now(UTC).isoformat()

        conn.execute(
            """
            UPDATE spark_predictions
            SET actual_value = ?, accuracy = ?, evaluated_at = ?
            WHERE id = ?
            """,
            (json.dumps(outcome), score, evaluated_at, prediction_id),
        )
        conn.commit()

    return {
        "prediction_id": prediction_id,
        "predicted": forecast,
        "actual": outcome,
        "accuracy": score,
    }


def _compute_accuracy(predicted: dict, actual: dict) -> float:
    """Score a prediction against the actual outcome, rounded to two decimals.

    The score is a weighted average of up to three components.  A component
    that cannot be judged is dropped and the rest are re-normalised:

    - Winner (weight 0.4): 1.0 if the predicted winner matches, else 0.0.
      Skipped when either winner is missing or empty.
    - Success (weight 0.4): 1.0 minus the gap between the predicted
      probability (default 0.5) and the actual result (1.0 or 0.0).
      Always included.
    - Bid range (weight 0.2): 1.0 if the winning bid lies inside the
      predicted range (default [20, 80]); otherwise partial credit that
      falls off linearly with the distance to the nearest bound, reaching
      0 at one range-width away.  Skipped when no winning bid is known or
      the range does not have exactly two entries.
    """
    # (weight, credit) pairs, kept in evaluation order so the float
    # accumulation below is deterministic.
    components = []

    guessed_winner = predicted.get("likely_winner")
    real_winner = actual.get("winner")
    if guessed_winner and real_winner:
        components.append((0.4, 1.0 if guessed_winner == real_winner else 0.0))

    guessed_probability = predicted.get("success_probability", 0.5)
    real_result = 1.0 if actual.get("succeeded") else 0.0
    probability_gap = abs(guessed_probability - real_result)
    components.append((0.4, 1.0 - probability_gap))

    span = predicted.get("estimated_bid_range", [20, 80])
    paid = actual.get("winning_bid")
    if paid is not None and len(span) == 2:
        floor, ceiling = span
        if floor <= paid <= ceiling:
            bid_credit = 1.0
        else:
            # Partial credit: distance to the nearest bound, in range-widths.
            gap = min(abs(paid - floor), abs(paid - ceiling))
            width = max(1, ceiling - floor)
            bid_credit = max(0, 1.0 - gap / width)
        components.append((0.2, bid_credit))

    weighted_total = 0.0
    weight_total = 0.0
    for weight, credit in components:
        weighted_total += weight * credit
        weight_total += weight

    return round(weighted_total / max(weight_total, 0.01), 2)


# ── Query helpers ──────────────────────────────────────────────────────────


def get_predictions(
    task_id: str | None = None,
    evaluated_only: bool = False,
    limit: int = 50,
) -> list[Prediction]:
    """Return stored predictions, newest first.

    - task_id: when non-empty, only predictions for that task are returned
    - evaluated_only: when true, rows without an evaluation are left out
    - limit: maximum number of rows to return
    """
    # Filters are appended as fragments; all values go through bind parameters.
    sql_parts = ["SELECT * FROM spark_predictions WHERE 1=1"]
    bind_values: list = []

    if task_id:
        sql_parts.append(" AND task_id = ?")
        bind_values.append(task_id)
    if evaluated_only:
        sql_parts.append(" AND evaluated_at IS NOT NULL")

    sql_parts.append(" ORDER BY created_at DESC LIMIT ?")
    bind_values.append(limit)

    with _get_conn() as conn:
        fetched = conn.execute("".join(sql_parts), bind_values).fetchall()

    # Column names double as the Prediction field names.
    columns = (
        "id",
        "task_id",
        "prediction_type",
        "predicted_value",
        "actual_value",
        "accuracy",
        "created_at",
        "evaluated_at",
    )
    return [Prediction(**{name: record[name] for name in columns}) for record in fetched]


def get_accuracy_stats() -> dict:
    """Summarise prediction counts and accuracy across all stored rows.

    Returns a dict with:
    - total_predictions: number of rows in ``spark_predictions``
    - evaluated: rows that have an evaluation timestamp
    - pending: total_predictions minus evaluated
    - avg_accuracy / min_accuracy / max_accuracy: aggregates over rows with
      an accuracy, rounded to two decimals; 0.0 when there are none
    """
    with _get_conn() as conn:
        summary = conn.execute("""
            SELECT
                COUNT(*)                          AS total_predictions,
                COUNT(evaluated_at)               AS evaluated,
                AVG(CASE WHEN accuracy IS NOT NULL THEN accuracy END) AS avg_accuracy,
                MIN(CASE WHEN accuracy IS NOT NULL THEN accuracy END) AS min_accuracy,
                MAX(CASE WHEN accuracy IS NOT NULL THEN accuracy END) AS max_accuracy
            FROM spark_predictions
            """).fetchone()

    total = summary["total_predictions"] or 0
    evaluated = summary["evaluated"] or 0
    stats = {
        "total_predictions": total,
        "evaluated": evaluated,
        "pending": total - evaluated,
    }
    # The aggregates are NULL when no row has been scored; report those as 0.0.
    for column in ("avg_accuracy", "min_accuracy", "max_accuracy"):
        stats[column] = round(summary[column] or 0.0, 2)
    return stats
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								"""EIDOS cognitive loop — prediction, evaluation, and learning.
 								Implements the core Spark learning cycle:
 . PREDICT — Before a task is assigned, predict the outcome
 . OBSERVE — Watch what actually happens
 . EVALUATE — Compare prediction vs reality
 . LEARN — Update internal models based on accuracy
 								All predictions and evaluations are stored in SQLite for
 								transparency and audit.  The loop runs passively, recording
 								predictions when tasks are posted and evaluating them when
 								tasks complete.
 								"""
 								import json
 								import logging
 								import sqlite3
 								import uuid
-												[loop-cycle-50] refactor: replace bare sqlite3.connect() with context managers batch 2 (#157) (#180)

											
										
										
											2026-03-15 11:58:43 -04:00
+								from collections.abc import Generator
 								from contextlib import closing, contextmanager
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								from dataclasses import dataclass
-												ruff (#169)

* polish: streamline nav, extract inline styles, improve tablet UX

- Restructure desktop nav from 8+ flat links + overflow dropdown into
  5 grouped dropdowns (Core, Agents, Intel, System, More) matching
  the mobile menu structure to reduce decision fatigue
- Extract all inline styles from mission_control.html and base.html
  notification elements into mission-control.css with semantic classes
- Replace JS-built innerHTML with secure DOM construction in
  notification loader and chat history
- Add CONNECTING state to connection indicator (amber) instead of
  showing OFFLINE before WebSocket connects
- Add tablet breakpoint (1024px) with larger touch targets for
  Apple Pencil / stylus use and safe-area padding for iPad toolbar
- Add active-link highlighting in desktop dropdown menus
- Rename "Mission Control" page title to "System Overview" to
  disambiguate from the chat home page
- Add "Home — Timmy Time" page title to index.html

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* fix(security): move auth-gate credentials to environment variables

Hardcoded username, password, and HMAC secret in auth-gate.py replaced
with os.environ lookups. Startup now refuses to run if any variable is
unset. Added AUTH_GATE_SECRET/USER/PASS to .env.example.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* refactor(tooling): migrate from black+isort+bandit to ruff

Replace three separate linting/formatting tools with a single ruff
invocation. Updates tox.ini (lint, format, pre-push, pre-commit envs),
.pre-commit-config.yaml, and CI workflow. Fixes all ruff errors
including unused imports, missing raise-from, and undefined names.
Ruff config maps existing bandit skips to equivalent S-rules.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

---------

Co-authored-by: Claude <noreply@anthropic.com>
											
										
										
											2026-03-11 12:23:35 -04:00
+								from datetime import UTC, datetime
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								from pathlib import Path
 								logger = logging.getLogger(__name__)
 								DB_PATH = Path("data/spark.db")
 								@dataclass
 								class Prediction:
 								    """A prediction made by the EIDOS loop."""
-												feat: code quality audit + autoresearch integration + infra hardening (#150)
											
										
										
											2026-03-08 12:50:44 -04:00
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								    id: str
 								    task_id: str
-												feat: code quality audit + autoresearch integration + infra hardening (#150)
											
										
										
											2026-03-08 12:50:44 -04:00
+								    prediction_type: str  # outcome, best_agent, bid_range
 								    predicted_value: str  # JSON-encoded prediction
-												ruff (#169)

* polish: streamline nav, extract inline styles, improve tablet UX

- Restructure desktop nav from 8+ flat links + overflow dropdown into
  5 grouped dropdowns (Core, Agents, Intel, System, More) matching
  the mobile menu structure to reduce decision fatigue
- Extract all inline styles from mission_control.html and base.html
  notification elements into mission-control.css with semantic classes
- Replace JS-built innerHTML with secure DOM construction in
  notification loader and chat history
- Add CONNECTING state to connection indicator (amber) instead of
  showing OFFLINE before WebSocket connects
- Add tablet breakpoint (1024px) with larger touch targets for
  Apple Pencil / stylus use and safe-area padding for iPad toolbar
- Add active-link highlighting in desktop dropdown menus
- Rename "Mission Control" page title to "System Overview" to
  disambiguate from the chat home page
- Add "Home — Timmy Time" page title to index.html

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* fix(security): move auth-gate credentials to environment variables

Hardcoded username, password, and HMAC secret in auth-gate.py replaced
with os.environ lookups. Startup now refuses to run if any variable is
unset. Added AUTH_GATE_SECRET/USER/PASS to .env.example.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* refactor(tooling): migrate from black+isort+bandit to ruff

Replace three separate linting/formatting tools with a single ruff
invocation. Updates tox.ini (lint, format, pre-push, pre-commit envs),
.pre-commit-config.yaml, and CI workflow. Fixes all ruff errors
including unused imports, missing raise-from, and undefined names.
Ruff config maps existing bandit skips to equivalent S-rules.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

---------

Co-authored-by: Claude <noreply@anthropic.com>
											
										
										
											2026-03-11 12:23:35 -04:00
+								    actual_value: str | None  # JSON-encoded actual (filled on evaluation)
 								    accuracy: float | None  # 0.0–1.0 (filled on evaluation)
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								    created_at: str
-												ruff (#169)

* polish: streamline nav, extract inline styles, improve tablet UX

- Restructure desktop nav from 8+ flat links + overflow dropdown into
  5 grouped dropdowns (Core, Agents, Intel, System, More) matching
  the mobile menu structure to reduce decision fatigue
- Extract all inline styles from mission_control.html and base.html
  notification elements into mission-control.css with semantic classes
- Replace JS-built innerHTML with secure DOM construction in
  notification loader and chat history
- Add CONNECTING state to connection indicator (amber) instead of
  showing OFFLINE before WebSocket connects
- Add tablet breakpoint (1024px) with larger touch targets for
  Apple Pencil / stylus use and safe-area padding for iPad toolbar
- Add active-link highlighting in desktop dropdown menus
- Rename "Mission Control" page title to "System Overview" to
  disambiguate from the chat home page
- Add "Home — Timmy Time" page title to index.html

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* fix(security): move auth-gate credentials to environment variables

Hardcoded username, password, and HMAC secret in auth-gate.py replaced
with os.environ lookups. Startup now refuses to run if any variable is
unset. Added AUTH_GATE_SECRET/USER/PASS to .env.example.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* refactor(tooling): migrate from black+isort+bandit to ruff

Replace three separate linting/formatting tools with a single ruff
invocation. Updates tox.ini (lint, format, pre-push, pre-commit envs),
.pre-commit-config.yaml, and CI workflow. Fixes all ruff errors
including unused imports, missing raise-from, and undefined names.
Ruff config maps existing bandit skips to equivalent S-rules.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

---------

Co-authored-by: Claude <noreply@anthropic.com>
											
										
										
											2026-03-11 12:23:35 -04:00
+								    evaluated_at: str | None
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
-												[loop-cycle-50] refactor: replace bare sqlite3.connect() with context managers batch 2 (#157) (#180)

											
										
										
											2026-03-15 11:58:43 -04:00
+								@contextmanager
 								def _get_conn() -> Generator[sqlite3.Connection, None, None]:
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								    DB_PATH.parent.mkdir(parents=True, exist_ok=True)
-												[loop-cycle-50] refactor: replace bare sqlite3.connect() with context managers batch 2 (#157) (#180)

											
										
										
											2026-03-15 11:58:43 -04:00
+								    with closing(sqlite3.connect(str(DB_PATH))) as conn:
 								        conn.row_factory = sqlite3.Row
 								        conn.execute("PRAGMA journal_mode=WAL")
 								        conn.execute("PRAGMA busy_timeout=5000")
 								        conn.execute("""
 								            CREATE TABLE IF NOT EXISTS spark_predictions (
 								                id               TEXT PRIMARY KEY,
 								                task_id          TEXT NOT NULL,
 								                prediction_type  TEXT NOT NULL,
 								                predicted_value  TEXT NOT NULL,
 								                actual_value     TEXT,
 								                accuracy         REAL,
 								                created_at       TEXT NOT NULL,
 								                evaluated_at     TEXT
 								            )
 								            """)
 								        conn.execute("CREATE INDEX IF NOT EXISTS idx_pred_task ON spark_predictions(task_id)")
 								        conn.execute(
 								            "CREATE INDEX IF NOT EXISTS idx_pred_type ON spark_predictions(prediction_type)"
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								        )
-												[loop-cycle-50] refactor: replace bare sqlite3.connect() with context managers batch 2 (#157) (#180)

											
										
										
											2026-03-15 11:58:43 -04:00
+								        conn.commit()
 								        yield conn
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
 								# ── Prediction phase ────────────────────────────────────────────────────────
-												feat: code quality audit + autoresearch integration + infra hardening (#150)
											
										
										
											2026-03-08 12:50:44 -04:00
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								def predict_task_outcome(
 								    task_id: str,
 								    task_description: str,
 								    candidate_agents: list[str],
-												ruff (#169)

* polish: streamline nav, extract inline styles, improve tablet UX

- Restructure desktop nav from 8+ flat links + overflow dropdown into
  5 grouped dropdowns (Core, Agents, Intel, System, More) matching
  the mobile menu structure to reduce decision fatigue
- Extract all inline styles from mission_control.html and base.html
  notification elements into mission-control.css with semantic classes
- Replace JS-built innerHTML with secure DOM construction in
  notification loader and chat history
- Add CONNECTING state to connection indicator (amber) instead of
  showing OFFLINE before WebSocket connects
- Add tablet breakpoint (1024px) with larger touch targets for
  Apple Pencil / stylus use and safe-area padding for iPad toolbar
- Add active-link highlighting in desktop dropdown menus
- Rename "Mission Control" page title to "System Overview" to
  disambiguate from the chat home page
- Add "Home — Timmy Time" page title to index.html

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* fix(security): move auth-gate credentials to environment variables

Hardcoded username, password, and HMAC secret in auth-gate.py replaced
with os.environ lookups. Startup now refuses to run if any variable is
unset. Added AUTH_GATE_SECRET/USER/PASS to .env.example.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* refactor(tooling): migrate from black+isort+bandit to ruff

Replace three separate linting/formatting tools with a single ruff
invocation. Updates tox.ini (lint, format, pre-push, pre-commit envs),
.pre-commit-config.yaml, and CI workflow. Fixes all ruff errors
including unused imports, missing raise-from, and undefined names.
Ruff config maps existing bandit skips to equivalent S-rules.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

---------

Co-authored-by: Claude <noreply@anthropic.com>
											
										
										
											2026-03-11 12:23:35 -04:00
+								    agent_history: dict | None = None,
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								) -> dict:
 								    """Predict the outcome of a task before it's assigned.
 								    Returns a prediction dict with:
 								    - likely_winner: agent_id most likely to win the auction
 								    - success_probability: 0.0–1.0 chance the task succeeds
 								    - estimated_bid_range: (low, high) sats range
 								    """
 								    # Default prediction when no history exists
 								    prediction = {
 								        "likely_winner": candidate_agents[0] if candidate_agents else None,
 								        "success_probability": 0.7,
 								        "estimated_bid_range": [20, 80],
 								        "reasoning": "baseline prediction (no history)",
 								    }
 								    if agent_history:
 								        # Adjust based on historical success rates
 								        best_agent = None
 								        best_rate = 0.0
 								        for aid, metrics in agent_history.items():
 								            if aid not in candidate_agents:
 								                continue
 								            rate = metrics.get("success_rate", 0.0)
 								            if rate > best_rate:
 								                best_rate = rate
 								                best_agent = aid
 								        if best_agent:
 								            prediction["likely_winner"] = best_agent
-												feat: code quality audit + autoresearch integration + infra hardening (#150)
											
										
										
											2026-03-08 12:50:44 -04:00
+								            prediction["success_probability"] = round(min(1.0, 0.5 + best_rate * 0.4), 2)
 								            prediction["reasoning"] = f"agent {best_agent[:8]} has {best_rate:.0%} success rate"
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
 								        # Adjust bid range from history
 								        all_bids = []
 								        for metrics in agent_history.values():
 								            avg = metrics.get("avg_winning_bid", 0)
 								            if avg > 0:
 								                all_bids.append(avg)
 								        if all_bids:
 								            prediction["estimated_bid_range"] = [
 								                max(1, int(min(all_bids) * 0.8)),
 								                int(max(all_bids) * 1.2),
 								            ]
 								    # Store prediction
 								    pred_id = str(uuid.uuid4())
-												ruff (#169)

* polish: streamline nav, extract inline styles, improve tablet UX

- Restructure desktop nav from 8+ flat links + overflow dropdown into
  5 grouped dropdowns (Core, Agents, Intel, System, More) matching
  the mobile menu structure to reduce decision fatigue
- Extract all inline styles from mission_control.html and base.html
  notification elements into mission-control.css with semantic classes
- Replace JS-built innerHTML with secure DOM construction in
  notification loader and chat history
- Add CONNECTING state to connection indicator (amber) instead of
  showing OFFLINE before WebSocket connects
- Add tablet breakpoint (1024px) with larger touch targets for
  Apple Pencil / stylus use and safe-area padding for iPad toolbar
- Add active-link highlighting in desktop dropdown menus
- Rename "Mission Control" page title to "System Overview" to
  disambiguate from the chat home page
- Add "Home — Timmy Time" page title to index.html

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* fix(security): move auth-gate credentials to environment variables

Hardcoded username, password, and HMAC secret in auth-gate.py replaced
with os.environ lookups. Startup now refuses to run if any variable is
unset. Added AUTH_GATE_SECRET/USER/PASS to .env.example.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* refactor(tooling): migrate from black+isort+bandit to ruff

Replace three separate linting/formatting tools with a single ruff
invocation. Updates tox.ini (lint, format, pre-push, pre-commit envs),
.pre-commit-config.yaml, and CI workflow. Fixes all ruff errors
including unused imports, missing raise-from, and undefined names.
Ruff config maps existing bandit skips to equivalent S-rules.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

---------

Co-authored-by: Claude <noreply@anthropic.com>
											
										
										
											2026-03-11 12:23:35 -04:00
+								    now = datetime.now(UTC).isoformat()
-												[loop-cycle-50] refactor: replace bare sqlite3.connect() with context managers batch 2 (#157) (#180)

											
										
										
											2026-03-15 11:58:43 -04:00
+								    with _get_conn() as conn:
 								        conn.execute(
 								            """
 								            INSERT INTO spark_predictions
 								                (id, task_id, prediction_type, predicted_value, created_at)
 								            VALUES (?, ?, ?, ?, ?)
 								            """,
 								            (pred_id, task_id, "outcome", json.dumps(prediction), now),
 								        )
 								        conn.commit()
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
 								    prediction["prediction_id"] = pred_id
 								    return prediction
 								# ── Evaluation phase ────────────────────────────────────────────────────────
-												feat: code quality audit + autoresearch integration + infra hardening (#150)
											
										
										
											2026-03-08 12:50:44 -04:00
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								def evaluate_prediction(
 								    task_id: str,
-												ruff (#169)

* polish: streamline nav, extract inline styles, improve tablet UX

- Restructure desktop nav from 8+ flat links + overflow dropdown into
  5 grouped dropdowns (Core, Agents, Intel, System, More) matching
  the mobile menu structure to reduce decision fatigue
- Extract all inline styles from mission_control.html and base.html
  notification elements into mission-control.css with semantic classes
- Replace JS-built innerHTML with secure DOM construction in
  notification loader and chat history
- Add CONNECTING state to connection indicator (amber) instead of
  showing OFFLINE before WebSocket connects
- Add tablet breakpoint (1024px) with larger touch targets for
  Apple Pencil / stylus use and safe-area padding for iPad toolbar
- Add active-link highlighting in desktop dropdown menus
- Rename "Mission Control" page title to "System Overview" to
  disambiguate from the chat home page
- Add "Home — Timmy Time" page title to index.html

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* fix(security): move auth-gate credentials to environment variables

Hardcoded username, password, and HMAC secret in auth-gate.py replaced
with os.environ lookups. Startup now refuses to run if any variable is
unset. Added AUTH_GATE_SECRET/USER/PASS to .env.example.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* refactor(tooling): migrate from black+isort+bandit to ruff

Replace three separate linting/formatting tools with a single ruff
invocation. Updates tox.ini (lint, format, pre-push, pre-commit envs),
.pre-commit-config.yaml, and CI workflow. Fixes all ruff errors
including unused imports, missing raise-from, and undefined names.
Ruff config maps existing bandit skips to equivalent S-rules.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

---------

Co-authored-by: Claude <noreply@anthropic.com>
											
										
										
											2026-03-11 12:23:35 -04:00
+								    actual_winner: str | None,
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								    task_succeeded: bool,
-												ruff (#169)

* polish: streamline nav, extract inline styles, improve tablet UX

- Restructure desktop nav from 8+ flat links + overflow dropdown into
  5 grouped dropdowns (Core, Agents, Intel, System, More) matching
  the mobile menu structure to reduce decision fatigue
- Extract all inline styles from mission_control.html and base.html
  notification elements into mission-control.css with semantic classes
- Replace JS-built innerHTML with secure DOM construction in
  notification loader and chat history
- Add CONNECTING state to connection indicator (amber) instead of
  showing OFFLINE before WebSocket connects
- Add tablet breakpoint (1024px) with larger touch targets for
  Apple Pencil / stylus use and safe-area padding for iPad toolbar
- Add active-link highlighting in desktop dropdown menus
- Rename "Mission Control" page title to "System Overview" to
  disambiguate from the chat home page
- Add "Home — Timmy Time" page title to index.html

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* fix(security): move auth-gate credentials to environment variables

Hardcoded username, password, and HMAC secret in auth-gate.py replaced
with os.environ lookups. Startup now refuses to run if any variable is
unset. Added AUTH_GATE_SECRET/USER/PASS to .env.example.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* refactor(tooling): migrate from black+isort+bandit to ruff

Replace three separate linting/formatting tools with a single ruff
invocation. Updates tox.ini (lint, format, pre-push, pre-commit envs),
.pre-commit-config.yaml, and CI workflow. Fixes all ruff errors
including unused imports, missing raise-from, and undefined names.
Ruff config maps existing bandit skips to equivalent S-rules.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

---------

Co-authored-by: Claude <noreply@anthropic.com>
											
										
										
											2026-03-11 12:23:35 -04:00
+								    winning_bid: int | None = None,
 								) -> dict | None:
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								    """Evaluate a stored prediction against actual outcomes.
 								    Returns the evaluation result or None if no prediction exists.
 								    """
-												[loop-cycle-50] refactor: replace bare sqlite3.connect() with context managers batch 2 (#157) (#180)

											
										
										
											2026-03-15 11:58:43 -04:00
+								    with _get_conn() as conn:
 								        row = conn.execute(
 								            """
 								            SELECT * FROM spark_predictions
 								            WHERE task_id = ? AND prediction_type = 'outcome' AND evaluated_at IS NULL
 								            ORDER BY created_at DESC LIMIT 1
 								            """,
 								            (task_id,),
 								        ).fetchone()
 								        if not row:
 								            return None
 								        predicted = json.loads(row["predicted_value"])
 								        actual = {
 								            "winner": actual_winner,
 								            "succeeded": task_succeeded,
 								            "winning_bid": winning_bid,
 								        }
 								        # Calculate accuracy
 								        accuracy = _compute_accuracy(predicted, actual)
 								        now = datetime.now(UTC).isoformat()
 								        conn.execute(
 								            """
 								            UPDATE spark_predictions
 								            SET actual_value = ?, accuracy = ?, evaluated_at = ?
 								            WHERE id = ?
 								            """,
 								            (json.dumps(actual), accuracy, now, row["id"]),
 								        )
 								        conn.commit()
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
 								    return {
 								        "prediction_id": row["id"],
 								        "predicted": predicted,
 								        "actual": actual,
 								        "accuracy": accuracy,
 								    }
 								def _compute_accuracy(predicted: dict, actual: dict) -> float:
 								    """Score prediction accuracy from 0.0–1.0.
 								    Components:
 								    - Winner prediction: 0.4 weight (correct = 1.0, wrong = 0.0)
 								    - Success prediction: 0.4 weight (how close)
 								    - Bid range: 0.2 weight (was actual bid in predicted range)
 								    """
 								    score = 0.0
 								    weights = 0.0
 								    # Winner accuracy
 								    pred_winner = predicted.get("likely_winner")
 								    actual_winner = actual.get("winner")
 								    if pred_winner and actual_winner:
 								        score += 0.4 * (1.0 if pred_winner == actual_winner else 0.0)
 								        weights += 0.4
 								    # Success probability accuracy
 								    pred_success = predicted.get("success_probability", 0.5)
 								    actual_success = 1.0 if actual.get("succeeded") else 0.0
 								    success_error = abs(pred_success - actual_success)
 								    score += 0.4 * (1.0 - success_error)
 								    weights += 0.4
 								    # Bid range accuracy
 								    bid_range = predicted.get("estimated_bid_range", [20, 80])
 								    actual_bid = actual.get("winning_bid")
 								    if actual_bid is not None and len(bid_range) == 2:
 								        low, high = bid_range
 								        if low <= actual_bid <= high:
 								            score += 0.2
 								        else:
 								            # Partial credit: how far outside the range
 								            distance = min(abs(actual_bid - low), abs(actual_bid - high))
 								            range_size = max(1, high - low)
 								            score += 0.2 * max(0, 1.0 - distance / range_size)
 								        weights += 0.2
 								    return round(score / max(weights, 0.01), 2)
 								# ── Query helpers ──────────────────────────────────────────────────────────
-												feat: code quality audit + autoresearch integration + infra hardening (#150)
											
										
										
											2026-03-08 12:50:44 -04:00
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								def get_predictions(
-												ruff (#169)

* polish: streamline nav, extract inline styles, improve tablet UX

- Restructure desktop nav from 8+ flat links + overflow dropdown into
  5 grouped dropdowns (Core, Agents, Intel, System, More) matching
  the mobile menu structure to reduce decision fatigue
- Extract all inline styles from mission_control.html and base.html
  notification elements into mission-control.css with semantic classes
- Replace JS-built innerHTML with secure DOM construction in
  notification loader and chat history
- Add CONNECTING state to connection indicator (amber) instead of
  showing OFFLINE before WebSocket connects
- Add tablet breakpoint (1024px) with larger touch targets for
  Apple Pencil / stylus use and safe-area padding for iPad toolbar
- Add active-link highlighting in desktop dropdown menus
- Rename "Mission Control" page title to "System Overview" to
  disambiguate from the chat home page
- Add "Home — Timmy Time" page title to index.html

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* fix(security): move auth-gate credentials to environment variables

Hardcoded username, password, and HMAC secret in auth-gate.py replaced
with os.environ lookups. Startup now refuses to run if any variable is
unset. Added AUTH_GATE_SECRET/USER/PASS to .env.example.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

* refactor(tooling): migrate from black+isort+bandit to ruff

Replace three separate linting/formatting tools with a single ruff
invocation. Updates tox.ini (lint, format, pre-push, pre-commit envs),
.pre-commit-config.yaml, and CI workflow. Fixes all ruff errors
including unused imports, missing raise-from, and undefined names.
Ruff config maps existing bandit skips to equivalent S-rules.

https://claude.ai/code/session_015uPUoKyYa8M2UAcyk5Gt6h

---------

Co-authored-by: Claude <noreply@anthropic.com>
											
										
										
											2026-03-11 12:23:35 -04:00
+								    task_id: str | None = None,
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								    evaluated_only: bool = False,
 								    limit: int = 50,
 								) -> list[Prediction]:
 								    """Query stored predictions."""
 								    query = "SELECT * FROM spark_predictions WHERE 1=1"
 								    params: list = []
 								    if task_id:
 								        query += " AND task_id = ?"
 								        params.append(task_id)
 								    if evaluated_only:
 								        query += " AND evaluated_at IS NOT NULL"
 								    query += " ORDER BY created_at DESC LIMIT ?"
 								    params.append(limit)
-												[loop-cycle-50] refactor: replace bare sqlite3.connect() with context managers batch 2 (#157) (#180)

											
										
										
											2026-03-15 11:58:43 -04:00
+								    with _get_conn() as conn:
 								        rows = conn.execute(query, params).fetchall()
-												feat: integrate Spark Intelligence into Timmy swarm system

Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.

New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together

Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
  predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header

Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)

Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.

https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c

											
										
										
											2026-02-24 15:51:15 +00:00
+								    return [
 								        Prediction(
 								            id=r["id"],
 								            task_id=r["task_id"],
 								            prediction_type=r["prediction_type"],
 								            predicted_value=r["predicted_value"],
 								            actual_value=r["actual_value"],
 								            accuracy=r["accuracy"],
 								            created_at=r["created_at"],
 								            evaluated_at=r["evaluated_at"],
 								        )
 								        for r in rows
 								    ]
 								def get_accuracy_stats() -> dict:
 								    """Summarise how well EIDOS predictions have matched reality.

 								    Runs a single aggregate query over ``spark_predictions`` and returns
 								    a dict with these keys:

 								    - ``total_predictions``: number of stored rows
 								    - ``evaluated``: rows whose ``evaluated_at`` is set
 								    - ``pending``: ``total_predictions`` minus ``evaluated``
 								    - ``avg_accuracy`` / ``min_accuracy`` / ``max_accuracy``: aggregates
 								      over non-NULL ``accuracy`` values, rounded to two decimals

 								    Any aggregate that comes back NULL or zero is reported as ``0``
 								    (``0.0`` for the accuracy figures).
 								    """
 								    with _get_conn() as conn:
 								        cursor = conn.execute("""
 								            SELECT
 								                COUNT(*)                          AS total_predictions,
 								                COUNT(evaluated_at)               AS evaluated,
 								                AVG(CASE WHEN accuracy IS NOT NULL THEN accuracy END) AS avg_accuracy,
 								                MIN(CASE WHEN accuracy IS NOT NULL THEN accuracy END) AS min_accuracy,
 								                MAX(CASE WHEN accuracy IS NOT NULL THEN accuracy END) AS max_accuracy
 								            FROM spark_predictions
 								            """)
 								        stats = cursor.fetchone()

 								    # Counts default to 0 so the subtraction below never sees None.
 								    total = stats["total_predictions"] or 0
 								    done = stats["evaluated"] or 0

 								    summary = {
 								        "total_predictions": total,
 								        "evaluated": done,
 								        "pending": total - done,
 								    }
 								    # The accuracy aggregates are NULL when no row has an accuracy yet.
 								    for column in ("avg_accuracy", "min_accuracy", "max_accuracy"):
 								        summary[column] = round(stats[column] or 0.0, 2)
 								    return summary