Timmy-time-dashboard/src/timmy/sovereignty/session_report.py

"""Session Sovereignty Report Generator.

Auto-generates a sovereignty scorecard at the end of each play session
and commits it as a markdown file to the Gitea repo under
``reports/sovereignty/``.

Report contents (per issue #957):
- Session duration + game played
- Total model calls by type (VLM, LLM, TTS, API)
- Total cache/rule hits by type
- New skills crystallized (placeholder — pending skill-tracking impl)
- Sovereignty delta (change from session start → end)
- Cost breakdown (actual API spend)
- Per-layer sovereignty %: perception, decision, narration
- Trend comparison vs previous session

Refs: #957 (Sovereignty P0) · #953 (The Sovereignty Loop)
"""

import base64
import json
import logging
from datetime import UTC, datetime
from pathlib import Path
from typing import Any

import httpx

from config import settings

# Optional module-level imports — degrade gracefully if unavailable at import time
try:
    from timmy.session_logger import get_session_logger
except Exception:  # ImportError or circular import during early startup
    get_session_logger = None  # type: ignore[assignment]

try:
    from infrastructure.sovereignty_metrics import GRADUATION_TARGETS, get_sovereignty_store
except Exception:
    GRADUATION_TARGETS: dict = {}  # type: ignore[assignment]
    get_sovereignty_store = None  # type: ignore[assignment]

logger = logging.getLogger(__name__)

# Module-level session start time; set by mark_session_start()
_SESSION_START: datetime | None = None


# ---------------------------------------------------------------------------
# Public API
# ---------------------------------------------------------------------------


def mark_session_start() -> None:
    """Record the session start wall-clock time.

    Call once during application startup so ``generate_report()`` can
    compute accurate session durations.
    """
    global _SESSION_START
    _SESSION_START = datetime.now(UTC)
    logger.debug("Sovereignty: session start recorded at %s", _SESSION_START.isoformat())


def generate_report(session_id: str = "dashboard") -> str:
    """Render a sovereignty scorecard as a markdown string.

    Pulls from:
    - ``timmy.session_logger`` — message/tool-call/error counts
    - ``infrastructure.sovereignty_metrics`` — cache hit rate, API cost,
      graduation phase, and trend data

    Args:
        session_id: The session identifier (default: "dashboard").

    Returns:
        Markdown-formatted sovereignty report string.
    """
    now = datetime.now(UTC)
    session_start = _SESSION_START or now
    duration_secs = (now - session_start).total_seconds()

    session_data = _gather_session_data()
    sov_data = _gather_sovereignty_data()

    return _render_markdown(now, session_id, duration_secs, session_data, sov_data)


def commit_report(report_md: str, session_id: str = "dashboard") -> bool:
    """Commit a sovereignty report to the Gitea repo.

    Creates or updates ``reports/sovereignty/{date}_{session_id}.md``
    via the Gitea Contents API.  Degrades gracefully: logs a warning
    and returns ``False`` if Gitea is unreachable or misconfigured.

    Args:
        report_md: Markdown content to commit.
        session_id: Session identifier used in the filename.

    Returns:
        ``True`` on success, ``False`` on failure.
    """
    if not settings.gitea_enabled:
        logger.info("Sovereignty: Gitea disabled — skipping report commit")
        return False

    if not settings.gitea_token:
        logger.warning("Sovereignty: no Gitea token — skipping report commit")
        return False

    date_str = datetime.now(UTC).strftime("%Y-%m-%d")
    file_path = f"reports/sovereignty/{date_str}_{session_id}.md"
    url = f"{settings.gitea_url}/api/v1/repos/{settings.gitea_repo}/contents/{file_path}"
    headers = {
        "Authorization": f"token {settings.gitea_token}",
        "Content-Type": "application/json",
    }
    encoded_content = base64.b64encode(report_md.encode()).decode()
    commit_message = (
        f"report: sovereignty session {session_id} ({date_str})\n\n"
        f"Auto-generated by Timmy. Refs #957"
    )
    payload: dict[str, Any] = {
        "message": commit_message,
        "content": encoded_content,
    }

    try:
        with httpx.Client(timeout=10.0) as client:
            # Fetch existing file SHA so we can update rather than create
            check = client.get(url, headers=headers)
            if check.status_code == 200:
                existing = check.json()
                payload["sha"] = existing.get("sha", "")

            resp = client.put(url, headers=headers, json=payload)
            resp.raise_for_status()

        logger.info("Sovereignty: report committed to %s", file_path)
        return True

    except httpx.HTTPStatusError as exc:
        logger.warning(
            "Sovereignty: commit failed (HTTP %s): %s",
            exc.response.status_code,
            exc,
        )
        return False
    except Exception as exc:
        logger.warning("Sovereignty: commit failed: %s", exc)
        return False


async def generate_and_commit_report(session_id: str = "dashboard") -> bool:
    """Generate and commit a sovereignty report for the current session.

    Primary entry point — call at session end / application shutdown.
    Wraps the synchronous ``commit_report`` call in ``asyncio.to_thread``
    so it does not block the event loop.

    Args:
        session_id: The session identifier.

    Returns:
        ``True`` if the report was generated and committed successfully.
    """
    import asyncio

    try:
        report_md = generate_report(session_id)
        logger.info("Sovereignty: report generated (%d chars)", len(report_md))
        committed = await asyncio.to_thread(commit_report, report_md, session_id)
        return committed
    except Exception as exc:
        logger.warning("Sovereignty: report generation failed: %s", exc)
        return False


# ---------------------------------------------------------------------------
# Internal helpers
# ---------------------------------------------------------------------------


def _format_duration(seconds: float) -> str:
    """Format a duration in seconds as a human-readable string."""
    total = int(seconds)
    hours, remainder = divmod(total, 3600)
    minutes, secs = divmod(remainder, 60)
    if hours:
        return f"{hours}h {minutes}m {secs}s"
    if minutes:
        return f"{minutes}m {secs}s"
    return f"{secs}s"


def _gather_session_data() -> dict[str, Any]:
    """Pull session statistics from the session logger.

    Returns a dict with:
    - ``user_messages``, ``timmy_messages``, ``tool_calls``, ``errors``
    - ``tool_call_breakdown``: dict[tool_name, count]
    """
    default: dict[str, Any] = {
        "user_messages": 0,
        "timmy_messages": 0,
        "tool_calls": 0,
        "errors": 0,
        "tool_call_breakdown": {},
    }

    try:
        if get_session_logger is None:
            return default
        sl = get_session_logger()
        sl.flush()

        # Read today's session file directly for accurate counts
        if not sl.session_file.exists():
            return default

        entries: list[dict] = []
        with open(sl.session_file) as f:
            for line in f:
                line = line.strip()
                if line:
                    try:
                        entries.append(json.loads(line))
                    except json.JSONDecodeError:
                        continue

        tool_breakdown: dict[str, int] = {}
        user_msgs = timmy_msgs = tool_calls = errors = 0

        for entry in entries:
            etype = entry.get("type")
            if etype == "message":
                if entry.get("role") == "user":
                    user_msgs += 1
                elif entry.get("role") == "timmy":
                    timmy_msgs += 1
            elif etype == "tool_call":
                tool_calls += 1
                tool_name = entry.get("tool", "unknown")
                tool_breakdown[tool_name] = tool_breakdown.get(tool_name, 0) + 1
            elif etype == "error":
                errors += 1

        return {
            "user_messages": user_msgs,
            "timmy_messages": timmy_msgs,
            "tool_calls": tool_calls,
            "errors": errors,
            "tool_call_breakdown": tool_breakdown,
        }

    except Exception as exc:
        logger.warning("Sovereignty: failed to gather session data: %s", exc)
        return default


def _gather_sovereignty_data() -> dict[str, Any]:
    """Pull sovereignty metrics from the SQLite store.

    Returns a dict with:
    - ``metrics``: summary from ``SovereigntyMetricsStore.get_summary()``
    - ``deltas``: per-metric start/end values within recent history window
    - ``previous_session``: most recent prior value for each metric
    """
    try:
        if get_sovereignty_store is None:
            return {"metrics": {}, "deltas": {}, "previous_session": {}}
        store = get_sovereignty_store()
        summary = store.get_summary()

        deltas: dict[str, dict[str, Any]] = {}
        previous_session: dict[str, float | None] = {}

        for metric_type in GRADUATION_TARGETS:
            history = store.get_latest(metric_type, limit=10)
            if len(history) >= 2:
                deltas[metric_type] = {
                    "start": history[-1]["value"],
                    "end": history[0]["value"],
                }
                previous_session[metric_type] = history[1]["value"]
            elif len(history) == 1:
                deltas[metric_type] = {"start": history[0]["value"], "end": history[0]["value"]}
                previous_session[metric_type] = None
            else:
                deltas[metric_type] = {"start": None, "end": None}
                previous_session[metric_type] = None

        return {
            "metrics": summary,
            "deltas": deltas,
            "previous_session": previous_session,
        }

    except Exception as exc:
        logger.warning("Sovereignty: failed to gather sovereignty data: %s", exc)
        return {"metrics": {}, "deltas": {}, "previous_session": {}}


def _render_markdown(
    now: datetime,
    session_id: str,
    duration_secs: float,
    session_data: dict[str, Any],
    sov_data: dict[str, Any],
) -> str:
    """Assemble the full sovereignty report in markdown."""
    lines: list[str] = []

    # Header
    lines += [
        "# Sovereignty Session Report",
        "",
        f"**Session ID:** `{session_id}`  ",
        f"**Date:** {now.strftime('%Y-%m-%d')}  ",
        f"**Duration:** {_format_duration(duration_secs)}  ",
        f"**Generated:** {now.isoformat()}",
        "",
        "---",
        "",
    ]

    # Session activity
    lines += [
        "## Session Activity",
        "",
        "| Metric | Count |",
        "|--------|-------|",
        f"| User messages | {session_data['user_messages']} |",
        f"| Timmy responses | {session_data['timmy_messages']} |",
        f"| Tool calls | {session_data['tool_calls']} |",
        f"| Errors | {session_data['errors']} |",
        "",
    ]

    tool_breakdown = session_data.get("tool_call_breakdown", {})
    if tool_breakdown:
        lines += ["### Model Calls by Tool", ""]
        for tool_name, count in sorted(tool_breakdown.items(), key=lambda x: -x[1]):
            lines.append(f"- `{tool_name}`: {count}")
        lines.append("")

    # Sovereignty scorecard

    lines += [
        "## Sovereignty Scorecard",
        "",
        "| Metric | Current | Target (graduation) | Phase |",
        "|--------|---------|---------------------|-------|",
    ]

    for metric_type, data in sov_data["metrics"].items():
        current = data.get("current")
        current_str = f"{current:.4f}" if current is not None else "N/A"
        grad_target = GRADUATION_TARGETS.get(metric_type, {}).get("graduation")
        grad_str = f"{grad_target:.4f}" if isinstance(grad_target, (int, float)) else "N/A"
        phase = data.get("phase", "unknown")
        lines.append(f"| {metric_type} | {current_str} | {grad_str} | {phase} |")

    lines += ["", "### Sovereignty Delta (This Session)", ""]

    for metric_type, delta_info in sov_data.get("deltas", {}).items():
        start_val = delta_info.get("start")
        end_val = delta_info.get("end")
        if start_val is not None and end_val is not None:
            diff = end_val - start_val
            sign = "+" if diff >= 0 else ""
            lines.append(
                f"- **{metric_type}**: {start_val:.4f} → {end_val:.4f} ({sign}{diff:.4f})"
            )
        else:
            lines.append(f"- **{metric_type}**: N/A (no data recorded)")

    # Cost breakdown
    lines += ["", "## Cost Breakdown", ""]
    api_cost_data = sov_data["metrics"].get("api_cost", {})
    current_cost = api_cost_data.get("current")
    if current_cost is not None:
        lines.append(f"- **Total API spend (latest recorded):** ${current_cost:.4f}")
    else:
        lines.append("- **Total API spend:** N/A (no data recorded)")
    lines.append("")

    # Per-layer sovereignty
    lines += [
        "## Per-Layer Sovereignty",
        "",
        "| Layer | Sovereignty % |",
        "|-------|--------------|",
        "| Perception (VLM) | N/A |",
        "| Decision (LLM) | N/A |",
        "| Narration (TTS) | N/A |",
        "",
        "> Per-layer tracking requires instrumented inference calls. See #957.",
        "",
    ]

    # Skills crystallized
    lines += [
        "## Skills Crystallized",
        "",
        "_Skill crystallization tracking not yet implemented. See #957._",
        "",
    ]

    # Trend vs previous session
    lines += ["## Trend vs Previous Session", ""]
    prev_data = sov_data.get("previous_session", {})
    has_prev = any(v is not None for v in prev_data.values())

    if has_prev:
        lines += [
            "| Metric | Previous | Current | Change |",
            "|--------|----------|---------|--------|",
        ]
        for metric_type, curr_info in sov_data["metrics"].items():
            curr_val = curr_info.get("current")
            prev_val = prev_data.get(metric_type)
            curr_str = f"{curr_val:.4f}" if curr_val is not None else "N/A"
            prev_str = f"{prev_val:.4f}" if prev_val is not None else "N/A"
            if curr_val is not None and prev_val is not None:
                diff = curr_val - prev_val
                sign = "+" if diff >= 0 else ""
                change_str = f"{sign}{diff:.4f}"
            else:
                change_str = "N/A"
            lines.append(f"| {metric_type} | {prev_str} | {curr_str} | {change_str} |")
        lines.append("")
    else:
        lines += ["_No previous session data available for comparison._", ""]

    # Footer
    lines += [
        "---",
        "_Auto-generated by Timmy · Session Sovereignty Report · Refs: #957_",
    ]

    return "\n".join(lines)