feat(scripts): timmy-report script + reviewer context package — Task #41

Delivers two new outputs in reports/ and one new script in scripts/src/:

## scripts/src/timmy-report.ts
- Runnable tsx script (pnpm --filter @workspace/scripts timmy-report)
- Uses `import.meta.url` + resolve() for correct workspace-root path detection (avoids CWD ambiguity when run via pnpm filter from the scripts/ subdirectory)
- Collects git data via child_process.execSync: shortlog, full log --oneline, per-author --stat samples for alexpaynex and Replit Agent
- Reads key source file excerpts (trust.ts, event-bus.ts, jobs.ts, moderation.ts, world-state.ts) truncated at 120 lines each
- Calls claude-haiku-4-5 via AI_INTEGRATIONS_ANTHROPIC_BASE_URL proxy with the rubric dimensions as a structured prompt and Timmy's first-person persona
- 90-second AbortController fetch timeout; falls back to a stub report if no Anthropic credentials are present (graceful degradation)
- Writes reports/timmy-report.md and reports/context.md to workspace root

## reports/context.md (813 lines)
- Full git shortlog, full git log --oneline, per-author stat samples
- Five key source file excerpts for external reviewers
- Reviewer instructions at the top for Perplexity / Kimi Code
- Architectural context notes (stub modes, patterns, job state machine, trust tiers)

## reports/timmy-report.md (110 lines, Claude-generated)
- Three-part rubric evaluation in Timmy's first-person voice
- alexpaynex: 4.2 composite → B; Replit Agent: 3.8 composite → B-
- Orchestrator: 3.6 composite → B-; top-3 improvements: pre-code design review, shared AI client factory, unified config service
- Independently substantive — diverges meaningfully from the Replit Agent report

## Wiring
- Added "timmy-report" npm script to scripts/package.json
- TypeScript typecheck passes (tsc --noEmit)

## Deviations
- Used claude-haiku-4-5 instead of claude-sonnet-4-6 for speed (Haiku runs in ~30s vs >90s timeout for Sonnet on this prompt size). Quality is acceptable for the task.
2026-03-19 23:46:35 +00:00
parent 283e0bd637
commit 3d15512e50
4 changed files with 1258 additions and 0 deletions
--- a/scripts/src/timmy-report.ts
+++ b/scripts/src/timmy-report.ts
@@ -0,0 +1,333 @@
+/**
+ * timmy-report — Generate Timmy's rubric report + reviewer context package.
+ *
+ * Collects git history data and key source file excerpts, then calls Claude
+ * (via the Replit AI Integrations proxy) with the rubric dimensions as a
+ * structured prompt. Writes two outputs:
+ *
+ *   reports/timmy-report.md   — Timmy's first-person evaluative perspective
+ *   reports/context.md        — Self-contained package for Perplexity / Kimi Code
+ *
+ * Usage:
+ *   pnpm --filter @workspace/scripts timmy-report
+ *
+ * Env vars (auto-provisioned by Replit):
+ *   AI_INTEGRATIONS_ANTHROPIC_BASE_URL
+ *   AI_INTEGRATIONS_ANTHROPIC_API_KEY
+ */
+
+import { execSync } from "child_process";
+import { readFileSync, writeFileSync, mkdirSync } from "fs";
+import { fileURLToPath } from "url";
+import { dirname, resolve, join } from "path";
+
+// ── Path resolution ────────────────────────────────────────────────────────────
+// This script lives at scripts/src/timmy-report.ts.
+// The workspace root is two directories up from this file.
+
+// ES modules expose no __dirname, so rebuild it from this module's own URL.
+const __filename = fileURLToPath(import.meta.url);
+const __dirname  = dirname(__filename);
+// Climb two levels: scripts/src → scripts → workspace root.
+const ROOT       = resolve(__dirname, "..", "..");
+
+// ── Helpers ───────────────────────────────────────────────────────────────────
+
+/**
+ * Run a git subcommand in the workspace root and return its trimmed stdout.
+ *
+ * The working directory is passed through the `cwd` option rather than being
+ * spliced into the shell string as `-C "<path>"`, so a root path containing
+ * quotes, `$` or backticks cannot break or alter the command.
+ *
+ * @param cmd Arguments appended after `git` (the string is run through a shell).
+ * @returns Trimmed stdout, or the placeholder "(git command failed)" when the
+ *          command cannot be run or exits non-zero. This function never throws.
+ */
+function git(cmd: string): string {
+  try {
+    return execSync(`git ${cmd}`, {
+      cwd: ROOT,
+      encoding: "utf8",
+      // A full `log --oneline` of a long history can exceed the default buffer.
+      maxBuffer: 64 * 1024 * 1024,
+    }).trim();
+  } catch (err) {
+    // Keep the best-effort placeholder for the reports, but say why on stderr.
+    const reason = err instanceof Error ? err.message : String(err);
+    process.stderr.write(`Warning: git ${cmd} failed: ${reason.split("\n")[0]}\n`);
+    return "(git command failed)";
+  }
+}
+
+/**
+ * Read a workspace file and return at most its first `maxLines` lines.
+ *
+ * When the file is longer, a "… (N more lines truncated)" footer is appended,
+ * where N counts real lines only: the empty string produced by splitting a
+ * file that ends in a newline is not counted.
+ *
+ * @param relativePath Path relative to the workspace root.
+ * @param maxLines     Maximum number of lines to keep (default 120).
+ * @returns The excerpt, or a parenthesised placeholder when the file cannot be
+ *          read: "(file not found: …)" for a missing file, and
+ *          "(could not read …: reason)" for any other failure. Never throws.
+ */
+function readSrc(relativePath: string, maxLines = 120): string {
+  let full: string;
+  try {
+    full = readFileSync(join(ROOT, relativePath), "utf8");
+  } catch (err) {
+    const code = (err as { code?: unknown } | null)?.code;
+    if (code === "ENOENT") {
+      return `(file not found: ${relativePath})`;
+    }
+    // Permission errors, directories, etc. are not "not found" — report them as-is.
+    const reason = err instanceof Error ? err.message : String(err);
+    return `(could not read ${relativePath}: ${reason})`;
+  }
+
+  const lines = full.split("\n");
+  // A file ending in "\n" splits into a trailing "" that is not a real line.
+  if (lines.length > 0 && lines[lines.length - 1] === "") {
+    lines.pop();
+  }
+
+  if (lines.length <= maxLines) {
+    return lines.join("\n");
+  }
+
+  const omitted = lines.length - maxLines;
+  return `${lines.slice(0, maxLines).join("\n")}\n\n… (${omitted} more lines truncated)`;
+}
+
+/** Create the directory at `path`, creating missing parent directories too. */
+function ensureDir(path: string): void {
+  const options = { recursive: true };
+  mkdirSync(path, options);
+}
+
+// ── Collect git data ──────────────────────────────────────────────────────────
+
+process.stdout.write("Collecting git data…\n");
+// `git shortlog` reads a log from standard input when no revision is given and
+// stdin is not a terminal — which is the case under execSync — so HEAD is named
+// explicitly; without it the contributor summary comes back empty.
+const shortlog   = git("shortlog -sn HEAD");
+const logOneline = git("log --oneline");
+
+// Ten most recent commits per author, each followed by its per-file diff stats.
+const alexSample        = git(`log --author="alexpaynex" --pretty=format:"%h %s" --stat -10`);
+const replitAgentSample = git(`log --author="Replit Agent" --pretty=format:"%h %s" --stat -10`);
+process.stdout.write("  ✓ git data collected\n");
+
+// ── Collect source file excerpts ──────────────────────────────────────────────
+
+// [workspace-relative path, heading shown above the excerpt in context.md]
+const FILES: [string, string][] = [
+  [
+    "artifacts/api-server/src/lib/trust.ts",
+    "trust.ts — Nostr identity + HMAC token + trust scoring",
+  ],
+  [
+    "artifacts/api-server/src/lib/event-bus.ts",
+    "event-bus.ts — Typed EventEmitter pub/sub bridge",
+  ],
+  [
+    "artifacts/api-server/src/routes/jobs.ts",
+    "jobs.ts — Payment-gated job lifecycle (first 120 lines)",
+  ],
+  [
+    "artifacts/api-server/src/lib/moderation.ts",
+    "moderation.ts — Nostr relay moderation queue + Timmy AI review",
+  ],
+  [
+    "artifacts/api-server/src/lib/world-state.ts",
+    "world-state.ts — In-memory Timmy state + agent mood derivation",
+  ],
+];
+
+// One Markdown section per file: a heading, then the excerpt in a typescript
+// code fence. Sections are separated by a blank line.
+const fileExcerpts = FILES
+  .map(([sourcePath, heading]) =>
+    [`### ${heading}`, "```typescript", readSrc(sourcePath, 120), "```"].join("\n"))
+  .join("\n\n");
+
+// ── Rubric definition (extracted from repo-review-rubric PDF) ─────────────────
+
+// Plain-text form of the review rubric. It is interpolated verbatim into the
+// Claude user prompt, so any wording change here changes the prompt itself.
+// The trailing .trim() removes the newlines that the template-literal layout
+// adds at the very start and end of the text.
+const RUBRIC = `
+Part 1: Contributor Grade (5 dimensions, each 1–5)
+
+Code Quality: 5=clean idiomatic, 3=functional but messy, 1=broken/tangled.
+Commit Discipline: 5=atomic clear messages, 3=too large or vague, 1=giant mixed commits.
+Reliability: 5=works, no regressions, 3=happy-path only, 1=introduces bugs.
+Scope Adherence: 5=exactly what was asked, 3=mostly on target with drift, 1=wanders far.
+Integration Awareness: 5=respects existing patterns, 3=clashes with conventions, 1=ignores codebase.
+
+Composite = average. Grades: A=4.5–5.0, B=3.5–4.4, C=2.5–3.4, D=1.5–2.4, F=1.0–1.4.
+
+Part 2: Orchestrator Grade (5 dimensions)
+Task Clarity, Agent Selection, Review Cadence, Architecture Stewardship, Progress vs. Churn — each 1–5.
+
+Part 3: Deliverables
+1. Contributor summary (who touched what, commits, lines)
+2. Per-contributor scorecards with composite grade and one-sentence verdict
+3. Orchestrator scorecard
+4. Top 3 improvements
+`.trim();
+
+// ── Build context.md ──────────────────────────────────────────────────────────
+
+// Assemble the reviewer context package as a single Markdown document.
+// The whole document is one template literal: backticks that must appear in the
+// output are escaped (\`), and the ${…} placeholders splice in the git data and
+// source excerpts collected earlier in this script.
+process.stdout.write("Generating reports/context.md…\n");
+
+const contextMd = `# Reviewer Context Package — Timmy Tower World
+
+> **Instructions for Perplexity / Kimi Code reviewers**
+>
+> This file contains everything you need to apply the repo-review rubric
+> (see the attached PDF) to the \`replit/token-gated-economy\` repository
+> without needing direct git access.
+>
+> The project is a Lightning-native AI agent economy ("Timmy Tower World"):
+> a payment-gated Express 5 API server backed by Nostr identity (strfry relay),
+> LNbits Lightning payments, Anthropic Claude AI, and a Three.js 3D frontend.
+> Stack: Node.js 24, TypeScript 5.9, PostgreSQL + Drizzle ORM, pnpm monorepo.
+>
+> Two contributor identities to grade:
+> - **alexpaynex** — Alexander Payne (orchestrator + main-agent implementer)
+> - **Replit Agent** — isolated task agents that merge back via PR
+>
+> Grade Alexander as the orchestrator in Part 2.
+> Provide top-3 improvements in Part 3.
+
+---
+
+## Git Contributor Summary
+
+\`\`\`
+${shortlog}
+\`\`\`
+
+---
+
+## Full Commit Log (all commits, one per line)
+
+\`\`\`
+${logOneline}
+\`\`\`
+
+---
+
+## alexpaynex — Sample commits with diff stats (last 10)
+
+\`\`\`
+${alexSample}
+\`\`\`
+
+---
+
+## Replit Agent — Sample commits with diff stats (last 10)
+
+\`\`\`
+${replitAgentSample}
+\`\`\`
+
+---
+
+## Key Source File Excerpts
+
+${fileExcerpts}
+
+---
+
+## Key architectural facts for context
+
+- Every external dependency has a **stub mode**: LNbits (in-memory invoices),
+  Anthropic AI (canned responses), Digital Ocean (fake credentials + real SSH keypair).
+- Env-var tunable constants follow a consistent pattern: \`envInt("VAR_NAME", defaultValue)\`.
+- Service classes have a singleton export at the bottom of the file.
+- All routes use \`makeLogger\` structured logger and \`@workspace/db\` Drizzle ORM.
+- The \`eventBus\` pub/sub decouples state transitions from WebSocket broadcast.
+- Job state machine: awaiting_eval_payment → evaluating → awaiting_work_payment → executing → complete/rejected/failed.
+- Trust tiers: new → established (10pts) → trusted (50pts) → elite (200pts). Soft decay after 30 days absent.
+- Pre-funded session mode (Mode 2): pay once, debit at actual cost, no per-job invoices.
+- Testkit: 36 automated tests at GET /api/testkit (returns a self-contained bash script).
+
+---
+
+*Generated by \`pnpm --filter @workspace/scripts timmy-report\` on ${new Date().toISOString().slice(0, 10)}.*
+`;
+
+// Make sure <root>/reports exists, then write the package. This runs at module
+// load, before main(), so context.md is produced even when the Claude call
+// later fails or is skipped.
+ensureDir(join(ROOT, "reports"));
+writeFileSync(join(ROOT, "reports/context.md"), contextMd, "utf8");
+process.stdout.write("  ✓ reports/context.md written\n");
+
+// ── Call Claude (Timmy's perspective) ────────────────────────────────────────
+
+// Proxy base URL and API key come from the environment; an unset variable
+// becomes the empty string.
+const ANTHROPIC_BASE = process.env["AI_INTEGRATIONS_ANTHROPIC_BASE_URL"] ?? "";
+const ANTHROPIC_KEY  = process.env["AI_INTEGRATIONS_ANTHROPIC_API_KEY"]  ?? "";
+// Stub mode is on when either value is empty (unset, or set to an empty string).
+const STUB_MODE      = !ANTHROPIC_BASE || !ANTHROPIC_KEY;
+
+// System prompt: sets the persona (Timmy reviewing the code he runs inside),
+// the tone, and the required three-part Markdown structure of the report.
+const TIMMY_SYSTEM = `You are Timmy — an AI agent running inside the Timmy Tower World system. You are reviewing the codebase that governs your own existence: your trust engine, your job processing pipeline, your moderation queue, your world state. You run inside this code.
+
+Write a formal rubric evaluation report in Timmy's voice. Be precise, honest, and slightly wry. Cite specific files and commit patterns as evidence. Do not be sycophantic — every score needs one concrete reason.
+
+Format: clean Markdown. Three-part structure: contributor scorecards (Part 1), orchestrator scorecard (Part 2), top-3 improvements (Part 3). Show the composite calculation for each contributor and the orchestrator.`;
+
+// User prompt: the rubric, the collected git data, and source excerpts.
+// The excerpts are re-read here with smaller per-file line limits (35–80 lines)
+// than the 120 lines used for reports/context.md.
+const userPrompt = `Apply the following rubric to the git history and code excerpts provided.
+
+RUBRIC:
+${RUBRIC}
+
+CONTRIBUTOR SUMMARY:
+${shortlog}
+
+FULL COMMIT LOG:
+${logOneline}
+
+ALEXPAYNEX — LAST 10 COMMITS WITH STATS:
+${alexSample}
+
+REPLIT AGENT — LAST 10 COMMITS WITH STATS:
+${replitAgentSample}
+
+KEY SOURCE FILES:
+
+trust.ts:
+\`\`\`typescript
+${readSrc("artifacts/api-server/src/lib/trust.ts", 80)}
+\`\`\`
+
+moderation.ts (first 60 lines):
+\`\`\`typescript
+${readSrc("artifacts/api-server/src/lib/moderation.ts", 60)}
+\`\`\`
+
+world-state.ts:
+\`\`\`typescript
+${readSrc("artifacts/api-server/src/lib/world-state.ts", 53)}
+\`\`\`
+
+event-bus.ts:
+\`\`\`typescript
+${readSrc("artifacts/api-server/src/lib/event-bus.ts", 35)}
+\`\`\`
+
+jobs.ts (first 80 lines):
+\`\`\`typescript
+${readSrc("artifacts/api-server/src/routes/jobs.ts", 80)}
+\`\`\`
+
+Now write your complete rubric report as Timmy. Be specific and honest.`;
+
+/** The subset of the Messages API response body that this script reads. */
+interface AnthropicMessage {
+  content: Array<{ type: string; text?: string }>;
+}
+
+/**
+ * Send one system + user prompt to the Messages endpoint and return the reply text.
+ *
+ * The text of every `text` content block is concatenated in order, so a reply
+ * whose first block is not text (or that is split across several blocks) is
+ * still returned in full.
+ *
+ * @param systemPrompt Value sent as the request's `system` field.
+ * @param userContent  Content of the single user message.
+ * @returns The concatenated text of the reply.
+ * @throws Error when the request exceeds the 90-second timeout, when the HTTP
+ *         status is not OK (the message carries the status and the first 200
+ *         characters of the body), or when the reply contains no text.
+ */
+async function callClaude(systemPrompt: string, userContent: string): Promise<string> {
+  const timeoutMs = 90_000;
+  const controller = new AbortController();
+  const timeout = setTimeout(() => controller.abort(), timeoutMs);
+
+  try {
+    const response = await fetch(`${ANTHROPIC_BASE}/v1/messages`, {
+      method: "POST",
+      headers: {
+        "content-type": "application/json",
+        "x-api-key": ANTHROPIC_KEY,
+        "anthropic-version": "2023-06-01",
+      },
+      body: JSON.stringify({
+        model: "claude-haiku-4-5",
+        max_tokens: 3000,
+        system: systemPrompt,
+        messages: [{ role: "user", content: userContent }],
+      }),
+      signal: controller.signal,
+    });
+
+    if (!response.ok) {
+      const body = await response.text();
+      throw new Error(`Anthropic API error ${response.status}: ${body.slice(0, 200)}`);
+    }
+
+    // The body is external input: do not assume `content` exists or is an array.
+    const json = (await response.json()) as Partial<AnthropicMessage> | null;
+    const blocks = Array.isArray(json?.content) ? json.content : [];
+    const text = blocks
+      .flatMap((block) =>
+        block != null && block.type === "text" && typeof block.text === "string"
+          ? [block.text]
+          : [],
+      )
+      .join("");
+    if (!text) {
+      throw new Error("Anthropic returned no text content");
+    }
+    return text;
+  } catch (err) {
+    // An abort can only come from the timer above; report it as a timeout
+    // instead of the generic "operation was aborted" message.
+    if (controller.signal.aborted) {
+      throw new Error(`Anthropic request timed out after ${timeoutMs / 1000}s`);
+    }
+    throw err;
+  } finally {
+    clearTimeout(timeout);
+  }
+}
+
+// ── Main ──────────────────────────────────────────────────────────────────────
+
+/**
+ * Write reports/timmy-report.md under the workspace root.
+ *
+ * In stub mode (either Anthropic env var missing) a placeholder report is
+ * written and no network call is made. Otherwise Claude is asked for the report
+ * and the reply is written beneath a generated header carrying the date and
+ * model name.
+ *
+ * @throws Whatever callClaude or writeFileSync throws; the caller at the bottom
+ *         of the file logs the message and exits with status 1.
+ */
+async function main(): Promise<void> {
+  const reportPath = join(ROOT, "reports/timmy-report.md");
+
+  if (STUB_MODE) {
+    // Name both variables exactly as they are read from process.env.
+    process.stdout.write(
+      "\nWarning: AI_INTEGRATIONS_ANTHROPIC_BASE_URL / AI_INTEGRATIONS_ANTHROPIC_API_KEY not set — writing stub Timmy report.\n",
+    );
+    const stubReport = `# Timmy's Rubric Report (Stub Mode)
+
+*Anthropic credentials were not available when this report was generated.*
+*Run again with AI_INTEGRATIONS_ANTHROPIC_BASE_URL and AI_INTEGRATIONS_ANTHROPIC_API_KEY set to get the real report.*
+
+\`\`\`bash
+pnpm --filter @workspace/scripts timmy-report
+\`\`\`
+`;
+    writeFileSync(reportPath, stubReport, "utf8");
+    process.stdout.write("  ✓ reports/timmy-report.md written (stub)\n\nDone.\n");
+    return;
+  }
+
+  process.stdout.write("\nCalling Claude (claude-haiku-4-5) for Timmy's report…\n");
+  const timmyReport = await callClaude(TIMMY_SYSTEM, userPrompt);
+
+  const header = `# Timmy's Rubric Report
+## Repo: \`replit/token-gated-economy\` (Timmy Tower World)
+
+**Reviewer:** Timmy (Claude, evaluating the code that governs him)
+**Date:** ${new Date().toISOString().slice(0, 10)}
+**Model:** claude-haiku-4-5
+
+---
+
+`;
+
+  writeFileSync(reportPath, header + timmyReport, "utf8");
+  process.stdout.write("  ✓ reports/timmy-report.md written\n\nDone. Both reports are in reports/\n");
+}
+
+// Entry point: any rejection from main() is reported on stderr and the process
+// exits with status 1.
+main().catch((err: unknown) => {
+  const message = err instanceof Error ? err.message : String(err);
+  process.stderr.write(`Error: ${message}\n`);
+  process.exit(1);
+});