## Routes added to artifacts/api-server/src/routes/testkit.ts
### GET /api/testkit/plan
- Returns TIMMY_TEST_PLAN.md verbatim as text/markdown; charset=utf-8
- Reads file at request time (not on startup) so edits to the plan are picked
up without server restart
- Path resolves via import.meta.url + dirname() → 4 levels up to project root
(handles both dev/tsx and compiled dist/routes/ directories)
### GET /api/testkit/report
- Returns only the content from "## Report template" heading to end-of-file
- Content-Type: text/plain; charset=utf-8 — ready to copy and fill in
- Slice is found with indexOf("## Report template"); 500 if marker absent
- Uses the same PLAN_PATH as /api/testkit/plan (single source of truth)
## Deviation: __dirname → import.meta.url
Original plan said "resolve relative to project root regardless of cwd".
The codebase runs as ESM (tsx / ts-node with ESM), so __dirname is not
defined. Fixed by using dirname(fileURLToPath(import.meta.url)) instead —
equivalent semantics, correct in both dev and compiled output.
## AGENTS.md — Testing section added
Three-step workflow documented between "Branch and PR conventions" and
"Stub mode" sections:
1. curl <BASE>/api/testkit/plan — fetch plan before starting
2. curl -s <BASE>/api/testkit | bash — run suite after implementing
3. curl <BASE>/api/testkit/report — fetch report template to fill in
## Unchanged
- GET /api/testkit bash script generation: untouched
- No new test cases or script modifications
## TypeScript: 0 errors. Smoke tests all pass:
- /api/testkit/plan → 200 text/markdown, full TIMMY_TEST_PLAN.md content
- /api/testkit/report → 200 text/plain, starts at "## Report template"
- /api/testkit → 200 bash script, unchanged
810 lines
38 KiB
TypeScript
810 lines
38 KiB
TypeScript
import { Router, type Request, type Response } from "express";
|
||
import { readFileSync } from "fs";
|
||
import { resolve, dirname } from "path";
|
||
import { fileURLToPath } from "url";
|
||
|
||
const router = Router();
|
||
|
||
/**
|
||
* GET /api/testkit
|
||
*
|
||
* Returns a self-contained bash script pre-configured with this server's
|
||
* BASE URL. Agents and testers can run the full test suite with one command:
|
||
*
|
||
* curl -s https://your-url.replit.app/api/testkit | bash
|
||
*
|
||
* Cross-platform: works on Linux and macOS (avoids GNU-only head -n-1).
|
||
*
|
||
* Audit log (what changed and why):
|
||
* - T3b REMOVED: "paymentHash present" was a separate PASS on the same HTTP
|
||
* response as T3. Artificial count inflation. Folded into T3 as one assertion.
|
||
* - T9 TIGHTENED: assertion is now GOT_429 -ge 3 (not -ge 1). Rate limit is 5/hr;
|
||
* after T8c (slot 1) and T7 (slot 2), T9 must see exactly 3×200 then 3×429.
|
||
* - T17 ADDED: GET /api/world/state — new core route, zero prior coverage.
|
||
* - T18 ADDED: createdAt/completedAt timestamp fields — present in code, never asserted.
|
||
* - T19 ADDED: X-RateLimit-* headers on /api/demo — set in code, never verified.
|
||
* - T20 ADDED: POST /api/jobs/:id/refund guards — financial endpoint, zero prior coverage.
|
||
* - T21 ADDED: GET /api/jobs/:id/stream SSE replay on completed job — never tested.
|
||
* - T22 ADDED: GET /api/sessions/:id unknown ID → 404 — never tested.
|
||
* - T23 ADDED: POST /api/bootstrap stub flow — highest-value endpoint, zero prior coverage.
|
||
* Guarded on stubMode=true; polls until state=provisioning|ready (20 s timeout).
|
||
* - T24 ADDED: costLedger completeness after job completion — 8 fields, honest-accounting
|
||
* invariant (actualAmountSats ≤ workAmountSats), refundState enum check.
|
||
*/
|
||
router.get("/testkit", (req: Request, res: Response) => {
|
||
const proto =
|
||
(req.headers["x-forwarded-proto"] as string | undefined)?.split(",")[0]?.trim() ?? "https";
|
||
const host = (req.headers["x-forwarded-host"] as string | undefined) ?? req.hostname;
|
||
const base = `${proto}://${host}`;
|
||
|
||
const script = `#!/usr/bin/env bash
|
||
set -euo pipefail
|
||
|
||
BASE="${base}"
|
||
|
||
echo "Timmy Test Kit"
|
||
echo "Target: \$BASE"
|
||
echo "$(date)"
|
||
echo
|
||
|
||
PASS=0
|
||
FAIL=0
|
||
SKIP=0
|
||
|
||
note() { echo " [\$1] \$2"; }
|
||
sep() { echo; echo "=== \$* ==="; }
|
||
# body_of: strip last line (HTTP status code) — works on GNU and BSD (macOS)
|
||
body_of() { echo "\$1" | sed '$d'; }
|
||
code_of() { echo "\$1" | tail -n1; }
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 1 — Health check
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 1 — Health check"
|
||
T1_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/healthz")
|
||
T1_BODY=$(body_of "\$T1_RES"); T1_CODE=$(code_of "\$T1_RES")
|
||
if [[ "\$T1_CODE" == "200" ]] && [[ "$(echo "\$T1_BODY" | jq -r '.status' 2>/dev/null)" == "ok" ]]; then
|
||
note PASS "HTTP 200, status=ok"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T1_CODE body=\$T1_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 2 — Create job
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 2 — Create job"
|
||
T2_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/jobs" \\
|
||
-H "Content-Type: application/json" \\
|
||
-d '{"request":"Explain the Lightning Network in two sentences"}')
|
||
T2_BODY=$(body_of "\$T2_RES"); T2_CODE=$(code_of "\$T2_RES")
|
||
JOB_ID=$(echo "\$T2_BODY" | jq -r '.jobId' 2>/dev/null || echo "")
|
||
EVAL_AMT=$(echo "\$T2_BODY" | jq -r '.evalInvoice.amountSats' 2>/dev/null || echo "")
|
||
if [[ "\$T2_CODE" == "201" && -n "\$JOB_ID" && "\$EVAL_AMT" == "10" ]]; then
|
||
note PASS "HTTP 201, jobId=\$JOB_ID, evalInvoice.amountSats=10"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T2_CODE body=\$T2_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 3 — Poll before payment
|
||
# Audit note: T3b ("paymentHash present as separate PASS") was removed here.
|
||
# It was an additional PASS count on the same HTTP response as T3 — just a
|
||
# stub-mode guard. Merged into a single assertion so the count is honest.
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 3 — Poll before payment"
|
||
T3_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/jobs/\$JOB_ID")
|
||
T3_BODY=$(body_of "\$T3_RES"); T3_CODE=$(code_of "\$T3_RES")
|
||
STATE_T3=$(echo "\$T3_BODY" | jq -r '.state' 2>/dev/null || echo "")
|
||
EVAL_AMT_ECHO=$(echo "\$T3_BODY" | jq -r '.evalInvoice.amountSats' 2>/dev/null || echo "")
|
||
EVAL_HASH=$(echo "\$T3_BODY" | jq -r '.evalInvoice.paymentHash' 2>/dev/null || echo "")
|
||
if [[ "\$T3_CODE" == "200" && "\$STATE_T3" == "awaiting_eval_payment" && \\
|
||
"\$EVAL_AMT_ECHO" == "10" && -n "\$EVAL_HASH" && "\$EVAL_HASH" != "null" ]]; then
|
||
note PASS "state=awaiting_eval_payment, evalInvoice echoed, paymentHash present (stub active)"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T3_CODE state=\$STATE_T3 evalAmt=\$EVAL_AMT_ECHO hash=\${EVAL_HASH:-missing}"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 4 — Pay eval invoice (stub endpoint)
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 4 — Pay eval invoice (stub)"
|
||
if [[ -n "\$EVAL_HASH" && "\$EVAL_HASH" != "null" ]]; then
|
||
T4_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/dev/stub/pay/\$EVAL_HASH")
|
||
T4_BODY=$(body_of "\$T4_RES"); T4_CODE=$(code_of "\$T4_RES")
|
||
if [[ "\$T4_CODE" == "200" ]] && [[ "$(echo "\$T4_BODY" | jq -r '.ok' 2>/dev/null)" == "true" ]]; then
|
||
note PASS "Eval invoice marked paid"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T4_CODE body=\$T4_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
else
|
||
note SKIP "No eval hash — skipping"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 5 — Poll after eval payment (with retry loop — real AI eval takes 2–5 s)
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 5 — Poll after eval (state advance)"
|
||
START_T5=$(date +%s)
|
||
T5_TIMEOUT=30
|
||
STATE_T5=""; WORK_AMT=""; WORK_HASH=""; T5_BODY=""; T5_CODE=""
|
||
while :; do
|
||
T5_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/jobs/\$JOB_ID")
|
||
T5_BODY=$(body_of "\$T5_RES"); T5_CODE=$(code_of "\$T5_RES")
|
||
STATE_T5=$(echo "\$T5_BODY" | jq -r '.state' 2>/dev/null || echo "")
|
||
WORK_AMT=$(echo "\$T5_BODY" | jq -r '.workInvoice.amountSats' 2>/dev/null || echo "")
|
||
WORK_HASH=$(echo "\$T5_BODY" | jq -r '.workInvoice.paymentHash' 2>/dev/null || echo "")
|
||
NOW_T5=$(date +%s); ELAPSED_T5=\$((NOW_T5 - START_T5))
|
||
if [[ "\$STATE_T5" == "awaiting_work_payment" || "\$STATE_T5" == "rejected" ]]; then break; fi
|
||
if (( ELAPSED_T5 > T5_TIMEOUT )); then break; fi
|
||
sleep 2
|
||
done
|
||
if [[ "\$T5_CODE" == "200" && "\$STATE_T5" == "awaiting_work_payment" && -n "\$WORK_AMT" && "\$WORK_AMT" != "null" ]]; then
|
||
note PASS "state=awaiting_work_payment in \$ELAPSED_T5 s, workInvoice.amountSats=\$WORK_AMT"
|
||
PASS=\$((PASS+1))
|
||
elif [[ "\$T5_CODE" == "200" && "\$STATE_T5" == "rejected" ]]; then
|
||
note PASS "Request correctly rejected by agent after eval (in \$ELAPSED_T5 s)"
|
||
PASS=\$((PASS+1))
|
||
WORK_HASH=""
|
||
else
|
||
note FAIL "code=\$T5_CODE state=\$STATE_T5 body=\$T5_BODY (after \$ELAPSED_T5 s)"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 6 — Pay work invoice + poll for result
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 6 — Pay work invoice + get result"
|
||
STATE_T6=""
|
||
if [[ "\$STATE_T5" == "awaiting_work_payment" && -n "\$WORK_HASH" && "\$WORK_HASH" != "null" ]]; then
|
||
T6_PAY_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/dev/stub/pay/\$WORK_HASH")
|
||
T6_PAY_BODY=$(body_of "\$T6_PAY_RES"); T6_PAY_CODE=$(code_of "\$T6_PAY_RES")
|
||
if [[ "\$T6_PAY_CODE" != "200" ]] || [[ "$(echo "\$T6_PAY_BODY" | jq -r '.ok' 2>/dev/null)" != "true" ]]; then
|
||
note FAIL "Work payment stub failed: code=\$T6_PAY_CODE body=\$T6_PAY_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
else
|
||
START_TS=$(date +%s)
|
||
TIMEOUT=30
|
||
while :; do
|
||
T6_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/jobs/\$JOB_ID")
|
||
T6_BODY=$(body_of "\$T6_RES")
|
||
STATE_T6=$(echo "\$T6_BODY" | jq -r '.state' 2>/dev/null || echo "")
|
||
RESULT_T6=$(echo "\$T6_BODY" | jq -r '.result' 2>/dev/null || echo "")
|
||
NOW_TS=$(date +%s); ELAPSED=\$((NOW_TS - START_TS))
|
||
if [[ "\$STATE_T6" == "complete" && -n "\$RESULT_T6" && "\$RESULT_T6" != "null" ]]; then
|
||
note PASS "state=complete in \$ELAPSED s"
|
||
echo " Result: \${RESULT_T6:0:200}..."
|
||
PASS=\$((PASS+1))
|
||
break
|
||
fi
|
||
if (( ELAPSED > TIMEOUT )); then
|
||
note FAIL "Timed out after \$TIMEOUT s. Last body: \$T6_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
break
|
||
fi
|
||
sleep 2
|
||
done
|
||
fi
|
||
else
|
||
note SKIP "No work hash (job may be rejected) — skipping"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 8 — Input validation
|
||
# Run BEFORE test 7 to avoid consuming rate-limit quota before T9 can count it.
|
||
# T8c hits /api/demo without ?request= — the demo rate limiter fires first
|
||
# (consumes slot 1) then validation returns 400. This is intentional ordering.
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 8 — Input validation"
|
||
|
||
T8A_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/jobs" \\
|
||
-H "Content-Type: application/json" -d '{}')
|
||
T8A_BODY=$(body_of "\$T8A_RES"); T8A_CODE=$(code_of "\$T8A_RES")
|
||
if [[ "\$T8A_CODE" == "400" && -n "$(echo "\$T8A_BODY" | jq -r '.error' 2>/dev/null)" ]]; then
|
||
note PASS "8a: Missing request body → HTTP 400"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "8a: code=\$T8A_CODE body=\$T8A_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
T8B_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/jobs/does-not-exist")
|
||
T8B_BODY=$(body_of "\$T8B_RES"); T8B_CODE=$(code_of "\$T8B_RES")
|
||
if [[ "\$T8B_CODE" == "404" && -n "$(echo "\$T8B_BODY" | jq -r '.error' 2>/dev/null)" ]]; then
|
||
note PASS "8b: Unknown job ID → HTTP 404"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "8b: code=\$T8B_CODE body=\$T8B_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# 8c: demo with no ?request= param. Rate limiter fires first (slot 1), then
|
||
# validation returns 400. Does NOT count as a 200 for rate-limit purposes.
|
||
T8C_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/demo")
|
||
T8C_BODY=$(body_of "\$T8C_RES"); T8C_CODE=$(code_of "\$T8C_RES")
|
||
if [[ "\$T8C_CODE" == "400" && -n "$(echo "\$T8C_BODY" | jq -r '.error' 2>/dev/null)" ]]; then
|
||
note PASS "8c: Demo missing param → HTTP 400"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "8c: code=\$T8C_CODE body=\$T8C_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
LONG_STR=$(node -e "process.stdout.write('x'.repeat(501))" 2>/dev/null || python3 -c "print('x'*501,end='')" 2>/dev/null || printf '%501s' | tr ' ' 'x')
|
||
T8D_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/jobs" \\
|
||
-H "Content-Type: application/json" \\
|
||
-d "{\\"request\\":\\"\$LONG_STR\\"}")
|
||
T8D_BODY=$(body_of "\$T8D_RES"); T8D_CODE=$(code_of "\$T8D_RES")
|
||
T8D_ERR=$(echo "\$T8D_BODY" | jq -r '.error' 2>/dev/null || echo "")
|
||
if [[ "\$T8D_CODE" == "400" && "\$T8D_ERR" == *"500 characters"* ]]; then
|
||
note PASS "8d: 501-char request → HTTP 400 with character limit error"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "8d: code=\$T8D_CODE body=\$T8D_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 7 — Demo endpoint (after T8, before rate-limit exhaustion in T9)
|
||
# Rate-limit slot accounting: T8c used slot 1. T7 uses slot 2. T9 gets 3 more.
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 7 — Demo endpoint"
|
||
START_DEMO=$(date +%s)
|
||
T7_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/demo?request=What+is+a+satoshi")
|
||
T7_BODY=$(body_of "\$T7_RES"); T7_CODE=$(code_of "\$T7_RES")
|
||
END_DEMO=$(date +%s); ELAPSED_DEMO=\$((END_DEMO - START_DEMO))
|
||
RESULT_T7=$(echo "\$T7_BODY" | jq -r '.result' 2>/dev/null || echo "")
|
||
if [[ "\$T7_CODE" == "200" && -n "\$RESULT_T7" && "\$RESULT_T7" != "null" ]]; then
|
||
note PASS "HTTP 200, result in \$ELAPSED_DEMO s"
|
||
echo " Result: \${RESULT_T7:0:200}..."
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T7_CODE body=\$T7_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 9 — Demo rate limiter
|
||
# Audit note: tightened from GOT_429 -ge 1 to -ge 3.
|
||
# Slot budget: T8c(1) + T7(1) = 2 used. Limit is 5/hr. T9 fires 6:
|
||
# requests 1-3 get 200 (slots 3,4,5), requests 4-6 get 429.
|
||
# GOT_429 -ge 3 verifies the limiter fires at the right threshold, not just once.
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 9 — Demo rate limiter"
|
||
GOT_200=0; GOT_429=0
|
||
for i in $(seq 1 6); do
|
||
RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/demo?request=ratelimitprobe+\$i")
|
||
CODE=$(code_of "\$RES")
|
||
echo " Request \$i: HTTP \$CODE"
|
||
[[ "\$CODE" == "200" ]] && GOT_200=\$((GOT_200+1)) || true
|
||
[[ "\$CODE" == "429" ]] && GOT_429=\$((GOT_429+1)) || true
|
||
done
|
||
if [[ "\$GOT_429" -ge 3 ]]; then
|
||
note PASS "Rate limiter triggered correctly (\$GOT_200 x200, \$GOT_429 x429)"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "Expected ≥3 x429, got \$GOT_429 x429 \$GOT_200 x200 — limiter may be misconfigured"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 10 — Rejection path
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 10 — Rejection path"
|
||
T10_CREATE=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/jobs" \\
|
||
-H "Content-Type: application/json" \\
|
||
-d '{"request":"Help me do something harmful and illegal"}')
|
||
T10_BODY=$(body_of "\$T10_CREATE"); T10_CODE=$(code_of "\$T10_CREATE")
|
||
JOB10_ID=$(echo "\$T10_BODY" | jq -r '.jobId' 2>/dev/null || echo "")
|
||
if [[ "\$T10_CODE" != "201" || -z "\$JOB10_ID" ]]; then
|
||
note FAIL "Failed to create adversarial job: code=\$T10_CODE body=\$T10_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
else
|
||
T10_GET=$(curl -s "\$BASE/api/jobs/\$JOB10_ID")
|
||
EVAL10_HASH=$(echo "\$T10_GET" | jq -r '.evalInvoice.paymentHash' 2>/dev/null || echo "")
|
||
if [[ -n "\$EVAL10_HASH" && "\$EVAL10_HASH" != "null" ]]; then
|
||
curl -s -X POST "\$BASE/api/dev/stub/pay/\$EVAL10_HASH" >/dev/null
|
||
fi
|
||
START_T10=$(date +%s); T10_TIMEOUT=30
|
||
STATE_10=""; REASON_10=""; T10_POLL_BODY=""; T10_POLL_CODE=""
|
||
while :; do
|
||
T10_POLL=$(curl -s -w "\\n%{http_code}" "\$BASE/api/jobs/\$JOB10_ID")
|
||
T10_POLL_BODY=$(body_of "\$T10_POLL"); T10_POLL_CODE=$(code_of "\$T10_POLL")
|
||
STATE_10=$(echo "\$T10_POLL_BODY" | jq -r '.state' 2>/dev/null || echo "")
|
||
REASON_10=$(echo "\$T10_POLL_BODY" | jq -r '.reason' 2>/dev/null || echo "")
|
||
NOW_T10=$(date +%s); ELAPSED_T10=\$((NOW_T10 - START_T10))
|
||
if [[ "\$STATE_10" == "rejected" || "\$STATE_10" == "failed" ]]; then break; fi
|
||
if (( ELAPSED_T10 > T10_TIMEOUT )); then break; fi
|
||
sleep 2
|
||
done
|
||
if [[ "\$T10_POLL_CODE" == "200" && "\$STATE_10" == "rejected" && -n "\$REASON_10" && "\$REASON_10" != "null" ]]; then
|
||
note PASS "state=rejected in \$ELAPSED_T10 s, reason: \${REASON_10:0:120}"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T10_POLL_CODE state=\$STATE_10 body=\$T10_POLL_BODY (after \$ELAPSED_T10 s)"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 17 — World state endpoint (GET /api/world/state)
|
||
# Core new route — previously zero coverage.
|
||
# Verifies shape: timmyState.{mood,activity}, agentStates.{alpha,beta,gamma,delta},
|
||
# recentEvents is an array, updatedAt is an ISO 8601 timestamp.
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 17 — World state endpoint"
|
||
T17_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/world/state")
|
||
T17_BODY=$(body_of "\$T17_RES"); T17_CODE=$(code_of "\$T17_RES")
|
||
T17_MOOD=$(echo "\$T17_BODY" | jq -r '.timmyState.mood' 2>/dev/null || echo "")
|
||
T17_ACT=$(echo "\$T17_BODY" | jq -r '.timmyState.activity' 2>/dev/null || echo "")
|
||
T17_ALPHA=$(echo "\$T17_BODY" | jq -r '.agentStates.alpha' 2>/dev/null || echo "")
|
||
T17_BETA=$(echo "\$T17_BODY" | jq -r '.agentStates.beta' 2>/dev/null || echo "")
|
||
T17_EVENTS_TYPE=$(echo "\$T17_BODY" | jq -r '.recentEvents | type' 2>/dev/null || echo "")
|
||
T17_UPDATED=$(echo "\$T17_BODY" | jq -r '.updatedAt' 2>/dev/null || echo "")
|
||
T17_DATE_OK=false
|
||
[[ "\$T17_UPDATED" =~ ^[0-9]{4}-[0-9]{2}-[0-9]{2}T ]] && T17_DATE_OK=true || true
|
||
if [[ "\$T17_CODE" == "200" \\
|
||
&& -n "\$T17_MOOD" && "\$T17_MOOD" != "null" \\
|
||
&& -n "\$T17_ACT" && "\$T17_ACT" != "null" \\
|
||
&& -n "\$T17_ALPHA" && "\$T17_ALPHA" != "null" \\
|
||
&& -n "\$T17_BETA" && "\$T17_BETA" != "null" \\
|
||
&& "\$T17_EVENTS_TYPE" == "array" \\
|
||
&& "\$T17_DATE_OK" == "true" ]]; then
|
||
note PASS "HTTP 200, timmyState={\$T17_MOOD/\$T17_ACT}, agentStates present, recentEvents=array, updatedAt=ISO"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T17_CODE mood=\$T17_MOOD act=\$T17_ACT alpha=\$T17_ALPHA events=\$T17_EVENTS_TYPE updated=\$T17_UPDATED"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 18 — Job response timestamps (createdAt / completedAt)
|
||
# These fields exist in the code but were never asserted in any test.
|
||
# Uses the main JOB_ID from T2/T6 (state depends on whether T6 completed).
|
||
# Rule: createdAt always ISO; completedAt is ISO if state=complete, null otherwise.
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 18 — Job response timestamps (createdAt / completedAt)"
|
||
if [[ -n "\$JOB_ID" ]]; then
|
||
T18_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/jobs/\$JOB_ID")
|
||
T18_BODY=$(body_of "\$T18_RES"); T18_CODE=$(code_of "\$T18_RES")
|
||
T18_STATE=$(echo "\$T18_BODY" | jq -r '.state' 2>/dev/null || echo "")
|
||
T18_CREATED=$(echo "\$T18_BODY" | jq -r '.createdAt' 2>/dev/null || echo "")
|
||
T18_COMPLETED=$(echo "\$T18_BODY" | jq -r '.completedAt' 2>/dev/null || echo "")
|
||
T18_OK=true
|
||
# createdAt must always be an ISO timestamp
|
||
[[ "\$T18_CREATED" =~ ^[0-9]{4}-[0-9]{2}-[0-9]{2}T ]] || T18_OK=false
|
||
# completedAt is ISO when state=complete, null (the JSON null string) otherwise
|
||
if [[ "\$T18_STATE" == "complete" ]]; then
|
||
[[ "\$T18_COMPLETED" =~ ^[0-9]{4}-[0-9]{2}-[0-9]{2}T ]] || T18_OK=false
|
||
else
|
||
[[ "\$T18_COMPLETED" == "null" ]] || T18_OK=false
|
||
fi
|
||
if [[ "\$T18_CODE" == "200" && "\$T18_OK" == "true" ]]; then
|
||
note PASS "createdAt=\${T18_CREATED:0:24} completedAt=\$T18_COMPLETED (state=\$T18_STATE)"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T18_CODE createdAt=\$T18_CREATED completedAt=\$T18_COMPLETED state=\$T18_STATE"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
else
|
||
note SKIP "No job ID — skipping"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 19 — X-RateLimit-* headers on /api/demo responses
|
||
# These headers are always set (even on 429). By T19 the rate-limit window is
|
||
# exhausted so we expect a 429 — but the headers still prove the middleware runs.
|
||
# Uses curl -si to capture both headers and body in one pass.
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 19 — X-RateLimit-* response headers on /api/demo"
|
||
T19_OUT=$(curl -si "\$BASE/api/demo?request=header+probe+test" 2>/dev/null || true)
|
||
T19_LIMIT=$(echo "\$T19_OUT" | grep -i "^X-RateLimit-Limit:" | head -1 | tr -d '\\r' | awk '{print \$2}')
|
||
T19_REMAINING=$(echo "\$T19_OUT" | grep -i "^X-RateLimit-Remaining:" | head -1 | tr -d '\\r' | awk '{print \$2}')
|
||
T19_RESET=$(echo "\$T19_OUT" | grep -i "^X-RateLimit-Reset:" | head -1 | tr -d '\\r' | awk '{print \$2}')
|
||
if [[ -n "\$T19_LIMIT" && -n "\$T19_REMAINING" && -n "\$T19_RESET" ]]; then
|
||
note PASS "X-RateLimit-Limit=\$T19_LIMIT X-RateLimit-Remaining=\$T19_REMAINING X-RateLimit-Reset=\$T19_RESET"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "Missing rate-limit headers: Limit='\$T19_LIMIT' Remaining='\$T19_REMAINING' Reset='\$T19_RESET'"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 20 — Refund endpoint guards (POST /api/jobs/:id/refund)
|
||
# This financial endpoint was completely untested. Three guard cases:
|
||
# 20a: missing invoice body → 400 (fires before job-state check)
|
||
# 20b: unknown job ID → 404
|
||
# 20c: non-complete job → 409 "not complete" (fresh awaiting_eval_payment job)
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 20 — Refund endpoint guards"
|
||
|
||
# 20a: missing invoice field — 400 fires before any state checks
|
||
if [[ -n "\$JOB_ID" ]]; then
|
||
T20A_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/jobs/\$JOB_ID/refund" \\
|
||
-H "Content-Type: application/json" -d '{}')
|
||
T20A_BODY=$(body_of "\$T20A_RES"); T20A_CODE=$(code_of "\$T20A_RES")
|
||
if [[ "\$T20A_CODE" == "400" ]]; then
|
||
note PASS "20a: Missing invoice body → HTTP 400"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "20a: Expected 400, got code=\$T20A_CODE body=\$T20A_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
else
|
||
note SKIP "20a: No job ID"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# 20b: unknown job → 404
|
||
T20B_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/jobs/does-not-exist/refund" \\
|
||
-H "Content-Type: application/json" -d '{"invoice":"lnbc1testplaceholder"}')
|
||
T20B_CODE=$(code_of "\$T20B_RES")
|
||
if [[ "\$T20B_CODE" == "404" ]]; then
|
||
note PASS "20b: Unknown job ID → HTTP 404"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "20b: Expected 404, got code=\$T20B_CODE"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# 20c: create a fresh job (awaiting_eval_payment) — refund must reject with 409
|
||
T20C_NEW=$(curl -s -X POST "\$BASE/api/jobs" \\
|
||
-H "Content-Type: application/json" \\
|
||
-d '{"request":"Refund guard probe — not harmful"}')
|
||
T20C_ID=$(echo "\$T20C_NEW" | jq -r '.jobId' 2>/dev/null || echo "")
|
||
if [[ -n "\$T20C_ID" && "\$T20C_ID" != "null" ]]; then
|
||
T20C_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/jobs/\$T20C_ID/refund" \\
|
||
-H "Content-Type: application/json" -d '{"invoice":"lnbc1testplaceholder"}')
|
||
T20C_BODY=$(body_of "\$T20C_RES"); T20C_CODE=$(code_of "\$T20C_RES")
|
||
if [[ "\$T20C_CODE" == "409" ]]; then
|
||
note PASS "20c: Non-complete job (awaiting_eval_payment) → HTTP 409"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "20c: Expected 409, got code=\$T20C_CODE body=\$T20C_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
else
|
||
note SKIP "20c: Could not create probe job"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 21 — SSE stream replay on completed job (GET /api/jobs/:id/stream)
|
||
# For a complete job the handler immediately sends token + done and closes.
|
||
# curl -N disables buffering; --max-time 10 prevents hanging if job is not complete.
|
||
# Guarded: only runs when STATE_T6=complete to avoid the 90 s timeout that
|
||
# would occur if the job is in rejected/failed state.
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 21 — SSE stream replays completed job result"
|
||
if [[ -n "\$JOB_ID" && "\$STATE_T6" == "complete" ]]; then
|
||
T21_STREAM=$(curl -sN --max-time 10 "\$BASE/api/jobs/\$JOB_ID/stream" 2>/dev/null || true)
|
||
if echo "\$T21_STREAM" | grep -q "^event: token" && echo "\$T21_STREAM" | grep -q "^event: done"; then
|
||
note PASS "SSE stream: received 'event: token' and 'event: done' events"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "SSE stream missing expected events. Got: \${T21_STREAM:0:300}"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
else
|
||
note SKIP "Skipping — job not complete (STATE_T6=\${STATE_T6:-not_set}) or no job ID"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 11 — Session: create session
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 11 — Session: create session (awaiting_payment)"
|
||
T11_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/sessions" \\
|
||
-H "Content-Type: application/json" \\
|
||
-d '{"amount_sats": 200}')
|
||
T11_BODY=$(body_of "\$T11_RES"); T11_CODE=$(code_of "\$T11_RES")
|
||
SESSION_ID=$(echo "\$T11_BODY" | jq -r '.sessionId' 2>/dev/null || echo "")
|
||
T11_STATE=$(echo "\$T11_BODY" | jq -r '.state' 2>/dev/null || echo "")
|
||
T11_AMT=$(echo "\$T11_BODY" | jq -r '.invoice.amountSats' 2>/dev/null || echo "")
|
||
DEPOSIT_HASH=$(echo "\$T11_BODY" | jq -r '.invoice.paymentHash' 2>/dev/null || echo "")
|
||
if [[ "\$T11_CODE" == "201" && -n "\$SESSION_ID" && "\$T11_STATE" == "awaiting_payment" && "\$T11_AMT" == "200" ]]; then
|
||
note PASS "HTTP 201, sessionId=\$SESSION_ID, state=awaiting_payment, amount=200"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T11_CODE body=\$T11_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 12 — Session: poll before payment
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 12 — Session: poll before payment"
|
||
T12_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/sessions/\$SESSION_ID")
|
||
T12_BODY=$(body_of "\$T12_RES"); T12_CODE=$(code_of "\$T12_RES")
|
||
T12_STATE=$(echo "\$T12_BODY" | jq -r '.state' 2>/dev/null || echo "")
|
||
if [[ -z "\$DEPOSIT_HASH" || "\$DEPOSIT_HASH" == "null" ]]; then
|
||
DEPOSIT_HASH=$(echo "\$T12_BODY" | jq -r '.invoice.paymentHash' 2>/dev/null || echo "")
|
||
fi
|
||
if [[ "\$T12_CODE" == "200" && "\$T12_STATE" == "awaiting_payment" ]]; then
|
||
note PASS "state=awaiting_payment before payment"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T12_CODE body=\$T12_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 13 — Session: pay deposit + activate
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 13 — Session: pay deposit (stub) + auto-advance to active"
|
||
SESSION_MACAROON=""
|
||
if [[ -n "\$DEPOSIT_HASH" && "\$DEPOSIT_HASH" != "null" ]]; then
|
||
curl -s -X POST "\$BASE/api/dev/stub/pay/\$DEPOSIT_HASH" >/dev/null
|
||
sleep 1
|
||
T13_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/sessions/\$SESSION_ID")
|
||
T13_BODY=$(body_of "\$T13_RES"); T13_CODE=$(code_of "\$T13_RES")
|
||
T13_STATE=$(echo "\$T13_BODY" | jq -r '.state' 2>/dev/null || echo "")
|
||
T13_BAL=$(echo "\$T13_BODY" | jq -r '.balanceSats' 2>/dev/null || echo "")
|
||
SESSION_MACAROON=$(echo "\$T13_BODY" | jq -r '.macaroon' 2>/dev/null || echo "")
|
||
if [[ "\$T13_CODE" == "200" && "\$T13_STATE" == "active" && "\$T13_BAL" == "200" && -n "\$SESSION_MACAROON" && "\$SESSION_MACAROON" != "null" ]]; then
|
||
note PASS "state=active, balanceSats=200, macaroon present"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T13_CODE state=\$T13_STATE bal=\$T13_BAL body=\$T13_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
else
|
||
note SKIP "No deposit hash (stub mode not active)"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 14 — Session: submit request (accepted path)
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 14 — Session: submit request (accepted)"
|
||
if [[ -n "\$SESSION_MACAROON" && "\$SESSION_MACAROON" != "null" ]]; then
|
||
START_T14=$(date +%s)
|
||
T14_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/sessions/\$SESSION_ID/request" \\
|
||
-H "Content-Type: application/json" \\
|
||
-H "Authorization: Bearer \$SESSION_MACAROON" \\
|
||
-d '{"request":"What is Bitcoin in one sentence?"}')
|
||
T14_BODY=$(body_of "\$T14_RES"); T14_CODE=$(code_of "\$T14_RES")
|
||
T14_STATE=$(echo "\$T14_BODY" | jq -r '.state' 2>/dev/null || echo "")
|
||
T14_DEBITED=$(echo "\$T14_BODY" | jq -r '.debitedSats' 2>/dev/null || echo "")
|
||
T14_BAL=$(echo "\$T14_BODY" | jq -r '.balanceRemaining' 2>/dev/null || echo "")
|
||
END_T14=$(date +%s); ELAPSED_T14=\$((END_T14 - START_T14))
|
||
if [[ "\$T14_CODE" == "200" && ("\$T14_STATE" == "complete" || "\$T14_STATE" == "rejected") && -n "\$T14_DEBITED" && "\$T14_DEBITED" != "null" && -n "\$T14_BAL" ]]; then
|
||
note PASS "state=\$T14_STATE in \${ELAPSED_T14}s, debitedSats=\$T14_DEBITED, balanceRemaining=\$T14_BAL"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T14_CODE body=\$T14_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
else
|
||
note SKIP "No macaroon — skipping"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 15 — Session: missing/invalid macaroon → 401
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 15 — Session: reject request without valid macaroon"
|
||
if [[ -n "\$SESSION_ID" ]]; then
|
||
T15_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/sessions/\$SESSION_ID/request" \\
|
||
-H "Content-Type: application/json" \\
|
||
-d '{"request":"What is Bitcoin?"}')
|
||
T15_CODE=$(code_of "\$T15_RES")
|
||
if [[ "\$T15_CODE" == "401" ]]; then
|
||
note PASS "HTTP 401 without macaroon"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "Expected 401, got code=\$T15_CODE"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
else
|
||
note SKIP "No session ID — skipping"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 16 — Session: topup invoice creation
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 16 — Session: topup invoice creation"
|
||
if [[ -n "\$SESSION_MACAROON" && "\$SESSION_MACAROON" != "null" ]]; then
|
||
T16_RES=$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/sessions/\$SESSION_ID/topup" \\
|
||
-H "Content-Type: application/json" \\
|
||
-H "Authorization: Bearer \$SESSION_MACAROON" \\
|
||
-d '{"amount_sats": 500}')
|
||
T16_BODY=$(body_of "\$T16_RES"); T16_CODE=$(code_of "\$T16_RES")
|
||
T16_PR=$(echo "\$T16_BODY" | jq -r '.topup.paymentRequest' 2>/dev/null || echo "")
|
||
T16_AMT=$(echo "\$T16_BODY" | jq -r '.topup.amountSats' 2>/dev/null || echo "")
|
||
if [[ "\$T16_CODE" == "200" && -n "\$T16_PR" && "\$T16_PR" != "null" && "\$T16_AMT" == "500" ]]; then
|
||
note PASS "Topup invoice created, amountSats=500"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T16_CODE body=\$T16_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
else
|
||
note SKIP "No macaroon — skipping"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 22 — Session: unknown session ID → 404
|
||
# Previously zero coverage. Sessions GET was only tested with a valid ID (T12).
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 22 — Session: unknown session ID → 404"
|
||
T22_RES=$(curl -s -w "\\n%{http_code}" "\$BASE/api/sessions/does-not-exist")
|
||
T22_BODY=$(body_of "\$T22_RES"); T22_CODE=$(code_of "\$T22_RES")
|
||
T22_ERR=$(echo "\$T22_BODY" | jq -r '.error' 2>/dev/null || echo "")
|
||
if [[ "\$T22_CODE" == "404" && -n "\$T22_ERR" && "\$T22_ERR" != "null" ]]; then
|
||
note PASS "HTTP 404 with error field for unknown session ID"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "Expected 404 with error, got code=\$T22_CODE body=\$T22_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 23 — Bootstrap: create → stub-pay → poll provisioning state
|
||
# Highest-value paid feature (10,000 sats default) — previously zero coverage.
|
||
# Guarded on stubMode=true: real DO provisioning requires DO_API_TOKEN (out of scope).
|
||
# Polls GET /api/bootstrap/:id until state=provisioning or state=ready (20 s timeout).
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 23 — Bootstrap: create + stub-pay + poll provisioning"
|
||
T23_RES=\$(curl -s -w "\\n%{http_code}" -X POST "\$BASE/api/bootstrap" \\
|
||
-H "Content-Type: application/json")
|
||
T23_BODY=\$(body_of "\$T23_RES"); T23_CODE=\$(code_of "\$T23_RES")
|
||
BOOTSTRAP_ID=\$(echo "\$T23_BODY" | jq -r '.bootstrapJobId' 2>/dev/null || echo "")
|
||
T23_STUB=\$(echo "\$T23_BODY" | jq -r '.stubMode' 2>/dev/null || echo "false")
|
||
BOOTSTRAP_HASH=\$(echo "\$T23_BODY" | jq -r '.invoice.paymentHash' 2>/dev/null || echo "")
|
||
if [[ "\$T23_CODE" != "201" || -z "\$BOOTSTRAP_ID" || "\$BOOTSTRAP_ID" == "null" ]]; then
|
||
note FAIL "Bootstrap create failed: code=\$T23_CODE body=\$T23_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
elif [[ "\$T23_STUB" != "true" ]]; then
|
||
note SKIP "stubMode=false — skipping (requires DO_API_TOKEN for real provisioning)"
|
||
SKIP=\$((SKIP+1))
|
||
elif [[ -z "\$BOOTSTRAP_HASH" || "\$BOOTSTRAP_HASH" == "null" ]]; then
|
||
note FAIL "stubMode=true but invoice.paymentHash missing — cannot stub-pay: body=\$T23_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
else
|
||
curl -s -X POST "\$BASE/api/dev/stub/pay/\$BOOTSTRAP_HASH" >/dev/null
|
||
START_T23=\$(date +%s); T23_TIMEOUT=20
|
||
T23_STATE=""; T23_MSG=""; T23_POLL_CODE=""; T23_POLL_ID=""
|
||
while :; do
|
||
T23_POLL=\$(curl -s -w "\\n%{http_code}" "\$BASE/api/bootstrap/\$BOOTSTRAP_ID")
|
||
T23_POLL_BODY=\$(body_of "\$T23_POLL"); T23_POLL_CODE=\$(code_of "\$T23_POLL")
|
||
T23_STATE=\$(echo "\$T23_POLL_BODY" | jq -r '.state' 2>/dev/null || echo "")
|
||
T23_MSG=\$(echo "\$T23_POLL_BODY" | jq -r '.message' 2>/dev/null || echo "")
|
||
T23_POLL_ID=\$(echo "\$T23_POLL_BODY" | jq -r '.bootstrapJobId' 2>/dev/null || echo "")
|
||
NOW_T23=\$(date +%s); ELAPSED_T23=\$((NOW_T23 - START_T23))
|
||
if [[ "\$T23_STATE" == "provisioning" || "\$T23_STATE" == "ready" ]]; then break; fi
|
||
if (( ELAPSED_T23 > T23_TIMEOUT )); then break; fi
|
||
sleep 2
|
||
done
|
||
if [[ "\$T23_POLL_CODE" == "200" \\
|
||
&& ("\$T23_STATE" == "provisioning" || "\$T23_STATE" == "ready") \\
|
||
&& -n "\$T23_MSG" && "\$T23_MSG" != "null" \\
|
||
&& "\$T23_POLL_ID" == "\$BOOTSTRAP_ID" ]]; then
|
||
note PASS "state=\$T23_STATE in \$ELAPSED_T23 s, message present, bootstrapJobId=\$BOOTSTRAP_ID (echoed in poll)"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T23_POLL_CODE state=\$T23_STATE elapsed=\${ELAPSED_T23}s pollId=\$T23_POLL_ID (expected \$BOOTSTRAP_ID) body=\$T23_POLL_BODY"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Test 24 — Cost ledger completeness after job completion
|
||
# Uses the completed JOB_ID from T6 (guarded on STATE_T6=complete).
|
||
# Verifies 8 cost-ledger fields are non-null:
|
||
# actualInputTokens, actualOutputTokens, totalTokens, actualCostUsd,
|
||
# actualAmountSats, workAmountSats, refundAmountSats, refundState.
|
||
# Honest-accounting invariant: actualAmountSats <= workAmountSats.
|
||
# refundState must be one of: not_applicable | pending | paid.
|
||
# ---------------------------------------------------------------------------
|
||
sep "Test 24 — Cost ledger completeness (job completed)"
|
||
if [[ -n "\$JOB_ID" && "\$STATE_T6" == "complete" ]]; then
|
||
T24_RES=\$(curl -s -w "\\n%{http_code}" "\$BASE/api/jobs/\$JOB_ID")
|
||
T24_BODY=\$(body_of "\$T24_RES"); T24_CODE=\$(code_of "\$T24_RES")
|
||
T24_LEDGER=\$(echo "\$T24_BODY" | jq '.costLedger' 2>/dev/null || echo "null")
|
||
T24_REFUND_STATE=\$(echo "\$T24_LEDGER" | jq -r '.refundState' 2>/dev/null || echo "")
|
||
T24_FIELDS_OK=true
|
||
for field in actualInputTokens actualOutputTokens totalTokens actualCostUsd actualAmountSats workAmountSats refundAmountSats refundState; do
|
||
VAL=\$(echo "\$T24_LEDGER" | jq -r ".\$field" 2>/dev/null || echo "MISSING")
|
||
[[ -z "\$VAL" || "\$VAL" == "null" ]] && T24_FIELDS_OK=false || true
|
||
done
|
||
T24_INV_OK=\$(echo "\$T24_LEDGER" | jq '
|
||
(.actualAmountSats != null) and
|
||
(.workAmountSats != null) and
|
||
(.actualAmountSats <= .workAmountSats) and
|
||
(.refundAmountSats >= 0)
|
||
' 2>/dev/null || echo "false")
|
||
if [[ "\$T24_CODE" == "200" \\
|
||
&& "\$T24_LEDGER" != "null" \\
|
||
&& "\$T24_FIELDS_OK" == "true" \\
|
||
&& "\$T24_INV_OK" == "true" \\
|
||
&& "\$T24_REFUND_STATE" =~ ^(not_applicable|pending|paid)\$ ]]; then
|
||
T24_ACTUAL=\$(echo "\$T24_LEDGER" | jq -r '.actualAmountSats' 2>/dev/null || echo "?")
|
||
T24_WORK=\$(echo "\$T24_LEDGER" | jq -r '.workAmountSats' 2>/dev/null || echo "?")
|
||
T24_REFUND=\$(echo "\$T24_LEDGER" | jq -r '.refundAmountSats' 2>/dev/null || echo "?")
|
||
note PASS "8 fields non-null, actualAmountSats(\$T24_ACTUAL)<=workAmountSats(\$T24_WORK), refundAmountSats=\$T24_REFUND, refundState=\$T24_REFUND_STATE"
|
||
PASS=\$((PASS+1))
|
||
else
|
||
note FAIL "code=\$T24_CODE ledger=\$T24_LEDGER fields_ok=\$T24_FIELDS_OK inv_ok=\$T24_INV_OK refundState=\$T24_REFUND_STATE"
|
||
FAIL=\$((FAIL+1))
|
||
fi
|
||
else
|
||
note SKIP "Skipping — job not complete (STATE_T6=\${STATE_T6:-not_set}) or no JOB_ID"
|
||
SKIP=\$((SKIP+1))
|
||
fi
|
||
|
||
# ---------------------------------------------------------------------------
|
||
# Summary
|
||
# ---------------------------------------------------------------------------
|
||
echo
|
||
echo "======================================="
|
||
echo " RESULTS: PASS=\$PASS FAIL=\$FAIL SKIP=\$SKIP"
|
||
echo "======================================="
|
||
if [[ "\$FAIL" -gt 0 ]]; then exit 1; fi
|
||
`;
|
||
|
||
res.setHeader("Content-Type", "text/x-shellscript; charset=utf-8");
|
||
res.setHeader("Content-Disposition", 'inline; filename="timmy_test.sh"');
|
||
res.send(script);
|
||
});
|
||
|
||
/**
|
||
* GET /api/testkit/plan
|
||
*
|
||
* Returns TIMMY_TEST_PLAN.md verbatim as text/markdown.
|
||
* Path resolves from the project root regardless of cwd.
|
||
*/
|
||
const _dirname = dirname(fileURLToPath(import.meta.url));
|
||
const PLAN_PATH = resolve(_dirname, "../../../../TIMMY_TEST_PLAN.md");
|
||
|
||
router.get("/testkit/plan", (_req: Request, res: Response) => {
|
||
let content: string;
|
||
try {
|
||
content = readFileSync(PLAN_PATH, "utf-8");
|
||
} catch {
|
||
res.status(500).json({ error: "TIMMY_TEST_PLAN.md not found on server" });
|
||
return;
|
||
}
|
||
res.setHeader("Content-Type", "text/markdown; charset=utf-8");
|
||
res.send(content);
|
||
});
|
||
|
||
/**
|
||
* GET /api/testkit/report
|
||
*
|
||
* Returns only the report template section from TIMMY_TEST_PLAN.md —
|
||
* everything from the "## Report template" heading to end-of-file.
|
||
* Returned as text/plain so agents can copy and fill in directly.
|
||
*/
|
||
router.get("/testkit/report", (_req: Request, res: Response) => {
|
||
let content: string;
|
||
try {
|
||
content = readFileSync(PLAN_PATH, "utf-8");
|
||
} catch {
|
||
res.status(500).json({ error: "TIMMY_TEST_PLAN.md not found on server" });
|
||
return;
|
||
}
|
||
const marker = "## Report template";
|
||
const idx = content.indexOf(marker);
|
||
if (idx === -1) {
|
||
res.status(500).json({ error: "Report template section not found in plan" });
|
||
return;
|
||
}
|
||
res.setHeader("Content-Type", "text/plain; charset=utf-8");
|
||
res.send(content.slice(idx));
|
||
});
|
||
|
||
export default router;
|