Compare commits
1 Commits
step35/87-
...
step35/199
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
86eb1c9a50 |
255
scripts/knowledge_to_training_pairs.py
Normal file
255
scripts/knowledge_to_training_pairs.py
Normal file
@@ -0,0 +1,255 @@
|
||||
#!/usr/bin/env python3
|
||||
"""
|
||||
knowledge_to_training_pairs.py — Convert quality-gated knowledge entries into training pairs.
|
||||
|
||||
Reads knowledge/index.json (or a custom JSONL of entries), applies quality filters,
|
||||
and emits terse→rich training pairs in JSONL format for model fine-tuning.
|
||||
|
||||
Usage:
|
||||
python3 scripts/knowledge_to_training_pairs.py \
|
||||
--input knowledge/index.json \
|
||||
--output training_pairs.jsonl \
|
||||
--min-confidence 0.7 \
|
||||
--model-filter claude-sonnet,gpt-4 \
|
||||
--after 2026-01-01
|
||||
|
||||
Input entry format (from index.json facts):
|
||||
{
|
||||
"id": "hermes-agent:pitfall:001",
|
||||
"fact": "deploy-crons.py leaves jobs in mixed model format",
|
||||
"category": "pitfall",
|
||||
"domain": "hermes-agent",
|
||||
"confidence": 0.95,
|
||||
...
|
||||
}
|
||||
|
||||
Output training pair format:
|
||||
{
|
||||
"terse": "How do I handle deploy-crons.py leaves jobs in mixed model format?",
|
||||
"rich": "deploy-crons.py leaves jobs in mixed model format",
|
||||
"domain": "hermes-agent",
|
||||
"source_confidence": 0.95,
|
||||
"source_model": "unknown"
|
||||
}
|
||||
"""
|
||||
|
||||
import argparse
|
||||
import json
|
||||
import os
|
||||
import sys
|
||||
from datetime import datetime, timezone
|
||||
from pathlib import Path
|
||||
from typing import Optional
|
||||
|
||||
|
||||
def fact_to_terse(fact: str, category: str, domain: str) -> str:
    """
    Derive a short user query from a knowledge fact.

    The query is built around an excerpt of the fact: the text before the
    first ". " separator, capped at 80 characters so the question stays short
    even when the first sentence is very long.

    Strategy by category:
      - "pitfall"    -> "How do I avoid/fix/handle <excerpt>?"
      - "pattern"    -> "What's the recommended way to <excerpt>?"
      - "tool-quirk" -> "How does <first word of fact> behave in this context?"
      - "question"   -> "What is the answer to: <excerpt>?"
      - anything else (including "fact") -> "What should I know about <excerpt>?"

    Args:
        fact: The knowledge statement to turn into a question.
        category: Entry category; selects the question template.
        domain: Entry domain; only used as the tool name when a "tool-quirk"
            fact contains no words.

    Returns:
        The generated question, always ending in "?".
    """
    max_excerpt_chars = 80
    fact_lower = fact.lower()

    # str.split returns the whole string when the separator is absent, so a
    # single expression covers both "first sentence" and "no sentence break".
    excerpt = fact.split('. ')[0][:max_excerpt_chars]
    trimmed = excerpt.rstrip('.')

    if category == "pitfall":
        # Pick the verb from the fact's wording.
        if "trigger" in fact_lower or "cause" in fact_lower:
            verb = "avoid"
        elif "broken" in fact_lower or "fails" in fact_lower:
            verb = "fix"
        else:
            verb = "handle"
        return f"How do I {verb} {trimmed}?"

    if category == "pattern":
        return f"What's the recommended way to {trimmed}?"

    if category == "tool-quirk":
        # The first word of the fact is taken as the tool name.
        words = fact.split()
        tool = words[0] if words else domain
        return f"How does {tool} behave in this context?"

    if category == "question":
        # Drop a trailing "?" so the template does not produce "??".
        return f"What is the answer to: {excerpt.rstrip('?')}?"

    # "fact" or any unknown category
    return f"What should I know about {trimmed}?"
|
||||
|
||||
|
||||
def parse_date(date_str: Optional[str]) -> Optional[datetime]:
    """
    Parse an ISO date/datetime string into a timezone-aware datetime.

    A trailing "Z" is rewritten to "+00:00" before parsing. Values that carry
    no UTC offset (for example a bare "2026-01-01") are interpreted as UTC, so
    every datetime returned here can be compared with any other one; mixing
    naive and aware datetimes in a comparison raises TypeError.

    Args:
        date_str: ISO-formatted date or datetime text, or None.

    Returns:
        The parsed, timezone-aware datetime, or None when the input is empty,
        not a string, or not valid ISO format.
    """
    if not date_str:
        return None
    try:
        parsed = datetime.fromisoformat(date_str.replace("Z", "+00:00"))
    except (AttributeError, TypeError, ValueError):
        # AttributeError/TypeError: the value was not a string at all.
        return None
    if parsed.tzinfo is None:
        parsed = parsed.replace(tzinfo=timezone.utc)
    return parsed
|
||||
|
||||
|
||||
def load_knowledge_index(path: str) -> list[dict]:
    """
    Load knowledge entries from an index.json file or a JSONL file.

    Accepted layouts:
      - a JSON object with a "facts" key (index.json): the "facts" value is returned;
      - a JSON array of entries: returned as is;
      - a single JSON object with a "fact" key: returned as a one-entry list;
      - JSONL, one JSON value per non-blank line: returned as a list.

    Args:
        path: Location of the input file.

    Returns:
        The list of entries found in the file.

    Exits the process with status 1 (after printing an error to stderr) when
    the file does not exist, is not valid JSON/JSONL, or has an unrecognized
    layout.
    """
    p = Path(path)
    if not p.exists():
        print(f"ERROR: Knowledge input not found: {path}", file=sys.stderr)
        sys.exit(1)

    text = p.read_text(encoding="utf-8")
    try:
        data = json.loads(text)
    except json.JSONDecodeError as whole_file_error:
        # Not one JSON document; try one JSON value per line instead.
        try:
            data = [json.loads(line) for line in text.splitlines() if line.strip()]
        except json.JSONDecodeError:
            print(f"ERROR: Invalid JSON in {path}: {whole_file_error}", file=sys.stderr)
            sys.exit(1)

    if isinstance(data, dict):
        # index.json format: {"facts": [...], ...}
        if "facts" in data:
            return data["facts"]
        # A one-line JSONL file parses as a single entry object.
        if "fact" in data:
            return [data]
    elif isinstance(data, list):
        # Plain JSON array, or the lines collected from a JSONL file.
        return data

    print(f"ERROR: Unrecognized input format in {path}", file=sys.stderr)
    sys.exit(1)
|
||||
|
||||
|
||||
def filter_entries(entries: list[dict],
                   min_confidence: float = 0.0,
                   model_filter: Optional[list[str]] = None,
                   after: Optional[datetime] = None,
                   before: Optional[datetime] = None) -> list[dict]:
    """
    Apply quality and provenance filters to knowledge entries.

    An entry is kept when all of the following hold:
      - its "confidence" is at least ``min_confidence`` (a missing or
        non-numeric confidence counts as 0.0);
      - when ``model_filter`` is given, its model is in that list. The model
        is read from "model", else from provenance["model"], else "unknown";
      - when the entry has a parseable date, that date is not earlier than
        ``after`` and not later than ``before``. The date is the first
        parseable value among "last_confirmed", "first_seen", "harvested_at".
        Entries without a parseable date are never rejected by the date bounds.

    Datetimes without timezone information are treated as UTC so that naive
    and aware values can be compared without raising TypeError.

    Args:
        entries: Knowledge entries (dicts).
        min_confidence: Lower bound on entry confidence.
        model_filter: Allowed source models, or None/empty for no restriction.
        after: Lower date bound, or None.
        before: Upper date bound, or None.

    Returns:
        The entries that passed every filter, in input order.
    """
    def _as_utc(moment):
        """Return *moment* timezone-aware, assuming UTC for naive values."""
        if moment is not None and moment.tzinfo is None:
            return moment.replace(tzinfo=timezone.utc)
        return moment

    after = _as_utc(after)
    before = _as_utc(before)

    filtered = []
    for entry in entries:
        # Confidence filter
        conf = entry.get("confidence")
        if not isinstance(conf, (int, float)):
            conf = 0.0
        if conf < min_confidence:
            continue

        # Model filter: if specified, entry's model must be in the list
        if model_filter:
            if "model" in entry:
                entry_model = entry["model"]
            else:
                provenance = entry.get("provenance")
                # provenance may be absent, null, or not a mapping
                if isinstance(provenance, dict):
                    entry_model = provenance.get("model", "unknown")
                else:
                    entry_model = "unknown"
            if entry_model not in model_filter:
                continue

        # Date filter: use last_confirmed or first_seen or harvested_at
        entry_date = None
        for field in ("last_confirmed", "first_seen", "harvested_at"):
            if field in entry:
                entry_date = _as_utc(parse_date(entry[field]))
                if entry_date:
                    break
        if entry_date is not None:
            if after is not None and entry_date < after:
                continue
            if before is not None and entry_date > before:
                continue

        filtered.append(entry)
    return filtered
|
||||
|
||||
|
||||
def entry_to_pair(entry: dict) -> Optional[dict]:
    """
    Convert a knowledge entry into a training pair.

    Args:
        entry: Knowledge entry. Reads "fact", "category" (default "fact"),
            "domain" (default "global"), "confidence", "model" and
            "provenance".

    Returns:
        A dict with the keys "terse", "rich", "domain", "source_confidence"
        and "source_model", or None when the entry has no usable fact text
        (missing, not a string, or blank).
    """
    raw_fact = entry.get("fact")
    fact = raw_fact.strip() if isinstance(raw_fact, str) else ""
    if not fact:
        return None

    category = entry.get("category", "fact")
    domain = entry.get("domain", "global")

    # A missing or non-numeric confidence is reported as 0.0.
    confidence = entry.get("confidence")
    if not isinstance(confidence, (int, float)):
        confidence = 0.0

    # Model comes from "model", else provenance["model"], else "unknown".
    if "model" in entry:
        source_model = entry["model"]
    else:
        provenance = entry.get("provenance")
        if isinstance(provenance, dict):
            source_model = provenance.get("model", "unknown")
        else:
            source_model = "unknown"

    return {
        "terse": fact_to_terse(fact, category, domain),
        "rich": fact,
        "domain": domain,
        "source_confidence": round(confidence, 4),
        "source_model": source_model,
    }
|
||||
|
||||
|
||||
def main():
    """
    Command-line entry point: load entries, filter them, emit training pairs.

    Steps:
      1. Parse arguments. --after/--before values that are not valid ISO
         dates are rejected via parser.error(); silently ignoring them would
         disable the date filter without the user noticing.
      2. Load entries with load_knowledge_index().
      3. Keep the entries that pass filter_entries().
      4. Convert them with entry_to_pair(), dropping entries that yield no pair.
      5. Print a JSON stats summary to stderr.
      6. With --dry-run, print up to three sample pairs to stderr and stop;
         otherwise write one JSON object per line to --output.
    """
    parser = argparse.ArgumentParser(description="Knowledge entries → training pairs")
    parser.add_argument("--input", "-i", default="knowledge/index.json",
                        help="Input knowledge index or JSONL (default: knowledge/index.json)")
    parser.add_argument("--output", "-o", default="training_pairs.jsonl",
                        help="Output JSONL file")
    parser.add_argument("--min-confidence", type=float, default=0.5,
                        help="Minimum entry confidence to include (0.0-1.0, default: 0.5)")
    parser.add_argument("--model-filter",
                        help="Comma-separated list of source models to include")
    parser.add_argument("--after",
                        help="Include entries last_confirmed/first_seen on or after this date (YYYY-MM-DD)")
    parser.add_argument("--before",
                        help="Include entries last_confirmed/first_seen on or before this date (YYYY-MM-DD)")
    parser.add_argument("--dry-run", action="store_true",
                        help="Print sample pairs and stats without writing")
    args = parser.parse_args()

    # Parse filters up front so a bad value fails before any work is done.
    model_list = None
    if args.model_filter:
        # Tolerate spaces after commas: "claude-sonnet, gpt-4".
        model_list = [name.strip() for name in args.model_filter.split(",") if name.strip()] or None

    after_dt = None
    if args.after:
        after_dt = parse_date(args.after)
        if after_dt is None:
            parser.error(f"--after is not a valid ISO date: {args.after!r}")

    before_dt = None
    if args.before:
        before_dt = parse_date(args.before)
        if before_dt is None:
            parser.error(f"--before is not a valid ISO date: {args.before!r}")

    # Load
    entries = load_knowledge_index(args.input)
    print(f"Loaded {len(entries)} entries from {args.input}", file=sys.stderr)

    # Filter
    kept = filter_entries(
        entries,
        min_confidence=args.min_confidence,
        model_filter=model_list,
        after=after_dt,
        before=before_dt,
    )
    print(f"After filtering: {len(kept)} / {len(entries)} entries", file=sys.stderr)

    # Convert; entry_to_pair returns None for entries without fact text.
    pairs = [pair for pair in map(entry_to_pair, kept) if pair]

    # Stats
    domains = {}
    models = {}
    for p in pairs:
        domains[p["domain"]] = domains.get(p["domain"], 0) + 1
        models[p["source_model"]] = models.get(p["source_model"], 0) + 1
    avg_conf = sum(p["source_confidence"] for p in pairs) / len(pairs) if pairs else 0.0

    stats = {
        "input_entries": len(entries),
        "after_filter": len(kept),
        "pairs_generated": len(pairs),
        "avg_confidence": round(avg_conf, 4),
        "domains": domains,
        "source_models": models,
    }
    print(json.dumps(stats, indent=2), file=sys.stderr)

    if args.dry_run:
        print("\nSample pairs:", file=sys.stderr)
        for p in pairs[:3]:
            print(json.dumps(p, ensure_ascii=False), file=sys.stderr)
        return

    # Write JSONL
    out_path = Path(args.output)
    out_path.parent.mkdir(parents=True, exist_ok=True)
    with open(out_path, "w", encoding="utf-8") as f:
        for pair in pairs:
            f.write(json.dumps(pair, ensure_ascii=False) + "\n")

    print(f"\nWrote {len(pairs)} training pairs to {out_path}", file=sys.stderr)


if __name__ == "__main__":
    main()
|
||||
@@ -1,108 +0,0 @@
|
||||
#!/usr/bin/env python3
|
||||
"""Generated regression tests from fix commits — Compounding Intelligence #87."""
|
||||
|
||||
import argparse, re, subprocess, sys
|
||||
from pathlib import Path
|
||||
|
||||
# Repository layout, derived from this script's own location:
# the script's directory, its parent, and the generated test module under tests/.
HERE = Path(__file__).parent
ROOT = HERE.parent
TESTS_DIR = ROOT.joinpath("tests")
OUT_FILE = TESTS_DIR.joinpath("test_regression_generated.py")
|
||||
|
||||
def run_git(args, cwd):
    """
    Run ``git`` with the argument list *args* in directory *cwd*.

    Returns the command's stdout with surrounding whitespace removed.
    Raises RuntimeError when git exits non-zero; the message is git's
    stripped stderr, or "git error" when stderr is empty.
    """
    command = ["git"] + args
    completed = subprocess.run(command, cwd=str(cwd), text=True, capture_output=True)
    if completed.returncode == 0:
        return completed.stdout.strip()
    message = completed.stderr.strip()
    raise RuntimeError(message if message else "git error")
|
||||
|
||||
def get_fix_commits(since=None):
    """
    List the SHAs of commits on any ref whose message matches "fix".

    When *since* is truthy it is passed to git as ``--since=<since>``.
    Returns the non-blank output lines of ``git log``, each stripped.
    """
    log_args = ["log", "--all", "--grep=fix", "--format=%H"]
    if since:
        log_args.append(f"--since={since}")

    shas = []
    for line in run_git(log_args, ROOT).splitlines():
        sha = line.strip()
        if sha:
            shas.append(sha)
    return shas
|
||||
|
||||
def get_commit_info(sha):
    """
    Collect details about commit *sha* from git.

    Returns a dict with:
      "sha"   - the SHA as given,
      "msg"   - the commit subject (``git show --format=%s``),
      "diff"  - the output of ``git show --format=full``,
      "files" - the non-blank lines of ``git diff-tree --name-only -r``.
    """
    subject = run_git(["show", "--no-patch", "--format=%s", sha], ROOT)
    patch = run_git(["show", "--format=full", sha], ROOT)
    changed = run_git(["diff-tree", "--no-commit-id", "--name-only", "-r", sha], ROOT)
    return {
        "sha": sha,
        "msg": subject,
        "diff": patch,
        # keep each path line untouched; only drop whitespace-only lines
        "files": list(filter(str.strip, changed.splitlines())),
    }
|
||||
|
||||
# ── Test templates ───────────────────────────────────────────────────────
|
||||
# Template for a generated test guarding the "open(..., 'w')" regex fix.
# Filled in with str.format(prefix=..., commit=...). Braces that must survive
# formatting (the f-string placeholder in the failure message) are doubled;
# left single, str.format raises KeyError and the case is never generated.
# A raw string keeps the regex escapes exactly as they must appear in the
# generated source. re.compile signals a bad pattern with re.error, not
# SyntaxError.
REGEX_TEST = r'''
class TestRegression_{prefix}(unittest.TestCase):
    """Regression: regex syntax fix - commit {commit}."""
    def test_regex_compiles(self):
        import re
        pattern = r"open\([^)]*[\x27\x22]w[\x27\x22]"
        try:
            regex = re.compile(pattern)
        except re.error as e:
            self.fail(f"Regex still invalid after fix: {{e}}")
        self.assertRegex("open(test_file, 'w')", regex)
        self.assertRegex('open(test_file, "w")', regex)
        self.assertNotRegex("open(test_file, 'r')", regex)
'''
|
||||
|
||||
# Template for a generated "the fixed file still exists" guard.
# Filled in with str.format(prefix=..., first_line=..., sha=..., file_path=...).
# The path is resolved against the repository root (the parent of the
# directory holding the generated test module) so the test does not depend
# on the directory the test runner was started from.
GENERIC_TEST = '''
class TestRegression_{prefix}(unittest.TestCase):
    """Regression guard: {first_line} - commit {sha}."""
    def test_fixed_file_exists(self):
        from pathlib import Path
        repo_root = Path(__file__).resolve().parent.parent
        p = repo_root / "{file_path}"
        self.assertTrue(p.exists(), "Fixed file missing: {file_path}")
'''
|
||||
|
||||
# ── Generation ───────────────────────────────────────────────────────────
|
||||
def generate(commits):
    """
    Write the generated regression test module for the given commit SHAs.

    For each commit, looks up its message, diff and changed files. Commits
    whose changed files no longer exist under ROOT are skipped. A commit whose
    message or diff matches the write-mode ``open(`` heuristic gets a
    REGEX_TEST case; every other commit gets a GENERIC_TEST case for its first
    existing file. A failure while handling one commit is reported on stderr
    and does not stop the run.

    The result is written to OUT_FILE (parent directories are created) and a
    summary line is printed to stdout.

    Args:
        commits: Iterable of commit SHAs.
    """
    # NOTE(review): pattern text kept exactly as found; confirm that the
    # doubled backslashes match what the diffs actually contain.
    write_mode_open = re.compile(r"open\\\\([^)]*)[\"']w[\"']", re.IGNORECASE)

    cases = []
    for sha in commits:
        try:
            info = get_commit_info(sha)
            # Keep only existing files (skip ones deleted/removed later)
            existing = [p for p in info["files"] if (ROOT / p).exists()]
            if not existing:
                continue
            first_file = existing[0]

            # Heuristic: regex-related fix if message or diff mentions open( with write mode pattern
            content = info["msg"] + "\n" + info["diff"]
            if write_mode_open.search(content):
                cases.append(REGEX_TEST.format(prefix=sha[:8], commit=sha))
            else:
                # Truncate first, then escape, so the cut can never land in
                # the middle of an escape sequence. Backslashes are escaped
                # too because the text ends up inside a docstring literal.
                first_line = info["msg"][:80].replace("\\", "\\\\").replace('"', '\\"')
                cases.append(GENERIC_TEST.format(
                    prefix=sha[:8],
                    file_path=first_file,
                    first_line=first_line,
                    sha=sha))
        except Exception as e:
            # Best effort: one unreadable commit must not abort generation.
            print(f"[WARN] {sha[:8]}: {e}", file=sys.stderr)

    body = "".join(cases)
    OUT_FILE.parent.mkdir(parents=True, exist_ok=True)
    OUT_FILE.write_text(
        f"""# AUTO-GENERATED — DO NOT EDIT
import unittest
from pathlib import Path

{body}

if __name__ == "__main__":
    unittest.main()
""",
        encoding="utf-8"
    )
    print(f"Wrote {OUT_FILE} — {len(cases)} test cases")
|
||||
|
||||
def main():
    """
    Command-line entry point for the regression test generator.

    With --commit, only that SHA is processed; otherwise the commits returned
    by get_fix_commits() (optionally limited by --since) are used. The chosen
    SHAs are handed to generate().
    """
    cli = argparse.ArgumentParser()
    cli.add_argument("--commit", help="specific commit SHA")
    cli.add_argument("--since", help="e.g. 2025-01-01")
    options = cli.parse_args()

    if options.commit:
        shas = [options.commit]
    else:
        shas = get_fix_commits(options.since)

    print(f"Scanning {len(shas)} fix commits…")
    generate(shas)


if __name__ == "__main__":
    main()
|
||||
174
tests/test_knowledge_to_training_pairs.py
Normal file
174
tests/test_knowledge_to_training_pairs.py
Normal file
@@ -0,0 +1,174 @@
|
||||
#!/usr/bin/env python3
|
||||
"""
|
||||
Smoke tests for knowledge_to_training_pairs.py
|
||||
|
||||
Tests:
|
||||
- Output is valid JSONL
|
||||
- Each line has required fields (terse, rich, domain, source_confidence, source_model)
|
||||
- Confidence values are in [0,1]
|
||||
- Terse is non-empty and reasonably short (< 200 chars)
|
||||
- Rich matches the original fact
|
||||
"""
|
||||
|
||||
import json
|
||||
import sys
|
||||
import os
|
||||
import tempfile
|
||||
from pathlib import Path
|
||||
|
||||
# Add scripts dir to path for imports
|
||||
SCRIPT_DIR = Path(__file__).parent.parent / "scripts"
|
||||
sys.path.insert(0, str(SCRIPT_DIR))
|
||||
|
||||
from knowledge_to_training_pairs import (
|
||||
fact_to_terse,
|
||||
filter_entries,
|
||||
entry_to_pair,
|
||||
parse_date,
|
||||
)
|
||||
|
||||
|
||||
def test_fact_to_terse_pitfall():
    """A pitfall fact becomes a short "How do I ...?" question."""
    question = fact_to_terse(
        "deploy-crons.py leaves jobs in mixed model format",
        "pitfall",
        "hermes-agent",
    )
    assert question.startswith("How do I")
    assert "?" in question
    assert len(question) < 150
    print("PASS: test_fact_to_terse_pitfall")
|
||||
|
||||
|
||||
def test_fact_to_terse_fact():
    """A plain fact is phrased as "What should I know about ...?"."""
    question = fact_to_terse(
        "Python is a high-level programming language", "fact", "global"
    )
    assert question.startswith("What should I know about")
    assert "?" in question
    print("PASS: test_fact_to_terse_fact")
|
||||
|
||||
|
||||
def test_fact_to_terse_pattern():
    """A pattern fact asks for the recommended (or best) way to do something."""
    question = fact_to_terse("Use sparse checkout for large repos", "pattern", "devops")
    accepted_phrases = ("recommended way", "best way")
    assert any(phrase in question for phrase in accepted_phrases)
    print("PASS: test_fact_to_terse_pattern")
|
||||
|
||||
|
||||
def test_entry_to_pair_structure():
    """A complete entry yields a pair with every required field filled in."""
    pair = entry_to_pair({
        "id": "test:001",
        "fact": "Test fact text.",
        "category": "fact",
        "domain": "test-domain",
        "confidence": 0.85,
        "model": "test-model",
    })
    assert pair is not None
    for required_key in ("terse", "rich", "domain", "source_confidence", "source_model"):
        assert required_key in pair
    assert pair["rich"] == "Test fact text."
    assert pair["domain"] == "test-domain"
    assert 0.0 <= pair["source_confidence"] <= 1.0
    print("PASS: test_entry_to_pair_structure")
|
||||
|
||||
|
||||
def test_filter_by_confidence():
    """Entries below the confidence threshold are dropped."""
    confidences = {"A": 0.9, "B": 0.4, "C": 0.6}
    entries = [{"fact": name, "confidence": value} for name, value in confidences.items()]
    kept = filter_entries(entries, min_confidence=0.5)
    assert len(kept) == 2
    assert all(e["confidence"] >= 0.5 for e in kept)
    print("PASS: test_filter_by_confidence")
|
||||
|
||||
|
||||
def test_filter_by_model():
    """Only entries whose model is in the allow-list survive."""
    fact_models = (("A", "claude-sonnet"), ("B", "gpt-4"), ("C", "unknown"))
    entries = [{"fact": fact, "model": model} for fact, model in fact_models]
    kept = filter_entries(entries, model_filter=["claude-sonnet", "gpt-4"])
    assert len(kept) == 2
    assert all(e["model"] in ("claude-sonnet", "gpt-4") for e in kept)
    print("PASS: test_filter_by_model")
|
||||
|
||||
|
||||
def test_filter_by_date():
    """Entries dated before the --after bound are dropped."""
    cutoff = parse_date("2026-04-01")
    entries = [
        {"fact": "A", "last_confirmed": "2026-04-10"},
        {"fact": "B", "last_confirmed": "2026-03-01"},
        {"fact": "C", "first_seen": "2026-04-15"},
    ]
    kept = filter_entries(entries, after=cutoff)
    assert len(kept) == 2
    print("PASS: test_filter_by_date")
|
||||
|
||||
|
||||
def test_end_to_end_jsonl_output():
    """Integration test: run the script with --dry-run and check its stats.

    The script is started with the interpreter running this test
    (sys.executable) rather than whatever "python3" is on PATH. The stats
    object is decoded with the JSON parser itself, so braces inside string
    values cannot confuse the extraction.
    """
    import subprocess

    repo_dir = SCRIPT_DIR.parent
    result = subprocess.run(
        [sys.executable, "scripts/knowledge_to_training_pairs.py", "--dry-run"],
        capture_output=True, text=True, cwd=repo_dir
    )
    assert result.returncode == 0, result.stderr
    stderr = result.stderr.strip()

    # The stats JSON object is the first "{" in stderr; the sample pairs
    # printed after it are ignored by raw_decode.
    start = stderr.find('{')
    assert start >= 0, "Stats JSON not found in stderr"
    try:
        stats, _ = json.JSONDecoder().raw_decode(stderr[start:])
    except json.JSONDecodeError as exc:
        raise AssertionError(f"Unterminated JSON in stderr: {exc}") from exc

    assert stats["input_entries"] > 0
    assert stats["pairs_generated"] > 0
    print("PASS: test_end_to_end_jsonl_output")
|
||||
|
||||
|
||||
def test_terse_length_constraint():
    """Generated questions stay under 200 characters for sample facts."""
    samples = (
        ("deploy-crons.py leaves jobs in mixed model format", "pitfall", "hermes-agent"),
        ("Cron jobs with blank fallback_model fields trigger warnings", "pitfall", "hermes-agent"),
        ("Use the Gitea REST API when clone times out", "pattern", "devops"),
    )
    for sample in samples:
        terse = fact_to_terse(*sample)
        assert len(terse) < 200, f"Terse too long ({len(terse)}): {terse}"
    print("PASS: test_terse_length_constraint")
|
||||
|
||||
|
||||
if __name__ == "__main__":
    # Run every smoke test in definition order; the first failing assert aborts.
    for smoke_test in (
        test_fact_to_terse_pitfall,
        test_fact_to_terse_fact,
        test_fact_to_terse_pattern,
        test_entry_to_pair_structure,
        test_filter_by_confidence,
        test_filter_by_model,
        test_filter_by_date,
        test_end_to_end_jsonl_output,
        test_terse_length_constraint,
    ):
        smoke_test()
    print("\nAll smoke tests passed.")
|
||||
@@ -1,239 +0,0 @@
|
||||
# AUTO-GENERATED — DO NOT EDIT
|
||||
import unittest
|
||||
from pathlib import Path
|
||||
|
||||
|
||||
class TestRegression_2133b189(unittest.TestCase):
|
||||
"""Regression guard: fix: correct Makefile syntax (tabs for recipe lines) - commit 2133b1892906b5a870e7db71ac5a6be4ffd56a09."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("Makefile")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: Makefile")
|
||||
|
||||
class TestRegression_8374ec93(unittest.TestCase):
|
||||
"""Regression guard: fix(perf-bottleneck): make find_slow_tests_pytest functional; unblock pytest col - commit 8374ec937e6fd868636e468877a9ea8c1dded19d."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_77e7e5da(unittest.TestCase):
|
||||
"""Regression guard: feat(test): add dependency_graph test suite + fix self-cycle duplicate - commit 77e7e5daebb43983aa683633f44ad5a52c765ec6."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/dependency_graph.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/dependency_graph.py")
|
||||
|
||||
class TestRegression_b1a728f5(unittest.TestCase):
|
||||
"""Regression guard: feat: fix session_pair_harvester to use role/content format (#91) - commit b1a728f5f464a9fd43dd7cb8424dd73a05bb7dc1."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/session_pair_harvester.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/session_pair_harvester.py")
|
||||
|
||||
class TestRegression_b46e9fef(unittest.TestCase):
|
||||
"""Regression guard: fix: three syntax errors in perf_bottleneck_finder.py (#211) - commit b46e9fef048e1c08fe757063447f6314fb45d6b2."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_43638640(unittest.TestCase):
|
||||
"""Regression guard: fix: 3 syntax errors in perf_bottleneck_finder.py (closes #211) - commit 43638640123f3487cd40253935827b190497bfdf."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_55adcb31(unittest.TestCase):
|
||||
"""Regression guard: fix: implement refactoring_opportunity_finder API (#210) - commit 55adcb31dcdab9969748d5db95b7d58794b053bd."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path(".gitignore")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: .gitignore")
|
||||
|
||||
class TestRegression_580e9928(unittest.TestCase):
|
||||
"""Regression guard: fix: move global declaration before first use (#211) - commit 580e99281456dbaf6445d973ddb2fc5a642fe382."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_d018a365(unittest.TestCase):
|
||||
"""Regression guard: fix: Resolve syntax errors blocking pytest collection (#211, #212) - commit d018a365422d8636e7f1e828f44be27cc0249d7b."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/dependency_graph.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/dependency_graph.py")
|
||||
|
||||
class TestRegression_ee4bfcb2(unittest.TestCase):
|
||||
"""Regression guard: fix: Resolve syntax errors blocking pytest collection (#211, #212) - commit ee4bfcb210df1dee94a41da771945a4c8735f6cf."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_17e03de9(unittest.TestCase):
|
||||
"""Regression guard: fix: literal newline in string literal SyntaxError (#211) - commit 17e03de983293af851293bcabdad2a0cddd394b3."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_a45ec10b(unittest.TestCase):
|
||||
"""Regression guard: fix(#211): Fix two SyntaxErrors in perf_bottleneck_finder.py - commit a45ec10b7ae86c05a56e8f7ad89ed018f46e2989."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_99d5832f(unittest.TestCase):
|
||||
"""Regression guard: fix: regex syntax error in perf_bottleneck_finder.py (#211) - commit 99d5832fa9c22d8018b0792f44c386ca123900b1."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_ec0e9d65(unittest.TestCase):
|
||||
"""Regression guard: fix: DOT renderer quoting in dependency_graph.py (#212) - commit ec0e9d65ca68f9f809dd612c0bb9014eb49d3116."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/dependency_graph.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/dependency_graph.py")
|
||||
|
||||
class TestRegression_ef6a8d3b(unittest.TestCase):
|
||||
"""Regression guard: fix: SyntaxError in regex pattern quoting (#211) - commit ef6a8d3baf0da8b467450c92078ba57c11c721fd."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_b732172d(unittest.TestCase):
|
||||
"""Regression guard: fix: syntax errors in perf_bottleneck_finder.py #211 - commit b732172dcc7e98b453c302b13df32d1d3137acf1."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_bfc1f561(unittest.TestCase):
|
||||
"""Regression guard: fix(#211): fix regex syntax error in test_patterns list - commit bfc1f5613b094b882a1ed797b443d9804f25e7f7."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_f7c479c4(unittest.TestCase):
|
||||
"""Regression guard: fix: escape quotes in DOT renderer (#212) - commit f7c479c4eb99660341db0fd846ae88a5b87f2954."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/dependency_graph.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/dependency_graph.py")
|
||||
|
||||
class TestRegression_ad1d474a(unittest.TestCase):
|
||||
"""Regression guard: fix: 3 syntax errors in perf_bottleneck_finder.py (#211) - commit ad1d474aee2c78a839d617576132bf9af6e3aaec."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_de37e743(unittest.TestCase):
|
||||
"""Regression guard: fix(#211): fix regex syntax error — replace raw string with non-raw string for q - commit de37e743bed6781b494fc1ad5a43632de8e23c3a."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_bd8e044f(unittest.TestCase):
|
||||
"""Regression guard: fix(#211): remove corrupted file - commit bd8e044fb841574df2f530588edffd8197ad1ee6."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_c28999f2(unittest.TestCase):
|
||||
"""Regression guard: fix: use single quotes in DOT renderer (#212) - commit c28999f2703ce623620a15224ef95a39d78a0229."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/dependency_graph.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/dependency_graph.py")
|
||||
|
||||
class TestRegression_576bded2(unittest.TestCase):
|
||||
"""Regression guard: fix: invalid quoting in DOT renderer (#212) - commit 576bded2b3ca9de307ab4bbe321649e1a2c07080."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/dependency_graph.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/dependency_graph.py")
|
||||
|
||||
class TestRegression_0e6d5bff(unittest.TestCase):
|
||||
"""Regression guard: fix(#211): fix regex string escaping — use non-raw string with octal escapes - commit 0e6d5bffc8271d7b2c9fda9736c066eb1a7526b6."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_f9f47cd1(unittest.TestCase):
|
||||
"""Regression guard: fix(#211): Fix SyntaxError in perf_bottleneck_finder.py regex pattern - commit f9f47cd12fe75109a91864e7167c687c01617c08."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_5877f0ea(unittest.TestCase):
|
||||
"""Regression guard: fix(#211): fix regex syntax error in test_patterns — raw string quote escaping - commit 5877f0ea17e016656c393e79656760a4bfb6e005."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/perf_bottleneck_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/perf_bottleneck_finder.py")
|
||||
|
||||
class TestRegression_39905d92(unittest.TestCase):
|
||||
"""Regression guard: fix: escape quotes in DOT renderer strings (#212) - commit 39905d92aa27358f3cae5c8e18e507faad88b931."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/dependency_graph.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/dependency_graph.py")
|
||||
|
||||
class TestRegression_c203010e(unittest.TestCase):
|
||||
"""Regression guard: fix(#676): update GENOME.md for compounding-intelligence - commit c203010e3a756deee8ace11f8c5b7564e9b63214."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("GENOME.md")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: GENOME.md")
|
||||
|
||||
class TestRegression_7a4677c7(unittest.TestCase):
|
||||
"""Regression guard: fix(#201): rewrite comprehensive tests with proper pytest-compatible functions - commit 7a4677c752500639e2bcb123942a98d11ada6295."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/test_harvest_prompt_comprehensive.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/test_harvest_prompt_comprehensive.py")
|
||||
|
||||
class TestRegression_229c327c(unittest.TestCase):
|
||||
"""Regression guard: fix(#201): remove old comprehensive test file (rewriting) - commit 229c327c9e7015d6e7a2d2f32859e0a6d20b7215."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/test_harvest_prompt_comprehensive.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/test_harvest_prompt_comprehensive.py")
|
||||
|
||||
class TestRegression_537bb1b6(unittest.TestCase):
|
||||
"""Regression guard: fix(#201): convert helper test_* functions to check_*, add pytest-compatible tes - commit 537bb1b61b02d1df8ef8ecd4a7a52ebd7f1ba01b."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/test_harvest_prompt_comprehensive.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/test_harvest_prompt_comprehensive.py")
|
||||
|
||||
class TestRegression_93bc3fc1(unittest.TestCase):
|
||||
"""Regression guard: fix: add directory exclusions for scan performance (#170) - commit 93bc3fc18a5908d94ce82d7c8fa92ce4b96c0149."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("scripts/automation_opportunity_finder.py")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: scripts/automation_opportunity_finder.py")
|
||||
|
||||
class TestRegression_f90c1670(unittest.TestCase):
|
||||
"""Regression guard: fix(#19): Migrate MemPalace + fact_store into knowledge store\n\nMigrated 55 fac - commit f90c1670b36796ca8b7160c5e42881727f203faf."""
|
||||
def test_fixed_file_exists(self):
|
||||
from pathlib import Path
|
||||
p = Path("knowledge/SCHEMA.md")
|
||||
self.assertTrue(p.exists(), f"Fixed file missing: knowledge/SCHEMA.md")
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
unittest.main()
|
||||
Reference in New Issue
Block a user