From b48854e95dca49f4172d93dc08d593de9adb707f Mon Sep 17 00:00:00 2001
From: Ezra
Date: Sun, 5 Apr 2026 08:58:28 +0000
Subject: [PATCH] [EZRA BURN-MODE] Phase 1: configuration

---
 scaffold/deepdive/phase1/config.yaml | 43 ++++++++++++++++++++++++++++
 1 file changed, 43 insertions(+)
 create mode 100644 scaffold/deepdive/phase1/config.yaml

diff --git a/scaffold/deepdive/phase1/config.yaml b/scaffold/deepdive/phase1/config.yaml
new file mode 100644
index 0000000..5a21b4b
--- /dev/null
+++ b/scaffold/deepdive/phase1/config.yaml
@@ -0,0 +1,43 @@
+# Deep Dive — Phase 1 Configuration
+# Parent: the-nexus#830
+
+# arXiv categories to monitor
+categories:
+  - cs.AI  # Artificial Intelligence
+  - cs.CL  # Computation and Language (NLP)
+  - cs.LG  # Machine Learning
+
+# arXiv RSS feed URL template; {category} is presumably filled from `categories`
+feed_template: "https://export.arxiv.org/rss/{category}"
+
+# Rate limiting (seconds between requests)
+rate_limit: 3
+
+# Storage: directory for output files
+output_dir: "data/deepdive/raw"
+
+# Date format for output files (strftime-style directives)
+date_format: "%Y-%m-%d"
+
+# User agent for requests
+user_agent: "DeepDiveBot/0.1 (research aggregator; ezra@timmy.local)"
+
+# Keywords for pre-filtering (Phase 2 does real scoring)
+keywords:
+  - "agent"
+  - "llm"
+  - "language model"
+  - "reinforcement learning"
+  - "rl"  # NOTE(review): substring matching would hit "world"; confirm matcher
+  - "grpo"
+  - "fine-tuning"
+  - "training"
+  - "inference"
+  - "open source"
+  - "local"
+  - "gemma"
+  - "llama"
+  - "hermes"
+  - "tool use"
+  - "rag"  # NOTE(review): substring matching would hit "average"; confirm matcher
+  - "embeddings"