2026-03-08 16:07:02 -04:00
|
|
|
import logging as _logging
|
|
|
|
|
import os
|
|
|
|
|
import sys
|
2026-02-21 16:53:16 +00:00
|
|
|
from typing import Literal
|
|
|
|
|
|
2026-02-19 19:31:48 +00:00
|
|
|
from pydantic_settings import BaseSettings, SettingsConfigDict
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Settings(BaseSettings):
|
2026-03-05 19:45:38 -05:00
|
|
|
# Display name for the primary agent — override with AGENT_NAME env var
|
|
|
|
|
agent_name: str = "Agent"
|
|
|
|
|
|
2026-02-19 19:31:48 +00:00
|
|
|
# Ollama host — override with OLLAMA_URL env var or .env file
|
|
|
|
|
ollama_url: str = "http://localhost:11434"
|
|
|
|
|
|
|
|
|
|
# LLM model passed to Agno/Ollama — override with OLLAMA_MODEL
|
2026-03-11 18:36:42 -04:00
|
|
|
# qwen3.5:latest is the primary model — better reasoning and tool calling
|
2026-03-11 08:11:26 -04:00
|
|
|
# than llama3.1:8b-instruct while still running locally on modest hardware.
|
2026-03-11 18:36:42 -04:00
|
|
|
# Fallback: llama3.1:8b-instruct if qwen3.5:latest not available.
|
2026-02-26 13:42:36 -05:00
|
|
|
# llama3.2 (3B) hallucinated tool output consistently in testing.
|
2026-03-11 18:36:42 -04:00
|
|
|
ollama_model: str = "qwen3.5:latest"
|
2026-02-19 19:31:48 +00:00
|
|
|
|
|
|
|
|
# Set DEBUG=true to enable /docs and /redoc (disabled by default)
|
|
|
|
|
debug: bool = False
|
|
|
|
|
|
2026-02-22 17:16:12 +00:00
|
|
|
# Telegram bot token — set via TELEGRAM_TOKEN env var or the /telegram/setup endpoint
|
|
|
|
|
telegram_token: str = ""
|
|
|
|
|
|
2026-02-25 01:11:14 +00:00
|
|
|
# Discord bot token — set via DISCORD_TOKEN env var or the /discord/setup endpoint
|
|
|
|
|
discord_token: str = ""
|
|
|
|
|
|
2026-03-09 21:54:04 -04:00
|
|
|
# ── Discord action confirmation ──────────────────────────────────────────
|
|
|
|
|
# When True, dangerous tools (shell, write_file, python) require user
|
|
|
|
|
# confirmation via Discord button before executing.
|
|
|
|
|
discord_confirm_actions: bool = True
|
|
|
|
|
# Seconds to wait for user confirmation before auto-rejecting.
|
|
|
|
|
discord_confirm_timeout: int = 120
|
|
|
|
|
|
2026-02-21 16:53:16 +00:00
|
|
|
# ── AirLLM / backend selection ───────────────────────────────────────────
|
|
|
|
|
# "ollama" — always use Ollama (default, safe everywhere)
|
|
|
|
|
# "airllm" — always use AirLLM (requires pip install ".[bigbrain]")
|
|
|
|
|
# "auto" — use AirLLM on Apple Silicon if airllm is installed,
|
|
|
|
|
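# fall back to Ollama otherwise
# "grok" — use the Grok (xAI) backend (see the Grok settings in this class)
# "claude" — use the Claude (Anthropic) backend (see the Claude settings in this class)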
|
2026-03-10 18:17:47 -04:00
|
|
|
timmy_model_backend: Literal["ollama", "airllm", "grok", "claude", "auto"] = "ollama"
|
2026-02-21 16:53:16 +00:00
|
|
|
|
|
|
|
|
# AirLLM model size when backend is airllm or auto.
|
|
|
|
|
# Larger = smarter, but needs more RAM / disk.
|
|
|
|
|
# 8b ~16 GB | 70b ~140 GB | 405b ~810 GB
|
2026-03-10 18:17:47 -04:00
|
|
|
airllm_model_size: Literal["8b", "70b", "405b"] = "70b"
|
2026-02-21 16:53:16 +00:00
|
|
|
|
feat: add Grok (xAI) as opt-in premium backend with monetization
- Add GrokBackend class in src/timmy/backends.py with full sync/async
support, health checks, usage stats, and cost estimation in sats
- Add consult_grok tool to Timmy's toolkit for proactive Grok queries
- Extend cascade router with Grok provider type for failover chain
- Add Grok Mode toggle card to Mission Control dashboard (HTMX live)
- Add "Ask Grok" button on chat input for direct Grok queries
- Add /grok/* routes: status, toggle, chat, stats endpoints
- Integrate Lightning invoice generation for Grok usage monetization
- Add GROK_ENABLED, XAI_API_KEY, GROK_DEFAULT_MODEL, GROK_MAX_SATS_PER_QUERY,
GROK_FREE config settings via pydantic-settings
- Update .env.example and docker-compose.yml with Grok env vars
- Add 21 tests covering backend, tools, and route endpoints (all green)
Local-first ethos preserved: Grok is premium augmentation only,
disabled by default, and Lightning-payable when enabled.
https://claude.ai/code/session_01FygwN8wS8J6WGZ8FPb7XGV
2026-02-27 01:12:51 +00:00
|
|
|
# ── Grok (xAI) — opt-in premium cloud backend ────────────────────────
|
|
|
|
|
# Grok is a premium augmentation layer — local-first ethos preserved.
|
|
|
|
|
# Only used when explicitly enabled and query complexity warrants it.
|
|
|
|
|
grok_enabled: bool = False
|
|
|
|
|
xai_api_key: str = ""
|
|
|
|
|
grok_default_model: str = "grok-3-fast"
|
|
|
|
|
grok_max_sats_per_query: int = 200
|
|
|
|
|
grok_free: bool = False # Skip Lightning invoice when user has own API key
|
|
|
|
|
|
2026-02-28 09:35:44 -05:00
|
|
|
# ── Claude (Anthropic) — cloud fallback backend ────────────────────────
|
|
|
|
|
# Used when Ollama is offline and local inference isn't available.
|
|
|
|
|
# Set ANTHROPIC_API_KEY to enable. Default model is Haiku (fast + cheap).
|
|
|
|
|
anthropic_api_key: str = ""
|
|
|
|
|
claude_model: str = "haiku"
|
|
|
|
|
|
feat: integrate Spark Intelligence into Timmy swarm system
Adds a self-evolving cognitive layer inspired by vibeship-spark-intelligence,
adapted for Timmy's agent architecture. Spark captures swarm events, runs
EIDOS prediction-evaluation loops, consolidates memories, and generates
advisory recommendations — all backed by SQLite consistent with existing
patterns.
New modules:
- spark/memory.py — event capture with importance scoring + memory consolidation
- spark/eidos.py — EIDOS cognitive loop (predict → observe → evaluate → learn)
- spark/advisor.py — ranked advisory generation from accumulated intelligence
- spark/engine.py — top-level API wiring all subsystems together
Dashboard:
- /spark/ui — full Spark Intelligence dashboard (3-column: status/advisories,
predictions/memories, event timeline) with HTMX auto-refresh
- /spark — JSON API for programmatic access
- SPARK link added to navigation header
Integration:
- Coordinator hooks emit Spark events on task post, bid, assign, complete, fail
- EIDOS predictions generated when tasks are posted, evaluated on completion
- Memory consolidation triggers when agents accumulate enough outcomes
- SPARK_ENABLED config toggle (default: true)
Tests: 47 new tests covering all Spark subsystems + dashboard routes.
Full suite: 538 tests passing.
https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c
2026-02-24 15:51:15 +00:00
|
|
|
# ── Spark Intelligence ────────────────────────────────────────────────
|
|
|
|
|
# Enable/disable the Spark cognitive layer.
|
|
|
|
|
# When enabled, Spark captures swarm events, runs EIDOS predictions,
|
|
|
|
|
# consolidates memories, and generates advisory recommendations.
|
|
|
|
|
spark_enabled: bool = True
|
|
|
|
|
|
feat: add full creative studio + DevOps tools (Pixel, Lyra, Reel personas)
Adds 3 new personas (Pixel, Lyra, Reel) and 5 new tool modules:
- Git/DevOps tools (GitPython): clone, status, diff, log, blame, branch,
add, commit, push, pull, stash — wired to Forge and Helm personas
- Image generation (FLUX via diffusers): text-to-image, storyboards,
variations — Pixel persona
- Music generation (ACE-Step 1.5): full songs with vocals+instrumentals,
instrumental tracks, vocal-only tracks — Lyra persona
- Video generation (Wan 2.1 via diffusers): text-to-video, image-to-video
clips — Reel persona
- Creative Director pipeline: multi-step orchestration that chains
storyboard → music → video → assembly into 3+ minute final videos
- Video assembler (MoviePy + FFmpeg): stitch clips, overlay audio,
title cards, subtitles, final export
Also includes:
- Spark Intelligence tool-level + creative pipeline event capture
- Creative Studio dashboard page (/creative/ui) with 4 tabs
- Config settings for all new models and output directories
- pyproject.toml creative optional extra for GPU dependencies
- 107 new tests covering all modules (624 total, all passing)
https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c
2026-02-24 16:31:47 +00:00
|
|
|
# ── Git / DevOps ──────────────────────────────────────────────────────
|
|
|
|
|
git_default_repo_dir: str = "~/repos"
|
|
|
|
|
|
2026-02-26 23:39:13 -05:00
|
|
|
# Repository root - auto-detected but can be overridden
|
|
|
|
|
# This is the main project directory where .git lives
|
|
|
|
|
repo_root: str = ""
|
|
|
|
|
|
feat: add full creative studio + DevOps tools (Pixel, Lyra, Reel personas)
Adds 3 new personas (Pixel, Lyra, Reel) and 5 new tool modules:
- Git/DevOps tools (GitPython): clone, status, diff, log, blame, branch,
add, commit, push, pull, stash — wired to Forge and Helm personas
- Image generation (FLUX via diffusers): text-to-image, storyboards,
variations — Pixel persona
- Music generation (ACE-Step 1.5): full songs with vocals+instrumentals,
instrumental tracks, vocal-only tracks — Lyra persona
- Video generation (Wan 2.1 via diffusers): text-to-video, image-to-video
clips — Reel persona
- Creative Director pipeline: multi-step orchestration that chains
storyboard → music → video → assembly into 3+ minute final videos
- Video assembler (MoviePy + FFmpeg): stitch clips, overlay audio,
title cards, subtitles, final export
Also includes:
- Spark Intelligence tool-level + creative pipeline event capture
- Creative Studio dashboard page (/creative/ui) with 4 tabs
- Config settings for all new models and output directories
- pyproject.toml creative optional extra for GPU dependencies
- 107 new tests covering all modules (624 total, all passing)
https://claude.ai/code/session_01KJm6jQkNi3aA3yoQJn636c
2026-02-24 16:31:47 +00:00
|
|
|
# ── Creative — Image Generation (Pixel) ───────────────────────────────
|
|
|
|
|
flux_model_id: str = "black-forest-labs/FLUX.1-schnell"
|
|
|
|
|
image_output_dir: str = "data/images"
|
|
|
|
|
image_default_steps: int = 4
|
|
|
|
|
|
|
|
|
|
# ── Creative — Music Generation (Lyra) ────────────────────────────────
|
|
|
|
|
music_output_dir: str = "data/music"
|
|
|
|
|
ace_step_model: str = "ace-step/ACE-Step-v1.5"
|
|
|
|
|
|
|
|
|
|
# ── Creative — Video Generation (Reel) ────────────────────────────────
|
|
|
|
|
video_output_dir: str = "data/video"
|
|
|
|
|
wan_model_id: str = "Wan-AI/Wan2.1-T2V-1.3B"
|
|
|
|
|
video_default_resolution: str = "480p"
|
|
|
|
|
|
|
|
|
|
# ── Creative — Pipeline / Assembly ────────────────────────────────────
|
|
|
|
|
creative_output_dir: str = "data/creative"
|
|
|
|
|
video_transition_duration: float = 1.0
|
|
|
|
|
default_video_codec: str = "libx264"
|
|
|
|
|
|
2026-02-25 18:19:22 +00:00
|
|
|
# ── L402 Lightning ───────────────────────────────────────────────────
|
|
|
|
|
# HMAC secrets for macaroon signing and invoice verification.
|
|
|
|
|
# Generate with: python3 -c "import secrets; print(secrets.token_hex(32))"
|
2026-02-25 15:32:19 -05:00
|
|
|
# In production (TIMMY_ENV=production), these MUST be set or the app will refuse to start.
|
|
|
|
|
l402_hmac_secret: str = ""
|
|
|
|
|
l402_macaroon_secret: str = ""
|
2026-02-25 18:19:22 +00:00
|
|
|
lightning_backend: Literal["mock", "lnd"] = "mock"
|
|
|
|
|
|
2026-02-25 15:32:19 -05:00
|
|
|
# ── Privacy / Sovereignty ────────────────────────────────────────────
|
|
|
|
|
# Disable Agno telemetry for air-gapped/sovereign deployments.
|
|
|
|
|
# Default is False (telemetry disabled) to align with sovereign AI vision.
|
|
|
|
|
telemetry_enabled: bool = False
|
|
|
|
|
|
2026-03-11 18:36:42 -04:00
|
|
|
# CORS allowed origins for the web chat interface (Gitea Pages, etc.)
|
feat: replace GitHub page with embedded Timmy chat interface
Replaces the marketing landing page with a minimal, full-screen chat
interface that connects to a running Timmy instance. Mobile-first design
with single vertical scroll direction, looping scroll, no zoom, no
buttons — just type and press Enter to talk to Timmy.
- docs/index.html: full rewrite as a clean chat UI with dark terminal
theme, looping infinite scroll, markdown rendering, connection status,
and /connect, /clear, /help slash commands
- src/dashboard/app.py: add CORS middleware so the GitHub Pages site can
reach a local Timmy server cross-origin
- src/config.py: add cors_origins setting (defaults to ["*"])
https://claude.ai/code/session_01AWLxg6KDWsfCATiuvsRMGr
2026-02-27 00:35:33 +00:00
|
|
|
# Set CORS_ORIGINS as a JSON array, e.g. '["http://localhost:3000","https://example.com"]'
# (pydantic-settings decodes list-typed fields from env vars as JSON, not as comma-separated text).
|
|
|
|
|
cors_origins: list[str] = ["*"]
|
|
|
|
|
|
2026-03-11 10:37:20 -04:00
|
|
|
# Trusted hosts for the Host header check (TrustedHostMiddleware).
|
|
|
|
|
# Set TRUSTED_HOSTS as a JSON array, e.g. '["localhost","*.ts.net"]'. Wildcards supported (e.g. "*.ts.net").
|
|
|
|
|
# Defaults include localhost + Tailscale MagicDNS. Add your Tailscale IP if needed.
|
|
|
|
|
trusted_hosts: list[str] = [
|
|
|
|
|
"localhost",
|
|
|
|
|
"127.0.0.1",
|
|
|
|
|
"*.local",
|
|
|
|
|
"*.ts.net",
|
|
|
|
|
"testserver",
|
|
|
|
|
]
|
|
|
|
|
|
2026-02-25 15:32:19 -05:00
|
|
|
# Environment mode: development | production
|
|
|
|
|
# In production, security settings are strictly enforced.
|
|
|
|
|
timmy_env: Literal["development", "production"] = "development"
|
|
|
|
|
|
2026-03-07 22:34:30 -05:00
|
|
|
# ── Memory Management ──────────────────────────────────────────────
|
|
|
|
|
# Auto-prune vector store memories older than this many days on startup.
|
|
|
|
|
# Set to 0 to disable auto-pruning.
|
|
|
|
|
memory_prune_days: int = 90
|
|
|
|
|
# When True, fact-type memories are kept even when older than the TTL.
|
|
|
|
|
memory_prune_keep_facts: bool = True
|
|
|
|
|
# Maximum size in MB for the memory/notes/ vault directory.
|
|
|
|
|
# When exceeded, a warning is logged. Set to 0 to disable.
|
|
|
|
|
memory_vault_max_mb: int = 100
|
|
|
|
|
|
feat: agentic loop for multi-step tasks + regression fixes (#148)
* fix: name extraction blocklist, memory preview escaping, and gitignore cleanup
- Add _NAME_BLOCKLIST to extract_user_name() to reject gerunds and UI-state
words like "Sending" that were incorrectly captured as user names
- Collapse whitespace in get_memory_status() preview so newlines survive
JSON serialization without showing raw \n escape sequences
- Broaden .gitignore from specific memory/self/user_profile.md to memory/self/
and untrack memory/self/methodology.md (runtime-edited file)
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
* fix: catch Ollama connection errors in session.py + add 71 smoke tests
- Wrap agent.run() in session.py with try/except so Ollama connection
failures return a graceful fallback message instead of dumping raw
tracebacks to Docker logs
- Add tests/test_smoke.py with 71 tests covering every GET route:
core pages, feature pages, JSON APIs, and a parametrized no-500 sweep
— catches import errors, template failures, and schema mismatches
that unit tests miss
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
* feat: agentic loop for multi-step tasks + Round 10 regression fixes
Agentic loop (Parts 1-4):
- Add multi-step chaining instructions to system prompt
- New agentic_loop.py with plan→execute→adapt→summarize flow
- Register plan_and_execute tool for background task execution
- Add max_agent_steps config setting (default: 10)
- Discord fix: 300s timeout, typing indicator, send error handling
- 16 new unit + e2e tests for agentic loop
Round 10 regressions (R1-R5, P1):
- R1: Fix literal \n escape sequences in tool responses
- R2: Chat timeout/error feedback in agent panel
- R3: /hands infinite spinner → static empty states
- R4: /self-coding infinite spinner → static stats + journal
- R5: /grok/status raw JSON → HTML dashboard template
- P1: VETO confirmation dialog on task cards
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
* fix: briefing route 500 in CI when agno is MagicMock stub
_call_agent() returned a MagicMock instead of a string when agno is
stubbed in tests, causing SQLite "Error binding parameter 4" on save.
Ensure the return value is always an actual string.
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
* fix: briefing route 500 in CI — graceful degradation at route level
When agno is stubbed with MagicMock in CI, agent.run() returns a
MagicMock instead of raising — so the exception handler never fires
and a MagicMock propagates as the summary to SQLite, which can't
bind it.
Fix: catch at the route level and return a fallback Briefing object.
This follows the project's graceful degradation pattern — the briefing
page always renders, even when the backend is completely unavailable.
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
---------
Co-authored-by: Trip T <trip@local>
Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
2026-03-08 01:46:29 -05:00
|
|
|
# ── Agentic Loop ──────────────────────────────────────────────────
|
|
|
|
|
# Maximum steps the agentic loop will execute before stopping.
|
|
|
|
|
max_agent_steps: int = 10
|
|
|
|
|
|
2026-03-07 18:49:37 -05:00
|
|
|
# ── Test / Diagnostics ─────────────────────────────────────────────
|
|
|
|
|
# Skip loading heavy embedding models (for tests / low-memory envs).
|
|
|
|
|
timmy_skip_embeddings: bool = False
|
|
|
|
|
# Disable CSRF middleware entirely (for tests).
|
|
|
|
|
timmy_disable_csrf: bool = False
|
|
|
|
|
# Mark the process as running in test mode.
|
|
|
|
|
timmy_test_mode: bool = False
|
|
|
|
|
|
|
|
|
|
# ── Brain / rqlite ─────────────────────────────────────────────────
|
|
|
|
|
# URL of the local rqlite node for distributed memory.
|
|
|
|
|
# Empty string means rqlite is not configured.
|
|
|
|
|
rqlite_url: str = ""
|
|
|
|
|
# Source identifier for brain memory entries.
|
|
|
|
|
brain_source: str = "default"
|
|
|
|
|
# Path override for the local brain SQLite database.
|
|
|
|
|
brain_db_path: str = ""
|
|
|
|
|
|
|
|
|
|
# ── Security Tuning ───────────────────────────────────────────────
|
|
|
|
|
# Set to True in production to mark CSRF cookies as Secure (HTTPS only).
|
|
|
|
|
csrf_cookie_secure: bool = False
|
|
|
|
|
# Maximum size in bytes for chat API request bodies.
|
|
|
|
|
chat_api_max_body_bytes: int = 1_048_576 # 1 MB
|
|
|
|
|
|
2026-02-25 17:18:58 -05:00
|
|
|
# ── Self-Modification ──────────────────────────────────────────────
|
Claude/remove persona system f vgt m (#126)
* Remove persona system, identity, and all Timmy references
Strip the codebase to pure orchestration logic:
- Delete TIMMY_IDENTITY.md and memory/self/identity.md
- Gut brain/identity.py to no-op stubs (empty returns)
- Remove all system prompts reinforcing Timmy's character, faith,
sovereignty, sign-off ("Sir, affirmative"), and agent roster
- Replace identity-laden prompts with generic local-AI-assistant prompts
- Remove "You work for Timmy" from all sub-agent system prompts
- Rename PersonaTools → AgentTools, PERSONA_TOOLKITS → AGENT_TOOLKITS
- Replace "timmy" agent ID with "orchestrator" across routes, marketplace,
tools catalog, and orchestrator class
- Strip Timmy references from config comments, templates, telegram bot,
chat API, and dashboard UI
- Delete tests/brain/test_identity.py entirely
- Fix all test assertions that checked for persona identity content
729 tests pass (2 pre-existing failures in test_calm.py unrelated).
https://claude.ai/code/session_01LjQGUE6nk9W9674zaxrYxy
* Add Taskosaur (PM + AI task execution) to docker-compose
Spins up Taskosaur alongside the dashboard on `docker compose up`:
- postgres:16-alpine (port 5432, Taskosaur DB)
- redis:7-alpine (Bull queue backend)
- taskosaur (ports 3000 API / 3001 UI)
- dashboard now depends_on taskosaur healthy
- TASKOSAUR_API_URL injected into dashboard environment
Dashboard can reach Taskosaur at http://taskosaur:3000/api on the
internal network. Frontend UI accessible at http://localhost:3001.
https://claude.ai/code/session_01LjQGUE6nk9W9674zaxrYxy
---------
Co-authored-by: Claude <noreply@anthropic.com>
2026-03-04 12:00:49 -05:00
|
|
|
# Enable self-modification capabilities. When enabled, the agent can
|
2026-02-25 17:18:58 -05:00
|
|
|
# edit its own source code, run tests, and commit changes.
|
|
|
|
|
self_modify_enabled: bool = False
|
|
|
|
|
self_modify_max_retries: int = 2
|
|
|
|
|
self_modify_allowed_dirs: str = "src,tests"
|
|
|
|
|
self_modify_backend: str = "auto" # "ollama", "anthropic", or "auto"
|
|
|
|
|
|
2026-02-26 10:27:08 -05:00
|
|
|
# ── Work Orders ──────────────────────────────────────────────────
|
|
|
|
|
# External users and agents can submit work orders for improvements.
|
|
|
|
|
work_orders_enabled: bool = True
|
|
|
|
|
work_orders_auto_execute: bool = False # Master switch for auto-execution
|
2026-02-26 23:39:13 -05:00
|
|
|
work_orders_auto_threshold: str = (
|
|
|
|
|
"low" # Max priority that auto-executes: "low" | "medium" | "high" | "none"
|
|
|
|
|
)
|
2026-02-26 10:27:08 -05:00
|
|
|
|
feat: add custom weights, model registry, per-agent models, and reward scoring
Inspired by OpenClaw-RL's multi-model orchestration, this adds four
features for custom model management:
1. Custom model registry (infrastructure/models/registry.py) — SQLite-backed
registry for GGUF, safetensors, HF checkpoint, and Ollama models with
role-based lookups (general, reward, teacher, judge).
2. Per-agent model assignment — each swarm persona can use a different model
instead of sharing the global default. Resolved via registry assignment >
persona default > global default.
3. Runtime model management API (/api/v1/models) — REST endpoints to register,
list, assign, enable/disable, and remove custom models without restart.
Includes a dashboard page at /models.
4. Reward model scoring (PRM-style) — majority-vote quality evaluation of
agent outputs using a configurable reward model. Scores persist in SQLite
and feed into the swarm learner.
New config settings: custom_weights_dir, reward_model_enabled,
reward_model_name, reward_model_votes.
54 new tests covering registry CRUD, API endpoints, agent assignments,
role lookups, and reward scoring.
https://claude.ai/code/session_01V4iTozMwcE2gjfnCJdCugC
2026-02-27 01:08:03 +00:00
|
|
|
# ── Custom Weights & Models ──────────────────────────────────────
|
|
|
|
|
# Directory for custom model weights (GGUF, safetensors, HF checkpoints).
|
|
|
|
|
# Models placed here can be registered at runtime and assigned to agents.
|
|
|
|
|
custom_weights_dir: str = "data/models"
|
|
|
|
|
# Enable the reward model for scoring agent outputs (PRM-style).
|
|
|
|
|
reward_model_enabled: bool = False
|
|
|
|
|
# Reward model name (must be available via Ollama or a custom weight path).
|
|
|
|
|
reward_model_name: str = ""
|
|
|
|
|
# Minimum votes for majority-vote reward scoring (odd number recommended).
|
|
|
|
|
reward_model_votes: int = 3
|
|
|
|
|
|
feat: add in-browser local model support for iPhone via WebLLM
Enable Timmy to run directly on iPhone by loading a small LLM into
the browser via WebGPU (Safari 26+ / iOS 26+). No server connection
required — fully sovereign, fully offline.
New files:
- static/local_llm.js: WebLLM wrapper with model catalogue, WebGPU
detection, streaming chat, and progress callbacks
- templates/mobile_local.html: Mobile-optimized UI with model
selector, download progress, LOCAL/SERVER badge, and chat
- tests/dashboard/test_local_models.py: 31 tests covering routes,
config, template UX, JS asset, and XSS prevention
Changes:
- config.py: browser_model_enabled, browser_model_id,
browser_model_fallback settings
- routes/mobile.py: /mobile/local page, /mobile/local-models API
- base.html: LOCAL AI nav link
Supported models: SmolLM2-360M (~200MB), Qwen2.5-0.5B (~350MB),
SmolLM2-1.7B (~1GB), Llama-3.2-1B (~700MB). Falls back to
server-side Ollama when local model is unavailable.
https://claude.ai/code/session_01Cqkvr4sZbED7T3iDu1rwSD
2026-02-27 00:03:05 +00:00
|
|
|
# ── Browser Local Models (iPhone / WebGPU) ───────────────────────
|
|
|
|
|
# Enable in-browser LLM inference via WebLLM for offline iPhone use.
|
|
|
|
|
# When enabled, the mobile dashboard loads a small model directly
|
|
|
|
|
# in the browser — no server or Ollama required.
|
|
|
|
|
browser_model_enabled: bool = True
|
|
|
|
|
# WebLLM model ID — must be a pre-compiled MLC model.
|
|
|
|
|
# Recommended for iPhone: SmolLM2-360M (fast) or Qwen3-0.6B (smart).
|
|
|
|
|
browser_model_id: str = "SmolLM2-360M-Instruct-q4f16_1-MLC"
|
|
|
|
|
# Fallback to server when browser model is unavailable or too slow.
|
|
|
|
|
browser_model_fallback: bool = True
|
|
|
|
|
|
2026-02-27 01:00:11 -05:00
|
|
|
# ── Default Thinking ──────────────────────────────────────────────
|
Claude/remove persona system f vgt m (#126)
* Remove persona system, identity, and all Timmy references
Strip the codebase to pure orchestration logic:
- Delete TIMMY_IDENTITY.md and memory/self/identity.md
- Gut brain/identity.py to no-op stubs (empty returns)
- Remove all system prompts reinforcing Timmy's character, faith,
sovereignty, sign-off ("Sir, affirmative"), and agent roster
- Replace identity-laden prompts with generic local-AI-assistant prompts
- Remove "You work for Timmy" from all sub-agent system prompts
- Rename PersonaTools → AgentTools, PERSONA_TOOLKITS → AGENT_TOOLKITS
- Replace "timmy" agent ID with "orchestrator" across routes, marketplace,
tools catalog, and orchestrator class
- Strip Timmy references from config comments, templates, telegram bot,
chat API, and dashboard UI
- Delete tests/brain/test_identity.py entirely
- Fix all test assertions that checked for persona identity content
729 tests pass (2 pre-existing failures in test_calm.py unrelated).
https://claude.ai/code/session_01LjQGUE6nk9W9674zaxrYxy
* Add Taskosaur (PM + AI task execution) to docker-compose
Spins up Taskosaur alongside the dashboard on `docker compose up`:
- postgres:16-alpine (port 5432, Taskosaur DB)
- redis:7-alpine (Bull queue backend)
- taskosaur (ports 3000 API / 3001 UI)
- dashboard now depends_on taskosaur healthy
- TASKOSAUR_API_URL injected into dashboard environment
Dashboard can reach Taskosaur at http://taskosaur:3000/api on the
internal network. Frontend UI accessible at http://localhost:3001.
https://claude.ai/code/session_01LjQGUE6nk9W9674zaxrYxy
---------
Co-authored-by: Claude <noreply@anthropic.com>
2026-03-04 12:00:49 -05:00
|
|
|
# When enabled, the agent starts an internal thought loop on server start.
|
2026-02-27 01:00:11 -05:00
|
|
|
thinking_enabled: bool = True
|
|
|
|
|
thinking_interval_seconds: int = 300 # 5 minutes between thoughts
|
|
|
|
|
|
2026-03-06 01:20:14 -05:00
|
|
|
# ── Paperclip AI — orchestration bridge ────────────────────────────
|
|
|
|
|
# URL where the Paperclip server listens.
|
|
|
|
|
# For VPS deployment behind nginx, use the public domain.
|
|
|
|
|
paperclip_url: str = "http://localhost:3100"
|
|
|
|
|
# Enable/disable the Paperclip integration.
|
|
|
|
|
paperclip_enabled: bool = False
|
|
|
|
|
# API key or auth-gate cookie for authenticating with Paperclip.
|
|
|
|
|
paperclip_api_key: str = ""
|
|
|
|
|
# Timmy's agent ID in the Paperclip org chart.
|
|
|
|
|
paperclip_agent_id: str = ""
|
|
|
|
|
# Company ID in Paperclip — required for most API calls.
|
|
|
|
|
paperclip_company_id: str = ""
|
|
|
|
|
# Timeout in seconds for Paperclip HTTP calls.
|
|
|
|
|
paperclip_timeout: int = 30
|
|
|
|
|
# How often (seconds) Timmy polls Paperclip for work (0 = disabled).
|
|
|
|
|
paperclip_poll_interval: int = 0
|
|
|
|
|
|
2026-02-28 19:27:48 -05:00
|
|
|
# ── OpenFang — vendored agent runtime ─────────────────────────────
|
|
|
|
|
# URL where the OpenFang sidecar listens. Set to the Docker service
|
|
|
|
|
# name when running in compose, or localhost for bare-metal dev.
|
|
|
|
|
openfang_url: str = "http://localhost:8080"
|
|
|
|
|
# Enable/disable OpenFang integration. When disabled, the tool
|
|
|
|
|
# executor falls back to Timmy's native (simulated) execution.
|
|
|
|
|
openfang_enabled: bool = False
|
|
|
|
|
# Timeout in seconds for OpenFang hand execution (some hands are slow).
|
|
|
|
|
openfang_timeout: int = 120
|
|
|
|
|
|
2026-03-08 12:50:44 -04:00
|
|
|
# ── Autoresearch — autonomous ML experiment loops ──────────────────
|
|
|
|
|
# Integrates Karpathy's autoresearch pattern: agents modify training
|
|
|
|
|
# code, run time-boxed experiments, evaluate metrics, and iterate.
|
|
|
|
|
autoresearch_enabled: bool = False
|
|
|
|
|
autoresearch_workspace: str = "data/experiments"
|
|
|
|
|
autoresearch_time_budget: int = 300 # seconds per experiment run
|
|
|
|
|
autoresearch_max_iterations: int = 100
|
|
|
|
|
autoresearch_metric: str = "val_bpb" # metric to optimise (lower = better)
|
|
|
|
|
|
2026-03-06 09:01:24 -05:00
|
|
|
# ── Local Hands (Shell + Git) ──────────────────────────────────────
|
|
|
|
|
# Enable local shell/git execution hands.
|
|
|
|
|
hands_shell_enabled: bool = True
|
|
|
|
|
# Default timeout in seconds for shell commands.
|
|
|
|
|
hands_shell_timeout: int = 60
|
|
|
|
|
# Comma-separated additional command prefixes to allow.
|
|
|
|
|
hands_shell_extra_allowed: str = ""
|
|
|
|
|
# Enable the git hand for version-control operations.
|
|
|
|
|
hands_git_enabled: bool = True
|
|
|
|
|
# Default timeout for git operations.
|
|
|
|
|
hands_git_timeout: int = 60
|
|
|
|
|
|
2026-02-27 19:51:37 -05:00
|
|
|
# ── Error Logging ─────────────────────────────────────────────────
|
|
|
|
|
error_log_enabled: bool = True
|
|
|
|
|
error_log_dir: str = "logs"
|
|
|
|
|
error_log_max_bytes: int = 5_242_880 # 5 MB
|
|
|
|
|
error_log_backup_count: int = 5
|
|
|
|
|
error_feedback_enabled: bool = True # Auto-create bug report tasks
|
|
|
|
|
error_dedup_window_seconds: int = 300 # 5-min dedup window
|
|
|
|
|
|
2026-02-26 17:06:00 +00:00
|
|
|
# ── Scripture / Biblical Integration ──────────────────────────────
|
Claude/remove persona system f vgt m (#126)
* Remove persona system, identity, and all Timmy references
Strip the codebase to pure orchestration logic:
- Delete TIMMY_IDENTITY.md and memory/self/identity.md
- Gut brain/identity.py to no-op stubs (empty returns)
- Remove all system prompts reinforcing Timmy's character, faith,
sovereignty, sign-off ("Sir, affirmative"), and agent roster
- Replace identity-laden prompts with generic local-AI-assistant prompts
- Remove "You work for Timmy" from all sub-agent system prompts
- Rename PersonaTools → AgentTools, PERSONA_TOOLKITS → AGENT_TOOLKITS
- Replace "timmy" agent ID with "orchestrator" across routes, marketplace,
tools catalog, and orchestrator class
- Strip Timmy references from config comments, templates, telegram bot,
chat API, and dashboard UI
- Delete tests/brain/test_identity.py entirely
- Fix all test assertions that checked for persona identity content
729 tests pass (2 pre-existing failures in test_calm.py unrelated).
https://claude.ai/code/session_01LjQGUE6nk9W9674zaxrYxy
* Add Taskosaur (PM + AI task execution) to docker-compose
Spins up Taskosaur alongside the dashboard on `docker compose up`:
- postgres:16-alpine (port 5432, Taskosaur DB)
- redis:7-alpine (Bull queue backend)
- taskosaur (ports 3000 API / 3001 UI)
- dashboard now depends_on taskosaur healthy
- TASKOSAUR_API_URL injected into dashboard environment
Dashboard can reach Taskosaur at http://taskosaur:3000/api on the
internal network. Frontend UI accessible at http://localhost:3001.
https://claude.ai/code/session_01LjQGUE6nk9W9674zaxrYxy
---------
Co-authored-by: Claude <noreply@anthropic.com>
2026-03-04 12:00:49 -05:00
|
|
|
# Enable the biblical text module.
|
2026-02-26 17:06:00 +00:00
|
|
|
scripture_enabled: bool = True
|
|
|
|
|
# Primary translation for retrieval and citation.
|
|
|
|
|
scripture_translation: str = "ESV"
|
|
|
|
|
# Meditation mode: sequential | thematic | lectionary
|
|
|
|
|
scripture_meditation_mode: str = "sequential"
|
|
|
|
|
# Background meditation interval in seconds (0 = disabled).
|
|
|
|
|
scripture_meditation_interval: int = 0
|
|
|
|
|
|
2026-02-26 23:39:13 -05:00
|
|
|
def _compute_repo_root(self) -> str:
    """Return the repository root directory.

    An explicitly configured ``repo_root`` always wins.  Otherwise the
    directory containing this file and each of its ancestors are searched,
    nearest first, for a ``.git`` entry.

    Returns:
        The configured ``repo_root`` if it is non-empty; else the nearest
        directory at or above this file that contains ``.git``; else the
        current working directory.
    """
    if self.repo_root:
        return self.repo_root

    # Start at this file's own directory rather than two levels above it:
    # skipping levels steps over the project root (and its .git) whenever
    # this module sits directly under src/.
    path = os.path.dirname(os.path.abspath(__file__))
    while True:
        # ".git" is a directory in a normal clone but a plain file in
        # worktrees and submodules, so test existence rather than isdir.
        if os.path.exists(os.path.join(path, ".git")):
            return path
        parent = os.path.dirname(path)
        if parent == path:  # reached the filesystem root
            break
        path = parent

    # No .git found anywhere above this file.
    return os.getcwd()
|
|
|
|
|
|
2026-02-19 19:31:48 +00:00
|
|
|
model_config = SettingsConfigDict(
|
|
|
|
|
env_file=".env",
|
|
|
|
|
env_file_encoding="utf-8",
|
|
|
|
|
extra="ignore",
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
settings = Settings()
|
2026-02-26 23:39:13 -05:00
|
|
|
# Ensure repo_root is computed if not set
|
|
|
|
|
if not settings.repo_root:
|
|
|
|
|
settings.repo_root = settings._compute_repo_root()
|
2026-02-25 18:19:22 +00:00
|
|
|
|
2026-02-26 13:42:36 -05:00
|
|
|
# ── Model fallback configuration ────────────────────────────────────────────
|
|
|
|
|
# Primary model: qwen3.5:latest (better reasoning and tool calling)
|
2026-03-11 18:36:42 -04:00
|
|
|
# Fallback if primary not available: llama3.1:8b-instruct
|
|
|
|
|
OLLAMA_MODEL_PRIMARY: str = "qwen3.5:latest"
|
2026-03-07 18:20:34 -05:00
|
|
|
OLLAMA_MODEL_FALLBACK: str = "llama3.1:8b-instruct"
|
2026-02-26 13:42:36 -05:00
|
|
|
|
|
|
|
|
|
|
|
|
|
def check_ollama_model_available(model_name: str) -> bool:
    """Check if a specific Ollama model is available locally.

    Sends ``GET {settings.ollama_url}/api/tags`` (5 second timeout) and
    compares ``model_name`` with the ``name`` of every model in the response.
    A listed model matches when any of the following holds:

    * its name equals ``model_name`` exactly,
    * its name without the ``:tag`` suffix equals ``model_name``,
    * its name starts with ``model_name``.

    Args:
        model_name: Model name to look for, with or without a tag.

    Returns:
        True if a listed model matches. False if ``model_name`` is empty,
        nothing matches, or the request or response parsing fails for any
        reason; this function never raises.
    """
    # An empty name would prefix-match every installed model below and be
    # reported as "available", so reject it up front.
    if not model_name:
        return False

    try:
        import json
        import urllib.request

        # NOTE(review): "localhost" is rewritten to the IPv4 loopback address,
        # presumably to avoid IPv6 resolution of localhost — confirm.
        url = settings.ollama_url.replace("localhost", "127.0.0.1")
        req = urllib.request.Request(
            f"{url}/api/tags",
            method="GET",
            headers={"Accept": "application/json"},
        )
        with urllib.request.urlopen(req, timeout=5) as response:
            data = json.loads(response.read().decode())

        # Tolerate a null "models" list or a null "name" on an entry instead
        # of letting one malformed entry fail the whole check.
        installed = [(entry.get("name") or "") for entry in (data.get("models") or [])]
        return any(
            model_name == name
            or model_name == name.split(":")[0]
            or name.startswith(model_name)
            for name in installed
        )
    except Exception:
        # Deliberate best-effort: an unreachable server or an unexpected
        # payload simply means "not available".
        return False
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def get_effective_ollama_model() -> str:
    """Get the effective Ollama model, with fallback logic.

    Candidates are tried in this order, and the first one that
    ``check_ollama_model_available`` reports as available is returned:

    1. ``settings.ollama_model`` (the configured model),
    2. ``OLLAMA_MODEL_PRIMARY``,
    3. ``OLLAMA_MODEL_FALLBACK``.

    A warning is logged whenever the result differs from the configured
    model. A candidate equal to the configured model is not probed a second
    time, since the first probe already found it unavailable and each probe
    can block for the length of the HTTP timeout.

    Returns:
        The name of the model to use. If no candidate is available, the
        configured model is returned unchanged as a last resort.
    """
    user_model = settings.ollama_model

    # The configured model wins whenever it is installed.
    if check_ollama_model_available(user_model):
        return user_model

    # Try primary (skip if it is the model that was just found unavailable).
    if user_model != OLLAMA_MODEL_PRIMARY and check_ollama_model_available(
        OLLAMA_MODEL_PRIMARY
    ):
        _startup_logger.warning(
            "Requested model '%s' not available. Using primary: %s",
            user_model,
            OLLAMA_MODEL_PRIMARY,
        )
        return OLLAMA_MODEL_PRIMARY

    # Try fallback (same de-duplication as above).
    if user_model != OLLAMA_MODEL_FALLBACK and check_ollama_model_available(
        OLLAMA_MODEL_FALLBACK
    ):
        _startup_logger.warning(
            "Primary model '%s' not available. Using fallback: %s",
            OLLAMA_MODEL_PRIMARY,
            OLLAMA_MODEL_FALLBACK,
        )
        return OLLAMA_MODEL_FALLBACK

    # Last resort - return user's setting and hope for the best
    return user_model
|
|
|
|
|
|
|
|
|
|
|
2026-02-25 18:19:22 +00:00
|
|
|
# ── Startup validation ───────────────────────────────────────────────────────
|
|
|
|
|
_startup_logger = _logging.getLogger("config")
|
2026-03-08 16:07:02 -04:00
|
|
|
_startup_validated = False
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def validate_startup(*, force: bool = False) -> None:
    """Check that required security secrets are configured.

    Intended to be called from application entry points rather than at
    import time. The check runs at most once per process unless
    ``force=True`` is passed.

    * Test mode (``TIMMY_TEST_MODE=1``): skipped unless ``force=True``.
    * Production (``settings.timmy_env == "production"``): logs an error and
      calls ``sys.exit(1)`` if any required secret is missing.
    * Any other environment: logs a warning for each missing secret.
    """
    global _startup_validated

    # Nothing to do when validation already ran or we are in test mode,
    # unless the caller explicitly forces a re-check.
    if not force and (_startup_validated or os.environ.get("TIMMY_TEST_MODE") == "1"):
        _startup_validated = True
        return

    in_production = settings.timmy_env == "production"
    hmac_missing = not settings.l402_hmac_secret
    macaroon_missing = not settings.l402_macaroon_secret

    if in_production:
        absent = [
            env_name
            for env_name, is_missing in (
                ("L402_HMAC_SECRET", hmac_missing),
                ("L402_MACAROON_SECRET", macaroon_missing),
            )
            if is_missing
        ]
        if absent:
            _startup_logger.error(
                "PRODUCTION SECURITY ERROR: The following secrets must be set: %s\n"
                'Generate with: python3 -c "import secrets; print(secrets.token_hex(32))"\n'
                "Set in .env file or environment variables.",
                ", ".join(absent),
            )
            sys.exit(1)
        _startup_logger.info("Production mode: security secrets validated ✓")
    else:
        if hmac_missing:
            _startup_logger.warning(
                "SEC: L402_HMAC_SECRET is not set — "
                "set a unique secret in .env before deploying to production."
            )
        if macaroon_missing:
            _startup_logger.warning(
                "SEC: L402_MACAROON_SECRET is not set — "
                "set a unique secret in .env before deploying to production."
            )

    _startup_validated = True
|