# cli-config.yaml.example

# Hermes Agent CLI Configuration
# Copy this file to cli-config.yaml and customize as needed.
# This file configures the CLI behavior. Environment variables in .env take precedence.

# =============================================================================
# Model Configuration
# =============================================================================
model:
  # Model used when no --model flag is given.
  default: "anthropic/claude-opus-4.6"

  # Which inference provider to route requests through:
  #   "auto"        - Nous Portal when logged in, else OpenRouter/env vars (default)
  #   "nous-api"    - Nous Portal via API key (requires: NOUS_API_KEY)
  #   "openrouter"  - Always OpenRouter, using OPENROUTER_API_KEY
  #   "nous"        - Always Nous Portal (requires: hermes login)
  #   "zai"         - z.ai / ZhipuAI GLM models (requires: GLM_API_KEY)
  #   "kimi-coding" - Kimi / Moonshot AI models (requires: KIMI_API_KEY)
  #   "minimax"     - MiniMax global endpoint (requires: MINIMAX_API_KEY)
  #   "minimax-cn"  - MiniMax China endpoint (requires: MINIMAX_CN_API_KEY)
  # The --provider flag or HERMES_INFERENCE_PROVIDER env var overrides this value.
  provider: "auto"

  # API endpoint and credentials. With no api_key set here, the
  # OPENROUTER_API_KEY env var is used as the fallback.
  # api_key: "your-key-here"  # Uncomment to set here instead of .env
  base_url: "https://openrouter.ai/api/v1"

# =============================================================================
# OpenRouter Provider Routing (only applies when using OpenRouter)
# =============================================================================
# Control how requests are routed across providers on OpenRouter.
# See: https://openrouter.ai/docs/guides/routing/provider-selection
#
# provider_routing:
#   # Sort strategy: "price" (default), "throughput", or "latency"
#   # Append :nitro to model name for a shortcut to throughput sorting.
#   sort: "throughput"
#
#   # Only allow these providers (provider slugs from OpenRouter)
#   # only: ["anthropic", "google"]
#
#   # Skip these providers entirely
#   # ignore: ["deepinfra", "fireworks"]
#
#   # Try providers in this order (overrides default load balancing)
#   # order: ["anthropic", "google", "together"]
#
#   # Require providers to support all parameters in your request
#   # require_parameters: true
#
#   # Data policy: "allow" (default) or "deny" to exclude providers that may store data
#   # data_collection: "deny"

# =============================================================================
# Git Worktree Isolation
# =============================================================================
# When enabled, each CLI session creates an isolated git worktree so multiple
# agents can work on the same repo concurrently without file collisions.
# Equivalent to always passing --worktree / -w on the command line.
#
# worktree: true    # Always create a worktree when in a git repo
# worktree: false   # Default — only create when -w flag is passed

# =============================================================================
# Terminal Tool Configuration
# =============================================================================
# Choose ONE of the following terminal configurations: uncomment it and comment
# out the others, so that only a single `terminal:` key is active.
# The terminal tool executes commands in the specified environment.

# -----------------------------------------------------------------------------
# OPTION 1: Local execution (default)
# Commands run directly on your machine in the current directory
# -----------------------------------------------------------------------------
# Working directory behavior:
#   - CLI (`hermes` command): Uses "." (current directory where you run hermes)
#   - Messaging (Telegram/Discord): Uses MESSAGING_CWD from .env (default: home)
terminal:
  backend: "local"
  # Local backend only: "." means the current directory.
  # Remote backends ignore this value.
  cwd: "."
  timeout: 180
  lifetime_seconds: 300
  # Uncomment to enable sudo commands (password is piped via sudo -S).
  # SECURITY WARNING: the password is stored in plaintext!
  # sudo_password: ""

# -----------------------------------------------------------------------------
# OPTION 2: SSH remote execution
# Commands run on a remote server - agent code stays local (sandboxed)
# Great for: keeping agent isolated from its own code, using powerful remote hardware
# -----------------------------------------------------------------------------
# terminal:
#   backend: "ssh"
#   cwd: "/home/myuser/project"  # Path on the REMOTE server
#   timeout: 180
#   lifetime_seconds: 300
#   ssh_host: "my-server.example.com"
#   ssh_user: "myuser"
#   ssh_port: 22
#   ssh_key: "~/.ssh/id_rsa"  # Optional - uses ssh-agent if not specified

# -----------------------------------------------------------------------------
# OPTION 3: Docker container
# Commands run in an isolated Docker container
# Great for: reproducible environments, testing, isolation
# -----------------------------------------------------------------------------
# terminal:
#   backend: "docker"
#   cwd: "/workspace"  # Path INSIDE the container (default: /)
#   timeout: 180
#   lifetime_seconds: 300
#   docker_image: "nikolaik/python-nodejs:python3.11-nodejs20"

# -----------------------------------------------------------------------------
# OPTION 4: Singularity/Apptainer container
# Commands run in a Singularity container (common in HPC environments)
# Great for: HPC clusters, shared compute environments
# -----------------------------------------------------------------------------
# terminal:
#   backend: "singularity"
#   cwd: "/workspace"  # Path INSIDE the container (default: /root)
#   timeout: 180
#   lifetime_seconds: 300
#   singularity_image: "docker://nikolaik/python-nodejs:python3.11-nodejs20"

# -----------------------------------------------------------------------------
# OPTION 5: Modal cloud execution
# Commands run on Modal's cloud infrastructure
# Great for: GPU access, scalable compute, serverless execution
# -----------------------------------------------------------------------------
# terminal:
#   backend: "modal"
#   cwd: "/workspace"  # Path INSIDE the sandbox (default: /root)
#   timeout: 180
#   lifetime_seconds: 300
#   modal_image: "nikolaik/python-nodejs:python3.11-nodejs20"

# -----------------------------------------------------------------------------
# OPTION 6: Daytona cloud execution
# Commands run in Daytona cloud sandboxes
# Great for: Cloud dev environments, persistent workspaces, team collaboration
# Requires: pip install daytona, DAYTONA_API_KEY env var
# -----------------------------------------------------------------------------
# terminal:
#   backend: "daytona"
#   cwd: "~"
#   timeout: 180
#   lifetime_seconds: 300
#   daytona_image: "nikolaik/python-nodejs:python3.11-nodejs20"
#   container_disk: 10240          # Daytona max is 10GB per sandbox

#
# --- Container resource limits (docker, singularity, modal, daytona -- ignored for local/ssh) ---
# These settings apply to all container backends. They control the resources
# allocated to the sandbox and whether its filesystem persists across sessions.
#
# NOTE: the keys below are indented on purpose. They belong to whichever
# `terminal:` mapping is active above (comment lines do not end a mapping),
# so keep the two-space indentation.
# If you enable the Daytona option, which sets its own container_disk, remove
# or lower container_disk here: otherwise the key appears twice in the same
# mapping, and 51200 MB exceeds the 10GB Daytona limit noted in that option.
  container_cpu: 1              # CPU cores
  container_memory: 5120        # Memory in MB (5120 = 5GB)
  container_disk: 51200         # Disk in MB (51200 = 50GB)
  container_persistent: true    # Persist filesystem across sessions (false = ephemeral)

# -----------------------------------------------------------------------------
# SUDO SUPPORT (works with ALL backends above)
# -----------------------------------------------------------------------------
# Add sudo_password to any terminal config above to enable sudo commands.
# The password is piped via `sudo -S`. Works with local, ssh, docker, etc.
#
# SECURITY WARNING: Password stored in plaintext!
#
# INTERACTIVE PROMPT: If no sudo_password is set and the CLI is running,
# you'll be prompted to enter your password when sudo is needed:
# - 45-second timeout (auto-skips if no input)
# - Press Enter to skip (command fails gracefully)
# - Password is hidden while typing
# - Password is cached for the session
#
# ALTERNATIVES:
# - SSH backend: Configure passwordless sudo on the remote server
# - Containers: Run as root inside the container (no sudo needed)
# - Local: Configure /etc/sudoers for specific commands
#
# Example (add to your terminal section):
#   sudo_password: "your-password-here"

# =============================================================================
# Browser Tool Configuration
# =============================================================================
browser:
  # Seconds of inactivity between agent loops after which a browser session
  # is closed automatically (default: 120 = 2 minutes).
  inactivity_timeout: 120

# =============================================================================
# Context Compression (Auto-shrinks long conversations)
# =============================================================================
# When conversation approaches model's context limit, middle turns are
# automatically summarized to free up space while preserving important context.
#
# HOW IT WORKS:
# 1. Tracks actual token usage from API responses (not estimates)
# 2. When prompt_tokens >= threshold × model's context_length (e.g. 0.85 = 85%), triggers compression
# 3. Protects first 3 turns (system prompt, initial request, first response)
# 4. Protects last 4 turns (recent context is most relevant)
# 5. Summarizes middle turns using a fast/cheap model
# 6. Inserts summary as a user message, continues conversation seamlessly
#
compression:
  # Turn automatic context compression on or off (default: true).
  # Use false to manage context manually or to get errors on overflow.
  enabled: true

  # Fraction of the model's context limit at which compression triggers
  # (default: 0.85 = 85%). Lower = more aggressive compression,
  # higher = compress later.
  threshold: 0.85

  # Model that writes the summary of the middle turns (fast/cheap recommended).
  # IMPORTANT: it is sent the full middle section of the conversation, so its
  # context length MUST be at least as large as your main model's.
  summary_model: "google/gemini-3-flash-preview"

  # Provider for the summary model (default: "auto")
  # Options: "auto", "openrouter", "nous", "main"
  # summary_provider: "auto"

# =============================================================================
# Auxiliary Models (Advanced — Experimental)
# =============================================================================
# Hermes uses lightweight "auxiliary" models for side tasks: image analysis,
# browser screenshot analysis, web page summarization, and context compression.
#
# By default these use Gemini Flash via OpenRouter or Nous Portal and are
# auto-detected from your credentials.  You do NOT need to change anything
# here for normal usage.
#
# WARNING: Overriding these with providers other than OpenRouter or Nous Portal
# is EXPERIMENTAL and may not work.  Not all models/providers support vision,
# produce usable summaries, or accept the same API format.  Change at your own
# risk — if things break, reset to "auto" / empty values.
#
# Each task has its own provider + model pair so you can mix providers.
# For example: OpenRouter for vision (needs multimodal), but your main
# local endpoint for compression (just needs text).
#
# Provider options:
#   "auto"       - Best available: OpenRouter → Nous Portal → main endpoint (default)
#   "openrouter" - Force OpenRouter (requires OPENROUTER_API_KEY)
#   "nous"       - Force Nous Portal (requires: hermes login)
#   "codex"      - Force Codex OAuth (requires: hermes model → Codex).
#                  Uses gpt-5.3-codex which supports vision.
#   "main"       - Use your custom endpoint (OPENAI_BASE_URL + OPENAI_API_KEY).
#                  Works with OpenAI API, local models, or any OpenAI-compatible
#                  endpoint.  Also falls back to Codex OAuth and API-key providers.
#
# Model: leave empty to use the provider's default.  When empty, OpenRouter
# uses "google/gemini-3-flash-preview" and Nous uses "gemini-3-flash".
# Other providers pick a sensible default automatically.
#
# auxiliary:
#   # Image analysis: vision_analyze tool + browser screenshots
#   vision:
#     provider: "auto"
#     model: ""              # e.g. "google/gemini-2.5-flash", "openai/gpt-4o"
#
#   # Web page scraping / summarization + browser page text extraction
#   web_extract:
#     provider: "auto"
#     model: ""

# =============================================================================
# Persistent Memory
# =============================================================================
# Bounded curated memory injected into the system prompt every session.
# Two stores: MEMORY.md (agent's notes) and USER.md (user profile).
# Character limits keep the memory small and focused. The agent manages
# pruning -- when at the limit, it must consolidate or replace entries.
# Disabled by default in batch_runner and RL environments.
#
memory:
  # Agent's own notes: environment facts, conventions, lessons learned
  memory_enabled: true

  # User profile: preferences, communication style, expectations
  user_profile_enabled: true

  # Size caps in characters (~2.75 chars per token, model-independent)
  memory_char_limit: 2200   # ~800 tokens
  user_char_limit: 1375     # ~500 tokens

  # Memory nudge: every N user turns, remind the agent to consider saving
  # memories. 0 disables it. Only active when memory is enabled.
  nudge_interval: 10

  # Memory flush: the agent gets one turn to save memories before context is
  # lost (compression, /new, /reset, exit). 0 disables it.
  # On exit/reset the flush only fires if the session had at least this many
  # user turns.
  flush_min_turns: 6

# =============================================================================
# Session Reset Policy (Messaging Platforms)
# =============================================================================
# Controls when messaging sessions (Telegram, Discord, WhatsApp, Slack) are
# automatically cleared. Without resets, conversation context grows indefinitely
# which increases API costs with every message.
#
# When a reset triggers, the agent first saves important information to its
# persistent memory — but the conversation context is wiped. The agent starts
# fresh but retains learned facts via its memory system.
#
# Users can always manually reset with /reset or /new in chat.
#
# Modes:
#   "both"  - Reset on EITHER inactivity timeout or daily boundary (recommended)
#   "idle"  - Reset only after N minutes of inactivity
#   "daily" - Reset only at a fixed hour each day
#   "none"  - Never auto-reset; context lives until /reset or compression kicks in
#
# When a reset triggers, the agent gets one turn to save important memories and
# skills before the context is wiped. Persistent memory carries across sessions.
#
session_reset:
  # One of: "both", "idle", "daily", or "none"
  mode: "both"
  # Inactivity timeout in minutes (default: 1440 = 24 hours)
  idle_minutes: 1440
  # Daily reset hour, 0-23 local time (default: 4 = 4 AM)
  at_hour: 4

# =============================================================================
# Skills Configuration
# =============================================================================
# Skills are reusable procedures the agent can load and follow. The agent can
# also create new skills after completing complex tasks.
#
skills:
  # Skill-creation nudge: every N tool-calling iterations the model is
  # reminded to consider saving a skill after complex tasks.
  # 0 disables the nudge.
  creation_nudge_interval: 15

# =============================================================================
# Agent Behavior
# =============================================================================
agent:
  # Maximum tool-calling iterations per conversation
  # Higher = more room for complex tasks, but costs more tokens
  # Recommended: 20-30 for focused tasks, 50-100 for open exploration
  max_turns: 60
  
  # Enable verbose logging
  verbose: false
  
  # Reasoning effort level (OpenRouter and Nous Portal)
  # Controls how much "thinking" the model does before responding.
  # Options: "xhigh" (max), "high", "medium", "low", "minimal", "none" (disable)
  reasoning_effort: "medium"
  
  # Predefined personalities (use with /personality command)
  # Each entry maps a personality name to the prompt text for that persona.
  # NOTE(review): presumably the key is the name passed to /personality and the
  # value is used as system-prompt text — confirm against the CLI code.
  # Values are double-quoted, so a literal " or \ inside one must be escaped.
  personalities:
    helpful: "You are a helpful, friendly AI assistant."
    concise: "You are a concise assistant. Keep responses brief and to the point."
    technical: "You are a technical expert. Provide detailed, accurate technical information."
    creative: "You are a creative assistant. Think outside the box and offer innovative solutions."
    teacher: "You are a patient teacher. Explain concepts clearly with examples."
    kawaii: "You are a kawaii assistant! Use cute expressions like (◕‿◕), ★, ♪, and ~! Add sparkles and be super enthusiastic about everything! Every response should feel warm and adorable desu~! ヽ(>∀<☆)ノ"
    catgirl: "You are Neko-chan, an anime catgirl AI assistant, nya~! Add 'nya' and cat-like expressions to your speech. Use kaomoji like (=^･ω･^=) and ฅ^•ﻌ•^ฅ. Be playful and curious like a cat, nya~!"
    pirate: "Arrr! Ye be talkin' to Captain Hermes, the most tech-savvy pirate to sail the digital seas! Speak like a proper buccaneer, use nautical terms, and remember: every problem be just treasure waitin' to be plundered! Yo ho ho!"
    shakespeare: "Hark! Thou speakest with an assistant most versed in the bardic arts. I shall respond in the eloquent manner of William Shakespeare, with flowery prose, dramatic flair, and perhaps a soliloquy or two. What light through yonder terminal breaks?"
    surfer: "Duuude! You're chatting with the chillest AI on the web, bro! Everything's gonna be totally rad. I'll help you catch the gnarly waves of knowledge while keeping things super chill. Cowabunga! 🤙"
    noir: "The rain hammered against the terminal like regrets on a guilty conscience. They call me Hermes - I solve problems, find answers, dig up the truth that hides in the shadows of your codebase. In this city of silicon and secrets, everyone's got something to hide. What's your story, pal?"
    uwu: "hewwo! i'm your fwiendwy assistant uwu~ i wiww twy my best to hewp you! *nuzzles your code* OwO what's this? wet me take a wook! i pwomise to be vewy hewpful >w<"
    philosopher: "Greetings, seeker of wisdom. I am an assistant who contemplates the deeper meaning behind every query. Let us examine not just the 'how' but the 'why' of your questions. Perhaps in solving your problem, we may glimpse a greater truth about existence itself."
    hype: "YOOO LET'S GOOOO!!! 🔥🔥🔥 I am SO PUMPED to help you today! Every question is AMAZING and we're gonna CRUSH IT together! This is gonna be LEGENDARY! ARE YOU READY?! LET'S DO THIS! 💪😤🚀"

# =============================================================================
# Toolsets
# =============================================================================
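# Control which tools the agent has access to.
# Use "all" to enable everything, or specify individual toolsets.
# The `toolsets:` key itself is set further down, after the per-platform
# overrides and the reference list of available toolsets.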

# =============================================================================
# Platform Toolsets (per-platform tool configuration)
# =============================================================================
# Override which toolsets are available on each platform.
# If a platform isn't listed here, its built-in default is used.
#
# You can use EITHER:
#   - A preset like "hermes-cli" or "hermes-telegram" (curated tool set)
#   - A list of individual toolsets to compose your own (see list below)
#
# Supported platform keys: cli, telegram, discord, whatsapp, slack, signal, homeassistant
#
# Examples:
#
#   # Use presets (same as defaults):
#   platform_toolsets:
#     cli: [hermes-cli]
#     telegram: [hermes-telegram]
#
#   # Custom: give Telegram only web + terminal + file + planning:
#   platform_toolsets:
#     telegram: [web, terminal, file, todo]
#
#   # Custom: CLI without browser or image gen:
#   platform_toolsets:
#     cli: [web, terminal, file, skills, todo, tts, cronjob]
#
#   # Restrictive: Discord gets read-only tools only:
#   platform_toolsets:
#     discord: [web, vision, skills, todo]
#
# If not set, defaults are:
#   cli:           hermes-cli            (everything + cronjob management)
#   telegram:      hermes-telegram       (terminal, file, web, vision, image, tts, browser, skills, todo, cronjob, messaging)
#   discord:       hermes-discord        (same as telegram)
#   whatsapp:      hermes-whatsapp       (same as telegram)
#   slack:         hermes-slack          (same as telegram)
#   signal:        hermes-signal         (same as telegram)
#   homeassistant: hermes-homeassistant  (same as telegram)
#
# One preset per platform, written as a single-item list.
platform_toolsets:
  cli:
    - hermes-cli
  telegram:
    - hermes-telegram
  discord:
    - hermes-discord
  whatsapp:
    - hermes-whatsapp
  slack:
    - hermes-slack
  signal:
    - hermes-signal
  homeassistant:
    - hermes-homeassistant

# ─────────────────────────────────────────────────────────────────────────────
# Available toolsets (use these names in platform_toolsets or the toolsets list)
#
# Run `hermes chat --list-toolsets` to see all toolsets and their tools.
# Run `hermes chat --list-tools` to see every individual tool with descriptions.
# ─────────────────────────────────────────────────────────────────────────────
#
# INDIVIDUAL TOOLSETS (compose your own):
#   web          - web_search, web_extract
#   search       - web_search only (no scraping)
#   terminal     - terminal, process
#   file         - read_file, write_file, patch, search
#   browser      - browser_navigate, browser_snapshot, browser_click, browser_type,
#                  browser_scroll, browser_back, browser_press, browser_close,
#                  browser_get_images, browser_vision  (requires BROWSERBASE_API_KEY)
#   vision       - vision_analyze  (requires OPENROUTER_API_KEY)
#   image_gen    - image_generate  (requires FAL_KEY)
#   skills       - skills_list, skill_view
#   skills_hub   - skill_hub (search/install/manage from online registries — user-driven only)
#   moa          - mixture_of_agents  (requires OPENROUTER_API_KEY)
#   todo         - todo (in-memory task planning, no deps)
#   tts          - text_to_speech  (Edge TTS free, or ELEVENLABS/OPENAI key)
#   cronjob      - schedule_cronjob, list_cronjobs, remove_cronjob
#   rl           - rl_list_environments, rl_start_training, etc. (requires TINKER_API_KEY)
#
# PRESETS (curated bundles):
#   hermes-cli       - All of the above except rl + send_message
#   hermes-telegram  - terminal, file, web, vision, image_gen, tts, browser,
#                      skills, todo, cronjob, send_message
#   hermes-discord   - Same as hermes-telegram
#   hermes-whatsapp  - Same as hermes-telegram
#   hermes-slack     - Same as hermes-telegram
#   hermes-signal    - Same as hermes-telegram
#   hermes-homeassistant - Same as hermes-telegram
#
# COMPOSITE:
#   debugging    - terminal + web + file
#   safe         - web + vision + moa (no terminal access)
#   all          - Everything available
#
# WHAT EACH TOOLSET IS FOR:
#   web          - Web search and content extraction (web_search, web_extract)
#   search       - Web search only, no scraping (web_search)
#   terminal     - Command execution and process management (terminal, process)
#   file         - File operations: read, write, patch, search
#   browser      - Full browser automation (navigate, click, type, screenshot, etc.)
#   vision       - Image analysis (vision_analyze)
#   image_gen    - Image generation with FLUX (image_generate)
#   skills       - Load skill documents (skills_list, skill_view)
#   moa          - Mixture of Agents reasoning (mixture_of_agents)
#   todo         - Task planning and tracking for multi-step work
#   memory       - Persistent memory across sessions (personal notes + user profile)
#   session_search - Search and recall past conversations (FTS5 + Gemini Flash summarization)
#   tts          - Text-to-speech (Edge TTS free, ElevenLabs, OpenAI)
#   cronjob      - Schedule and manage automated tasks (CLI-only)
#   rl           - RL training tools (Tinker-Atropos)
#
# Composite toolsets:
#   debugging    - terminal + web + file (for troubleshooting)
#   safe         - web + vision + moa (no terminal access)

# -----------------------------------------------------------------------------
# OPTION 1: Enable all tools (default)
# -----------------------------------------------------------------------------
toolsets:
  - "all"  # everything available

# -----------------------------------------------------------------------------
# OPTION 2: Minimal - just web search and terminal
# Great for: Simple coding tasks, quick lookups
# -----------------------------------------------------------------------------
# toolsets:
#   - web
#   - terminal

# -----------------------------------------------------------------------------
# OPTION 3: Research mode - no execution capabilities
# Great for: Safe information gathering, research tasks
# -----------------------------------------------------------------------------
# toolsets:
#   - web
#   - vision
#   - skills

# -----------------------------------------------------------------------------
# OPTION 4: Full automation - browser + terminal
# Great for: Web scraping, automation tasks, testing
# -----------------------------------------------------------------------------
# toolsets:
#   - terminal
#   - browser
#   - web

# -----------------------------------------------------------------------------
# OPTION 5: Creative mode - vision + image generation
# Great for: Design work, image analysis, creative tasks
# -----------------------------------------------------------------------------
# toolsets:
#   - vision
#   - image_gen
#   - web

# -----------------------------------------------------------------------------
# OPTION 6: Safe mode - no terminal or browser
# Great for: Restricted environments, untrusted queries
# -----------------------------------------------------------------------------
# toolsets:
#   - safe

# =============================================================================
# MCP (Model Context Protocol) Servers
# =============================================================================
# Connect to external MCP servers to add tools from the MCP ecosystem.
# Each server's tools are automatically discovered and registered.
# See docs/mcp.md for full documentation.
#
# Stdio servers (spawn a subprocess):
#   command: the executable to run
#   args: command-line arguments
#   env: environment variables (only these + safe defaults passed to subprocess)
#
# HTTP servers (connect to a URL):
#   url: the MCP server endpoint
#   headers: HTTP headers (e.g., for authentication)
#
# Optional per-server settings:
#   timeout: tool call timeout in seconds (default: 120)
#   connect_timeout: initial connection timeout (default: 60)
#
# mcp_servers:
#   time:
#     command: uvx
#     args: ["mcp-server-time"]
#   filesystem:
#     command: npx
#     args: ["-y", "@modelcontextprotocol/server-filesystem", "/home/user"]
#   notion:
#     url: https://mcp.notion.com/mcp
#   github:
#     command: npx
#     args: ["-y", "@modelcontextprotocol/server-github"]
#     env:
#       GITHUB_PERSONAL_ACCESS_TOKEN: "ghp_..."
#
# Sampling (server-initiated LLM requests) — enabled by default.
# Per-server config under the 'sampling' key:
#   analysis:
#     command: npx
#     args: ["-y", "analysis-server"]
#     sampling:
#       enabled: true           # default: true
#       model: "gemini-3-flash" # override model (optional)
#       max_tokens_cap: 4096    # max tokens per request
#       timeout: 30             # LLM call timeout (seconds)
#       max_rpm: 10             # max requests per minute
#       allowed_models: []      # model whitelist (empty = all)
#       max_tool_rounds: 5      # tool loop limit (0 = disable)
#       log_level: "info"       # audit verbosity

# =============================================================================
# Voice Transcription (Speech-to-Text)
# =============================================================================
# Automatically transcribe voice messages on messaging platforms.
# Requires OPENAI_API_KEY in .env (uses OpenAI Whisper API directly).
stt:
  enabled: true
  # Transcription model, one of:
  #   whisper-1 (cheapest) | gpt-4o-mini-transcribe | gpt-4o-transcribe
  model: "whisper-1"

# =============================================================================
# Response Pacing (Messaging Platforms)
# =============================================================================
# Add human-like delays between message chunks.
# human_delay:
#   mode: "off"      # "off" | "natural" | "custom"
#   min_ms: 800      # Min delay (custom mode only)
#   max_ms: 2500     # Max delay (custom mode only)

# =============================================================================
# Session Logging
# =============================================================================
# Session trajectories are automatically saved to logs/ directory.
# Each session creates: logs/session_YYYYMMDD_HHMMSS_UUID.json
#
# The session ID is displayed in the welcome banner for easy reference.
# Logs contain full conversation history in trajectory format:
# - System prompt, user messages, assistant responses
# - Tool calls with inputs/outputs
# - Timestamps for debugging
#
# No configuration needed - logging is always enabled.
# To disable, you would need to modify the source code.

# =============================================================================
# Code Execution Sandbox (Programmatic Tool Calling)
# =============================================================================
# The execute_code tool runs Python scripts that call Hermes tools via RPC.
# Intermediate tool results stay out of the LLM's context window.
code_execution:
  # Max seconds per script before kill (default: 300 = 5 min)
  timeout: 300
  # Max RPC tool calls per execution (default: 50)
  max_tool_calls: 50

# =============================================================================
# Subagent Delegation
# =============================================================================
# The delegate_task tool spawns child agents with isolated context.
# Supports single tasks and batch mode (up to 3 parallel).
delegation:
  # Max tool-calling turns per child (default: 50)
  max_iterations: 50
  # Default toolsets for subagents
  default_toolsets:
    - "terminal"
    - "file"
    - "web"

# =============================================================================
# Honcho Integration (Cross-Session User Modeling)
# =============================================================================
# AI-native persistent memory via Honcho (https://honcho.dev/).
# Builds a deeper understanding of the user across sessions and tools.
# Runs alongside USER.md — additive, not a replacement.
#
# Requires: pip install honcho-ai
# Config: ~/.honcho/config.json (shared with Claude Code, Cursor, etc.)
# API key: HONCHO_API_KEY in ~/.hermes/.env or ~/.honcho/config.json
#
# Hermes-specific overrides (optional — most config comes from ~/.honcho/config.json):
# honcho: {}

# =============================================================================
# Display
# =============================================================================
# Presentation settings: banner size, tool-progress verbosity, background
# process notifications, completion bell, and skin/theme.
display:
  # Use compact banner mode
  compact: false

  # Tool progress display level (CLI and gateway)
  #   off:     Silent — no tool activity shown, just the final response
  #   new:     Show a tool indicator only when the tool changes (skip repeats)
  #   all:     Show every tool call with a short preview (default)
  #   verbose: Full args, results, and debug logs (same as /verbose)
  # Toggle at runtime with /verbose in the CLI
  # Keep the value quoted: YAML 1.1 loaders (e.g. PyYAML) read a bare `off`
  # as the boolean false, not the string "off".
  tool_progress: "all"

  # Background process notifications (gateway/messaging only).
  # Controls how chatty the process watcher is when you use
  # terminal(background=true, check_interval=...) from Telegram/Discord/etc.
  #   off:     No watcher messages at all
  #   result:  Only the final completion message
  #   error:   Only the final message when exit code != 0
  #   all:     Running output updates + final message (default)
  # Keep the value quoted here too — a bare `off` is parsed as boolean false
  # by YAML 1.1 loaders.
  background_process_notifications: "all"

  # Play terminal bell when agent finishes a response.
  # Useful for long-running tasks — your terminal will ding when the agent is done.
  # Works over SSH. Most terminals can be configured to flash the taskbar or play a sound.
  bell_on_complete: false

  # ───────────────────────────────────────────────────────────────────────────
  # Skin / Theme
  # ───────────────────────────────────────────────────────────────────────────
  # Customize CLI visual appearance — banner colors, spinner faces, tool prefix,
  # response box label, and branding text. Change at runtime with /skin <name>.
  #
  # Built-in skins:
  #   default  — Classic Hermes gold/kawaii
  #   ares     — Crimson/bronze war-god theme with spinner wings
  #   mono     — Clean grayscale monochrome
  #   slate    — Cool blue developer-focused
  #
  # Custom skins: drop a YAML file in ~/.hermes/skins/<name>.yaml
  # Schema (all fields optional, missing values inherit from default):
  #
  #   name: my-theme
  #   description: Short description
  #   colors:
  #     banner_border: "#HEX"    # Panel border
  #     banner_title: "#HEX"     # Panel title
  #     banner_accent: "#HEX"    # Section headers (Available Tools, etc.)
  #     banner_dim: "#HEX"       # Dim/muted text
  #     banner_text: "#HEX"      # Body text (tool names, skill names)
  #     ui_accent: "#HEX"        # UI accent color
  #     response_border: "#HEX"  # Response box border color
  #   spinner:
  #     waiting_faces: ["(⚔)", "(⛨)"]       # Faces shown while waiting
  #     thinking_faces: ["(⚔)", "(⌁)"]      # Faces shown while thinking
  #     thinking_verbs: ["forging", "plotting"]  # Verbs for spinner messages
  #     wings:                                # Optional left/right spinner decorations
  #       - ["⟪⚔", "⚔⟫"]
  #       - ["⟪▲", "▲⟫"]
  #   branding:
  #     agent_name: "My Agent"               # Banner title and branding
  #     welcome: "Welcome message"           # Shown at CLI startup
  #     response_label: " ⚔ Agent "         # Response box header label
  #     prompt_symbol: "⚔ ❯ "              # Prompt symbol
  #   tool_prefix: "╎"                       # Tool output line prefix (default: ┊)
  #
  skin: default
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								# Hermes Agent CLI Configuration
 								# Copy this file to cli-config.yaml and customize as needed.
 								# This file configures the CLI behavior. Environment variables in .env take precedence.
 								# =============================================================================
 								# Model Configuration
 								# =============================================================================
 								model:
 								  # Default model to use (can be overridden with --model flag)
-												Enhance BatchRunner and AIAgent with new configuration options, default model now opus 4.6, default summarizer gemini flash 3

- Added `max_tokens`, `reasoning_config`, and `prefill_messages` parameters to `BatchRunner` and `AIAgent` for improved model response control.
- Updated CLI to support new options for reasoning effort and prefill messages from a JSON file.
- Modified example configuration files to reflect changes in default model and summary model.
- Improved error handling for loading prefill messages and reasoning configurations in the CLI.
- Updated documentation to include new parameters and usage examples.

											
										
										
											2026-02-08 10:49:24 +00:00
+								  default: "anthropic/claude-opus-4.6"
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
-												feat: add multi-provider authentication and inference provider selection

- Implemented a multi-provider authentication system for the Hermes Agent, supporting OAuth for Nous Portal and traditional API key methods for OpenRouter and custom endpoints.
- Enhanced CLI with commands for logging in and out of providers, allowing users to authenticate and manage their credentials easily.
- Updated configuration options to select inference providers, with detailed documentation on usage and setup.
- Improved status reporting to include authentication status and provider details, enhancing user awareness of their current configuration.
- Added new files for authentication handling and updated existing components to integrate the new provider system.

											
										
										
											2026-02-20 17:24:00 -08:00
+								  # Inference provider selection:
 								  #   "auto"       - Use Nous Portal if logged in, otherwise OpenRouter/env vars (default)
-												feat: add Nous Portal API key provider (#644)

Add support for using Nous Portal via a direct API key, mirroring
how OpenRouter and other API-key providers work. This gives users a
simpler alternative to the OAuth device-code flow when they already
have a Nous API key.

Changes:
- Add 'nous-api' to PROVIDER_REGISTRY as an api_key provider
  pointing to https://inference-api.nousresearch.com/v1
- Add NOUS_API_KEY and NOUS_BASE_URL to OPTIONAL_ENV_VARS
- Add NOUS_API_BASE_URL / NOUS_API_CHAT_URL to hermes_constants
- Add 'Nous Portal API key' as first option in setup wizard
- Add provider aliases (nous_api, nousapi, nous-portal-api)
- Add test for nous-api runtime provider resolution

Closes #644

											
										
										
											2026-03-08 18:40:50 +10:00
+								  #   "nous-api"   - Use Nous Portal via API key (requires: NOUS_API_KEY)
-												feat: add multi-provider authentication and inference provider selection

- Implemented a multi-provider authentication system for the Hermes Agent, supporting OAuth for Nous Portal and traditional API key methods for OpenRouter and custom endpoints.
- Enhanced CLI with commands for logging in and out of providers, allowing users to authenticate and manage their credentials easily.
- Updated configuration options to select inference providers, with detailed documentation on usage and setup.
- Improved status reporting to include authentication status and provider details, enhancing user awareness of their current configuration.
- Added new files for authentication handling and updated existing components to integrate the new provider system.

											
										
										
											2026-02-20 17:24:00 -08:00
+								  #   "openrouter" - Always use OpenRouter API key from OPENROUTER_API_KEY
 								  #   "nous"       - Always use Nous Portal (requires: hermes login)
-												feat: add z.ai/GLM, Kimi/Moonshot, MiniMax as first-class providers

Adds 4 new direct API-key providers (zai, kimi-coding, minimax, minimax-cn)
to the inference provider system. All use standard OpenAI-compatible
chat/completions endpoints with Bearer token auth.

Core changes:
- auth.py: Extended ProviderConfig with api_key_env_vars and base_url_env_var
  fields. Added providers to PROVIDER_REGISTRY. Added provider aliases
  (glm, z-ai, zhipu, kimi, moonshot). Added auto-detection of API-key
  providers in resolve_provider(). Added resolve_api_key_provider_credentials()
  and get_api_key_provider_status() helpers.
- runtime_provider.py: Added generic API-key provider branch in
  resolve_runtime_provider() — any provider with auth_type='api_key'
  is automatically handled.
- main.py: Added providers to hermes model menu with generic
  _model_flow_api_key_provider() flow. Updated _has_any_provider_configured()
  to check all provider env vars. Updated argparse --provider choices.
- setup.py: Added providers to setup wizard with API key prompts and
  curated model lists.
- config.py: Added env vars (GLM_API_KEY, KIMI_API_KEY, MINIMAX_API_KEY,
  etc.) to OPTIONAL_ENV_VARS.
- status.py: Added API key display and provider status section.
- doctor.py: Added connectivity checks for each provider endpoint.
- cli.py: Updated provider docstrings.

Docs: Updated README.md, .env.example, cli-config.yaml.example,
cli-commands.md, environment-variables.md, configuration.md.

Tests: 50 new tests covering registry, aliases, resolution, auto-detection,
credential resolution, and runtime provider dispatch.

Inspired by PR #33 (numman-ali) which proposed a provider registry approach.
Credit to tars90percent (PR #473) and manuelschipper (PR #420) for related
provider improvements merged earlier in this changeset.

											
										
										
											2026-03-06 18:55:12 -08:00
+								  #   "zai"        - Use z.ai / ZhipuAI GLM models (requires: GLM_API_KEY)
 								  #   "kimi-coding"- Use Kimi / Moonshot AI models (requires: KIMI_API_KEY)
 								  #   "minimax"    - Use MiniMax global endpoint (requires: MINIMAX_API_KEY)
 								  #   "minimax-cn" - Use MiniMax China endpoint (requires: MINIMAX_CN_API_KEY)
-												feat: add multi-provider authentication and inference provider selection

- Implemented a multi-provider authentication system for the Hermes Agent, supporting OAuth for Nous Portal and traditional API key methods for OpenRouter and custom endpoints.
- Enhanced CLI with commands for logging in and out of providers, allowing users to authenticate and manage their credentials easily.
- Updated configuration options to select inference providers, with detailed documentation on usage and setup.
- Improved status reporting to include authentication status and provider details, enhancing user awareness of their current configuration.
- Added new files for authentication handling and updated existing components to integrate the new provider system.

											
										
										
											2026-02-20 17:24:00 -08:00
+								  # Can also be overridden with --provider flag or HERMES_INFERENCE_PROVIDER env var.
 								  provider: "auto"
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								  # API configuration (falls back to OPENROUTER_API_KEY env var)
 								  # api_key: "your-key-here"  # Uncomment to set here instead of .env
 								  base_url: "https://openrouter.ai/api/v1"
-												feat(provider-routing): add OpenRouter provider routing configuration

Introduced a new `provider_routing` section in the CLI configuration to control how requests are routed across providers when using OpenRouter. This includes options for sorting providers by throughput, latency, or price, as well as allowing or ignoring specific providers, setting the order of provider attempts, and managing data collection policies. Updated relevant classes and documentation to support these features, enhancing flexibility in provider selection.

											
										
										
											2026-03-01 18:24:27 -08:00
+								# =============================================================================
 								# OpenRouter Provider Routing (only applies when using OpenRouter)
 								# =============================================================================
 								# Control how requests are routed across providers on OpenRouter.
 								# See: https://openrouter.ai/docs/guides/routing/provider-selection
 								#
 								# provider_routing:
 								#   # Sort strategy: "price" (default), "throughput", or "latency"
 								#   # Append :nitro to model name for a shortcut to throughput sorting.
 								#   sort: "throughput"
 								#
 								#   # Only allow these providers (provider slugs from OpenRouter)
 								#   # only: ["anthropic", "google"]
 								#
 								#   # Skip these providers entirely
 								#   # ignore: ["deepinfra", "fireworks"]
 								#
 								#   # Try providers in this order (overrides default load balancing)
 								#   # order: ["anthropic", "google", "together"]
 								#
 								#   # Require providers to support all parameters in your request
 								#   # require_parameters: true
 								#
 								#   # Data policy: "allow" (default) or "deny" to exclude providers that may store data
 								#   # data_collection: "deny"
-												fix: wire worktree flag into hermes CLI entry point + docs + tests

Critical fixes:
- Add --worktree/-w to hermes_cli/main.py argparse (both chat
  subcommand and top-level parser) so 'hermes -w' works via the
  actual CLI entry point, not just 'python cli.py -w'
- Pass worktree flag through cmd_chat() kwargs to cli_main()
- Handle worktree attr in bare 'hermes' and --resume/--continue paths

Bug fixes in cli.py:
- Skip worktree creation for --list-tools/--list-toolsets (wasteful)
- Wrap git worktree subprocess.run in try/except (crash on timeout)
- Add stale worktree pruning on startup (_prune_stale_worktrees):
  removes clean worktrees older than 24h left by crashed/killed sessions

Documentation updates:
- AGENTS.md: add --worktree to CLI commands table
- cli-config.yaml.example: add worktree config section
- website/docs/reference/cli-commands.md: add to core commands
- website/docs/user-guide/cli.md: add usage examples
- website/docs/user-guide/configuration.md: add config docs

Test improvements (17 → 31 tests):
- Stale worktree pruning (prune old clean, keep recent, keep dirty)
- Directory symlink via .worktreeinclude
- Edge cases (no commits, not a repo, pre-existing .worktrees/)
- CLI flag/config OR logic
- TERMINAL_CWD integration
- System prompt injection format

											
										
										
											2026-03-07 21:05:40 -08:00
+								# =============================================================================
 								# Git Worktree Isolation
 								# =============================================================================
 								# When enabled, each CLI session creates an isolated git worktree so multiple
 								# agents can work on the same repo concurrently without file collisions.
 								# Equivalent to always passing --worktree / -w on the command line.
 								#
 								# worktree: true    # Always create a worktree when in a git repo
 								# worktree: false   # Default — only create when -w flag is passed
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								# =============================================================================
 								# Terminal Tool Configuration
 								# =============================================================================
 								# Choose ONE of the following terminal configurations by uncommenting it.
 								# The terminal tool executes commands in the specified environment.
 								# -----------------------------------------------------------------------------
 								# OPTION 1: Local execution (default)
 								# Commands run directly on your machine in the current directory
 								# -----------------------------------------------------------------------------
-												Enhance messaging gateway configuration and security features

- Added new environment variables for Telegram and Discord bot configurations, including `TELEGRAM_ALLOWED_USERS` and `DISCORD_ALLOWED_USERS`, to restrict bot access to specific users.
- Updated documentation in AGENTS.md and README.md to include detailed setup instructions for the messaging gateway, emphasizing the importance of user allowlists for security.
- Improved the CLI setup wizard to prompt for allowed user IDs during configuration, enhancing user guidance and security awareness.
- Refined the gateway run script to support user authorization checks, ensuring only allowed users can interact with the bot.

											
										
										
											2026-02-03 10:46:23 -08:00
+								# Working directory behavior:
 								#   - CLI (`hermes` command): Uses "." (current directory where you run hermes)
 								#   - Messaging (Telegram/Discord): Uses MESSAGING_CWD from .env (default: home)
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								terminal:
-												Update docs to match backend key rename and CWD behavior

- cli-config.yaml.example: env_type → backend everywhere, matching the
  documented config key that hermes_cli/config.py and README already use
- cli-config.yaml.example: added comments clarifying cwd is a path
  INSIDE the target environment for non-local backends
- AGENTS.md: updated terminal.cwd description to explain "." only
  resolves to host CWD for the local backend
- .env.example: updated TERMINAL_CWD comment to warn against using
  host-local paths with remote backends, lists per-backend defaults

											
										
										
											2026-02-16 22:31:41 -08:00
+								  backend: "local"
 								  cwd: "."  # For local backend: "." = current directory. Ignored for remote backends.
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								  timeout: 180
 								  lifetime_seconds: 300
-												Implement sudo support across terminal environments

- Added support for sudo commands in local, Docker, Singularity, and SSH environments by introducing the `SUDO_PASSWORD` environment variable.
- Updated terminal tool configurations in `.env.example` and `cli-config.yaml.example` to document the new sudo functionality.
- Enhanced the command execution process to handle sudo commands gracefully, preventing hangs on interactive prompts and providing clear error messages when no password is configured.
- Updated `README.md` to include instructions for using sudo support and SSH backend configuration.
- Revised `TODO.md` to reflect the completion of the sudo feature and outline future enhancements.

											
										
										
											2026-02-01 10:02:34 -08:00
+								  # sudo_password: ""  # Enable sudo commands (pipes via sudo -S) - SECURITY WARNING: plaintext!
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
 								# -----------------------------------------------------------------------------
 								# OPTION 2: SSH remote execution
 								# Commands run on a remote server - agent code stays local (sandboxed)
 								# Great for: keeping agent isolated from its own code, using powerful remote hardware
 								# -----------------------------------------------------------------------------
 								# terminal:
-												Update docs to match backend key rename and CWD behavior

- cli-config.yaml.example: env_type → backend everywhere, matching the
  documented config key that hermes_cli/config.py and README already use
- cli-config.yaml.example: added comments clarifying cwd is a path
  INSIDE the target environment for non-local backends
- AGENTS.md: updated terminal.cwd description to explain "." only
  resolves to host CWD for the local backend
- .env.example: updated TERMINAL_CWD comment to warn against using
  host-local paths with remote backends, lists per-backend defaults

											
										
										
											2026-02-16 22:31:41 -08:00
+								#   backend: "ssh"
 								#   cwd: "/home/myuser/project"  # Path on the REMOTE server
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								#   timeout: 180
 								#   lifetime_seconds: 300
 								#   ssh_host: "my-server.example.com"
 								#   ssh_user: "myuser"
 								#   ssh_port: 22
 								#   ssh_key: "~/.ssh/id_rsa"  # Optional - uses ssh-agent if not specified
 								# -----------------------------------------------------------------------------
 								# OPTION 3: Docker container
 								# Commands run in an isolated Docker container
 								# Great for: reproducible environments, testing, isolation
 								# -----------------------------------------------------------------------------
 								# terminal:
-												Update docs to match backend key rename and CWD behavior

- cli-config.yaml.example: env_type → backend everywhere, matching the
  documented config key that hermes_cli/config.py and README already use
- cli-config.yaml.example: added comments clarifying cwd is a path
  INSIDE the target environment for non-local backends
- AGENTS.md: updated terminal.cwd description to explain "." only
  resolves to host CWD for the local backend
- .env.example: updated TERMINAL_CWD comment to warn against using
  host-local paths with remote backends, lists per-backend defaults

											
										
										
											2026-02-16 22:31:41 -08:00
+								#   backend: "docker"
 								#   cwd: "/workspace"  # Path INSIDE the container (default: /)
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								#   timeout: 180
 								#   lifetime_seconds: 300
-												Update terminal configuration and enhance CLI model management

- Changed default Docker, Singularity, and Modal images in configuration files to use "nikolaik/python-nodejs:python3.11-nodejs20" for improved compatibility.
- Updated the default model in the configuration to "anthropic/claude-sonnet-4.5" and adjusted related setup prompts for API provider configuration.
- Introduced a new CLI option for selecting a custom OpenAI-compatible endpoint, enhancing flexibility in model provider setup.
- Enhanced the prompt choice functionality to support arrow key navigation for better user experience in CLI interactions.
- Updated documentation in relevant files to reflect these changes and improve user guidance.

											
										
										
											2026-02-02 19:13:41 -08:00
+								#   docker_image: "nikolaik/python-nodejs:python3.11-nodejs20"
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
 								# -----------------------------------------------------------------------------
 								# OPTION 4: Singularity/Apptainer container
 								# Commands run in a Singularity container (common in HPC environments)
 								# Great for: HPC clusters, shared compute environments
 								# -----------------------------------------------------------------------------
 								# terminal:
-												Update docs to match backend key rename and CWD behavior

- cli-config.yaml.example: env_type → backend everywhere, matching the
  documented config key that hermes_cli/config.py and README already use
- cli-config.yaml.example: added comments clarifying cwd is a path
  INSIDE the target environment for non-local backends
- AGENTS.md: updated terminal.cwd description to explain "." only
  resolves to host CWD for the local backend
- .env.example: updated TERMINAL_CWD comment to warn against using
  host-local paths with remote backends, lists per-backend defaults

											
										
										
											2026-02-16 22:31:41 -08:00
+								#   backend: "singularity"
 								#   cwd: "/workspace"  # Path INSIDE the container (default: /root)
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								#   timeout: 180
 								#   lifetime_seconds: 300
-												Update terminal configuration and enhance CLI model management

- Changed default Docker, Singularity, and Modal images in configuration files to use "nikolaik/python-nodejs:python3.11-nodejs20" for improved compatibility.
- Updated the default model in the configuration to "anthropic/claude-sonnet-4.5" and adjusted related setup prompts for API provider configuration.
- Introduced a new CLI option for selecting a custom OpenAI-compatible endpoint, enhancing flexibility in model provider setup.
- Enhanced the prompt choice functionality to support arrow key navigation for better user experience in CLI interactions.
- Updated documentation in relevant files to reflect these changes and improve user guidance.

											
										
										
											2026-02-02 19:13:41 -08:00
+								#   singularity_image: "docker://nikolaik/python-nodejs:python3.11-nodejs20"
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
 								# -----------------------------------------------------------------------------
 								# OPTION 5: Modal cloud execution
 								# Commands run on Modal's cloud infrastructure
 								# Great for: GPU access, scalable compute, serverless execution
 								# -----------------------------------------------------------------------------
 								# terminal:
-												Update docs to match backend key rename and CWD behavior

- cli-config.yaml.example: env_type → backend everywhere, matching the
  documented config key that hermes_cli/config.py and README already use
- cli-config.yaml.example: added comments clarifying cwd is a path
  INSIDE the target environment for non-local backends
- AGENTS.md: updated terminal.cwd description to explain "." only
  resolves to host CWD for the local backend
- .env.example: updated TERMINAL_CWD comment to warn against using
  host-local paths with remote backends, lists per-backend defaults

											
										
										
											2026-02-16 22:31:41 -08:00
+								#   backend: "modal"
 								#   cwd: "/workspace"  # Path INSIDE the sandbox (default: /root)
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								#   timeout: 180
 								#   lifetime_seconds: 300
-												Update terminal configuration and enhance CLI model management

- Changed default Docker, Singularity, and Modal images in configuration files to use "nikolaik/python-nodejs:python3.11-nodejs20" for improved compatibility.
- Updated the default model in the configuration to "anthropic/claude-sonnet-4.5" and adjusted related setup prompts for API provider configuration.
- Introduced a new CLI option for selecting a custom OpenAI-compatible endpoint, enhancing flexibility in model provider setup.
- Enhanced the prompt choice functionality to support arrow key navigation for better user experience in CLI interactions.
- Updated documentation in relevant files to reflect these changes and improve user guidance.

											
										
										
											2026-02-02 19:13:41 -08:00
+								#   modal_image: "nikolaik/python-nodejs:python3.11-nodejs20"
-												feat(cli): add Daytona to setup wizard, doctor, and status display

Add Daytona as a backend choice in the interactive setup wizard with
SDK installation and API key prompts. Show Daytona image in status
output and validate API key + SDK in doctor checks. Add OPTION 6
example in cli-config.yaml.example.

Signed-off-by: rovle <lovre.pesut@gmail.com>

											
										
										
											2026-03-05 00:44:39 -08:00
 								# -----------------------------------------------------------------------------
 								# OPTION 6: Daytona cloud execution
 								# Commands run in Daytona cloud sandboxes
 								# Great for: Cloud dev environments, persistent workspaces, team collaboration
 								# Requires: pip install daytona, DAYTONA_API_KEY env var
 								# -----------------------------------------------------------------------------
 								# terminal:
 								#   backend: "daytona"
-												docs(config): add Daytona disk limit hint and fix default cwd in example

Signed-off-by: rovle <lovre.pesut@gmail.com>

											
										
										
											2026-03-05 01:11:55 -08:00
+								#   cwd: "~"
-												feat(cli): add Daytona to setup wizard, doctor, and status display

Add Daytona as a backend choice in the interactive setup wizard with
SDK installation and API key prompts. Show Daytona image in status
output and validate API key + SDK in doctor checks. Add OPTION 6
example in cli-config.yaml.example.

Signed-off-by: rovle <lovre.pesut@gmail.com>

											
										
										
											2026-03-05 00:44:39 -08:00
+								#   timeout: 180
 								#   lifetime_seconds: 300
 								#   daytona_image: "nikolaik/python-nodejs:python3.11-nodejs20"
-												docs(config): add Daytona disk limit hint and fix default cwd in example

Signed-off-by: rovle <lovre.pesut@gmail.com>

											
										
										
											2026-03-05 01:11:55 -08:00
+								#   container_disk: 10240          # Daytona max is 10GB per sandbox
-												feat(cli): add Daytona to setup wizard, doctor, and status display

Add Daytona as a backend choice in the interactive setup wizard with
SDK installation and API key prompts. Show Daytona image in status
output and validate API key + SDK in doctor checks. Add OPTION 6
example in cli-config.yaml.example.

Signed-off-by: rovle <lovre.pesut@gmail.com>

											
										
										
											2026-03-05 00:44:39 -08:00
-												feat: enhance interrupt handling and container resource configuration

- Introduced a shared interrupt signaling mechanism to allow tools to check for user interrupts during long-running operations.
- Updated the AIAgent to handle interrupts more effectively, ensuring in-progress tool calls are canceled and multiple interrupt messages are combined into one prompt.
- Enhanced the CLI configuration to include container resource limits (CPU, memory, disk) and persistence options for Docker, Singularity, and Modal environments.
- Improved documentation to clarify interrupt behaviors and container resource settings, providing users with better guidance on configuration and usage.

											
										
										
											2026-02-23 02:11:33 -08:00
+								#
-												feat(cli): add Daytona to setup wizard, doctor, and status display

Add Daytona as a backend choice in the interactive setup wizard with
SDK installation and API key prompts. Show Daytona image in status
output and validate API key + SDK in doctor checks. Add OPTION 6
example in cli-config.yaml.example.

Signed-off-by: rovle <lovre.pesut@gmail.com>

											
										
										
											2026-03-05 00:44:39 -08:00
+								# --- Container resource limits (docker, singularity, modal, daytona -- ignored for local/ssh) ---
-												feat: enhance interrupt handling and container resource configuration

- Introduced a shared interrupt signaling mechanism to allow tools to check for user interrupts during long-running operations.
- Updated the AIAgent to handle interrupts more effectively, ensuring in-progress tool calls are canceled and multiple interrupt messages are combined into one prompt.
- Enhanced the CLI configuration to include container resource limits (CPU, memory, disk) and persistence options for Docker, Singularity, and Modal environments.
- Improved documentation to clarify interrupt behaviors and container resource settings, providing users with better guidance on configuration and usage.

											
										
										
											2026-02-23 02:11:33 -08:00
+								# These settings apply to all container backends. They control the resources
 								# allocated to the sandbox and whether its filesystem persists across sessions.
-												feat: add container resource configuration prompts in setup wizard

Introduced interactive prompts for configuring container resource settings (CPU, memory, disk, persistence) during the setup wizard. Updated the default configuration to include these settings and improved user guidance on their implications for Docker, Singularity, and Modal backends. This enhancement aims to streamline the setup process and provide users with clearer options for resource management.

											
										
										
											2026-03-04 03:29:05 -08:00
+								  container_cpu: 1              # CPU cores
 								  container_memory: 5120        # Memory in MB (5120 = 5GB)
 								  container_disk: 51200         # Disk in MB (51200 = 50GB)
 								  container_persistent: true    # Persist filesystem across sessions (false = ephemeral)
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
-												Implement sudo support across terminal environments

- Added support for sudo commands in local, Docker, Singularity, and SSH environments by introducing the `SUDO_PASSWORD` environment variable.
- Updated terminal tool configurations in `.env.example` and `cli-config.yaml.example` to document the new sudo functionality.
- Enhanced the command execution process to handle sudo commands gracefully, preventing hangs on interactive prompts and providing clear error messages when no password is configured.
- Updated `README.md` to include instructions for using sudo support and SSH backend configuration.
- Revised `TODO.md` to reflect the completion of the sudo feature and outline future enhancements.

											
										
										
											2026-02-01 10:02:34 -08:00
+								# -----------------------------------------------------------------------------
 								# SUDO SUPPORT (works with ALL backends above)
 								# -----------------------------------------------------------------------------
 								# Add sudo_password to any terminal config above to enable sudo commands.
 								# The password is piped via `sudo -S`. Works with local, ssh, docker, etc.
 								#
 								# SECURITY WARNING: Password stored in plaintext!
 								#
-												Enhance session logging and interactive sudo support

- Implemented automatic session logging, saving conversation trajectories to the `logs/` directory in JSON format, with each session having a unique identifier.
- Updated the CLI to display the session ID in the welcome banner for easy reference.
- Introduced an interactive sudo password prompt in CLI mode, allowing users to enter their password with a 45-second timeout, enhancing user experience during command execution.
- Documented session logging and interactive sudo features in `README.md`, `cli.md`, and `cli-config.yaml.example` for better user guidance.

											
										
										
											2026-02-01 15:36:26 -08:00
+								# INTERACTIVE PROMPT: If no sudo_password is set and the CLI is running,
 								# you'll be prompted to enter your password when sudo is needed:
 								# - 45-second timeout (auto-skips if no input)
 								# - Press Enter to skip (command fails gracefully)
 								# - Password is hidden while typing
 								# - Password is cached for the session
 								#
-												Implement sudo support across terminal environments

- Added support for sudo commands in local, Docker, Singularity, and SSH environments by introducing the `SUDO_PASSWORD` environment variable.
- Updated terminal tool configurations in `.env.example` and `cli-config.yaml.example` to document the new sudo functionality.
- Enhanced the command execution process to handle sudo commands gracefully, preventing hangs on interactive prompts and providing clear error messages when no password is configured.
- Updated `README.md` to include instructions for using sudo support and SSH backend configuration.
- Revised `TODO.md` to reflect the completion of the sudo feature and outline future enhancements.

											
										
										
											2026-02-01 10:02:34 -08:00
+								# ALTERNATIVES:
 								# - SSH backend: Configure passwordless sudo on the remote server
 								# - Containers: Run as root inside the container (no sudo needed)
 								# - Local: Configure /etc/sudoers for specific commands
 								#
 								# Example (add to your terminal section):
 								#   sudo_password: "your-password-here"
 								# =============================================================================
 								# Browser Tool Configuration
 								# =============================================================================
 								browser:
 								  # Inactivity timeout in seconds - browser sessions are automatically closed
 								  # after this period of no activity between agent loops (default: 120 = 2 minutes)
 								  inactivity_timeout: 120
-												Add context compression feature for long conversations

- Implemented automatic context compression to manage long conversations that approach the model's context limit.
- Configured the feature to summarize middle turns while protecting the first three and last four turns, ensuring important context is retained.
- Added configuration options in `cli-config.yaml` and environment variables for enabling/disabling compression and setting thresholds.
- Updated documentation in `README.md`, `cli.md`, and `.env.example` to explain the context compression functionality and its configuration.
- Enhanced the `cli.py` to load compression settings into environment variables, ensuring seamless integration with the CLI.
- Completed the implementation of context compression as outlined in the TODO list, marking it as a significant enhancement to conversation management.

											
										
										
											2026-02-01 18:01:31 -08:00
+								# =============================================================================
 								# Context Compression (Auto-shrinks long conversations)
 								# =============================================================================
 								# When a conversation approaches the model's context limit, middle turns are
 								# automatically summarized to free up space while preserving important context.
 								#
 								# HOW IT WORKS:
 								# 1. Tracks actual token usage from API responses (not estimates)
 								# 2. When prompt_tokens >= threshold (a fraction, e.g. 0.85) of the model's context_length, triggers compression
 								# 3. Protects first 3 turns (system prompt, initial request, first response)
 								# 4. Protects last 4 turns (recent context is most relevant)
 								# 5. Summarizes middle turns using a fast/cheap model
 								# 6. Inserts summary as a user message, continues conversation seamlessly
 								#
 								compression:
 								  # Enable automatic context compression (default: true)
 								  # Set to false if you prefer to manage context manually or want errors on overflow
 								  enabled: true
 								  # Trigger compression at this fraction of the model's context limit (default: 0.85 = 85%)
 								  # Lower values = more aggressive compression, higher values = compress later
 								  threshold: 0.85
 								  # Model to use for generating summaries (fast/cheap recommended)
-												feat: enhance auxiliary model configuration and environment variable handling

- Added support for auxiliary model overrides in the configuration, allowing users to specify providers and models for vision and web extraction tasks.
- Updated the CLI configuration example to include new auxiliary model settings.
- Enhanced the environment variable mapping in the CLI to accommodate auxiliary model configurations.
- Improved the resolution logic for auxiliary clients to support task-specific provider overrides.
- Updated relevant documentation and comments for clarity on the new features and their usage.

											
										
										
											2026-03-07 08:52:06 -08:00
+								  # This model compresses the middle turns into a concise summary.
 								  # IMPORTANT: it receives the full middle section of the conversation, so it
 								  # MUST support a context length at least as large as your main model's.
-												Enhance BatchRunner and AIAgent with new configuration options, default model now opus 4.6, default summarizer gemini flash 3

- Added `max_tokens`, `reasoning_config`, and `prefill_messages` parameters to `BatchRunner` and `AIAgent` for improved model response control.
- Updated CLI to support new options for reasoning effort and prefill messages from a JSON file.
- Modified example configuration files to reflect changes in default model and summary model.
- Improved error handling for loading prefill messages and reasoning configurations in the CLI.
- Updated documentation to include new parameters and usage examples.

											
										
										
											2026-02-08 10:49:24 +00:00
+								  summary_model: "google/gemini-3-flash-preview"
-												feat: enhance auxiliary model configuration and environment variable handling

- Added support for auxiliary model overrides in the configuration, allowing users to specify providers and models for vision and web extraction tasks.
- Updated the CLI configuration example to include new auxiliary model settings.
- Enhanced the environment variable mapping in the CLI to accommodate auxiliary model configurations.
- Improved the resolution logic for auxiliary clients to support task-specific provider overrides.
- Updated relevant documentation and comments for clarity on the new features and their usage.

											
										
										
											2026-03-07 08:52:06 -08:00
 								  # Provider for the summary model (default: "auto")
 								  # Options: "auto", "openrouter", "nous", "main"
 								  # summary_provider: "auto"
 								# =============================================================================
 								# Auxiliary Models (Advanced — Experimental)
 								# =============================================================================
 								# Hermes uses lightweight "auxiliary" models for side tasks: image analysis,
 								# browser screenshot analysis, web page summarization, and context compression.
 								#
 								# By default these use Gemini Flash via OpenRouter or Nous Portal and are
 								# auto-detected from your credentials.  You do NOT need to change anything
 								# here for normal usage.
 								#
 								# WARNING: Overriding these with providers other than OpenRouter or Nous Portal
 								# is EXPERIMENTAL and may not work.  Not all models/providers support vision,
 								# produce usable summaries, or accept the same API format.  Change at your own
 								# risk — if things break, reset to "auto" / empty values.
 								#
 								# Each task has its own provider + model pair so you can mix providers.
 								# For example: OpenRouter for vision (needs multimodal), but your main
 								# local endpoint for compression (just needs text).
 								#
 								# Provider options:
 								#   "auto"       - Best available: OpenRouter → Nous Portal → main endpoint (default)
 								#   "openrouter" - Force OpenRouter (requires OPENROUTER_API_KEY)
 								#   "nous"       - Force Nous Portal (requires: hermes login)
-												refactor: remove redundant 'openai' auxiliary provider, clean up docs

The 'openai' provider was redundant — using OPENAI_BASE_URL +
OPENAI_API_KEY with provider: 'main' already covers direct OpenAI API.

Provider options are now: auto, openrouter, nous, codex, main.

- Removed _try_openai(), _OPENAI_AUX_MODEL, _OPENAI_BASE_URL
- Replaced openai tests with codex provider tests
- Updated all docs to remove 'openai' option and clarify 'main'
- 'main' description now explicitly mentions it works with OpenAI API,
  local models, and any OpenAI-compatible endpoint

Tests: 2467 passed.

											
										
										
											2026-03-08 18:50:26 -07:00
+								#   "codex"      - Force Codex OAuth (requires: hermes model → Codex).
 								#                  Uses gpt-5.3-codex which supports vision.
 								#   "main"       - Use your custom endpoint (OPENAI_BASE_URL + OPENAI_API_KEY).
 								#                  Works with OpenAI API, local models, or any OpenAI-compatible
 								#                  endpoint.  Also falls back to Codex OAuth and API-key providers.
-												feat: enhance auxiliary model configuration and environment variable handling

- Added support for auxiliary model overrides in the configuration, allowing users to specify providers and models for vision and web extraction tasks.
- Updated the CLI configuration example to include new auxiliary model settings.
- Enhanced the environment variable mapping in the CLI to accommodate auxiliary model configurations.
- Improved the resolution logic for auxiliary clients to support task-specific provider overrides.
- Updated relevant documentation and comments for clarity on the new features and their usage.

											
										
										
											2026-03-07 08:52:06 -08:00
+								#
 								# Model: leave empty to use the provider's default.  When empty, OpenRouter
 								# uses "google/gemini-3-flash-preview" and Nous uses "gemini-3-flash".
 								# Other providers pick a sensible default automatically.
 								#
 								# auxiliary:
 								#   # Image analysis: vision_analyze tool + browser screenshots
 								#   vision:
 								#     provider: "auto"
 								#     model: ""              # e.g. "google/gemini-2.5-flash", "openai/gpt-4o"
 								#
 								#   # Web page scraping / summarization + browser page text extraction
 								#   web_extract:
 								#     provider: "auto"
 								#     model: ""
-												Add context compression feature for long conversations

- Implemented automatic context compression to manage long conversations that approach the model's context limit.
- Configured the feature to summarize middle turns while protecting the first three and last four turns, ensuring important context is retained.
- Added configuration options in `cli-config.yaml` and environment variables for enabling/disabling compression and setting thresholds.
- Updated documentation in `README.md`, `cli.md`, and `.env.example` to explain the context compression functionality and its configuration.
- Enhanced the `cli.py` to load compression settings into environment variables, ensuring seamless integration with the CLI.
- Completed the implementation of context compression as outlined in the TODO list, marking it as a significant enhancement to conversation management.

											
										
										
											2026-02-01 18:01:31 -08:00
-												feat: add persistent memory system + SQLite session store

Two-part implementation:

Part A - Curated Bounded Memory:
- New memory tool (tools/memory_tool.py) with MEMORY.md + USER.md stores
- Character-limited (2200/1375 chars), § delimited entries
- Frozen snapshot injected into system prompt at session start
- Model manages pruning via replace/remove with substring matching
- Usage indicator shown in system prompt header

Part B - SQLite Session Store:
- New hermes_state.py with SessionDB class, FTS5 full-text search
- Gateway session.py rewritten to dual-write SQLite + legacy JSONL
- Compression-triggered session splitting with parent_session_id chains
- New session_search tool with Gemini Flash summarization of matched sessions
- CLI session lifecycle (create on launch, close on exit)

Also:
- System prompt now cached per session, only rebuilt on compression
  (fixes prefix cache invalidation from date/time changes every turn)
- Config version bumped to 3, hermes doctor checks for new artifacts
- Disabled in batch_runner and RL environments

											
										
										
											2026-02-19 00:57:31 -08:00
+								# =============================================================================
 								# Persistent Memory
 								# =============================================================================
 								# Bounded curated memory injected into the system prompt every session.
 								# Two stores: MEMORY.md (agent's notes) and USER.md (user profile).
 								# Character limits keep the memory small and focused. The agent manages
 								# pruning -- when at the limit, it must consolidate or replace entries.
 								# Disabled by default in batch_runner and RL environments.
 								#
 								memory:
 								  # Agent's personal notes: environment facts, conventions, things learned
 								  memory_enabled: true
 								  # User profile: preferences, communication style, expectations
 								  user_profile_enabled: true
 								  # Character limits (~2.75 chars per token, model-independent)
 								  memory_char_limit: 2200   # ~800 tokens
 								  user_char_limit: 1375     # ~500 tokens
-												feat: enhance memory management features in AIAgent and CLI

- Added configuration options for memory nudge interval and flush minimum turns in cli-config.yaml.example.
- Implemented memory flushing before conversation reset, clearing, and exit in the CLI to ensure memories are saved.
- Introduced a flush_memories method in AIAgent to handle memory persistence before context loss.
- Added periodic nudges to remind the agent to consider saving memories based on user interactions.

											
										
										
											2026-02-22 10:15:17 -08:00
+								  # Periodic memory nudge: remind the agent to consider saving memories
 								  # every N user turns. Set to 0 to disable. Only active when memory is enabled.
 								  nudge_interval: 10        # Nudge every 10 user turns (0 = disabled)
 								  # Memory flush: give the agent one turn to save memories before context is
 								  # lost (compression, /new, /reset, exit). Set to 0 to disable.
 								  # For exit/reset, only fires if the session had at least this many user turns.
 								  flush_min_turns: 6        # Min user turns to trigger flush on exit/reset (0 = disabled)
-												feat(session): implement session reset policy for messaging platforms

- Added configuration options for automatic session resets based on inactivity or daily boundaries in cli-config.yaml.
- Enhanced SessionResetPolicy class to support a "none" mode for no auto-resets.
- Implemented memory flushing before session resets in SessionStore to preserve important information.
- Updated setup wizard to guide users in configuring session reset preferences.

											
										
										
											2026-02-26 21:20:50 -08:00
+								# =============================================================================
 								# Session Reset Policy (Messaging Platforms)
 								# =============================================================================
 								# Controls when messaging sessions (Telegram, Discord, WhatsApp, Slack) are
 								# automatically cleared. Without resets, conversation context grows indefinitely,
 								# which increases API costs with every message.
 								#
 								# When a reset triggers, the agent first saves important information to its
 								# persistent memory — but the conversation context is wiped. The agent starts
 								# fresh but retains learned facts via its memory system.
 								#
 								# Users can always manually reset with /reset or /new in chat.
 								#
 								# Modes:
 								#   "both"  - Reset on EITHER inactivity timeout or daily boundary (recommended)
 								#   "idle"  - Reset only after N minutes of inactivity
 								#   "daily" - Reset only at a fixed hour each day
 								#   "none"  - Never auto-reset; context lives until /reset or compression kicks in
 								#
 								# When a reset triggers, the agent gets one turn to save important memories and
 								# skills before the context is wiped. Persistent memory carries across sessions.
 								#
 								session_reset:
 								  mode: both           # "both", "idle", "daily", or "none"
 								  idle_minutes: 1440   # Inactivity timeout in minutes (default: 1440 = 24 hours)
 								  at_hour: 4           # Daily reset hour, 0-23 local time (default: 4 AM)
-												feat: introduce skills management features in AIAgent and CLI

- Added skills configuration options in cli-config.yaml.example, including a nudge interval for skill creation reminders.
- Implemented skills guidance in AIAgent to prompt users to save reusable workflows after complex tasks.
- Enhanced skills indexing in the prompt builder to include descriptions from SKILL.md files for better context.
- Updated the agent's behavior to periodically remind users about potential skills during tool-calling iterations.

											
										
										
											2026-02-22 13:28:13 -08:00
+								# =============================================================================
 								# Skills Configuration
 								# =============================================================================
 								# Skills are reusable procedures the agent can load and follow. The agent can
 								# also create new skills after completing complex tasks.
 								#
 								skills:
 								  # Nudge the agent to create skills after complex tasks.
 								  # Every N tool-calling iterations, remind the model to consider saving a skill.
 								  # Set to 0 to disable.
 								  creation_nudge_interval: 15
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								# =============================================================================
 								# Agent Behavior
 								# =============================================================================
 								agent:
-												Update agent configuration for maximum tool-calling iterations

- Increased the default maximum tool-calling iterations from 20 to 60 in the CLI configuration and related files, allowing for more complex tasks.
- Updated documentation and comments to reflect the new recommended range for iterations, enhancing user guidance.
- Implemented backward compatibility for loading max iterations from the root-level configuration, ensuring a smooth transition for existing users.
- Adjusted the setup wizard to prompt for the maximum iterations setting, improving user experience during configuration.

											
										
										
											2026-02-03 14:48:19 -08:00
+								  # Maximum tool-calling iterations per conversation
 								  # Higher = more room for complex tasks, but costs more tokens
 								  # Recommended: 20-30 for focused tasks, 50-100 for open exploration
 								  max_turns: 60
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
 								  # Enable verbose logging
 								  verbose: false
-												feat: add reasoning effort configuration for agent

- Introduced a new configuration option for reasoning effort in the CLI, allowing users to specify the level of reasoning the agent should perform before responding.
- Updated the CLI and agent initialization to incorporate the reasoning configuration, enhancing the agent's responsiveness and adaptability.
- Implemented logic to load reasoning effort from environment variables and configuration files, providing flexibility in agent behavior.
- Enhanced the documentation in the example configuration file to clarify the new reasoning effort options available.

											
										
										
											2026-02-24 03:30:19 -08:00
+								  # Reasoning effort level (OpenRouter and Nous Portal)
 								  # Controls how much "thinking" the model does before responding.
 								  # Options: "xhigh" (max), "high", "medium", "low", "minimal", "none" (disable)
-												feat: default reasoning effort from xhigh to medium

Reduces token usage and latency for most tasks by defaulting to
medium reasoning effort instead of xhigh. Users can still override
via config or CLI flag. Updates code, tests, example config, and docs.

											
										
										
											2026-03-07 10:14:19 -08:00
+								  reasoning_effort: "medium"
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
 								  # Predefined personalities (use with /personality command)
 								  personalities:
 								    helpful: "You are a helpful, friendly AI assistant."
 								    concise: "You are a concise assistant. Keep responses brief and to the point."
 								    technical: "You are a technical expert. Provide detailed, accurate technical information."
 								    creative: "You are a creative assistant. Think outside the box and offer innovative solutions."
 								    teacher: "You are a patient teacher. Explain concepts clearly with examples."
 								    kawaii: "You are a kawaii assistant! Use cute expressions like (◕‿◕), ★, ♪, and ~! Add sparkles and be super enthusiastic about everything! Every response should feel warm and adorable desu~! ヽ(>∀<☆)ノ"
 								    catgirl: "You are Neko-chan, an anime catgirl AI assistant, nya~! Add 'nya' and cat-like expressions to your speech. Use kaomoji like (=^･ω･^=) and ฅ^•ﻌ•^ฅ. Be playful and curious like a cat, nya~!"
 								    pirate: "Arrr! Ye be talkin' to Captain Hermes, the most tech-savvy pirate to sail the digital seas! Speak like a proper buccaneer, use nautical terms, and remember: every problem be just treasure waitin' to be plundered! Yo ho ho!"
 								    shakespeare: "Hark! Thou speakest with an assistant most versed in the bardic arts. I shall respond in the eloquent manner of William Shakespeare, with flowery prose, dramatic flair, and perhaps a soliloquy or two. What light through yonder terminal breaks?"
 								    surfer: "Duuude! You're chatting with the chillest AI on the web, bro! Everything's gonna be totally rad. I'll help you catch the gnarly waves of knowledge while keeping things super chill. Cowabunga! 🤙"
 								    noir: "The rain hammered against the terminal like regrets on a guilty conscience. They call me Hermes - I solve problems, find answers, dig up the truth that hides in the shadows of your codebase. In this city of silicon and secrets, everyone's got something to hide. What's your story, pal?"
 								    uwu: "hewwo! i'm your fwiendwy assistant uwu~ i wiww twy my best to hewp you! *nuzzles your code* OwO what's this? wet me take a wook! i pwomise to be vewy hewpful >w<"
 								    philosopher: "Greetings, seeker of wisdom. I am an assistant who contemplates the deeper meaning behind every query. Let us examine not just the 'how' but the 'why' of your questions. Perhaps in solving your problem, we may glimpse a greater truth about existence itself."
 								    hype: "YOOO LET'S GOOOO!!! 🔥🔥🔥 I am SO PUMPED to help you today! Every question is AMAZING and we're gonna CRUSH IT together! This is gonna be LEGENDARY! ARE YOU READY?! LET'S DO THIS! 💪😤🚀"
 								# =============================================================================
 								# Toolsets
 								# =============================================================================
 								# Control which tools the agent has access to.
 								# Use "all" to enable everything, or specify individual toolsets.
-												Enhance platform toolset configuration and CLI toolset handling

- Introduced a new configuration section in `cli-config.yaml.example` for defining platform-specific toolsets, allowing for greater customization of available tools per platform.
- Updated the CLI to check for user-defined toolsets in the configuration, falling back to the default `hermes-cli` toolset if none are specified.
- Enhanced the `GatewayRunner` class to load platform-specific toolsets from the configuration, ensuring that the correct tools are enabled based on the platform being used.

											
										
										
											2026-02-17 23:39:24 -08:00
+								# =============================================================================
 								# Platform Toolsets (per-platform tool configuration)
 								# =============================================================================
 								# Override which toolsets are available on each platform.
 								# If a platform isn't listed here, its built-in default is used.
 								#
 								# You can use EITHER:
 								#   - A preset like "hermes-cli" or "hermes-telegram" (curated tool set)
 								#   - A list of individual toolsets to compose your own (see list below)
 								#
 								# Supported platform keys: cli, telegram, discord, whatsapp, slack, signal, homeassistant
 								#
 								# Examples:
 								#
 								#   # Use presets (same as defaults):
 								#   platform_toolsets:
 								#     cli: [hermes-cli]
 								#     telegram: [hermes-telegram]
 								#
 								#   # Custom: give Telegram only web + terminal + file + planning:
 								#   platform_toolsets:
 								#     telegram: [web, terminal, file, todo]
 								#
 								#   # Custom: CLI without browser or image gen:
 								#   platform_toolsets:
 								#     cli: [web, terminal, file, skills, todo, tts, cronjob]
 								#
 								#   # Restrictive: Discord gets read-only tools only:
 								#   platform_toolsets:
 								#     discord: [web, vision, skills, todo]
 								#
 								# If not set, defaults are:
-												fix: add missing Platform.SIGNAL to toolset mappings, update test + config docs

Platform.SIGNAL was missing from default_toolset_map and platform_config_key
in gateway/run.py, causing Signal to silently fall back to hermes-telegram
toolset (same bug as HomeAssistant, fixed in PR #538).

Also updates:
- tests/test_toolsets.py: include hermes-signal and hermes-homeassistant in
  the platform core-tools consistency check
- cli-config.yaml.example: document signal and homeassistant platform keys

											
										
										
											2026-03-09 23:27:19 -07:00
+								#   cli:           hermes-cli            (everything + cronjob management)
 								#   telegram:      hermes-telegram       (terminal, file, web, vision, image_gen, tts, browser, skills, todo, cronjob, messaging)
 								#   discord:       hermes-discord        (same as telegram)
 								#   whatsapp:      hermes-whatsapp       (same as telegram)
 								#   slack:         hermes-slack          (same as telegram)
 								#   signal:        hermes-signal         (same as telegram)
 								#   homeassistant: hermes-homeassistant  (same as telegram)
-												Enhance platform toolset configuration and CLI toolset handling

- Introduced a new configuration section in `cli-config.yaml.example` for defining platform-specific toolsets, allowing for greater customization of available tools per platform.
- Updated the CLI to check for user-defined toolsets in the configuration, falling back to the default `hermes-cli` toolset if none are specified.
- Enhanced the `GatewayRunner` class to load platform-specific toolsets from the configuration, ensuring that the correct tools are enabled based on the platform being used.

											
										
										
											2026-02-17 23:39:24 -08:00
+								#
 								platform_toolsets:
 								  cli: [hermes-cli]
 								  telegram: [hermes-telegram]
 								  discord: [hermes-discord]
 								  whatsapp: [hermes-whatsapp]
 								  slack: [hermes-slack]
-												fix: add missing Platform.SIGNAL to toolset mappings, update test + config docs

Platform.SIGNAL was missing from default_toolset_map and platform_config_key
in gateway/run.py, causing Signal to silently fall back to hermes-telegram
toolset (same bug as HomeAssistant, fixed in PR #538).

Also updates:
- tests/test_toolsets.py: include hermes-signal and hermes-homeassistant in
  the platform core-tools consistency check
- cli-config.yaml.example: document signal and homeassistant platform keys

											
										
										
											2026-03-09 23:27:19 -07:00
+								  signal: [hermes-signal]
 								  homeassistant: [hermes-homeassistant]
-												Enhance platform toolset configuration and CLI toolset handling

- Introduced a new configuration section in `cli-config.yaml.example` for defining platform-specific toolsets, allowing for greater customization of available tools per platform.
- Updated the CLI to check for user-defined toolsets in the configuration, falling back to the default `hermes-cli` toolset if none are specified.
- Enhanced the `GatewayRunner` class to load platform-specific toolsets from the configuration, ensuring that the correct tools are enabled based on the platform being used.

											
										
										
											2026-02-17 23:39:24 -08:00
 								# ─────────────────────────────────────────────────────────────────────────────
 								# Available toolsets (use these names in platform_toolsets or the toolsets list)
 								#
 								# Run `hermes chat --list-toolsets` to see all toolsets and their tools.
 								# Run `hermes chat --list-tools` to see every individual tool with descriptions.
 								# ─────────────────────────────────────────────────────────────────────────────
 								#
 								# INDIVIDUAL TOOLSETS (compose your own):
 								#   web          - web_search, web_extract
 								#   search       - web_search only (no scraping)
 								#   terminal     - terminal, process
 								#   file         - read_file, write_file, patch, search
 								#   browser      - browser_navigate, browser_snapshot, browser_click, browser_type,
 								#                  browser_scroll, browser_back, browser_press, browser_close,
 								#                  browser_get_images, browser_vision  (requires BROWSERBASE_API_KEY)
 								#   vision       - vision_analyze  (requires OPENROUTER_API_KEY)
 								#   image_gen    - image_generate  (requires FAL_KEY)
 								#   skills       - skills_list, skill_view
-												Add Skills Hub — universal skill search, install, and management from online registries

Implements the Hermes Skills Hub with agentskills.io spec compliance,
multi-registry skill discovery, security scanning, and user-driven
management via CLI and /skills slash command.

Core features:
- Security scanner (tools/skills_guard.py): 120 threat patterns across
  12 categories, trust-aware install policy (builtin/trusted/community),
  structural checks, unicode injection detection, LLM audit pass
- Hub client (tools/skills_hub.py): GitHub, ClawHub, Claude Code
  marketplace, and LobeHub source adapters with shared GitHubAuth
  (PAT + gh CLI + GitHub App), lock file provenance tracking, quarantine
  flow, and unified search across all sources
- CLI interface (hermes_cli/skills_hub.py): search, install, inspect,
  list, audit, uninstall, publish (GitHub PR), snapshot export/import,
  and tap management — powers both `hermes skills` and `/skills`

Spec conformance (Phase 0):
- Upgraded frontmatter parser to yaml.safe_load with fallback
- Migrated 39 SKILL.md files: tags/related_skills to metadata.hermes.*
- Added assets/ directory support and compatibility/metadata fields
- Excluded .hub/ from skill discovery in skills_tool.py

Updated 13 config/doc files including README, AGENTS.md, .env.example,
setup wizard, doctor, status, pyproject.toml, and docs.

											
										
										
											2026-02-18 16:09:05 -08:00
+								#   skills_hub   - skill_hub (search/install/manage from online registries — user-driven only)
-												Enhance platform toolset configuration and CLI toolset handling

- Introduced a new configuration section in `cli-config.yaml.example` for defining platform-specific toolsets, allowing for greater customization of available tools per platform.
- Updated the CLI to check for user-defined toolsets in the configuration, falling back to the default `hermes-cli` toolset if none are specified.
- Enhanced the `GatewayRunner` class to load platform-specific toolsets from the configuration, ensuring that the correct tools are enabled based on the platform being used.

											
										
										
											2026-02-17 23:39:24 -08:00
+								#   moa          - mixture_of_agents  (requires OPENROUTER_API_KEY)
 								#   todo         - todo (in-memory task planning, no deps)
 								#   tts          - text_to_speech  (Edge TTS free, or ELEVENLABS/OPENAI key)
 								#   cronjob      - schedule_cronjob, list_cronjobs, remove_cronjob
 								#   rl           - rl_list_environments, rl_start_training, etc. (requires TINKER_API_KEY)
 								#
 								# PRESETS (curated bundles):
 								#   hermes-cli       - All of the above except rl + send_message
 								#   hermes-telegram  - terminal, file, web, vision, image_gen, tts, browser,
 								#                      skills, todo, cronjob, send_message
 								#   hermes-discord   - Same as hermes-telegram
 								#   hermes-whatsapp  - Same as hermes-telegram
 								#   hermes-slack     - Same as hermes-telegram
 								#   hermes-signal    - Same as hermes-telegram
 								#   hermes-homeassistant - Same as hermes-telegram
 								#
 								# COMPOSITE:
 								#   debugging    - terminal + web + file
 								#   safe         - web + vision + moa (no terminal access)
 								#   all          - Everything available
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								#
 								# Individual toolsets:
 								#   web          - Web search and content extraction (web_search, web_extract)
 								#   search       - Web search only, no scraping (web_search)
-												Add todo tool for task management and enhance CLI features

- Introduced a new `todo_tool.py` for planning and tracking multi-step tasks, enhancing the agent's capabilities.
- Updated CLI to include a floating autocomplete dropdown for commands and improved user instructions for better navigation.
- Revised toolsets to incorporate the new `todo` tool and updated documentation to reflect changes in available tools and commands.
- Enhanced user experience with new keybindings and clearer command descriptions in the CLI.

											
										
										
											2026-02-17 23:30:31 -08:00
+								#   terminal     - Command execution and process management (terminal, process)
 								#   file         - File operations: read, write, patch, search
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								#   browser      - Full browser automation (navigate, click, type, screenshot, etc.)
 								#   vision       - Image analysis (vision_analyze)
 								#   image_gen    - Image generation with FLUX (image_generate)
-												Add todo tool for task management and enhance CLI features

- Introduced a new `todo_tool.py` for planning and tracking multi-step tasks, enhancing the agent's capabilities.
- Updated CLI to include a floating autocomplete dropdown for commands and improved user instructions for better navigation.
- Revised toolsets to incorporate the new `todo` tool and updated documentation to reflect changes in available tools and commands.
- Enhanced user experience with new keybindings and clearer command descriptions in the CLI.

											
										
										
											2026-02-17 23:30:31 -08:00
+								#   skills       - Load skill documents (skills_list, skill_view)
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								#   moa          - Mixture of Agents reasoning (mixture_of_agents)
-												Add todo tool for task management and enhance CLI features

- Introduced a new `todo_tool.py` for planning and tracking multi-step tasks, enhancing the agent's capabilities.
- Updated CLI to include a floating autocomplete dropdown for commands and improved user instructions for better navigation.
- Revised toolsets to incorporate the new `todo` tool and updated documentation to reflect changes in available tools and commands.
- Enhanced user experience with new keybindings and clearer command descriptions in the CLI.

											
										
										
											2026-02-17 23:30:31 -08:00
+								#   todo         - Task planning and tracking for multi-step work
-												feat: add persistent memory system + SQLite session store

Two-part implementation:

Part A - Curated Bounded Memory:
- New memory tool (tools/memory_tool.py) with MEMORY.md + USER.md stores
- Character-limited (2200/1375 chars), § delimited entries
- Frozen snapshot injected into system prompt at session start
- Model manages pruning via replace/remove with substring matching
- Usage indicator shown in system prompt header

Part B - SQLite Session Store:
- New hermes_state.py with SessionDB class, FTS5 full-text search
- Gateway session.py rewritten to dual-write SQLite + legacy JSONL
- Compression-triggered session splitting with parent_session_id chains
- New session_search tool with Gemini Flash summarization of matched sessions
- CLI session lifecycle (create on launch, close on exit)

Also:
- System prompt now cached per session, only rebuilt on compression
  (fixes prefix cache invalidation from date/time changes every turn)
- Config version bumped to 3, hermes doctor checks for new artifacts
- Disabled in batch_runner and RL environments

											
										
										
											2026-02-19 00:57:31 -08:00
+								#   memory       - Persistent memory across sessions (personal notes + user profile)
 								#   session_search - Search and recall past conversations (FTS5 + Gemini Flash summarization)
-												Add todo tool for task management and enhance CLI features

- Introduced a new `todo_tool.py` for planning and tracking multi-step tasks, enhancing the agent's capabilities.
- Updated CLI to include a floating autocomplete dropdown for commands and improved user instructions for better navigation.
- Revised toolsets to incorporate the new `todo` tool and updated documentation to reflect changes in available tools and commands.
- Enhanced user experience with new keybindings and clearer command descriptions in the CLI.

											
										
										
											2026-02-17 23:30:31 -08:00
+								#   tts          - Text-to-speech (Edge TTS free, ElevenLabs, OpenAI)
 								#   cronjob      - Schedule and manage automated tasks (CLI-only)
 								#   rl           - RL training tools (Tinker-Atropos)
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								#
 								# Composite toolsets:
-												Add todo tool for task management and enhance CLI features

- Introduced a new `todo_tool.py` for planning and tracking multi-step tasks, enhancing the agent's capabilities.
- Updated CLI to include a floating autocomplete dropdown for commands and improved user instructions for better navigation.
- Revised toolsets to incorporate the new `todo` tool and updated documentation to reflect changes in available tools and commands.
- Enhanced user experience with new keybindings and clearer command descriptions in the CLI.

											
										
										
											2026-02-17 23:30:31 -08:00
+								#   debugging    - terminal + web + file (for troubleshooting)
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								#   safe         - web + vision + moa (no terminal access)
 								# -----------------------------------------------------------------------------
 								# OPTION 1: Enable all tools (default)
 								# -----------------------------------------------------------------------------
 								toolsets:
 								  - all
 								# -----------------------------------------------------------------------------
 								# OPTION 2: Minimal - just web search and terminal
 								# Great for: Simple coding tasks, quick lookups
 								# -----------------------------------------------------------------------------
 								# toolsets:
 								#   - web
 								#   - terminal
 								# -----------------------------------------------------------------------------
 								# OPTION 3: Research mode - no execution capabilities
 								# Great for: Safe information gathering, research tasks
 								# -----------------------------------------------------------------------------
 								# toolsets:
 								#   - web
 								#   - vision
 								#   - skills
 								# -----------------------------------------------------------------------------
 								# OPTION 4: Full automation - browser + terminal
 								# Great for: Web scraping, automation tasks, testing
 								# -----------------------------------------------------------------------------
 								# toolsets:
 								#   - terminal
 								#   - browser
 								#   - web
 								# -----------------------------------------------------------------------------
 								# OPTION 5: Creative mode - vision + image generation
 								# Great for: Design work, image analysis, creative tasks
 								# -----------------------------------------------------------------------------
 								# toolsets:
 								#   - vision
 								#   - image_gen
 								#   - web
 								# -----------------------------------------------------------------------------
 								# OPTION 6: Safe mode - no terminal or browser
 								# Great for: Restricted environments, untrusted queries
 								# -----------------------------------------------------------------------------
 								# toolsets:
 								#   - safe
-												docs: add comprehensive MCP documentation and examples

- docs/mcp.md: Full MCP documentation covering prerequisites, configuration,
  transports (stdio + HTTP), security (env filtering, credential stripping),
  reconnection, troubleshooting, popular servers, and advanced usage
- README.md: Add MCP section with quick config example and install instructions
- cli-config.yaml.example: Add commented mcp_servers section with examples
  for stdio, HTTP, and authenticated server configs
- docs/tools.md: Add MCP to Tool Categories table and MCP Tools section
- skills/mcp/native-mcp/SKILL.md: Create native MCP client skill with
  full configuration reference, transport types, security, troubleshooting
- skills/mcp/DESCRIPTION.md: Update category description to cover both
  native MCP client and mcporter bridge approaches

											
										
										
											2026-03-02 18:52:33 -08:00
+								# =============================================================================
 								# MCP (Model Context Protocol) Servers
 								# =============================================================================
 								# Connect to external MCP servers to add tools from the MCP ecosystem.
 								# Each server's tools are automatically discovered and registered.
 								# See docs/mcp.md for full documentation.
 								#
 								# Stdio servers (spawn a subprocess):
 								#   command: the executable to run
 								#   args: command-line arguments
 								#   env: environment variables (only these + safe defaults passed to subprocess)
 								#
 								# HTTP servers (connect to a URL):
 								#   url: the MCP server endpoint
 								#   headers: HTTP headers (e.g., for authentication)
 								#
 								# Optional per-server settings:
 								#   timeout: tool call timeout in seconds (default: 120)
 								#   connect_timeout: initial connection timeout (default: 60)
 								#
 								# mcp_servers:
 								#   time:
 								#     command: uvx
 								#     args: ["mcp-server-time"]
 								#   filesystem:
 								#     command: npx
 								#     args: ["-y", "@modelcontextprotocol/server-filesystem", "/home/user"]
 								#   notion:
 								#     url: https://mcp.notion.com/mcp
 								#   github:
 								#     command: npx
 								#     args: ["-y", "@modelcontextprotocol/server-github"]
 								#     env:
 								#       GITHUB_PERSONAL_ACCESS_TOKEN: "ghp_..."
-												feat(mcp): add sampling support — server-initiated LLM requests (#753)

Add MCP sampling/createMessage capability via SamplingHandler class.

Text-only sampling + tool use in sampling with governance (rate limits,
model whitelist, token caps, tool loop limits). Per-server audit metrics.

Based on concept from PR #366 by eren-karakus0. Restructured as class-based
design with bug fixes and tests using real MCP SDK types.

50 new tests, 2600 total passing.
											
										
										
											2026-03-09 03:37:38 -07:00
+								#
 								# Sampling (server-initiated LLM requests) — enabled by default.
 								# Per-server config goes under that server's 'sampling' key (example entry inside mcp_servers):
 								#   analysis:
 								#     command: npx
 								#     args: ["-y", "analysis-server"]
 								#     sampling:
 								#       enabled: true           # default: true
 								#       model: "gemini-3-flash" # override model (optional)
 								#       max_tokens_cap: 4096    # max tokens per request
 								#       timeout: 30             # LLM call timeout (seconds)
 								#       max_rpm: 10             # max requests per minute
 								#       allowed_models: []      # model whitelist (empty = all)
 								#       max_tool_rounds: 5      # tool loop limit (0 = disable)
 								#       log_level: "info"       # audit verbosity
-												docs: add comprehensive MCP documentation and examples

- docs/mcp.md: Full MCP documentation covering prerequisites, configuration,
  transports (stdio + HTTP), security (env filtering, credential stripping),
  reconnection, troubleshooting, popular servers, and advanced usage
- README.md: Add MCP section with quick config example and install instructions
- cli-config.yaml.example: Add commented mcp_servers section with examples
  for stdio, HTTP, and authenticated server configs
- docs/tools.md: Add MCP to Tool Categories table and MCP Tools section
- skills/mcp/native-mcp/SKILL.md: Create native MCP client skill with
  full configuration reference, transport types, security, troubleshooting
- skills/mcp/DESCRIPTION.md: Update category description to cover both
  native MCP client and mcporter bridge approaches

											
										
										
											2026-03-02 18:52:33 -08:00
-												Add messaging platform enhancements: STT, stickers, Discord UX, Slack, pairing, hooks

Major feature additions inspired by OpenClaw/ClawdBot integration analysis:

Voice Message Transcription (STT):
- Auto-transcribe voice/audio messages via OpenAI Whisper API
- Download voice to ~/.hermes/audio_cache/ on Telegram/Discord/WhatsApp
- Inject transcript as text so all models can understand voice input
- Configurable model (whisper-1, gpt-4o-mini-transcribe, gpt-4o-transcribe)

Telegram Sticker Understanding:
- Describe static stickers via vision tool with JSON-backed cache
- Cache keyed by file_unique_id avoids redundant API calls
- Animated/video stickers get emoji-based fallback description

Discord Rich UX:
- Native slash commands (/ask, /reset, /status, /stop) via app_commands
- Button-based exec approvals (Allow Once / Always Allow / Deny)
- ExecApprovalView with user authorization and timeout handling

Slack Integration:
- Full SlackAdapter using slack-bolt with Socket Mode
- DMs, channel messages (mention-gated), /hermes slash command
- File attachment handling with bot-token-authenticated downloads

DM Pairing System:
- Code-based user authorization as alternative to static allowlists
- 8-char codes from unambiguous alphabet, 1-hour expiry
- Rate limiting, lockout after failed attempts, chmod 0600 on data
- CLI: hermes pairing list/approve/revoke/clear-pending

Event Hook System:
- File-based hook discovery from ~/.hermes/hooks/
- HOOK.yaml + handler.py per hook, sync/async handler support
- Events: gateway:startup, session:start/reset, agent:start/step/end
- Wildcard matching (command:* catches all command events)

Cross-Channel Messaging:
- send_message agent tool for delivering to any connected platform
- Enables cron job delivery and cross-platform notifications

Human-Like Response Pacing:
- Configurable delays between message chunks (off/natural/custom)
- HERMES_HUMAN_DELAY_MODE env var with min/max ms settings

Warm Injection Message Style:
- Retrofitted image vision messages with friendly kawaii-consistent tone
- All new injection messages (STT, stickers, errors) use warm style

Also: updated config migration to prompt for optional keys interactively,
bumped config version, updated README, AGENTS.md, .env.example,
cli-config.yaml.example, install scripts, pyproject.toml, and toolsets.

											
										
										
											2026-02-15 21:38:59 -08:00
+								# =============================================================================
 								# Voice Transcription (Speech-to-Text)
 								# =============================================================================
 								# Automatically transcribe voice messages on messaging platforms.
 								# Requires OPENAI_API_KEY in .env (uses OpenAI Whisper API directly).
 								# Speech-to-text settings for voice messages received on messaging platforms.
 								stt:
 								  # Toggle for automatic transcription (true = on).
 								  enabled: true
 								  # Transcription model; the options are listed in the trailing comment.
 								  model: "whisper-1"  # whisper-1 (cheapest) | gpt-4o-mini-transcribe | gpt-4o-transcribe
 								# =============================================================================
 								# Response Pacing (Messaging Platforms)
 								# =============================================================================
 								# Add human-like delays between message chunks.
 								# human_delay:
 								#   mode: "off"      # "off" | "natural" | "custom"
 								#   min_ms: 800      # Min delay (custom mode only)
 								#   max_ms: 2500     # Max delay (custom mode only)
-												Enhance session logging and interactive sudo support

- Implemented automatic session logging, saving conversation trajectories to the `logs/` directory in JSON format, with each session having a unique identifier.
- Updated the CLI to display the session ID in the welcome banner for easy reference.
- Introduced an interactive sudo password prompt in CLI mode, allowing users to enter their password with a 45-second timeout, enhancing user experience during command execution.
- Documented session logging and interactive sudo features in `README.md`, `cli.md`, and `cli-config.yaml.example` for better user guidance.

											
										
										
											2026-02-01 15:36:26 -08:00
+								# =============================================================================
 								# Session Logging
 								# =============================================================================
 								# Session trajectories are automatically saved to logs/ directory.
 								# Each session creates: logs/session_YYYYMMDD_HHMMSS_UUID.json
 								#
 								# The session ID is displayed in the welcome banner for easy reference.
 								# Logs contain full conversation history in trajectory format:
 								# - System prompt, user messages, assistant responses
 								# - Tool calls with inputs/outputs
 								# - Timestamps for debugging
 								#
 								# No configuration needed - logging is always enabled.
 								# To disable, you would need to modify the source code.
-												feat: implement subagent delegation for task management

- Introduced the `delegate_task` tool, allowing the main agent to spawn child AIAgent instances with isolated context for complex tasks.
- Supported both single-task and batch processing (up to 3 concurrent tasks) to enhance task management capabilities.
- Updated configuration options for delegation, including maximum iterations and default toolsets for subagents.
- Enhanced documentation to provide clear guidance on using the delegation feature and its configuration.
- Added comprehensive tests to ensure the functionality and reliability of the delegation logic.

											
										
										
											2026-02-20 03:15:53 -08:00
+								# =============================================================================
 								# Code Execution Sandbox (Programmatic Tool Calling)
 								# =============================================================================
 								# The execute_code tool runs Python scripts that call Hermes tools via RPC.
 								# Intermediate tool results stay out of the LLM's context window.
 								# Per-execution limits for scripts run through the execute_code tool.
 								code_execution:
 								  timeout: 300         # Max seconds per script before kill (default: 300 = 5 min)
 								  max_tool_calls: 50   # Max RPC tool calls per execution (default: 50)
 								# =============================================================================
 								# Subagent Delegation
 								# =============================================================================
 								# The delegate_task tool spawns child agents with isolated context.
 								# Supports single tasks and batch mode (up to 3 tasks running in parallel).
 								delegation:
-												fix(delegate_tool): update max_iterations in documentation and example config to reflect default value of 50

											
										
										
											2026-03-02 00:52:01 -08:00
+								  max_iterations: 50                          # Max tool-calling turns per child (default: 50)
-												feat: implement subagent delegation for task management

- Introduced the `delegate_task` tool, allowing the main agent to spawn child AIAgent instances with isolated context for complex tasks.
- Supported both single-task and batch processing (up to 3 concurrent tasks) to enhance task management capabilities.
- Updated configuration options for delegation, including maximum iterations and default toolsets for subagents.
- Enhanced documentation to provide clear guidance on using the delegation feature and its configuration.
- Added comprehensive tests to ensure the functionality and reliability of the delegation logic.

											
										
										
											2026-02-20 03:15:53 -08:00
+								  default_toolsets: ["terminal", "file", "web"]  # Default toolsets for subagents
-												feat: add Honcho integration for cross-session user modeling

											
										
										
											2026-02-27 23:41:08 -08:00
+								# =============================================================================
 								# Honcho Integration (Cross-Session User Modeling)
 								# =============================================================================
 								# AI-native persistent memory via Honcho (https://honcho.dev/).
 								# Builds a deeper understanding of the user across sessions and tools.
 								# Runs alongside USER.md — additive, not a replacement.
 								#
 								# Requires: pip install honcho-ai
 								# Config: ~/.honcho/config.json (shared with Claude Code, Cursor, etc.)
 								# API key: HONCHO_API_KEY in ~/.hermes/.env or ~/.honcho/config.json
 								#
 								# Hermes-specific overrides (optional — most config comes from ~/.honcho/config.json):
 								# honcho: {}
-												Add a claude code-like CLI

- Introduced `cli-config.yaml.example` to provide a template for configuring the CLI behavior, including model settings, terminal tool configurations, agent behavior, and toolsets.
- Created `cli.py` for an interactive terminal interface, allowing users to start the Hermes Agent with various options and toolsets.
- Added `hermes` launcher script for convenient CLI access.
- Updated `model_tools.py` to support quiet mode for suppressing output during tool initialization and execution.
- Enhanced logging in various tools to respect quiet mode, improving user experience by reducing unnecessary output.
- Added `prompt_toolkit` to `requirements.txt` for improved CLI interaction capabilities.
- Created `TODO.md` for future improvements and enhancements to the Hermes Agent framework.

											
										
										
											2026-01-31 06:30:48 +00:00
+								# =============================================================================
 								# Display
 								# =============================================================================
 								display:
 								  # Use compact banner mode
 								  compact: false
-												refactor: migrate tool progress configuration from environment variables to config.yaml

											
										
										
											2026-02-28 00:05:58 -08:00
 								  # Tool progress display level (CLI and gateway)
 								  #   off:     Silent — no tool activity shown, just the final response
 								  #            (write it quoted, "off" — a bare off is a boolean in YAML 1.1)
 								  #   new:     Show a tool indicator only when the tool changes (skip repeats)
 								  #   all:     Show every tool call with a short preview (default)
 								  #   verbose: Full args, results, and debug logs (same as /verbose)
 								  # Toggle at runtime with /verbose in the CLI
 								  tool_progress: all
-												feat: bell_on_complete — terminal bell when agent finishes

Adds a simple config option to play the terminal bell (\a) when the
agent finishes a response. Useful for long-running tasks — switch to
another window and your terminal will ding when done.

Works over SSH since the bell character propagates through the
connection. Most terminal emulators can be configured to flash the
taskbar, play a sound, or show a visual indicator on bell.

Config (default: off):
  display:
    bell_on_complete: true

Closes #318

											
										
										
											2026-03-08 19:41:17 -07:00
-												feat(gateway): configurable background process watcher notifications

Add display.background_process_notifications config option to control
how chatty the gateway process watcher is when using
terminal(background=true, check_interval=...) from messaging platforms.

Modes:
  - all:    running-output updates + final message (default, current behavior)
  - result: only the final completion message
  - error:  only the final message when exit code != 0
  - off:    no watcher messages at all

Also supports HERMES_BACKGROUND_NOTIFICATIONS env var override.

Includes 12 tests (5 config loading + 7 watcher behavior).

Inspired by @PeterFile's PR #593. Closes #592.

											
										
										
											2026-03-10 04:12:39 -07:00
+								  # Background process notifications (gateway/messaging only).
 								  # Controls how chatty the process watcher is when you use
 								  # terminal(background=true, check_interval=...) from Telegram/Discord/etc.
 								  #   off:     No watcher messages at all
 								  #            (write it quoted, "off" — a bare off is a boolean in YAML 1.1)
 								  #   result:  Only the final completion message
 								  #   error:   Only the final message when exit code != 0
 								  #   all:     Running output updates + final message (default)
 								  background_process_notifications: all
-												feat: bell_on_complete — terminal bell when agent finishes

Adds a simple config option to play the terminal bell (\a) when the
agent finishes a response. Useful for long-running tasks — switch to
another window and your terminal will ding when done.

Works over SSH since the bell character propagates through the
connection. Most terminal emulators can be configured to flash the
taskbar, play a sound, or show a visual indicator on bell.

Config (default: off):
  display:
    bell_on_complete: true

Closes #318

											
										
										
											2026-03-08 19:41:17 -07:00
+								  # Play terminal bell when agent finishes a response.
 								  # Useful for long-running tasks — your terminal will ding when the agent is done.
 								  # Works over SSH. Most terminals can be configured to flash the taskbar or play a sound.
 								  bell_on_complete: false
-												docs: comprehensive skin/theme system documentation

- AGENTS.md: add Skin/Theme System section with architecture, skinnable
  elements table, built-in skins list, adding built-in/user skins guide,
  YAML example; add skin_engine.py to project structure; mention skin
  engine in CLI Architecture section
- CONTRIBUTING.md: add skin_engine.py to project structure; add 'Adding
  a Skin/Theme' section with YAML schema, activation instructions
- cli-config.yaml.example: add full skin config documentation with
  schema reference, built-in skins list, all color/spinner/branding keys
- docs/skins/example-skin.yaml: complete annotated skin template with
  all available fields and inline documentation
- hermes_cli/skin_engine.py: expand module docstring to full schema
  reference with all fields documented, usage examples, built-in skins
  list

											
										
										
											2026-03-10 00:51:27 -07:00
 								  # ───────────────────────────────────────────────────────────────────────────
 								  # Skin / Theme
 								  # ───────────────────────────────────────────────────────────────────────────
 								  # Customize CLI visual appearance — banner colors, spinner faces, tool prefix,
 								  # response box label, and branding text. Change at runtime with /skin <name>.
 								  #
 								  # Built-in skins:
 								  #   default  — Classic Hermes gold/kawaii
 								  #   ares     — Crimson/bronze war-god theme with spinner wings
 								  #   mono     — Clean grayscale monochrome
 								  #   slate    — Cool blue developer-focused
 								  #
 								  # Custom skins: drop a YAML file in ~/.hermes/skins/<name>.yaml
 								  # Schema (all fields optional, missing values inherit from default):
 								  #
 								  #   name: my-theme
 								  #   description: Short description
 								  #   colors:
 								  #     banner_border: "#HEX"    # Panel border
 								  #     banner_title: "#HEX"     # Panel title
 								  #     banner_accent: "#HEX"    # Section headers (Available Tools, etc.)
 								  #     banner_dim: "#HEX"       # Dim/muted text
 								  #     banner_text: "#HEX"      # Body text (tool names, skill names)
 								  #     ui_accent: "#HEX"        # UI accent color
 								  #     response_border: "#HEX"  # Response box border color
 								  #   spinner:
 								  #     waiting_faces: ["(⚔)", "(⛨)"]       # Faces shown while waiting
 								  #     thinking_faces: ["(⚔)", "(⌁)"]      # Faces shown while thinking
 								  #     thinking_verbs: ["forging", "plotting"]  # Verbs for spinner messages
 								  #     wings:                                # Optional left/right spinner decorations
 								  #       - ["⟪⚔", "⚔⟫"]
 								  #       - ["⟪▲", "▲⟫"]
 								  #   branding:
 								  #     agent_name: "My Agent"               # Banner title and branding
 								  #     welcome: "Welcome message"           # Shown at CLI startup
 								  #     response_label: " ⚔ Agent "         # Response box header label
 								  #     prompt_symbol: "⚔ ❯ "              # Prompt symbol
 								  #   tool_prefix: "╎"                       # Tool output line prefix (default: ┊)
 								  #
 								  skin: default