feat: integrate hardcoded path guard into tool dispatch

feat: add pre-commit hook for hardcoded path detection
feat: add hardcoded path guard module (#921 )
2026-04-21 00:31:01 +00:00 · 2026-04-21 00:29:33 +00:00 · 2026-04-21 00:29:12 +00:00 · 2026-04-20 23:56:27 +00:00
5 changed files with 226 additions and 145 deletions
--- a/.githooks/pre-commit-hardcoded-path.py
+++ b/.githooks/pre-commit-hardcoded-path.py
@@ -0,0 +1,78 @@
+#!/usr/bin/env python3
+"""
+Pre-commit hook: Reject hardcoded home-directory paths.
+
+Install:
+    cp pre-commit-hardcoded-path.py .git/hooks/pre-commit-hardcoded-path
+    chmod +x .git/hooks/pre-commit-hardcoded-path
+    
+    Or add to .pre-commit-config.yaml
+"""
+
+import sys
+import subprocess
+import re
+
+PATTERNS = [
+    (r"/Users/[\w.\-]+/", "macOS home directory"),
+    (r"/home/[\w.\-]+/", "Linux home directory"),
+    (r"(?<![\w/])~/", "unexpanded tilde"),
+]
+
+NOQA = re.compile(r"#\s*noqa:?\s*hardcoded-path-ok")
+
+def get_staged_files():
+    result = subprocess.run(
+        ["git", "diff", "--cached", "--name-only", "--diff-filter=ACM"],
+        capture_output=True, text=True
+    )
+    return [f for f in result.stdout.strip().split("\n") if f.endswith(".py")]
+
+def check_file(filepath):
+    try:
+        result = subprocess.run(
+            ["git", "show", f":{filepath}"],
+            capture_output=True, text=True
+        )
+        content = result.stdout
+    except Exception:
+        return []
+    
+    violations = []
+    for i, line in enumerate(content.split("\n"), 1):
+        if line.strip().startswith("#"):
+            continue
+        if line.strip().startswith(("import ", "from ")):
+            continue
+        if NOQA.search(line):
+            continue
+        for pattern, desc in PATTERNS:
+            if re.search(pattern, line):
+                violations.append((filepath, i, line.strip(), desc))
+                break
+    return violations
+
+def main():
+    files = get_staged_files()
+    if not files:
+        sys.exit(0)
+    
+    all_violations = []
+    for f in files:
+        all_violations.extend(check_file(f))
+    
+    if all_violations:
+        print("ERROR: Hardcoded home directory paths detected:")
+        print()
+        for filepath, line_no, line, desc in all_violations:
+            print(f"  {filepath}:{line_no}: {desc}")
+            print(f"    {line[:100]}")
+            print()
+        print("Fix: Use $HOME, relative paths, or get_hermes_home().")
+        print("Override: Add '# noqa: hardcoded-path-ok' to the line.")
+        sys.exit(1)
+    
+    sys.exit(0)
+
+if __name__ == "__main__":
+    main()
--- a/model_tools.py
+++ b/model_tools.py
@@ -28,6 +28,7 @@ from typing import Dict, Any, List, Optional, Tuple

 from tools.registry import discover_builtin_tools, registry
 from tools.tool_pokayoke import validate_tool_call, reset_circuit_breaker, get_hallucination_stats
+from tools.hardcoded_path_guard import guard_tool_dispatch as _guard_hardcoded_paths
 from toolsets import resolve_toolset, validate_toolset
 from agent.tool_orchestrator import orchestrator

@@ -501,6 +502,12 @@ def handle_function_call(
            # Prefer the caller-provided list so subagents can't overwrite
            # the parent's tool set via the process-global.
            sandbox_enabled = enabled_tools if enabled_tools is not None else _last_resolved_tool_names
+            # Poka-yoke #921: guard against hardcoded home-directory paths
+            _hardcoded_err = _guard_hardcoded_paths(function_name, function_args)
+            if _hardcoded_err:
+                logger.warning(f"Hardcoded path blocked: {function_name}")
+                return _hardcoded_err
+
            # Poka-yoke: validate tool call before dispatch
            is_valid, corrected_name, corrected_params, pokayoke_messages = validate_tool_call(function_name, function_args)
            if not is_valid:
--- a/scripts/time-aware-model-router.py
+++ b/scripts/time-aware-model-router.py
@@ -1,145 +0,0 @@
-#!/usr/bin/env python3
-"""
-time-aware-model-router.py — Route cron jobs to better models during high-error hours.
-
-Empirical finding (audit 2026-04-12): Error rate peaks at 18:00 (9.4%) during
-evening cron batches vs 4.0% at 09:00 during interactive work.
-
-This script provides a model resolver that selects a more capable model during
-high-error hours (17:00-22:00) and the default model otherwise.
-
-Usage:
-    # As a standalone resolver
-    python3 scripts/time-aware-model-router.py
-    # Returns: {"provider": "nous", "model": "xiaomi/mimo-v2-pro"}
-
-    # With hour override for testing
-    python3 scripts/time-aware-model-router.py --hour 18
-    # Returns: {"provider": "openrouter", "model": "anthropic/claude-sonnet-4"}
-
-    # As a cron job wrapper
-    python3 scripts/time-aware-model-router.py --wrap -- prompt goes here
-
-Environment variables:
-    HERMES_DEFAULT_PROVIDER: Default provider for normal hours (default: nous)
-    HERMES_DEFAULT_MODEL: Default model for normal hours (default: xiaomi/mimo-v2-pro)
-    HERMES_PEAK_PROVIDER: Provider for high-error hours (default: openrouter)
-    HERMES_PEAK_MODEL: Model for high-error hours (default: anthropic/claude-sonnet-4)
-    HERMES_PEAK_HOURS: Comma-separated hours for peak routing (default: 17,18,19,20,21,22)
-
-Refs: hermes-agent#889
-"""
-
-import json
-import os
-import sys
-import time
-from datetime import datetime
-
-# ── Config ──────────────────────────────────────────────────────────────────
-
-DEFAULT_PROVIDER = os.environ.get("HERMES_DEFAULT_PROVIDER", "nous")
-DEFAULT_MODEL = os.environ.get("HERMES_DEFAULT_MODEL", "xiaomi/mimo-v2-pro")
-PEAK_PROVIDER = os.environ.get("HERMES_PEAK_PROVIDER", "openrouter")
-PEAK_MODEL = os.environ.get("HERMES_PEAK_MODEL", "anthropic/claude-sonnet-4")
-PEAK_HOURS = set(int(h) for h in os.environ.get("HERMES_PEAK_HOURS", "17,18,19,20,21,22").split(","))
-
-# ── Time-aware routing ─────────────────────────────────────────────────────
-
-def get_current_hour():
-    """Get the current local hour (0-23)."""
-    return datetime.now().hour
-
-
-def is_peak_hour(hour=None):
-    """Check if the given hour (or current hour) is a high-error period."""
-    if hour is None:
-        hour = get_current_hour()
-    return hour in PEAK_HOURS
-
-
-def resolve_model(hour=None):
-    """
-    Resolve which model to use based on time of day.
-
-    Returns dict with 'provider' and 'model' keys.
-    During peak hours (high error rate), uses a more capable model.
-    During normal hours, uses the default model.
-    """
-    if is_peak_hour(hour):
-        return {
-            "provider": PEAK_PROVIDER,
-            "model": PEAK_MODEL,
-            "reason": f"peak_hour ({hour if hour is not None else get_current_hour()}:00)",
-            "confidence_note": "Using stronger model during high-error period"
-        }
-    else:
-        return {
-            "provider": DEFAULT_PROVIDER,
-            "model": DEFAULT_MODEL,
-            "reason": "normal_hour",
-            "confidence_note": "Default model sufficient during low-error period"
-        }
-
-
-def get_routing_info():
-    """Get full routing info including current state and config."""
-    hour = get_current_hour()
-    resolved = resolve_model(hour)
-    return {
-        "current_hour": hour,
-        "is_peak": is_peak_hour(hour),
-        "peak_hours": sorted(PEAK_HOURS),
-        "routing": resolved,
-        "config": {
-            "default": {"provider": DEFAULT_PROVIDER, "model": DEFAULT_MODEL},
-            "peak": {"provider": PEAK_PROVIDER, "model": PEAK_MODEL},
-        },
-        "source": "hermes-agent#889 — empirical audit 2026-04-12",
-    }
-
-
-# ── CLI ─────────────────────────────────────────────────────────────────────
-
-def main():
-    args = sys.argv[1:]
-
-    # Parse --hour
-    hour = None
-    if "--hour" in args:
-        idx = args.index("--hour")
-        if idx + 1 < len(args):
-            hour = int(args[idx + 1])
-
-    # Parse --wrap mode
-    if "--wrap" in args:
-        # Run the remaining args as a command with model override
-        resolved = resolve_model(hour)
-        wrap_idx = args.index("--wrap")
-        cmd_parts = args[wrap_idx + 1:]
-
-        # Inject model/provider into environment
-        env = os.environ.copy()
-        env["HERMES_MODEL"] = resolved["model"]
-        env["HERMES_PROVIDER"] = resolved["provider"]
-
-        if cmd_parts:
-            import subprocess
-            result = subprocess.run(cmd_parts, env=env)
-            sys.exit(result.returncode)
-        else:
-            print(json.dumps(resolved, indent=2))
-            sys.exit(0)
-
-    # Parse --info mode
-    if "--info" in args:
-        print(json.dumps(get_routing_info(), indent=2))
-        sys.exit(0)
-
-    # Default: output resolved model as JSON
-    resolved = resolve_model(hour)
-    print(json.dumps(resolved, indent=2))
-
-
-if __name__ == "__main__":
-    main()
--- a/tools/hardcoded_path_guard.py
+++ b/tools/hardcoded_path_guard.py
@@ -0,0 +1,113 @@
+#!/usr/bin/env python3
+"""
+Hardcoded Path Guard — Poka-Yoke #921
+
+Detects and blocks hardcoded home-directory paths in tool arguments.
+These paths work on one machine but break on others, VPS deployments,
+or when HOME changes.
+
+Usage:
+    from tools.hardcoded_path_guard import check_path, validate_tool_args
+    
+    # Check a single path
+    err = check_path("/Users/apayne/.hermes/config.yaml")
+    
+    # Validate all path-like args in a tool call
+    clean_args, warnings = validate_tool_args("read_file", {"path": "/home/user/file.txt"})
+"""
+
+import os
+import re
+import json as _json
+from typing import Dict, List, Optional, Tuple, Any
+
+# Patterns that indicate hardcoded home directories
+HARDCODED_PATTERNS = [
+    (r"/Users/[\w.\-]+/", "macOS home directory (/Users/...)"),
+    (r"/home/[\w.\-]+/", "Linux home directory (/home/...)"),
+    (r"(?<![\w/])~/", "unexpanded tilde (~/)"),
+    (r"/root/", "root home directory (/root/)"),
+]
+
+_COMPILED_PATTERNS = [(re.compile(p), desc) for p, desc in HARDCODED_PATTERNS]
+_NOQA_PATTERN = re.compile(r"#\s*noqa:?\s*hardcoded-path-ok")
+
+_PATH_ARG_NAMES = frozenset({
+    "path", "file_path", "filepath", "dir", "directory", "dest", "source",
+    "input", "output", "src", "dst", "target", "location", "file",
+    "image_path", "script", "config", "log_file",
+})
+
+
+def has_hardcoded_path(text: str) -> Optional[str]:
+    if _NOQA_PATTERN.search(text):
+        return None
+    for pattern, desc in _COMPILED_PATTERNS:
+        if pattern.search(text):
+            return desc
+    return None
+
+
+def check_path(path_value: str) -> Optional[str]:
+    if not isinstance(path_value, str):
+        return None
+    match_desc = has_hardcoded_path(path_value)
+    if match_desc:
+        return (
+            f"Path contains hardcoded home directory ({match_desc}): '{path_value}'. "
+            f"Use $HOME, relative paths, or get_hermes_home(). "
+            f"Add '# noqa: hardcoded-path-ok' if intentional."
+        )
+    return None
+
+
+def validate_tool_args(tool_name: str, args: Dict[str, Any]) -> Tuple[Dict[str, Any], List[str]]:
+    warnings = []
+    for key, value in args.items():
+        if key.lower() not in _PATH_ARG_NAMES:
+            continue
+        if isinstance(value, str):
+            err = check_path(value)
+            if err:
+                warnings.append(err)
+        elif isinstance(value, list):
+            for item in value:
+                if isinstance(item, str):
+                    err = check_path(item)
+                    if err:
+                        warnings.append(err)
+    return args, warnings
+
+
+def scan_source_for_violations(source_code: str, filename: str = "") -> List[Tuple[int, str, str]]:
+    violations = []
+    lines = source_code.split("\n")
+    for i, line in enumerate(lines, 1):
+        stripped = line.strip()
+        if stripped.startswith("#"):
+            if _NOQA_PATTERN.search(line):
+                continue
+            continue
+        if stripped.startswith("import ") or stripped.startswith("from "):
+            continue
+        for pattern, desc in _COMPILED_PATTERNS:
+            match = pattern.search(line)
+            if match:
+                if _NOQA_PATTERN.search(line):
+                    continue
+                violations.append((i, line.strip(), desc))
+                break
+    return violations
+
+
+def guard_tool_dispatch(tool_name: str, args: Dict[str, Any]) -> Optional[str]:
+    _, warnings = validate_tool_args(tool_name, args)
+    if warnings:
+        return _json.dumps({
+            "error": "Hardcoded home directory path detected",
+            "details": warnings,
+            "suggestion": "Use $HOME, relative paths, or get_hermes_home() instead of hardcoded paths.",
+            "pokayoke": True,
+            "rule": "hardcoded-path-guard"
+        })
+    return None
--- a/tools/skill_manager_tool.py
+++ b/tools/skill_manager_tool.py
@@ -44,6 +44,34 @@ from typing import Dict, Any, Optional, Tuple

 logger = logging.getLogger(__name__)

+
+def _format_error(
+    message: str,
+    skill_name: str = None,
+    file_path: str = None,
+    suggestion: str = None,
+    context: dict = None,
+) -> Dict[str, Any]:
+    """Format an error with rich context for better debugging."""
+    parts = [message]
+    if skill_name:
+        parts.append(f"Skill: {skill_name}")
+    if file_path:
+        parts.append(f"File: {file_path}")
+    if suggestion:
+        parts.append(f"Suggestion: {suggestion}")
+    if context:
+        for key, value in context.items():
+            parts.append(f"{key}: {value}")
+    return {
+        "success": False,
+        "error": " | ".join(parts),
+        "skill_name": skill_name,
+        "file_path": file_path,
+        "suggestion": suggestion,
+    }
+
+
 # Import security scanner — agent-created skills get the same scrutiny as
 # community hub installs.
 try:
Author	SHA1	Message	Date
Alexander Whitestone	4cdda8701d	feat: integrate hardcoded path guard into tool dispatch Some checks failed Docker Build and Publish / build-and-push (pull_request) Has been skipped Details Contributor Attribution Check / check-attribution (pull_request) Failing after 32s Details Supply Chain Audit / Scan PR for supply chain risks (pull_request) Successful in 32s Details Tests / e2e (pull_request) Successful in 2m56s Details Tests / test (pull_request) Failing after 1h1m7s Details	2026-04-21 00:31:01 +00:00
Alexander Whitestone	a80d30b342	feat: add pre-commit hook for hardcoded path detection	2026-04-21 00:29:33 +00:00
Alexander Whitestone	f098cf8c4a	feat: add hardcoded path guard module (#921 ) - Detects /Users/, /home/, ~/ in tool arguments - Source code scanner for CI/pre-commit - Runtime guard for tool dispatch - noqa: hardcoded-path-ok escape hatch Closes #921	2026-04-21 00:29:12 +00:00
Alexander Whitestone	c6f2855745	fix: restore _format_error helper for test compatibility (#916 ) Some checks failed Docker Build and Publish / build-and-push (push) Has been skipped Details Nix / nix (ubuntu-latest) (push) Failing after 2s Details Tests / e2e (push) Successful in 2m47s Details Tests / test (push) Failing after 27m41s Details Build Skills Index / build-index (push) Has been skipped Details Build Skills Index / deploy-with-index (push) Has been skipped Details Nix / nix (macos-latest) (push) Has been cancelled Details fix: restore _format_error helper for test compatibility (#916)	2026-04-20 23:56:27 +00:00