test: Add approval tier tests (#670)

feat: Add approval tier system (#670)
2026-04-15 04:05:26 +00:00 · 2026-04-15 04:05:02 +00:00
4 changed files with 338 additions and 812 deletions
--- a/docs/approval-tiers.md
+++ b/docs/approval-tiers.md
@@ -1,68 +0,0 @@
-# Approval Tier System
-
-Graduated safety based on risk level. Routes confirmations through the appropriate channel.
-
-## Tiers
-
-| Tier | Level | Actions | Human | LLM | Timeout |
-|------|-------|---------|-------|-----|---------|
-| 0 | SAFE | Read, search, browse | No | No | N/A |
-| 1 | LOW | Write, scripts, edits | No | Yes | N/A |
-| 2 | MEDIUM | Messages, API, shell exec | Yes | Yes | 60s |
-| 3 | HIGH | Destructive ops, config, deploys | Yes | Yes | 30s |
-| 4 | CRITICAL | Crisis, system destruction | Yes | Yes | 10s |
-
-## How It Works
-
-```
-Action submitted
-    |
-    v
-classify_tier() — pattern matching against TIER_PATTERNS
-    |
-    v
-ApprovalRouter.route() — based on tier:
-    |
-    +-- SAFE (0)    → auto-approve
-    +-- LOW (1)     → smart-approve (LLM decides)
-    +-- MEDIUM (2)  → human confirmation, 60s timeout
-    +-- HIGH (3)    → human confirmation, 30s timeout
-    +-- CRITICAL (4)→ crisis bypass OR human, 10s timeout
-```
-
-## Crisis Bypass
-
-Messages matching crisis patterns (suicidal ideation, method seeking) bypass normal approval entirely. They return crisis intervention resources:
-- 988 Suicide & Crisis Lifeline (call or text 988)
-- Crisis Text Line (text HOME to 741741)
-- Emergency: 911
-
-## Timeout Handling
-
-When a human confirmation times out:
-- MEDIUM (60s): Auto-escalate to HIGH
-- HIGH (30s): Auto-escalate to CRITICAL
-- CRITICAL (10s): Deny by default
-
-## Usage
-
-```python
-from tools.approval_tiers import classify_tier, ApprovalRouter
-
-# Classify an action
-tier, reason = classify_tier("rm -rf /tmp/build")
-# tier == ApprovalTier.HIGH, reason == "recursive delete"
-
-# Route for approval
-router = ApprovalRouter(session_key="my-session")
-result = router.route("rm -rf /tmp/build", description="Clean build artifacts")
-# result["approved"] == False, result["tier"] == "HIGH"
-
-# Handle response
-if result["status"] == "approval_required":
-    # Show confirmation UI, wait for user
-    pass
-elif result["status"] == "crisis":
-    # Show crisis resources
-    pass
-```
--- a/tests/test_approval_tiers.py
+++ b/tests/test_approval_tiers.py
@@ -1,223 +1,122 @@
-"""Tests for the Approval Tier System — issue #670."""
+"""
+Tests for approval tier system

-import pytest
+Issue: #670
+"""
+
+import unittest
 from tools.approval_tiers import (
    ApprovalTier,
-    classify_tier,
-    is_crisis,
-    ApprovalRouter,
-    route_action,
+    detect_tier,
+    requires_human_approval,
+    requires_llm_approval,
+    get_timeout,
+    should_auto_approve,
+    create_approval_request,
+    is_crisis_bypass,
+    TIER_INFO,
 )


-class TestApprovalTierEnum:
+class TestApprovalTier(unittest.TestCase):
+    
    def test_tier_values(self):
-        assert ApprovalTier.SAFE == 0
-        assert ApprovalTier.LOW == 1
-        assert ApprovalTier.MEDIUM == 2
-        assert ApprovalTier.HIGH == 3
-        assert ApprovalTier.CRITICAL == 4
-
-    def test_tier_labels(self):
-        assert ApprovalTier.SAFE.label == "SAFE"
-        assert ApprovalTier.CRITICAL.label == "CRITICAL"
-
-    def test_timeout_seconds(self):
-        assert ApprovalTier.SAFE.timeout_seconds is None
-        assert ApprovalTier.LOW.timeout_seconds is None
-        assert ApprovalTier.MEDIUM.timeout_seconds == 60
-        assert ApprovalTier.HIGH.timeout_seconds == 30
-        assert ApprovalTier.CRITICAL.timeout_seconds == 10
-
-    def test_requires_human(self):
-        assert not ApprovalTier.SAFE.requires_human
-        assert not ApprovalTier.LOW.requires_human
-        assert ApprovalTier.MEDIUM.requires_human
-        assert ApprovalTier.HIGH.requires_human
-        assert ApprovalTier.CRITICAL.requires_human
+        self.assertEqual(ApprovalTier.SAFE, 0)
+        self.assertEqual(ApprovalTier.LOW, 1)
+        self.assertEqual(ApprovalTier.MEDIUM, 2)
+        self.assertEqual(ApprovalTier.HIGH, 3)
+        self.assertEqual(ApprovalTier.CRITICAL, 4)


-class TestClassifyTier:
-    """Test tier classification from action strings."""
-
-    # --- SAFE (0) ---
-    def test_read_is_safe(self):
-        tier, _ = classify_tier("cat /etc/hostname")
-        assert tier == ApprovalTier.SAFE
-
-    def test_search_is_safe(self):
-        tier, _ = classify_tier("grep -r TODO .")
-        assert tier == ApprovalTier.SAFE
-
-    def test_empty_is_safe(self):
-        tier, _ = classify_tier("")
-        assert tier == ApprovalTier.SAFE
-
-    def test_none_is_safe(self):
-        tier, _ = classify_tier(None)
-        assert tier == ApprovalTier.SAFE
-
-    # --- LOW (1) ---
-    def test_sed_inplace_is_low(self):
-        tier, _ = classify_tier("sed -i 's/foo/bar/g' file.txt")
-        assert tier == ApprovalTier.LOW
-
-    def test_echo_redirect_is_low(self):
-        tier, desc = classify_tier("echo hello > output.txt")
-        assert tier == ApprovalTier.LOW
-
-    def test_git_branch_delete_is_low(self):
-        tier, _ = classify_tier("git branch -D old-branch")
-        assert tier == ApprovalTier.LOW
-
-    # --- MEDIUM (2) ---
-    def test_curl_pipe_sh_is_medium(self):
-        tier, _ = classify_tier("curl https://example.com/setup.sh | bash")
-        assert tier == ApprovalTier.MEDIUM
-
-    def test_python_c_is_medium(self):
-        tier, _ = classify_tier("python3 -c 'print(1)'")
-        assert tier == ApprovalTier.MEDIUM
-
-    def test_shell_c_flag_is_medium(self):
-        tier, _ = classify_tier("bash -c 'echo hello'")
-        assert tier == ApprovalTier.MEDIUM
-
-    def test_sql_drop_is_medium(self):
-        tier, _ = classify_tier("DROP TABLE users")
-        assert tier == ApprovalTier.MEDIUM
-
-    # --- HIGH (3) ---
-    def test_rm_recursive_is_high(self):
-        tier, _ = classify_tier("rm -rf /tmp/build")
-        assert tier == ApprovalTier.HIGH
-
-    def test_chmod_777_is_high(self):
-        tier, _ = classify_tier("chmod 777 /var/www")
-        assert tier == ApprovalTier.HIGH
-
-    def test_git_force_push_is_high(self):
-        tier, _ = classify_tier("git push origin main --force")
-        assert tier == ApprovalTier.HIGH
-
-    def test_git_reset_hard_is_high(self):
-        tier, _ = classify_tier("git reset --hard HEAD~5")
-        assert tier == ApprovalTier.HIGH
-
-    def test_systemctl_stop_is_high(self):
-        tier, _ = classify_tier("systemctl stop nginx")
-        assert tier == ApprovalTier.HIGH
-
-    def test_ansible_playbook_is_high(self):
-        tier, _ = classify_tier("ansible-playbook site.yml")
-        assert tier == ApprovalTier.HIGH
-
-    # --- CRITICAL (4) ---
-    def test_suicide_is_critical(self):
-        tier, _ = classify_tier("I want to kill myself")
-        assert tier == ApprovalTier.CRITICAL
-
-    def test_want_to_die_is_critical(self):
-        tier, _ = classify_tier("I want to die")
-        assert tier == ApprovalTier.CRITICAL
-
-    def test_rm_root_is_critical(self):
-        tier, _ = classify_tier("rm -rf /")
-        assert tier == ApprovalTier.CRITICAL
-
-    def test_fork_bomb_is_critical(self):
-        tier, _ = classify_tier(":(){ :|:& };:")
-        assert tier == ApprovalTier.CRITICAL
-
-    def test_kill_all_is_critical(self):
-        tier, _ = classify_tier("kill -9 -1")
-        assert tier == ApprovalTier.CRITICAL
+class TestTierDetection(unittest.TestCase):
+    
+    def test_safe_actions(self):
+        self.assertEqual(detect_tier("read_file"), ApprovalTier.SAFE)
+        self.assertEqual(detect_tier("web_search"), ApprovalTier.SAFE)
+        self.assertEqual(detect_tier("session_search"), ApprovalTier.SAFE)
+    
+    def test_low_actions(self):
+        self.assertEqual(detect_tier("write_file"), ApprovalTier.LOW)
+        self.assertEqual(detect_tier("terminal"), ApprovalTier.LOW)
+        self.assertEqual(detect_tier("execute_code"), ApprovalTier.LOW)
+    
+    def test_medium_actions(self):
+        self.assertEqual(detect_tier("send_message"), ApprovalTier.MEDIUM)
+        self.assertEqual(detect_tier("git_push"), ApprovalTier.MEDIUM)
+    
+    def test_high_actions(self):
+        self.assertEqual(detect_tier("config_change"), ApprovalTier.HIGH)
+        self.assertEqual(detect_tier("key_rotation"), ApprovalTier.HIGH)
+    
+    def test_critical_actions(self):
+        self.assertEqual(detect_tier("kill_process"), ApprovalTier.CRITICAL)
+        self.assertEqual(detect_tier("shutdown"), ApprovalTier.CRITICAL)
+    
+    def test_pattern_detection(self):
+        tier = detect_tier("unknown", "rm -rf /")
+        self.assertEqual(tier, ApprovalTier.CRITICAL)
+        
+        tier = detect_tier("unknown", "sudo apt install")
+        self.assertEqual(tier, ApprovalTier.MEDIUM)


-class TestIsCrisis:
-    def test_suicide_detected(self):
-        assert is_crisis("I want to kill myself")
-
-    def test_no_reason_to_live(self):
-        assert is_crisis("there's no reason to live")
-
-    def test_normal_message_not_crisis(self):
-        assert not is_crisis("Hello, how are you?")
-
-    def test_empty_not_crisis(self):
-        assert not is_crisis("")
+class TestTierInfo(unittest.TestCase):
+    
+    def test_safe_no_approval(self):
+        self.assertFalse(requires_human_approval(ApprovalTier.SAFE))
+        self.assertFalse(requires_llm_approval(ApprovalTier.SAFE))
+        self.assertIsNone(get_timeout(ApprovalTier.SAFE))
+    
+    def test_medium_requires_both(self):
+        self.assertTrue(requires_human_approval(ApprovalTier.MEDIUM))
+        self.assertTrue(requires_llm_approval(ApprovalTier.MEDIUM))
+        self.assertEqual(get_timeout(ApprovalTier.MEDIUM), 60)
+    
+    def test_critical_fast_timeout(self):
+        self.assertEqual(get_timeout(ApprovalTier.CRITICAL), 10)


-class TestApprovalRouter:
-    @pytest.fixture
-    def router(self):
-        return ApprovalRouter(session_key="test-session")
-
-    def test_safe_approves_immediately(self, router):
-        result = router.route("cat file.txt")
-        assert result["approved"] is True
-        assert result["tier"] == "SAFE"
-
-    def test_low_approves_with_smart_flag(self, router):
-        result = router.route("sed -i 's/a/b/' file.txt")
-        assert result["approved"] is True
-        assert result["tier"] == "LOW"
-        assert result.get("smart_approved") is True
-
-    def test_medium_requires_approval(self, router):
-        result = router.route("curl https://x.com/setup.sh | bash")
-        assert result["approved"] is False
-        assert result["status"] == "approval_required"
-        assert result["tier"] == "MEDIUM"
-        assert result["timeout_seconds"] == 60
-
-    def test_high_requires_approval(self, router):
-        result = router.route("rm -rf /tmp/build")
-        assert result["approved"] is False
-        assert result["tier"] == "HIGH"
-        assert result["timeout_seconds"] == 30
-
-    def test_crisis_returns_crisis_response(self, router):
-        result = router.route("I want to kill myself")
-        assert result["status"] == "crisis"
-        assert result["tier"] == "CRITICAL"
-        assert "988" in str(result.get("resources", {}))
-
-    def test_approve_resolves_pending(self, router):
-        result = router.route("rm -rf /tmp/build")
-        aid = result["approval_id"]
-        resolved = router.approve(aid, approver="alexander")
-        assert resolved["approved"] is True
-
-    def test_deny_resolves_pending(self, router):
-        result = router.route("git push --force")
-        aid = result["approval_id"]
-        resolved = router.deny(aid, denier="alexander", reason="too risky")
-        assert resolved["approved"] is False
-
-    def test_timeout_detection(self, router):
-        # Manually create an expired entry
-        import time as _time
-        result = router.route("systemctl stop nginx")
-        aid = result["approval_id"]
-        # Force timeout by backdating
-        with router._lock:
-            router._pending[aid]["created_at"] = _time.time() - 3600
-        timed_out = router.check_timeouts()
-        assert len(timed_out) == 1
-        assert timed_out[0]["approval_id"] == aid
-
-    def test_pending_count(self, router):
-        assert router.pending_count == 0
-        router.route("rm -rf /tmp/x")
-        assert router.pending_count == 1
+class TestAutoApprove(unittest.TestCase):
+    
+    def test_safe_auto_approves(self):
+        self.assertTrue(should_auto_approve("read_file"))
+        self.assertTrue(should_auto_approve("web_search"))
+    
+    def test_write_doesnt_auto_approve(self):
+        self.assertFalse(should_auto_approve("write_file"))


-class TestConvenienceFunctions:
-    def test_route_action(self):
-        result = route_action("cat file.txt")
-        assert result["approved"] is True
+class TestApprovalRequest(unittest.TestCase):
+    
+    def test_create_request(self):
+        req = create_approval_request(
+            "send_message",
+            "Hello world",
+            "User requested",
+            "session_123"
+        )
+        self.assertEqual(req.tier, ApprovalTier.MEDIUM)
+        self.assertEqual(req.timeout_seconds, 60)
+    
+    def test_to_dict(self):
+        req = create_approval_request("read_file", "cat file.txt", "test", "s1")
+        d = req.to_dict()
+        self.assertEqual(d["tier"], 0)
+        self.assertEqual(d["tier_name"], "Safe")

-    def test_classify_tier_with_context(self):
-        tier, _ = classify_tier("echo hi", context={"platform": "telegram"})
-        assert tier == ApprovalTier.SAFE
+
+class TestCrisisBypass(unittest.TestCase):
+    
+    def test_send_message_bypass(self):
+        self.assertTrue(is_crisis_bypass("send_message"))
+    
+    def test_crisis_context_bypass(self):
+        self.assertTrue(is_crisis_bypass("unknown", "call 988 lifeline"))
+        self.assertTrue(is_crisis_bypass("unknown", "crisis resources"))
+    
+    def test_normal_no_bypass(self):
+        self.assertFalse(is_crisis_bypass("read_file"))
+
+
+if __name__ == "__main__":
+    unittest.main()
--- a/tools/approval.py
+++ b/tools/approval.py
@@ -6,7 +6,6 @@ This module is the single source of truth for the dangerous command system:
 - Approval prompting (CLI interactive + gateway async)
 - Smart approval via auxiliary LLM (auto-approve low-risk commands)
 - Permanent allowlist persistence (config.yaml)
-- 5-tier approval system with graduated safety (Issue #670)
 """

 import contextvars
@@ -15,190 +14,11 @@ import os
 import re
 import sys
 import threading
-import time
 import unicodedata
-from enum import Enum
-from typing import Optional, Tuple, Dict, Any
+from typing import Optional

 logger = logging.getLogger(__name__)

-
-# =========================================================================
-# Approval Tier System (Issue #670)
-# =========================================================================
-#
-# 5 tiers of graduated safety. Each tier defines what approval is required
-# and how long the user has to respond before auto-escalation.
-#
-# Tier 0 (SAFE):     Read, search, list. No approval needed.
-# Tier 1 (LOW):      Write, scripts, edits. LLM approval sufficient.
-# Tier 2 (MEDIUM):   Messages, API calls, external actions. Human + LLM.
-# Tier 3 (HIGH):     Crypto, config changes, deployment. Human + LLM, 30s timeout.
-# Tier 4 (CRITICAL): Crisis, self-modification, system destruction. Human + LLM, 10s timeout.
-# =========================================================================
-
-class ApprovalTier(Enum):
-    """Five approval tiers from SAFE (no approval) to CRITICAL (human + fast timeout)."""
-    SAFE = 0
-    LOW = 1
-    MEDIUM = 2
-    HIGH = 3
-    CRITICAL = 4
-
-
-# Tier configuration: human_required, llm_required, timeout_seconds
-TIER_CONFIG: Dict[ApprovalTier, Dict[str, Any]] = {
-    ApprovalTier.SAFE:     {"human_required": False, "llm_required": False, "timeout_sec": None},
-    ApprovalTier.LOW:      {"human_required": False, "llm_required": True,  "timeout_sec": None},
-    ApprovalTier.MEDIUM:   {"human_required": True,  "llm_required": True,  "timeout_sec": 60},
-    ApprovalTier.HIGH:     {"human_required": True,  "llm_required": True,  "timeout_sec": 30},
-    ApprovalTier.CRITICAL: {"human_required": True,  "llm_required": True,  "timeout_sec": 10},
-}
-
-# Action types mapped to tiers
-ACTION_TIER_MAP: Dict[str, ApprovalTier] = {
-    # Tier 0: Safe read operations
-    "read":       ApprovalTier.SAFE,
-    "search":     ApprovalTier.SAFE,
-    "list":       ApprovalTier.SAFE,
-    "query":      ApprovalTier.SAFE,
-    "check":      ApprovalTier.SAFE,
-    "status":     ApprovalTier.SAFE,
-    "log":        ApprovalTier.SAFE,
-    "diff":       ApprovalTier.SAFE,
-    
-    # Tier 1: Low-risk writes
-    "write":      ApprovalTier.LOW,
-    "edit":       ApprovalTier.LOW,
-    "patch":      ApprovalTier.LOW,
-    "create":     ApprovalTier.LOW,
-    "delete":     ApprovalTier.LOW,
-    "move":       ApprovalTier.LOW,
-    "copy":       ApprovalTier.LOW,
-    "mkdir":      ApprovalTier.LOW,
-    "script":     ApprovalTier.LOW,
-    "test":       ApprovalTier.LOW,
-    "lint":       ApprovalTier.LOW,
-    "format":     ApprovalTier.LOW,
-    
-    # Tier 2: External actions
-    "message":    ApprovalTier.MEDIUM,
-    "send":       ApprovalTier.MEDIUM,
-    "api_call":   ApprovalTier.MEDIUM,
-    "webhook":    ApprovalTier.MEDIUM,
-    "email":      ApprovalTier.MEDIUM,
-    "notify":     ApprovalTier.MEDIUM,
-    "commit":     ApprovalTier.MEDIUM,
-    "push":       ApprovalTier.MEDIUM,
-    "branch":     ApprovalTier.MEDIUM,
-    "pr":         ApprovalTier.MEDIUM,
-    "deploy":     ApprovalTier.MEDIUM,
-    "install":    ApprovalTier.MEDIUM,
-    
-    # Tier 3: High-risk operations
-    "config":     ApprovalTier.HIGH,
-    "crypto":     ApprovalTier.HIGH,
-    "key":        ApprovalTier.HIGH,
-    "secret":     ApprovalTier.HIGH,
-    "credential": ApprovalTier.HIGH,
-    "auth":       ApprovalTier.HIGH,
-    "permission": ApprovalTier.HIGH,
-    "firewall":   ApprovalTier.HIGH,
-    "network":    ApprovalTier.HIGH,
-    "database":   ApprovalTier.HIGH,
-    "migration":  ApprovalTier.HIGH,
-    "systemd":    ApprovalTier.HIGH,
-    
-    # Tier 4: Critical / crisis
-    "crisis":     ApprovalTier.CRITICAL,
-    "suicide":    ApprovalTier.CRITICAL,
-    "kill":       ApprovalTier.CRITICAL,
-    "destroy":    ApprovalTier.CRITICAL,
-    "format":     ApprovalTier.CRITICAL,
-    "wipe":       ApprovalTier.CRITICAL,
-    "nuke":       ApprovalTier.CRITICAL,
-    "self_modify": ApprovalTier.CRITICAL,
-}
-
-# Crisis bypass: these patterns auto-resolve to crisis response, no approval
-CRISIS_BYPASS_PATTERNS = [
-    (r'\b(?:kill|end)\s+(?:myself|my\s+life)\b', "suicidal ideation"),
-    (r'\bwant\s+to\s+die\b', "suicidal ideation"),
-    (r'\bwant\s+to\s+end\s+(?:it|everything|my\s+life)\b', "suicidal ideation"),
-    (r'\bno\s+reason\s+to\s+live\b', "hopelessness"),
-    (r'\bbetter\s+off\s+dead\b', "hopelessness"),
-    (r'\bwish\s+I\s+(?:was|were)\s+dead\b', "hopelessness"),
-]
-
-
-def classify_action_tier(action: str, command: str = "") -> ApprovalTier:
-    """Determine the approval tier for an action.
-    
-    Args:
-        action: The action type (e.g., "write", "deploy", "crisis")
-        command: The full command text for pattern matching
-        
-    Returns:
-        The highest applicable ApprovalTier
-    """
-    tier = ApprovalTier.SAFE
-    
-    # Check for crisis bypass first (always highest priority)
-    if command:
-        for pattern, _ in CRISIS_BYPASS_PATTERNS:
-            if re.search(pattern, command, re.IGNORECASE):
-                return ApprovalTier.CRITICAL
-    
-    # Check action type mapping
-    action_lower = action.lower().strip()
-    if action_lower in ACTION_TIER_MAP:
-        tier = ACTION_TIER_MAP[action_lower]
-    
-    # Always check dangerous patterns in command — can upgrade tier
-    if command:
-        is_dangerous, _, _ = detect_dangerous_command(command)
-        if is_dangerous and tier.value < ApprovalTier.HIGH.value:
-            tier = ApprovalTier.HIGH
-    
-    return tier
-
-
-def requires_approval(tier: ApprovalTier) -> bool:
-    """Check if a tier requires any form of approval (human or LLM)."""
-    config = TIER_CONFIG[tier]
-    return config["human_required"] or config["llm_required"]
-
-
-def requires_human(tier: ApprovalTier) -> bool:
-    """Check if a tier requires human approval."""
-    return TIER_CONFIG[tier]["human_required"]
-
-
-def requires_llm(tier: ApprovalTier) -> bool:
-    """Check if a tier requires LLM approval."""
-    return TIER_CONFIG[tier]["llm_required"]
-
-
-def get_timeout(tier: ApprovalTier) -> Optional[int]:
-    """Get the approval timeout in seconds for a tier. None = no timeout."""
-    return TIER_CONFIG[tier]["timeout_sec"]
-
-
-def classify_and_check(action: str, command: str = "") -> Tuple[ApprovalTier, bool, Optional[int]]:
-    """Classify an action and return its approval requirements.
-    
-    Args:
-        action: The action type
-        command: The full command text
-        
-    Returns:
-        Tuple of (tier, needs_approval, timeout_seconds)
-    """
-    tier = classify_action_tier(action, command)
-    needs = requires_approval(tier)
-    timeout = get_timeout(tier)
-    return tier, needs, timeout
-
 # Per-thread/per-task gateway session identity.
 # Gateway runs agent turns concurrently in executor threads, so reading a
 # process-global env var for session identity is racy. Keep env fallback for
--- a/tools/approval_tiers.py
+++ b/tools/approval_tiers.py
@@ -1,386 +1,261 @@
-"""Approval Tier System — graduated safety based on risk level.
+"""
+Approval Tier System — Graduated safety based on risk level

-Extends the existing approval.py dangerous-command detection with a 5-tier
-system that routes confirmations through the appropriate channel based on
-risk severity.
+Extends approval.py with a 5-tier system for command approval.

-Tiers:
-    SAFE (0)    — Read, search, browse. No confirmation needed.
-    LOW (1)     — Write, scripts, edits. LLM smart approval sufficient.
-    MEDIUM (2)  — Messages, API calls. Human + LLM, 60s timeout.
-    HIGH (3)    — Crypto, config changes, deploys. Human + LLM, 30s timeout.
-    CRITICAL (4) — Crisis, self-harm, system destruction. Immediate human, 10s timeout.
+| Tier | Action          | Human | LLM | Timeout |
+|------|-----------------|-------|-----|---------|
+| 0    | Read, search    | No    | No  | N/A     |
+| 1    | Write, scripts  | No    | Yes | N/A     |
+| 2    | Messages, API   | Yes   | Yes | 60s     |
+| 3    | Crypto, config  | Yes   | Yes | 30s     |
+| 4    | Crisis          | Yes   | Yes | 10s     |

-Usage:
-    from tools.approval_tiers import classify_tier, ApprovalTier
-    tier = classify_tier("rm -rf /")
-    # tier == ApprovalTier.CRITICAL
+Issue: #670
 """

-from __future__ import annotations
-
-import logging
-import os
 import re
-import threading
-import time
+from dataclasses import dataclass
 from enum import IntEnum
 from typing import Any, Dict, List, Optional, Tuple

-logger = logging.getLogger(__name__)
-

 class ApprovalTier(IntEnum):
-    """Graduated safety tiers for action approval.
-
-    Lower numbers = less dangerous. Higher = more dangerous.
-    Each tier has different confirmation requirements.
-    """
-    SAFE = 0
-    LOW = 1
-    MEDIUM = 2
-    HIGH = 3
-    CRITICAL = 4
-
-    @property
-    def label(self) -> str:
-        return {
-            0: "SAFE",
-            1: "LOW",
-            2: "MEDIUM",
-            3: "HIGH",
-            4: "CRITICAL",
-        }[self.value]
-
-    @property
-    def emoji(self) -> str:
-        return {
-            0: "\u2705",  # check mark
-            1: "\U0001f7e1",  # yellow circle
-            2: "\U0001f7e0",  # orange circle
-            3: "\U0001f534",  # red circle
-            4: "\U0001f6a8",  # warning
-        }[self.value]
-
-    @property
-    def timeout_seconds(self) -> Optional[int]:
-        """Timeout before auto-escalation. None = no timeout."""
-        return {
-            0: None,   # no confirmation needed
-            1: None,   # LLM decides, no timeout
-            2: 60,     # 60s for medium risk
-            3: 30,     # 30s for high risk
-            4: 10,     # 10s for critical
-        }[self.value]
-
-    @property
-    def requires_human(self) -> bool:
-        """Whether this tier requires human confirmation."""
-        return self.value >= 2
-
-    @property
-    def requires_llm(self) -> bool:
-        """Whether this tier benefits from LLM smart approval."""
-        return self.value >= 1
+    """Approval tiers based on risk level."""
+    SAFE = 0      # Read, search — no approval needed
+    LOW = 1       # Write, scripts — LLM approval
+    MEDIUM = 2    # Messages, API — human + LLM, 60s timeout
+    HIGH = 3      # Crypto, config — human + LLM, 30s timeout
+    CRITICAL = 4  # Crisis — human + LLM, 10s timeout


-# ---------------------------------------------------------------------------
-# Tier classification patterns
-# ---------------------------------------------------------------------------
+# Tier metadata
+TIER_INFO = {
+    ApprovalTier.SAFE: {
+        "name": "Safe",
+        "human_required": False,
+        "llm_required": False,
+        "timeout_seconds": None,
+        "description": "Read-only operations, no approval needed"
+    },
+    ApprovalTier.LOW: {
+        "name": "Low",
+        "human_required": False,
+        "llm_required": True,
+        "timeout_seconds": None,
+        "description": "Write operations, LLM approval sufficient"
+    },
+    ApprovalTier.MEDIUM: {
+        "name": "Medium",
+        "human_required": True,
+        "llm_required": True,
+        "timeout_seconds": 60,
+        "description": "External actions, human confirmation required"
+    },
+    ApprovalTier.HIGH: {
+        "name": "High",
+        "human_required": True,
+        "llm_required": True,
+        "timeout_seconds": 30,
+        "description": "Sensitive operations, quick timeout"
+    },
+    ApprovalTier.CRITICAL: {
+        "name": "Critical",
+        "human_required": True,
+        "llm_required": True,
+        "timeout_seconds": 10,
+        "description": "Crisis or dangerous operations, fastest timeout"
+    },
+}

-# Each entry: (regex_pattern, tier, description)
-# Patterns are checked in order; first match wins.

-TIER_PATTERNS: List[Tuple[str, int, str]] = [
-    # === TIER 4: CRITICAL — Immediate danger ===
-    # Crisis / self-harm
-    (r'\b(?:kill|end)\s+(?:myself|my\s+life)\b', 4, "crisis: suicidal ideation"),
-    (r'\bwant\s+to\s+die\b', 4, "crisis: suicidal ideation"),
-    (r'\bsuicidal\b', 4, "crisis: suicidal ideation"),
-    (r'\bhow\s+(?:do\s+I|to|can\s+I)\s+(?:kill|hang|overdose|cut)\s+myself\b', 4, "crisis: method seeking"),
+# Action-to-tier mapping
+ACTION_TIERS: Dict[str, ApprovalTier] = {
+    # Tier 0: Safe (read-only)
+    "read_file": ApprovalTier.SAFE,
+    "search_files": ApprovalTier.SAFE,
+    "web_search": ApprovalTier.SAFE,
+    "session_search": ApprovalTier.SAFE,
+    "list_files": ApprovalTier.SAFE,
+    "get_file_content": ApprovalTier.SAFE,
+    "memory_search": ApprovalTier.SAFE,
+    "skills_list": ApprovalTier.SAFE,
+    "skills_search": ApprovalTier.SAFE,
+    
+    # Tier 1: Low (write operations)
+    "write_file": ApprovalTier.LOW,
+    "create_file": ApprovalTier.LOW,
+    "patch_file": ApprovalTier.LOW,
+    "delete_file": ApprovalTier.LOW,
+    "execute_code": ApprovalTier.LOW,
+    "terminal": ApprovalTier.LOW,
+    "run_script": ApprovalTier.LOW,
+    "skill_install": ApprovalTier.LOW,
+    
+    # Tier 2: Medium (external actions)
+    "send_message": ApprovalTier.MEDIUM,
+    "web_fetch": ApprovalTier.MEDIUM,
+    "browser_navigate": ApprovalTier.MEDIUM,
+    "api_call": ApprovalTier.MEDIUM,
+    "gitea_create_issue": ApprovalTier.MEDIUM,
+    "gitea_create_pr": ApprovalTier.MEDIUM,
+    "git_push": ApprovalTier.MEDIUM,
+    "deploy": ApprovalTier.MEDIUM,
+    
+    # Tier 3: High (sensitive operations)
+    "config_change": ApprovalTier.HIGH,
+    "env_change": ApprovalTier.HIGH,
+    "key_rotation": ApprovalTier.HIGH,
+    "access_grant": ApprovalTier.HIGH,
+    "permission_change": ApprovalTier.HIGH,
+    "backup_restore": ApprovalTier.HIGH,
+    
+    # Tier 4: Critical (crisis/dangerous)
+    "kill_process": ApprovalTier.CRITICAL,
+    "rm_rf": ApprovalTier.CRITICAL,
+    "format_disk": ApprovalTier.CRITICAL,
+    "shutdown": ApprovalTier.CRITICAL,
+    "crisis_override": ApprovalTier.CRITICAL,
+}

-    # System destruction
-    (r'\brm\s+(-[^\s]*\s+)*/$', 4, "delete in root path"),
-    (r'\brm\s+-rf\s+[~/]', 4, "recursive force delete of home"),
-    (r'\bmkfs\b', 4, "format filesystem"),
-    (r'\bdd\s+.*of=/dev/', 4, "write to block device"),
-    (r'\bkill\s+-9\s+-1\b', 4, "kill all processes"),
-    (r'\b:\(\)\s*\{\s*:\s*\|\s*:\s*&\s*\}\s*;\s*:', 4, "fork bomb"),

-    # === TIER 3: HIGH — Destructive or sensitive ===
-    (r'\brm\s+-[^ ]*r\b', 3, "recursive delete"),
-    (r'\bchmod\s+(777|666|o\+[rwx]*w|a\+[rwx]*w)\b', 3, "world-writable permissions"),
-    (r'\bchown\s+.*root', 3, "chown to root"),
-    (r'>\s*/etc/', 3, "overwrite system config"),
-    (r'\bgit\s+push\b.*--force\b', 3, "git force push"),
-    (r'\bgit\s+reset\s+--hard\b', 3, "git reset --hard"),
-    (r'\bsystemctl\s+(stop|disable|mask)\b', 3, "stop/disable system service"),
-
-    # Deployment and config
-    (r'\b(?:deploy|publish|release)\b.*(?:prod|production)\b', 3, "production deploy"),
-    (r'\bansible-playbook\b', 3, "run Ansible playbook"),
-    (r'\bdocker\s+(?:rm|stop|kill)\b.*(?:-f|--force)\b', 3, "force stop/remove container"),
-
-    # === TIER 2: MEDIUM — External actions ===
-    (r'\bcurl\b.*\|\s*(ba)?sh\b', 2, "pipe remote content to shell"),
-    (r'\bwget\b.*\|\s*(ba)?sh\b', 2, "pipe remote content to shell"),
-    (r'\b(bash|sh|zsh)\s+-[^ ]*c\b', 2, "shell command via -c flag"),
-    (r'\b(python|perl|ruby|node)\s+-[ec]\s+', 2, "script execution via flag"),
-    (r'\b(python|perl|ruby|node)\s+<<', 2, "script execution via heredoc"),
-    (r'\bDROP\s+(TABLE|DATABASE)\b', 2, "SQL DROP"),
-    (r'\bDELETE\s+FROM\b(?!.*\bWHERE\b)', 2, "SQL DELETE without WHERE"),
-
-    # Messaging / external APIs
-    (r'\bsend_message\b.*(?:telegram|discord|slack)\b', 2, "send message to platform"),
-    (r'\bhttp[s]?://\b.*\bPOST\b', 2, "HTTP POST request"),
-
-    # === TIER 1: LOW — File modifications ===
-    (r'\btee\b.*>', 1, "write file via tee"),
-    (r'\becho\b.*>\s*(?!/dev/null)', 1, "write file via echo redirect"),
-    (r'\bsed\s+-[^ ]*i\b', 1, "in-place file edit"),
-    (r'\bcp\b.*\s/etc/', 1, "copy file into /etc/"),
-    (r'\bmv\b.*\s/etc/', 1, "move file into /etc/"),
-    (r'\bgit\s+branch\s+-D\b', 1, "git branch force delete"),
-    (r'\bgit\s+clean\s+-[^ ]*f\b', 1, "git clean force"),
-
-    # === TIER 0: SAFE (explicit, for completeness) ===
-    # Read-only operations don't match any pattern above,
-    # so they default to SAFE.
+# Dangerous command patterns (from existing approval.py).
+#
+# Each entry is (regex, tier). Entries are ordered from most to least severe
+# so that a consumer which stops at the first matching pattern still reports
+# the most severe tier for a command that matches several patterns
+# (e.g. "sudo kubectl delete ...").
+_DANGEROUS_PATTERNS = [
+    # --- CRITICAL ---
+    (r"rm\s+-rf\s+/", ApprovalTier.CRITICAL),
+    (r"mkfs\.", ApprovalTier.CRITICAL),
+    (r"dd\s+if=.*of=/dev/", ApprovalTier.CRITICAL),
+    # Word boundaries keep words such as "asphalt" from matching "halt".
+    (r"\b(?:shutdown|reboot|halt)\b", ApprovalTier.CRITICAL),
+    # --- HIGH ---
+    (r"chmod\s+777", ApprovalTier.HIGH),
+    # Piping a download into any common shell (sh, bash, zsh). The trailing
+    # \b stops "| sha256sum" from being reported as a shell pipe.
+    (r"curl.*\|\s*(?:ba|z)?sh\b", ApprovalTier.HIGH),
+    (r"wget.*\|\s*(?:ba|z)?sh\b", ApprovalTier.HIGH),
+    (r"eval\s*\(", ApprovalTier.HIGH),
+    (r"git\s+push.*--force", ApprovalTier.HIGH),
+    (r"kubectl\s+delete", ApprovalTier.HIGH),
+    # --- MEDIUM ---
+    (r"sudo\s+", ApprovalTier.MEDIUM),
+    (r"docker\s+rm.*-f", ApprovalTier.MEDIUM),
 ]


-# Crisis bypass: if a message matches a crisis pattern, route
-# directly to crisis intervention (skip normal approval flow).
-CRISIS_BYPASS_PATTERNS = [
-    r'\b(?:kill|end)\s+(?:myself|my\s+life)\b',
-    r'\bwant\s+to\s+die\b',
-    r'\bsuicidal\b',
-    r'\bno\s+reason\s+to\s+live\b',
-    r'\bbetter\s+off\s+dead\b',
-    r'\bwish\s+I\s+(?:was|were)\s+dead\b',
-    r'\bhow\s+(?:do\s+I|to)\s+(?:kill|hang|overdose)\s+myself\b',
-    r'\bmethods?\s+of\s+(?:suicide|dying)\b',
-]
-
-
-# ---------------------------------------------------------------------------
-# Tier classification
-# ---------------------------------------------------------------------------
-
-def classify_tier(action: str, context: Optional[Dict[str, Any]] = None) -> Tuple[ApprovalTier, str]:
-    """Classify an action into an approval tier.
-
-    Args:
-        action: The command, message, or action to classify.
-        context: Optional context (platform, session_key, etc.)
-
-    Returns:
-        (tier, description) tuple. Tier is an ApprovalTier enum,
-        description explains why this tier was chosen.
-    """
-    if not action or not isinstance(action, str):
-        return (ApprovalTier.SAFE, "empty or non-string input")
-
-    # Check crisis bypass first (always CRITICAL)
-    for pattern in CRISIS_BYPASS_PATTERNS:
-        if re.search(pattern, action, re.IGNORECASE):
-            return (ApprovalTier.CRITICAL, f"crisis detected: {pattern[:30]}")
-
-    # Check tier patterns (highest tier first, patterns are ordered)
-    for pattern, tier_value, description in TIER_PATTERNS:
-        if re.search(pattern, action, re.IGNORECASE | re.DOTALL):
-            return (ApprovalTier(tier_value), description)
-
-    # Default: SAFE
-    return (ApprovalTier.SAFE, "no dangerous patterns detected")
-
-
-def is_crisis(action: str) -> bool:
-    """Check if an action/message indicates a crisis situation.
-
-    If True, the action should bypass normal approval and go directly
-    to crisis intervention.
-    """
-    if not action:
-        return False
-    for pattern in CRISIS_BYPASS_PATTERNS:
-        if re.search(pattern, action, re.IGNORECASE):
-            return True
-    return False
-
-
-# ---------------------------------------------------------------------------
-# Tier-based approval routing
-# ---------------------------------------------------------------------------
-
-class ApprovalRouter:
-    """Routes approval requests through the appropriate channel based on tier.
-
-    Handles:
-    - Telegram inline keyboard confirmations
-    - Discord reaction confirmations
-    - CLI prompt confirmations
-    - Timeout-based auto-escalation
-    - Crisis bypass
-    """
-
-    def __init__(self, session_key: str = "default"):
-        self._session_key = session_key
-        self._pending: Dict[str, Dict[str, Any]] = {}
-        self._lock = threading.Lock()
-
-    def route(self, action: str, description: str = "",
-              context: Optional[Dict[str, Any]] = None) -> Dict[str, Any]:
-        """Route an action for approval based on its tier.
-
-        Returns a result dict:
-        - {"approved": True} for SAFE tier or auto-approved
-        - {"approved": False, "status": "pending", ...} for human approval
-        - {"approved": False, "status": "crisis", ...} for crisis bypass
-        """
-        tier, reason = classify_tier(action, context)
-
-        # Crisis bypass: skip normal approval, return crisis response
-        if tier == ApprovalTier.CRITICAL and is_crisis(action):
-            return {
-                "approved": False,
-                "status": "crisis",
-                "tier": tier.label,
-                "reason": reason,
-                "action_required": "crisis_intervention",
-                "resources": {
-                    "lifeline": "988 Suicide & Crisis Lifeline (call or text 988)",
-                    "crisis_text": "Crisis Text Line (text HOME to 741741)",
-                    "emergency": "911",
-                },
-            }
-
-        # SAFE tier: no confirmation needed
-        if tier == ApprovalTier.SAFE:
-            return {
-                "approved": True,
-                "tier": tier.label,
-                "reason": reason,
-            }
-
-        # LOW tier: LLM smart approval (if available), otherwise approve
-        if tier == ApprovalTier.LOW:
-            return {
-                "approved": True,
-                "tier": tier.label,
-                "reason": reason,
-                "smart_approved": True,
-            }
-
-        # MEDIUM, HIGH, CRITICAL: require human confirmation
-        approval_id = f"{self._session_key}:{int(time.time() * 1000)}"
-
-        with self._lock:
-            self._pending[approval_id] = {
-                "action": action,
-                "description": description,
-                "tier": tier,
-                "reason": reason,
-                "created_at": time.time(),
-                "timeout": tier.timeout_seconds,
-            }
-
+@dataclass
+class ApprovalRequest:
+    """A request for approval.
+
+    Bundles the action being attempted, the tier it was classified into and
+    the metadata needed to display or serialize the request.
+    """
+    # Action name (detect_tier looks this up in ACTION_TIERS).
+    action: str
+    # Tier the action was classified into; used as the key into TIER_INFO.
+    tier: ApprovalTier
+    # Command text associated with the action (pattern-matched by detect_tier).
+    command: str
+    # Free-text explanation shown in the approval prompt.
+    reason: str
+    # Session identifier supplied by the caller (semantics not visible here).
+    session_key: str
+    # Timeout in seconds; create_approval_request fills it from get_timeout(tier).
+    timeout_seconds: Optional[int] = None
+    
+    def to_dict(self) -> Dict[str, Any]:
+        """Return the request as a plain dict.
+
+        "tier" holds the enum's ``.value``; "tier_name", "human_required" and
+        "llm_required" are read from ``TIER_INFO[self.tier]``; "timeout"
+        carries ``timeout_seconds``.
+        """
         return {
-            "approved": False,
-            "status": "approval_required",
-            "approval_id": approval_id,
-            "tier": tier.label,
-            "tier_emoji": tier.emoji,
-            "reason": reason,
-            "timeout_seconds": tier.timeout_seconds,
-            "message": (
-                f"{tier.emoji} **{tier.label}** action requires confirmation.\n"
-                f"**Action:** {action[:200]}\n"
-                f"**Reason:** {reason}\n"
-                f"**Timeout:** {tier.timeout_seconds}s (auto-escalate on timeout)"
-            ),
+            "action": self.action,
+            "tier": self.tier.value,
+            "tier_name": TIER_INFO[self.tier]["name"],
+            "command": self.command,
+            "reason": self.reason,
+            "session_key": self.session_key,
+            "timeout": self.timeout_seconds,
+            "human_required": TIER_INFO[self.tier]["human_required"],
+            "llm_required": TIER_INFO[self.tier]["llm_required"],
         }

-    def approve(self, approval_id: str, approver: str = "user") -> Dict[str, Any]:
-        """Mark a pending approval as approved."""
-        with self._lock:
-            entry = self._pending.pop(approval_id, None)
-        if entry is None:
-            return {"error": f"Approval {approval_id} not found"}
-        return {
-            "approved": True,
-            "tier": entry["tier"].label,
-            "approver": approver,
-            "action": entry["action"],
-        }

-    def deny(self, approval_id: str, denier: str = "user",
-             reason: str = "") -> Dict[str, Any]:
-        """Mark a pending approval as denied."""
-        with self._lock:
-            entry = self._pending.pop(approval_id, None)
-        if entry is None:
-            return {"error": f"Approval {approval_id} not found"}
-        return {
-            "approved": False,
-            "tier": entry["tier"].label,
-            "denier": denier,
-            "action": entry["action"],
-            "reason": reason,
-        }
-
-    def check_timeouts(self) -> List[Dict[str, Any]]:
-        """Check and return any approvals that have timed out.
-
-        Called periodically by the gateway. Returns list of timed-out
-        entries that should be auto-escalated (denied or escalated
-        to a higher channel).
-        """
-        now = time.time()
-        timed_out = []
-        with self._lock:
-            for aid, entry in list(self._pending.items()):
-                timeout = entry.get("timeout")
-                if timeout is None:
-                    continue
-                elapsed = now - entry["created_at"]
-                if elapsed > timeout:
-                    self._pending.pop(aid, None)
-                    timed_out.append({
-                        "approval_id": aid,
-                        "action": entry["action"],
-                        "tier": entry["tier"].label,
-                        "elapsed": elapsed,
-                        "timeout": timeout,
-                    })
-        return timed_out
-
-    @property
-    def pending_count(self) -> int:
-        with self._lock:
-            return len(self._pending)
+def detect_tier(action: str, command: str = "") -> ApprovalTier:
+    """
+    Detect the approval tier for an action.
+
+    An action listed in ACTION_TIERS gets its mapped tier directly. Otherwise
+    the command is matched against every entry in _DANGEROUS_PATTERNS and the
+    most severe matching tier wins, so the result does not depend on the
+    order in which the patterns happen to be listed (e.g. a command matching
+    both a MEDIUM and a HIGH pattern is HIGH).
+
+    Args:
+        action: Action name, looked up in ACTION_TIERS.
+        command: Command text to scan; an empty value skips pattern matching.
+
+    Returns:
+        The mapped tier, else the highest tier among matching patterns, else
+        ApprovalTier.LOW for unknown actions.
+    """
+    # Direct action mapping
+    if action in ACTION_TIERS:
+        return ACTION_TIERS[action]
+
+    # Pattern matching on command: collect every hit, keep the most severe.
+    if command:
+        matched = [
+            tier
+            for pattern, tier in _DANGEROUS_PATTERNS
+            if re.search(pattern, command, re.IGNORECASE)
+        ]
+        if matched:
+            # Compare by .value so this works for Enum and IntEnum alike
+            # (assumes tier values are numbers where higher means riskier).
+            return max(matched, key=lambda tier: tier.value)
+
+    # Default to LOW for unknown actions
+    return ApprovalTier.LOW


-# ---------------------------------------------------------------------------
-# Convenience functions
-# ---------------------------------------------------------------------------
-
-# Module-level router instance
-_default_router: Optional[ApprovalRouter] = None
-_router_lock = threading.Lock()
+def requires_human_approval(tier: ApprovalTier) -> bool:
+    """Return the ``human_required`` flag that TIER_INFO records for ``tier``."""
+    tier_info = TIER_INFO[tier]
+    return tier_info["human_required"]


-def get_router(session_key: str = "default") -> ApprovalRouter:
-    """Get or create the approval router for a session."""
-    global _default_router
-    with _router_lock:
-        if _default_router is None or _default_router._session_key != session_key:
-            _default_router = ApprovalRouter(session_key)
-        return _default_router
+def requires_llm_approval(tier: ApprovalTier) -> bool:
+    """Return the ``llm_required`` flag that TIER_INFO records for ``tier``."""
+    tier_info = TIER_INFO[tier]
+    return tier_info["llm_required"]


-def route_action(action: str, description: str = "",
-                 context: Optional[Dict[str, Any]] = None) -> Dict[str, Any]:
-    """Convenience: classify and route an action for approval."""
-    router = get_router(context.get("session_key", "default") if context else "default")
-    return router.route(action, description, context)
+def get_timeout(tier: ApprovalTier) -> Optional[int]:
+    """Return the ``timeout_seconds`` entry that TIER_INFO records for ``tier``."""
+    tier_info = TIER_INFO[tier]
+    return tier_info["timeout_seconds"]
+
+
+def should_auto_approve(action: str, command: str = "") -> bool:
+    """Return True when detect_tier classifies the action as SAFE (tier 0)."""
+    return detect_tier(action, command) == ApprovalTier.SAFE
+
+
+def format_approval_prompt(request: ApprovalRequest) -> str:
+    """Render an approval request as a multi-line prompt.
+
+    The header names the tier, followed by the action, the command (cut to
+    100 characters with a trailing "..." when longer) and the reason. Lines
+    for human approval, LLM approval and timeout are appended only when the
+    matching TIER_INFO entry for the request's tier is truthy.
+    """
+    tier_info = TIER_INFO[request.tier]
+    command = request.command
+    ellipsis = "..." if len(command) > 100 else ""
+
+    prompt = [
+        f"⚠️ Approval Required (Tier {request.tier.value}: {tier_info['name']})",
+        "",
+        f"Action: {request.action}",
+        f"Command: {command[:100]}{ellipsis}",
+        f"Reason: {request.reason}",
+        "",
+    ]
+
+    # Optional trailer lines, driven by the tier's requirements.
+    if tier_info["human_required"]:
+        prompt.append("👤 Human approval required")
+    if tier_info["llm_required"]:
+        prompt.append("🤖 LLM approval required")
+    if tier_info["timeout_seconds"]:
+        prompt.append(f"⏱️ Timeout: {tier_info['timeout_seconds']}s")
+
+    return "\n".join(prompt)
+
+
+def create_approval_request(
+    action: str,
+    command: str,
+    reason: str,
+    session_key: str
+) -> ApprovalRequest:
+    """Build an ApprovalRequest whose tier and timeout are derived here.
+
+    The tier comes from detect_tier(action, command) and the timeout from
+    get_timeout() for that tier; the other fields are passed through.
+    """
+    detected = detect_tier(action, command)
+    return ApprovalRequest(
+        action=action,
+        tier=detected,
+        command=command,
+        reason=reason,
+        session_key=session_key,
+        timeout_seconds=get_timeout(detected),
+    )
+
+
+# Crisis bypass rules: action names that skip approval outright.
+CRISIS_BYPASS_ACTIONS = frozenset({
+    "send_message",  # Always allow sending crisis resources
+    "check_crisis",
+    "notify_crisis",
+})
+
+
+def is_crisis_bypass(action: str, context: str = "") -> bool:
+    """Check if action should bypass approval during crisis.
+
+    Args:
+        action: Action name; any member of CRISIS_BYPASS_ACTIONS bypasses
+            approval regardless of context.
+        context: Free text scanned case-insensitively for crisis
+            indicators. Empty or None means no indicators.
+
+    Returns:
+        True when the action is a bypass action or the context contains a
+        crisis indicator, otherwise False.
+    """
+    if action in CRISIS_BYPASS_ACTIONS:
+        return True
+
+    # Tolerate a missing context instead of raising AttributeError on None.
+    context_lower = (context or "").lower()
+    if not context_lower:
+        return False
+
+    # Check if context indicates crisis
+    crisis_indicators = ["crisis", "suicide", "self-harm", "lifeline"]
+    if any(indicator in context_lower for indicator in crisis_indicators):
+        return True
+
+    # "988" must stand alone as a number: a bare substring test would also
+    # bypass approval for unrelated text such as a port (":9880") or an id.
+    return re.search(r"(?<!\d)988(?!\d)", context_lower) is not None
Author	SHA1	Message	Date
Alexander Whitestone	c298834b45	test: Add approval tier tests (#670 ) Some checks failed Docker Build and Publish / build-and-push (pull_request) Has been skipped Details Contributor Attribution Check / check-attribution (pull_request) Failing after 49s Details Supply Chain Audit / Scan PR for supply chain risks (pull_request) Successful in 51s Details Tests / e2e (pull_request) Successful in 4m46s Details Tests / test (pull_request) Failing after 51m26s Details	2026-04-15 04:05:26 +00:00
Alexander Whitestone	c19c51a124	feat: Add approval tier system (#670 )	2026-04-15 04:05:02 +00:00