From 9bfe185a2e31bcc5743cf30cc195d7b35a14b565 Mon Sep 17 00:00:00 2001
From: teknium1 <teknium1@gmail.com>
Date: Tue, 3 Feb 2026 16:15:49 -0800
Subject: [PATCH] Implement interrupt handling for agent and CLI input, and add
 a persistent prompt line at bottom of CLI

- Enhanced the AIAgent class to support interrupt requests, allowing for graceful interruption of ongoing tasks and processing of new messages.
- Updated the HermesCLI to manage user input in a persistent manner, enabling real-time interruption of the agent's conversation.
- Introduced a mechanism in the GatewayRunner to handle incoming messages while an agent is running, allowing for immediate response to user commands.
- Improved overall user experience by providing feedback during interruptions and ensuring that pending messages are processed correctly.
---
 cli.py         | 200 ++++++++++++++++++++++++++++++++++++++++++-------
 gateway/run.py | 104 +++++++++++++++++++++++--
 run_agent.py   |  66 +++++++++++++++-
 3 files changed, 336 insertions(+), 34 deletions(-)

diff --git a/cli.py b/cli.py
index 9718ebea0..795c880be 100755
--- a/cli.py
+++ b/cli.py
@@ -33,6 +33,15 @@ from prompt_toolkit.history import FileHistory
 from prompt_toolkit.styles import Style as PTStyle
 from prompt_toolkit.formatted_text import HTML
 from prompt_toolkit.patch_stdout import patch_stdout
+from prompt_toolkit.application import Application, get_app
+from prompt_toolkit.buffer import Buffer
+from prompt_toolkit.layout import Layout, HSplit, Window, FormattedTextControl
+from prompt_toolkit.layout.processors import BeforeInput
+from prompt_toolkit.widgets import TextArea
+from prompt_toolkit.key_binding import KeyBindings
+import asyncio
+import threading
+import queue
 
 # Load environment variables first
 from dotenv import load_dotenv
@@ -1284,17 +1293,52 @@ class HermesCLI:
         print("─" * 60, flush=True)
         
         try:
-            # Run the conversation
-            result = self.agent.run_conversation(
-                user_message=message,
-                conversation_history=self.conversation_history[:-1],  # Exclude the message we just added
-            )
+            # Run the conversation with interrupt monitoring
+            result = None
+            
+            def run_agent():
+                nonlocal result
+                result = self.agent.run_conversation(
+                    user_message=message,
+                    conversation_history=self.conversation_history[:-1],  # Exclude the message we just added
+                )
+            
+            # Start agent in background thread
+            agent_thread = threading.Thread(target=run_agent)
+            agent_thread.start()
+            
+            # Monitor for new input in the pending queue while agent runs
+            interrupt_msg = None
+            while agent_thread.is_alive():
+                # Check if there's new input in the queue (from the persistent input area)
+                if hasattr(self, '_pending_input'):
+                    try:
+                        interrupt_msg = self._pending_input.get(timeout=0.1)
+                    except queue.Empty:
+                        continue  # Nothing typed yet; keep waiting on the agent
+                    if interrupt_msg:
+                        print(f"\n⚡ New message detected, interrupting...")
+                        self.agent.interrupt(interrupt_msg)
+                        break
+                else:
+                    # Fallback if no queue (shouldn't happen)
+                    agent_thread.join(0.1)
+            
+            agent_thread.join()  # Ensure agent thread completes
             
             # Update history with full conversation
-            self.conversation_history = result.get("messages", self.conversation_history)
+            self.conversation_history = result.get("messages", self.conversation_history) if result else self.conversation_history
             
             # Get the final response
-            response = result.get("final_response", "")
+            response = result.get("final_response", "") if result else ""
+            
+            # Handle interrupt. A message already taken off the queue is always
+            # processed next, even if the agent finished before noticing it.
+            was_interrupted = bool(result and result.get("interrupted"))
+            pending_message = (result.get("interrupt_message") if was_interrupted else None) or interrupt_msg
+            # Add the indicator only when the agent was actually cut short
+            if was_interrupted and response and pending_message:
+                response = response + "\n\n---\n_[Interrupted - processing new message]_"
             
             if response:
                 # Use simple print for compatibility with prompt_toolkit's patch_stdout
@@ -1307,6 +1351,11 @@ class HermesCLI:
                 print()
                 print("─" * 60)
             
+            # If we have a pending message from interrupt, process it immediately
+            if pending_message:
+                print(f"\n📨 Processing: '{pending_message[:50]}{'...' if len(pending_message) > 50 else ''}'")
+                return self.chat(pending_message)  # Recursive call to handle the new message
+            
             return response
             
         except Exception as e:
@@ -1345,22 +1394,101 @@ class HermesCLI:
             return None
     
     def run(self):
-        """Run the interactive CLI loop with fixed input at bottom."""
+        """Run the interactive CLI loop with persistent input at bottom."""
         self.show_banner()
-        
-        # These Rich prints work fine BEFORE patch_stdout
         self.console.print("[#FFF8DC]Welcome to Hermes Agent! Type your message or /help for commands.[/]")
         self.console.print()
         
-        # Use patch_stdout to ensure all output appears above the input prompt
-        with patch_stdout():
-            while True:
+        # State for async operation
+        self._agent_running = False
+        self._pending_input = queue.Queue()
+        self._should_exit = False
+        
+        # Create a persistent input area using prompt_toolkit Application
+        input_buffer = Buffer()
+        
+        # Key bindings for the input area
+        kb = KeyBindings()
+        
+        @kb.add('enter')
+        def handle_enter(event):
+            """Handle Enter key - submit input."""
+            text = event.app.current_buffer.text.strip()
+            if text:
+                # Store the input
+                self._pending_input.put(text)
+                # Clear the buffer
+                event.app.current_buffer.reset()
+        
+        @kb.add('c-c')
+        def handle_ctrl_c(event):
+            """Handle Ctrl+C - interrupt or exit."""
+            if self._agent_running and self.agent:
+                print("\n⚡ Interrupting agent...")
+                self.agent.interrupt()
+            else:
+                self._should_exit = True
+                event.app.exit()
+        
+        @kb.add('c-d')
+        def handle_ctrl_d(event):
+            """Handle Ctrl+D - exit."""
+            self._should_exit = True
+            event.app.exit()
+        
+        # Create the input area widget
+        input_area = TextArea(
+            height=1,
+            prompt='❯ ',
+            style='class:input-area',
+            multiline=False,
+            wrap_lines=False,
+        )
+        
+        # Create a status line that shows when agent is working
+        def get_status_text():
+            if self._agent_running:
+                return [('class:status', ' 🔄 Agent working... (type to interrupt) ')]
+            return [('class:status', '')]
+        
+        status_window = Window(
+            content=FormattedTextControl(get_status_text),
+            height=1,
+        )
+        
+        # Layout with status and input at bottom
+        layout = Layout(
+            HSplit([
+                Window(height=0),  # Spacer that expands
+                status_window,
+                input_area,
+            ])
+        )
+        
+        # Style for the application
+        style = PTStyle.from_dict({
+            'input-area': '#FFF8DC',
+            'status': 'bg:#333333 #FFD700',
+        })
+        
+        # Create the application
+        app = Application(
+            layout=layout,
+            key_bindings=kb,
+            style=style,
+            full_screen=False,
+            mouse_support=False,
+        )
+        
+        # Background thread to process inputs and run agent
+        def process_loop():
+            while not self._should_exit:
                 try:
-                    user_input = self.get_input()
-                    
-                    if user_input is None:
-                        print("\nGoodbye! ⚕")
-                        break
+                    # Check for pending input with timeout
+                    try:
+                        user_input = self._pending_input.get(timeout=0.1)
+                    except queue.Empty:
+                        continue
                     
                     if not user_input:
                         continue
@@ -1368,16 +1496,38 @@ class HermesCLI:
                     # Check for commands
                     if user_input.startswith("/"):
                         if not self.process_command(user_input):
-                            print("\nGoodbye! ⚕")
-                            break
+                            self._should_exit = True
+                            # We are on the worker thread: hand exit() to the app's event loop
+                            if app.is_running and app.loop is not None:
+                                app.loop.call_soon_threadsafe(app.exit)
                         continue
                     
-                    # Regular chat message
-                    self.chat(user_input)
+                    # Regular chat - run agent
+                    self._agent_running = True
+                    app.invalidate()  # Refresh status line
                     
-                except KeyboardInterrupt:
-                    print("\nInterrupted. Type /quit to exit.")
-                    continue
+                    try:
+                        self.chat(user_input)
+                    finally:
+                        self._agent_running = False
+                        app.invalidate()  # Refresh status line
+                    
+                except Exception as e:
+                    print(f"Error: {e}")
+        
+        # Start processing thread
+        process_thread = threading.Thread(target=process_loop, daemon=True)
+        process_thread.start()
+        
+        # Run the application with patch_stdout for proper output handling
+        try:
+            with patch_stdout():
+                app.run()
+        except (EOFError, KeyboardInterrupt):
+            pass
+        finally:
+            self._should_exit = True
+            print("\nGoodbye! ⚕")
 
 
 # ============================================================================
diff --git a/gateway/run.py b/gateway/run.py
index b10f4cf54..76f9d4db4 100644
--- a/gateway/run.py
+++ b/gateway/run.py
@@ -72,6 +72,11 @@ class GatewayRunner:
         self.delivery_router = DeliveryRouter(self.config)
         self._running = False
         self._shutdown_event = asyncio.Event()
+        
+        # Track running agents per session for interrupt support
+        # Key: session_key, Value: AIAgent instance
+        self._running_agents: Dict[str, Any] = {}
+        self._pending_messages: Dict[str, str] = {}  # Queued messages during interrupt
     
     async def start(self) -> bool:
         """
@@ -217,10 +222,11 @@ class GatewayRunner:
         This is the core message processing pipeline:
         1. Check user authorization
         2. Check for commands (/new, /reset, etc.)
-        3. Get or create session
-        4. Build context for agent
-        5. Run agent conversation
-        6. Return response
+        3. Check for running agent and interrupt if needed
+        4. Get or create session
+        5. Build context for agent
+        6. Run agent conversation
+        7. Return response
         """
         source = event.source
         
@@ -229,7 +235,7 @@ class GatewayRunner:
             print(f"[gateway] Unauthorized user: {source.user_id} ({source.user_name}) on {source.platform.value}")
             return None  # Silently ignore unauthorized users
         
-        # Check for reset commands
+        # Check for commands
         command = event.get_command()
         if command in ["new", "reset"]:
             return await self._handle_reset_command(event)
@@ -237,8 +243,21 @@ class GatewayRunner:
         if command == "status":
             return await self._handle_status_command(event)
         
+        if command == "stop":
+            return await self._handle_stop_command(event)
+        
         # Get or create session
         session_entry = self.session_store.get_or_create_session(source)
+        session_key = session_entry.session_key
+        
+        # Check if there's already a running agent for this session
+        if session_key in self._running_agents:
+            running_agent = self._running_agents[session_key]
+            print(f"[gateway] ⚡ Interrupting running agent for session {session_key[:20]}...")
+            running_agent.interrupt(event.text)
+            # Store the new message to be processed after current agent finishes
+            self._pending_messages[session_key] = event.text
+            return None  # Don't respond yet - let the interrupt handle it
         
         # Build session context
         context = build_session_context(source, self.config, session_entry)
@@ -259,7 +278,8 @@ class GatewayRunner:
                 context_prompt=context_prompt,
                 history=history,
                 source=source,
-                session_id=session_entry.session_id
+                session_id=session_entry.session_id,
+                session_key=session_key
             )
             
             # Append to transcript
@@ -309,6 +329,10 @@ class GatewayRunner:
         
         connected_platforms = [p.value for p in self.adapters.keys()]
         
+        # Check if there's an active agent
+        session_key = session_entry.session_key
+        is_running = session_key in self._running_agents
+        
         lines = [
             "📊 **Hermes Gateway Status**",
             "",
@@ -316,12 +340,26 @@ class GatewayRunner:
             f"**Created:** {session_entry.created_at.strftime('%Y-%m-%d %H:%M')}",
             f"**Last Activity:** {session_entry.updated_at.strftime('%Y-%m-%d %H:%M')}",
             f"**Tokens:** {session_entry.total_tokens:,}",
+            f"**Agent Running:** {'Yes ⚡' if is_running else 'No'}",
             "",
             f"**Connected Platforms:** {', '.join(connected_platforms)}",
         ]
         
         return "\n".join(lines)
     
+    async def _handle_stop_command(self, event: MessageEvent) -> str:
+        """Handle the /stop command by interrupting this session's running agent.
+        
+        Returns a confirmation when an agent is tracked for the session,
+        otherwise a notice that there is nothing to stop.
+        """
+        session_entry = self.session_store.get_or_create_session(event.source)
+        running_agent = self._running_agents.get(session_entry.session_key)
+        if running_agent is None:
+            return "No active task to stop."
+        running_agent.interrupt()
+        return "⚡ Stopping the current task... The agent will finish its current step and respond."
+    
     def _set_session_env(self, context: SessionContext) -> None:
         """Set environment variables for the current session."""
         os.environ["HERMES_SESSION_PLATFORM"] = context.source.platform.value
@@ -341,12 +379,14 @@ class GatewayRunner:
         context_prompt: str,
         history: List[Dict[str, Any]],
         source: SessionSource,
-        session_id: str
+        session_id: str,
+        session_key: str = None
     ) -> str:
         """
         Run the agent with the given message and context.
         
         This is run in a thread pool to not block the event loop.
+        Supports interruption via new messages.
         """
         from run_agent import AIAgent
         import queue
@@ -432,6 +472,10 @@ class GatewayRunner:
                     print(f"[Gateway] Progress message error: {e}")
                     await asyncio.sleep(1)
         
+        # We need to share the agent instance for interrupt support
+        agent_holder = [None]  # Mutable container for the agent instance
+        result_holder = [None]  # Mutable container for the result
+        
         def run_sync():
             # Read from env var or use default (same as CLI)
             max_iterations = int(os.getenv("HERMES_MAX_ITERATIONS", "60"))
@@ -446,6 +490,9 @@ class GatewayRunner:
                 tool_progress_callback=progress_callback if tool_progress_enabled else None,
             )
             
+            # Store agent reference for interrupt support
+            agent_holder[0] = agent
+            
             # Convert transcript history to agent format
             # Transcript has timestamps; agent expects {"role": ..., "content": ...}
             agent_history = []
@@ -456,6 +503,7 @@ class GatewayRunner:
                     agent_history.append({"role": role, "content": content})
             
             result = agent.run_conversation(message, conversation_history=agent_history)
+            result_holder[0] = result
             
             # Return final response, or a message if something went wrong
             final_response = result.get("final_response")
@@ -472,14 +520,56 @@ class GatewayRunner:
         if tool_progress_enabled:
             progress_task = asyncio.create_task(send_progress_messages())
         
+        # Track this agent as running for this session (for interrupt support)
+        # We do this in a callback after the agent is created
+        async def track_agent():
+            # Wait for agent to be created
+            while agent_holder[0] is None:
+                await asyncio.sleep(0.05)
+            if session_key:
+                self._running_agents[session_key] = agent_holder[0]
+        
+        tracking_task = asyncio.create_task(track_agent())
+        
         try:
             # Run in thread pool to not block
             loop = asyncio.get_event_loop()
             response = await loop.run_in_executor(None, run_sync)
+            
+            # Pick up any message that arrived while this agent was running, even if
+            # the agent finished before seeing the interrupt (else it would be lost).
+            result = result_holder[0]
+            pending = self._pending_messages.pop(session_key, None) if session_key else None
+            if pending:
+                print(f"[gateway] 📨 Processing interrupted message: '{pending[:40]}...'")
+                # Add an indicator only when the run was actually cut short
+                if response and result and result.get("interrupted"):
+                    response = response + "\n\n---\n_[Interrupted - processing your new message]_"
+                
+                # Send the first response before starting on the new message
+                adapter = self.adapters.get(source.platform)
+                if adapter and response:
+                    await adapter.send(chat_id=source.chat_id, content=response)
+                
+                # Now process the pending message with updated history
+                updated_history = result.get("messages", history) if result else history
+                return await self._run_agent(
+                    message=pending,
+                    context_prompt=context_prompt,
+                    history=updated_history,
+                    source=source,
+                    session_id=session_id,
+                    session_key=session_key
+                )
         finally:
             # Stop progress sender
             if progress_task:
                 progress_task.cancel()
+            
+            # Clean up tracking
+            tracking_task.cancel()
+            if session_key and session_key in self._running_agents:
+                del self._running_agents[session_key]
                 try:
                     await progress_task
                 except asyncio.CancelledError:
diff --git a/run_agent.py b/run_agent.py
index 72541f6bd..7b70289ff 100644
--- a/run_agent.py
+++ b/run_agent.py
@@ -639,6 +639,10 @@ class AIAgent:
         self.tool_progress_callback = tool_progress_callback
         self._last_reported_tool = None  # Track for "new tool" mode
         
+        # Interrupt mechanism for breaking out of tool loops
+        self._interrupt_requested = False
+        self._interrupt_message = None  # Optional message that triggered interrupt
+        
         # Store OpenRouter provider preferences
         self.providers_allowed = providers_allowed
         self.providers_ignored = providers_ignored
@@ -1302,6 +1306,42 @@ class AIAgent:
             if self.verbose_logging:
                 logging.warning(f"Failed to save session log: {e}")
     
+    def interrupt(self, message: str = None) -> None:
+        """
+        Request the agent to interrupt its current tool-calling loop.
+        
+        Call this from another thread (e.g., input handler, message receiver)
+        to gracefully stop the agent and process a new message.
+        
+        Args:
+            message: Optional new message that triggered the interrupt.
+                     If provided, run_conversation() returns it as "interrupt_message".
+        
+        Example (CLI):
+            # In a separate input thread:
+            if user_typed_something:
+                agent.interrupt(user_input)
+        
+        Example (Messaging):
+            # When new message arrives for active session:
+            if session_has_running_agent:
+                running_agent.interrupt(new_message.text)
+        """
+        self._interrupt_message = message  # set before the flag so a reader that sees the flag sees it
+        self._interrupt_requested = True
+        if not self.quiet_mode:
+            print("\n⚡ Interrupt requested" + (f": '{message[:40]}...'" if message and len(message) > 40 else f": '{message}'" if message else ""))
+    
+    def clear_interrupt(self) -> None:
+        """Reset the interrupt flag and discard any stored interrupt message."""
+        self._interrupt_requested = False
+        self._interrupt_message = None
+    
+    @property
+    def is_interrupted(self) -> bool:
+        """Whether an interrupt has been requested and not yet cleared."""
+        return self._interrupt_requested
+    
     def run_conversation(
         self,
         user_message: str,
@@ -1359,8 +1399,19 @@ class AIAgent:
         # Main conversation loop
         api_call_count = 0
         final_response = None
+        interrupted = False
+        
+        # Clear any stale interrupt state at start
+        self.clear_interrupt()
         
         while api_call_count < self.max_iterations:
+            # Check for interrupt request (e.g., user sent new message)
+            if self._interrupt_requested:
+                interrupted = True
+                if not self.quiet_mode:
+                    print(f"\n⚡ Breaking out of tool loop due to interrupt...")
+                break
+            
             api_call_count += 1
             
             # Prepare messages for API call
@@ -2059,13 +2110,24 @@ class AIAgent:
         self._session_messages = messages
         self._save_session_log(messages)
         
-        return {
+        # Build result with interrupt info if applicable
+        result = {
             "final_response": final_response,
             "messages": messages,
             "api_calls": api_call_count,
             "completed": completed,
-            "partial": False  # True only when stopped due to invalid tool calls
+            "partial": False,  # True only when stopped due to invalid tool calls
+            "interrupted": interrupted,
         }
+        
+        # Include interrupt message if one triggered the interrupt
+        if interrupted and self._interrupt_message:
+            result["interrupt_message"] = self._interrupt_message
+        
+        # Clear interrupt state after handling
+        self.clear_interrupt()
+        
+        return result
     
     def chat(self, message: str) -> str:
         """