Implement interrupt handling for agent and CLI input and persistent prompt line at bottom of CLI :)

- Enhanced the AIAgent class to support interrupt requests, allowing for graceful interruption of ongoing tasks and processing of new messages.
- Updated the HermesCLI to manage user input in a persistent manner, enabling real-time interruption of the agent's conversation.
- Introduced a mechanism in the GatewayRunner to handle incoming messages while an agent is running, allowing for immediate response to user commands.
- Improved overall user experience by providing feedback during interruptions and ensuring that pending messages are processed correctly.
2026-02-03 16:15:49 -08:00
parent beeb7896e0
commit 9bfe185a2e
3 changed files with 336 additions and 34 deletions
--- a/cli.py
+++ b/cli.py
@@ -33,6 +33,15 @@ from prompt_toolkit.history import FileHistory
 from prompt_toolkit.styles import Style as PTStyle
 from prompt_toolkit.formatted_text import HTML
 from prompt_toolkit.patch_stdout import patch_stdout
+from prompt_toolkit.application import Application, get_app
+from prompt_toolkit.buffer import Buffer
+from prompt_toolkit.layout import Layout, HSplit, Window, FormattedTextControl
+from prompt_toolkit.layout.processors import BeforeInput
+from prompt_toolkit.widgets import TextArea
+from prompt_toolkit.key_binding import KeyBindings
+import asyncio
+import threading
+import queue

 # Load environment variables first
 from dotenv import load_dotenv
@@ -1284,17 +1293,52 @@ class HermesCLI:
        print("─" * 60, flush=True)
        
        try:
-            # Run the conversation
-            result = self.agent.run_conversation(
-                user_message=message,
-                conversation_history=self.conversation_history[:-1],  # Exclude the message we just added
-            )
+            # Run the conversation with interrupt monitoring
+            result = None
+            
+            def run_agent():
+                nonlocal result
+                result = self.agent.run_conversation(
+                    user_message=message,
+                    conversation_history=self.conversation_history[:-1],  # Exclude the message we just added
+                )
+            
+            # Start agent in background thread
+            agent_thread = threading.Thread(target=run_agent)
+            agent_thread.start()
+            
+            # Monitor for new input in the pending queue while agent runs
+            interrupt_msg = None
+            while agent_thread.is_alive():
+                # Check if there's new input in the queue (from the persistent input area)
+                if hasattr(self, '_pending_input'):
+                    try:
+                        interrupt_msg = self._pending_input.get(timeout=0.1)
+                        if interrupt_msg:
+                            print(f"\n⚡ New message detected, interrupting...")
+                            self.agent.interrupt(interrupt_msg)
+                            break
+                    except:
+                        pass  # Queue empty or timeout, continue waiting
+                else:
+                    # Fallback if no queue (shouldn't happen)
+                    agent_thread.join(0.1)
+            
+            agent_thread.join()  # Ensure agent thread completes
            
            # Update history with full conversation
-            self.conversation_history = result.get("messages", self.conversation_history)
+            self.conversation_history = result.get("messages", self.conversation_history) if result else self.conversation_history
            
            # Get the final response
-            response = result.get("final_response", "")
+            response = result.get("final_response", "") if result else ""
+            
+            # Handle interrupt - check if we were interrupted
+            pending_message = None
+            if result and result.get("interrupted"):
+                pending_message = result.get("interrupt_message") or interrupt_msg
+                # Add indicator that we were interrupted
+                if response and pending_message:
+                    response = response + "\n\n---\n_[Interrupted - processing new message]_"
            
            if response:
                # Use simple print for compatibility with prompt_toolkit's patch_stdout
@@ -1307,6 +1351,11 @@ class HermesCLI:
                print()
                print("─" * 60)
            
+            # If we have a pending message from interrupt, process it immediately
+            if pending_message:
+                print(f"\n📨 Processing: '{pending_message[:50]}{'...' if len(pending_message) > 50 else ''}'")
+                return self.chat(pending_message)  # Recursive call to handle the new message
+            
            return response
            
        except Exception as e:
@@ -1345,22 +1394,101 @@ class HermesCLI:
            return None
    
    def run(self):
-        """Run the interactive CLI loop with fixed input at bottom."""
+        """Run the interactive CLI loop with persistent input at bottom."""
        self.show_banner()
-        
-        # These Rich prints work fine BEFORE patch_stdout
        self.console.print("[#FFF8DC]Welcome to Hermes Agent! Type your message or /help for commands.[/]")
        self.console.print()
        
-        # Use patch_stdout to ensure all output appears above the input prompt
-        with patch_stdout():
-            while True:
+        # State for async operation
+        self._agent_running = False
+        self._pending_input = queue.Queue()
+        self._should_exit = False
+        
+        # Create a persistent input area using prompt_toolkit Application
+        input_buffer = Buffer()
+        
+        # Key bindings for the input area
+        kb = KeyBindings()
+        
+        @kb.add('enter')
+        def handle_enter(event):
+            """Handle Enter key - submit input."""
+            text = event.app.current_buffer.text.strip()
+            if text:
+                # Store the input
+                self._pending_input.put(text)
+                # Clear the buffer
+                event.app.current_buffer.reset()
+        
+        @kb.add('c-c')
+        def handle_ctrl_c(event):
+            """Handle Ctrl+C - interrupt or exit."""
+            if self._agent_running and self.agent:
+                print("\n⚡ Interrupting agent...")
+                self.agent.interrupt()
+            else:
+                self._should_exit = True
+                event.app.exit()
+        
+        @kb.add('c-d')
+        def handle_ctrl_d(event):
+            """Handle Ctrl+D - exit."""
+            self._should_exit = True
+            event.app.exit()
+        
+        # Create the input area widget
+        input_area = TextArea(
+            height=1,
+            prompt='❯ ',
+            style='class:input-area',
+            multiline=False,
+            wrap_lines=False,
+        )
+        
+        # Create a status line that shows when agent is working
+        def get_status_text():
+            if self._agent_running:
+                return [('class:status', ' 🔄 Agent working... (type to interrupt) ')]
+            return [('class:status', '')]
+        
+        status_window = Window(
+            content=FormattedTextControl(get_status_text),
+            height=1,
+        )
+        
+        # Layout with status and input at bottom
+        layout = Layout(
+            HSplit([
+                Window(height=0),  # Spacer that expands
+                status_window,
+                input_area,
+            ])
+        )
+        
+        # Style for the application
+        style = PTStyle.from_dict({
+            'input-area': '#FFF8DC',
+            'status': 'bg:#333333 #FFD700',
+        })
+        
+        # Create the application
+        app = Application(
+            layout=layout,
+            key_bindings=kb,
+            style=style,
+            full_screen=False,
+            mouse_support=False,
+        )
+        
+        # Background thread to process inputs and run agent
+        def process_loop():
+            while not self._should_exit:
                try:
-                    user_input = self.get_input()
-                    
-                    if user_input is None:
-                        print("\nGoodbye! ⚕")
-                        break
+                    # Check for pending input with timeout
+                    try:
+                        user_input = self._pending_input.get(timeout=0.1)
+                    except queue.Empty:
+                        continue
                    
                    if not user_input:
                        continue
@@ -1368,16 +1496,38 @@ class HermesCLI:
                    # Check for commands
                    if user_input.startswith("/"):
                        if not self.process_command(user_input):
-                            print("\nGoodbye! ⚕")
-                            break
+                            self._should_exit = True
+                            # Schedule app exit
+                            if app.is_running:
+                                app.exit()
                        continue
                    
-                    # Regular chat message
-                    self.chat(user_input)
+                    # Regular chat - run agent
+                    self._agent_running = True
+                    app.invalidate()  # Refresh status line
                    
-                except KeyboardInterrupt:
-                    print("\nInterrupted. Type /quit to exit.")
-                    continue
+                    try:
+                        self.chat(user_input)
+                    finally:
+                        self._agent_running = False
+                        app.invalidate()  # Refresh status line
+                    
+                except Exception as e:
+                    print(f"Error: {e}")
+        
+        # Start processing thread
+        process_thread = threading.Thread(target=process_loop, daemon=True)
+        process_thread.start()
+        
+        # Run the application with patch_stdout for proper output handling
+        try:
+            with patch_stdout():
+                app.run()
+        except (EOFError, KeyboardInterrupt):
+            pass
+        finally:
+            self._should_exit = True
+            print("\nGoodbye! ⚕")


 # ============================================================================
--- a/gateway/run.py
+++ b/gateway/run.py
@@ -72,6 +72,11 @@ class GatewayRunner:
        self.delivery_router = DeliveryRouter(self.config)
        self._running = False
        self._shutdown_event = asyncio.Event()
+        
+        # Track running agents per session for interrupt support
+        # Key: session_key, Value: AIAgent instance
+        self._running_agents: Dict[str, Any] = {}
+        self._pending_messages: Dict[str, str] = {}  # Queued messages during interrupt
    
    async def start(self) -> bool:
        """
@@ -217,10 +222,11 @@ class GatewayRunner:
        This is the core message processing pipeline:
        1. Check user authorization
        2. Check for commands (/new, /reset, etc.)
-        3. Get or create session
-        4. Build context for agent
-        5. Run agent conversation
-        6. Return response
+        3. Check for running agent and interrupt if needed
+        4. Get or create session
+        5. Build context for agent
+        6. Run agent conversation
+        7. Return response
        """
        source = event.source
        
@@ -229,7 +235,7 @@ class GatewayRunner:
            print(f"[gateway] Unauthorized user: {source.user_id} ({source.user_name}) on {source.platform.value}")
            return None  # Silently ignore unauthorized users
        
-        # Check for reset commands
+        # Check for commands
        command = event.get_command()
        if command in ["new", "reset"]:
            return await self._handle_reset_command(event)
@@ -237,8 +243,21 @@ class GatewayRunner:
        if command == "status":
            return await self._handle_status_command(event)
        
+        if command == "stop":
+            return await self._handle_stop_command(event)
+        
        # Get or create session
        session_entry = self.session_store.get_or_create_session(source)
+        session_key = session_entry.session_key
+        
+        # Check if there's already a running agent for this session
+        if session_key in self._running_agents:
+            running_agent = self._running_agents[session_key]
+            print(f"[gateway] ⚡ Interrupting running agent for session {session_key[:20]}...")
+            running_agent.interrupt(event.text)
+            # Store the new message to be processed after current agent finishes
+            self._pending_messages[session_key] = event.text
+            return None  # Don't respond yet - let the interrupt handle it
        
        # Build session context
        context = build_session_context(source, self.config, session_entry)
@@ -259,7 +278,8 @@ class GatewayRunner:
                context_prompt=context_prompt,
                history=history,
                source=source,
-                session_id=session_entry.session_id
+                session_id=session_entry.session_id,
+                session_key=session_key
            )
            
            # Append to transcript
@@ -309,6 +329,10 @@ class GatewayRunner:
        
        connected_platforms = [p.value for p in self.adapters.keys()]
        
+        # Check if there's an active agent
+        session_key = session_entry.session_key
+        is_running = session_key in self._running_agents
+        
        lines = [
            "📊 **Hermes Gateway Status**",
            "",
@@ -316,12 +340,26 @@ class GatewayRunner:
            f"**Created:** {session_entry.created_at.strftime('%Y-%m-%d %H:%M')}",
            f"**Last Activity:** {session_entry.updated_at.strftime('%Y-%m-%d %H:%M')}",
            f"**Tokens:** {session_entry.total_tokens:,}",
+            f"**Agent Running:** {'Yes ⚡' if is_running else 'No'}",
            "",
            f"**Connected Platforms:** {', '.join(connected_platforms)}",
        ]
        
        return "\n".join(lines)
    
+    async def _handle_stop_command(self, event: MessageEvent) -> str:
+        """Interrupt the agent running for the sender's session (/stop command).
+        
+        Returns a confirmation when a running agent was signalled, otherwise a
+        notice that there is nothing to stop for this session.
+        """
+        session_key = self.session_store.get_or_create_session(event.source).session_key
+        
+        if session_key not in self._running_agents:
+            return "No active task to stop."
+        self._running_agents[session_key].interrupt()
+        return "⚡ Stopping the current task... The agent will finish its current step and respond."
+    
    def _set_session_env(self, context: SessionContext) -> None:
        """Set environment variables for the current session."""
        os.environ["HERMES_SESSION_PLATFORM"] = context.source.platform.value
@@ -341,12 +379,14 @@ class GatewayRunner:
        context_prompt: str,
        history: List[Dict[str, Any]],
        source: SessionSource,
-        session_id: str
+        session_id: str,
+        session_key: str = None
    ) -> str:
        """
        Run the agent with the given message and context.
        
        This is run in a thread pool to not block the event loop.
+        Supports interruption via new messages.
        """
        from run_agent import AIAgent
        import queue
@@ -432,6 +472,10 @@ class GatewayRunner:
                    print(f"[Gateway] Progress message error: {e}")
                    await asyncio.sleep(1)
        
+        # We need to share the agent instance for interrupt support
+        agent_holder = [None]  # Mutable container for the agent instance
+        result_holder = [None]  # Mutable container for the result
+        
        def run_sync():
            # Read from env var or use default (same as CLI)
            max_iterations = int(os.getenv("HERMES_MAX_ITERATIONS", "60"))
@@ -446,6 +490,9 @@ class GatewayRunner:
                tool_progress_callback=progress_callback if tool_progress_enabled else None,
            )
            
+            # Store agent reference for interrupt support
+            agent_holder[0] = agent
+            
            # Convert transcript history to agent format
            # Transcript has timestamps; agent expects {"role": ..., "content": ...}
            agent_history = []
@@ -456,6 +503,7 @@ class GatewayRunner:
                    agent_history.append({"role": role, "content": content})
            
            result = agent.run_conversation(message, conversation_history=agent_history)
+            result_holder[0] = result
            
            # Return final response, or a message if something went wrong
            final_response = result.get("final_response")
@@ -472,14 +520,56 @@ class GatewayRunner:
        if tool_progress_enabled:
            progress_task = asyncio.create_task(send_progress_messages())
        
+        # Track this agent as running for this session (for interrupt support)
+        # We do this in a callback after the agent is created
+        async def track_agent():
+            # Wait for agent to be created
+            while agent_holder[0] is None:
+                await asyncio.sleep(0.05)
+            if session_key:
+                self._running_agents[session_key] = agent_holder[0]
+        
+        tracking_task = asyncio.create_task(track_agent())
+        
        try:
            # Run in thread pool to not block
            loop = asyncio.get_event_loop()
            response = await loop.run_in_executor(None, run_sync)
+            
+            # Check if we were interrupted and have a pending message
+            result = result_holder[0]
+            if result and result.get("interrupted") and session_key:
+                pending = self._pending_messages.pop(session_key, None)
+                if pending:
+                    print(f"[gateway] 📨 Processing interrupted message: '{pending[:40]}...'")
+                    # Add an indicator to the response
+                    if response:
+                        response = response + "\n\n---\n_[Interrupted - processing your new message]_"
+                    
+                    # Send the interrupted response first
+                    adapter = self.adapters.get(source.platform)
+                    if adapter and response:
+                        await adapter.send(chat_id=source.chat_id, content=response)
+                    
+                    # Now process the pending message with updated history
+                    updated_history = result.get("messages", history)
+                    return await self._run_agent(
+                        message=pending,
+                        context_prompt=context_prompt,
+                        history=updated_history,
+                        source=source,
+                        session_id=session_id,
+                        session_key=session_key
+                    )
        finally:
            # Stop progress sender
            if progress_task:
                progress_task.cancel()
+            
+            # Clean up tracking
+            tracking_task.cancel()
+            if session_key and session_key in self._running_agents:
+                del self._running_agents[session_key]
                try:
                    await progress_task
                except asyncio.CancelledError:
--- a/run_agent.py
+++ b/run_agent.py
@@ -639,6 +639,10 @@ class AIAgent:
        self.tool_progress_callback = tool_progress_callback
        self._last_reported_tool = None  # Track for "new tool" mode
        
+        # Interrupt mechanism for breaking out of tool loops
+        self._interrupt_requested = False
+        self._interrupt_message = None  # Optional message that triggered interrupt
+        
        # Store OpenRouter provider preferences
        self.providers_allowed = providers_allowed
        self.providers_ignored = providers_ignored
@@ -1302,6 +1306,42 @@ class AIAgent:
            if self.verbose_logging:
                logging.warning(f"Failed to save session log: {e}")
    
+    def interrupt(self, message: str = None) -> None:
+        """Request the agent to interrupt its current tool-calling loop.
+        
+        Call this from another thread (e.g., input handler, message receiver).
+        It only sets flags; run_conversation() checks them at the top of each
+        loop iteration. Unless quiet_mode is set, a notice is printed.
+        
+        Args:
+            message: Optional new message that triggered the interrupt. When the
+                     loop stops, run_conversation() returns it as "interrupt_message".
+        
+        Example (CLI):
+            # In a separate input thread:
+            if user_typed_something:
+                agent.interrupt(user_input)
+        
+        Example (Messaging):
+            # When new message arrives for active session:
+            if session_has_running_agent:
+                running_agent.interrupt(new_message.text)
+        """
+        self._interrupt_requested = True
+        self._interrupt_message = message
+        if not self.quiet_mode:
+            print(f"\n⚡ Interrupt requested" + (f": '{message[:40]}...'" if message and len(message) > 40 else f": '{message}'" if message else ""))
+    
+    def clear_interrupt(self) -> None:
+        """Reset interrupt state: lower the request flag and forget its message."""
+        # One tuple assignment; targets are still set left to right (flag, then message).
+        self._interrupt_requested, self._interrupt_message = False, None
+    
+    @property
+    def is_interrupted(self) -> bool:
+        """True from an interrupt() call until clear_interrupt() resets the flag."""
+        return self._interrupt_requested
+    
    def run_conversation(
        self,
        user_message: str,
@@ -1359,8 +1399,19 @@ class AIAgent:
        # Main conversation loop
        api_call_count = 0
        final_response = None
+        interrupted = False
+        
+        # Clear any stale interrupt state at start
+        self.clear_interrupt()
        
        while api_call_count < self.max_iterations:
+            # Check for interrupt request (e.g., user sent new message)
+            if self._interrupt_requested:
+                interrupted = True
+                if not self.quiet_mode:
+                    print(f"\n⚡ Breaking out of tool loop due to interrupt...")
+                break
+            
            api_call_count += 1
            
            # Prepare messages for API call
@@ -2059,13 +2110,24 @@ class AIAgent:
        self._session_messages = messages
        self._save_session_log(messages)
        
-        return {
+        # Build result with interrupt info if applicable
+        result = {
            "final_response": final_response,
            "messages": messages,
            "api_calls": api_call_count,
            "completed": completed,
-            "partial": False  # True only when stopped due to invalid tool calls
+            "partial": False,  # True only when stopped due to invalid tool calls
+            "interrupted": interrupted,
        }
+        
+        # Include interrupt message if one triggered the interrupt
+        if interrupted and self._interrupt_message:
+            result["interrupt_message"] = self._interrupt_message
+        
+        # Clear interrupt state after handling
+        self.clear_interrupt()
+        
+        return result
    
    def chat(self, message: str) -> str:
        """