tests/gateway/test_run_progress_topics.py

"""Tests for topic-aware gateway progress updates."""

import importlib
import sys
import time
import types
from types import SimpleNamespace

import pytest

from gateway.config import Platform, PlatformConfig
from gateway.platforms.base import BasePlatformAdapter, SendResult
from gateway.session import SessionSource


class ProgressCaptureAdapter(BasePlatformAdapter):
    """Platform adapter test double that records outbound calls in memory.

    ``send``, ``edit_message`` and ``send_typing`` append the arguments they
    receive to ``sent``, ``edits`` and ``typing`` respectively, so a test can
    inspect exactly what the gateway asked the adapter to do.
    """

    def __init__(self, platform=Platform.TELEGRAM):
        config = PlatformConfig(enabled=True, token="***")
        super().__init__(config, platform)
        # One capture list per outbound operation.
        self.sent, self.edits, self.typing = [], [], []

    async def connect(self) -> bool:
        """Report a successful connection without doing anything."""
        return True

    async def disconnect(self) -> None:
        """Do nothing; there is no connection to close."""

    async def send(self, chat_id, content, reply_to=None, metadata=None) -> SendResult:
        """Record the outgoing message and report success with a fixed message id."""
        record = dict(
            chat_id=chat_id,
            content=content,
            reply_to=reply_to,
            metadata=metadata,
        )
        self.sent.append(record)
        return SendResult(success=True, message_id="progress-1")

    async def edit_message(self, chat_id, message_id, content) -> SendResult:
        """Record the edit request and echo back the edited message id."""
        record = dict(chat_id=chat_id, message_id=message_id, content=content)
        self.edits.append(record)
        return SendResult(success=True, message_id=message_id)

    async def send_typing(self, chat_id, metadata=None) -> None:
        """Record a typing-indicator request together with its metadata."""
        self.typing.append(dict(chat_id=chat_id, metadata=metadata))

    async def get_chat_info(self, chat_id: str):
        """Return a minimal chat description containing only the id."""
        return dict(id=chat_id)


class FakeAgent:
    """Minimal agent stand-in that reports two tool-progress events.

    The constructor accepts arbitrary keyword arguments and keeps only
    ``tool_progress_callback`` (``None`` when it is not supplied).
    """

    def __init__(self, **kwargs):
        self.tools = []
        self.tool_progress_callback = kwargs.get("tool_progress_callback")

    def run_conversation(self, message, conversation_history=None, task_id=None):
        """Fire the scripted progress events and return a canned result.

        The callback is invoked once per scripted event, each followed by a
        0.35 second pause. The arguments of this method are not inspected.
        """
        scripted_events = (
            ("terminal", "pwd"),
            ("browser_navigate", "https://example.com"),
        )
        for tool_name, tool_arg in scripted_events:
            self.tool_progress_callback(tool_name, tool_arg)
            # NOTE(review): the pause presumably gives the gateway's progress
            # consumer time to handle each event - confirm against gateway.run.
            time.sleep(0.35)
        return dict(final_response="done", messages=[], api_calls=1)


def _make_runner(adapter):
    """Return a ``GatewayRunner`` wired to *adapter* without calling its ``__init__``.

    The instance is allocated with ``object.__new__`` and then given the
    attributes listed below by hand; *adapter* is registered under its own
    ``platform`` key in ``runner.adapters``.
    """
    runner_cls = importlib.import_module("gateway.run").GatewayRunner
    runner = object.__new__(runner_cls)

    # Attribute name -> stub value, assigned in the order listed.
    stub_state = {
        "adapters": {adapter.platform: adapter},
        "_voice_mode": {},
        "_prefill_messages": [],
        "_ephemeral_system_prompt": "",
        "_reasoning_config": None,
        "_provider_routing": {},
        "_fallback_model": None,
        "_session_db": None,
        "_running_agents": {},
        "hooks": SimpleNamespace(loaded_hooks=False),
    }
    for attr_name, attr_value in stub_state.items():
        setattr(runner, attr_name, attr_value)
    return runner


@pytest.mark.asyncio
async def test_run_agent_progress_stays_in_originating_topic(monkeypatch, tmp_path):
    """Progress for a Telegram group topic must carry that topic's thread id."""
    monkeypatch.setenv("HERMES_TOOL_PROGRESS_MODE", "all")

    # Register stub ``dotenv`` and ``run_agent`` modules in sys.modules so
    # that imports of those names resolve to the stubs for this test.
    def _ignore_load_dotenv(*args, **kwargs):
        return None

    dotenv_stub = types.ModuleType("dotenv")
    dotenv_stub.load_dotenv = _ignore_load_dotenv
    run_agent_stub = types.ModuleType("run_agent")
    run_agent_stub.AIAgent = FakeAgent
    for module_name, stub in (("dotenv", dotenv_stub), ("run_agent", run_agent_stub)):
        monkeypatch.setitem(sys.modules, module_name, stub)

    adapter = ProgressCaptureAdapter()
    runner = _make_runner(adapter)

    def _fake_runtime_kwargs():
        return {"api_key": "fake"}

    gateway_module = importlib.import_module("gateway.run")
    monkeypatch.setattr(gateway_module, "_hermes_home", tmp_path)
    monkeypatch.setattr(gateway_module, "_resolve_runtime_agent_kwargs", _fake_runtime_kwargs)

    topic_source = SessionSource(
        platform=Platform.TELEGRAM,
        chat_id="-1001",
        chat_type="group",
        thread_id="17585",
    )
    run_kwargs = dict(
        message="hello",
        context_prompt="",
        history=[],
        source=topic_source,
        session_id="sess-1",
        session_key="agent:main:telegram:group:-1001:17585",
    )
    result = await runner._run_agent(**run_kwargs)

    topic_metadata = {"thread_id": "17585"}
    expected_sent = [
        {
            "chat_id": "-1001",
            "content": '💻 terminal: "pwd"',
            "reply_to": None,
            "metadata": topic_metadata,
        }
    ]
    assert result["final_response"] == "done"
    # Exactly one message is sent; the second progress event must arrive as an edit.
    assert adapter.sent == expected_sent
    assert adapter.edits
    assert all(call["metadata"] == topic_metadata for call in adapter.typing)


@pytest.mark.asyncio
async def test_run_agent_progress_does_not_use_event_message_id_for_telegram_dm(monkeypatch, tmp_path):
    """A thread-less Telegram DM must not turn the event message id into thread metadata."""
    monkeypatch.setenv("HERMES_TOOL_PROGRESS_MODE", "all")

    # Register stub ``dotenv`` and ``run_agent`` modules in sys.modules so
    # that imports of those names resolve to the stubs for this test.
    dotenv_stub = types.ModuleType("dotenv")
    dotenv_stub.load_dotenv = lambda *args, **kwargs: None
    monkeypatch.setitem(sys.modules, "dotenv", dotenv_stub)

    run_agent_stub = types.ModuleType("run_agent")
    run_agent_stub.AIAgent = FakeAgent
    monkeypatch.setitem(sys.modules, "run_agent", run_agent_stub)

    adapter = ProgressCaptureAdapter(platform=Platform.TELEGRAM)
    runner = _make_runner(adapter)

    gateway_module = importlib.import_module("gateway.run")
    monkeypatch.setattr(gateway_module, "_hermes_home", tmp_path)
    monkeypatch.setattr(
        gateway_module,
        "_resolve_runtime_agent_kwargs",
        lambda: {"api_key": "***"},
    )

    dm_source = SessionSource(
        platform=Platform.TELEGRAM,
        chat_id="12345",
        chat_type="dm",
        thread_id=None,
    )

    # The source has no thread id, but the call does supply an event message id.
    result = await runner._run_agent(
        message="hello",
        context_prompt="",
        history=[],
        source=dm_source,
        session_id="sess-2",
        session_key="agent:main:telegram:dm:12345",
        event_message_id="777",
    )

    assert result["final_response"] == "done"
    assert adapter.sent
    first_sent = adapter.sent[0]
    assert first_sent["metadata"] is None
    assert all(call["metadata"] is None for call in adapter.typing)


@pytest.mark.asyncio
async def test_run_agent_progress_uses_event_message_id_for_slack_dm(monkeypatch, tmp_path):
    """A thread-less Slack DM must use the event message id as the progress thread id."""
    monkeypatch.setenv("HERMES_TOOL_PROGRESS_MODE", "all")

    # Register stub ``dotenv`` and ``run_agent`` modules in sys.modules so
    # that imports of those names resolve to the stubs for this test.
    dotenv_stub = types.ModuleType("dotenv")
    dotenv_stub.load_dotenv = lambda *args, **kwargs: None
    monkeypatch.setitem(sys.modules, "dotenv", dotenv_stub)

    run_agent_stub = types.ModuleType("run_agent")
    run_agent_stub.AIAgent = FakeAgent
    monkeypatch.setitem(sys.modules, "run_agent", run_agent_stub)

    adapter = ProgressCaptureAdapter(platform=Platform.SLACK)
    runner = _make_runner(adapter)

    gateway_module = importlib.import_module("gateway.run")
    monkeypatch.setattr(gateway_module, "_hermes_home", tmp_path)
    monkeypatch.setattr(
        gateway_module,
        "_resolve_runtime_agent_kwargs",
        lambda: {"api_key": "***"},
    )

    dm_source = SessionSource(
        platform=Platform.SLACK,
        chat_id="D123",
        chat_type="dm",
        thread_id=None,
    )

    event_ts = "1234567890.000001"
    result = await runner._run_agent(
        message="hello",
        context_prompt="",
        history=[],
        source=dm_source,
        session_id="sess-3",
        session_key="agent:main:slack:dm:D123",
        event_message_id=event_ts,
    )

    # Sends and typing indicators are both expected to be threaded on the event ts.
    threaded_metadata = {"thread_id": event_ts}
    assert result["final_response"] == "done"
    assert adapter.sent
    assert adapter.sent[0]["metadata"] == threaded_metadata
    assert all(call["metadata"] == threaded_metadata for call in adapter.typing)
fix(gateway): isolate telegram forum topic sessions 2026-03-11 09:15:34 +01:00			`"""Tests for topic-aware gateway progress updates."""`

			`import importlib`
			`import sys`
			`import time`
			`import types`
			`from types import SimpleNamespace`

			`import pytest`

			`from gateway.config import Platform, PlatformConfig`
			`from gateway.platforms.base import BasePlatformAdapter, SendResult`
			`from gateway.session import SessionSource`


			`class ProgressCaptureAdapter(BasePlatformAdapter):`
fix(gateway): scope progress thread fallback to Slack only (salvage #3414) (#3488) * test(gateway): map fixture adapter by platform in progress threading tests * fix(gateway): scope progress thread fallback to Slack only --------- Co-authored-by: EmpireOperating <258363005+EmpireOperating@users.noreply.github.com> 2026-03-27 22:37:53 -07:00			`def __init__(self, platform=Platform.TELEGRAM):`
			`super().__init__(PlatformConfig(enabled=True, token="***"), platform)`
fix(gateway): isolate telegram forum topic sessions 2026-03-11 09:15:34 +01:00			`self.sent = []`
			`self.edits = []`
			`self.typing = []`

			`async def connect(self) -> bool:`
			`return True`

			`async def disconnect(self) -> None:`
			`return None`

			`async def send(self, chat_id, content, reply_to=None, metadata=None) -> SendResult:`
			`self.sent.append(`
			`{`
			`"chat_id": chat_id,`
			`"content": content,`
			`"reply_to": reply_to,`
			`"metadata": metadata,`
			`}`
			`)`
			`return SendResult(success=True, message_id="progress-1")`

			`async def edit_message(self, chat_id, message_id, content) -> SendResult:`
			`self.edits.append(`
			`{`
			`"chat_id": chat_id,`
			`"message_id": message_id,`
			`"content": content,`
			`}`
			`)`
			`return SendResult(success=True, message_id=message_id)`

			`async def send_typing(self, chat_id, metadata=None) -> None:`
			`self.typing.append({"chat_id": chat_id, "metadata": metadata})`

			`async def get_chat_info(self, chat_id: str):`
			`return {"id": chat_id}`


			`class FakeAgent:`
			`def __init__(self, **kwargs):`
feat(gateway): cache AIAgent per session for prompt caching The gateway created a fresh AIAgent per message, rebuilding the system prompt (including memory, skills, context files) every turn. This broke prompt prefix caching — providers like Anthropic charge ~10x more for uncached prefixes. Now caches AIAgent instances per session_key with a config signature. The cached agent is reused across messages in the same session, preserving the frozen system prompt and tool schemas. Cache is invalidated when: - Config changes (model, provider, toolsets, reasoning, ephemeral prompt) — detected via signature mismatch - /new, /reset, /clear — explicit session reset - /model — global model change clears all cached agents - /reasoning — global reasoning change clears all cached agents Per-message state (callbacks, stream consumers, progress queues) is set on the agent instance before each run_conversation() call. This matches CLI behavior where a single AIAgent lives across all turns in a session, with _cached_system_prompt built once and reused. 2026-03-21 13:07:08 -07:00			`self.tool_progress_callback = kwargs.get("tool_progress_callback")`
fix(gateway): isolate telegram forum topic sessions 2026-03-11 09:15:34 +01:00			`self.tools = []`

			`def run_conversation(self, message, conversation_history=None, task_id=None):`
			`self.tool_progress_callback("terminal", "pwd")`
			`time.sleep(0.35)`
			`self.tool_progress_callback("browser_navigate", "https://example.com")`
			`time.sleep(0.35)`
			`return {`
			`"final_response": "done",`
			`"messages": [],`
			`"api_calls": 1,`
			`}`


			`def _make_runner(adapter):`
			`gateway_run = importlib.import_module("gateway.run")`
			`GatewayRunner = gateway_run.GatewayRunner`

			`runner = object.__new__(GatewayRunner)`
fix(gateway): scope progress thread fallback to Slack only (salvage #3414) (#3488) * test(gateway): map fixture adapter by platform in progress threading tests * fix(gateway): scope progress thread fallback to Slack only --------- Co-authored-by: EmpireOperating <258363005+EmpireOperating@users.noreply.github.com> 2026-03-27 22:37:53 -07:00			`runner.adapters = {adapter.platform: adapter}`
fix(test): add missing _voice_mode attr to GatewayRunner test stubs 2026-03-11 17:30:38 +03:00			`runner._voice_mode = {}`
fix(gateway): isolate telegram forum topic sessions 2026-03-11 09:15:34 +01:00			`runner._prefill_messages = []`
			`runner._ephemeral_system_prompt = ""`
			`runner._reasoning_config = None`
			`runner._provider_routing = {}`
			`runner._fallback_model = None`
			`runner._session_db = None`
			`runner._running_agents = {}`
			`runner.hooks = SimpleNamespace(loaded_hooks=False)`
			`return runner`


			`@pytest.mark.asyncio`
			`async def test_run_agent_progress_stays_in_originating_topic(monkeypatch, tmp_path):`
			`monkeypatch.setenv("HERMES_TOOL_PROGRESS_MODE", "all")`

			`fake_dotenv = types.ModuleType("dotenv")`
			`fake_dotenv.load_dotenv = lambda *args, **kwargs: None`
			`monkeypatch.setitem(sys.modules, "dotenv", fake_dotenv)`

			`fake_run_agent = types.ModuleType("run_agent")`
			`fake_run_agent.AIAgent = FakeAgent`
			`monkeypatch.setitem(sys.modules, "run_agent", fake_run_agent)`

			`adapter = ProgressCaptureAdapter()`
			`runner = _make_runner(adapter)`
			`gateway_run = importlib.import_module("gateway.run")`
			`monkeypatch.setattr(gateway_run, "_hermes_home", tmp_path)`
			`monkeypatch.setattr(gateway_run, "_resolve_runtime_agent_kwargs", lambda: {"api_key": "fake"})`
			`source = SessionSource(`
			`platform=Platform.TELEGRAM,`
			`chat_id="-1001",`
			`chat_type="group",`
			`thread_id="17585",`
			`)`

			`result = await runner._run_agent(`
			`message="hello",`
			`context_prompt="",`
			`history=[],`
			`source=source,`
			`session_id="sess-1",`
			`session_key="agent:main:telegram:group:-1001:17585",`
			`)`

			`assert result["final_response"] == "done"`
			`assert adapter.sent == [`
			`{`
			`"chat_id": "-1001",`
			`"content": '💻 terminal: "pwd"',`
			`"reply_to": None,`
			`"metadata": {"thread_id": "17585"},`
			`}`
			`]`
			`assert adapter.edits`
			`assert all(call["metadata"] == {"thread_id": "17585"} for call in adapter.typing)`
fix(gateway): scope progress thread fallback to Slack only (salvage #3414) (#3488) * test(gateway): map fixture adapter by platform in progress threading tests * fix(gateway): scope progress thread fallback to Slack only --------- Co-authored-by: EmpireOperating <258363005+EmpireOperating@users.noreply.github.com> 2026-03-27 22:37:53 -07:00

			`@pytest.mark.asyncio`
			`async def test_run_agent_progress_does_not_use_event_message_id_for_telegram_dm(monkeypatch, tmp_path):`
			`"""Telegram DM progress must not reuse event message id as thread metadata."""`
			`monkeypatch.setenv("HERMES_TOOL_PROGRESS_MODE", "all")`

			`fake_dotenv = types.ModuleType("dotenv")`
			`fake_dotenv.load_dotenv = lambda *args, **kwargs: None`
			`monkeypatch.setitem(sys.modules, "dotenv", fake_dotenv)`

			`fake_run_agent = types.ModuleType("run_agent")`
			`fake_run_agent.AIAgent = FakeAgent`
			`monkeypatch.setitem(sys.modules, "run_agent", fake_run_agent)`

			`adapter = ProgressCaptureAdapter(platform=Platform.TELEGRAM)`
			`runner = _make_runner(adapter)`
			`gateway_run = importlib.import_module("gateway.run")`
			`monkeypatch.setattr(gateway_run, "_hermes_home", tmp_path)`
			`monkeypatch.setattr(gateway_run, "_resolve_runtime_agent_kwargs", lambda: {"api_key": "***"})`

			`source = SessionSource(`
			`platform=Platform.TELEGRAM,`
			`chat_id="12345",`
			`chat_type="dm",`
			`thread_id=None,`
			`)`

			`result = await runner._run_agent(`
			`message="hello",`
			`context_prompt="",`
			`history=[],`
			`source=source,`
			`session_id="sess-2",`
			`session_key="agent:main:telegram:dm:12345",`
			`event_message_id="777",`
			`)`

			`assert result["final_response"] == "done"`
			`assert adapter.sent`
			`assert adapter.sent[0]["metadata"] is None`
			`assert all(call["metadata"] is None for call in adapter.typing)`


			`@pytest.mark.asyncio`
			`async def test_run_agent_progress_uses_event_message_id_for_slack_dm(monkeypatch, tmp_path):`
			`"""Slack DM progress should keep event ts fallback threading."""`
			`monkeypatch.setenv("HERMES_TOOL_PROGRESS_MODE", "all")`

			`fake_dotenv = types.ModuleType("dotenv")`
			`fake_dotenv.load_dotenv = lambda *args, **kwargs: None`
			`monkeypatch.setitem(sys.modules, "dotenv", fake_dotenv)`

			`fake_run_agent = types.ModuleType("run_agent")`
			`fake_run_agent.AIAgent = FakeAgent`
			`monkeypatch.setitem(sys.modules, "run_agent", fake_run_agent)`

			`adapter = ProgressCaptureAdapter(platform=Platform.SLACK)`
			`runner = _make_runner(adapter)`
			`gateway_run = importlib.import_module("gateway.run")`
			`monkeypatch.setattr(gateway_run, "_hermes_home", tmp_path)`
			`monkeypatch.setattr(gateway_run, "_resolve_runtime_agent_kwargs", lambda: {"api_key": "***"})`

			`source = SessionSource(`
			`platform=Platform.SLACK,`
			`chat_id="D123",`
			`chat_type="dm",`
			`thread_id=None,`
			`)`

			`result = await runner._run_agent(`
			`message="hello",`
			`context_prompt="",`
			`history=[],`
			`source=source,`
			`session_id="sess-3",`
			`session_key="agent:main:slack:dm:D123",`
			`event_message_id="1234567890.000001",`
			`)`

			`assert result["final_response"] == "done"`
			`assert adapter.sent`
			`assert adapter.sent[0]["metadata"] == {"thread_id": "1234567890.000001"}`
			`assert all(call["metadata"] == {"thread_id": "1234567890.000001"} for call in adapter.typing)`