tests/test_860_dedup.py

"""Tests for issue #860 — SQLite session transcript deduplication.

Verifies that:
1. _flush_messages_to_session_db uses _last_flushed_db_idx to avoid re-writing
2. Multiple _persist_session calls don't duplicate messages
3. append_to_transcript(skip_db=True) skips SQLite but writes JSONL
4. The gateway doesn't double-write messages the agent already persisted
"""

import json
import os
import sqlite3
import tempfile
from pathlib import Path
from unittest.mock import MagicMock, patch

import pytest


# ---------------------------------------------------------------------------
# Test: _flush_messages_to_session_db only writes new messages
# ---------------------------------------------------------------------------

class TestFlushDeduplication:
    """Check that repeated flushes to the session DB never re-write messages.

    Every test pairs an AIAgent with a real SessionDB created inside a
    temporary directory and inspects ``db.get_messages`` after flushing.
    """

    def _make_agent(self, session_db):
        """Return a quiet AIAgent wired to *session_db* under a dummy API key."""
        fake_env = {"OPENROUTER_API_KEY": "test-key"}
        with patch.dict(os.environ, fake_env):
            # Imported lazily so the import itself runs with the patched environment.
            from run_agent import AIAgent

            return AIAgent(
                model="test/model",
                quiet_mode=True,
                session_db=session_db,
                session_id="test-session-860",
                skip_context_files=True,
                skip_memory=True,
            )

    def test_flush_writes_only_new_messages(self):
        """A repeated flush of an unchanged message list adds no rows."""
        from hermes_state import SessionDB

        with tempfile.TemporaryDirectory() as scratch_dir:
            db = SessionDB(db_path=Path(scratch_dir) / "test.db")
            agent = self._make_agent(db)

            conversation_history = [{"role": "user", "content": "old message"}]
            messages = [
                *conversation_history,
                {"role": "user", "content": "new question"},
                {"role": "assistant", "content": "new answer"},
            ]

            # Initial flush: only the two entries beyond the history are expected.
            agent._flush_messages_to_session_db(messages, conversation_history)
            rows = db.get_messages(agent.session_id)
            assert len(rows) == 2, f"Expected 2 messages, got {len(rows)}"

            # Identical flush: the stored row count must not grow.
            agent._flush_messages_to_session_db(messages, conversation_history)
            rows = db.get_messages(agent.session_id)
            assert len(rows) == 2, f"Expected still 2 messages after second flush, got {len(rows)}"

    def test_flush_writes_incrementally(self):
        """Messages appended between two flushes end up stored exactly once."""
        from hermes_state import SessionDB

        with tempfile.TemporaryDirectory() as scratch_dir:
            db = SessionDB(db_path=Path(scratch_dir) / "test.db")
            agent = self._make_agent(db)

            conversation_history = []
            messages = [{"role": "user", "content": "hello"}]

            # One message in, one row out.
            agent._flush_messages_to_session_db(messages, conversation_history)
            assert len(db.get_messages(agent.session_id)) == 1

            # Grow the same list in place, as a running conversation would.
            messages.extend(
                [
                    {"role": "assistant", "content": "hi there"},
                    {"role": "user", "content": "follow up"},
                ]
            )

            # Only the two additions should be written by this flush.
            agent._flush_messages_to_session_db(messages, conversation_history)
            rows = db.get_messages(agent.session_id)
            assert len(rows) == 3, f"Expected 3 total messages, got {len(rows)}"

    def test_persist_session_multiple_calls_no_duplication(self):
        """Calling _persist_session five times leaves one row per new message."""
        from hermes_state import SessionDB

        with tempfile.TemporaryDirectory() as scratch_dir:
            db = SessionDB(db_path=Path(scratch_dir) / "test.db")
            agent = self._make_agent(db)
            # Replace the session-log writer with a mock to keep file I/O out of the test.
            agent._save_session_log = MagicMock()

            conversation_history = [{"role": "user", "content": "old"}]
            messages = [
                *conversation_history,
                {"role": "user", "content": "q1"},
                {"role": "assistant", "content": "a1"},
                {"role": "user", "content": "q2"},
                {"role": "assistant", "content": "a2"},
            ]

            # Stand-in for the agent persisting from several exit paths in one run.
            persist_calls = 5
            for _ in range(persist_calls):
                agent._persist_session(messages, conversation_history)

            rows = db.get_messages(agent.session_id)
            assert len(rows) == 4, f"Expected 4 messages, got {len(rows)} (duplication bug!)"

    def test_flush_reset_after_compression(self):
        """With a new session id and a zeroed cursor, flushing targets the new session."""
        from hermes_state import SessionDB

        with tempfile.TemporaryDirectory() as scratch_dir:
            db = SessionDB(db_path=Path(scratch_dir) / "test.db")
            agent = self._make_agent(db)

            # Seed the original session with two messages.
            agent._flush_messages_to_session_db(
                [
                    {"role": "user", "content": "msg1"},
                    {"role": "assistant", "content": "reply1"},
                ],
                [],
            )

            old_session = agent.session_id
            assert agent._last_flushed_db_idx == 2

            # Reproduce by hand the session switch that compression is meant to
            # perform: fresh session id, matching DB session, cursor back to 0.
            agent.session_id = "compressed-session-new"
            db.create_session(session_id=agent.session_id, source="test")
            agent._last_flushed_db_idx = 0

            # Flush the compressed conversation into the new session.
            agent._flush_messages_to_session_db(
                [{"role": "user", "content": "summary of conversation"}],
                [],
            )

            assert len(db.get_messages(agent.session_id)) == 1

            # The rows of the original session must be untouched.
            assert len(db.get_messages(old_session)) == 2


# ---------------------------------------------------------------------------
# Test: append_to_transcript skip_db parameter
# ---------------------------------------------------------------------------

class TestAppendToTranscriptSkipDb:
    """Check how ``append_to_transcript`` treats SQLite with and without skip_db."""

    @staticmethod
    def _build_store(sessions_dir, db_filename=None):
        """Create a SessionStore rooted at *sessions_dir* with loading bypassed.

        When *db_filename* is given, a real SessionDB is created at that name
        inside *sessions_dir* and attached to the store; otherwise the store's
        ``_db`` is set to None. Returns a ``(store, db)`` pair.
        """
        from gateway.config import GatewayConfig
        from gateway.session import SessionStore

        db = None
        if db_filename is not None:
            from hermes_state import SessionDB

            db = SessionDB(db_path=sessions_dir / db_filename)

        config = GatewayConfig()
        # _ensure_loaded is patched out only while the store is constructed.
        with patch("gateway.session.SessionStore._ensure_loaded"):
            store = SessionStore(sessions_dir=sessions_dir, config=config)
        store._db = db
        store._loaded = True
        return store, db

    @staticmethod
    def _read_lines(path):
        """Return the lines of the file at *path*, line endings included."""
        with open(path) as handle:
            return list(handle)

    @pytest.fixture()
    def store(self, tmp_path):
        """SessionStore without any SQLite backend, for JSONL-only checks."""
        jsonl_only_store, _ = self._build_store(tmp_path)
        return jsonl_only_store

    def test_skip_db_writes_jsonl_only(self, store, tmp_path):
        """skip_db=True still appends the message to the JSONL transcript."""
        session_id = "test-skip-db"
        store.append_to_transcript(
            session_id,
            {"role": "assistant", "content": "hello world"},
            skip_db=True,
        )

        # The transcript file must exist and hold exactly the one message.
        jsonl_path = store.get_transcript_path(session_id)
        assert jsonl_path.exists()
        lines = self._read_lines(jsonl_path)
        assert len(lines) == 1
        assert json.loads(lines[0])["content"] == "hello world"

    def test_skip_db_prevents_sqlite_write(self, tmp_path):
        """skip_db=True with a real DB attached leaves the DB without rows."""
        store, db = self._build_store(tmp_path, "test_skip.db")

        session_id = "test-skip-db-real"
        db.create_session(session_id=session_id, source="test")

        store.append_to_transcript(
            session_id,
            {"role": "assistant", "content": "hello world"},
            skip_db=True,
        )

        # Nothing may have reached SQLite...
        rows = db.get_messages(session_id)
        assert len(rows) == 0, f"Expected 0 DB rows with skip_db=True, got {len(rows)}"

        # ...while the JSONL transcript holds the message.
        jsonl_path = store.get_transcript_path(session_id)
        assert len(self._read_lines(jsonl_path)) == 1

    def test_default_writes_both(self, tmp_path):
        """Omitting skip_db stores the message in JSONL and in SQLite."""
        store, db = self._build_store(tmp_path, "test_both.db")

        session_id = "test-default-write"
        db.create_session(session_id=session_id, source="test")

        store.append_to_transcript(
            session_id,
            {"role": "user", "content": "test message"},
        )

        # One line in the JSONL transcript.
        jsonl_path = store.get_transcript_path(session_id)
        assert len(self._read_lines(jsonl_path)) == 1

        # One row in SQLite as well.
        assert len(db.get_messages(session_id)) == 1


# ---------------------------------------------------------------------------
# Test: _last_flushed_db_idx initialization
# ---------------------------------------------------------------------------

class TestFlushIdxInit:
    """Check the starting value of ``_last_flushed_db_idx`` on a fresh agent."""

    @staticmethod
    def _bare_agent():
        """Return a quiet AIAgent built without a session_db argument."""
        fake_env = {"OPENROUTER_API_KEY": "test-key"}
        with patch.dict(os.environ, fake_env):
            # Imported lazily so the import itself runs with the patched environment.
            from run_agent import AIAgent

            return AIAgent(
                model="test/model",
                quiet_mode=True,
                skip_context_files=True,
                skip_memory=True,
            )

    def test_init_zero(self):
        """A newly constructed agent reports a flush cursor of 0."""
        agent = self._bare_agent()
        assert agent._last_flushed_db_idx == 0

    def test_no_session_db_noop(self):
        """Flushing without a session_db neither raises nor moves the cursor."""
        agent = self._bare_agent()
        agent._flush_messages_to_session_db(
            [{"role": "user", "content": "test"}],
            [],
        )
        # The call above must complete, and the cursor must still be at 0.
        assert agent._last_flushed_db_idx == 0
fix: eliminate 3x SQLite message duplication in gateway sessions (#860)

Three separate code paths all wrote to the same SQLite state.db with no
deduplication, inflating session transcripts by 3-4x:

1. _log_msg_to_db() — wrote each message individually after append
2. _flush_messages_to_session_db() — re-wrote ALL new messages at every
   _persist_session() call (~18 exit points), with no tracking of what was
   already written
3. gateway append_to_transcript() — wrote everything a third time after the
   agent returned

Since load_transcript() prefers SQLite over JSONL, the inflated data was
loaded on every session resume, causing proportional token waste.

Fix:
- Remove _log_msg_to_db() and all 16 call sites (redundant with flush)
- Add _last_flushed_db_idx tracking in _flush_messages_to_session_db() so
  repeated _persist_session() calls only write truly new messages
- Reset flush cursor on compression (new session ID)
- Add skip_db parameter to SessionStore.append_to_transcript() so the gateway
  skips SQLite writes when the agent already persisted them
- Gateway now passes skip_db=True for agent-managed messages, still writes to
  JSONL as backup

Verified: a 12-message CLI session with tool calls produces exactly 12 SQLite
rows with zero duplicates (previously would be 36-48).

Tests: 9 new tests covering flush deduplication, skip_db behavior, compression
reset, and initialization. Full suite passes (2869 tests).

2026-03-10 15:22:44 -07:00
			`"""Tests for issue #860 — SQLite session transcript deduplication.`

			`Verifies that:`
			`1. _flush_messages_to_session_db uses _last_flushed_db_idx to avoid re-writing`
			`2. Multiple _persist_session calls don't duplicate messages`
			`3. append_to_transcript(skip_db=True) skips SQLite but writes JSONL`
			`4. The gateway doesn't double-write messages the agent already persisted`
			`"""`

			`import json`
			`import os`
			`import sqlite3`
			`import tempfile`
			`from pathlib import Path`
			`from unittest.mock import MagicMock, patch`

			`import pytest`


			`# ---------------------------------------------------------------------------`
			`# Test: _flush_messages_to_session_db only writes new messages`
			`# ---------------------------------------------------------------------------`

			`class TestFlushDeduplication:`
			`"""Verify _flush_messages_to_session_db tracks what it already wrote."""`

			`def _make_agent(self, session_db):`
			`"""Create a minimal AIAgent with a real session DB."""`
			`with patch.dict(os.environ, {"OPENROUTER_API_KEY": "test-key"}):`
			`from run_agent import AIAgent`
			`agent = AIAgent(`
			`model="test/model",`
			`quiet_mode=True,`
			`session_db=session_db,`
			`session_id="test-session-860",`
			`skip_context_files=True,`
			`skip_memory=True,`
			`)`
			`return agent`

			`def test_flush_writes_only_new_messages(self):`
			`"""First flush writes all new messages, second flush writes none."""`
			`from hermes_state import SessionDB`

			`with tempfile.TemporaryDirectory() as tmpdir:`
			`db_path = Path(tmpdir) / "test.db"`
			`db = SessionDB(db_path=db_path)`

			`agent = self._make_agent(db)`

			`conversation_history = [`
			`{"role": "user", "content": "old message"},`
			`]`
			`messages = list(conversation_history) + [`
			`{"role": "user", "content": "new question"},`
			`{"role": "assistant", "content": "new answer"},`
			`]`

			`# First flush — should write 2 new messages`
			`agent._flush_messages_to_session_db(messages, conversation_history)`

			`rows = db.get_messages(agent.session_id)`
			`assert len(rows) == 2, f"Expected 2 messages, got {len(rows)}"`

			`# Second flush with SAME messages — should write 0 new messages`
			`agent._flush_messages_to_session_db(messages, conversation_history)`

			`rows = db.get_messages(agent.session_id)`
			`assert len(rows) == 2, f"Expected still 2 messages after second flush, got {len(rows)}"`

			`def test_flush_writes_incrementally(self):`
			`"""Messages added between flushes are written exactly once."""`
			`from hermes_state import SessionDB`

			`with tempfile.TemporaryDirectory() as tmpdir:`
			`db_path = Path(tmpdir) / "test.db"`
			`db = SessionDB(db_path=db_path)`

			`agent = self._make_agent(db)`

			`conversation_history = []`
			`messages = [`
			`{"role": "user", "content": "hello"},`
			`]`

			`# First flush — 1 message`
			`agent._flush_messages_to_session_db(messages, conversation_history)`
			`rows = db.get_messages(agent.session_id)`
			`assert len(rows) == 1`

			`# Add more messages`
			`messages.append({"role": "assistant", "content": "hi there"})`
			`messages.append({"role": "user", "content": "follow up"})`

			`# Second flush — should write only 2 new messages`
			`agent._flush_messages_to_session_db(messages, conversation_history)`
			`rows = db.get_messages(agent.session_id)`
			`assert len(rows) == 3, f"Expected 3 total messages, got {len(rows)}"`

			`def test_persist_session_multiple_calls_no_duplication(self):`
			`"""Multiple _persist_session calls don't duplicate DB entries."""`
			`from hermes_state import SessionDB`

			`with tempfile.TemporaryDirectory() as tmpdir:`
			`db_path = Path(tmpdir) / "test.db"`
			`db = SessionDB(db_path=db_path)`

			`agent = self._make_agent(db)`
			`# Stub out _save_session_log to avoid file I/O`
			`agent._save_session_log = MagicMock()`

			`conversation_history = [{"role": "user", "content": "old"}]`
			`messages = list(conversation_history) + [`
			`{"role": "user", "content": "q1"},`
			`{"role": "assistant", "content": "a1"},`
			`{"role": "user", "content": "q2"},`
			`{"role": "assistant", "content": "a2"},`
			`]`

			`# Simulate multiple persist calls (like the agent's many exit paths)`
			`for _ in range(5):`
			`agent._persist_session(messages, conversation_history)`

			`rows = db.get_messages(agent.session_id)`
			`assert len(rows) == 4, f"Expected 4 messages, got {len(rows)} (duplication bug!)"`

			`def test_flush_reset_after_compression(self):`
			`"""After compression creates a new session, flush index resets."""`
			`from hermes_state import SessionDB`

			`with tempfile.TemporaryDirectory() as tmpdir:`
			`db_path = Path(tmpdir) / "test.db"`
			`db = SessionDB(db_path=db_path)`

			`agent = self._make_agent(db)`

			`# Write some messages`
			`messages = [`
			`{"role": "user", "content": "msg1"},`
			`{"role": "assistant", "content": "reply1"},`
			`]`
			`agent._flush_messages_to_session_db(messages, [])`

			`old_session = agent.session_id`
			`assert agent._last_flushed_db_idx == 2`

			`# Simulate what _compress_context does: new session, reset idx`
			`agent.session_id = "compressed-session-new"`
			`db.create_session(session_id=agent.session_id, source="test")`
			`agent._last_flushed_db_idx = 0`

			`# Now flush compressed messages to new session`
			`compressed_messages = [`
			`{"role": "user", "content": "summary of conversation"},`
			`]`
			`agent._flush_messages_to_session_db(compressed_messages, [])`

			`new_rows = db.get_messages(agent.session_id)`
			`assert len(new_rows) == 1`

			`# Old session should still have its 2 messages`
			`old_rows = db.get_messages(old_session)`
			`assert len(old_rows) == 2`


			`# ---------------------------------------------------------------------------`
			`# Test: append_to_transcript skip_db parameter`
			`# ---------------------------------------------------------------------------`

			`class TestAppendToTranscriptSkipDb:`
			`"""Verify skip_db=True writes JSONL but not SQLite."""`

			`@pytest.fixture()`
			`def store(self, tmp_path):`
			`from gateway.config import GatewayConfig`
			`from gateway.session import SessionStore`
			`config = GatewayConfig()`
			`with patch("gateway.session.SessionStore._ensure_loaded"):`
			`s = SessionStore(sessions_dir=tmp_path, config=config)`
			`s._db = None # no SQLite for these JSONL-focused tests`
			`s._loaded = True`
			`return s`

			`def test_skip_db_writes_jsonl_only(self, store, tmp_path):`
			`"""With skip_db=True, message appears in JSONL but not SQLite."""`
			`session_id = "test-skip-db"`
			`msg = {"role": "assistant", "content": "hello world"}`
			`store.append_to_transcript(session_id, msg, skip_db=True)`

			`# JSONL should have the message`
			`jsonl_path = store.get_transcript_path(session_id)`
			`assert jsonl_path.exists()`
			`with open(jsonl_path) as f:`
			`lines = f.readlines()`
			`assert len(lines) == 1`
			`parsed = json.loads(lines[0])`
			`assert parsed["content"] == "hello world"`

			`def test_skip_db_prevents_sqlite_write(self, tmp_path):`
			`"""With skip_db=True and a real DB, message does NOT appear in SQLite."""`
			`from gateway.config import GatewayConfig`
			`from gateway.session import SessionStore`
			`from hermes_state import SessionDB`

			`db_path = tmp_path / "test_skip.db"`
			`db = SessionDB(db_path=db_path)`

			`config = GatewayConfig()`
			`with patch("gateway.session.SessionStore._ensure_loaded"):`
			`store = SessionStore(sessions_dir=tmp_path, config=config)`
			`store._db = db`
			`store._loaded = True`

			`session_id = "test-skip-db-real"`
			`db.create_session(session_id=session_id, source="test")`

			`msg = {"role": "assistant", "content": "hello world"}`
			`store.append_to_transcript(session_id, msg, skip_db=True)`

			`# SQLite should NOT have the message`
			`rows = db.get_messages(session_id)`
			`assert len(rows) == 0, f"Expected 0 DB rows with skip_db=True, got {len(rows)}"`

			`# But JSONL should have it`
			`jsonl_path = store.get_transcript_path(session_id)`
			`with open(jsonl_path) as f:`
			`lines = f.readlines()`
			`assert len(lines) == 1`

			`def test_default_writes_both(self, tmp_path):`
			`"""Without skip_db, message appears in both JSONL and SQLite."""`
			`from gateway.config import GatewayConfig`
			`from gateway.session import SessionStore`
			`from hermes_state import SessionDB`

			`db_path = tmp_path / "test_both.db"`
			`db = SessionDB(db_path=db_path)`

			`config = GatewayConfig()`
			`with patch("gateway.session.SessionStore._ensure_loaded"):`
			`store = SessionStore(sessions_dir=tmp_path, config=config)`
			`store._db = db`
			`store._loaded = True`

			`session_id = "test-default-write"`
			`db.create_session(session_id=session_id, source="test")`

			`msg = {"role": "user", "content": "test message"}`
			`store.append_to_transcript(session_id, msg)`

			`# JSONL should have the message`
			`jsonl_path = store.get_transcript_path(session_id)`
			`with open(jsonl_path) as f:`
			`lines = f.readlines()`
			`assert len(lines) == 1`

			`# SQLite should also have the message`
			`rows = db.get_messages(session_id)`
			`assert len(rows) == 1`


			`# ---------------------------------------------------------------------------`
			`# Test: _last_flushed_db_idx initialization`
			`# ---------------------------------------------------------------------------`

			`class TestFlushIdxInit:`
			`"""Verify _last_flushed_db_idx is properly initialized."""`

			`def test_init_zero(self):`
			`"""Agent starts with _last_flushed_db_idx = 0."""`
			`with patch.dict(os.environ, {"OPENROUTER_API_KEY": "test-key"}):`
			`from run_agent import AIAgent`
			`agent = AIAgent(`
			`model="test/model",`
			`quiet_mode=True,`
			`skip_context_files=True,`
			`skip_memory=True,`
			`)`
			`assert agent._last_flushed_db_idx == 0`

			`def test_no_session_db_noop(self):`
			`"""Without session_db, flush is a no-op and doesn't crash."""`
			`with patch.dict(os.environ, {"OPENROUTER_API_KEY": "test-key"}):`
			`from run_agent import AIAgent`
			`agent = AIAgent(`
			`model="test/model",`
			`quiet_mode=True,`
			`skip_context_files=True,`
			`skip_memory=True,`
			`)`
			`messages = [{"role": "user", "content": "test"}]`
			`agent._flush_messages_to_session_db(messages, [])`
			`# Should not crash, idx should remain 0`
			`assert agent._last_flushed_db_idx == 0`