Files
hermes-agent/tests/run_agent/test_strict_api_validation.py
Siddharth Balyan f3006ebef9 refactor(tests): re-architect tests + fix CI failures (#5946)
* refactor: re-architect tests to mirror the codebase

* Update tests.yml

* fix: add missing tool_error imports after registry refactor

* fix(tests): replace patch.dict with monkeypatch to prevent env var leaks under xdist

patch.dict(os.environ) can leak TERMINAL_ENV across xdist workers,
causing test_code_execution tests to hit the Modal remote path.

* fix(tests): fix update_check and telegram xdist failures

- test_update_check: replace patch("hermes_cli.banner.os.getenv") with
  monkeypatch.setenv("HERMES_HOME") — banner.py no longer imports os
  directly, it uses get_hermes_home() from hermes_constants.

- test_telegram_conflict/approval_buttons: provide real exception classes
  for telegram.error mock (NetworkError, TimedOut, BadRequest) so the
  except clause in connect() doesn't fail with "catching classes that do
  not inherit from BaseException" when xdist pollutes sys.modules.

* fix(tests): accept unavailable_models kwarg in _prompt_model_selection mock
2026-04-07 17:19:07 -07:00

145 lines
5.0 KiB
Python

"""Test validation error prevention for strict APIs (Fireworks, etc.)"""
import sys
import types
from unittest.mock import patch, MagicMock
import pytest
sys.modules.setdefault("fire", types.SimpleNamespace(Fire=lambda *a, **k: None))
sys.modules.setdefault("firecrawl", types.SimpleNamespace(Firecrawl=object))
sys.modules.setdefault("fal_client", types.SimpleNamespace())
from run_agent import AIAgent
# ── Helpers ──────────────────────────────────────────────────────────────────
def _tool_defs(*names):
return [
{
"type": "function",
"function": {
"name": n,
"description": f"{n} tool",
"parameters": {"type": "object", "properties": {}},
},
}
for n in names
]
class _FakeOpenAI:
def __init__(self, **kw):
self.api_key = kw.get("api_key", "test")
self.base_url = kw.get("base_url", "http://test")
def close(self):
pass
def _make_agent(monkeypatch, provider, api_mode="chat_completions", base_url="https://openrouter.ai/api/v1"):
monkeypatch.setattr("run_agent.get_tool_definitions", lambda **kw: _tool_defs("web_search", "terminal"))
monkeypatch.setattr("run_agent.check_toolset_requirements", lambda: {})
monkeypatch.setattr("run_agent.OpenAI", _FakeOpenAI)
return AIAgent(
api_key="test",
base_url=base_url,
provider=provider,
api_mode=api_mode,
max_iterations=4,
quiet_mode=True,
skip_context_files=True,
skip_memory=True,
)
class TestStrictApiValidation:
"""Verify tool_call field sanitization prevents 400 errors on strict APIs."""
def test_fireworks_compatible_messages_after_sanitization(self, monkeypatch):
"""Messages should be Fireworks-compatible after sanitization."""
agent = _make_agent(monkeypatch, "openrouter")
agent.api_mode = "chat_completions" # Fireworks uses chat completions
messages = [
{"role": "user", "content": "hi"},
{
"role": "assistant",
"content": "Checking now.",
"tool_calls": [
{
"id": "call_123",
"call_id": "call_123", # Codex-only field
"response_item_id": "fc_123", # Codex-only field
"type": "function",
"function": {"name": "terminal", "arguments": '{"command":"pwd"}'},
}
],
},
{"role": "tool", "tool_call_id": "call_123", "content": "/tmp"},
]
# After _build_api_kwargs, Codex fields should be stripped
kwargs = agent._build_api_kwargs(messages)
assistant_msg = kwargs["messages"][1]
tool_call = assistant_msg["tool_calls"][0]
# Fireworks rejects these fields
assert "call_id" not in tool_call
assert "response_item_id" not in tool_call
# Standard fields should remain
assert tool_call["id"] == "call_123"
assert tool_call["function"]["name"] == "terminal"
def test_codex_preserves_fields_for_replay(self, monkeypatch):
"""Codex mode should preserve fields for Responses API replay."""
agent = _make_agent(monkeypatch, "openrouter")
agent.api_mode = "codex_responses"
messages = [
{"role": "user", "content": "hi"},
{
"role": "assistant",
"content": "Checking now.",
"tool_calls": [
{
"id": "call_123",
"call_id": "call_123",
"response_item_id": "fc_123",
"type": "function",
"function": {"name": "terminal", "arguments": '{"command":"pwd"}'},
}
],
},
]
# In Codex mode, original messages should NOT be mutated
assert messages[1]["tool_calls"][0]["call_id"] == "call_123"
assert messages[1]["tool_calls"][0]["response_item_id"] == "fc_123"
def test_sanitize_method_with_fireworks_provider(self, monkeypatch):
"""Simulating Fireworks provider should trigger sanitization."""
agent = _make_agent(
monkeypatch,
"fireworks",
api_mode="chat_completions",
base_url="https://api.fireworks.ai/inference/v1"
)
# Should sanitize for Fireworks (chat_completions mode)
assert agent._should_sanitize_tool_calls() is True
def test_no_sanitize_for_codex_responses(self, monkeypatch):
"""Codex responses mode should NOT sanitize."""
agent = _make_agent(
monkeypatch,
"openai",
api_mode="codex_responses",
base_url="https://api.openai.com/v1"
)
# Should NOT sanitize for Codex
assert agent._should_sanitize_tool_calls() is False