This repository has been archived on 2026-03-24. You can view files and clone it. You cannot open issues or pull requests or push a commit.
Files
Timmy-time-dashboard/tests/test_calculator.py
Alexander Payne 6e6b4355bb fix: calculator tool, markdown rendering, prompt guardrails, briefing notification
- Add sandboxed calculator tool to Timmy's toolkit so arithmetic questions
  get exact answers instead of LLM hallucinations
- Update system prompts (lite + full) to instruct Timmy to always use the
  calculator and never attempt multi-digit math in his head
- Add self-contradiction guard to both prompts ("commit to your facts")
- Render Timmy's chat responses as markdown via marked.js + DOMPurify
  instead of raw escaped text
- Suppress empty briefing notification on startup when there are 0
  pending approval items
- Add calculator to session response sanitizer regex
- 18 new calculator tests, 2 updated briefing notification tests

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-26 09:35:59 -05:00

86 lines
1.9 KiB
Python

"""Tests for the calculator tool."""
from timmy.tools import calculator
def test_basic_multiplication():
assert calculator("347 * 829") == "287663"
def test_basic_addition():
assert calculator("100 + 200") == "300"
def test_basic_division():
assert calculator("100 / 4") == "25.0"
def test_integer_division():
assert calculator("100 // 3") == "33"
def test_exponentiation():
assert calculator("2 ** 10") == "1024"
def test_sqrt():
assert calculator("math.sqrt(17161)") == "131.0"
def test_sqrt_non_perfect():
result = float(calculator("math.sqrt(2)"))
assert abs(result - 1.4142135623730951) < 1e-10
def test_log_base_10():
result = float(calculator("math.log10(1000)"))
assert abs(result - 3.0) < 1e-10
def test_log_natural():
result = float(calculator("math.log(math.e)"))
assert abs(result - 1.0) < 1e-10
def test_trig_sin():
result = float(calculator("math.sin(math.pi / 2)"))
assert abs(result - 1.0) < 1e-10
def test_abs_builtin():
assert calculator("abs(-42)") == "42"
def test_round_builtin():
assert calculator("round(3.14159, 2)") == "3.14"
def test_min_max_builtins():
assert calculator("min(3, 7, 1)") == "1"
assert calculator("max(3, 7, 1)") == "7"
def test_complex_expression():
assert calculator("(347 * 829) + (100 / 4)") == "287688.0"
def test_invalid_expression_returns_error():
result = calculator("not a valid expression")
assert result.startswith("Error evaluating")
def test_no_builtins_access():
"""Ensure dangerous builtins like __import__ are blocked."""
result = calculator("__import__('os').system('echo pwned')")
assert result.startswith("Error evaluating")
def test_no_open_access():
result = calculator("open('/etc/passwd').read()")
assert result.startswith("Error evaluating")
def test_division_by_zero():
result = calculator("1 / 0")
assert result.startswith("Error evaluating")