fix: replace eval() with AST-walking safe evaluator in calculator

Fixes #52 - Replace eval() in calculator() with _safe_eval() that walks the AST and only permits: numeric constants, arithmetic ops (+,-,*,/,//,%,**), unary +/-, math module access, and whitelisted builtins (abs, round, min, max) - Reject all other syntax: imports, attribute access on non-math objects, lambdas, comprehensions, string literals, etc. - Add 39 tests covering arithmetic, precedence, math functions, allowed builtins, error handling, and 14 injection prevention cases
2026-03-14 15:51:35 -04:00
parent 122d07471e
commit 70d5dc5ce1
2 changed files with 226 additions and 3 deletions
--- a/src/timmy/tools.py
+++ b/src/timmy/tools.py
@@ -13,6 +13,7 @@ Tools are assigned to agents based on their specialties.

 from __future__ import annotations

+import ast
 import logging
 import math
 from collections.abc import Callable
@@ -115,6 +116,59 @@ def get_tool_stats(agent_id: str | None = None) -> dict:
    return all_stats


+def _safe_eval(node, allowed_names: dict):
+    """Walk an AST and evaluate only safe numeric operations."""
+    if isinstance(node, ast.Expression):
+        return _safe_eval(node.body, allowed_names)
+    if isinstance(node, ast.Constant):
+        if isinstance(node.value, (int, float, complex)):
+            return node.value
+        raise ValueError(f"Unsupported constant: {node.value!r}")
+    if isinstance(node, ast.UnaryOp):
+        operand = _safe_eval(node.operand, allowed_names)
+        if isinstance(node.op, ast.UAdd):
+            return +operand
+        if isinstance(node.op, ast.USub):
+            return -operand
+        raise ValueError(f"Unsupported unary op: {type(node.op).__name__}")
+    if isinstance(node, ast.BinOp):
+        left = _safe_eval(node.left, allowed_names)
+        right = _safe_eval(node.right, allowed_names)
+        ops = {
+            ast.Add: lambda a, b: a + b,
+            ast.Sub: lambda a, b: a - b,
+            ast.Mult: lambda a, b: a * b,
+            ast.Div: lambda a, b: a / b,
+            ast.FloorDiv: lambda a, b: a // b,
+            ast.Mod: lambda a, b: a % b,
+            ast.Pow: lambda a, b: a**b,
+        }
+        op_fn = ops.get(type(node.op))
+        if op_fn is None:
+            raise ValueError(f"Unsupported binary op: {type(node.op).__name__}")
+        return op_fn(left, right)
+    if isinstance(node, ast.Name):
+        if node.id in allowed_names:
+            return allowed_names[node.id]
+        raise ValueError(f"Unknown name: {node.id!r}")
+    if isinstance(node, ast.Attribute):
+        value = _safe_eval(node.value, allowed_names)
+        # Only allow attribute access on the math module
+        if value is math:
+            attr = getattr(math, node.attr, None)
+            if attr is not None:
+                return attr
+        raise ValueError(f"Attribute access not allowed: .{node.attr}")
+    if isinstance(node, ast.Call):
+        func = _safe_eval(node.func, allowed_names)
+        if not callable(func):
+            raise ValueError(f"Not callable: {func!r}")
+        args = [_safe_eval(a, allowed_names) for a in node.args]
+        kwargs = {kw.arg: _safe_eval(kw.value, allowed_names) for kw in node.keywords}
+        return func(*args, **kwargs)
+    raise ValueError(f"Unsupported syntax: {type(node).__name__}")
+
+
 def calculator(expression: str) -> str:
    """Evaluate a mathematical expression and return the exact result.

@@ -128,15 +182,15 @@ def calculator(expression: str) -> str:
    Returns:
        The exact result as a string.
    """
-    # Only expose math functions — no builtins, no file/os access
    allowed_names = {k: getattr(math, k) for k in dir(math) if not k.startswith("_")}
-    allowed_names["math"] = math  # Support math.sqrt(), math.pi, etc.
+    allowed_names["math"] = math
    allowed_names["abs"] = abs
    allowed_names["round"] = round
    allowed_names["min"] = min
    allowed_names["max"] = max
    try:
-        result = eval(expression, {"__builtins__": {}}, allowed_names)  # noqa: S307
+        tree = ast.parse(expression, mode="eval")
+        result = _safe_eval(tree, allowed_names)
        return str(result)
    except Exception as e:
        return f"Error evaluating '{expression}': {e}"
--- a/tests/timmy/test_tools_calculator.py
+++ b/tests/timmy/test_tools_calculator.py
@@ -0,0 +1,169 @@
+"""Tests for the safe calculator tool (issue #52)."""
+
+from __future__ import annotations
+
+import math
+
+from timmy.tools import calculator
+
+# ── Basic arithmetic ──────────────────────────────────────────────
+
+
+class TestBasicArithmetic:
+    def test_addition(self):
+        assert calculator("2 + 3") == "5"
+
+    def test_subtraction(self):
+        assert calculator("10 - 4") == "6"
+
+    def test_multiplication(self):
+        assert calculator("347 * 829") == str(347 * 829)
+
+    def test_division(self):
+        assert calculator("10 / 3") == str(10 / 3)
+
+    def test_floor_division(self):
+        assert calculator("10 // 3") == "3"
+
+    def test_modulo(self):
+        assert calculator("10 % 3") == "1"
+
+    def test_exponent(self):
+        assert calculator("2**10") == "1024"
+
+    def test_negative_number(self):
+        assert calculator("-5 + 3") == "-2"
+
+    def test_unary_plus(self):
+        assert calculator("+5") == "5"
+
+
+# ── Parentheses and precedence ────────────────────────────────────
+
+
+class TestPrecedence:
+    def test_nested_parens(self):
+        assert calculator("(2 + 3) * (4 + 1)") == "25"
+
+    def test_deep_nesting(self):
+        assert calculator("((1 + 2) * (3 + 4)) + 5") == "26"
+
+    def test_operator_precedence(self):
+        assert calculator("2 + 3 * 4") == "14"
+
+
+# ── Math module functions ─────────────────────────────────────────
+
+
+class TestMathFunctions:
+    def test_sqrt(self):
+        assert calculator("math.sqrt(144)") == "12.0"
+
+    def test_log(self):
+        assert calculator("math.log(100, 10)") == str(math.log(100, 10))
+
+    def test_sin(self):
+        assert calculator("math.sin(0)") == "0.0"
+
+    def test_pi(self):
+        assert calculator("math.pi") == str(math.pi)
+
+    def test_e(self):
+        assert calculator("math.e") == str(math.e)
+
+    def test_ceil(self):
+        assert calculator("math.ceil(4.3)") == "5"
+
+    def test_floor(self):
+        assert calculator("math.floor(4.7)") == "4"
+
+    def test_bare_sqrt(self):
+        assert calculator("sqrt(16)") == "4.0"
+
+
+# ── Allowed builtins ──────────────────────────────────────────────
+
+
+class TestAllowedBuiltins:
+    def test_abs(self):
+        assert calculator("abs(-42)") == "42"
+
+    def test_round(self):
+        assert calculator("round(3.14159, 2)") == "3.14"
+
+    def test_min(self):
+        assert calculator("min(3, 1, 2)") == "1"
+
+    def test_max(self):
+        assert calculator("max(3, 1, 2)") == "3"
+
+
+# ── Error handling ────────────────────────────────────────────────
+
+
+class TestErrorHandling:
+    def test_division_by_zero(self):
+        result = calculator("1 / 0")
+        assert "Error" in result
+
+    def test_syntax_error(self):
+        result = calculator("2 +")
+        assert "Error" in result
+
+    def test_empty_expression(self):
+        result = calculator("")
+        assert "Error" in result
+
+
+# ── Injection attempts (the whole point of issue #52) ─────────────
+
+
+class TestInjectionPrevention:
+    def test_import_os(self):
+        result = calculator("__import__('os').system('echo hacked')")
+        assert "Error" in result
+        assert "Unknown name" in result or "Unsupported" in result
+
+    def test_builtins_access(self):
+        result = calculator("__builtins__")
+        assert "Error" in result
+
+    def test_dunder_class(self):
+        result = calculator("().__class__.__bases__[0].__subclasses__()")
+        assert "Error" in result
+
+    def test_exec(self):
+        result = calculator("exec('import os')")
+        assert "Error" in result
+
+    def test_eval_nested(self):
+        result = calculator("eval('1+1')")
+        assert "Error" in result
+
+    def test_open_file(self):
+        result = calculator("open('/etc/passwd').read()")
+        assert "Error" in result
+
+    def test_string_literal_rejected(self):
+        result = calculator("'hello'")
+        assert "Error" in result
+
+    def test_list_comprehension(self):
+        result = calculator("[x for x in range(10)]")
+        assert "Error" in result
+
+    def test_lambda(self):
+        result = calculator("(lambda: 1)()")
+        assert "Error" in result
+
+    def test_attribute_on_non_math(self):
+        result = calculator("(1).__class__")
+        assert "Error" in result
+
+    def test_globals(self):
+        result = calculator("globals()")
+        assert "Error" in result
+
+    def test_breakout_via_format(self):
+        result = calculator("'{}'.format.__globals__")
+        assert "Error" in result