- Remove _extract_raw_output: persist content verbatim (fixes size mismatch bug) - Drop import aliases: import from budget_config directly, one canonical name - BudgetConfig param on maybe_persist_tool_result and enforce_turn_budget - read_file: limit=None signature, pre-read guard fires only when limit omitted (256KB) - Unify binary extensions: file_operations.py imports from binary_extensions.py - Exclude .pdf and .svg from binary set (text-based, agents may inspect) - Remove redundant outer try/except in eval path (internal fallback handles it) - Fix broken tests: update assertion strings for new persistence format - Module-level constants: _PRE_READ_MAX_BYTES, _DEFAULT_READ_LIMIT - Remove redundant pathlib import (Path already at module level) - Update spec.md with IMPLEMENTED annotations and design decisions
43 lines
1.5 KiB
Python
43 lines
1.5 KiB
Python
"""Binary file extensions to skip for text-based operations.
|
|
|
|
These files can't be meaningfully compared as text and are often large.
|
|
Ported from free-code src/constants/files.ts.
|
|
"""
|
|
|
|
BINARY_EXTENSIONS = frozenset({
|
|
# Images
|
|
".png", ".jpg", ".jpeg", ".gif", ".bmp", ".ico", ".webp", ".tiff", ".tif",
|
|
# Videos
|
|
".mp4", ".mov", ".avi", ".mkv", ".webm", ".wmv", ".flv", ".m4v", ".mpeg", ".mpg",
|
|
# Audio
|
|
".mp3", ".wav", ".ogg", ".flac", ".aac", ".m4a", ".wma", ".aiff", ".opus",
|
|
# Archives
|
|
".zip", ".tar", ".gz", ".bz2", ".7z", ".rar", ".xz", ".z", ".tgz", ".iso",
|
|
# Executables/binaries
|
|
".exe", ".dll", ".so", ".dylib", ".bin", ".o", ".a", ".obj", ".lib",
|
|
".app", ".msi", ".deb", ".rpm",
|
|
# Documents (exclude .pdf — text-based, agents may want to inspect)
|
|
".doc", ".docx", ".xls", ".xlsx", ".ppt", ".pptx",
|
|
".odt", ".ods", ".odp",
|
|
# Fonts
|
|
".ttf", ".otf", ".woff", ".woff2", ".eot",
|
|
# Bytecode / VM artifacts
|
|
".pyc", ".pyo", ".class", ".jar", ".war", ".ear", ".node", ".wasm", ".rlib",
|
|
# Database files
|
|
".sqlite", ".sqlite3", ".db", ".mdb", ".idx",
|
|
# Design / 3D
|
|
".psd", ".ai", ".eps", ".sketch", ".fig", ".xd", ".blend", ".3ds", ".max",
|
|
# Flash
|
|
".swf", ".fla",
|
|
# Lock/profiling data
|
|
".lockb", ".dat", ".data",
|
|
})
|
|
|
|
|
|
def has_binary_extension(path: str) -> bool:
|
|
"""Check if a file path has a binary extension. Pure string check, no I/O."""
|
|
dot = path.rfind(".")
|
|
if dot == -1:
|
|
return False
|
|
return path[dot:].lower() in BINARY_EXTENSIONS
|