Files
crewAI/lib/crewai-tools/tests/tools/test_code_interpreter_tool.py
Devin AI fefa6761f9 Fix command injection and sandbox escape in CodeInterpreterTool (#4516)
- Replace os.system() with subprocess.run() using list args in run_code_unsafe()
  to prevent command injection via malicious library names (CWE-78)
- Add BLOCKED_ATTRS set to SandboxPython to block dangerous dunder attributes
  (__class__, __bases__, __subclasses__, __mro__, __globals__, __code__,
  __reduce__, __reduce_ex__, __builtins__) that enable sandbox escape (CWE-94)
- Add getattr, setattr, delattr, type, breakpoint to UNSAFE_BUILTINS
- Add _check_for_blocked_attrs() pre-execution scan for blocked attribute patterns
- Add comprehensive tests for both vulnerabilities

Co-Authored-By: João <joao@crewai.com>
2026-02-19 11:29:42 +00:00

400 lines
13 KiB
Python

from unittest.mock import patch, MagicMock
from crewai_tools.tools.code_interpreter_tool.code_interpreter_tool import (
CodeInterpreterTool,
SandboxPython,
)
import pytest
@pytest.fixture
def printer_mock():
    """Yield a mock that stands in for ``Printer.print`` while a test runs."""
    target = "crewai_tools.printer.Printer.print"
    with patch(target) as patched_print:
        yield patched_print
@pytest.fixture
def docker_unavailable_mock():
    """Patch ``CodeInterpreterTool._check_docker_available`` to return ``False``.

    Yields the patched mock so a test can inspect it if needed.
    """
    target = (
        "crewai_tools.tools.code_interpreter_tool.code_interpreter_tool"
        ".CodeInterpreterTool._check_docker_available"
    )
    with patch(target, return_value=False) as availability_check:
        yield availability_check
@patch("crewai_tools.tools.code_interpreter_tool.code_interpreter_tool.docker_from_env")
def test_run_code_in_docker(docker_mock, printer_mock):
    """A zero exit code from the container yields its output as a string."""
    interpreter = CodeInterpreterTool()
    stdout = "Hello, World!\n"

    # Configure what the mocked container's exec_run() call reports.
    exec_result = (
        docker_mock.return_value.containers.run.return_value.exec_run.return_value
    )
    exec_result.exit_code = 0
    exec_result.output = stdout.encode()

    actual = interpreter.run_code_in_docker(
        "print('Hello, World!')", ["numpy", "pandas"]
    )

    assert actual == stdout
    printer_mock.assert_called_with(
        "Running code in Docker environment", color="bold_blue"
    )
@patch("crewai_tools.tools.code_interpreter_tool.code_interpreter_tool.docker_from_env")
def test_run_code_in_docker_with_error(docker_mock, printer_mock):
    """A non-zero exit code yields the failure prefix followed by the output."""
    interpreter = CodeInterpreterTool()
    container_output = b"ZeroDivisionError: division by zero\n"
    failure_message = (
        "Something went wrong while running the code: \n"
        "ZeroDivisionError: division by zero\n"
    )

    # Configure what the mocked container's exec_run() call reports.
    exec_result = (
        docker_mock.return_value.containers.run.return_value.exec_run.return_value
    )
    exec_result.exit_code = 1
    exec_result.output = container_output

    actual = interpreter.run_code_in_docker("print(1/0)", ["numpy", "pandas"])

    assert actual == failure_message
    printer_mock.assert_called_with(
        "Running code in Docker environment", color="bold_blue"
    )
@patch("crewai_tools.tools.code_interpreter_tool.code_interpreter_tool.docker_from_env")
def test_run_code_in_docker_with_script(docker_mock, printer_mock):
    """A multi-line script with no extra libraries returns the mocked output."""
    interpreter = CodeInterpreterTool()
    script = 'print("This is line 1")\nprint("This is line 2")'
    stdout = "This is line 1\nThis is line 2\n"

    # Configure what the mocked container's exec_run() call reports.
    exec_result = (
        docker_mock.return_value.containers.run.return_value.exec_run.return_value
    )
    exec_result.exit_code = 0
    exec_result.output = stdout.encode()

    actual = interpreter.run_code_in_docker(script, [])

    assert actual == stdout
    printer_mock.assert_called_with(
        "Running code in Docker environment", color="bold_blue"
    )
def test_restricted_sandbox_basic_code_execution(printer_mock, docker_unavailable_mock):
    """Simple arithmetic runs in the restricted sandbox and returns ``result``."""
    interpreter = CodeInterpreterTool()
    snippet = "\nresult = 2 + 2\nprint(result)\n"

    outcome = interpreter.run(code=snippet, libraries_used=[])

    printer_mock.assert_called_with(
        "Running code in restricted sandbox", color="yellow"
    )
    assert outcome == 4
def test_restricted_sandbox_running_with_blocked_modules(
    printer_mock, docker_unavailable_mock
):
    """Importing any module in ``SandboxPython.BLOCKED_MODULES`` is refused."""
    interpreter = CodeInterpreterTool()

    for module_name in SandboxPython.BLOCKED_MODULES:
        snippet = f'\nimport {module_name}\nresult = "Import succeeded"\n'
        outcome = interpreter.run(code=snippet, libraries_used=[])

        printer_mock.assert_called_with(
            "Running code in restricted sandbox", color="yellow"
        )
        expected_error = (
            f"An error occurred: Importing '{module_name}' is not allowed"
        )
        assert expected_error in outcome
def test_restricted_sandbox_running_with_blocked_builtins(
    printer_mock, docker_unavailable_mock
):
    """Calling any name in ``SandboxPython.UNSAFE_BUILTINS`` reports it as undefined."""
    interpreter = CodeInterpreterTool()

    for builtin_name in SandboxPython.UNSAFE_BUILTINS:
        snippet = f'\n{builtin_name}("test")\nresult = "Builtin available"\n'
        outcome = interpreter.run(code=snippet, libraries_used=[])

        printer_mock.assert_called_with(
            "Running code in restricted sandbox", color="yellow"
        )
        expected_error = f"An error occurred: name '{builtin_name}' is not defined"
        assert expected_error in outcome
def test_restricted_sandbox_running_with_no_result_variable(
    printer_mock, docker_unavailable_mock
):
    """Sandboxed code that never assigns ``result`` returns the fallback message."""
    interpreter = CodeInterpreterTool()
    snippet = "\nx = 10\n"

    outcome = interpreter.run(code=snippet, libraries_used=[])

    printer_mock.assert_called_with(
        "Running code in restricted sandbox", color="yellow"
    )
    assert outcome == "No result variable found."
def test_unsafe_mode_running_with_no_result_variable(
    printer_mock, docker_unavailable_mock
):
    """Unsafe-mode code that never assigns ``result`` returns the fallback message."""
    interpreter = CodeInterpreterTool(unsafe_mode=True)
    snippet = "\nx = 10\n"

    outcome = interpreter.run(code=snippet, libraries_used=[])

    printer_mock.assert_called_with(
        "WARNING: Running code in unsafe mode", color="bold_magenta"
    )
    assert outcome == "No result variable found."
def test_unsafe_mode_running_unsafe_code(printer_mock, docker_unavailable_mock):
    """Unsafe mode runs code that imports ``os`` and calls ``eval``.

    The snippet imports ``os``, invokes ``os.system`` and uses ``eval`` to
    compute ``result``; the test checks that the unsafe-mode warning is
    printed and that the evaluated value is returned.
    """
    tool = CodeInterpreterTool(unsafe_mode=True)
    code = """
import os
os.system("ls -la")
result = eval("5/1")
"""
    result = tool.run(code=code, libraries_used=[])
    printer_mock.assert_called_with(
        "WARNING: Running code in unsafe mode", color="bold_magenta"
    )
    # Actual value on the left, matching the other assertions in this module.
    assert result == 5.0
class TestCommandInjectionPrevention:
    """Tests for command injection prevention in unsafe mode (CWE-78).

    Every test patches ``subprocess.run`` as referenced from the tool module
    and checks that ``run_code_unsafe`` passes each library name to pip as a
    single element of an argument list, with no shell string being built.
    """

    # Patch target shared by all tests in this class.
    _SUBPROCESS_RUN = (
        "crewai_tools.tools.code_interpreter_tool.code_interpreter_tool.subprocess.run"
    )

    @patch(_SUBPROCESS_RUN)
    def test_unsafe_mode_uses_subprocess_run_with_list_args(
        self, subprocess_mock, printer_mock
    ):
        """Verify libraries are installed via subprocess.run with list args, not os.system."""
        tool = CodeInterpreterTool(unsafe_mode=True)
        code = "result = 'done'"
        tool.run_code_unsafe(code, ["numpy"])
        subprocess_mock.assert_called_once_with(
            ["pip", "install", "numpy"],
            check=True,
            capture_output=True,
        )

    @patch(_SUBPROCESS_RUN)
    def test_unsafe_mode_library_with_shell_metacharacters(
        self, subprocess_mock, printer_mock
    ):
        """Ensure shell metacharacters in library names are not interpreted."""
        tool = CodeInterpreterTool(unsafe_mode=True)
        malicious_lib = "numpy; id #"
        code = "result = 'done'"
        tool.run_code_unsafe(code, [malicious_lib])
        # The whole payload must arrive as one argv element, untouched.
        subprocess_mock.assert_called_once_with(
            ["pip", "install", "numpy; id #"],
            check=True,
            capture_output=True,
        )

    @patch(_SUBPROCESS_RUN)
    def test_unsafe_mode_library_with_command_substitution(
        self, subprocess_mock, printer_mock
    ):
        """Ensure ``&&`` command chaining in library names is not executed.

        The payload here chains a second command with ``&&``; backtick
        substitution is exercised by the backtick test in this class.
        """
        tool = CodeInterpreterTool(unsafe_mode=True)
        malicious_lib = "numpy && rm -rf /"
        code = "result = 'done'"
        tool.run_code_unsafe(code, [malicious_lib])
        subprocess_mock.assert_called_once_with(
            ["pip", "install", "numpy && rm -rf /"],
            check=True,
            capture_output=True,
        )

    @patch(_SUBPROCESS_RUN)
    def test_unsafe_mode_library_with_backtick_injection(
        self, subprocess_mock, printer_mock
    ):
        """Ensure backtick command injection is not executed."""
        tool = CodeInterpreterTool(unsafe_mode=True)
        malicious_lib = "numpy`whoami`"
        code = "result = 'done'"
        tool.run_code_unsafe(code, [malicious_lib])
        subprocess_mock.assert_called_once_with(
            ["pip", "install", "numpy`whoami`"],
            check=True,
            capture_output=True,
        )

    @patch(_SUBPROCESS_RUN)
    def test_unsafe_mode_multiple_libraries_installed_separately(
        self, subprocess_mock, printer_mock
    ):
        """Each library is installed in a separate subprocess call."""
        tool = CodeInterpreterTool(unsafe_mode=True)
        code = "result = 'done'"
        tool.run_code_unsafe(code, ["numpy", "pandas"])
        assert subprocess_mock.call_count == 2
        # Counting calls alone would also pass if both names were merged into
        # one command and run twice; pin the argv list of each call.
        installed = [
            invocation.args[0] for invocation in subprocess_mock.call_args_list
        ]
        assert installed == [
            ["pip", "install", "numpy"],
            ["pip", "install", "pandas"],
        ]
class TestSandboxEscapePrevention:
    """Tests for sandbox escape prevention via object introspection (CWE-94).

    Each test runs a snippet through ``CodeInterpreterTool.run`` with Docker
    reported as unavailable and checks the returned message. Snippets are
    written at column 0 inside the triple-quoted strings because they are
    executed as standalone module-level code.
    """

    def test_sandbox_blocks_class_attribute(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent sandbox escape via __class__ introspection."""
        tool = CodeInterpreterTool()
        code = """
result = ().__class__
"""
        result = tool.run(code=code, libraries_used=[])
        assert "Access to '__class__' is not allowed" in result

    def test_sandbox_blocks_bases_attribute(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent sandbox escape via __bases__ introspection."""
        tool = CodeInterpreterTool()
        code = """
result = object.__bases__
"""
        result = tool.run(code=code, libraries_used=[])
        assert "Access to '__bases__' is not allowed" in result

    def test_sandbox_blocks_subclasses_method(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent sandbox escape via __subclasses__ introspection."""
        tool = CodeInterpreterTool()
        code = """
result = object.__subclasses__()
"""
        result = tool.run(code=code, libraries_used=[])
        assert "Access to '__subclasses__' is not allowed" in result

    def test_sandbox_blocks_mro_attribute(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent sandbox escape via __mro__ introspection."""
        tool = CodeInterpreterTool()
        code = """
result = int.__mro__
"""
        result = tool.run(code=code, libraries_used=[])
        assert "Access to '__mro__' is not allowed" in result

    def test_sandbox_blocks_globals_attribute(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent sandbox escape via __globals__ introspection."""
        tool = CodeInterpreterTool()
        code = """
def f(): pass
result = f.__globals__
"""
        result = tool.run(code=code, libraries_used=[])
        assert "Access to '__globals__' is not allowed" in result

    def test_sandbox_blocks_builtins_attribute(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent sandbox escape via __builtins__ access."""
        tool = CodeInterpreterTool()
        code = """
result = __builtins__
"""
        result = tool.run(code=code, libraries_used=[])
        assert "Access to '__builtins__' is not allowed" in result

    def test_sandbox_blocks_full_introspection_chain(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent the full sandbox escape PoC from the issue."""
        tool = CodeInterpreterTool()
        # The loop body is indented so the payload is syntactically valid
        # Python; the rejection must come from the sandbox, not a parse error.
        code = """
for c in ().__class__.__bases__[0].__subclasses__():
    if c.__name__ == 'BuiltinImporter':
        result = c.load_module('os').system('id')
        break
"""
        result = tool.run(code=code, libraries_used=[])
        assert "is not allowed" in result

    def test_sandbox_blocks_getattr_builtin(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent sandbox escape via getattr builtin."""
        tool = CodeInterpreterTool()
        code = """
result = getattr(object, '__subclasses__')()
"""
        result = tool.run(code=code, libraries_used=[])
        # NOTE(review): this snippet uses both a removed builtin and a blocked
        # attribute name, so which check fires first is not visible from this
        # file; only the generic error prefix is asserted.
        assert "An error occurred" in result

    def test_sandbox_blocks_type_builtin(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent sandbox escape via type builtin."""
        tool = CodeInterpreterTool()
        code = """
result = type('X', (object,), {})
"""
        result = tool.run(code=code, libraries_used=[])
        # Pin the specific failure: any unrelated error would also contain the
        # generic "An error occurred" prefix.
        assert "An error occurred: name 'type' is not defined" in result

    def test_sandbox_blocks_code_attribute(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent sandbox escape via __code__ attribute."""
        tool = CodeInterpreterTool()
        code = """
def f(): pass
result = f.__code__
"""
        result = tool.run(code=code, libraries_used=[])
        assert "Access to '__code__' is not allowed" in result

    def test_sandbox_allows_normal_code(
        self, printer_mock, docker_unavailable_mock
    ):
        """Ensure normal code still works in sandbox."""
        tool = CodeInterpreterTool()
        code = """
data = [1, 2, 3, 4, 5]
result = sum(data) * 2
"""
        result = tool.run(code=code, libraries_used=[])
        assert result == 30

    def test_sandbox_blocks_reduce_attribute(
        self, printer_mock, docker_unavailable_mock
    ):
        """Prevent sandbox escape via __reduce__ for pickle attacks."""
        tool = CodeInterpreterTool()
        code = """
result = [].__reduce__()
"""
        result = tool.run(code=code, libraries_used=[])
        assert "Access to '__reduce__' is not allowed" in result