Mirror of https://github.com/crewAIInc/crewAI.git, synced 2026-01-24 23:58:15 +00:00
Fix #3242: Add reasoning parameter to LLM class to disable reasoning mode
- Add reasoning parameter to LLM.__init__() method
- Implement logic in _prepare_completion_params to handle reasoning=False
- Add comprehensive tests for reasoning parameter functionality
- Ensure reasoning=False overrides reasoning_effort parameter
- Add integration test with Agent class

The fix ensures that when reasoning=False is set, the reasoning_effort parameter is not included in the LLM completion call, effectively disabling reasoning mode for models like Qwen and Cogito with Ollama.

Co-Authored-By: João <joao@crewai.com>
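In essence, the change gates reasoning_effort on the new reasoning flag while building the completion kwargs. The standalone helper below is only a sketch of that behavior: the actual change lives in LLM._prepare_completion_params, whose surrounding code is not part of this diff, so the function name, signature, and params construction here are assumptions.

from typing import Any, Optional

def prepare_completion_params(
    model: str,
    messages: list[dict[str, str]],
    reasoning: Optional[bool] = None,
    reasoning_effort: Optional[str] = None,
    **extra: Any,
) -> dict[str, Any]:
    """Illustrative sketch of the reasoning gate described in the commit message."""
    params: dict[str, Any] = {"model": model, "messages": messages, **extra}
    # reasoning=False takes precedence over reasoning_effort: the key is simply
    # never added, so litellm.completion() receives no reasoning_effort and models
    # such as Qwen or Cogito via Ollama run with reasoning mode off.
    # reasoning=None (the default) preserves the previous behavior.
    if reasoning is not False and reasoning_effort is not None:
        params["reasoning_effort"] = reasoning_effort
    return params

This is exactly what the tests below assert: with reasoning=False the reasoning_effort key must be absent from the litellm.completion call, while reasoning=True or reasoning=None forwards it unchanged.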
@@ -2,6 +2,7 @@
import json
import pytest
from unittest.mock import patch

from crewai import Agent, Task
from crewai.llm import LLM
@@ -259,3 +260,31 @@ def test_agent_with_function_calling_fallback():
    assert result == "4"
    assert "Reasoning Plan:" in task.description
    assert "Invalid JSON that will trigger fallback" in task.description


def test_agent_with_llm_reasoning_disabled():
    """Test agent with LLM reasoning disabled."""
    llm = LLM("gpt-3.5-turbo", reasoning=False)

    agent = Agent(
        role="Test Agent",
        goal="To test the LLM reasoning parameter",
        backstory="I am a test agent created to verify the LLM reasoning parameter works correctly.",
        llm=llm,
        reasoning=False,
        verbose=True
    )

    task = Task(
        description="Simple math task: What's 3+3?",
        expected_output="The answer should be a number.",
        agent=agent
    )

    with patch.object(agent.llm, 'call') as mock_call:
        mock_call.return_value = "6"

        result = agent.execute_task(task)

        assert result == "6"
        assert "Reasoning Plan:" not in task.description
@@ -711,3 +711,99 @@ def test_ollama_does_not_modify_when_last_is_user(ollama_llm):
    formatted = ollama_llm._format_messages_for_provider(original_messages)

    assert formatted == original_messages


def test_llm_reasoning_parameter_false():
    """Test that reasoning=False disables reasoning mode."""
    llm = LLM(model="ollama/qwen", reasoning=False)

    with patch("litellm.completion") as mock_completion:
        mock_message = MagicMock()
        mock_message.content = "Test response"
        mock_choice = MagicMock()
        mock_choice.message = mock_message
        mock_response = MagicMock()
        mock_response.choices = [mock_choice]
        mock_response.usage = {"prompt_tokens": 5, "completion_tokens": 5, "total_tokens": 10}
        mock_completion.return_value = mock_response

        llm.call("Test message")

        _, kwargs = mock_completion.call_args
        assert "reasoning_effort" not in kwargs


def test_llm_reasoning_parameter_true():
    """Test that reasoning=True enables reasoning mode."""
    llm = LLM(model="ollama/qwen", reasoning=True, reasoning_effort="medium")

    with patch("litellm.completion") as mock_completion:
        mock_message = MagicMock()
        mock_message.content = "Test response"
        mock_choice = MagicMock()
        mock_choice.message = mock_message
        mock_response = MagicMock()
        mock_response.choices = [mock_choice]
        mock_response.usage = {"prompt_tokens": 5, "completion_tokens": 5, "total_tokens": 10}
        mock_completion.return_value = mock_response

        llm.call("Test message")

        _, kwargs = mock_completion.call_args
        assert kwargs["reasoning_effort"] == "medium"


def test_llm_reasoning_parameter_none_with_reasoning_effort():
    """Test that reasoning=None with reasoning_effort still includes reasoning_effort."""
    llm = LLM(model="ollama/qwen", reasoning=None, reasoning_effort="high")

    with patch("litellm.completion") as mock_completion:
        mock_message = MagicMock()
        mock_message.content = "Test response"
        mock_choice = MagicMock()
        mock_choice.message = mock_message
        mock_response = MagicMock()
        mock_response.choices = [mock_choice]
        mock_response.usage = {"prompt_tokens": 5, "completion_tokens": 5, "total_tokens": 10}
        mock_completion.return_value = mock_response

        llm.call("Test message")

        _, kwargs = mock_completion.call_args
        assert kwargs["reasoning_effort"] == "high"


def test_llm_reasoning_false_overrides_reasoning_effort():
    """Test that reasoning=False overrides reasoning_effort."""
    llm = LLM(model="ollama/qwen", reasoning=False, reasoning_effort="high")

    with patch("litellm.completion") as mock_completion:
        mock_message = MagicMock()
        mock_message.content = "Test response"
        mock_choice = MagicMock()
        mock_choice.message = mock_message
        mock_response = MagicMock()
        mock_response.choices = [mock_choice]
        mock_response.usage = {"prompt_tokens": 5, "completion_tokens": 5, "total_tokens": 10}
        mock_completion.return_value = mock_response

        llm.call("Test message")

        _, kwargs = mock_completion.call_args
        assert "reasoning_effort" not in kwargs


@pytest.mark.vcr(filter_headers=["authorization"])
def test_ollama_qwen_with_reasoning_disabled():
    """Test Ollama Qwen model with reasoning disabled."""
    if not os.getenv("OLLAMA_BASE_URL"):
        pytest.skip("OLLAMA_BASE_URL not set; skipping test.")

    llm = LLM(
        model="ollama/qwen",
        base_url=os.getenv("OLLAMA_BASE_URL", "http://localhost:11434"),
        reasoning=False
    )
    result = llm.call("What is 2+2?")
    assert isinstance(result, str)
    assert len(result.strip()) > 0
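For context, the user-facing pattern that the integration test above exercises would look roughly like this; the model name, base URL, and agent/task fields are example values taken from the tests, not part of the commit itself.

from crewai import Agent, Task
from crewai.llm import LLM

# reasoning=False keeps reasoning_effort out of the completion call, which is
# the behavior asserted by the tests above; model and base_url are examples.
llm = LLM(model="ollama/qwen", base_url="http://localhost:11434", reasoning=False)

agent = Agent(
    role="Calculator",
    goal="Answer small arithmetic questions",
    backstory="A minimal agent used to demonstrate disabling reasoning mode.",
    llm=llm,
)
task = Task(
    description="What is 2+2?",
    expected_output="A number.",
    agent=agent,
)
print(agent.execute_task(task))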