From 92dd7feec24806d1033153711716b8d5a135d68a Mon Sep 17 00:00:00 2001
From: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com>
Date: Fri, 21 Feb 2025 18:28:19 +0000
Subject: [PATCH] refactor: Improve Mistral LLM implementation based on
 feedback

- Add MISTRAL_IDENTIFIERS constant
- Use deepcopy for message copying
- Add type annotations
- Improve test organization and add edge cases
- Add error handling and logging

Co-Authored-By: Joe Moura <joao@crewai.com>
---
 src/crewai/llm.py | 24 ++++++++++++-----
 tests/llm_test.py | 67 ++++++++++++++++++++++++++++++++++++-----------
 2 files changed, 70 insertions(+), 21 deletions(-)

diff --git a/src/crewai/llm.py b/src/crewai/llm.py
index 975172055..d730ff7a3 100644
--- a/src/crewai/llm.py
+++ b/src/crewai/llm.py
@@ -21,6 +21,8 @@ from typing import (
 from dotenv import load_dotenv
 from pydantic import BaseModel
 
+logger = logging.getLogger(__name__)
+
 from crewai.utilities.events.tool_usage_events import ToolExecutionErrorEvent
 
 with warnings.catch_warnings():
@@ -133,6 +135,9 @@ def suppress_warnings():
 
 
 class LLM:
+    # Constants for model identification
+    MISTRAL_IDENTIFIERS = {'mistral', 'mixtral'}
+
     def __init__(
         self,
         model: str,
@@ -392,9 +397,11 @@ class LLM:
         Returns:
             List of formatted messages according to provider requirements.
             For Anthropic models, ensures first message has 'user' role.
+            For Mistral models, converts 'assistant' roles to 'user' roles.
 
         Raises:
             TypeError: If messages is None or contains invalid message format.
+            Exception: If message formatting fails for any provider-specific reason.
         """
         if messages is None:
             raise TypeError("Messages cannot be None")
@@ -407,12 +414,17 @@ class LLM:
                 )
 
         # Handle Mistral role requirements
-        if "mistral" in self.model.lower():
-            messages_copy = [dict(message) for message in messages]  # Deep copy
-            for message in messages_copy:
-                if message.get("role") == "assistant":
-                    message["role"] = "user"
-            return messages_copy
+        if any(identifier in self.model.lower() for identifier in self.MISTRAL_IDENTIFIERS):
+            try:
+                from copy import deepcopy
+                messages_copy = deepcopy(messages)
+                for message in messages_copy:
+                    if message.get("role") == "assistant":
+                        message["role"] = "user"
+                return messages_copy
+            except Exception as e:
+                logger.error(f"Error formatting messages for Mistral: {str(e)}")
+                raise
 
         if not self.is_anthropic:
             return messages
diff --git a/tests/llm_test.py b/tests/llm_test.py
index 02fce4fd8..f1bfa9c76 100644
--- a/tests/llm_test.py
+++ b/tests/llm_test.py
@@ -14,24 +14,61 @@ from crewai.utilities.token_counter_callback import TokenCalcHandler
 
 # TODO: This test fails without print statement, which makes me think that something is happening asynchronously that we need to eventually fix and dive deeper into at a later date
 @pytest.mark.vcr(filter_headers=["authorization"])
-@pytest.mark.vcr(filter_headers=["authorization"])
-def test_mistral_with_tools():
-    """Test that Mistral LLM correctly handles role requirements with tools."""
-    llm = LLM(model="mistral/mistral-large-latest")
-    messages = [
-        {"role": "user", "content": "Test message"},
-        {"role": "assistant", "content": "Assistant response"}
-    ]
+@pytest.mark.mistral
+class TestMistralLLM:
+    """Test suite for Mistral LLM functionality."""
     
-    # Get the formatted messages
-    formatted_messages = llm._format_messages_for_provider(messages)
+    @pytest.fixture
+    def mistral_llm(self):
+        """Fixture providing a Mistral LLM instance."""
+        return LLM(model="mistral/mistral-large-latest")
     
-    # Verify that assistant role was changed to user for Mistral
-    assert any(msg["role"] == "user" for msg in formatted_messages if msg["content"] == "Assistant response")
-    assert not any(msg["role"] == "assistant" for msg in formatted_messages)
+    def test_mistral_role_handling(self, mistral_llm):
+        """
+        Verify that roles are handled correctly in various scenarios:
+        - Assistant roles are converted to user roles
+        - Original messages remain unchanged
+        - System messages are preserved
+        """
+        messages = [
+            {"role": "system", "content": "System message"},
+            {"role": "user", "content": "Test message"},
+            {"role": "assistant", "content": "Assistant response"}
+        ]
+        
+        formatted_messages = mistral_llm._format_messages_for_provider(messages)
+        
+        # Verify role conversions
+        assert any(msg["role"] == "user" for msg in formatted_messages if msg["content"] == "Assistant response")
+        assert not any(msg["role"] == "assistant" for msg in formatted_messages)
+        assert any(msg["role"] == "system" for msg in formatted_messages)
+        
+        # Original messages should not be modified
+        assert any(msg["role"] == "assistant" for msg in messages)
     
-    # Original messages should not be modified
-    assert any(msg["role"] == "assistant" for msg in messages)
+    def test_mistral_empty_messages(self, mistral_llm):
+        """Test handling of empty message list."""
+        messages = []
+        formatted_messages = mistral_llm._format_messages_for_provider(messages)
+        assert formatted_messages == []
+    
+    def test_mistral_multiple_assistant_messages(self, mistral_llm):
+        """Test handling of multiple consecutive assistant messages."""
+        messages = [
+            {"role": "user", "content": "User 1"},
+            {"role": "assistant", "content": "Assistant 1"},
+            {"role": "assistant", "content": "Assistant 2"},
+            {"role": "user", "content": "User 2"}
+        ]
+        
+        formatted_messages = mistral_llm._format_messages_for_provider(messages)
+        
+        # All assistant messages should be converted to user
+        assert all(msg["role"] == "user" for msg in formatted_messages 
+                  if msg["content"] in ["Assistant 1", "Assistant 2"])
+        
+        # Original messages should not be modified
+        assert len([msg for msg in messages if msg["role"] == "assistant"]) == 2
 
 
 def test_mistral_role_handling():