Fix Azure structured outputs to use json_object instead of json_schema

- Azure AI Inference SDK doesn't support json_schema response_format - Changed to use json_object format with client-side Pydantic validation - Added comprehensive tests for structured outputs with Azure models - Fixes issue #3906 Co-Authored-By: João <joao@crewai.com>
2026-05-03 08:12:39 +00:00 · 2025-11-13 12:45:55 +00:00
parent ffd717c51a
commit 6442a88856
2 changed files with 102 additions and 7 deletions
--- a/lib/crewai/src/crewai/llms/providers/azure/completion.py
+++ b/lib/crewai/src/crewai/llms/providers/azure/completion.py
@@ -277,14 +277,10 @@ class AzureCompletion(BaseLLM):
            "stream": self.stream,
        }
        # Azure AI Inference SDK doesn't support json_schema response_format (important-comment)
        # Use json_object instead and rely on client-side Pydantic validation
        if response_model and self.is_openai_model:
-            params["response_format"] = {
+            params["response_format"] = {"type": "json_object"}
                "type": "json_schema",
                "json_schema": {
                    "name": response_model.__name__,
                    "schema": response_model.model_json_schema(),
                },
            }
        # Only include model parameter for non-Azure OpenAI endpoints
        # Azure OpenAI endpoints have the deployment name in the URL
--- a/lib/crewai/tests/llms/azure/test_azure.py
+++ b/lib/crewai/tests/llms/azure/test_azure.py
@@ -1086,3 +1086,102 @@ def test_azure_mistral_and_other_models():
            )
            assert "model" in params
            assert params["model"] == model_name
 def test_azure_structured_output_uses_json_object():
    """
    Test that Azure uses json_object response_format instead of json_schema
    for structured outputs (fixes issue #3906)
    """
    from pydantic import BaseModel
    class Greeting(BaseModel):
        name: str
        message: str
    llm = LLM(model="azure/gpt-4")
    # Prepare params with response_model
    params = llm._prepare_completion_params(
        messages=[{"role": "user", "content": "Say hello"}],
        response_model=Greeting
    )
    assert "response_format" in params
    assert params["response_format"] == {"type": "json_object"}
    assert "json_schema" not in params["response_format"]
 def test_azure_structured_output_with_agent():
    """
    Test that structured outputs work correctly with Azure models in agents
    (replicates the issue from #3906)
    """
    from pydantic import BaseModel
    class Greeting(BaseModel):
        name: str
        message: str
    llm = LLM(model="azure/gpt-4")
    # Mock the Azure client response
    with patch.object(llm.client, 'complete') as mock_complete:
        mock_message = MagicMock()
        mock_message.content = '{"name": "Alice", "message": "Hello, Alice!"}'
        mock_message.tool_calls = None
        mock_choice = MagicMock()
        mock_choice.message = mock_message
        mock_response = MagicMock()
        mock_response.choices = [mock_choice]
        mock_response.usage = MagicMock(
            prompt_tokens=10,
            completion_tokens=20,
            total_tokens=30
        )
        mock_complete.return_value = mock_response
        result = llm.call(
            messages=[{"role": "user", "content": "My name is Alice"}],
            response_model=Greeting
        )
        # Verify the call was made
        assert mock_complete.called
        # Verify the params passed to complete
        call_args = mock_complete.call_args
        params = call_args[1] if call_args[1] else call_args[0][0]
        if isinstance(params, dict) and "response_format" in params:
            assert params["response_format"] == {"type": "json_object"}
        assert result is not None
        assert isinstance(result, str)
 def test_azure_structured_output_non_openai_model():
    """
    Test that non-OpenAI models don't get response_format parameter
    """
    from pydantic import BaseModel
    class TestModel(BaseModel):
        field: str
    with patch.dict(os.environ, {
        "AZURE_API_KEY": "test-key",
        "AZURE_ENDPOINT": "https://models.inference.ai.azure.com"
    }):
        llm = LLM(model="azure/mistral-large")
        # Prepare params with response_model for non-OpenAI model
        params = llm._prepare_completion_params(
            messages=[{"role": "user", "content": "test"}],
            response_model=TestModel
        )
        assert "response_format" not in params