mirror of
https://github.com/crewAIInc/crewAI.git
synced 2026-03-27 22:28:16 +00:00
Compare commits
1 Commits
docs/add-v
...
devin/1773
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
744eceea1d |
@@ -167,6 +167,7 @@ class AnthropicCompletion(BaseLLM):
|
||||
thinking: AnthropicThinkingConfig | None = None,
|
||||
response_format: type[BaseModel] | None = None,
|
||||
tool_search: AnthropicToolSearchConfig | bool | None = None,
|
||||
api: Literal["completions", "responses"] = "completions",
|
||||
**kwargs: Any,
|
||||
):
|
||||
"""Initialize Anthropic chat completion client.
|
||||
@@ -192,6 +193,16 @@ class AnthropicCompletion(BaseLLM):
|
||||
and a tool search tool is injected into the tools list.
|
||||
**kwargs: Additional parameters
|
||||
"""
|
||||
if api == "responses":
|
||||
raise NotImplementedError(
|
||||
"The Responses API is not supported by Anthropic provider. "
|
||||
"Anthropic uses the Messages API natively. "
|
||||
"The Responses API is available for OpenAI and Azure OpenAI providers. "
|
||||
"Use api='completions' (default) with Anthropic."
|
||||
)
|
||||
|
||||
self.api = api
|
||||
|
||||
super().__init__(
|
||||
model=model, temperature=temperature, stop=stop_sequences or [], **kwargs
|
||||
)
|
||||
|
||||
File diff suppressed because it is too large
Load Diff
@@ -5,7 +5,7 @@ from contextlib import AsyncExitStack
|
||||
import json
|
||||
import logging
|
||||
import os
|
||||
from typing import TYPE_CHECKING, Any, TypedDict, cast
|
||||
from typing import TYPE_CHECKING, Any, Literal, TypedDict, cast
|
||||
|
||||
from pydantic import BaseModel
|
||||
from typing_extensions import Required
|
||||
@@ -246,6 +246,7 @@ class BedrockCompletion(BaseLLM):
|
||||
additional_model_response_field_paths: list[str] | None = None,
|
||||
interceptor: BaseInterceptor[Any, Any] | None = None,
|
||||
response_format: type[BaseModel] | None = None,
|
||||
api: Literal["completions", "responses"] = "completions",
|
||||
**kwargs: Any,
|
||||
) -> None:
|
||||
"""Initialize AWS Bedrock completion client.
|
||||
@@ -270,6 +271,16 @@ class BedrockCompletion(BaseLLM):
|
||||
response_model is not passed to call()/acall() methods.
|
||||
**kwargs: Additional parameters
|
||||
"""
|
||||
if api == "responses":
|
||||
raise NotImplementedError(
|
||||
"The Responses API is not supported by AWS Bedrock provider. "
|
||||
"Bedrock uses the Converse API natively. "
|
||||
"The Responses API is available for OpenAI and Azure OpenAI providers. "
|
||||
"Use api='completions' (default) with Bedrock."
|
||||
)
|
||||
|
||||
self.api = api
|
||||
|
||||
if interceptor is not None:
|
||||
raise NotImplementedError(
|
||||
"HTTP interceptors are not yet supported for AWS Bedrock provider. "
|
||||
|
||||
@@ -62,6 +62,7 @@ class GeminiCompletion(BaseLLM):
|
||||
use_vertexai: bool | None = None,
|
||||
response_format: type[BaseModel] | None = None,
|
||||
thinking_config: types.ThinkingConfig | None = None,
|
||||
api: Literal["completions", "responses"] = "completions",
|
||||
**kwargs: Any,
|
||||
):
|
||||
"""Initialize Google Gemini chat completion client.
|
||||
@@ -100,6 +101,16 @@ class GeminiCompletion(BaseLLM):
|
||||
get include_thoughts=True so thought content is surfaced.
|
||||
**kwargs: Additional parameters
|
||||
"""
|
||||
if api == "responses":
|
||||
raise NotImplementedError(
|
||||
"The Responses API is not supported by Google Gemini provider. "
|
||||
"Gemini uses the generate_content API natively. "
|
||||
"The Responses API is available for OpenAI and Azure OpenAI providers. "
|
||||
"Use api='completions' (default) with Gemini."
|
||||
)
|
||||
|
||||
self.api = api
|
||||
|
||||
if interceptor is not None:
|
||||
raise NotImplementedError(
|
||||
"HTTP interceptors are not yet supported for Google Gemini provider. "
|
||||
|
||||
@@ -1463,3 +1463,55 @@ def test_tool_search_saves_input_tokens():
|
||||
f"Expected tool_search ({usage_search.prompt_tokens}) to use fewer input tokens "
|
||||
f"than no search ({usage_no_search.prompt_tokens})"
|
||||
)
|
||||
|
||||
# =============================================================================
|
||||
# Responses API Error Handling Tests
|
||||
# =============================================================================
|
||||
|
||||
|
||||
def test_anthropic_responses_api_raises_not_implemented():
|
||||
"""Test that Anthropic raises NotImplementedError when api='responses' is used."""
|
||||
from crewai.llms.providers.anthropic.completion import AnthropicCompletion
|
||||
|
||||
with pytest.raises(NotImplementedError, match="Responses API is not supported by Anthropic"):
|
||||
AnthropicCompletion(
|
||||
model="claude-sonnet-4-20250514",
|
||||
api="responses",
|
||||
)
|
||||
|
||||
|
||||
def test_anthropic_responses_api_error_suggests_completions():
|
||||
"""Test that the error message suggests using api='completions' instead."""
|
||||
from crewai.llms.providers.anthropic.completion import AnthropicCompletion
|
||||
|
||||
with pytest.raises(NotImplementedError) as exc_info:
|
||||
AnthropicCompletion(
|
||||
model="claude-sonnet-4-20250514",
|
||||
api="responses",
|
||||
)
|
||||
|
||||
error_msg = str(exc_info.value)
|
||||
assert "api='completions'" in error_msg
|
||||
assert "Messages API" in error_msg
|
||||
|
||||
|
||||
def test_anthropic_completions_api_still_works():
|
||||
"""Test that api='completions' (default) still works normally."""
|
||||
from crewai.llms.providers.anthropic.completion import AnthropicCompletion
|
||||
|
||||
# Should not raise any error
|
||||
completion = AnthropicCompletion(
|
||||
model="claude-sonnet-4-20250514",
|
||||
api="completions",
|
||||
)
|
||||
assert completion.api == "completions"
|
||||
|
||||
|
||||
def test_anthropic_default_api_is_completions():
|
||||
"""Test that the default API is 'completions'."""
|
||||
from crewai.llms.providers.anthropic.completion import AnthropicCompletion
|
||||
|
||||
completion = AnthropicCompletion(
|
||||
model="claude-sonnet-4-20250514",
|
||||
)
|
||||
assert completion.api == "completions"
|
||||
|
||||
@@ -1403,3 +1403,784 @@ def test_azure_stop_words_still_applied_to_regular_responses():
|
||||
assert "Observation:" not in result
|
||||
assert "Found results" not in result
|
||||
assert "I need to search for more information" in result
|
||||
|
||||
|
||||
# =============================================================================
|
||||
# Azure Responses API Tests
|
||||
# =============================================================================
|
||||
|
||||
|
||||
def test_azure_responses_api_initialization():
|
||||
"""Test that Azure Responses API can be initialized with api='responses'."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
instructions="You are a helpful assistant.",
|
||||
store=True,
|
||||
)
|
||||
|
||||
assert completion.api == "responses"
|
||||
assert completion.instructions == "You are a helpful assistant."
|
||||
assert completion.store is True
|
||||
assert completion.model == "gpt-4o"
|
||||
|
||||
|
||||
def test_azure_responses_api_default_is_completions():
|
||||
"""Test that the default API is 'completions' for backward compatibility."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
)
|
||||
|
||||
assert completion.api == "completions"
|
||||
|
||||
|
||||
def test_azure_responses_api_prepare_params():
|
||||
"""Test that Responses API params are prepared correctly."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
instructions="Base instructions.",
|
||||
store=True,
|
||||
temperature=0.7,
|
||||
)
|
||||
|
||||
messages = [
|
||||
{"role": "system", "content": "System message."},
|
||||
{"role": "user", "content": "Hello!"},
|
||||
]
|
||||
|
||||
params = completion._prepare_responses_params(messages)
|
||||
|
||||
assert params["model"] == "gpt-4o"
|
||||
assert "Base instructions." in params["instructions"]
|
||||
assert "System message." in params["instructions"]
|
||||
assert params["store"] is True
|
||||
assert params["temperature"] == 0.7
|
||||
assert params["input"] == [{"role": "user", "content": "Hello!"}]
|
||||
|
||||
|
||||
def test_azure_responses_api_tool_format():
|
||||
"""Test that tools are converted to Responses API format (internally-tagged)."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
)
|
||||
|
||||
tools = [
|
||||
{
|
||||
"name": "get_weather",
|
||||
"description": "Get the weather for a location",
|
||||
"parameters": {
|
||||
"type": "object",
|
||||
"properties": {"location": {"type": "string"}},
|
||||
"required": ["location"],
|
||||
},
|
||||
}
|
||||
]
|
||||
|
||||
responses_tools = completion._convert_tools_for_responses(tools)
|
||||
|
||||
assert len(responses_tools) == 1
|
||||
tool = responses_tools[0]
|
||||
assert tool["type"] == "function"
|
||||
assert tool["name"] == "get_weather"
|
||||
assert tool["description"] == "Get the weather for a location"
|
||||
assert "parameters" in tool
|
||||
assert "function" not in tool
|
||||
|
||||
|
||||
def test_azure_responses_api_structured_output_format():
|
||||
"""Test that structured outputs use text.format for Responses API."""
|
||||
from pydantic import BaseModel
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
class Person(BaseModel):
|
||||
name: str
|
||||
age: int
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
)
|
||||
|
||||
messages = [{"role": "user", "content": "Extract: Jane, 25"}]
|
||||
params = completion._prepare_responses_params(messages, response_model=Person)
|
||||
|
||||
assert "text" in params
|
||||
assert "format" in params["text"]
|
||||
assert params["text"]["format"]["type"] == "json_schema"
|
||||
assert params["text"]["format"]["name"] == "Person"
|
||||
assert params["text"]["format"]["strict"] is True
|
||||
|
||||
|
||||
def test_azure_responses_api_with_previous_response_id():
|
||||
"""Test that previous_response_id is passed for multi-turn conversations."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
previous_response_id="resp_abc123",
|
||||
store=True,
|
||||
)
|
||||
|
||||
messages = [{"role": "user", "content": "Continue our conversation."}]
|
||||
params = completion._prepare_responses_params(messages)
|
||||
|
||||
assert params["previous_response_id"] == "resp_abc123"
|
||||
assert params["store"] is True
|
||||
|
||||
|
||||
def test_azure_responses_api_call_routing():
|
||||
"""Test that call() routes to the correct API based on the api parameter."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
completion_completions = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="completions",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
)
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion_responses = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
)
|
||||
|
||||
with patch.object(
|
||||
completion_completions, "_handle_completion", return_value="completions result"
|
||||
) as mock_completions:
|
||||
with patch.object(completion_completions, "_format_messages_for_azure", return_value=[{"role": "user", "content": "Hello"}]):
|
||||
result = completion_completions.call("Hello")
|
||||
mock_completions.assert_called_once()
|
||||
assert result == "completions result"
|
||||
|
||||
with patch.object(
|
||||
completion_responses, "_call_responses", return_value="responses result"
|
||||
) as mock_responses:
|
||||
with patch.object(completion_responses, "_format_messages_for_azure", return_value=[{"role": "user", "content": "Hello"}]):
|
||||
result = completion_responses.call("Hello")
|
||||
mock_responses.assert_called_once()
|
||||
assert result == "responses result"
|
||||
|
||||
|
||||
def test_azure_responses_api_builtin_tools_param():
|
||||
"""Test that builtin_tools parameter is properly configured."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
builtin_tools=["web_search", "code_interpreter"],
|
||||
)
|
||||
|
||||
assert completion.builtin_tools == ["web_search", "code_interpreter"]
|
||||
|
||||
messages = [{"role": "user", "content": "Test"}]
|
||||
params = completion._prepare_responses_params(messages)
|
||||
|
||||
assert "tools" in params
|
||||
tool_types = [t["type"] for t in params["tools"]]
|
||||
assert "web_search_preview" in tool_types
|
||||
assert "code_interpreter" in tool_types
|
||||
|
||||
|
||||
def test_azure_responses_api_builtin_tools_with_custom_tools():
|
||||
"""Test that builtin_tools can be combined with custom function tools."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
builtin_tools=["web_search"],
|
||||
)
|
||||
|
||||
custom_tools = [
|
||||
{
|
||||
"name": "get_weather",
|
||||
"description": "Get weather for a location",
|
||||
"parameters": {"type": "object", "properties": {}},
|
||||
}
|
||||
]
|
||||
|
||||
messages = [{"role": "user", "content": "Test"}]
|
||||
params = completion._prepare_responses_params(messages, tools=custom_tools)
|
||||
|
||||
assert len(params["tools"]) == 2
|
||||
tool_types = [t.get("type") for t in params["tools"]]
|
||||
assert "web_search_preview" in tool_types
|
||||
assert "function" in tool_types
|
||||
|
||||
|
||||
def test_azure_responses_api_parse_tool_outputs_param():
|
||||
"""Test that parse_tool_outputs parameter is properly configured."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
parse_tool_outputs=True,
|
||||
)
|
||||
|
||||
assert completion.parse_tool_outputs is True
|
||||
|
||||
|
||||
def test_azure_responses_api_parse_tool_outputs_default_false():
|
||||
"""Test that parse_tool_outputs defaults to False."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
)
|
||||
|
||||
assert completion.parse_tool_outputs is False
|
||||
|
||||
|
||||
# =============================================================================
|
||||
# Auto-Chaining Tests (Azure Responses API)
|
||||
# =============================================================================
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_param():
|
||||
"""Test that auto_chain parameter is properly configured."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain=True,
|
||||
)
|
||||
|
||||
assert completion.auto_chain is True
|
||||
assert completion._last_response_id is None
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_default_false():
|
||||
"""Test that auto_chain defaults to False."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
)
|
||||
|
||||
assert completion.auto_chain is False
|
||||
|
||||
|
||||
def test_azure_responses_api_last_response_id_property():
|
||||
"""Test last_response_id property."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain=True,
|
||||
)
|
||||
|
||||
# Initially None
|
||||
assert completion.last_response_id is None
|
||||
|
||||
# Simulate setting the internal value
|
||||
completion._last_response_id = "resp_test_123"
|
||||
assert completion.last_response_id == "resp_test_123"
|
||||
|
||||
|
||||
def test_azure_responses_api_reset_chain():
|
||||
"""Test reset_chain() method clears the response ID."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain=True,
|
||||
)
|
||||
|
||||
# Set a response ID
|
||||
completion._last_response_id = "resp_test_123"
|
||||
assert completion.last_response_id == "resp_test_123"
|
||||
|
||||
# Reset the chain
|
||||
completion.reset_chain()
|
||||
assert completion.last_response_id is None
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_prepare_params():
|
||||
"""Test that _prepare_responses_params uses auto-chained response ID."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain=True,
|
||||
)
|
||||
|
||||
# No previous response ID yet
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
assert "previous_response_id" not in params
|
||||
|
||||
# Set a previous response ID
|
||||
completion._last_response_id = "resp_previous_123"
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
assert params.get("previous_response_id") == "resp_previous_123"
|
||||
|
||||
|
||||
def test_azure_responses_api_explicit_previous_response_id_takes_precedence():
|
||||
"""Test that explicit previous_response_id overrides auto-chained ID."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain=True,
|
||||
previous_response_id="resp_explicit_456",
|
||||
)
|
||||
|
||||
# Set an auto-chained response ID
|
||||
completion._last_response_id = "resp_auto_123"
|
||||
|
||||
# Explicit should take precedence
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
assert params.get("previous_response_id") == "resp_explicit_456"
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_disabled_no_tracking():
|
||||
"""Test that response ID is not tracked when auto_chain is False."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain=False,
|
||||
)
|
||||
|
||||
# Even with a "previous" response ID set internally, params shouldn't use it
|
||||
completion._last_response_id = "resp_should_not_use"
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
assert "previous_response_id" not in params
|
||||
|
||||
|
||||
# =============================================================================
|
||||
# Encrypted Reasoning for ZDR (Zero Data Retention) Tests
|
||||
# =============================================================================
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_reasoning_param():
|
||||
"""Test that auto_chain_reasoning parameter is properly configured."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain_reasoning=True,
|
||||
)
|
||||
|
||||
assert completion.auto_chain_reasoning is True
|
||||
assert completion._last_reasoning_items == []
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_reasoning_default_false():
|
||||
"""Test that auto_chain_reasoning defaults to False."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
)
|
||||
|
||||
assert completion.auto_chain_reasoning is False
|
||||
|
||||
|
||||
def test_azure_responses_api_last_reasoning_items_property():
|
||||
"""Test last_reasoning_items property."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain_reasoning=True,
|
||||
)
|
||||
|
||||
# Initially empty
|
||||
assert completion.last_reasoning_items == []
|
||||
|
||||
# Simulate setting the internal value
|
||||
mock_items = [{"id": "rs_test_123", "type": "reasoning"}]
|
||||
completion._last_reasoning_items = mock_items
|
||||
assert completion.last_reasoning_items == mock_items
|
||||
|
||||
|
||||
def test_azure_responses_api_reset_reasoning_chain():
|
||||
"""Test reset_reasoning_chain() method clears reasoning items."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain_reasoning=True,
|
||||
)
|
||||
|
||||
# Set reasoning items
|
||||
mock_items = [{"id": "rs_test_123", "type": "reasoning"}]
|
||||
completion._last_reasoning_items = mock_items
|
||||
assert completion.last_reasoning_items == mock_items
|
||||
|
||||
# Reset the reasoning chain
|
||||
completion.reset_reasoning_chain()
|
||||
assert completion.last_reasoning_items == []
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_reasoning_adds_include():
|
||||
"""Test that auto_chain_reasoning adds reasoning.encrypted_content to include."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain_reasoning=True,
|
||||
)
|
||||
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
assert "include" in params
|
||||
assert "reasoning.encrypted_content" in params["include"]
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_reasoning_preserves_existing_include():
|
||||
"""Test that auto_chain_reasoning preserves existing include items."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain_reasoning=True,
|
||||
include=["file_search_call.results"],
|
||||
)
|
||||
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
assert "include" in params
|
||||
assert "reasoning.encrypted_content" in params["include"]
|
||||
assert "file_search_call.results" in params["include"]
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_reasoning_no_duplicate_include():
|
||||
"""Test that reasoning.encrypted_content is not duplicated if already in include."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain_reasoning=True,
|
||||
include=["reasoning.encrypted_content"],
|
||||
)
|
||||
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
assert "include" in params
|
||||
# Should only appear once
|
||||
assert params["include"].count("reasoning.encrypted_content") == 1
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_reasoning_prepends_to_input():
|
||||
"""Test that stored reasoning items are prepended to input."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain_reasoning=True,
|
||||
)
|
||||
|
||||
# Simulate stored reasoning items
|
||||
mock_reasoning = MagicMock()
|
||||
mock_reasoning.type = "reasoning"
|
||||
mock_reasoning.id = "rs_test_123"
|
||||
completion._last_reasoning_items = [mock_reasoning]
|
||||
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
|
||||
# Input should have reasoning item first, then the message
|
||||
assert len(params["input"]) == 2
|
||||
assert params["input"][0] == mock_reasoning
|
||||
assert params["input"][1]["role"] == "user"
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_reasoning_disabled_no_include():
|
||||
"""Test that reasoning.encrypted_content is not added when auto_chain_reasoning is False."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain_reasoning=False,
|
||||
)
|
||||
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
# Should not have include at all (unless explicitly set)
|
||||
assert "include" not in params or "reasoning.encrypted_content" not in params.get("include", [])
|
||||
|
||||
|
||||
def test_azure_responses_api_auto_chain_reasoning_disabled_no_prepend():
|
||||
"""Test that reasoning items are not prepended when auto_chain_reasoning is False."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain_reasoning=False,
|
||||
)
|
||||
|
||||
# Even with stored reasoning items, they should not be prepended
|
||||
mock_reasoning = MagicMock()
|
||||
mock_reasoning.type = "reasoning"
|
||||
completion._last_reasoning_items = [mock_reasoning]
|
||||
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
|
||||
# Input should only have the message, not the reasoning item
|
||||
assert len(params["input"]) == 1
|
||||
assert params["input"][0]["role"] == "user"
|
||||
|
||||
|
||||
def test_azure_responses_api_both_auto_chains_work_together():
|
||||
"""Test that auto_chain and auto_chain_reasoning can be used together."""
|
||||
from crewai.llms.providers.azure.completion import AzureCompletion
|
||||
|
||||
with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
|
||||
completion = AzureCompletion(
|
||||
model="gpt-4o",
|
||||
api="responses",
|
||||
api_key="test-key",
|
||||
endpoint="https://test.openai.azure.com",
|
||||
auto_chain=True,
|
||||
auto_chain_reasoning=True,
|
||||
)
|
||||
|
||||
assert completion.auto_chain is True
|
||||
assert completion.auto_chain_reasoning is True
|
||||
assert completion._last_response_id is None
|
||||
assert completion._last_reasoning_items == []
|
||||
|
||||
# Set both internal values
|
||||
completion._last_response_id = "resp_123"
|
||||
mock_reasoning = MagicMock()
|
||||
mock_reasoning.type = "reasoning"
|
||||
completion._last_reasoning_items = [mock_reasoning]
|
||||
|
||||
params = completion._prepare_responses_params(messages=[{"role": "user", "content": "test"}])
|
||||
|
||||
# Both should be applied
|
||||
assert params.get("previous_response_id") == "resp_123"
|
||||
assert "reasoning.encrypted_content" in params["include"]
|
||||
assert len(params["input"]) == 2 # Reasoning item + message
|
||||
|
||||
|
||||
def test_azure_responses_api_max_completion_tokens():
    """Test that max_completion_tokens is mapped to max_output_tokens."""
    from crewai.llms.providers.azure.completion import AzureCompletion

    with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
        llm = AzureCompletion(
            model="gpt-4o",
            api="responses",
            api_key="test-key",
            endpoint="https://test.openai.azure.com",
            max_completion_tokens=4096,
        )

        request = llm._prepare_responses_params(
            messages=[{"role": "user", "content": "test"}]
        )
        # The Responses API names the same limit max_output_tokens.
        assert request["max_output_tokens"] == 4096
|
||||
|
||||
|
||||
def test_azure_responses_api_seed_param():
    """Test that seed parameter is passed through."""
    from crewai.llms.providers.azure.completion import AzureCompletion

    with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
        llm = AzureCompletion(
            model="gpt-4o",
            api="responses",
            api_key="test-key",
            endpoint="https://test.openai.azure.com",
            seed=42,
        )

        request = llm._prepare_responses_params(
            messages=[{"role": "user", "content": "test"}]
        )
        # seed should survive untouched into the request payload.
        assert request["seed"] == 42
|
||||
|
||||
|
||||
def test_azure_responses_api_reasoning_effort_param():
    """Test that reasoning_effort parameter is passed through."""
    from crewai.llms.providers.azure.completion import AzureCompletion

    with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
        llm = AzureCompletion(
            model="gpt-4o",
            api="responses",
            api_key="test-key",
            endpoint="https://test.openai.azure.com",
            reasoning_effort="high",
        )

        request = llm._prepare_responses_params(
            messages=[{"role": "user", "content": "test"}]
        )
        # reasoning_effort is wrapped into the Responses API reasoning object.
        assert request["reasoning"] == {"effort": "high"}
|
||||
|
||||
|
||||
def test_azure_responses_api_init_responses_clients():
    """Test that _init_responses_clients creates OpenAI AzureOpenAI clients.

    Only the call to the (patched) initialization hook matters here, so the
    constructed instance is deliberately not bound to a name — the previous
    version left an unused local variable behind.
    """
    from crewai.llms.providers.azure.completion import AzureCompletion

    with patch(
        "crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"
    ) as mock_init:
        AzureCompletion(
            model="gpt-4o",
            api="responses",
            api_key="test-key",
            endpoint="https://test.openai.azure.com",
        )

        # _init_responses_clients should be called exactly once during __init__
        mock_init.assert_called_once()
|
||||
|
||||
|
||||
def test_azure_responses_api_system_message_extraction():
    """Test that system messages are extracted to instructions for Responses API."""
    from crewai.llms.providers.azure.completion import AzureCompletion

    with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
        llm = AzureCompletion(
            model="gpt-4o",
            api="responses",
            api_key="test-key",
            endpoint="https://test.openai.azure.com",
        )

        conversation = [
            {"role": "system", "content": "You are a helpful assistant."},
            {"role": "user", "content": "Hello!"},
            {"role": "assistant", "content": "Hi there!"},
            {"role": "user", "content": "How are you?"},
        ]

        request = llm._prepare_responses_params(conversation)

        # The system message becomes the top-level instructions field.
        assert request["instructions"] == "You are a helpful assistant."
        # The remaining turns stay in input, in their original order.
        assert len(request["input"]) == 3
        assert [turn["role"] for turn in request["input"]] == [
            "user",
            "assistant",
            "user",
        ]
|
||||
|
||||
|
||||
def test_azure_responses_api_multiple_system_messages_merged():
    """Test that multiple system messages are merged into instructions."""
    from crewai.llms.providers.azure.completion import AzureCompletion

    with patch("crewai.llms.providers.azure.completion.AzureCompletion._init_responses_clients"):
        llm = AzureCompletion(
            model="gpt-4o",
            api="responses",
            api_key="test-key",
            endpoint="https://test.openai.azure.com",
            instructions="Base instructions.",
        )

        request = llm._prepare_responses_params(
            [
                {"role": "system", "content": "System context."},
                {"role": "user", "content": "Hello!"},
            ]
        )

        # The constructor-level instructions and the system message are
        # combined into a single instructions string.
        merged = request["instructions"]
        assert "Base instructions." in merged
        assert "System context." in merged
|
||||
|
||||
@@ -1175,3 +1175,56 @@ def test_bedrock_tool_results_not_merged_across_assistant_messages():
|
||||
)
|
||||
assert tool_result_messages[0]["content"][0]["toolResult"]["toolUseId"] == "call_a"
|
||||
assert tool_result_messages[1]["content"][0]["toolResult"]["toolUseId"] == "call_b"
|
||||
|
||||
|
||||
# =============================================================================
|
||||
# Responses API Error Handling Tests
|
||||
# =============================================================================
|
||||
|
||||
|
||||
def test_bedrock_responses_api_raises_not_implemented(bedrock_mocks):
    """Test that Bedrock raises NotImplementedError when api='responses' is used."""
    from crewai.llms.providers.bedrock.completion import BedrockCompletion

    expected = "Responses API is not supported by AWS Bedrock"
    with pytest.raises(NotImplementedError, match=expected):
        BedrockCompletion(
            model="anthropic.claude-3-5-sonnet-20241022-v2:0", api="responses"
        )
|
||||
|
||||
|
||||
def test_bedrock_responses_api_error_suggests_completions(bedrock_mocks):
    """Test that the error message suggests using api='completions' instead."""
    from crewai.llms.providers.bedrock.completion import BedrockCompletion

    with pytest.raises(NotImplementedError) as exc_info:
        BedrockCompletion(
            model="anthropic.claude-3-5-sonnet-20241022-v2:0", api="responses"
        )

    message = str(exc_info.value)
    # The error should steer users to the supported Converse-based path.
    assert "api='completions'" in message
    assert "Converse API" in message
|
||||
|
||||
|
||||
def test_bedrock_completions_api_still_works(bedrock_mocks):
    """Test that api='completions' (default) still works normally."""
    from crewai.llms.providers.bedrock.completion import BedrockCompletion

    # Passing the explicit default must construct without raising.
    llm = BedrockCompletion(
        model="anthropic.claude-3-5-sonnet-20241022-v2:0", api="completions"
    )
    assert llm.api == "completions"
|
||||
|
||||
|
||||
def test_bedrock_default_api_is_completions(bedrock_mocks):
    """Test that the default API is 'completions'."""
    from crewai.llms.providers.bedrock.completion import BedrockCompletion

    # No api argument given: the provider should default to 'completions'.
    llm = BedrockCompletion(model="anthropic.claude-3-5-sonnet-20241022-v2:0")
    assert llm.api == "completions"
|
||||
|
||||
@@ -1190,3 +1190,55 @@ def test_gemini_cached_prompt_tokens_with_tools():
|
||||
# cached_prompt_tokens should be populated (may be 0 if Gemini
|
||||
# doesn't cache for this particular request, but the field should exist)
|
||||
assert usage.cached_prompt_tokens >= 0
|
||||
|
||||
# =============================================================================
|
||||
# Responses API Error Handling Tests
|
||||
# =============================================================================
|
||||
|
||||
|
||||
def test_gemini_responses_api_raises_not_implemented():
    """Test that Gemini raises NotImplementedError when api='responses' is used."""
    from crewai.llms.providers.gemini.completion import GeminiCompletion

    expected = "Responses API is not supported by Google Gemini"
    with pytest.raises(NotImplementedError, match=expected):
        GeminiCompletion(model="gemini-2.0-flash-001", api="responses")
|
||||
|
||||
|
||||
def test_gemini_responses_api_error_suggests_completions():
    """Test that the error message suggests using api='completions' instead."""
    from crewai.llms.providers.gemini.completion import GeminiCompletion

    with pytest.raises(NotImplementedError) as exc_info:
        GeminiCompletion(model="gemini-2.0-flash-001", api="responses")

    message = str(exc_info.value)
    # The error should steer users to the generate_content-based default.
    assert "api='completions'" in message
    assert "generate_content" in message
|
||||
|
||||
|
||||
def test_gemini_completions_api_still_works():
    """Test that api='completions' (default) still works normally."""
    from crewai.llms.providers.gemini.completion import GeminiCompletion

    # Passing the explicit default must construct without raising.
    llm = GeminiCompletion(model="gemini-2.0-flash-001", api="completions")
    assert llm.api == "completions"
|
||||
|
||||
|
||||
def test_gemini_default_api_is_completions():
    """Test that the default API is 'completions'."""
    from crewai.llms.providers.gemini.completion import GeminiCompletion

    # No api argument given: the provider should default to 'completions'.
    llm = GeminiCompletion(model="gemini-2.0-flash-001")
    assert llm.api == "completions"
|
||||
|
||||
Reference in New Issue
Block a user