fix: emit tool call events in provider-specific LLM streaming implementations

Fixes #3982

This commit adds tool call event emission to all provider-specific LLM
streaming implementations. Previously, only text chunks were emitted
during streaming; tool call information never reached event consumers.

Changes:
- Update BaseLLM._emit_stream_chunk_event to infer call_type from
  tool_call presence when not explicitly provided
- Add tool call event emission in OpenAI provider streaming
- Add tool call event emission in Azure provider streaming
- Add tool call event emission in Gemini provider streaming
- Add tool call event emission in Bedrock provider streaming
- Add tool call event emission in Anthropic provider streaming
- Add comprehensive tests for tool call streaming events

The fix ensures that LLMStreamChunkEvent is emitted with (see the consumer sketch after this list):
- call_type=LLMCallType.TOOL_CALL when tool calls are received
- tool_call dict containing id, function (name, arguments), type, index
- chunk containing the tool call arguments being streamed
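
A minimal sketch of how a downstream listener might consume these events, assuming the decorator-based `crewai_event_bus.on` registration and the import paths used elsewhere in this diff (the handler name and accumulation strategy are illustrative, not part of this commit):

```python
from crewai.events import crewai_event_bus
from crewai.events.types.llm_events import LLMCallType, LLMStreamChunkEvent

# Accumulate streamed tool-call argument fragments, keyed by tool call index.
tool_args: dict[int, str] = {}


@crewai_event_bus.on(LLMStreamChunkEvent)
def on_stream_chunk(source: object, event: LLMStreamChunkEvent) -> None:
    if event.call_type == LLMCallType.TOOL_CALL and event.tool_call is not None:
        # For delta-based providers the chunk is an argument fragment;
        # concatenating fragments per index yields the full JSON arguments.
        index = event.tool_call.index
        tool_args[index] = tool_args.get(index, "") + (event.chunk or "")
    else:
        # Plain text token from the model.
        print(event.chunk, end="", flush=True)
```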

Co-Authored-By: João <joao@crewai.com>
Author: Devin AI
Date: 2025-11-27 07:19:36 +00:00
Commit: b70c4499d7 (parent: 2025a26fc3)
7 changed files with 413 additions and 2 deletions


@@ -316,11 +316,33 @@ class BaseLLM(ABC):
from_task: Task | None = None,
from_agent: Agent | None = None,
tool_call: dict[str, Any] | None = None,
call_type: LLMCallType | None = None,
) -> None:
"""Emit stream chunk event."""
"""Emit stream chunk event.
Args:
chunk: The text content of the chunk
from_task: Optional task that initiated the call
from_agent: Optional agent that initiated the call
tool_call: Optional tool call information as a dict with keys:
- id: Tool call ID
- function: Dict with 'name' and 'arguments'
- type: Tool call type (e.g., 'function')
- index: Index of the tool call
call_type: Optional call type. If not provided, it will be inferred
from the presence of tool_call (TOOL_CALL if tool_call is present,
LLM_CALL otherwise)
"""
if not hasattr(crewai_event_bus, "emit"):
raise ValueError("crewai_event_bus does not have an emit method") from None
# Infer call_type from tool_call presence if not explicitly provided
effective_call_type = call_type
if effective_call_type is None:
effective_call_type = (
LLMCallType.TOOL_CALL if tool_call is not None else LLMCallType.LLM_CALL
)
crewai_event_bus.emit(
self,
event=LLMStreamChunkEvent(
@@ -328,6 +350,7 @@ class BaseLLM(ABC):
tool_call=tool_call,
from_task=from_task,
from_agent=from_agent,
call_type=effective_call_type,
),
)
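
The inference keeps existing call sites backward compatible: a provider passes only the normalized tool_call dict and the event gets call_type=TOOL_CALL without further changes. A minimal sketch of the three paths, assuming `llm` is an instance of some concrete BaseLLM subclass (calling the private method directly here mirrors the tests below, for illustration only):

```python
from crewai.events.types.llm_events import LLMCallType

# 1. tool_call given, call_type omitted -> inferred as TOOL_CALL.
llm._emit_stream_chunk_event(
    chunk='{"query": "test"}',
    tool_call={
        "id": "call-123",
        "function": {"name": "search", "arguments": '{"query": "test"}'},
        "type": "function",
        "index": 0,
    },
)

# 2. No tool_call, call_type omitted -> inferred as LLM_CALL.
llm._emit_stream_chunk_event(chunk="plain text token")

# 3. An explicit call_type always takes precedence over inference.
llm._emit_stream_chunk_event(chunk="", call_type=LLMCallType.TOOL_CALL)
```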


@@ -450,9 +450,14 @@ class AnthropicCompletion(BaseLLM):
# (the SDK sets it internally)
stream_params = {k: v for k, v in params.items() if k != "stream"}
# Track tool use blocks during streaming
current_tool_use: dict[str, Any] = {}
tool_use_index = 0
# Make streaming API call
with self.client.messages.stream(**stream_params) as stream:
for event in stream:
# Handle text content
if hasattr(event, "delta") and hasattr(event.delta, "text"):
text_delta = event.delta.text
full_response += text_delta
@@ -462,6 +467,55 @@ class AnthropicCompletion(BaseLLM):
from_agent=from_agent,
)
# Handle tool use start (content_block_start event with tool_use type)
if hasattr(event, "content_block") and hasattr(event.content_block, "type"):
if event.content_block.type == "tool_use":
current_tool_use = {
"id": getattr(event.content_block, "id", None),
"name": getattr(event.content_block, "name", ""),
"input": "",
"index": tool_use_index,
}
tool_use_index += 1
# Emit tool call start event
tool_call_event_data = {
"id": current_tool_use["id"],
"function": {
"name": current_tool_use["name"],
"arguments": "",
},
"type": "function",
"index": current_tool_use["index"],
}
self._emit_stream_chunk_event(
chunk="",
from_task=from_task,
from_agent=from_agent,
tool_call=tool_call_event_data,
)
# Handle tool use input delta (input_json_delta events)
if hasattr(event, "delta") and hasattr(event.delta, "partial_json"):
partial_json = event.delta.partial_json
if current_tool_use and partial_json:
current_tool_use["input"] += partial_json
# Emit tool call delta event
tool_call_event_data = {
"id": current_tool_use["id"],
"function": {
"name": current_tool_use["name"],
"arguments": partial_json,
},
"type": "function",
"index": current_tool_use["index"],
}
self._emit_stream_chunk_event(
chunk=partial_json,
from_task=from_task,
from_agent=from_agent,
tool_call=tool_call_event_data,
)
final_message: Message = stream.get_final_message()
usage = self._extract_anthropic_token_usage(final_message)
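
Because Anthropic streams tool input as partial_json fragments (as does Bedrock via _accumulated_input below), the accumulated string only becomes valid JSON once the content block completes. A sketch of the final parse a consumer might perform; the helper name is hypothetical:

```python
import json
from typing import Any


def parse_accumulated_tool_input(accumulated: str) -> dict[str, Any]:
    """Parse the concatenation of partial_json fragments once streaming
    for the tool block has finished. Returns {} for empty or truncated
    input rather than raising mid-stream."""
    if not accumulated:
        return {}
    try:
        return json.loads(accumulated)
    except json.JSONDecodeError:
        return {}
```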


@@ -503,8 +503,10 @@ class AzureCompletion(BaseLLM):
call_id = tool_call.id or "default"
if call_id not in tool_calls:
tool_calls[call_id] = {
"id": call_id,
"name": "",
"arguments": "",
"index": getattr(tool_call, "index", 0) or 0,
}
if tool_call.function and tool_call.function.name:
@@ -514,6 +516,23 @@ class AzureCompletion(BaseLLM):
tool_call.function.arguments
)
# Emit tool call streaming event
tool_call_event_data = {
"id": tool_calls[call_id]["id"],
"function": {
"name": tool_calls[call_id]["name"],
"arguments": tool_call.function.arguments if tool_call.function and tool_call.function.arguments else "",
},
"type": "function",
"index": tool_calls[call_id]["index"],
}
self._emit_stream_chunk_event(
chunk=tool_call.function.arguments if tool_call.function and tool_call.function.arguments else "",
from_task=from_task,
from_agent=from_agent,
tool_call=tool_call_event_data,
)
# Handle completed tool calls
if tool_calls and available_functions:
for call_data in tool_calls.values():


@@ -567,12 +567,31 @@ class BedrockCompletion(BaseLLM):
elif "contentBlockStart" in event:
start = event["contentBlockStart"].get("start", {})
block_index = event["contentBlockStart"].get("contentBlockIndex", 0)
if "toolUse" in start:
current_tool_use = start["toolUse"]
current_tool_use["_block_index"] = block_index
current_tool_use["_accumulated_input"] = ""
tool_use_id = current_tool_use.get("toolUseId")
logging.debug(
f"Tool use started in stream: {current_tool_use.get('name')} (ID: {tool_use_id})"
)
# Emit tool call start event
tool_call_event_data = {
"id": tool_use_id,
"function": {
"name": current_tool_use.get("name", ""),
"arguments": "",
},
"type": "function",
"index": block_index,
}
self._emit_stream_chunk_event(
chunk="",
from_task=from_task,
from_agent=from_agent,
tool_call=tool_call_event_data,
)
elif "contentBlockDelta" in event:
delta = event["contentBlockDelta"]["delta"]
@@ -589,6 +608,23 @@ class BedrockCompletion(BaseLLM):
tool_input = delta["toolUse"].get("input", "")
if tool_input:
logging.debug(f"Tool input delta: {tool_input}")
current_tool_use["_accumulated_input"] += tool_input
# Emit tool call delta event
tool_call_event_data = {
"id": current_tool_use.get("toolUseId"),
"function": {
"name": current_tool_use.get("name", ""),
"arguments": tool_input,
},
"type": "function",
"index": current_tool_use.get("_block_index", 0),
}
self._emit_stream_chunk_event(
chunk=tool_input,
from_task=from_task,
from_agent=from_agent,
tool_call=tool_call_event_data,
)
# Content block stop - end of a content block
elif "contentBlockStop" in event:


@@ -1,3 +1,4 @@
import json
import logging
import os
import re
@@ -496,7 +497,7 @@ class GeminiCompletion(BaseLLM):
if hasattr(chunk, "candidates") and chunk.candidates:
candidate = chunk.candidates[0]
if candidate.content and candidate.content.parts:
for part in candidate.content.parts:
for part_index, part in enumerate(candidate.content.parts):
if hasattr(part, "function_call") and part.function_call:
call_id = part.function_call.name or "default"
if call_id not in function_calls:
@@ -505,8 +506,27 @@ class GeminiCompletion(BaseLLM):
"args": dict(part.function_call.args)
if part.function_call.args
else {},
"index": part_index,
}
# Emit tool call streaming event
args_str = json.dumps(function_calls[call_id]["args"]) if function_calls[call_id]["args"] else ""
tool_call_event_data = {
"id": call_id,
"function": {
"name": function_calls[call_id]["name"],
"arguments": args_str,
},
"type": "function",
"index": function_calls[call_id]["index"],
}
self._emit_stream_chunk_event(
chunk=args_str,
from_task=from_task,
from_agent=from_agent,
tool_call=tool_call_event_data,
)
# Handle completed function calls
if function_calls and available_functions:
for call_data in function_calls.values():
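
Unlike the delta-based providers above, Gemini surfaces the complete function_call.args in a single part, so each emitted chunk already carries the full JSON-serialized arguments. A consumer can therefore parse per chunk instead of accumulating fragments (hypothetical helper, for illustration):

```python
import json
from typing import Any


def parse_gemini_tool_args(arguments: str) -> dict[str, Any]:
    """Gemini emits complete, not incremental, arguments per chunk,
    so a single parse suffices."""
    return json.loads(arguments) if arguments else {}
```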


@@ -510,8 +510,10 @@ class OpenAICompletion(BaseLLM):
call_id = tool_call.id or "default"
if call_id not in tool_calls:
tool_calls[call_id] = {
"id": call_id,
"name": "",
"arguments": "",
"index": tool_call.index if tool_call.index is not None else 0,
}
if tool_call.function and tool_call.function.name:
@@ -519,6 +521,23 @@ class OpenAICompletion(BaseLLM):
if tool_call.function and tool_call.function.arguments:
tool_calls[call_id]["arguments"] += tool_call.function.arguments
# Emit tool call streaming event
tool_call_event_data = {
"id": tool_calls[call_id]["id"],
"function": {
"name": tool_calls[call_id]["name"],
"arguments": tool_call.function.arguments if tool_call.function and tool_call.function.arguments else "",
},
"type": "function",
"index": tool_calls[call_id]["index"],
}
self._emit_stream_chunk_event(
chunk=tool_call.function.arguments if tool_call.function and tool_call.function.arguments else "",
from_task=from_task,
from_agent=from_agent,
tool_call=tool_call_event_data,
)
if tool_calls and available_functions:
for call_data in tool_calls.values():
function_name = call_data["name"]


@@ -715,3 +715,243 @@ class TestStreamingImports:
assert StreamChunk is not None
assert StreamChunkType is not None
assert ToolCallChunk is not None
class TestLLMStreamChunkEventToolCall:
"""Tests for LLMStreamChunkEvent with tool call information."""
def test_llm_stream_chunk_event_with_tool_call(self) -> None:
"""Test that LLMStreamChunkEvent correctly handles tool call data."""
from crewai.events.types.llm_events import (
LLMCallType,
LLMStreamChunkEvent,
ToolCall,
FunctionCall,
)
# Create a tool call event
tool_call = ToolCall(
id="call-123",
function=FunctionCall(
name="search",
arguments='{"query": "test"}',
),
type="function",
index=0,
)
event = LLMStreamChunkEvent(
chunk='{"query": "test"}',
tool_call=tool_call,
call_type=LLMCallType.TOOL_CALL,
)
assert event.chunk == '{"query": "test"}'
assert event.tool_call is not None
assert event.tool_call.id == "call-123"
assert event.tool_call.function.name == "search"
assert event.tool_call.function.arguments == '{"query": "test"}'
assert event.call_type == LLMCallType.TOOL_CALL
def test_llm_stream_chunk_event_with_dict_tool_call(self) -> None:
"""Test that LLMStreamChunkEvent correctly handles tool call as dict."""
from crewai.events.types.llm_events import (
LLMCallType,
LLMStreamChunkEvent,
)
# Create a tool call event using dict (as providers emit)
tool_call_dict = {
"id": "call-456",
"function": {
"name": "get_weather",
"arguments": '{"location": "NYC"}',
},
"type": "function",
"index": 1,
}
event = LLMStreamChunkEvent(
chunk='{"location": "NYC"}',
tool_call=tool_call_dict,
call_type=LLMCallType.TOOL_CALL,
)
assert event.chunk == '{"location": "NYC"}'
assert event.tool_call is not None
assert event.tool_call.id == "call-456"
assert event.tool_call.function.name == "get_weather"
assert event.tool_call.function.arguments == '{"location": "NYC"}'
assert event.call_type == LLMCallType.TOOL_CALL
def test_llm_stream_chunk_event_text_only(self) -> None:
"""Test that LLMStreamChunkEvent works for text-only chunks."""
from crewai.events.types.llm_events import (
LLMCallType,
LLMStreamChunkEvent,
)
event = LLMStreamChunkEvent(
chunk="Hello, world!",
tool_call=None,
call_type=LLMCallType.LLM_CALL,
)
assert event.chunk == "Hello, world!"
assert event.tool_call is None
assert event.call_type == LLMCallType.LLM_CALL
class TestBaseLLMEmitStreamChunkEvent:
"""Tests for BaseLLM._emit_stream_chunk_event method."""
def test_emit_stream_chunk_event_infers_tool_call_type(self) -> None:
"""Test that _emit_stream_chunk_event infers TOOL_CALL type when tool_call is present."""
from unittest.mock import MagicMock, patch
from crewai.llms.base_llm import BaseLLM
from crewai.events.types.llm_events import LLMCallType, LLMStreamChunkEvent
# Create a mock BaseLLM instance
with patch.object(BaseLLM, "__abstractmethods__", set()):
llm = BaseLLM(model="test-model") # type: ignore
captured_events: list[LLMStreamChunkEvent] = []
def capture_emit(source: Any, event: Any) -> None:
if isinstance(event, LLMStreamChunkEvent):
captured_events.append(event)
with patch("crewai.llms.base_llm.crewai_event_bus") as mock_bus:
mock_bus.emit = capture_emit
# Emit with tool_call - should infer TOOL_CALL type
tool_call_dict = {
"id": "call-789",
"function": {
"name": "test_tool",
"arguments": '{"arg": "value"}',
},
"type": "function",
"index": 0,
}
llm._emit_stream_chunk_event(
chunk='{"arg": "value"}',
tool_call=tool_call_dict,
)
assert len(captured_events) == 1
assert captured_events[0].call_type == LLMCallType.TOOL_CALL
assert captured_events[0].tool_call is not None
def test_emit_stream_chunk_event_infers_llm_call_type(self) -> None:
"""Test that _emit_stream_chunk_event infers LLM_CALL type when tool_call is None."""
from unittest.mock import patch
from crewai.llms.base_llm import BaseLLM
from crewai.events.types.llm_events import LLMCallType, LLMStreamChunkEvent
# Create a mock BaseLLM instance
with patch.object(BaseLLM, "__abstractmethods__", set()):
llm = BaseLLM(model="test-model") # type: ignore
captured_events: list[LLMStreamChunkEvent] = []
def capture_emit(source: Any, event: Any) -> None:
if isinstance(event, LLMStreamChunkEvent):
captured_events.append(event)
with patch("crewai.llms.base_llm.crewai_event_bus") as mock_bus:
mock_bus.emit = capture_emit
# Emit without tool_call - should infer LLM_CALL type
llm._emit_stream_chunk_event(
chunk="Hello, world!",
tool_call=None,
)
assert len(captured_events) == 1
assert captured_events[0].call_type == LLMCallType.LLM_CALL
assert captured_events[0].tool_call is None
def test_emit_stream_chunk_event_respects_explicit_call_type(self) -> None:
"""Test that _emit_stream_chunk_event respects explicitly provided call_type."""
from unittest.mock import patch
from crewai.llms.base_llm import BaseLLM
from crewai.events.types.llm_events import LLMCallType, LLMStreamChunkEvent
# Create a mock BaseLLM instance
with patch.object(BaseLLM, "__abstractmethods__", set()):
llm = BaseLLM(model="test-model") # type: ignore
captured_events: list[LLMStreamChunkEvent] = []
def capture_emit(source: Any, event: Any) -> None:
if isinstance(event, LLMStreamChunkEvent):
captured_events.append(event)
with patch("crewai.llms.base_llm.crewai_event_bus") as mock_bus:
mock_bus.emit = capture_emit
# Emit with explicit call_type - should use provided type
llm._emit_stream_chunk_event(
chunk="test",
tool_call=None,
call_type=LLMCallType.TOOL_CALL, # Explicitly set even though no tool_call
)
assert len(captured_events) == 1
assert captured_events[0].call_type == LLMCallType.TOOL_CALL
class TestStreamingToolCallExtraction:
"""Tests for tool call extraction from streaming events."""
def test_extract_tool_call_info_from_event(self) -> None:
"""Test that tool call info is correctly extracted from LLMStreamChunkEvent."""
from crewai.utilities.streaming import _extract_tool_call_info
from crewai.events.types.llm_events import (
LLMStreamChunkEvent,
ToolCall,
FunctionCall,
)
from crewai.types.streaming import StreamChunkType
# Create event with tool call
tool_call = ToolCall(
id="call-extract-test",
function=FunctionCall(
name="extract_test",
arguments='{"key": "value"}',
),
type="function",
index=2,
)
event = LLMStreamChunkEvent(
chunk='{"key": "value"}',
tool_call=tool_call,
)
chunk_type, tool_call_chunk = _extract_tool_call_info(event)
assert chunk_type == StreamChunkType.TOOL_CALL
assert tool_call_chunk is not None
assert tool_call_chunk.tool_id == "call-extract-test"
assert tool_call_chunk.tool_name == "extract_test"
assert tool_call_chunk.arguments == '{"key": "value"}'
assert tool_call_chunk.index == 2
def test_extract_tool_call_info_returns_text_for_no_tool_call(self) -> None:
"""Test that TEXT type is returned when no tool call is present."""
from crewai.utilities.streaming import _extract_tool_call_info
from crewai.events.types.llm_events import LLMStreamChunkEvent
from crewai.types.streaming import StreamChunkType
event = LLMStreamChunkEvent(
chunk="Just text content",
tool_call=None,
)
chunk_type, tool_call_chunk = _extract_tool_call_info(event)
assert chunk_type == StreamChunkType.TEXT
assert tool_call_chunk is None