commit cf45026e75 (parent c9f47e6a37)
Author: Lucas Gomide
Date:   2025-04-10 12:30:36 -03:00


@@ -5,6 +5,7 @@ import sys
 import threading
 import warnings
 from contextlib import contextmanager
+from types import SimpleNamespace
 from typing import (
     Any,
     Dict,
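
The new SimpleNamespace import is used further down to wrap the accumulated tool-call data in an object that exposes the attribute access _handle_tool_call expects. A minimal sketch of that pattern (the tool name and arguments here are illustrative, not from this codebase):

    from types import SimpleNamespace

    # Ad-hoc object whose shape mimics a provider tool-call object:
    # both tool_call.function.name and tool_call.function.arguments resolve.
    tool_call = SimpleNamespace(
        function=SimpleNamespace(name="get_weather", arguments='{"city": "Lisbon"}')
    )
    assert tool_call.function.name == "get_weather"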
@@ -371,6 +372,8 @@ class LLM(BaseLLM):
 last_chunk = None
 chunk_count = 0
 usage_info = None
+tool_calls = None
+accumulated_tool_args = {}  # Track tool call arguments by index

 # --- 2) Make sure stream is set to True and include usage metrics
 params["stream"] = True
@@ -392,7 +395,6 @@ class LLM(BaseLLM):
 if isinstance(chunk, dict) and "choices" in chunk:
     choices = chunk["choices"]
 elif hasattr(chunk, "choices"):
-    # Check if choices is not a type but an actual attribute with value
     if not isinstance(getattr(chunk, "choices"), type):
         choices = getattr(chunk, "choices")
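
The isinstance(..., type) guard kept here filters out the case where getattr resolves to a class-level attribute that is itself a type (for example an annotation placeholder on a stub object) rather than real payload. A standalone sketch of what the guard rejects (FakeChunk is a hypothetical illustration):

    class FakeChunk:
        choices = list  # a type hung on the class, not actual data

    chunk = FakeChunk()
    value = getattr(chunk, "choices")
    print(isinstance(value, type))  # True -> the guard skips this chunk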
@@ -400,14 +402,97 @@ class LLM(BaseLLM):
 if isinstance(chunk, dict) and "usage" in chunk:
     usage_info = chunk["usage"]
 elif hasattr(chunk, "usage"):
-    # Check if usage is not a type but an actual attribute with value
     if not isinstance(getattr(chunk, "usage"), type):
         usage_info = getattr(chunk, "usage")

 if choices and len(choices) > 0:
     choice = choices[0]

-    # Handle different delta formats
+    # Check for tool calls in the chunk
+    if "delta" in choice:
+        delta = choice["delta"]
+        if "tool_calls" in delta:
+            tool_calls = delta["tool_calls"]
+
+            # If we have tool calls and available functions, accumulate arguments
+            if tool_calls and available_functions:
+                for tool_call in tool_calls:
+                    if hasattr(tool_call, "index"):
+                        index = tool_call.index
+                        if index not in accumulated_tool_args:
+                            accumulated_tool_args[index] = {
+                                "name": None,
+                                "arguments": "",
+                            }
+
+                        # Update tool call name if available
+                        if hasattr(tool_call, "function") and hasattr(tool_call.function, "name"):
+                            if tool_call.function.name:
+                                accumulated_tool_args[index]["name"] = tool_call.function.name
+
+                        # Accumulate arguments
+                        if hasattr(tool_call, "function") and hasattr(tool_call.function, "arguments"):
+                            if tool_call.function.arguments:
+                                accumulated_tool_args[index]["arguments"] += tool_call.function.arguments
+
+                        # Check if we have a complete tool call
+                        if accumulated_tool_args[index]["name"] and accumulated_tool_args[index]["arguments"]:
+                            try:
+                                # Try to parse the accumulated arguments
+                                json.loads(accumulated_tool_args[index]["arguments"])
+
+                                # Execute the tool call
+                                tool_result = self._handle_tool_call(
+                                    [
+                                        SimpleNamespace(
+                                            function=SimpleNamespace(
+                                                name=accumulated_tool_args[index]["name"],
+                                                arguments=accumulated_tool_args[index]["arguments"],
+                                            ),
+                                        )
+                                    ],
+                                    available_functions,
+                                )
+                                if tool_result is not None:
+                                    # Stream the tool result
+                                    crewai_event_bus.emit(
+                                        self,
+                                        event=LLMStreamChunkEvent(chunk=tool_result),
+                                    )
+                                    return tool_result
+                            except json.JSONDecodeError:
+                                # If JSON is incomplete, continue accumulating
+                                continue
+
+    # Handle different delta formats for content
     delta = None
     if isinstance(choice, dict) and "delta" in choice:
         delta = choice["delta"]
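
The added block implements incremental tool-call handling: providers stream function arguments as JSON fragments, so the code accumulates them per tool-call index and only executes once the buffered string parses as valid JSON. A self-contained sketch of that accumulate-then-parse loop (the accumulate helper and the sample fragments are illustrative, not part of this codebase):

    import json

    def accumulate(deltas):
        """Merge streamed tool-call fragments keyed by index; return the
        (name, parsed_args) pair once the argument buffer is valid JSON."""
        acc = {}
        for d in deltas:
            entry = acc.setdefault(d["index"], {"name": None, "arguments": ""})
            if d.get("name"):
                entry["name"] = d["name"]
            entry["arguments"] += d.get("arguments", "")
            if entry["name"] and entry["arguments"]:
                try:
                    return entry["name"], json.loads(entry["arguments"])
                except json.JSONDecodeError:
                    continue  # arguments still incomplete; keep accumulating
        return None

    # Fragments of '{"city": "Lisbon"}' arriving across three chunks:
    fragments = [
        {"index": 0, "name": "get_weather", "arguments": '{"ci'},
        {"index": 0, "arguments": 'ty": "Lis'},
        {"index": 0, "arguments": 'bon"}'},
    ]
    print(accumulate(fragments))  # ('get_weather', {'city': 'Lisbon'})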
@@ -416,17 +501,13 @@ class LLM(BaseLLM):
     # Extract content from delta
     if delta:
-        # Handle dict format
         if isinstance(delta, dict):
             if "content" in delta and delta["content"] is not None:
                 chunk_content = delta["content"]
-        # Handle object format
         elif hasattr(delta, "content"):
             chunk_content = getattr(delta, "content")

-        # Handle case where content might be None or empty
         if chunk_content is None and isinstance(delta, dict):
-            # Some models might send empty content chunks
             chunk_content = ""
 except Exception as e:
     logging.debug(f"Error extracting content from chunk: {e}")
@@ -434,10 +515,7 @@ class LLM(BaseLLM):
 # Only add non-None content to the response
 if chunk_content is not None:
-    # Add the chunk content to the full response
     full_response += chunk_content
-
-    # Emit the chunk event
     crewai_event_bus.emit(
         self,
         event=LLMStreamChunkEvent(chunk=chunk_content),
@@ -450,9 +528,7 @@ class LLM(BaseLLM):
 )
 non_streaming_params = params.copy()
 non_streaming_params["stream"] = False
-non_streaming_params.pop(
-    "stream_options", None
-)  # Remove stream_options for non-streaming call
+non_streaming_params.pop("stream_options", None)
 return self._handle_non_streaming_response(
     non_streaming_params, callbacks, available_functions
 )
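
The fallback path reuses the original request params for a non-streaming retry; pop("stream_options", None) drops a streaming-only key without raising if it is absent. The same pattern in isolation (param values are illustrative):

    params = {"model": "gpt-4o", "stream": True, "stream_options": {"include_usage": True}}

    non_streaming_params = params.copy()
    non_streaming_params["stream"] = False
    non_streaming_params.pop("stream_options", None)  # no KeyError if the key is missing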
@@ -464,7 +540,6 @@ class LLM(BaseLLM):
 )
 if last_chunk is not None:
     try:
-        # Try to extract content from the last chunk's message
         choices = None
         if isinstance(last_chunk, dict) and "choices" in last_chunk:
             choices = last_chunk["choices"]
@@ -474,8 +549,6 @@ class LLM(BaseLLM):
 if choices and len(choices) > 0:
     choice = choices[0]
-
-    # Try to get content from message
     message = None
     if isinstance(choice, dict) and "message" in choice:
         message = choice["message"]
@@ -500,57 +573,14 @@ class LLM(BaseLLM):
f"Last chunk format: {type(last_chunk)}, content: {last_chunk}" f"Last chunk format: {type(last_chunk)}, content: {last_chunk}"
) )
# --- 6) If still empty, raise an error instead of using a default response # --- 6) If still empty, raise an error
if not full_response.strip(): if not full_response.strip():
raise Exception( raise Exception(
"No content received from streaming response. Received empty chunks or failed to extract content." "No content received from streaming response. Received empty chunks or failed to extract content."
) )
# --- 7) Check for tool calls in the final response # --- 7) Log token usage and emit completion event
tool_calls = None
try:
if last_chunk:
choices = None
if isinstance(last_chunk, dict) and "choices" in last_chunk:
choices = last_chunk["choices"]
elif hasattr(last_chunk, "choices"):
if not isinstance(getattr(last_chunk, "choices"), type):
choices = getattr(last_chunk, "choices")
if choices and len(choices) > 0:
choice = choices[0]
message = None
if isinstance(choice, dict) and "message" in choice:
message = choice["message"]
elif hasattr(choice, "message"):
message = getattr(choice, "message")
if message:
if isinstance(message, dict) and "tool_calls" in message:
tool_calls = message["tool_calls"]
elif hasattr(message, "tool_calls"):
tool_calls = getattr(message, "tool_calls")
except Exception as e:
logging.debug(f"Error checking for tool calls: {e}")
# --- 8) If no tool calls or no available functions, return the text response directly
if not tool_calls or not available_functions:
# Log token usage if available in streaming mode
self._handle_streaming_callbacks(callbacks, usage_info, last_chunk)
# Emit completion event and return response
self._handle_emit_call_events(full_response, LLMCallType.LLM_CALL)
return full_response
# --- 9) Handle tool calls if present
tool_result = self._handle_tool_call(tool_calls, available_functions)
if tool_result is not None:
return tool_result
# --- 10) Log token usage if available in streaming mode
self._handle_streaming_callbacks(callbacks, usage_info, last_chunk) self._handle_streaming_callbacks(callbacks, usage_info, last_chunk)
# --- 11) Emit completion event and return response
self._handle_emit_call_events(full_response, LLMCallType.LLM_CALL) self._handle_emit_call_events(full_response, LLMCallType.LLM_CALL)
return full_response return full_response
@@ -561,7 +591,6 @@ class LLM(BaseLLM):
 self._handle_emit_call_events(full_response, LLMCallType.LLM_CALL)
 return full_response

-# Emit failed event and re-raise the exception
 crewai_event_bus.emit(
     self,
     event=LLMCallFailedEvent(error=str(e)),