Brandon Hancock
2025-03-17 13:03:57 -04:00
parent 8e3af76252
commit e9fa9c5700


@@ -1,6 +1,7 @@
import asyncio
import json
import re
import uuid # Add import for generating unique keys
from typing import Any, Dict, List, Optional, Type, Union, cast
from pydantic import BaseModel, Field, PrivateAttr, model_validator
@@ -8,8 +9,17 @@ from pydantic import BaseModel, Field, PrivateAttr, model_validator
from crewai.agents.agent_builder.base_agent import BaseAgent
from crewai.agents.agent_builder.utilities.base_token_process import TokenProcess
from crewai.agents.cache import CacheHandler
from crewai.agents.parser import (
AgentAction,
AgentFinish,
CrewAgentParser,
OutputParserException,
)
from crewai.agents.tools_handler import ToolsHandler
from crewai.llm import LLM
from crewai.tools.base_tool import BaseTool
from crewai.tools.structured_tool import CrewStructuredTool
from crewai.tools.tool_calling import ToolCalling
from crewai.types.usage_metrics import UsageMetrics
from crewai.utilities.events.agent_events import (
LiteAgentExecutionCompletedEvent,
@@ -17,10 +27,19 @@ from crewai.utilities.events.agent_events import (
LiteAgentExecutionStartedEvent,
)
from crewai.utilities.events.crewai_event_bus import crewai_event_bus
from crewai.utilities.events.tool_usage_events import ToolUsageStartedEvent
from crewai.utilities.llm_utils import create_llm
from crewai.utilities.token_counter_callback import TokenCalcHandler
class ToolResult:
"""Result of tool execution."""
def __init__(self, result: str, result_as_answer: bool = False):
self.result = result
self.result_as_answer = result_as_answer
class LiteAgentOutput(BaseModel):
"""Class that represents the result of a LiteAgent execution."""
@@ -104,10 +123,21 @@ class LiteAgent(BaseModel):
_cache_handler: CacheHandler = PrivateAttr(default_factory=CacheHandler)
_times_executed: int = PrivateAttr(default=0)
_max_retry_limit: int = PrivateAttr(default=2)
_key: str = PrivateAttr(default_factory=lambda: str(uuid.uuid4()))
# Store tool results for tracking
_tools_results: List[Dict[str, Any]] = PrivateAttr(default_factory=list)
# Store messages for conversation
_messages: List[Dict[str, str]] = PrivateAttr(default_factory=list)
# Iteration counter
_iterations: int = PrivateAttr(default=0)
# Tracking metrics
_formatting_errors: int = PrivateAttr(default=0)
_tools_errors: int = PrivateAttr(default=0)
_delegations: Dict[str, int] = PrivateAttr(default_factory=dict)
@model_validator(mode="after")
def setup_llm(self):
"""Set up the LLM and other components after initialization."""
if self.llm is None:
raise ValueError("LLM must be provided")
@@ -116,25 +146,83 @@ class LiteAgent(BaseModel):
return self
@property
def key(self) -> str:
"""Get the unique key for this agent instance."""
return self._key
@property
def _original_role(self) -> str:
"""Return the original role for compatibility with tool interfaces."""
return self.role
def _get_default_system_prompt(self) -> str:
"""Get the default system prompt for the agent."""
prompt = f"""You are a helpful AI assistant acting as {self.role}.
Your goal is: {self.goal}
Your backstory: {self.backstory}
When using tools, you MUST follow this EXACT format with the precise spacing and newlines as shown:
Thought: <your reasoning about what needs to be done>
Action: <tool_name>
Action Input: {{
"parameter1": "value1",
"parameter2": "value2"
}}
Observation: [Result of the tool execution will appear here]
You can then continue with another tool:
Thought: <your reasoning about what to do next>
Action: <another_tool_name>
Action Input: {{
"parameter1": "value1"
}}
Observation: [Result of the tool execution will appear here]
When you have a final answer and don't need to use any more tools, respond with:
Thought: <your reasoning about the final answer>
Final Answer: <your final answer to the user>
Here's a concrete example of proper tool usage:
Thought: I need to find out the weather in New York City.
Action: get_weather
Action Input: {{
"city": "New York City"
}}
Observation: [The weather result would appear here]
Thought: Now I need to save this weather data.
Action: save_weather_data
Action Input: {{
"filename": "weather_history.txt"
}}
Observation: [The result of saving would appear here]
Thought: I now have all the information I need to answer the user's question.
Final Answer: The weather in New York City today is [weather details] and I've saved this information to the weather_history.txt file.
Always maintain the exact format shown above, with blank lines between sections and properly formatted inputs for tools.
"""
return prompt
def _format_tools_description(self) -> str:
@@ -147,24 +235,70 @@ class LiteAgent(BaseModel):
tools_str += f"Tool: {tool.name}\n" tools_str += f"Tool: {tool.name}\n"
tools_str += f"Description: {tool.description}\n" tools_str += f"Description: {tool.description}\n"
if hasattr(tool, "args_schema"): if hasattr(tool, "args_schema"):
tools_str += f"Parameters: {tool.args_schema}\n" schema_info = ""
try:
if hasattr(tool.args_schema, "model_json_schema"):
schema = tool.args_schema.model_json_schema()
if "properties" in schema:
schema_info = ", ".join(
[
f"{k}: {v.get('type', 'any')}"
for k, v in schema["properties"].items()
]
)
else:
schema_info = str(schema)
except Exception:
schema_info = "Unable to parse schema"
tools_str += f"Parameters: {schema_info}\n"
tools_str += "\n" tools_str += "\n"
return tools_str return tools_str
def _parse_tools(self) -> List[Any]: def _get_tools_names(self) -> str:
"""Get a comma-separated list of tool names."""
return ", ".join([tool.name for tool in self.tools])
def _parse_tools(self) -> List[Dict[str, Any]]:
"""Parse tools to be used by the agent.""" """Parse tools to be used by the agent."""
tools_list = [] tools_list = []
try: for tool in self.tools:
from crewai.tools import BaseTool as CrewAITool try:
# First try to use the to_structured_tool method if available
if hasattr(tool, "to_structured_tool"):
structured_tool = tool.to_structured_tool()
if structured_tool and isinstance(structured_tool, dict):
tools_list.append(structured_tool)
continue
# Fall back to manual conversion if to_structured_tool is not available or fails
tool_dict = {
"type": "function",
"function": {
"name": tool.name,
"description": tool.description,
},
}
# Add args schema if available
if hasattr(tool, "args_schema") and tool.args_schema:
try:
if hasattr(tool.args_schema, "model_json_schema"):
tool_dict["function"][
"parameters"
] = tool.args_schema.model_json_schema()
except Exception as e:
if self.verbose:
print(
f"Warning: Could not get schema for tool {tool.name}: {e}"
)
tools_list.append(tool_dict)
except Exception as e:
if self.verbose:
print(f"Error converting tool {tool.name}: {e}")
return tools_list
@@ -218,6 +352,72 @@ class LiteAgent(BaseModel):
print(f"Error extracting structured output: {e}") print(f"Error extracting structured output: {e}")
return None return None
def _preprocess_model_output(self, text: str) -> str:
"""Preprocess the model output to correct common formatting issues."""
# Skip if the text is empty
if not text or text.strip() == "":
return "Thought: I need to provide an answer.\n\nFinal Answer: I don't have enough information to provide a complete answer."
# Remove 'Action' or 'Final Answer' from anywhere after a proper Thought
if "Thought:" in text and ("Action:" in text and "Final Answer:" in text):
# This is a case where both Action and Final Answer appear - clear conflict
# Check which one appears first and keep only that one
action_index = text.find("Action:")
final_answer_index = text.find("Final Answer:")
if action_index != -1 and final_answer_index != -1:
if action_index < final_answer_index:
# Keep only the Action part
text = text[:final_answer_index]
else:
# Keep only the Final Answer part
text = text[:action_index] + text[final_answer_index:]
if self.verbose:
print("Removed conflicting Action/Final Answer parts")
# Check if this looks like a tool usage attempt without proper formatting
if any(tool.name in text for tool in self.tools) and "Action:" not in text:
# Try to extract tool name and input
for tool in self.tools:
if tool.name in text:
# Find the tool name in the text
parts = text.split(tool.name, 1)
if len(parts) > 1:
# Try to extract input as JSON
input_text = parts[1]
json_match = re.search(r"(\{[\s\S]*\})", input_text)
if json_match:
# Construct a properly formatted response
formatted = "Thought: I need to use a tool to help with this task.\n\n"
formatted += f"Action: {tool.name}\n\n"
formatted += f"Action Input: {json_match.group(1)}\n"
if self.verbose:
print(f"Reformatted tool usage: {tool.name}")
return formatted
# Check if this looks like a final answer without proper formatting
if (
"Final Answer:" not in text
and not any(tool.name in text for tool in self.tools)
and "Action:" not in text
):
# This might be a direct response, format it as a final answer
# Don't format if text already has a "Thought:" section
if "Thought:" not in text:
formatted = "Thought: I can now provide the final answer.\n\n"
formatted += f"Final Answer: {text}\n"
if self.verbose:
print("Reformatted as final answer")
return formatted
return text
def kickoff(self, messages: Union[str, List[Dict[str, str]]]) -> LiteAgentOutput:
"""
Execute the agent with the given messages.
@@ -246,11 +446,12 @@ class LiteAgent(BaseModel):
Returns:
LiteAgentOutput: The result of the agent execution.
"""
# Reset state for this run
self._iterations = 0
self._tools_results = []
# Format messages for the LLM
self._messages = self._format_messages(messages)
# Get the original query for event emission
query = messages if isinstance(messages, str) else messages[-1]["content"]
@@ -275,12 +476,11 @@ class LiteAgent(BaseModel):
)
try:
# Execute the agent using invoke loop
result = await self._invoke()
# Extract structured output if response_format is set
pydantic_output = None
if self.response_format:
structured_output = self._extract_structured_output(result)
if isinstance(structured_output, BaseModel):
@@ -332,29 +532,243 @@ class LiteAgent(BaseModel):
raise e
async def _invoke(self) -> str:
"""
Run the agent's thought process until it reaches a conclusion or max iterations.
Similar to _invoke_loop in CrewAgentExecutor.
Returns:
str: The final result of the agent execution.
"""
# Set up tools handler for tool execution
tools_handler = ToolsHandler(cache=self._cache_handler)
# Set up callbacks for token tracking
token_callback = TokenCalcHandler(token_cost_process=self._token_process)
callbacks = [token_callback]
# Prepare tool configurations
parsed_tools = self._parse_tools()
tools_description = self._format_tools_description()
tools_names = self._get_tools_names()
# Create a mapping of tool names to tools for easier lookup
tool_map = {tool.name: tool for tool in self.tools}
# Execute the agent loop
formatted_answer = None
while self._iterations < self.max_iterations:
try:
# Execute the LLM
llm_instance = self.llm
if not isinstance(llm_instance, LLM):
llm_instance = create_llm(llm_instance)
if llm_instance is None:
raise ValueError(
"LLM instance is None. Please provide a valid LLM."
)
# Set response_format if supported
try:
if (
self.response_format
and hasattr(llm_instance, "response_format")
and not llm_instance.response_format
):
provider = getattr(
llm_instance, "_get_custom_llm_provider", lambda: None
)()
from litellm.utils import supports_response_schema
if hasattr(llm_instance, "model") and supports_response_schema(
model=llm_instance.model, custom_llm_provider=provider
):
llm_instance.response_format = self.response_format
except Exception as e:
if self.verbose:
print(f"Warning: Could not set response_format: {e}")
# Get the LLM's response
answer = llm_instance.call(
messages=self._messages,
tools=parsed_tools,
callbacks=callbacks,
)
# Keep a copy of the original answer in case we need to fall back to it
original_answer = answer
# Pre-process the answer to correct formatting issues
answer = self._preprocess_model_output(answer)
# Parse the response into an action or final answer
parser = CrewAgentParser(agent=cast(BaseAgent, self))
try:
formatted_answer = parser.parse(answer)
except OutputParserException as e:
if self.verbose:
print(f"Parser error: {str(e)}")
# If we have a Final Answer format error and the original answer is substantive,
# return it directly if it looks like a final answer
if (
"Final Answer" in str(e)
and len(original_answer.strip()) > 20
and "Action:" not in original_answer
):
if self.verbose:
print(
"Returning original answer directly as final response"
)
return original_answer
# Try to reformat and parse again
reformatted = self._preprocess_model_output(
"Thought: I need to provide an answer.\n\nFinal Answer: "
+ original_answer
)
# Try parsing again
try:
formatted_answer = parser.parse(reformatted)
except Exception:
# If we still can't parse, just use the original answer
return original_answer
# If the agent wants to use a tool
if isinstance(formatted_answer, AgentAction):
# Find the appropriate tool
tool_name = formatted_answer.tool
tool_input = formatted_answer.tool_input
# Emit tool usage event
crewai_event_bus.emit(
self,
event=ToolUsageStartedEvent(
agent_key=self.key,
agent_role=self.role,
tool_name=tool_name,
tool_args=tool_input,
tool_class=tool_name,
),
)
# Use the tool
if tool_name in tool_map:
tool = tool_map[tool_name]
try:
if hasattr(tool, "_run"):
# BaseTool interface
# Ensure tool_input is a proper dict with string keys
if isinstance(tool_input, dict):
result = tool._run(
**{str(k): v for k, v in tool_input.items()}
)
else:
result = tool._run(tool_input)
elif hasattr(tool, "run"):
# Another common interface
if isinstance(tool_input, dict):
result = tool.run(
**{str(k): v for k, v in tool_input.items()}
)
else:
result = tool.run(tool_input)
else:
result = f"Error: Tool '{tool_name}' does not have a supported execution method."
# Check if tool result should be the final answer
result_as_answer = getattr(tool, "result_as_answer", False)
# Add to tools_results for tracking
self._tools_results.append(
{
"result": result,
"tool_name": tool_name,
"tool_args": tool_input,
"result_as_answer": result_as_answer,
}
)
# Create tool result
tool_result = ToolResult(
result=result, result_as_answer=result_as_answer
)
# If the tool result should be the final answer, return it
if tool_result.result_as_answer:
return tool_result.result
# Add the result to the formatted answer and messaging
formatted_answer.result = tool_result.result
formatted_answer.text += (
f"\nObservation: {tool_result.result}"
)
# Execute the step callback if provided
if self.step_callback:
self.step_callback(formatted_answer)
# Add the assistant message to the conversation
self._messages.append(
{"role": "assistant", "content": formatted_answer.text}
)
except Exception as e:
error_message = f"Error using tool '{tool_name}': {str(e)}"
if self.verbose:
print(error_message)
# Add error message to conversation
self._messages.append(
{"role": "user", "content": error_message}
)
else:
# Tool not found
error_message = f"Tool '{tool_name}' not found. Available tools: {tools_names}"
if self.verbose:
print(error_message)
# Add error message to conversation
self._messages.append(
{"role": "user", "content": error_message}
)
# If the agent provided a final answer
elif isinstance(formatted_answer, AgentFinish):
# Execute the step callback if provided
if self.step_callback:
self.step_callback(formatted_answer)
# Return the output
return formatted_answer.output
else:
# If formatted_answer is None, return the original answer
if not formatted_answer and original_answer:
return original_answer
# Increment the iteration counter
self._iterations += 1
except Exception as e:
if self.verbose:
print(f"Error during agent execution: {e}")
# Add error message to conversation
self._messages.append({"role": "user", "content": f"Error: {str(e)}"})
self._iterations += 1
# If we've reached max iterations without a final answer, force one
if self.verbose:
print("Maximum iterations reached. Requesting final answer.")
# Add a message requesting a final answer
self._messages.append(
{
"role": "user",
"content": "You've been thinking for a while. Please provide your final answer now.",
}
)
# Get the final answer from the LLM
llm_instance = self.llm
if not isinstance(llm_instance, LLM):
llm_instance = create_llm(llm_instance)
@@ -362,33 +776,34 @@ class LiteAgent(BaseModel):
if llm_instance is None:
raise ValueError("LLM instance is None. Please provide a valid LLM.")
final_answer = llm_instance.call(
messages=self._messages,
callbacks=callbacks,
)
return final_answer
@property
def tools_results(self) -> List[Dict[str, Any]]:
"""Get the tools results for this agent."""
return self._tools_results
def increment_formatting_errors(self) -> None:
"""Increment the formatting errors counter."""
self._formatting_errors += 1
def increment_tools_errors(self) -> None:
"""Increment the tools errors counter."""
self._tools_errors += 1
def increment_delegations(self, agent_name: Optional[str] = None) -> None:
"""
Increment the delegations counter for a specific agent.
Args:
agent_name: The name of the agent being delegated to.
"""
if agent_name:
if agent_name not in self._delegations:
self._delegations[agent_name] = 0
self._delegations[agent_name] += 1
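
For context, here is a minimal usage sketch of the reworked kickoff/_invoke loop introduced in this commit. It is not part of the diff: it assumes the LiteAgent fields visible above (role, goal, backstory, llm, tools, verbose) are accepted as constructor keywords, that a crewai BaseTool subclass with a _run method is used as a tool, and that the module path and model name shown are placeholders.

# Hypothetical usage sketch (not part of this commit): exercises the new
# Thought/Action/Final Answer loop in LiteAgent via kickoff().
from typing import Type
from pydantic import BaseModel, Field
from crewai.tools.base_tool import BaseTool
from crewai.lite_agent import LiteAgent  # assumed module path

class WeatherInput(BaseModel):
    city: str = Field(..., description="City to look up")

class GetWeatherTool(BaseTool):
    name: str = "get_weather"
    description: str = "Return a short weather summary for a city."
    args_schema: Type[BaseModel] = WeatherInput

    def _run(self, city: str) -> str:
        # A real tool would call a weather API here.
        return f"Sunny and 22C in {city}."

agent = LiteAgent(
    role="Weather Assistant",
    goal="Answer weather questions using the available tools",
    backstory="You help users check the weather.",
    llm="gpt-4o-mini",  # non-LLM values are resolved through create_llm() per the diff
    tools=[GetWeatherTool()],
    verbose=True,
)

result = agent.kickoff("What is the weather in New York City?")
print(result)               # LiteAgentOutput; its exact fields are not shown in this diff
print(agent.tools_results)  # tool-call tracking added in this commit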