mirror of https://github.com/crewAIInc/crewAI.git
synced 2026-01-01 12:18:31 +00:00

Compare commits: gl/fix/age...lg-fix-env
2 commits: 714d9d01a1, 0ff0257d98
.cursorrules (1429 lines changed; diff suppressed because it is too large)
.github/workflows/tests.yml (20 lines changed, vendored)

@@ -7,18 +7,14 @@ permissions:
 env:
   OPENAI_API_KEY: fake-api-key
   PYTHONUNBUFFERED: 1

 jobs:
   tests:
     name: tests (${{ matrix.python-version }})
     runs-on: ubuntu-latest
     timeout-minutes: 15
     strategy:
       fail-fast: true
       matrix:
         python-version: ['3.10', '3.11', '3.12', '3.13']
         group: [1, 2, 3, 4, 5, 6, 7, 8]
     steps:
       - name: Checkout code
         uses: actions/checkout@v4
@@ -27,9 +23,6 @@ jobs:
         uses: astral-sh/setup-uv@v3
         with:
           enable-cache: true
           cache-dependency-glob: |
             **/pyproject.toml
             **/uv.lock

       - name: Set up Python ${{ matrix.python-version }}
         run: uv python install ${{ matrix.python-version }}
@@ -37,14 +30,5 @@ jobs:
       - name: Install the project
         run: uv sync --dev --all-extras

-      - name: Run tests (group ${{ matrix.group }} of 8)
-        run: |
-          uv run pytest \
-            --block-network \
-            --timeout=30 \
-            -vv \
-            --splits 8 \
-            --group ${{ matrix.group }} \
-            --durations=10 \
-            -n auto \
-            --maxfail=3
+      - name: Run tests
+        run: uv run pytest --block-network --timeout=60 -vv
.gitignore (3 lines changed, vendored)

@@ -26,5 +26,4 @@ test_flow.html
 crewairules.mdc
 plan.md
 conceptual_plan.md
-build_image
-chromadb-*.lock
+build_image
docs/docs.json (171 lines changed)

@@ -9,7 +9,12 @@
   },
   "favicon": "/images/favicon.svg",
   "contextual": {
-    "options": ["copy", "view", "chatgpt", "claude"]
+    "options": [
+      "copy",
+      "view",
+      "chatgpt",
+      "claude"
+    ]
   },
   "navigation": {
     "languages": [
@@ -36,11 +41,6 @@
       "anchor": "Get Help",
       "href": "mailto:support@crewai.com",
       "icon": "headset"
-    },
-    {
-      "anchor": "Releases",
-      "href": "https://github.com/crewAIInc/crewAI/releases",
-      "icon": "tag"
     }
   ]
 },
@@ -50,22 +50,32 @@
 "groups": [
   {
     "group": "Get Started",
-    "pages": ["en/introduction", "en/installation", "en/quickstart"]
+    "pages": [
+      "en/introduction",
+      "en/installation",
+      "en/quickstart"
+    ]
   },
   {
     "group": "Guides",
     "pages": [
       {
         "group": "Strategy",
-        "pages": ["en/guides/concepts/evaluating-use-cases"]
+        "pages": [
+          "en/guides/concepts/evaluating-use-cases"
+        ]
       },
       {
         "group": "Agents",
-        "pages": ["en/guides/agents/crafting-effective-agents"]
+        "pages": [
+          "en/guides/agents/crafting-effective-agents"
+        ]
       },
       {
         "group": "Crews",
-        "pages": ["en/guides/crews/first-crew"]
+        "pages": [
+          "en/guides/crews/first-crew"
+        ]
       },
       {
         "group": "Flows",
@@ -166,9 +176,7 @@
         "en/tools/search-research/websitesearchtool",
         "en/tools/search-research/codedocssearchtool",
         "en/tools/search-research/youtubechannelsearchtool",
-        "en/tools/search-research/youtubevideosearchtool",
-        "en/tools/search-research/tavilysearchtool",
-        "en/tools/search-research/tavilyextractortool"
+        "en/tools/search-research/youtubevideosearchtool"
       ]
     },
     {
@@ -227,7 +235,6 @@
       "en/observability/langtrace",
       "en/observability/maxim",
       "en/observability/mlflow",
-      "en/observability/neatlogs",
       "en/observability/openlit",
       "en/observability/opik",
       "en/observability/patronus-evaluation",
@@ -261,7 +268,9 @@
   },
   {
     "group": "Telemetry",
-    "pages": ["en/telemetry"]
+    "pages": [
+      "en/telemetry"
+    ]
   }
 ]
 },
@@ -270,7 +279,9 @@
 "groups": [
   {
     "group": "Getting Started",
-    "pages": ["en/enterprise/introduction"]
+    "pages": [
+      "en/enterprise/introduction"
+    ]
   },
   {
     "group": "Features",
@@ -279,8 +290,7 @@
       "en/enterprise/features/webhook-streaming",
       "en/enterprise/features/traces",
       "en/enterprise/features/hallucination-guardrail",
-      "en/enterprise/features/integrations",
-      "en/enterprise/features/agent-repositories"
+      "en/enterprise/features/integrations"
     ]
   },
   {
@@ -325,7 +335,9 @@
   },
   {
     "group": "Resources",
-    "pages": ["en/enterprise/resources/frequently-asked-questions"]
+    "pages": [
+      "en/enterprise/resources/frequently-asked-questions"
+    ]
   }
 ]
 },
@@ -334,7 +346,9 @@
 "groups": [
   {
     "group": "Getting Started",
-    "pages": ["en/api-reference/introduction"]
+    "pages": [
+      "en/api-reference/introduction"
+    ]
   },
   {
     "group": "Endpoints",
@@ -347,7 +361,20 @@
 "groups": [
   {
     "group": "Examples",
-    "pages": ["en/examples/example"]
+    "pages": [
+      "en/examples/example"
+    ]
   }
 ]
 },
+{
+  "tab": "Releases",
+  "groups": [
+    {
+      "group": "Releases",
+      "pages": [
+        "en/changelog"
+      ]
+    }
+  ]
+}
@@ -376,11 +403,6 @@
   "anchor": "Obter Ajuda",
   "href": "mailto:support@crewai.com",
   "icon": "headset"
-},
-{
-  "anchor": "Lançamentos",
-  "href": "https://github.com/crewAIInc/crewAI/releases",
-  "icon": "tag"
 }
 ]
 },
@@ -401,15 +423,21 @@
 "pages": [
   {
     "group": "Estratégia",
-    "pages": ["pt-BR/guides/concepts/evaluating-use-cases"]
+    "pages": [
+      "pt-BR/guides/concepts/evaluating-use-cases"
+    ]
   },
   {
     "group": "Agentes",
-    "pages": ["pt-BR/guides/agents/crafting-effective-agents"]
+    "pages": [
+      "pt-BR/guides/agents/crafting-effective-agents"
+    ]
   },
   {
     "group": "Crews",
-    "pages": ["pt-BR/guides/crews/first-crew"]
+    "pages": [
+      "pt-BR/guides/crews/first-crew"
+    ]
   },
   {
     "group": "Flows",
@@ -602,7 +630,9 @@
   },
   {
     "group": "Telemetria",
-    "pages": ["pt-BR/telemetry"]
+    "pages": [
+      "pt-BR/telemetry"
+    ]
   }
 ]
 },
@@ -611,7 +641,9 @@
 "groups": [
   {
     "group": "Começando",
-    "pages": ["pt-BR/enterprise/introduction"]
+    "pages": [
+      "pt-BR/enterprise/introduction"
+    ]
   },
   {
     "group": "Funcionalidades",
@@ -676,7 +708,9 @@
 "groups": [
   {
     "group": "Começando",
-    "pages": ["pt-BR/api-reference/introduction"]
+    "pages": [
+      "pt-BR/api-reference/introduction"
+    ]
   },
   {
     "group": "Endpoints",
@@ -689,7 +723,20 @@
 "groups": [
   {
     "group": "Exemplos",
-    "pages": ["pt-BR/examples/example"]
+    "pages": [
+      "pt-BR/examples/example"
+    ]
   }
 ]
 },
+{
+  "tab": "Lançamentos",
+  "groups": [
+    {
+      "group": "Lançamentos",
+      "pages": [
+        "pt-BR/changelog"
+      ]
+    }
+  ]
+}
@@ -730,64 +777,6 @@
 "seo": {
   "indexing": "all"
 },
-"redirects": [
-  {
-    "source": "/introduction",
-    "destination": "/en/introduction"
-  },
-  {
-    "source": "/installation",
-    "destination": "/en/installation"
-  },
-  {
-    "source": "/quickstart",
-    "destination": "/en/quickstart"
-  },
-  {
-    "source": "/changelog",
-    "destination": "https://github.com/crewAIInc/crewAI/releases"
-  },
-  {
-    "source": "/telemetry",
-    "destination": "/en/telemetry"
-  },
-  {
-    "source": "/concepts/:path*",
-    "destination": "/en/concepts/:path*"
-  },
-  {
-    "source": "/guides/:path*",
-    "destination": "/en/guides/:path*"
-  },
-  {
-    "source": "/tools/:path*",
-    "destination": "/en/tools/:path*"
-  },
-  {
-    "source": "/learn/:path*",
-    "destination": "/en/learn/:path*"
-  },
-  {
-    "source": "/mcp/:path*",
-    "destination": "/en/mcp/:path*"
-  },
-  {
-    "source": "/observability/:path*",
-    "destination": "/en/observability/:path*"
-  },
-  {
-    "source": "/enterprise/:path*",
-    "destination": "/en/enterprise/:path*"
-  },
-  {
-    "source": "/api-reference/:path*",
-    "destination": "/en/api-reference/:path*"
-  },
-  {
-    "source": "/examples/:path*",
-    "destination": "/en/examples/:path*"
-  }
-],
 "errors": {
   "404": {
     "redirect": true
docs/en/changelog.mdx (new file, 473 lines)

@@ -0,0 +1,473 @@
---
title: Changelog
description: View the latest updates and changes to CrewAI
icon: timeline
---

<Update label="2025-05-22" description="v0.121.0" tags={["Latest"]}>
## Release Highlights
<Frame>
<img src="/images/releases/v01210.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.121.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Fixed an encoding error when creating tools
- Fixed a failing llama test
- Updated the logging configuration for consistency
- Enhanced telemetry initialization and event handling

**New Features & Enhancements**
- Added a **markdown attribute** to the Task class
- Added a **reasoning attribute** to the Agent class
- Added an **inject_date flag** to Agent for automatic date injection
- Implemented **HallucinationGuardrail** (no-op with test coverage)

**Documentation & Guides**
- Added documentation for **StagehandTool** and improved the MDX structure
- Added documentation for **MCP integration** and updated the enterprise docs
- Documented knowledge events and updated the reasoning docs
- Added `stop` parameter documentation
- Fixed import references in doc examples (`before_kickoff`, `after_kickoff`)
- General docs updates and restructuring for clarity
</Update>

<Update label="2025-05-15" description="v0.120.1">
## Release Highlights
<Frame>
<img src="/images/releases/v01201.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.120.1">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Fixed **interpolation with hyphens**
</Update>

<Update label="2025-05-14" description="v0.120.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01200.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.120.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Enabled the **full Ruff rule set** by default for stricter linting
- Addressed a race condition in FilteredStream using context managers
- Fixed an agent knowledge reset issue
- Refactored agent-fetching logic into a utility module

**New Features & Enhancements**
- Added support for **loading an Agent directly from a repository**
- Enabled setting an empty context for Task
- Enhanced Agent repository feedback and fixed Tool auto-import behavior
- Introduced direct initialization of knowledge (bypassing `knowledge_sources`)

**Documentation & Guides**
- Updated security.md for current security practices
- Cleaned up the Google setup section for clarity
- Added a link to AI Studio when entering a Gemini key
- Updated the Arize Phoenix observability guide
- Refreshed the flow documentation
</Update>

<Update label="2025-05-08" description="v0.119.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01190.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.119.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Improved test reliability by enhancing pytest handling for flaky tests
- Fixed a memory reset crash when embedding dimensions mismatch
- Enabled parent flow identification for Crew and LiteAgent
- Prevented telemetry-related crashes when telemetry is unavailable
- Upgraded the **LiteLLM version** for better compatibility
- Fixed llama converter tests by removing `skip_external_api`

**New Features & Enhancements**
- Introduced **knowledge retrieval prompt re-writing** in Agent for improved tracking and debugging
- Made the LLM setup and quickstart guides model-agnostic

**Documentation & Guides**
- Added advanced configuration docs for the RAG tool
- Updated the Windows troubleshooting guide
- Refined documentation examples for better clarity
- Fixed typos across docs and config files
</Update>

<Update label="2025-04-28" description="v0.118.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01180.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.118.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Fixed issues with missing prompt or system templates
- Removed the global logging configuration to avoid unintended overrides
- Renamed **TaskGuardrail to LLMGuardrail** for improved clarity
- Downgraded litellm to version 1.167.1 for compatibility
- Added missing `__init__.py` files to ensure proper module initialization

**New Features & Enhancements**
- Added support for **no-code Guardrail creation** to simplify AI behavior controls

**Documentation & Guides**
- Removed CrewStructuredTool from the public documentation to reflect its internal usage
- Updated the enterprise documentation and YouTube embed for an improved onboarding experience
</Update>

<Update label="2025-04-25" description="v0.117.1">
## Release Highlights
<Frame>
<img src="/images/releases/v01171.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.117.1">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Upgraded **crewai-tools** to the latest version
- Upgraded **LiteLLM** to the latest version
- Fixed **Mem0 OSS**
</Update>

<Update label="2025-04-20" description="v0.117.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01170.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.117.0">View on GitHub</a>
</div>

**New Features & Enhancements**
- Added `result_as_answer` parameter support in the `@tool` decorator.
- Introduced support for new language models: GPT-4.1, Gemini-2.0, and Gemini-2.5 Pro.
- Enhanced knowledge management capabilities.
- Added a Hugging Face provider option in the CLI.
- Improved compatibility and CI support for Python 3.10+.

**Core Improvements & Fixes**
- Fixed issues with incorrect template parameters and missing inputs.
- Improved asynchronous flow handling with coroutine condition checks.
- Enhanced memory management with isolated configuration and correct memory object copying.
- Fixed initialization of lite agents with correct references.
- Addressed Python type hint issues and removed redundant imports.
- Updated event placement for improved tool usage tracking.
- Raised explicit exceptions when flows fail.
- Removed unused code and redundant comments from various modules.
- Updated the GitHub App token action to v2.

**Documentation & Guides**
- Enhanced the documentation structure, including enterprise deployment instructions.
- Output folders are now created automatically during documentation generation.
- Fixed a broken link in the WeaviateVectorSearchTool documentation.
- Fixed guardrail documentation usage and import paths for the JSON search tools.
- Updated the documentation for CodeInterpreterTool.
- Improved SEO, contextual navigation, and error handling for documentation pages.
</Update>

<Update label="2025-04-07" description="v0.114.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01140.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.114.0">View on GitHub</a>
</div>

**New Features & Enhancements**
- Agents as an atomic unit (`Agent(...).kickoff()`).
- Support for [Custom LLM implementations](https://docs.crewai.com/guides/advanced/custom-llm).
- Integrated External Memory and [Opik observability](https://docs.crewai.com/how-to/opik-observability).
- Enhanced YAML extraction.
- Multimodal agent validation.
- Added secure fingerprints for agents and crews.

**Core Improvements & Fixes**
- Improved serialization, agent copying, and Python compatibility.
- Added wildcard support to `emit()`.
- Added support for additional router calls and context window adjustments.
- Fixed typing issues, validation, and import statements.
- Improved method performance.
- Enhanced agent task handling, event emissions, and memory management.
- Fixed CLI issues, conditional tasks, cloning behavior, and tool outputs.

**Documentation & Guides**
- Improved documentation structure, theme, and organization.
- Added guides for local NVIDIA NIM with WSL2, W&B Weave, and Arize Phoenix.
- Updated tool configuration examples, prompts, and observability docs.
- Added a guide on using singular agents within Flows.
</Update>

<Update label="2025-03-17" description="v0.108.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01080.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.108.0">View on GitHub</a>
</div>

**New Features & Enhancements**
- Converted tabs to spaces in the `crew.py` template
- Enhanced LLM streaming response handling and the event system
- Included `model_name`
- Enhanced the event listener with rich visualization and improved logging
- Added fingerprints

**Bug Fixes**
- Fixed Mistral issues
- Fixed a bug in the documentation
- Fixed a type check error in the fingerprint property

**Documentation Updates**
- Improved tool documentation
- Updated the installation guide for the `uv` tool package
- Added instructions for upgrading crewAI with the `uv` tool
- Added documentation for `ApifyActorsTool`
</Update>

<Update label="2025-03-10" description="v0.105.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01050.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.105.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Fixed issues with missing template variables and user memory configuration
- Improved async flow support and addressed agent response formatting
- Enhanced memory reset functionality and fixed CLI memory commands
- Fixed type issues, tool calling properties, and telemetry decoupling

**New Features & Enhancements**
- Added Flow state export and improved state utilities
- Enhanced agent knowledge setup with an optional crew embedder
- Introduced an event emitter for better observability and LLM call tracking
- Added support for Python 3.10 and ChatOllama from langchain_ollama
- Integrated context window size support for the o3-mini model
- Added support for multiple router calls

**Documentation & Guides**
- Improved documentation layout and hierarchical structure
- Added a QdrantVectorSearchTool guide and clarified event listener usage
- Fixed typos in prompts and updated the Amazon Bedrock model listings
</Update>

<Update label="2025-02-12" description="v0.102.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01020.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.102.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Enhanced LLM support: improved structured LLM output, parameter handling, and formatting for Anthropic models
- Crew & agent stability: fixed issues with cloning agents/crews using knowledge sources, multiple task outputs in conditional tasks, and ignored Crew task callbacks
- Memory & storage fixes: fixed short-term memory handling with Bedrock, ensured correct embedder initialization, and added a reset-memories function to the Crew class
- Training & execution reliability: fixed broken training and interpolation issues with dict and list input types

**New Features & Enhancements**
- Advanced knowledge management: improved naming conventions and enhanced embedding configuration with custom embedder support
- Expanded logging & observability: added JSON format support for logging and integrated MLflow tracing documentation
- Data handling improvements: updated excel_knowledge_source.py to process multi-tab files
- General performance & codebase clean-up: streamlined enterprise code alignment and resolved linting issues
- Added a new tool: `QdrantVectorSearchTool`

**Documentation & Guides**
- Updated AI & memory docs: improved Bedrock, Google AI, and long-term memory documentation
- Task & workflow clarity: added a "Human Input" row to Task Attributes, a Langfuse guide, and FileWriterTool documentation
- Fixed various typos and formatting issues
</Update>

<Update label="2025-01-28" description="v0.100.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01000.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.100.0">View on GitHub</a>
</div>

**Features**
- Added Composio docs
- Added SageMaker as an LLM provider

**Fixes**
- Fixed overall LLM connection issues
- Used safe accessors on training
- Added a version check to crew_chat.py

**Documentation**
- New docs for `crewai chat`
- Improved formatting and clarity in the CLI and Composio Tool docs
</Update>

<Update label="2025-01-20" description="v0.98.0">
## Release Highlights
<Frame>
<img src="/images/releases/v0980.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.98.0">View on GitHub</a>
</div>

**Features**
- Conversation crew v1
- Added a unique ID to flow states
- Added a `@persist` decorator with the FlowPersistence interface

**Integrations**
- Added SambaNova integration
- Added an NVIDIA NIM provider to the CLI
- Introduced VoyageAI

**Fixes**
- Fixed API key behavior and entity handling in the Mem0 integration
- Fixed core invoke loop logic and relevant tests
- Made tool inputs actual objects rather than strings
- Added important missing parts to the tool-creation docs
- Dropped the litellm version to prevent a Windows issue
- Fixed `before_kickoff` when inputs are `None`
- Fixed typos, a nested Pydantic model issue, and docling issues
</Update>

<Update label="2025-01-04" description="v0.95.0">
## Release Highlights
<Frame>
<img src="/images/releases/v0950.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.95.0">View on GitHub</a>
</div>

**New Features**
- Added multimodal abilities to Crew
- Programmatic guardrails
- HITL multiple rounds
- Gemini 2.0 support
- CrewAI Flows improvements
- Added workflow permissions
- Added support for Langfuse with litellm
- Portkey integration with CrewAI
- Added an `interpolate_only` method and improved error handling
- Docling support
- Weaviate support

**Fixes**
- Fixed `output_file` not respecting the system path
- Fixed a disk I/O error when resetting short-term memory
- CrewJSONEncoder now accepts enums
- Fixed the Python max version
- Fixed interpolation for `output_file` in Task
- Handled coworker role name case/whitespace properly
- Added tiktoken as an explicit dependency and documented the Rust requirement
- Included agent knowledge in the planning process
- Changed storage initialization to None for KnowledgeStorage
- Fixed optional storage checks
- Included the event emitter in flows
- Docstring, error handling, and type hint improvements
- Suppressed UserWarnings from litellm Pydantic issues
</Update>

<Update label="2024-12-05" description="v0.86.0">
## Release Highlights
<Frame>
<img src="/images/releases/v0860.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.86.0">View on GitHub</a>
</div>

**Changes**
- Removed all references to pipeline and pipeline router
- Added NVIDIA NIM as a provider in Custom LLM
- Added a knowledge demo and improved the knowledge docs
- Added HITL multiple rounds of follow-up
- New docs about YAML crews with decorators
- Simplified the template crew
</Update>

<Update label="2024-12-04" description="v0.85.0">
## Release Highlights
<Frame>
<img src="/images/releases/v0850.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.85.0">View on GitHub</a>
</div>

**Features**
- Added knowledge at the agent level
- Removed LangChain
- Improved typed task outputs
- Log in to the Tool Repository on `crewai login`

**Fixes**
- Fixed `result_as_answer` not properly exiting the LLM loop
- Fixed a missing key name when running with the Ollama provider
- Fixed spelling issues

**Documentation**
- Updated the README for running mypy
- Added knowledge to mint.json
- Updated GitHub Actions
- Updated the Agents docs to include two approaches for creating an agent
- Improvements to LLM configuration and usage
</Update>

<Update label="2024-11-25" description="v0.83.0">
**New Features**
- New `before_kickoff` and `after_kickoff` crew callbacks
- Support for pre-seeding agents with Knowledge
- Added support for retrieving user preferences and memories using Mem0

**Fixes**
- Fixed async execution
- Upgraded Chroma and adjusted the embedder function generator
- Updated the CLI Watson supported models and docs
- Reduced the level for Bandit
- Fixed all tests

**Documentation**
- Updated docs
</Update>

<Update label="2024-11-13" description="v0.80.0">
**Fixes**
- Fixed a token callback replacement bug
- Fixed a step callback issue
- Added cached prompt token info to usage metrics
- Fixed the `crew_train_success` test
</Update>

@@ -526,103 +526,6 @@ agent = Agent(
The context window management feature works automatically in the background. You don't need to call any special functions - just set `respect_context_window` to your preferred behavior and CrewAI handles the rest!
</Note>
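
A minimal sketch of opting in (the role, goal, and backstory are placeholder values):

```python Code
from crewai import Agent

# Placeholder agent; only respect_context_window matters here
agent = Agent(
    role="Researcher",
    goal="Summarize recent AI developments",
    backstory="An analyst who tracks the AI field.",
    respect_context_window=True,  # handle context overflow automatically instead of erroring
)
```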

## Direct Agent Interaction with `kickoff()`

Agents can be used directly without going through a task or crew workflow using the `kickoff()` method. This provides a simpler way to interact with an agent when you don't need the full crew orchestration capabilities.

### How `kickoff()` Works

The `kickoff()` method allows you to send messages directly to an agent and get a response, similar to how you would interact with an LLM but with all the agent's capabilities (tools, reasoning, etc.).

```python Code
from crewai import Agent
from crewai_tools import SerperDevTool

# Create an agent
researcher = Agent(
    role="AI Technology Researcher",
    goal="Research the latest AI developments",
    tools=[SerperDevTool()],
    verbose=True
)

# Use kickoff() to interact directly with the agent
result = researcher.kickoff("What are the latest developments in language models?")

# Access the raw response
print(result.raw)
```

### Parameters and Return Values

| Parameter | Type | Description |
| :---------------- | :---------------------------------- | :------------------------------------------------------------------------ |
| `messages` | `Union[str, List[Dict[str, str]]]` | Either a string query or a list of message dictionaries with role/content |
| `response_format` | `Optional[Type[Any]]` | Optional Pydantic model for structured output |

The method returns a `LiteAgentOutput` object with the following properties:

- `raw`: String containing the raw output text
- `pydantic`: Parsed Pydantic model (if a `response_format` was provided)
- `agent_role`: Role of the agent that produced the output
- `usage_metrics`: Token usage metrics for the execution
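
For illustration, one way to inspect these properties (reusing the `researcher` agent defined above):

```python Code
result = researcher.kickoff("What are the latest developments in language models?")

print(result.raw)            # the raw output text
print(result.agent_role)     # "AI Technology Researcher"
print(result.usage_metrics)  # token usage for this execution
```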

### Structured Output

You can get structured output by providing a Pydantic model as the `response_format`:

```python Code
from pydantic import BaseModel
from typing import List

class ResearchFindings(BaseModel):
    main_points: List[str]
    key_technologies: List[str]
    future_predictions: str

# Get structured output
result = researcher.kickoff(
    "Summarize the latest developments in AI for 2025",
    response_format=ResearchFindings
)

# Access structured data
print(result.pydantic.main_points)
print(result.pydantic.future_predictions)
```

### Multiple Messages

You can also provide a conversation history as a list of message dictionaries:

```python Code
messages = [
    {"role": "user", "content": "I need information about large language models"},
    {"role": "assistant", "content": "I'd be happy to help with that! What specifically would you like to know?"},
    {"role": "user", "content": "What are the latest developments in 2025?"}
]

result = researcher.kickoff(messages)
```

### Async Support

An asynchronous version is available via `kickoff_async()` with the same parameters:

```python Code
import asyncio

async def main():
    result = await researcher.kickoff_async("What are the latest developments in AI?")
    print(result.raw)

asyncio.run(main())
```

<Note>
The `kickoff()` method uses a `LiteAgent` internally, which provides a simpler execution flow while preserving all of the agent's configuration (role, goal, backstory, tools, etc.).
</Note>

## Important Considerations and Best Practices

### Security and Code Execution
@@ -4,8 +4,6 @@ description: Learn how to use the CrewAI CLI to interact with CrewAI.
icon: terminal
---

<Warning>Since release 0.140.0, CrewAI Enterprise has been migrating its login provider, and the CLI authentication flow was updated accordingly. Users who log in with Google, or who created their account after July 3rd, 2025, will be unable to log in with older versions of the `crewai` library.</Warning>

## Overview

The CrewAI CLI provides a set of commands to interact with CrewAI, allowing you to create, train, run, and manage crews and flows.
@@ -188,7 +186,10 @@ def crew(self) -> Crew:
Deploy the crew or flow to [CrewAI Enterprise](https://app.crewai.com).

- **Authentication**: You need to be authenticated to deploy to CrewAI Enterprise.
  You can log in or create an account with:
  ```shell Terminal
  crewai signup
  ```
  If you already have an account, you can log in with:
  ```shell Terminal
  crewai login
  ```
@@ -32,7 +32,6 @@ A crew in crewAI represents a collaborative group of agents working together to
| **Prompt File** _(optional)_ | `prompt_file` | Path to the prompt JSON file to be used for the crew. |
| **Planning** *(optional)* | `planning` | Adds planning ability to the Crew. When activated, before each Crew iteration all Crew data is sent to an AgentPlanner that plans the tasks, and the resulting plan is added to each task description. |
| **Planning LLM** *(optional)* | `planning_llm` | The language model used by the AgentPlanner in the planning process. |
| **Knowledge Sources** _(optional)_ | `knowledge_sources` | Knowledge sources available at the crew level, accessible to all the agents. |

<Tip>
**Crew Max RPM**: The `max_rpm` attribute sets the maximum number of requests per minute the crew can perform to avoid rate limits and, if set, it overrides individual agents' `max_rpm` settings.
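
As a minimal sketch of a crew-wide cap (the agents and tasks are placeholders):

```python Code
from crewai import Crew

crew = Crew(
    agents=[researcher, writer],        # placeholder agents; their own max_rpm values are overridden
    tasks=[research_task, write_task],  # placeholder tasks
    max_rpm=30,                         # at most 30 requests per minute across the whole crew
)
```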
@@ -255,17 +255,6 @@ CrewAI provides a wide range of events that you can listen for:
- **LLMCallFailedEvent**: Emitted when an LLM call fails
- **LLMStreamChunkEvent**: Emitted for each chunk received during streaming LLM responses

### Memory Events

- **MemoryQueryStartedEvent**: Emitted when a memory query is started. Contains the query, limit, and optional score threshold.
- **MemoryQueryCompletedEvent**: Emitted when a memory query is completed successfully. Contains the query, results, limit, score threshold, and query execution time.
- **MemoryQueryFailedEvent**: Emitted when a memory query fails. Contains the query, limit, score threshold, and error message.
- **MemorySaveStartedEvent**: Emitted when a memory save operation is started. Contains the value to be saved, metadata, and optional agent role.
- **MemorySaveCompletedEvent**: Emitted when a memory save operation is completed successfully. Contains the saved value, metadata, agent role, and save execution time.
- **MemorySaveFailedEvent**: Emitted when a memory save operation fails. Contains the value, metadata, agent role, and error message.
- **MemoryRetrievalStartedEvent**: Emitted when memory retrieval for a task prompt starts. Contains the optional task ID.
- **MemoryRetrievalCompletedEvent**: Emitted when memory retrieval for a task prompt completes successfully. Contains the task ID, memory content, and retrieval execution time.

## Event Handler Structure

Each event handler receives two parameters:
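
As a rough sketch, modeled on the listener examples elsewhere on this page (the `event.error` attribute is an assumption):

```python Code
from crewai.utilities.events import LLMCallFailedEvent
from crewai.utilities.events.base_event_listener import BaseEventListener

class FailureLogger(BaseEventListener):
    def setup_listeners(self, crewai_event_bus):
        @crewai_event_bus.on(LLMCallFailedEvent)
        def on_llm_call_failed(source, event):
            # source: the object that emitted the event
            # event: the event instance (the `error` attribute is an assumption)
            print(f"LLM call failed: {event.error}")
```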
@@ -749,58 +749,9 @@ CrewAI supports streaming responses from LLMs, allowing your application to rece
```

<Tip>
[Click here](https://docs.crewai.com/concepts/event-listener#event-listeners) for more details
</Tip>
</Tab>

<Tab title="Agent & Task Tracking">
All LLM events in CrewAI include agent and task information, allowing you to track and filter LLM interactions by specific agents or tasks:

```python
from crewai import LLM, Agent, Task, Crew
from crewai.utilities.events import LLMStreamChunkEvent
from crewai.utilities.events.base_event_listener import BaseEventListener

class MyCustomListener(BaseEventListener):
    def setup_listeners(self, crewai_event_bus):
        @crewai_event_bus.on(LLMStreamChunkEvent)
        def on_llm_stream_chunk(source, event):
            if researcher.id == event.agent_id:
                print("\n==============\n Got event:", event, "\n==============\n")


my_listener = MyCustomListener()

llm = LLM(model="gpt-4o-mini", temperature=0, stream=True)

researcher = Agent(
    role="About User",
    goal="You know everything about the user.",
    backstory="""You are a master at understanding people and their preferences.""",
    llm=llm,
)

search = Task(
    description="Answer the following questions about the user: {question}",
    expected_output="An answer to the question.",
    agent=researcher,
)

crew = Crew(agents=[researcher], tasks=[search])

result = crew.kickoff(
    inputs={"question": "..."}
)
```

<Info>
This feature is particularly useful for:
- Debugging specific agent behaviors
- Logging LLM usage by task type
- Auditing which agents are making what types of LLM calls
- Performance monitoring of specific tasks
</Info>
</Tab>
</Tabs>

## Structured LLM Calls
@@ -896,7 +847,7 @@ Learn how to get the most out of your LLM configuration:
Remember to regularly monitor your token usage and adjust your configuration as needed to optimize costs and performance.
</Info>
</Accordion>

<Accordion title="Drop Additional Parameters">
CrewAI internally uses LiteLLM for LLM calls, which allows you to drop additional parameters that are not needed for your specific use case. This can help simplify your code and reduce the complexity of your LLM configuration.
For example, if you don't need to send the <code>stop</code> parameter, you can simply omit it from your LLM call:
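
A minimal sketch (the model name and temperature are placeholder values):

```python Code
from crewai import LLM

llm = LLM(
    model="gpt-4o-mini",  # placeholder model
    temperature=0.7,
    # no `stop` parameter passed, so it is simply not sent to the provider
)
```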
@@ -9,7 +9,7 @@ icon: database
The CrewAI framework provides a sophisticated memory system designed to significantly enhance AI agent capabilities. CrewAI offers **three distinct memory approaches** that serve different use cases:

1. **Basic Memory System** - Built-in short-term, long-term, and entity memory
2. **User Memory** - User-specific memory with Mem0 integration (legacy approach)
3. **External Memory** - Standalone external memory providers (new approach)
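
For example, the basic system is enabled with a single flag (agents and tasks are placeholders, following the idiom used in the examples below):

```python Code
from crewai import Crew

crew = Crew(
    agents=[...],  # your agents
    tasks=[...],   # your tasks
    memory=True,   # enables short-term, long-term, and entity memory
)
```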

## Memory System Components

@@ -62,7 +62,7 @@ By default, CrewAI uses the `appdirs` library to determine storage locations fol
```
~/Library/Application Support/CrewAI/{project_name}/
├── knowledge/                     # Knowledge base ChromaDB files
├── short_term_memory/             # Short-term memory ChromaDB files
├── long_term_memory/              # Long-term memory ChromaDB files
├── entities/                      # Entity memory ChromaDB files
└── long_term_memory_storage.db    # SQLite database
```
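
A small sketch for checking where this resolves on your machine, assuming the `appdirs`-based defaults described above (the app name "CrewAI" is an assumption):

```python Code
from appdirs import user_data_dir

# Resolves to the platform-specific data directory, e.g.
# ~/Library/Application Support/CrewAI on macOS
print(user_data_dir("CrewAI"))
```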
@@ -252,7 +252,7 @@ chroma_path = os.path.join(storage_path, "knowledge")
if os.path.exists(chroma_path):
    client = chromadb.PersistentClient(path=chroma_path)
    collections = client.list_collections()

    print("ChromaDB Collections:")
    for collection in collections:
        print(f"  - {collection.name}: {collection.count()} documents")
@@ -269,7 +269,7 @@ crew = Crew(agents=[...], tasks=[...], memory=True)

# Reset specific memory types
crew.reset_memories(command_type='short')      # Short-term memory
crew.reset_memories(command_type='long')       # Long-term memory
crew.reset_memories(command_type='entity')     # Entity memory
crew.reset_memories(command_type='knowledge')  # Knowledge storage
```
@@ -596,7 +596,7 @@ providers_to_test = [
    {
        "name": "Ollama",
        "config": {
            "provider": "ollama",
            "config": {"model": "mxbai-embed-large"}
        }
    }
@@ -604,7 +604,7 @@ providers_to_test = [

for provider in providers_to_test:
    print(f"\nTesting {provider['name']} embeddings...")

    # Create crew with specific embedder
    crew = Crew(
        agents=[...],
@@ -612,7 +612,7 @@ for provider in providers_to_test:
        memory=True,
        embedder=provider['config']
    )

    # Run your test and measure performance
    result = crew.kickoff()
    print(f"{provider['name']} completed successfully")
@@ -655,17 +655,17 @@ import time

def test_embedding_performance(embedder_config, test_text="This is a test document"):
    start_time = time.time()

    crew = Crew(
        agents=[...],
        tasks=[...],
        memory=True,
        embedder=embedder_config
    )

    # Simulate memory operation
    crew.kickoff()

    end_time = time.time()
    return end_time - start_time

@@ -676,7 +676,7 @@ openai_time = test_embedding_performance({
})

ollama_time = test_embedding_performance({
    "provider": "ollama",
    "config": {"model": "mxbai-embed-large"}
})
@@ -712,7 +712,7 @@ crew = Crew(
    memory_config={
        "provider": "mem0",
        "config": {"user_id": "john"},
        "user_memory": {}  # DEPRECATED: Will be removed in version 0.156.0 or on 2025-08-04, use external_memory instead
        "user_memory": {}  # Required - triggers user memory initialization
    },
    process=Process.sequential,
    verbose=True
@@ -783,7 +783,7 @@ os.environ["MEM0_API_KEY"] = "your-api-key"
# Create external memory instance
external_memory = ExternalMemory(
    embedder_config={
        "provider": "mem0",
        "config": {"user_id": "U-123"}
    }
)
@@ -808,8 +808,8 @@ class CustomStorage(Storage):

    def save(self, value, metadata=None, agent=None):
        self.memories.append({
            "value": value,
            "metadata": metadata,
            "agent": agent
        })
@@ -986,201 +986,7 @@ crew = Crew(
- 🫡 **Enhanced Personalization:** Memory enables agents to remember user preferences and historical interactions, leading to personalized experiences.
- 🧠 **Improved Problem Solving:** Access to a rich memory store aids agents in making more informed decisions, drawing on past learnings and contextual insights.

## Memory Events

CrewAI's event system provides powerful insights into memory operations. By leveraging memory events, you can monitor, debug, and optimize your memory system's performance and behavior.

### Available Memory Events

CrewAI emits the following memory-related events:

| Event | Description | Key Properties |
| :---- | :---------- | :------------- |
| **MemoryQueryStartedEvent** | Emitted when a memory query begins | `query`, `limit`, `score_threshold` |
| **MemoryQueryCompletedEvent** | Emitted when a memory query completes successfully | `query`, `results`, `limit`, `score_threshold`, `query_time_ms` |
| **MemoryQueryFailedEvent** | Emitted when a memory query fails | `query`, `limit`, `score_threshold`, `error` |
| **MemorySaveStartedEvent** | Emitted when a memory save operation begins | `value`, `metadata`, `agent_role` |
| **MemorySaveCompletedEvent** | Emitted when a memory save operation completes successfully | `value`, `metadata`, `agent_role`, `save_time_ms` |
| **MemorySaveFailedEvent** | Emitted when a memory save operation fails | `value`, `metadata`, `agent_role`, `error` |
| **MemoryRetrievalStartedEvent** | Emitted when memory retrieval for a task prompt starts | `task_id` |
| **MemoryRetrievalCompletedEvent** | Emitted when memory retrieval completes successfully | `task_id`, `memory_content`, `retrieval_time_ms` |

### Practical Applications

#### 1. Memory Performance Monitoring

Track memory operation timing to optimize your application:

```python
from crewai.utilities.events.base_event_listener import BaseEventListener
from crewai.utilities.events import (
    MemoryQueryCompletedEvent,
    MemorySaveCompletedEvent
)
import time

class MemoryPerformanceMonitor(BaseEventListener):
    def __init__(self):
        super().__init__()
        self.query_times = []
        self.save_times = []

    def setup_listeners(self, crewai_event_bus):
        @crewai_event_bus.on(MemoryQueryCompletedEvent)
        def on_memory_query_completed(source, event: MemoryQueryCompletedEvent):
            self.query_times.append(event.query_time_ms)
            print(f"Memory query completed in {event.query_time_ms:.2f}ms. Query: '{event.query}'")
            print(f"Average query time: {sum(self.query_times)/len(self.query_times):.2f}ms")

        @crewai_event_bus.on(MemorySaveCompletedEvent)
        def on_memory_save_completed(source, event: MemorySaveCompletedEvent):
            self.save_times.append(event.save_time_ms)
            print(f"Memory save completed in {event.save_time_ms:.2f}ms")
            print(f"Average save time: {sum(self.save_times)/len(self.save_times):.2f}ms")

# Create an instance of your listener
memory_monitor = MemoryPerformanceMonitor()
```

#### 2. Memory Content Logging

Log memory operations for debugging and insights:

```python
from crewai.utilities.events.base_event_listener import BaseEventListener
from crewai.utilities.events import (
    MemorySaveStartedEvent,
    MemoryQueryStartedEvent,
    MemoryRetrievalCompletedEvent
)
import logging

# Configure logging
logger = logging.getLogger('memory_events')

class MemoryLogger(BaseEventListener):
    def setup_listeners(self, crewai_event_bus):
        @crewai_event_bus.on(MemorySaveStartedEvent)
        def on_memory_save_started(source, event: MemorySaveStartedEvent):
            if event.agent_role:
                logger.info(f"Agent '{event.agent_role}' saving memory: {event.value[:50]}...")
            else:
                logger.info(f"Saving memory: {event.value[:50]}...")

        @crewai_event_bus.on(MemoryQueryStartedEvent)
        def on_memory_query_started(source, event: MemoryQueryStartedEvent):
            logger.info(f"Memory query started: '{event.query}' (limit: {event.limit})")

        @crewai_event_bus.on(MemoryRetrievalCompletedEvent)
        def on_memory_retrieval_completed(source, event: MemoryRetrievalCompletedEvent):
            if event.task_id:
                logger.info(f"Memory retrieved for task {event.task_id} in {event.retrieval_time_ms:.2f}ms")
            else:
                logger.info(f"Memory retrieved in {event.retrieval_time_ms:.2f}ms")
            logger.debug(f"Memory content: {event.memory_content}")

# Create an instance of your listener
memory_logger = MemoryLogger()
```

#### 3. Error Tracking and Notifications

Capture and respond to memory errors:

```python
from crewai.utilities.events.base_event_listener import BaseEventListener
from crewai.utilities.events import (
    MemorySaveFailedEvent,
    MemoryQueryFailedEvent
)
import logging
from typing import Optional

# Configure logging
logger = logging.getLogger('memory_errors')

class MemoryErrorTracker(BaseEventListener):
    def __init__(self, notify_email: Optional[str] = None):
        super().__init__()
        self.notify_email = notify_email
        self.error_count = 0

    def setup_listeners(self, crewai_event_bus):
        @crewai_event_bus.on(MemorySaveFailedEvent)
        def on_memory_save_failed(source, event: MemorySaveFailedEvent):
            self.error_count += 1
            agent_info = f"Agent '{event.agent_role}'" if event.agent_role else "Unknown agent"
            error_message = f"Memory save failed: {event.error}. {agent_info}"
            logger.error(error_message)

            if self.notify_email and self.error_count % 5 == 0:
                self._send_notification(error_message)

        @crewai_event_bus.on(MemoryQueryFailedEvent)
        def on_memory_query_failed(source, event: MemoryQueryFailedEvent):
            self.error_count += 1
            error_message = f"Memory query failed: {event.error}. Query: '{event.query}'"
            logger.error(error_message)

            if self.notify_email and self.error_count % 5 == 0:
                self._send_notification(error_message)

    def _send_notification(self, message):
        # Implement your notification system (email, Slack, etc.)
        print(f"[NOTIFICATION] Would send to {self.notify_email}: {message}")

# Create an instance of your listener
error_tracker = MemoryErrorTracker(notify_email="admin@example.com")
```

### Integrating with Analytics Platforms

Memory events can be forwarded to analytics and monitoring platforms to track performance metrics, detect anomalies, and visualize memory usage patterns:

```python
from crewai.utilities.events.base_event_listener import BaseEventListener
from crewai.utilities.events import (
    MemoryQueryCompletedEvent,
    MemorySaveCompletedEvent
)

class MemoryAnalyticsForwarder(BaseEventListener):
    def __init__(self, analytics_client):
        super().__init__()
        self.client = analytics_client

    def setup_listeners(self, crewai_event_bus):
        @crewai_event_bus.on(MemoryQueryCompletedEvent)
        def on_memory_query_completed(source, event: MemoryQueryCompletedEvent):
            # Forward query metrics to analytics platform
            self.client.track_metric({
                "event_type": "memory_query",
                "query": event.query,
                "duration_ms": event.query_time_ms,
                "result_count": len(event.results) if hasattr(event.results, "__len__") else 0,
                "timestamp": event.timestamp
            })

        @crewai_event_bus.on(MemorySaveCompletedEvent)
        def on_memory_save_completed(source, event: MemorySaveCompletedEvent):
            # Forward save metrics to analytics platform
            self.client.track_metric({
                "event_type": "memory_save",
                "agent_role": event.agent_role,
                "duration_ms": event.save_time_ms,
                "timestamp": event.timestamp
            })
```

### Best Practices for Memory Event Listeners

1. **Keep handlers lightweight**: Avoid complex processing in event handlers to prevent performance impacts
2. **Use appropriate logging levels**: Use INFO for normal operations, DEBUG for details, ERROR for issues
3. **Batch metrics when possible**: Accumulate metrics before sending to external systems
4. **Handle exceptions gracefully**: Ensure your event handlers don't crash due to unexpected data
5. **Consider memory consumption**: Be mindful of storing large amounts of event data

## Conclusion

Integrating CrewAI's memory system into your projects is straightforward. By leveraging the provided memory components and configurations,
you can quickly empower your agents with the ability to remember, reason, and learn from their interactions, unlocking new levels of intelligence and capability.
@@ -57,7 +57,6 @@ crew = Crew(
| **Output JSON** _(optional)_ | `output_json` | `Optional[Type[BaseModel]]` | A Pydantic model to structure the JSON output. |
| **Output Pydantic** _(optional)_ | `output_pydantic` | `Optional[Type[BaseModel]]` | A Pydantic model for task output. |
| **Callback** _(optional)_ | `callback` | `Optional[Any]` | Function/object to be executed after task completion. |
| **Guardrail** _(optional)_ | `guardrail` | `Optional[Union[Callable, str]]` | Function or string description to validate task output before proceeding to the next task. |

## Creating Tasks

@@ -87,7 +86,6 @@ research_task:
  expected_output: >
    A list with 10 bullet points of the most relevant information about {topic}
  agent: researcher
  guardrail: ensure each bullet contains a minimum of 100 words

reporting_task:
  description: >
@@ -334,13 +332,9 @@ Task guardrails provide a way to validate and transform task outputs before they
are passed to the next task. This feature helps ensure data quality and provides
feedback to agents when their output doesn't meet specific criteria.

**Guardrails can be defined in two ways:**
1. **Function-based guardrails**: Python functions that implement custom validation logic
2. **String-based guardrails**: Natural language descriptions that are automatically converted to LLM-powered validation

### Using Task Guardrails

### Function-Based Guardrails

To add a function-based guardrail to a task, provide a validation function through the `guardrail` parameter:
To add a guardrail to a task, provide a validation function through the `guardrail` parameter:

```python Code
from typing import Tuple, Union, Dict, Any
```
@@ -378,82 +372,9 @@ blog_task = Task(
- On success: it returns a tuple of `(bool, Any)`. For example: `(True, validated_result)`
- On failure: it returns a tuple of `(bool, str)`. For example: `(False, "Error message explaining the failure")`
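
For illustration, a guardrail honoring this contract might look like the following (the word-count rule is a made-up example):

```python Code
from typing import Any, Tuple, Union

def validate_blog_length(result: Any) -> Tuple[bool, Union[Any, str]]:
    """Made-up example: enforce a 200-word limit on the task output."""
    text = str(result)
    if len(text.split()) <= 200:
        return (True, text)  # success: (True, validated_result)
    return (False, "Blog post exceeds the 200-word limit")  # failure: (False, "error message")
```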
|
||||
|
||||
### String-Based Guardrails
|
||||
### LLMGuardrail
|
||||
|
||||
String-based guardrails allow you to describe validation criteria in natural language. When you provide a string instead of a function, CrewAI automatically converts it to an `LLMGuardrail` that uses an AI agent to validate the task output.
|
||||
|
||||
#### Using String Guardrails in Python

```python Code
from crewai import Task

# Simple string-based guardrail
blog_task = Task(
    description="Write a blog post about AI",
    expected_output="A blog post under 200 words",
    agent=blog_agent,
    guardrail="Ensure the blog post is under 200 words and includes practical examples"
)

# More complex validation criteria
research_task = Task(
    description="Research AI trends for 2025",
    expected_output="A comprehensive research report",
    agent=research_agent,
    guardrail="Ensure each finding includes a credible source and is backed by recent data from 2024-2025"
)
```

#### Using String Guardrails in YAML

```yaml
research_task:
  description: Research the latest AI developments
  expected_output: A list of 10 bullet points about AI
  agent: researcher
  guardrail: ensure each bullet contains a minimum of 100 words

validation_task:
  description: Validate the research findings
  expected_output: A validation report
  agent: validator
  guardrail: confirm all sources are from reputable publications and published within the last 2 years
```
#### How String Guardrails Work

When you provide a string guardrail, CrewAI automatically:
1. Creates an `LLMGuardrail` instance using the string as validation criteria
2. Uses the LLM of the task's agent to power the validation
3. Creates a temporary validation agent that checks the output against your criteria
4. Returns detailed feedback if validation fails

This approach is ideal when you want to describe validation rules in natural language without writing custom validation functions.
### LLMGuardrail Class

The `LLMGuardrail` class is the underlying mechanism that powers string-based guardrails. You can also use it directly for more advanced control:

```python Code
from crewai import Task
from crewai.tasks.llm_guardrail import LLMGuardrail
from crewai.llm import LLM

# Create a custom LLMGuardrail with a specific LLM
custom_guardrail = LLMGuardrail(
    description="Ensure the response contains exactly 5 bullet points with proper citations",
    llm=LLM(model="gpt-4o-mini")
)

task = Task(
    description="Research AI safety measures",
    expected_output="A detailed analysis with bullet points",
    agent=research_agent,
    guardrail=custom_guardrail
)
```

**Note**: When you use a string guardrail, CrewAI automatically creates an `LLMGuardrail` instance using the LLM of your task's agent. Using `LLMGuardrail` directly gives you more control over the validation process and LLM selection.
### Error Handling Best Practices

@@ -877,7 +798,166 @@ While creating and executing tasks, certain validation mechanisms are in place t

These validations help maintain the consistency and reliability of task executions within the crewAI framework.

## Task Guardrails

Task guardrails provide a powerful way to validate, transform, or filter task outputs before they are passed to the next task. Guardrails are optional functions that execute before the next task starts, allowing you to ensure that task outputs meet specific requirements or formats.

### Basic Usage

#### Define your own logic to validate
```python Code
import json
from typing import Tuple, Union

from crewai import Task

def validate_json_output(result: str) -> Tuple[bool, Union[dict, str]]:
    """Validate that the output is valid JSON."""
    try:
        json_data = json.loads(result)
        return (True, json_data)
    except json.JSONDecodeError:
        return (False, "Output must be valid JSON")

task = Task(
    description="Generate JSON data",
    expected_output="Valid JSON object",
    guardrail=validate_json_output
)
```
#### Leverage a no-code approach for validation

```python Code
from crewai import Task

task = Task(
    description="Generate JSON data",
    expected_output="Valid JSON object",
    guardrail="Ensure the response is a valid JSON object"
)
```

#### Using YAML

```yaml
research_task:
  ...
  guardrail: make sure each bullet contains a minimum of 100 words
  ...
```

```python Code
@CrewBase
class InternalCrew:
    agents_config = "config/agents.yaml"
    tasks_config = "config/tasks.yaml"

    ...
    @task
    def research_task(self):
        return Task(config=self.tasks_config["research_task"])  # type: ignore[index]
    ...
```
#### Use custom models for validation

```python Code
from crewai import Task
from crewai.llm import LLM
from crewai.tasks.llm_guardrail import LLMGuardrail

task = Task(
    description="Generate JSON data",
    expected_output="Valid JSON object",
    guardrail=LLMGuardrail(
        description="Ensure the response is a valid JSON object",
        llm=LLM(model="gpt-4o-mini"),
    )
)
```
### How Guardrails Work

1. **Optional Attribute**: Guardrails are an optional attribute at the task level, allowing you to add validation only where needed.
2. **Execution Timing**: The guardrail function is executed before the next task starts, ensuring valid data flow between tasks.
3. **Return Format**: Guardrails must return a tuple of `(success, data)`:
   - If `success` is `True`, `data` is the validated/transformed result
   - If `success` is `False`, `data` is the error message
4. **Result Routing**:
   - On success (`True`), the result is automatically passed to the next task
   - On failure (`False`), the error is sent back to the agent to generate a new answer

### Common Use Cases
#### Data Format Validation
```python Code
import re
from typing import Tuple

def validate_email_format(result: str) -> Tuple[bool, str]:
    """Ensure the output contains a valid email address."""
    email_pattern = r'^[\w\.-]+@[\w\.-]+\.\w+$'
    if re.match(email_pattern, result.strip()):
        return (True, result.strip())
    return (False, "Output must be a valid email address")
```

#### Content Filtering
```python Code
from typing import Tuple

def filter_sensitive_info(result: str) -> Tuple[bool, str]:
    """Remove or validate sensitive information."""
    sensitive_patterns = ['SSN:', 'password:', 'secret:']
    for pattern in sensitive_patterns:
        if pattern.lower() in result.lower():
            return (False, f"Output contains sensitive information ({pattern})")
    return (True, result)
```

#### Data Transformation
```python Code
import re
from typing import Tuple

def normalize_phone_number(result: str) -> Tuple[bool, str]:
    """Ensure phone numbers are in a consistent format."""
    digits = re.sub(r'\D', '', result)
    if len(digits) == 10:
        formatted = f"({digits[:3]}) {digits[3:6]}-{digits[6:]}"
        return (True, formatted)
    return (False, "Output must be a 10-digit phone number")
```
### Advanced Features

#### Chaining Multiple Validations
```python Code
def chain_validations(*validators):
    """Chain multiple validators together."""
    def combined_validator(result):
        for validator in validators:
            success, data = validator(result)
            if not success:
                return (False, data)
            result = data
        return (True, result)
    return combined_validator

# Usage
task = Task(
    description="Get user contact info",
    expected_output="Email and phone",
    guardrail=chain_validations(
        validate_email_format,
        filter_sensitive_info
    )
)
```

#### Custom Retry Logic
```python Code
task = Task(
    description="Generate data",
    expected_output="Valid data",
    guardrail=validate_data,
    max_retries=5  # Override the default retry limit
)
```
## Creating Directories when Saving Files

@@ -6,10 +6,10 @@ icon: dumbbell
## Overview

The training feature in CrewAI allows you to train your AI agents using the command-line interface (CLI).
By running the command `crewai train -n <n_iterations>`, you can specify the number of iterations for the training process.
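For example (the iteration count here is arbitrary):

```bash
# Train the current crew for 5 iterations
crewai train -n 5
```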
During training, CrewAI utilizes techniques to optimize the performance of your agents along with human feedback.
This helps the agents improve their understanding, decision-making, and problem-solving abilities.

### Training Your Crew Using the CLI
@@ -42,8 +42,8 @@ filename = "your_model.pkl"

try:
    YourCrewName_Crew().crew().train(
        n_iterations=n_iterations,
        inputs=inputs,
        filename=filename
    )

@@ -64,68 +64,4 @@ Once the training is complete, your agents will be equipped with enhanced capabi

Remember to regularly update and retrain your agents to ensure they stay up-to-date with the latest information and advancements in the field.

Happy training with CrewAI! 🚀
## Small Language Model Considerations

<Warning>
When using smaller language models (≤7B parameters) for training data evaluation, be aware that they may face challenges with generating structured outputs and following complex instructions.
</Warning>

### Limitations of Small Models in Training Evaluation

<CardGroup cols={2}>
  <Card title="JSON Output Accuracy" icon="triangle-exclamation">
    Smaller models often struggle with producing the valid JSON responses needed for structured training evaluations, leading to parsing errors and incomplete data.
  </Card>
  <Card title="Evaluation Quality" icon="chart-line">
    Models under 7B parameters may provide less nuanced evaluations with limited reasoning depth compared to larger models.
  </Card>
  <Card title="Instruction Following" icon="list-check">
    Complex training evaluation criteria may not be fully followed or considered by smaller models.
  </Card>
  <Card title="Consistency" icon="rotate">
    Evaluations across multiple training iterations may lack consistency with smaller models.
  </Card>
</CardGroup>
### Recommendations for Training

<Tabs>
  <Tab title="Best Practice">
    For optimal training quality and reliable evaluations, we strongly recommend using models with at least 7B parameters:

    ```python
    from crewai import Agent, Crew, Task, LLM

    # Recommended minimum for training evaluation
    llm = LLM(model="mistral/open-mistral-7b")

    # Better options for reliable training evaluation
    llm = LLM(model="anthropic/claude-3-sonnet-20240229-v1:0")
    llm = LLM(model="gpt-4o")

    # Use this LLM with your agents
    agent = Agent(
        role="Training Evaluator",
        goal="Provide accurate training feedback",
        llm=llm
    )
    ```

    <Tip>
    More powerful models provide higher quality feedback with better reasoning, leading to more effective training iterations.
    </Tip>
  </Tab>
  <Tab title="Small Model Usage">
    If you must use smaller models for training evaluation, be aware of these constraints:

    ```python
    # Using a smaller model (expect some limitations)
    llm = LLM(model="huggingface/microsoft/Phi-3-mini-4k-instruct")
    ```

    <Warning>
    While CrewAI includes optimizations for small models, expect less reliable and less nuanced evaluation results that may require more human intervention during training.
    </Warning>
  </Tab>
</Tabs>
@@ -1,155 +0,0 @@
---
title: 'Agent Repositories'
description: 'Learn how to use Agent Repositories to share and reuse your agents across teams and projects'
icon: 'database'
---

Agent Repositories allow enterprise users to store, share, and reuse agent definitions across teams and projects. This feature enables organizations to maintain a centralized library of standardized agents, promoting consistency and reducing duplication of effort.

## Benefits of Agent Repositories

- **Standardization**: Maintain consistent agent definitions across your organization
- **Reusability**: Create an agent once and use it in multiple crews and projects
- **Governance**: Implement organization-wide policies for agent configurations
- **Collaboration**: Enable teams to share and build upon each other's work

## Using Agent Repositories

### Prerequisites

1. You must have a CrewAI account; you can start with the [free plan](https://app.crewai.com).
2. You need to be authenticated using the CrewAI CLI.
3. If you have more than one organization, make sure you are switched to the correct one using the CLI command:

```bash
crewai org switch <org_id>
```
### Creating and Managing Agents in Repositories

To create and manage agents in repositories, use the CrewAI Enterprise Dashboard.

### Loading Agents from Repositories

You can load agents from repositories in your code using the `from_repository` parameter:

```python
from crewai import Agent

# Create an agent by loading it from a repository
# The agent is loaded with all its predefined configurations
researcher = Agent(
    from_repository="market-research-agent"
)
```
### Overriding Repository Settings

You can override specific settings from the repository by providing them in the configuration:

```python
researcher = Agent(
    from_repository="market-research-agent",
    goal="Research the latest trends in AI development",  # Override the repository goal
    verbose=True  # Add a setting not in the repository
)
```
### Example: Creating a Crew with Repository Agents

```python
from crewai import Crew, Agent, Task

# Load agents from repositories
researcher = Agent(
    from_repository="market-research-agent"
)

writer = Agent(
    from_repository="content-writer-agent"
)

# Create tasks (expected_output is required by Task)
research_task = Task(
    description="Research the latest trends in AI",
    expected_output="A summary of the latest AI trends",
    agent=researcher
)

writing_task = Task(
    description="Write a comprehensive report based on the research",
    expected_output="A comprehensive report on AI trends",
    agent=writer
)

# Create the crew
crew = Crew(
    agents=[researcher, writer],
    tasks=[research_task, writing_task],
    verbose=True
)

# Run the crew
result = crew.kickoff()
```
### Example: Using `kickoff()` with Repository Agents

You can also use repository agents directly with the `kickoff()` method for simpler interactions:

```python
from crewai import Agent
from pydantic import BaseModel
from typing import List

# Define a structured output format
class MarketAnalysis(BaseModel):
    key_trends: List[str]
    opportunities: List[str]
    recommendation: str

# Load an agent from a repository
analyst = Agent(
    from_repository="market-analyst-agent",
    verbose=True
)

# Get a free-form response
result = analyst.kickoff("Analyze the AI market in 2025")
print(result.raw)  # Access the raw response

# Get structured output
structured_result = analyst.kickoff(
    "Provide a structured analysis of the AI market in 2025",
    response_format=MarketAnalysis
)

# Access structured data
print(f"Key Trends: {structured_result.pydantic.key_trends}")
print(f"Recommendation: {structured_result.pydantic.recommendation}")
```
## Best Practices

1. **Naming Convention**: Use clear, descriptive names for your repository agents
2. **Documentation**: Include comprehensive descriptions for each agent
3. **Tool Management**: Ensure that tools referenced by repository agents are available in your environment
4. **Access Control**: Manage permissions to ensure only authorized team members can modify repository agents

## Organization Management

To switch between organizations or see your current organization, use the CrewAI CLI:

```bash
# View current organization
crewai org current

# Switch to a different organization
crewai org switch <org_id>

# List all available organizations
crewai org list
```

<Note>
When loading agents from repositories, you must be authenticated and switched to the correct organization. If you receive errors, check your authentication status and organization settings using the CLI commands above.
</Note>
@@ -41,8 +41,11 @@ The CLI provides the fastest way to deploy locally developed crews to the Enterp

First, you need to authenticate your CLI with the CrewAI Enterprise platform:

```bash
# If you already have a CrewAI Enterprise account
crewai login

# If you're creating a new account
crewai signup
```

When you run either command, the CLI will:
@@ -72,7 +72,7 @@ If you haven't installed `uv` yet, follow **step 1** to quickly get it set up on
</Warning>

<Warning>
If you encounter the `chroma-hnswlib==0.7.6` build error (`fatal error C1083: Cannot open include file: 'float.h'`) on Windows, install [Visual Studio Build Tools](https://visualstudio.microsoft.com/downloads/) with *Desktop development with C++*.
</Warning>

- To verify that `crewai` is installed, run:
@@ -104,6 +104,7 @@ We recommend using the `YAML` template scaffolding for a structured approach to
```

- This creates a new project with the following structure:
<Frame>
```
my_project/
├── .gitignore
@@ -123,6 +124,7 @@ We recommend using the `YAML` template scaffolding for a structured approach to
├── agents.yaml
└── tasks.yaml
```
</Frame>
</Step>

<Step title="Customize Your Project">
@@ -170,7 +172,7 @@ For teams and organizations, CrewAI offers enterprise deployment options that el

### CrewAI Factory (Self-hosted)
- Containerized deployment for your infrastructure
- Supports any hyperscaler, including on-prem deployments
- Integration with your existing security systems

<Card title="Explore Enterprise Options" icon="building" href="https://crewai.com/enterprise">
@@ -1,134 +0,0 @@
---
title: Neatlogs Integration
description: Understand, debug, and share your CrewAI agent runs
icon: magnifying-glass-chart
---

# Introduction

Neatlogs helps you **see what your agent did**, **why**, and **share it**.

It captures every step: thoughts, tool calls, responses, evaluations. No raw logs. Just clear, structured traces. Great for debugging and collaboration.

## Why use Neatlogs?

CrewAI agents use multiple tools and reasoning steps. When something goes wrong, you need context, not just errors.

Neatlogs lets you:

- Follow the full decision path
- Add feedback directly on steps
- Chat with the trace using an AI assistant
- Share runs publicly for feedback
- Turn insights into tasks

All in one place.
Manage your traces effortlessly. The best UX to view a CrewAI trace: post comments anywhere you want, and use AI to debug.
## Core Features

- **Trace Viewer**: Track thoughts, tools, and decisions in sequence
- **Inline Comments**: Tag teammates on any trace step
- **Feedback & Evaluation**: Mark outputs as correct or incorrect
- **Error Highlighting**: Automatic flagging of API/tool failures
- **Task Conversion**: Convert comments into assigned tasks
- **Ask the Trace (AI)**: Chat with your trace using the Neatlogs AI bot
- **Public Sharing**: Publish trace links to your community
## Quick Setup with CrewAI

<Steps>
  <Step title="Sign Up & Get API Key">
    Visit [neatlogs.com](https://neatlogs.com/?utm_source=crewAI-docs), create a project, and copy the API key.
  </Step>
  <Step title="Install SDK">
    ```bash
    pip install neatlogs
    ```
    (Latest version 0.8.0, Python 3.8+; MIT license)
  </Step>
  <Step title="Initialize Neatlogs">
    Before starting Crew agents, add:

    ```python
    import neatlogs
    neatlogs.init("YOUR_PROJECT_API_KEY")
    ```

    Agents run as usual. Neatlogs captures everything automatically.
  </Step>
</Steps>
## Under the Hood

According to its GitHub repository, Neatlogs:

- Captures thoughts, tool calls, responses, errors, and token stats
- Supports AI-powered task generation and robust evaluation workflows

All with just two lines of code.
## Watch It Work

### 🔍 Full Demo (4 min)

<iframe
  width="100%"
  height="315"
  src="https://www.youtube.com/embed/8KDme9T2I7Q?si=b8oHteaBwFNs_Duk"
  title="YouTube video player"
  frameBorder="0"
  allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture"
  allowFullScreen
></iframe>

### ⚙️ CrewAI Integration (30 s)

<iframe
  className="w-full aspect-video rounded-xl"
  src="https://www.loom.com/embed/9c78b552af43452bb3e4783cb8d91230?sid=e9d7d370-a91a-49b0-809e-2f375d9e801d"
  title="Loom video player"
  frameBorder="0"
  allowFullScreen
></iframe>
## Links & Support

- 📘 [Neatlogs Docs](https://docs.neatlogs.com/)
- 🔐 [Dashboard & API Key](https://app.neatlogs.com/)
- 🐦 [Follow on Twitter](https://twitter.com/neatlogs)
- 📧 Contact: hello@neatlogs.com
- 🛠 [GitHub SDK](https://github.com/NeatLogs/neatlogs)

## TL;DR

With just:

```bash
pip install neatlogs
```

```python
import neatlogs
neatlogs.init("YOUR_API_KEY")
```

you can capture, understand, share, and act on your CrewAI agent runs in seconds. No setup overhead. Full trace transparency. Full team collaboration.
@@ -44,14 +44,6 @@ These tools enable your agents to search the web, research topics, and find info
<Card title="YouTube Video Search" icon="play" href="/en/tools/search-research/youtubevideosearchtool">
  Find and analyze YouTube videos by topic, keyword, or criteria.
</Card>

<Card title="Tavily Search Tool" icon="magnifying-glass" href="/en/tools/search-research/tavilysearchtool">
  Comprehensive web search using Tavily's AI-powered search API.
</Card>

<Card title="Tavily Extractor Tool" icon="file-text" href="/en/tools/search-research/tavilyextractortool">
  Extract structured content from web pages using the Tavily API.
</Card>
</CardGroup>

## **Common Use Cases**
@@ -63,19 +55,17 @@ These tools enable your agents to search the web, research topics, and find info
- **Academic Research**: Find scholarly articles and technical papers

```python
from crewai_tools import SerperDevTool, GitHubSearchTool, YoutubeVideoSearchTool, TavilySearchTool, TavilyExtractorTool

# Create research tools
web_search = SerperDevTool()
code_search = GitHubSearchTool()
video_research = YoutubeVideoSearchTool()
tavily_search = TavilySearchTool()
content_extractor = TavilyExtractorTool()

# Add to your agent
agent = Agent(
    role="Research Analyst",
    tools=[web_search, code_search, video_research, tavily_search, content_extractor],
    goal="Gather comprehensive information on any topic"
)
```
@@ -1,139 +0,0 @@
---
title: "Tavily Extractor Tool"
description: "Extract structured content from web pages using the Tavily API"
icon: "file-text"
---

The `TavilyExtractorTool` allows CrewAI agents to extract structured content from web pages using the Tavily API. It can process single URLs or lists of URLs and provides options for controlling the extraction depth and including images.

## Installation

To use the `TavilyExtractorTool`, you need to install the `tavily-python` library:

```shell
pip install 'crewai[tools]' tavily-python
```

You also need to set your Tavily API key as an environment variable:

```bash
export TAVILY_API_KEY='your-tavily-api-key'
```
## Example Usage

Here's how to initialize and use the `TavilyExtractorTool` within a CrewAI agent:

```python
import os
from crewai import Agent, Task, Crew
from crewai_tools import TavilyExtractorTool

# Ensure TAVILY_API_KEY is set in your environment
# os.environ["TAVILY_API_KEY"] = "YOUR_API_KEY"

# Initialize the tool
tavily_tool = TavilyExtractorTool()

# Create an agent that uses the tool
extractor_agent = Agent(
    role='Web Content Extractor',
    goal='Extract key information from specified web pages',
    backstory='You are an expert at extracting relevant content from websites using the Tavily API.',
    tools=[tavily_tool],
    verbose=True
)

# Define a task for the agent
extract_task = Task(
    description='Extract the main content from the URL https://example.com using basic extraction depth.',
    expected_output='A JSON string containing the extracted content from the URL.',
    agent=extractor_agent
)

# Create and run the crew
crew = Crew(
    agents=[extractor_agent],
    tasks=[extract_task],
    verbose=True
)

result = crew.kickoff()
print(result)
```
## Configuration Options

The `TavilyExtractorTool` accepts the following arguments:

- `urls` (Union[List[str], str]): **Required**. A single URL string or a list of URL strings to extract data from.
- `include_images` (Optional[bool]): Whether to include images in the extraction results. Defaults to `False`.
- `extract_depth` (Literal["basic", "advanced"]): The depth of extraction. Use `"basic"` for faster, surface-level extraction or `"advanced"` for more comprehensive extraction. Defaults to `"basic"`.
- `timeout` (int): The maximum time in seconds to wait for the extraction request to complete. Defaults to `60`.
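Outside of a crew, you can also invoke the tool directly. A rough sketch, assuming the common `run(**kwargs)` entry point that CrewAI tools expose (the URL is illustrative):

```python
from crewai_tools import TavilyExtractorTool

tool = TavilyExtractorTool()
result_json = tool.run(
    urls=["https://example.com"],  # illustrative URL
    extract_depth="basic",
    include_images=False,
)
print(result_json)
```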
## Advanced Usage

### Multiple URLs with Advanced Extraction

```python
# Example with multiple URLs and advanced extraction
multi_extract_task = Task(
    description='Extract content from https://example.com and https://anotherexample.org using advanced extraction.',
    expected_output='A JSON string containing the extracted content from both URLs.',
    agent=extractor_agent
)

# Configure the tool with custom parameters
custom_extractor = TavilyExtractorTool(
    extract_depth='advanced',
    include_images=True,
    timeout=120
)

agent_with_custom_tool = Agent(
    role="Advanced Content Extractor",
    goal="Extract comprehensive content with images",
    tools=[custom_extractor]
)
```
### Tool Parameters

You can customize the tool's behavior by setting parameters during initialization:

```python
# Initialize with custom configuration
extractor_tool = TavilyExtractorTool(
    extract_depth='advanced',  # More comprehensive extraction
    include_images=True,       # Include image results
    timeout=90                 # Custom timeout
)
```
## Features

- **Single or Multiple URLs**: Extract content from one URL or process multiple URLs in a single request
- **Configurable Depth**: Choose between basic (fast) and advanced (comprehensive) extraction modes
- **Image Support**: Optionally include images in the extraction results
- **Structured Output**: Returns well-formatted JSON containing the extracted content
- **Error Handling**: Robust handling of network timeouts and extraction errors

## Response Format

The tool returns a JSON string representing the structured data extracted from the provided URL(s). The exact structure depends on the content of the pages and the `extract_depth` used.

Common response elements include:
- **Title**: The page title
- **Content**: Main text content of the page
- **Images**: Image URLs and metadata (when `include_images=True`)
- **Metadata**: Additional page information like author, description, etc.
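As a sketch of consuming the returned JSON string (field names follow the Tavily extract API and may vary by version):

```python
import json

# 'result_json' is the string returned by the tool (see the direct-call sketch above)
data = json.loads(result_json)
for page in data.get("results", []):           # one entry per successfully extracted URL
    print(page.get("url"), len(page.get("raw_content", "")))
for failed in data.get("failed_results", []):  # URLs that could not be extracted
    print("failed:", failed)
```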
## Use Cases

- **Content Analysis**: Extract and analyze content from competitor websites
- **Research**: Gather structured data from multiple sources for analysis
- **Content Migration**: Extract content from existing websites for migration
- **Monitoring**: Regular extraction of content for change detection
- **Data Collection**: Systematic extraction of information from web sources

Refer to the [Tavily API documentation](https://docs.tavily.com/docs/tavily-api/python-sdk#extract) for detailed information about the response structure and available options.
@@ -1,122 +0,0 @@
---
title: "Tavily Search Tool"
description: "Perform comprehensive web searches using the Tavily Search API"
icon: "magnifying-glass"
---

The `TavilySearchTool` provides an interface to the Tavily Search API, enabling CrewAI agents to perform comprehensive web searches. It allows for specifying search depth, topics, time ranges, included/excluded domains, and whether to include direct answers, raw content, or images in the results.

## Installation

To use the `TavilySearchTool`, you need to install the `tavily-python` library:

```shell
pip install 'crewai[tools]' tavily-python
```

## Environment Variables

Ensure your Tavily API key is set as an environment variable:

```bash
export TAVILY_API_KEY='your_tavily_api_key'
```
## Example Usage

Here's how to initialize and use the `TavilySearchTool` within a CrewAI agent:

```python
import os
from crewai import Agent, Task, Crew
from crewai_tools import TavilySearchTool

# Ensure the TAVILY_API_KEY environment variable is set
# os.environ["TAVILY_API_KEY"] = "YOUR_TAVILY_API_KEY"

# Initialize the tool
tavily_tool = TavilySearchTool()

# Create an agent that uses the tool
researcher = Agent(
    role='Market Researcher',
    goal='Find information about the latest AI trends',
    backstory='An expert market researcher specializing in technology.',
    tools=[tavily_tool],
    verbose=True
)

# Create a task for the agent
research_task = Task(
    description='Search for the top 3 AI trends in 2024.',
    expected_output='A JSON report summarizing the top 3 AI trends found.',
    agent=researcher
)

# Form the crew and kick it off
crew = Crew(
    agents=[researcher],
    tasks=[research_task],
    verbose=True
)

result = crew.kickoff()
print(result)
```
## Configuration Options

The `TavilySearchTool` accepts the following arguments during initialization or when calling the `run` method:

- `query` (str): **Required**. The search query string.
- `search_depth` (Literal["basic", "advanced"], optional): The depth of the search. Defaults to `"basic"`.
- `topic` (Literal["general", "news", "finance"], optional): The topic to focus the search on. Defaults to `"general"`.
- `time_range` (Literal["day", "week", "month", "year"], optional): The time range for the search. Defaults to `None`.
- `days` (int, optional): The number of days to search back. Relevant if `time_range` is not set. Defaults to `7`.
- `max_results` (int, optional): The maximum number of search results to return. Defaults to `5`.
- `include_domains` (Sequence[str], optional): A list of domains to prioritize in the search. Defaults to `None`.
- `exclude_domains` (Sequence[str], optional): A list of domains to exclude from the search. Defaults to `None`.
- `include_answer` (Union[bool, Literal["basic", "advanced"]], optional): Whether to include a direct answer synthesized from the search results. Defaults to `False`.
- `include_raw_content` (bool, optional): Whether to include the raw HTML content of the searched pages. Defaults to `False`.
- `include_images` (bool, optional): Whether to include image results. Defaults to `False`.
- `timeout` (int, optional): The request timeout in seconds. Defaults to `60`.
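Because `query` can be supplied at call time, the tool can also be invoked directly. A rough sketch, assuming the common `run(**kwargs)` entry point that CrewAI tools expose (the query is illustrative):

```python
from crewai_tools import TavilySearchTool

tool = TavilySearchTool()
search_json = tool.run(
    query="top AI trends in 2024",  # illustrative query
    max_results=3,
    include_answer=True,
)
print(search_json)
```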
## Advanced Usage

You can configure the tool with custom parameters:

```python
# Example: Initialize with specific parameters
custom_tavily_tool = TavilySearchTool(
    search_depth='advanced',
    max_results=10,
    include_answer=True
)

# The agent will use these defaults
agent_with_custom_tool = Agent(
    role="Advanced Researcher",
    goal="Conduct detailed research with comprehensive results",
    tools=[custom_tavily_tool]
)
```
## Features

- **Comprehensive Search**: Access to Tavily's powerful search index
- **Configurable Depth**: Choose between basic and advanced search modes
- **Topic Filtering**: Focus searches on general, news, or finance topics
- **Time Range Control**: Limit results to specific time periods
- **Domain Control**: Include or exclude specific domains
- **Direct Answers**: Get synthesized answers from search results
- **Content Filtering**: Prevent context window issues with automatic content truncation

## Response Format

The tool returns search results as a JSON string containing:
- Search results with titles, URLs, and content snippets
- Optional direct answers to queries
- Optional image results
- Optional raw HTML content (when enabled)

Content for each result is automatically truncated to prevent context window issues while maintaining the most relevant information.
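As a sketch of consuming that JSON string (field names follow the Tavily search API and may vary by version):

```python
import json

# 'search_json' is the string returned by the tool (see the direct-call sketch above)
data = json.loads(search_json)
print(data.get("answer"))               # present when include_answer=True
for item in data.get("results", []):
    print(item.get("title"), item.get("url"))
```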
Binary file not shown. (Before: 222 KiB)
Binary file not shown. (Before: 329 KiB)
Binary file not shown. (Before: 590 KiB)
Binary file not shown. (Before: 216 KiB)
Binary file not shown. (Before: 277 KiB)

docs/pt-BR/changelog.mdx (new file, 473 lines)
@@ -0,0 +1,473 @@
---
title: Changelog
description: View the latest CrewAI updates and changes
icon: timeline
---

<Update label="2025-05-22" description="v0.121.0" tags={["Latest"]}>
## Release Highlights
<Frame>
<img src="/images/releases/v01210.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.121.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Fixed an encoding error when creating tools
- Fixed a failing llama test
- Updated the logging configuration for more consistency
- Improved telemetry initialization and event handling

**New Features & Enhancements**
- Added a **markdown attribute** to the Task class
- Added a **reasoning attribute** to the Agent class
- Added an **inject_date flag** to Agent for automatic date injection
- Implemented **HallucinationGuardrail** (no-op, with test coverage)

**Documentation & Guides**
- Added documentation for the **StagehandTool** and improved the MDX structure
- Included documentation for the **MCP** integration and updated the enterprise docs
- Documented knowledge events and updated the reasoning documentation
- Added an explanation of the stop parameter
- Fixed import references in documentation examples (before_kickoff, after_kickoff)
- General updates and restructuring of the docs for clarity
</Update>

<Update label="2025-05-15" description="v0.120.1">
## Release Highlights
<Frame>
<img src="/images/releases/v01201.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.120.1">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Fixed **interpolation with hyphens**
</Update>

<Update label="2025-05-14" description="v0.120.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01200.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.120.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Enabled the full Ruff rule set by default for stricter linting
- Fixed a race condition in FilteredStream using context managers
- Fixed an agent knowledge reset issue
- Refactored agent lookup logic into a utility module

**New Features & Enhancements**
- Added support for **loading an Agent directly from a repository**
- Allowed setting an empty context on Task
- Improved Agent repository feedback and fixed Tool auto-import behavior
- Introduced direct knowledge initialization (bypassing knowledge_sources)

**Documentation & Guides**
- Updated security.md to reflect current security practices
- Revised the Google setup section for clarity
- Added a link to AI Studio when entering a Gemini key
- Updated the Arize Phoenix observability guide
- Overhauled the flow documentation
</Update>

<Update label="2025-05-08" description="v0.119.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01190.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.119.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Improved test reliability by improving pytest handling of flaky tests
- Fixed a memory reset crash caused by an embedding dimension mismatch
- Enabled parent flow identification for Crew and LiteAgent
- Prevented telemetry crashes when telemetry is unavailable
- Updated the **LiteLLM** version for better compatibility
- Fixed the llama converter tests by removing skip_external_api

**New Features & Enhancements**
- Introduced **knowledge retrieval prompt rewriting** in Agent for better tracing and debugging
- Made the LLM setup and quickstart guides model-agnostic

**Documentation & Guides**
- Added advanced configuration documentation for the RAG tool
- Updated the Windows troubleshooting guide
- Refined documentation examples for clarity
- Fixed spelling errors in docs and configuration files
</Update>

<Update label="2025-04-28" description="v0.118.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01180.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.118.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Fixed issues with missing prompt or system templates
- Removed the global logging configuration to avoid unintended overrides
- Renamed **TaskGuardrail to LLMGuardrail** for clarity
- Downgraded litellm to 1.167.1 for compatibility
- Added missing init.py files to ensure correct module initialization

**New Features & Enhancements**
- Added support for **no-code Guardrail creation**, making it easier to control AI behavior

**Documentation & Guides**
- Removed CrewStructuredTool from the public documentation to reflect internal use
- Updated the enterprise docs and YouTube embed for better onboarding
</Update>

<Update label="2025-04-20" description="v0.117.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01170.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.117.0">View on GitHub</a>
</div>

**New Features & Enhancements**
- Added support for the `result_as_answer` parameter in the `@tool` decorator.
- Support for new language models: GPT-4.1, Gemini-2.0, and Gemini-2.5 Pro.
- Enhanced knowledge management capabilities.
- Added the Huggingface provider in the CLI.
- Improved compatibility and CI support for Python 3.10+.

**Core Improvements & Fixes**
- Fixed issues with incorrect template parameters and missing inputs.
- Improved async flows with coroutine condition checks.
- Improved memory management with isolated configuration and correct object copying.
- Fixed lite agent initialization with correct references.
- Fixed Python type-hint issues and removed redundant imports.
- Updated event placement for tool usage tracking.
- Raised explicit exceptions when flows fail.
- Removed redundant code and comments across several modules.
- Updated the GitHub App token action to v2.

**Documentation & Guides**
- Improved documentation structure, including enterprise deployment instructions.
- Automatic creation of output folders for documentation generation.
- Repaired a broken link in the WeaviateVectorSearchTool documentation.
- Fixed the guardrail documentation and the JSON search tool import paths.
- Updated the CodeInterpreterTool documentation.
- Improved SEO, contextual navigation, and error handling on documentation pages.
</Update>

<Update label="2025-04-25" description="v0.117.1">
## Release Highlights
<Frame>
<img src="/images/releases/v01171.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.117.1">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Updated **crewai-tools** to the latest version
- Updated **liteLLM** to the latest version
- Fixed **Mem0 OSS**
</Update>

<Update label="2025-04-07" description="v0.114.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01140.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.114.0">View on GitHub</a>
</div>

**New Features & Enhancements**
- Agents as an atomic unit. (`Agent(...).kickoff()`)
- Support for [Custom LLM implementations](https://docs.crewai.com/guides/advanced/custom-llm).
- Integrated external memory and [Opik observability](https://docs.crewai.com/how-to/opik-observability).
- Improved YAML extraction.
- Multimodal agent validation.
- Added secure fingerprints for agents and crews.

**Core Improvements & Fixes**
- Improved serialization, agent copying, and Python compatibility.
- Added wildcard support to `emit()`
- Support for additional router calls and context window adjustments.
- Fixes to typing, validation, and imports.
- Improved method performance.
- Improved agent task handling, event emission, and memory management.
- Fixes to the CLI, conditional tasks, cloning behavior, and tool outputs.

**Documentation & Guides**
- Improved documentation structure, theme, and organization.
- Added guides for Local NVIDIA NIM with WSL2, W&B Weave, and Arize Phoenix.
- Updated tool configuration examples, prompts, and observability docs.
- Guide for using singular agents in Flows.
</Update>

<Update label="2025-03-17" description="v0.108.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01080.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.108.0">View on GitHub</a>
</div>

**New Features & Enhancements**
- Converted tabs to spaces in the `crew.py` template
- Improved LLM response streaming and the event system
- Included `model_name`
- Improved the Event Listener with rich visualization and better logging
- Added fingerprints

**Bug Fixes**
- Fixed Mistral issues
- Fixed a documentation bug
- Fixed a type-check error in the fingerprint property

**Documentation Updates**
- Improved tool documentation
- Updated the installation guide for the `uv` tool package
- Added instructions for upgrading crewAI with the `uv` tool
- Added documentation for `ApifyActorsTool`
</Update>

<Update label="2025-03-10" description="v0.105.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01050.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.105.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Fixed missing template variables and user memory configuration
- Improved async flow support and fixed agent response formatting
- Improved the memory reset function and fixed the CLI memory commands
- Fixed type issues, tool call properties, and telemetry decoupling

**New Features & Enhancements**
- Flow state export and improved state utilities
- Improved agent knowledge setup with an optional crew embedder
- Added an event emitter for better observability and LLM call tracking
- Support for Python 3.10 and ChatOllama via langchain_ollama
- Context window size support for the o3-mini model
- Added the ability to make multiple router calls

**Documentation & Guides**
- Improved documentation layout and hierarchical structure
- Added a QdrantVectorSearchTool guide and clarified event listener usage
- Fixed prompt errors and updated the Amazon Bedrock model list
</Update>

<Update label="2025-02-12" description="v0.102.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01020.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.102.0">View on GitHub</a>
</div>

**Core Improvements & Fixes**
- Expanded LLM support: improved structured LLM output, parameter handling, and formatting for Anthropic models
- Crew & Agent stability: fixed cloning of agents/crews with knowledge sources, multiple task outputs in conditional tasks, and ignored Crew task callbacks
- Memory & storage fixes: improved short-term memory handling with Bedrock, correct embedder initialization, and added a reset memories function to the crew class
- Training & execution reliability: fixed broken training and interpolation issues with dict and list input types

**New Features & Enhancements**
- Advanced knowledge management: improved naming conventions and enhanced embedding configuration with custom embedder support
- Expanded logging & observability: JSON format support for logging and integrated MLflow tracing documentation
- Data handling improvements: updated excel_knowledge_source.py to process multi-tab files
- Overall performance & code cleanup: enterprise code alignment and linting fixes
- New tool added: `QdrantVectorSearchTool`

**Documentation & Guides**
- Updated AI & memory docs: improvements to the Bedrock, Google AI, and long-term memory documentation
- Clarity in tasks & flows: added a "Human Input" row to Task Attributes, a Langfuse guide, and FileWriterTool documentation
- Various spelling & formatting fixes
</Update>

<Update label="2025-01-28" description="v0.100.0">
## Release Highlights
<Frame>
<img src="/images/releases/v01000.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.100.0">View on GitHub</a>
</div>

**Features**
- Added Composio docs
- Added SageMaker as an LLM provider

**Fixes**
- General fixes to LLM connections
- Use of safe accessors in training
- Added a version check to crew_chat.py

**Documentation**
- New docs for crewai chat
- Improved formatting and clarity in the CLI and Composio Tool docs
</Update>

<Update label="2025-01-20" description="v0.98.0">
## Release Highlights
<Frame>
<img src="/images/releases/v0980.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.98.0">View on GitHub</a>
</div>

**Features**
- Conversation crew v1
- Added unique IDs for flow states
- Added the @persist decorator with the FlowPersistence interface

**Integrations**
- Added the SambaNova integration
- New NVIDIA NIM provider in the CLI
- Introducing VoyageAI

**Fixes**
- Fixed API key behavior and entity handling in the Mem0 integration
- Fixed the main invoke logic and related tests
- Tool inputs are now actual objects instead of strings
- Added important parts to the tool creation process
- Downgraded the litellm version to prevent a Windows issue
- Fixed before kickoff when inputs are null
- Fixed errors, nested pydantic model issues, and docling failures
</Update>

<Update label="2025-01-04" description="v0.95.0">
## Release Highlights
<Frame>
<img src="/images/releases/v0950.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.95.0">View on GitHub</a>
</div>

**New Features**
- Added multimodal abilities to Crew
- Programmatic guardrails
- HITL with multiple rounds
- Gemini 2.0 support
- CrewAI Flows improvements
- Added workflow permissions
- Added langfuse support with litellm
- Portkey integration with CrewAI
- Added the interpolate_only method and improved error handling
- Docling support
- Weviate support

**Fixes**
- output_file not respecting the system path
- Disk I/O error when resetting short-term memory
- CrewJSONEncoder now accepts enums
- Maximum Python version
- Interpolation of output_file in Task
- Proper handling of coworker role names regarding casing and whitespace
- Added tiktoken as an explicit dependency and documented the Rust requirement
- Include agent knowledge in the planning process
- Storage initialization set to None in KnowledgeStorage
- Fixed optional storage checks
- Included the event emitter in flows
- Improvements to docstrings, error handling, and type hints
- Suppressed userWarnings from litellm pydantic issues
</Update>

<Update label="2024-12-05" description="v0.86.0">
## Release Highlights
<Frame>
<img src="/images/releases/v0860.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.86.0">View on GitHub</a>
</div>
**Changes**
- Removed all references to pipeline and pipeline router
- Added Nvidia NIM as a provider in Custom LLM
- Added a knowledge demo + improved the knowledge docs
- Added support for multiple rounds of HITL
- New docs on building a crew in YAML with decorators
- Simplified the crew template
</Update>

<Update label="2024-12-04" description="v0.85.0">
## Release Highlights
<Frame>
<img src="/images/releases/v0850.png" />
</Frame>

<div style={{ textAlign: 'center', marginBottom: '1rem' }}>
<a href="https://github.com/crewAIInc/crewAI/releases/tag/0.85.0">View on GitHub</a>
</div>
**Features**
- Added agent-level knowledge
- Feat/remove langchain
- Improved typed task outputs
- Log in to the Tool Repository when logging in to crewai

**Fixes**
- Fixed issues with result as answer not properly exiting the LLM loop
- Fixed a missing key name when running with the ollama provider
- Fixed an identified typo

**Documentation**
- Updated the readme for running mypy
- Added knowledge to mint.json
- Updated the GitHub actions
- Updated the Agents docs to include two approaches for creating an agent
- Improvements to LLM Configuration and Usage
</Update>

<Update label="2024-11-25" description="v0.83.0">
**New Features**
- New before_kickoff and after_kickoff crew callbacks
- Support for pre-seeding agents with Knowledge
- Added support for retrieving user preferences and memories using Mem0

**Fixes**
- Fixed async execution
- Upgraded chroma and adjusted the embedder function generator
- Updated the Watson CLI with supported models + docs
- Reduced the level for Bandit
- Fixed all tests

**Documentation**
- Updated documentation
</Update>

<Update label="2024-11-13" description="v0.80.0">
**Fixes**
- Fixed a Tokens callback replacement bug
- Fixed a Step callback issue
- Added cached prompt token info to usage metrics
- Fixed the crew_train_success test
</Update>
@@ -149,33 +149,34 @@ from crewai_tools import SerperDevTool

# Crie um agente com todos os parâmetros disponíveis
agent = Agent(
    role="Cientista de Dados Sênior",
    goal="Analisar e interpretar conjuntos de dados complexos para fornecer insights acionáveis",
    backstory="Com mais de 10 anos de experiência em ciência de dados e aprendizado de máquina, você é especialista em encontrar padrões em grandes volumes de dados.",
    llm="gpt-4",  # Padrão: OPENAI_MODEL_NAME ou "gpt-4"
    function_calling_llm=None,  # Opcional: LLM separado para chamadas de ferramentas
    verbose=False,  # Padrão: False
    allow_delegation=False,  # Padrão: False
    max_iter=20,  # Padrão: 20 iterações
    max_rpm=None,  # Opcional: Limite de requisições por minuto
    max_execution_time=None,  # Opcional: Tempo máximo de execução em segundos
    max_retry_limit=2,  # Padrão: 2 tentativas em caso de erro
    allow_code_execution=False,  # Padrão: False
    code_execution_mode="safe",  # Padrão: "safe" (opções: "safe", "unsafe")
    respect_context_window=True,  # Padrão: True
    use_system_prompt=True,  # Padrão: True
    multimodal=False,  # Padrão: False
    inject_date=False,  # Padrão: False
    date_format="%Y-%m-%d",  # Padrão: formato ISO
    reasoning=False,  # Padrão: False
    max_reasoning_attempts=None,  # Padrão: None
    tools=[SerperDevTool()],  # Opcional: Lista de ferramentas
    knowledge_sources=None,  # Opcional: Lista de fontes de conhecimento
    embedder=None,  # Opcional: Configuração de embedder customizado
    system_template=None,  # Opcional: Template de prompt de sistema
    prompt_template=None,  # Opcional: Template de prompt customizado
    response_template=None,  # Opcional: Template de resposta customizado
    step_callback=None,  # Opcional: Função de callback para monitoramento
    role="Senior Data Scientist",
    goal="Analyze and interpret complex datasets to provide actionable insights",
    backstory="With over 10 years of experience in data science and machine learning, "
              "you excel at finding patterns in complex datasets.",
    llm="gpt-4",  # Default: OPENAI_MODEL_NAME or "gpt-4"
    function_calling_llm=None,  # Optional: Separate LLM for tool calling
    verbose=False,  # Default: False
    allow_delegation=False,  # Default: False
    max_iter=20,  # Default: 20 iterations
    max_rpm=None,  # Optional: Rate limit for API calls
    max_execution_time=None,  # Optional: Maximum execution time in seconds
    max_retry_limit=2,  # Default: 2 retries on error
    allow_code_execution=False,  # Default: False
    code_execution_mode="safe",  # Default: "safe" (options: "safe", "unsafe")
    respect_context_window=True,  # Default: True
    use_system_prompt=True,  # Default: True
    multimodal=False,  # Default: False
    inject_date=False,  # Default: False
    date_format="%Y-%m-%d",  # Default: ISO format
    reasoning=False,  # Default: False
    max_reasoning_attempts=None,  # Default: None
    tools=[SerperDevTool()],  # Optional: List of tools
    knowledge_sources=None,  # Optional: List of knowledge sources
    embedder=None,  # Optional: Custom embedder configuration
    system_template=None,  # Optional: Custom system prompt template
    prompt_template=None,  # Optional: Custom prompt template
    response_template=None,  # Optional: Custom response template
    step_callback=None,  # Optional: Callback function for monitoring
)
```

@@ -184,62 +185,65 @@ Vamos detalhar algumas combinações de parâmetros-chave para casos de uso comu
#### Basic Research Agent
```python Code
research_agent = Agent(
    role="Analista de Pesquisa",
    goal="Encontrar e resumir informações sobre tópicos específicos",
    backstory="Você é um pesquisador experiente com atenção aos detalhes",
    role="Research Analyst",
    goal="Find and summarize information about specific topics",
    backstory="You are an experienced researcher with attention to detail",
    tools=[SerperDevTool()],
    verbose=True  # Ativa logs para depuração
    verbose=True  # Enable logging for debugging
)
```

#### Code Development Agent
```python Code
dev_agent = Agent(
    role="Desenvolvedor Python Sênior",
    goal="Escrever e depurar códigos Python",
    backstory="Desenvolvedor Python especialista com 10 anos de experiência",
    role="Senior Python Developer",
    goal="Write and debug Python code",
    backstory="Expert Python developer with 10 years of experience",
    allow_code_execution=True,
    code_execution_mode="safe",  # Usa Docker para segurança
    max_execution_time=300,  # Limite de 5 minutos
    max_retry_limit=3  # Mais tentativas para tarefas complexas
    code_execution_mode="safe",  # Uses Docker for safety
    max_execution_time=300,  # 5-minute timeout
    max_retry_limit=3  # More retries for complex code tasks
)
```

#### Long-Running Analysis Agent
```python Code
analysis_agent = Agent(
    role="Analista de Dados",
    goal="Realizar análise aprofundada de grandes conjuntos de dados",
    backstory="Especialista em análise de big data e reconhecimento de padrões",
    role="Data Analyst",
    goal="Perform deep analysis of large datasets",
    backstory="Specialized in big data analysis and pattern recognition",
    memory=True,
    respect_context_window=True,
    max_rpm=10,  # Limite de requisições por minuto
    function_calling_llm="gpt-4o-mini"  # Modelo mais econômico para chamadas de ferramentas
    max_rpm=10,  # Limit API calls
    function_calling_llm="gpt-4o-mini"  # Cheaper model for tool calls
)
```

#### Agent with Custom Templates
```python Code
custom_agent = Agent(
    role="Atendente de Suporte ao Cliente",
    goal="Auxiliar clientes com suas dúvidas e solicitações",
    backstory="Experiente em atendimento ao cliente com foco em satisfação",
    system_template="""<|start_header_id|>system<|end_header_id|>\n {{ .System }}<|eot_id|>""",
    prompt_template="""<|start_header_id|>user<|end_header_id|>\n {{ .Prompt }}<|eot_id|>""",
    response_template="""<|start_header_id|>assistant<|end_header_id|>\n {{ .Response }}<|eot_id|>""",
    role="Customer Service Representative",
    goal="Assist customers with their inquiries",
    backstory="Experienced in customer support with a focus on satisfaction",
    system_template="""<|start_header_id|>system<|end_header_id|>
{{ .System }}<|eot_id|>""",
    prompt_template="""<|start_header_id|>user<|end_header_id|>
{{ .Prompt }}<|eot_id|>""",
    response_template="""<|start_header_id|>assistant<|end_header_id|>
{{ .Response }}<|eot_id|>""",
)
```

#### Date-Aware Agent with Reasoning
```python Code
strategic_agent = Agent(
    role="Analista de Mercado",
    goal="Acompanhar movimentos do mercado com referências de datas precisas e planejamento estratégico",
    backstory="Especialista em análise financeira sensível ao tempo e relatórios estratégicos",
    inject_date=True,  # Injeta automaticamente a data atual nas tarefas
    date_format="%d de %B de %Y",  # Exemplo: "21 de maio de 2025"
    reasoning=True,  # Ativa planejamento estratégico
    max_reasoning_attempts=2,  # Limite de iterações de planejamento
    role="Market Analyst",
    goal="Track market movements with precise date references and strategic planning",
    backstory="Expert in time-sensitive financial analysis and strategic reporting",
    inject_date=True,  # Automatically inject current date into tasks
    date_format="%B %d, %Y",  # Format as "May 21, 2025"
    reasoning=True,  # Enable strategic planning
    max_reasoning_attempts=2,  # Limit planning iterations
    verbose=True
)
```
@@ -247,12 +251,12 @@ strategic_agent = Agent(
#### Reasoning Agent
```python Code
reasoning_agent = Agent(
    role="Planejador Estratégico",
    goal="Analisar problemas complexos e criar planos de execução detalhados",
    backstory="Especialista em planejamento estratégico que desmembra desafios complexos metodicamente",
    reasoning=True,  # Ativa raciocínio e planejamento
    max_reasoning_attempts=3,  # Limite de tentativas de raciocínio
    max_iter=30,  # Permite mais iterações para planejamento complexo
    role="Strategic Planner",
    goal="Analyze complex problems and create detailed execution plans",
    backstory="Expert strategic planner who methodically breaks down complex challenges",
    reasoning=True,  # Enable reasoning and planning
    max_reasoning_attempts=3,  # Limit reasoning attempts
    max_iter=30,  # Allow more iterations for complex planning
    verbose=True
)
```
@@ -260,10 +264,10 @@ reasoning_agent = Agent(
#### Multimodal Agent
```python Code
multimodal_agent = Agent(
    role="Analista de Conteúdo Visual",
    goal="Analisar e processar tanto conteúdo textual quanto visual",
    backstory="Especialista em análise multimodal combinando compreensão de texto e imagem",
    multimodal=True,  # Ativa capacidades multimodais
    role="Visual Content Analyst",
    goal="Analyze and process both text and visual content",
    backstory="Specialized in multimodal analysis combining text and image understanding",
    multimodal=True,  # Enable multimodal capabilities
    verbose=True
)
```
@@ -332,8 +336,8 @@ wiki_tool = WikipediaTools()

# Adicionar ferramentas ao agente
researcher = Agent(
    role="Pesquisador de Tecnologia em IA",
    goal="Pesquisar os últimos avanços em IA",
    role="AI Technology Researcher",
    goal="Research the latest AI developments",
    tools=[search_tool, wiki_tool],
    verbose=True
)
@@ -347,9 +351,9 @@ Agentes podem manter a memória de suas interações e usar contexto de tarefas
from crewai import Agent

analyst = Agent(
    role="Analista de Dados",
    goal="Analisar e memorizar padrões complexos de dados",
    memory=True,  # Ativa memória
    role="Data Analyst",
    goal="Analyze and remember complex data patterns",
    memory=True,  # Enable memory
    verbose=True
)
```
@@ -376,10 +380,10 @@ Esta é a **configuração padrão e recomendada** para a maioria dos casos. Qua
```python Code
# Agente com gerenciamento automático de contexto (padrão)
smart_agent = Agent(
    role="Analista de Pesquisa",
    goal="Analisar grandes documentos e conjuntos de dados",
    backstory="Especialista em processar informações extensas",
    respect_context_window=True,  # 🔑 Padrão: gerencia limites de contexto automaticamente
    role="Research Analyst",
    goal="Analyze large documents and datasets",
    backstory="Expert at processing extensive information",
    respect_context_window=True,  # 🔑 Default: auto-handle context limits
    verbose=True
)
```

@@ -3,7 +3,6 @@ title: CLI
description: Learn how to use the CrewAI CLI to interact with CrewAI.
icon: terminal
---
<Warning>As of version 0.140.0, the CrewAI Enterprise platform began migrating its login provider. As a result, the CLI authentication flow has been updated. Users who sign in with Google, or who created an account after July 3, 2025, will not be able to log in with earlier versions of the `crewai` library.</Warning>

## Overview

@@ -76,22 +75,6 @@ Exemplo:
crewai train -n 10 -f my_training_data.pkl
```

```python
# Exemplo de uso programático do comando train
n_iterations = 2
inputs = {"topic": "Treinamento CrewAI"}
filename = "seu_modelo.pkl"

try:
    SuaCrew().crew().train(
        n_iterations=n_iterations,
        inputs=inputs,
        filename=filename
    )
except Exception as e:
    raise Exception(f"Ocorreu um erro ao treinar a crew: {e}")
```

### 4. Replay

Re-run the crew execution starting from a specific task.
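For reference, a typical replay session is driven by task IDs from the latest kickoff; a minimal sketch of the usual commands:

```bash
# List the task IDs from the most recent crew run
crewai log-tasks-outputs

# Replay the crew from a specific task
crewai replay -t <task_id>
```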
@@ -15,18 +15,18 @@ from crewai import Agent, Crew, Task

# Enable collaboration for agents
researcher = Agent(
    role="Especialista em Pesquisa",
    goal="Realizar pesquisas aprofundadas sobre qualquer tema",
    backstory="Pesquisador especialista com acesso a diversas fontes",
    allow_delegation=True,  # 🔑 Configuração chave para colaboração
    role="Research Specialist",
    goal="Conduct thorough research on any topic",
    backstory="Expert researcher with access to various sources",
    allow_delegation=True,  # 🔑 Key setting for collaboration
    verbose=True
)

writer = Agent(
    role="Redator de Conteúdo",
    goal="Criar conteúdo envolvente com base em pesquisas",
    backstory="Redator habilidoso que transforma pesquisas em conteúdo atraente",
    allow_delegation=True,  # 🔑 Permite fazer perguntas a outros agentes
    role="Content Writer",
    goal="Create engaging content based on research",
    backstory="Skilled writer who transforms research into compelling content",
    allow_delegation=True,  # 🔑 Enables asking questions to other agents
    verbose=True
)

@@ -67,17 +67,19 @@ from crewai import Agent, Crew, Task, Process

# Create collaborative agents
researcher = Agent(
    role="Especialista em Pesquisa",
    goal="Realizar pesquisas aprofundadas sobre qualquer tema",
    backstory="Pesquisador especialista com acesso a diversas fontes",
    role="Research Specialist",
    goal="Find accurate, up-to-date information on any topic",
    backstory="""You're a meticulous researcher with expertise in finding
    reliable sources and fact-checking information across various domains.""",
    allow_delegation=True,
    verbose=True
)

writer = Agent(
    role="Redator de Conteúdo",
    goal="Criar conteúdo envolvente com base em pesquisas",
    backstory="Redator habilidoso que transforma pesquisas em conteúdo atraente",
    role="Content Writer",
    goal="Create engaging, well-structured content",
    backstory="""You're a skilled content writer who excels at transforming
    research into compelling, readable content for different audiences.""",
    allow_delegation=True,
    verbose=True
)
@@ -93,17 +95,17 @@ editor = Agent(

# Create a task that encourages collaboration
article_task = Task(
    description="""Escreva um artigo abrangente de 1000 palavras sobre 'O Futuro da IA na Saúde'.

    O artigo deve incluir:
    - Aplicações atuais de IA na saúde
    - Tendências e tecnologias emergentes
    - Desafios potenciais e considerações éticas
    - Previsões de especialistas para os próximos 5 anos

    Colabore com seus colegas para garantir precisão e qualidade.""",
    expected_output="Um artigo bem pesquisado, envolvente, com 1000 palavras, estrutura adequada e citações",
    agent=writer  # O redator lidera, mas pode delegar pesquisa ao pesquisador
    description="""Write a comprehensive 1000-word article about 'The Future of AI in Healthcare'.

    The article should include:
    - Current AI applications in healthcare
    - Emerging trends and technologies
    - Potential challenges and ethical considerations
    - Expert predictions for the next 5 years

    Collaborate with your teammates to ensure accuracy and quality.""",
    expected_output="A well-researched, engaging 1000-word article with proper structure and citations",
    agent=writer  # Writer leads, but can delegate research to researcher
)

# Create collaborative crew
@@ -122,37 +124,37 @@ result = crew.kickoff()
### Pattern 1: Research → Writing → Editing
```python
research_task = Task(
    description="Pesquise os últimos avanços em computação quântica",
    expected_output="Resumo abrangente da pesquisa com principais descobertas e fontes",
    description="Research the latest developments in quantum computing",
    expected_output="Comprehensive research summary with key findings and sources",
    agent=researcher
)

writing_task = Task(
    description="Escreva um artigo com base nos achados da pesquisa",
    expected_output="Artigo envolvente de 800 palavras sobre computação quântica",
    description="Write an article based on the research findings",
    expected_output="Engaging 800-word article about quantum computing",
    agent=writer,
    context=[research_task]  # Recebe a saída da pesquisa como contexto
    context=[research_task]  # Gets research output as context
)

editing_task = Task(
    description="Edite e revise o artigo para publicação",
    expected_output="Artigo pronto para publicação, com clareza e fluidez aprimoradas",
    description="Edit and polish the article for publication",
    expected_output="Publication-ready article with improved clarity and flow",
    agent=editor,
    context=[writing_task]  # Recebe o rascunho do artigo como contexto
    context=[writing_task]  # Gets article draft as context
)
```

### Pattern 2: Single Collaborative Task
```python
collaborative_task = Task(
    description="""Crie uma estratégia de marketing para um novo produto de IA.

    Redator: Foque em mensagens e estratégia de conteúdo
    Pesquisador: Forneça análise de mercado e insights de concorrentes

    Trabalhem juntos para criar uma estratégia abrangente.""",
    expected_output="Estratégia de marketing completa com embasamento em pesquisa",
    agent=writer  # Agente líder, mas pode delegar ao pesquisador
    description="""Create a marketing strategy for a new AI product.

    Writer: Focus on messaging and content strategy
    Researcher: Provide market analysis and competitor insights

    Work together to create a comprehensive strategy.""",
    expected_output="Complete marketing strategy with research backing",
    agent=writer  # Lead agent, but can delegate to researcher
)
```

@@ -165,35 +167,35 @@ from crewai import Agent, Crew, Task, Process

# Manager agent coordinates the team
manager = Agent(
    role="Gerente de Projetos",
    goal="Coordenar esforços da equipe e garantir o sucesso do projeto",
    backstory="Gerente de projetos experiente, habilidoso em delegação e controle de qualidade",
    role="Project Manager",
    goal="Coordinate team efforts and ensure project success",
    backstory="Experienced project manager skilled at delegation and quality control",
    allow_delegation=True,
    verbose=True
)

# Specialist agents
researcher = Agent(
    role="Pesquisador",
    goal="Fornecer pesquisa e análise precisas",
    backstory="Pesquisador especialista com habilidades analíticas profundas",
    allow_delegation=False,  # Especialistas focam em sua expertise
    role="Researcher",
    goal="Provide accurate research and analysis",
    backstory="Expert researcher with deep analytical skills",
    allow_delegation=False,  # Specialists focus on their expertise
    verbose=True
)

writer = Agent(
    role="Redator",
    goal="Criar conteúdo envolvente",
    backstory="Redator habilidoso que cria conteúdo atraente",
    role="Writer",
    goal="Create compelling content",
    backstory="Skilled writer who creates engaging content",
    allow_delegation=False,
    verbose=True
)

# Manager-led task
project_task = Task(
    description="Crie um relatório de análise de mercado completo com recomendações",
    expected_output="Resumo executivo, análise detalhada e recomendações estratégicas",
    agent=manager  # O gerente delega para especialistas
    description="Create a comprehensive market analysis report with recommendations",
    expected_output="Executive summary, detailed analysis, and strategic recommendations",
    agent=manager  # Manager will delegate to specialists
)

# Hierarchical crew

@@ -153,32 +153,32 @@ from crewai_tools import YourCustomTool
class YourCrewName:
    def agent_one(self) -> Agent:
        return Agent(
            role="Analista de Dados",
            goal="Analisar tendências de dados no mercado brasileiro",
            backstory="Analista experiente com formação em economia",
            role="Data Analyst",
            goal="Analyze data trends in the market",
            backstory="An experienced data analyst with a background in economics",
            verbose=True,
            tools=[YourCustomTool()]
        )

    def agent_two(self) -> Agent:
        return Agent(
            role="Pesquisador de Mercado",
            goal="Coletar informações sobre a dinâmica do mercado nacional",
            backstory="Pesquisador dedicado com olhar atento aos detalhes",
            role="Market Researcher",
            goal="Gather information on market dynamics",
            backstory="A diligent researcher with a keen eye for detail",
            verbose=True
        )

    def task_one(self) -> Task:
        return Task(
            description="Coletar dados recentes do mercado brasileiro e identificar tendências.",
            expected_output="Um relatório resumido com as principais tendências do mercado.",
            description="Collect recent market data and identify trends.",
            expected_output="A report summarizing key trends in the market.",
            agent=self.agent_one()
        )

    def task_two(self) -> Task:
        return Task(
            description="Pesquisar fatores que afetam a dinâmica do mercado nacional.",
            expected_output="Uma análise dos fatores que influenciam o mercado.",
            description="Research factors affecting market dynamics.",
            expected_output="An analysis of factors influencing the market.",
            agent=self.agent_two()
        )

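The excerpt stops before any assembly code; purely as an illustrative sketch (assuming `Crew` and `Process` are imported from `crewai`), these agents and tasks can be wired together like so:

```python Code
# Illustrative only: build and run a crew from the class above
builder = YourCrewName()
crew = Crew(
    agents=[builder.agent_one(), builder.agent_two()],
    tasks=[builder.task_one(), builder.task_two()],
    process=Process.sequential,
)
result = crew.kickoff()
```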
@@ -51,24 +51,24 @@ from crewai.utilities.events import (
)
from crewai.utilities.events.base_event_listener import BaseEventListener

class MeuListenerPersonalizado(BaseEventListener):
class MyCustomListener(BaseEventListener):
    def __init__(self):
        super().__init__()

    def setup_listeners(self, crewai_event_bus):
        @crewai_event_bus.on(CrewKickoffStartedEvent)
        def ao_iniciar_crew(source, event):
            print(f"Crew '{event.crew_name}' iniciou a execução!")
        def on_crew_started(source, event):
            print(f"Crew '{event.crew_name}' has started execution!")

        @crewai_event_bus.on(CrewKickoffCompletedEvent)
        def ao_finalizar_crew(source, event):
            print(f"Crew '{event.crew_name}' finalizou a execução!")
            print(f"Saída: {event.output}")
        def on_crew_completed(source, event):
            print(f"Crew '{event.crew_name}' has completed execution!")
            print(f"Output: {event.output}")

        @crewai_event_bus.on(AgentExecutionCompletedEvent)
        def ao_finalizar_execucao_agente(source, event):
            print(f"Agente '{event.agent.role}' concluiu a tarefa")
            print(f"Saída: {event.output}")
        def on_agent_execution_completed(source, event):
            print(f"Agent '{event.agent.role}' completed task")
            print(f"Output: {event.output}")
```

## Registering Your Listener Properly
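The full registration guidance follows in the complete document; as a minimal sketch, simply instantiating the listener in the module where your crew is defined is what attaches its handlers, since `BaseEventListener.__init__` runs `setup_listeners` against the event bus:

```python Code
# Sketch: creating the instance registers the handlers on the event bus
my_listener = MyCustomListener()
```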
@@ -486,9 +486,8 @@ Existem duas formas de executar um flow:
You can run a flow programmatically by creating an instance of your flow class and calling the `kickoff()` method:

```python
# Exemplo de execução de flow em português
flow = ExemploFlow()
resultado = flow.kickoff()
flow = ExampleFlow()
result = flow.kickoff()
```

### Using the CLI
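For reference, from the root of a flow project the same run can be started through the CLI:

```bash
crewai flow kickoff
```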
@@ -39,17 +39,17 @@ llm = LLM(model="gpt-4o-mini", temperature=0)

# Create an agent with the knowledge store
agent = Agent(
    role="Sobre o Usuário",
    goal="Você sabe tudo sobre o usuário.",
    backstory="Você é mestre em entender pessoas e suas preferências.",
    role="About User",
    goal="You know everything about the user.",
    backstory="You are a master at understanding people and their preferences.",
    verbose=True,
    allow_delegation=False,
    llm=llm,
)

task = Task(
    description="Responda às seguintes perguntas sobre o usuário: {question}",
    expected_output="Uma resposta para a pergunta.",
    description="Answer the following questions about the user: {question}",
    expected_output="An answer to the question.",
    agent=agent,
)

@@ -87,17 +87,17 @@ llm = LLM(model="gpt-4o-mini", temperature=0)

# Create an agent with the knowledge store
agent = Agent(
    role="Sobre artigos",
    goal="Você sabe tudo sobre os artigos.",
    backstory="Você é mestre em entender artigos e seus conteúdos.",
    role="About papers",
    goal="You know everything about the papers.",
    backstory="You are a master at understanding papers and their content.",
    verbose=True,
    allow_delegation=False,
    llm=llm,
)

task = Task(
    description="Responda às seguintes perguntas sobre os artigos: {question}",
    expected_output="Uma resposta para a pergunta.",
    description="Answer the following questions about the papers: {question}",
    expected_output="An answer to the question.",
    agent=agent,
)

@@ -201,16 +201,16 @@ specialist_knowledge = StringKnowledgeSource(
)

specialist_agent = Agent(
    role="Especialista Técnico",
    goal="Fornecer expertise técnica",
    backstory="Especialista em domínios técnicos especializados",
    knowledge_sources=[specialist_knowledge]  # Conhecimento específico do agente
    role="Technical Specialist",
    goal="Provide technical expertise",
    backstory="Expert in specialized technical domains",
    knowledge_sources=[specialist_knowledge]  # Agent-specific knowledge
)

task = Task(
    description="Responda perguntas técnicas",
    description="Answer technical questions",
    agent=specialist_agent,
    expected_output="Resposta técnica"
    expected_output="Technical answer"
)

# No crew-level knowledge required
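# Illustrative sketch (not part of the diff above): assumes Crew is imported
# from crewai; the crew itself takes no knowledge_sources, and the agent-level
# knowledge stays scoped to the specialist agent.
crew = Crew(agents=[specialist_agent], tasks=[task])
result = crew.kickoff()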
@@ -240,7 +240,7 @@ Cada nível de knowledge usa coleções de armazenamento independentes:

```python
# Agent knowledge storage
agent_collection_name = agent.role  # e.g., "Especialista Técnico"
agent_collection_name = agent.role  # e.g., "Technical Specialist"

# Crew knowledge storage
crew_collection_name = "crew"
@@ -248,7 +248,7 @@ crew_collection_name = "crew"
# Both stored in same ChromaDB instance but different collections
# Path: ~/.local/share/CrewAI/{project}/knowledge/
# ├── crew/                   # Crew knowledge collection
# ├── Especialista Técnico/   # Agent knowledge collection
# ├── Technical Specialist/   # Agent knowledge collection
# └── Another Agent Role/     # Another agent's collection
```

@@ -265,7 +265,7 @@ agent_knowledge = StringKnowledgeSource(
)

agent = Agent(
    role="Especialista",
    role="Specialist",
    goal="Use specialized knowledge",
    backstory="Expert with specific knowledge",
    knowledge_sources=[agent_knowledge],
@@ -299,10 +299,10 @@ specialist_knowledge = StringKnowledgeSource(
)

specialist = Agent(
    role="Especialista Técnico",
    goal="Fornecer expertise técnica",
    backstory="Especialista em domínios técnicos especializados",
    knowledge_sources=[specialist_knowledge]  # Conhecimento específico do agente
    role="Technical Specialist",
    goal="Provide technical expertise",
    backstory="Technical expert",
    knowledge_sources=[specialist_knowledge]  # Agent-specific
)

generalist = Agent(

@@ -78,15 +78,15 @@ Existem diferentes locais no código do CrewAI onde você pode especificar o mod

# Configuração avançada com parâmetros detalhados
llm = LLM(
    model="openai/gpt-4",
    temperature=0.8,
    max_tokens=150,
    top_p=0.9,
    frequency_penalty=0.1,
    presence_penalty=0.1,
    response_format={"type": "json"},
    stop=["FIM"],
    seed=42
    model="model-id-here",  # gpt-4o, gemini-2.0-flash, anthropic/claude...
    temperature=0.7,  # Mais alto para saídas criativas
    timeout=120,  # Segundos para aguardar resposta
    max_tokens=4000,  # Comprimento máximo da resposta
    top_p=0.9,  # Parâmetro de amostragem nucleus
    frequency_penalty=0.1,  # Reduz repetição
    presence_penalty=0.1,  # Incentiva diversidade de tópicos
    response_format={"type": "json"},  # Para respostas estruturadas
    seed=42  # Para resultados reproduzíveis
)
```

@@ -127,13 +127,13 @@ Nesta seção, você encontrará exemplos detalhados que ajudam a selecionar, co
from crewai import LLM

llm = LLM(
    model="openai/gpt-4",
    model="openai/gpt-4",  # chamar modelo por provider/model_name
    temperature=0.8,
    max_tokens=150,
    top_p=0.9,
    frequency_penalty=0.1,
    presence_penalty=0.1,
    stop=["FIM"],
    stop=["END"],
    seed=42
)
```
@@ -169,7 +169,7 @@ Nesta seção, você encontrará exemplos detalhados que ajudam a selecionar, co
llm = LLM(
    model="meta_llama/Llama-4-Scout-17B-16E-Instruct-FP8",
    temperature=0.8,
    stop=["FIM"],
    stop=["END"],
    seed=42
)
```

@@ -17,7 +17,7 @@ Começar a usar o recurso de planejamento é muito simples, o único passo neces
from crewai import Crew, Agent, Task, Process

# Monte sua crew com capacidades de planejamento
minha_crew = Crew(
my_crew = Crew(
    agents=self.agents,
    tasks=self.tasks,
    process=Process.sequential,

@@ -28,23 +28,23 @@ from crewai import Crew, Process

# Exemplo: Criando uma crew com processo sequencial
crew = Crew(
    agents=meus_agentes,
    tasks=minhas_tarefas,
    agents=my_agents,
    tasks=my_tasks,
    process=Process.sequential
)

# Exemplo: Criando uma crew com processo hierárquico
# Certifique-se de fornecer um manager_llm ou manager_agent
crew = Crew(
    agents=meus_agentes,
    tasks=minhas_tarefas,
    agents=my_agents,
    tasks=my_tasks,
    process=Process.hierarchical,
    manager_llm="gpt-4o"
    # ou
    # manager_agent=meu_agente_gerente
    # manager_agent=my_manager_agent
)
```
**Note:** Make sure `meus_agentes` and `minhas_tarefas` are defined before creating the `Crew` object; for the hierarchical process, you must also provide `manager_llm` or `manager_agent`.
**Note:** Make sure `my_agents` and `my_tasks` are defined before creating the `Crew` object; for the hierarchical process, you must also provide `manager_llm` or `manager_agent`.
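Purely for illustration (every name here is a hypothetical placeholder), satisfying that note amounts to having definitions like these in scope first:

```python Code
from crewai import Agent, Task

# Hypothetical minimal definitions for the names used in the note above
my_agents = [
    Agent(role="Researcher", goal="Research the topic", backstory="An experienced researcher"),
]
my_tasks = [
    Task(description="Research the topic", expected_output="A short summary", agent=my_agents[0]),
]
```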
## Sequential Process


@@ -15,12 +15,12 @@ Para habilitar o reasoning para um agente, basta definir `reasoning=True` ao cri
```python
from crewai import Agent

analista = Agent(
    role="Analista de Dados",
    goal="Analisar dados e fornecer insights",
    backstory="Você é um analista de dados especialista.",
    reasoning=True,
    max_reasoning_attempts=3  # Opcional: Defina um limite de tentativas de reasoning
agent = Agent(
    role="Data Analyst",
    goal="Analyze complex datasets and provide insights",
    backstory="You are an experienced data analyst with expertise in finding patterns in complex data.",
    reasoning=True,  # Enable reasoning
    max_reasoning_attempts=3  # Optional: Set a maximum number of reasoning attempts
)
```

@@ -53,23 +53,23 @@ Aqui está um exemplo completo:
from crewai import Agent, Task, Crew

# Create an agent with reasoning enabled
analista = Agent(
    role="Analista de Dados",
    goal="Analisar dados e fornecer insights",
    backstory="Você é um analista de dados especialista.",
analyst = Agent(
    role="Data Analyst",
    goal="Analyze data and provide insights",
    backstory="You are an expert data analyst.",
    reasoning=True,
    max_reasoning_attempts=3  # Opcional: Defina um limite de tentativas de reasoning
    max_reasoning_attempts=3  # Optional: Set a limit on reasoning attempts
)

# Create a task
analysis_task = Task(
    description="Analise os dados de vendas fornecidos e identifique as principais tendências.",
    expected_output="Um relatório destacando as 3 principais tendências de vendas.",
    agent=analista
    description="Analyze the provided sales data and identify key trends.",
    expected_output="A report highlighting the top 3 sales trends.",
    agent=analyst
)

# Create a crew and run the task
crew = Crew(agents=[analista], tasks=[analysis_task])
crew = Crew(agents=[analyst], tasks=[analysis_task])
result = crew.kickoff()

print(result)
@@ -90,16 +90,16 @@ logging.basicConfig(level=logging.INFO)

# Create an agent with reasoning enabled
agent = Agent(
    role="Analista de Dados",
    goal="Analisar dados e fornecer insights",
    role="Data Analyst",
    goal="Analyze data and provide insights",
    reasoning=True,
    max_reasoning_attempts=3
)

# Create a task
task = Task(
    description="Analise os dados de vendas fornecidos e identifique as principais tendências.",
    expected_output="Um relatório destacando as 3 principais tendências de vendas.",
    description="Analyze the provided sales data and identify key trends.",
    expected_output="A report highlighting the top 3 sales trends.",
    agent=agent
)

@@ -113,7 +113,7 @@ result = agent.execute_task(task)
Here is an example of what a reasoning plan might look like for a data analysis task:

```
Task: Analise os dados de vendas fornecidos e identifique as principais tendências.
Task: Analyze the provided sales data and identify key trends.

Reasoning Plan:
I'll analyze the sales data to identify the top 3 trends.

@@ -57,7 +57,6 @@ crew = Crew(
| **JSON Output** _(optional)_ | `output_json` | `Optional[Type[BaseModel]]` | A Pydantic model to structure the output as JSON. |
| **Pydantic Output** _(optional)_ | `output_pydantic` | `Optional[Type[BaseModel]]` | A Pydantic model for the task output. |
| **Callback** _(optional)_ | `callback` | `Optional[Any]` | Function/object to be executed after task completion. |
| **Guardrail** _(optional)_ | `guardrail` | `Optional[Union[Callable, str]]` | Function or string description to validate the task output before moving on to the next task. |

## Creating Tasks

@@ -87,7 +86,6 @@ research_task:
  expected_output: >
    Uma lista com 10 tópicos em bullet points das informações mais relevantes sobre {topic}
  agent: researcher
  guardrail: garanta que cada bullet point contenha no mínimo 100 palavras

reporting_task:
  description: >
@@ -332,13 +330,9 @@ analysis_task = Task(

Task guardrails provide a way to validate and transform task outputs before they are passed on to the next task. This feature ensures data quality and gives agents feedback when their output does not meet specific criteria.

**Guardrails can be defined in two ways:**
1. **Function-based guardrails**: Python functions that implement custom validation logic
2. **String-based guardrails**: Natural-language descriptions that are automatically converted into LLM-based validation
### Using Guardrails in Tasks

### Function-Based Guardrails

To add a function-based guardrail to a task, provide a validation function through the `guardrail` parameter:
To add a guardrail to a task, provide a validation function through the `guardrail` parameter:

```python Code
from typing import Tuple, Union, Dict, Any
@@ -376,82 +370,9 @@ blog_task = Task(

- On success: return a tuple `(True, validated_result)`
- On failure: return a tuple `(False, "error message explaining the failure")`
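A minimal sketch of a validation function that honors this contract (the 200-word rule is illustrative, echoing the blog example):

```python Code
from typing import Any, Tuple

from crewai.tasks.task_output import TaskOutput


def validate_blog_content(result: TaskOutput) -> Tuple[bool, Any]:
    """Illustrative guardrail: keep the post under 200 words."""
    try:
        word_count = len(result.raw.split())
        if word_count > 200:
            return (False, "Blog content exceeds 200 words")
        return (True, result.raw.strip())
    except Exception as e:
        return (False, f"Unexpected error during validation: {e}")
```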
### String-Based Guardrails
### LLMGuardrail

String-based guardrails let you describe validation criteria in natural language. When you provide a string instead of a function, CrewAI automatically converts it into an `LLMGuardrail` that uses an AI agent to validate the task output.

#### Using String Guardrails in Python

```python Code
from crewai import Task

# Guardrail simples baseado em string
blog_task = Task(
    description="Escreva um post de blog sobre IA",
    expected_output="Um post de blog com menos de 200 palavras",
    agent=blog_agent,
    guardrail="Garanta que o post do blog tenha menos de 200 palavras e inclua exemplos práticos"
)

# Critérios de validação mais complexos
research_task = Task(
    description="Pesquise tendências de IA para 2025",
    expected_output="Um relatório abrangente de pesquisa",
    agent=research_agent,
    guardrail="Garanta que cada descoberta inclua uma fonte confiável e seja respaldada por dados recentes de 2024-2025"
)
```

#### Using String Guardrails in YAML

```yaml
research_task:
  description: Pesquise os últimos desenvolvimentos em IA
  expected_output: Uma lista de 10 bullet points sobre IA
  agent: researcher
  guardrail: garanta que cada bullet point contenha no mínimo 100 palavras

validation_task:
  description: Valide os achados da pesquisa
  expected_output: Um relatório de validação
  agent: validator
  guardrail: confirme que todas as fontes são de publicações respeitáveis e publicadas nos últimos 2 anos
```

#### How String Guardrails Work

When you provide a string guardrail, CrewAI automatically:
1. Creates an `LLMGuardrail` instance using the string as the validation criteria
2. Uses the task agent's LLM to power the validation
3. Creates a temporary validation agent that checks the output against your criteria
4. Returns detailed feedback if validation fails

This approach is ideal when you want to describe validation rules in natural language without writing custom validation functions.

### The LLMGuardrail Class

The `LLMGuardrail` class is the underlying mechanism that powers string-based guardrails. You can also use it directly for more advanced control:

```python Code
from crewai import Task
from crewai.tasks.llm_guardrail import LLMGuardrail
from crewai.llm import LLM

# Crie um LLMGuardrail customizado com LLM específico
custom_guardrail = LLMGuardrail(
    description="Garanta que a resposta contenha exatamente 5 bullet points com citações adequadas",
    llm=LLM(model="gpt-4o-mini")
)

task = Task(
    description="Pesquise medidas de segurança em IA",
    expected_output="Uma análise detalhada com bullet points",
    agent=research_agent,
    guardrail=custom_guardrail
)
```

**Note**: When you use a string guardrail, CrewAI automatically creates an `LLMGuardrail` instance using your task agent's LLM. Using `LLMGuardrail` directly gives you more control over the validation process and LLM selection.
The `LLMGuardrail` class provides a robust mechanism for validating task outputs.

### Error Handling Best Practices

@@ -465,7 +386,7 @@ def validate_with_context(result: TaskOutput) -> Tuple[bool, Any]:
        validated_data = perform_validation(result)
        return (True, validated_data)
    except ValidationError as e:
        return (False, f"ERRO_DE_VALIDACAO: {str(e)}")
        return (False, f"VALIDATION_ERROR: {str(e)}")
    except Exception as e:
        return (False, str(e))
```

@@ -67,17 +67,17 @@ web_rag_tool = WebsiteSearchTool()

# Criar agentes
researcher = Agent(
    role='Analista de Mercado',
    goal='Fornecer análise de mercado atualizada da indústria de IA',
    backstory='Analista especialista com olhar atento para tendências de mercado.',
    role='Market Research Analyst',
    goal='Provide up-to-date market analysis of the AI industry',
    backstory='An expert analyst with a keen eye for market trends.',
    tools=[search_tool, web_rag_tool],
    verbose=True
)

writer = Agent(
    role='Redator de Conteúdo',
    goal='Criar posts de blog envolventes sobre a indústria de IA',
    backstory='Redator habilidoso com paixão por tecnologia.',
    role='Content Writer',
    goal='Craft engaging blog posts about the AI industry',
    backstory='A skilled writer with a passion for technology.',
    tools=[docs_tool, file_tool],
    verbose=True
)

@@ -36,18 +36,19 @@ Para treinar sua crew de forma programática, siga estes passos:
3. Run the training command inside a try-except block to handle potential errors.

```python Code
n_iteracoes = 2
entradas = {"topic": "Treinamento CrewAI"}
nome_arquivo = "seu_modelo.pkl"
n_iterations = 2
inputs = {"topic": "CrewAI Training"}
filename = "your_model.pkl"

try:
    SuaCrew().crew().train(
        n_iterations=n_iteracoes,
        inputs=entradas,
        filename=nome_arquivo
    YourCrewName_Crew().crew().train(
        n_iterations=n_iterations,
        inputs=inputs,
        filename=filename
    )

except Exception as e:
    raise Exception(f"Ocorreu um erro ao treinar a crew: {e}")
    raise Exception(f"An error occurred while training the crew: {e}")
```

### Key Points

@@ -26,13 +26,13 @@ from crewai.tasks.hallucination_guardrail import HallucinationGuardrail
from crewai import LLM

# Uso básico - utiliza o expected_output da tarefa como contexto
protecao = HallucinationGuardrail(
guardrail = HallucinationGuardrail(
    llm=LLM(model="gpt-4o-mini")
)

# Com contexto de referência explícito
protecao_com_contexto = HallucinationGuardrail(
    context="IA ajuda em várias tarefas, incluindo análise e geração.",
context_guardrail = HallucinationGuardrail(
    context="AI helps with various tasks including analysis and generation.",
    llm=LLM(model="gpt-4o-mini")
)
```
@@ -43,11 +43,11 @@ protecao_com_contexto = HallucinationGuardrail(
from crewai import Task

# Crie sua tarefa com a proteção
minha_tarefa = Task(
    description="Escreva um resumo sobre as capacidades da IA",
    expected_output="Um resumo factual baseado no contexto fornecido",
    agent=meu_agente,
    guardrail=protecao  # Adiciona a proteção para validar a saída
task = Task(
    description="Write a summary about AI capabilities",
    expected_output="A factual summary based on the provided context",
    agent=my_agent,
    guardrail=guardrail  # Adiciona a proteção para validar a saída
)
```

@@ -59,8 +59,8 @@ Para validação mais rigorosa, é possível definir um limiar de fidelidade per

```python
# Proteção rigorosa exigindo alta pontuação de fidelidade
protecao_rigorosa = HallucinationGuardrail(
    context="Computação quântica utiliza qubits que existem em estados de superposição.",
strict_guardrail = HallucinationGuardrail(
    context="Quantum computing uses qubits that exist in superposition states.",
    llm=LLM(model="gpt-4o-mini"),
    threshold=8.0  # Requer pontuação >= 8 para validar
)
@@ -72,10 +72,10 @@ Se sua tarefa utiliza ferramentas, você pode incluir as respostas das ferrament

```python
# Proteção com contexto de resposta da ferramenta
protecao_clima = HallucinationGuardrail(
    context="Informações meteorológicas atuais para o local solicitado",
weather_guardrail = HallucinationGuardrail(
    context="Current weather information for the requested location",
    llm=LLM(model="gpt-4o-mini"),
    tool_response="API do Clima retornou: Temperatura 22°C, Umidade 65%, Céu limpo"
    tool_response="Weather API returned: Temperature 22°C, Humidity 65%, Clear skies"
)
```

@@ -123,15 +123,15 @@ Quando uma proteção é adicionada à tarefa, ela valida automaticamente a saí

```python
# Fluxo de validação de saída da tarefa
task_output = meu_agente.execute_task(minha_tarefa)
resultado_validacao = protecao(task_output)
task_output = agent.execute_task(task)
validation_result = guardrail(task_output)

if resultado_validacao.valid:
if validation_result.valid:
    # Tarefa concluída com sucesso
    return task_output
else:
    # Tarefa falha com feedback de validação
    raise ValidationError(resultado_validacao.feedback)
    raise ValidationError(validation_result.feedback)
```

### Event Tracking
@@ -151,10 +151,10 @@ A proteção se integra ao sistema de eventos do CrewAI para fornecer observabil
Include all of the relevant factual information the AI should base its output on:

```python
contexto = """
Empresa XYZ foi fundada em 2020 e é especializada em soluções de energia renovável.
Possui 150 funcionários e faturou R$ 50 milhões em 2023.
Seus principais produtos incluem painéis solares e turbinas eólicas.
context = """
Company XYZ was founded in 2020 and specializes in renewable energy solutions.
They have 150 employees and generated $50M revenue in 2023.
Their main products include solar panels and wind turbines.
"""
```
</Step>
@@ -164,10 +164,10 @@ A proteção se integra ao sistema de eventos do CrewAI para fornecer observabil

```python
# Bom: Contexto focado
contexto = "O clima atual em Nova York é 18°C com chuva leve."
context = "The current weather in New York is 18°C with light rain."

# Evite: Informações irrelevantes
contexto = "The weather is 18°C. The city has 8 million people. Traffic is heavy."
context = "The weather is 18°C. The city has 8 million people. Traffic is heavy."
```
</Step>

@@ -84,31 +84,31 @@ from crewai import Agent, Task, Crew
from crewai_tools import CrewaiEnterpriseTools

# Obtenha ferramentas enterprise (a ferramenta Gmail será incluída)
ferramentas_enterprise = CrewaiEnterpriseTools(
    enterprise_token="seu_token_enterprise"
enterprise_tools = CrewaiEnterpriseTools(
    enterprise_token="your_enterprise_token"
)
# imprima as ferramentas
printf(ferramentas_enterprise)
print(enterprise_tools)

# Crie um agente com capacidades do Gmail
agente_email = Agent(
    role="Gerente de E-mails",
    goal="Gerenciar e organizar comunicações por e-mail",
    backstory="Um assistente de IA especializado em gestão de e-mails e comunicação.",
    tools=ferramentas_enterprise
email_agent = Agent(
    role="Email Manager",
    goal="Manage and organize email communications",
    backstory="An AI assistant specialized in email management and communication.",
    tools=enterprise_tools
)

# Tarefa para enviar um e-mail
tarefa_email = Task(
    description="Redigir e enviar um e-mail de acompanhamento para john@example.com sobre a atualização do projeto",
    agent=agente_email,
    expected_output="Confirmação de que o e-mail foi enviado com sucesso"
email_task = Task(
    description="Draft and send a follow-up email to john@example.com about the project update",
    agent=email_agent,
    expected_output="Confirmation that email was sent successfully"
)

# Execute a tarefa
crew = Crew(
    agents=[agente_email],
    tasks=[tarefa_email]
    agents=[email_agent],
    tasks=[email_task]
)

# Execute o crew
@@ -125,23 +125,23 @@ enterprise_tools = CrewaiEnterpriseTools(
)
gmail_tool = enterprise_tools["gmail_find_email"]

agente_gmail = Agent(
    role="Gerente do Gmail",
    goal="Gerenciar comunicações e notificações do gmail",
    backstory="Um assistente de IA que ajuda a coordenar comunicações no gmail.",
gmail_agent = Agent(
    role="Gmail Manager",
    goal="Manage gmail communications and notifications",
    backstory="An AI assistant that helps coordinate gmail communications.",
    tools=[gmail_tool]
)

tarefa_notificacao = Task(
    description="Encontrar o e-mail de john@example.com",
    agent=agente_gmail,
    expected_output="E-mail encontrado de john@example.com"
notification_task = Task(
    description="Find the email from john@example.com",
    agent=gmail_agent,
    expected_output="Email found from john@example.com"
)

# Execute a tarefa
crew = Crew(
    agents=[agente_gmail],
    tasks=[tarefa_notificacao]
    agents=[gmail_agent],
    tasks=[notification_task]
)
```

@@ -30,7 +30,7 @@ Antes de usar o Repositório de Ferramentas, certifique-se de que você possui:
To install a tool:

```bash
crewai tool install <nome-da-ferramenta>
crewai tool install <tool-name>
```

This installs the tool and adds it to `pyproject.toml`.
@@ -40,7 +40,7 @@ Isso instala a ferramenta e a adiciona ao `pyproject.toml`.

To create a new tool project:

```bash
crewai tool create <nome-da-ferramenta>
crewai tool create <tool-name>
```

This scaffolds a structured tool project locally.
@@ -76,7 +76,7 @@ Para atualizar uma ferramenta publicada:
3. Commit the changes and publish

```bash
git commit -m "Atualizar versão para 0.1.1"
git commit -m "Update version to 0.1.1"
crewai tool publish
```

@@ -12,17 +12,16 @@ O Enterprise Event Streaming permite que você receba atualizações em tempo re
|
||||
|
||||
Ao utilizar a API Kickoff, inclua um objeto `webhooks` em sua requisição, por exemplo:
|
||||
|
||||
# Exemplo de uso da API Kickoff com webhooks
|
||||
```json
|
||||
{
|
||||
"inputs": {"foo": "bar"},
|
||||
"webhooks": {
|
||||
"events": ["crew_kickoff_started", "llm_call_started"],
|
||||
"url": "https://seu.endpoint/webhook",
|
||||
"url": "https://your.endpoint/webhook",
|
||||
"realtime": false,
|
||||
"authentication": {
|
||||
"strategy": "bearer",
|
||||
"token": "meu-token-secreto"
|
||||
"token": "my-secret-token"
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -34,20 +33,19 @@ Se `realtime` estiver definido como `true`, cada evento será entregue individualmente

Cada webhook envia uma lista de eventos:

# Exemplo de evento enviado pelo webhook
```json
{
  "events": [
    {
      "id": "id-do-evento",
      "execution_id": "id-da-execucao-do-crew",
      "id": "event-id",
      "execution_id": "crew-run-id",
      "timestamp": "2025-02-16T10:58:44.965Z",
      "type": "llm_call_started",
      "data": {
        "model": "gpt-4",
        "messages": [
          {"role": "system", "content": "Você é um assistente."},
          {"role": "user", "content": "Resuma este artigo."}
          {"role": "system", "content": "You are an assistant."},
          {"role": "user", "content": "Summarize this article."}
        ]
      }
    }
  ]
}
```
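
A minimal sketch of a receiver for payloads of this shape, assuming the `bearer` strategy configured above; the framework choice and route are illustrative, not part of the documented API:

```python
from flask import Flask, abort, request  # Flask is an illustrative choice

app = Flask(__name__)
EXPECTED_TOKEN = "my-secret-token"  # must match the token sent in the kickoff request

@app.route("/webhook", methods=["POST"])
def handle_events():
    # With the bearer strategy, each delivery should carry this header.
    if request.headers.get("Authorization") != f"Bearer {EXPECTED_TOKEN}":
        abort(401)
    # Each delivery is a batch: a JSON object with an "events" list.
    for event in request.get_json().get("events", []):
        print(event["type"], event["execution_id"], event["timestamp"])
    return "", 204
```
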
@@ -41,8 +41,11 @@ A CLI fornece a maneira mais rápida de implantar crews desenvolvidos localmente
Primeiro, você precisa autenticar sua CLI com a plataforma CrewAI Enterprise:

```bash
# Se já possui uma conta CrewAI Enterprise, ou deseja criar uma:
# Se já possui uma conta CrewAI Enterprise
crewai login

# Se vai criar uma nova conta
crewai signup
```

Ao executar qualquer um dos comandos, a CLI irá:

@@ -16,17 +16,17 @@ from crewai import CrewBase
from crewai.project import before_kickoff

@CrewBase
class MinhaEquipe:
class MyCrew:
    @before_kickoff
    def preparar_dados(self, entradas):
        # Pré-processa ou modifica as entradas
        entradas['processado'] = True
        return entradas
    def prepare_data(self, inputs):
        # Preprocess or modify inputs
        inputs['processed'] = True
        return inputs

    #...
```

Neste exemplo, a função preparar_dados modifica as entradas adicionando um novo par chave-valor indicando que as entradas foram processadas.
Neste exemplo, a função prepare_data modifica as entradas adicionando um novo par chave-valor indicando que as entradas foram processadas.

## Hook Depois do Kickoff

@@ -39,17 +39,17 @@ from crewai import CrewBase
from crewai.project import after_kickoff

@CrewBase
class MinhaEquipe:
class MyCrew:
    @after_kickoff
    def registrar_resultados(self, resultado):
        # Registra ou modifica os resultados
        print("Execução da equipe concluída com resultado:", resultado)
        return resultado
    def log_results(self, result):
        # Log or modify the results
        print("Crew execution completed with result:", result)
        return result

    # ...
```

Na função `registrar_resultados`, os resultados da execução da crew são simplesmente impressos. Você pode estender isso para realizar operações mais complexas, como enviar notificações ou integrar com outros serviços.
Na função `log_results`, os resultados da execução da crew são simplesmente impressos. Você pode estender isso para realizar operações mais complexas, como enviar notificações ou integrar com outros serviços.

## Utilizando Ambos os Hooks

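Combining both decorators in a single crew class follows directly from the two examples above; a minimal sketch:

```python
from crewai import CrewBase
from crewai.project import after_kickoff, before_kickoff

@CrewBase
class MyCrew:
    @before_kickoff
    def prepare_data(self, inputs):
        # Runs before kickoff: enrich or validate the incoming inputs.
        inputs['processed'] = True
        return inputs

    @after_kickoff
    def log_results(self, result):
        # Runs after kickoff: inspect or post-process the final result.
        print("Crew execution completed with result:", result)
        return result

    # ...
```
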
@@ -77,9 +77,9 @@ search_tool = SerperDevTool()

# Inicialize o agente com opções avançadas
agent = Agent(
    role='Analista de Pesquisa',
    goal='Fornecer análises de mercado atualizadas',
    backstory='Um analista especialista com olhar atento para tendências de mercado.',
    role='Research Analyst',
    goal='Provide up-to-date market analysis',
    backstory='An expert analyst with a keen eye for market trends.',
    tools=[search_tool],
    memory=True,  # Ativa memória
    verbose=True,
@@ -98,9 +98,14 @@ eficiência dentro do ecossistema CrewAI. Se necessário, a delegação pode ser

```python Code
agent = Agent(
    role='Redator de Conteúdo',
    goal='Escrever conteúdo envolvente sobre tendências de mercado',
    backstory='Um redator experiente com expertise em análise de mercado.',
    role='Content Writer',
    goal='Write engaging content on market trends',
    backstory='A seasoned writer with expertise in market analysis.',
    allow_delegation=True  # Habilitando delegação
)
```
```

## Conclusão

Personalizar agentes no CrewAI definindo seus papéis, objetivos, histórias e ferramentas, juntamente com opções avançadas como personalização de modelo de linguagem, memória, ajustes de performance e preferências de delegação,
proporciona uma equipe de IA sofisticada e preparada para enfrentar desafios complexos.
@@ -45,17 +45,17 @@ from crewai import Crew, Agent, Task

# Create an agent with code execution enabled
coding_agent = Agent(
    role="Analista de Dados Python",
    goal="Analisar dados e fornecer insights usando Python",
    backstory="Você é um analista de dados experiente com fortes habilidades em Python.",
    role="Python Data Analyst",
    goal="Analyze data and provide insights using Python",
    backstory="You are an experienced data analyst with strong Python skills.",
    allow_code_execution=True
)

# Create a task that requires code execution
data_analysis_task = Task(
    description="Analise o conjunto de dados fornecido e calcule a idade média dos participantes. Idades: {ages}",
    description="Analyze the given dataset and calculate the average age of participants. Ages: {ages}",
    agent=coding_agent,
    expected_output="A idade média dos participantes."
    expected_output="The average age of the participants."
)

# Create a crew and add the task
@@ -83,23 +83,23 @@ from crewai import Crew, Agent, Task

# Create an agent with code execution enabled
coding_agent = Agent(
    role="Analista de Dados Python",
    goal="Analisar dados e fornecer insights usando Python",
    backstory="Você é um analista de dados experiente com fortes habilidades em Python.",
    role="Python Data Analyst",
    goal="Analyze data and provide insights using Python",
    backstory="You are an experienced data analyst with strong Python skills.",
    allow_code_execution=True
)

# Create tasks that require code execution
task_1 = Task(
    description="Analise o primeiro conjunto de dados e calcule a idade média dos participantes. Idades: {ages}",
    description="Analyze the first dataset and calculate the average age of participants. Ages: {ages}",
    agent=coding_agent,
    expected_output="A idade média dos participantes."
    expected_output="The average age of the participants."
)

task_2 = Task(
    description="Analise o segundo conjunto de dados e calcule a idade média dos participantes. Idades: {ages}",
    description="Analyze the second dataset and calculate the average age of participants. Ages: {ages}",
    agent=coding_agent,
    expected_output="A idade média dos participantes."
    expected_output="The average age of the participants."
)

# Create two crews and add tasks

@@ -43,11 +43,11 @@ try:
    with MCPServerAdapter(server_params_list) as aggregated_tools:
        print(f"Available aggregated tools: {[tool.name for tool in aggregated_tools]}")

        agente_multiservidor = Agent(
            role="Assistente Versátil",
            goal="Utilizar ferramentas de servidores MCP locais Stdio, remotos SSE e remotos HTTP.",
            backstory="Um agente de IA capaz de aproveitar um conjunto diversificado de ferramentas de múltiplas fontes.",
            tools=aggregated_tools,  # Todas as ferramentas estão disponíveis aqui
        multi_server_agent = Agent(
            role="Versatile Assistant",
            goal="Utilize tools from local Stdio, remote SSE, and remote HTTP MCP servers.",
            backstory="An AI agent capable of leveraging a diverse set of tools from multiple sources.",
            tools=aggregated_tools,  # All tools are available here
            verbose=True,
        )


@@ -73,10 +73,10 @@ server_params = {
with MCPServerAdapter(server_params) as mcp_tools:
    print(f"Available tools: {[tool.name for tool in mcp_tools]}")

    meu_agente = Agent(
        role="Usuário de Ferramentas MCP",
        goal="Utilizar ferramentas de um servidor MCP.",
        backstory="Posso conectar a servidores MCP e usar suas ferramentas.",
    my_agent = Agent(
        role="MCP Tool User",
        goal="Utilize tools from an MCP server.",
        backstory="I can connect to MCP servers and use their tools.",
        tools=mcp_tools,  # Passe as ferramentas carregadas para o seu agente
        reasoning=True,
        verbose=True
@@ -91,10 +91,10 @@ Este padrão geral mostra como integrar ferramentas. Para exemplos específicos
with MCPServerAdapter(server_params) as mcp_tools:
    print(f"Available tools: {[tool.name for tool in mcp_tools]}")

    meu_agente = Agent(
        role="Usuário de Ferramentas MCP",
        goal="Utilizar ferramentas de um servidor MCP.",
        backstory="Posso conectar a servidores MCP e usar suas ferramentas.",
    my_agent = Agent(
        role="MCP Tool User",
        goal="Utilize tools from an MCP server.",
        backstory="I can connect to MCP servers and use their tools.",
        tools=mcp_tools["tool_name"],  # Passe as ferramentas filtradas para o seu agente
        reasoning=True,
        verbose=True

@@ -37,24 +37,24 @@ try:
    print(f"Available tools from SSE MCP server: {[tool.name for tool in tools]}")

    # Example: Using a tool from the SSE MCP server
    agente_sse = Agent(
        role="Usuário de Serviço Remoto",
        goal="Utilizar uma ferramenta fornecida por um servidor MCP remoto via SSE.",
        backstory="Um agente de IA que conecta a serviços externos via SSE.",
    sse_agent = Agent(
        role="Remote Service User",
        goal="Utilize a tool provided by a remote SSE MCP server.",
        backstory="An AI agent that connects to external services via SSE.",
        tools=tools,
        reasoning=True,
        verbose=True,
    )

    sse_task = Task(
        description="Buscar atualizações em tempo real das ações 'AAPL' usando uma ferramenta SSE.",
        expected_output="O preço mais recente da ação AAPL.",
        agent=agente_sse,
        description="Fetch real-time stock updates for 'AAPL' using an SSE tool.",
        expected_output="The latest stock price for AAPL.",
        agent=sse_agent,
        markdown=True
    )

    sse_crew = Crew(
        agents=[agente_sse],
        agents=[sse_agent],
        tasks=[sse_task],
        verbose=True,
        process=Process.sequential
@@ -101,16 +101,16 @@ try:
    print(f"Available tools (manual SSE): {[tool.name for tool in tools]}")

    manual_sse_agent = Agent(
        role="Analista Remoto de Dados",
        goal="Analisar dados obtidos de um servidor MCP remoto SSE usando gerenciamento manual de conexão.",
        backstory="Um agente de IA especializado em gerenciar conexões SSE explicitamente.",
        role="Remote Data Analyst",
        goal="Analyze data fetched from a remote SSE MCP server using manual connection management.",
        backstory="An AI skilled in handling SSE connections explicitly.",
        tools=tools,
        verbose=True
    )

    analysis_task = Task(
        description="Buscar e analisar as tendências mais recentes de atividade de usuários do servidor SSE.",
        expected_output="Um relatório resumido das tendências de atividade dos usuários.",
        description="Fetch and analyze the latest user activity trends from the SSE server.",
        expected_output="A summary report of user activity trends.",
        agent=manual_sse_agent
    )


@@ -38,24 +38,24 @@ with MCPServerAdapter(server_params) as tools:
    print(f"Available tools from Stdio MCP server: {[tool.name for tool in tools]}")

    # Exemplo: Usando as ferramentas do servidor MCP Stdio em um Agente CrewAI
    pesquisador_local = Agent(
        role="Processador Local de Dados",
        goal="Processar dados usando uma ferramenta local baseada em Stdio.",
        backstory="Uma IA que utiliza scripts locais via MCP para tarefas especializadas.",
    research_agent = Agent(
        role="Local Data Processor",
        goal="Process data using a local Stdio-based tool.",
        backstory="An AI that leverages local scripts via MCP for specialized tasks.",
        tools=tools,
        reasoning=True,
        verbose=True,
    )

    processing_task = Task(
        description="Processar o arquivo de dados de entrada 'data.txt' e resumir seu conteúdo.",
        expected_output="Um resumo dos dados processados.",
        agent=pesquisador_local,
        description="Process the input data file 'data.txt' and summarize its contents.",
        expected_output="A summary of the processed data.",
        agent=research_agent,
        markdown=True
    )

    data_crew = Crew(
        agents=[pesquisador_local],
        agents=[research_agent],
        tasks=[processing_task],
        verbose=True,
        process=Process.sequential
@@ -95,16 +95,16 @@ try:

    # Exemplo: Usando as ferramentas com sua configuração de Agent, Task, Crew
    manual_agent = Agent(
        role="Executor Local de Tarefas",
        goal="Executar uma tarefa local específica usando uma ferramenta Stdio gerenciada manualmente.",
        backstory="Uma IA proficiente em controlar processos locais via MCP.",
        role="Local Task Executor",
        goal="Execute a specific local task using a manually managed Stdio tool.",
        backstory="An AI proficient in controlling local processes via MCP.",
        tools=tools,
        verbose=True
    )

    manual_task = Task(
        description="Executar o comando 'perform_analysis' via ferramenta Stdio.",
        expected_output="Resultados da análise.",
        description="Execute the 'perform_analysis' command via the Stdio tool.",
        expected_output="Results of the analysis.",
        agent=manual_agent
    )


@@ -35,22 +35,22 @@ try:
    with MCPServerAdapter(server_params) as tools:
        print(f"Available tools from Streamable HTTP MCP server: {[tool.name for tool in tools]}")

        agente_http = Agent(
            role="Integrador de Serviços HTTP",
            goal="Utilizar ferramentas de um servidor MCP remoto via Streamable HTTP.",
            backstory="Um agente de IA especializado em interagir com serviços web complexos.",
        http_agent = Agent(
            role="HTTP Service Integrator",
            goal="Utilize tools from a remote MCP server via Streamable HTTP.",
            backstory="An AI agent adept at interacting with complex web services.",
            tools=tools,
            verbose=True,
        )

        http_task = Task(
            description="Realizar uma consulta de dados complexa usando uma ferramenta do servidor Streamable HTTP.",
            expected_output="O resultado da consulta de dados complexa.",
            agent=agente_http,
            description="Perform a complex data query using a tool from the Streamable HTTP server.",
            expected_output="The result of the complex data query.",
            agent=http_agent,
        )

        http_crew = Crew(
            agents=[agente_http],
            agents=[http_agent],
            tasks=[http_task],
            verbose=True,
            process=Process.sequential
@@ -91,16 +91,16 @@ try:
    print(f"Available tools (manual Streamable HTTP): {[tool.name for tool in tools]}")

    manual_http_agent = Agent(
        role="Usuário Avançado de Serviços Web",
        goal="Interagir com um servidor MCP usando conexões HTTP Streamable gerenciadas manualmente.",
        backstory="Um especialista em IA em ajustar integrações baseadas em HTTP.",
        role="Advanced Web Service User",
        goal="Interact with an MCP server using manually managed Streamable HTTP connections.",
        backstory="An AI specialist in fine-tuning HTTP-based service integrations.",
        tools=tools,
        verbose=True
    )

    data_processing_task = Task(
        description="Enviar dados para processamento e recuperar resultados via Streamable HTTP.",
        expected_output="Dados processados ou confirmação.",
        description="Submit data for processing and retrieve results via Streamable HTTP.",
        expected_output="Processed data or confirmation.",
        agent=manual_http_agent
    )


@@ -78,40 +78,47 @@ CrewAIInstrumentor().instrument(skip_dep_check=True, tracer_provider=tracer_prov
search_tool = SerperDevTool()

# Defina seus agentes com papéis e objetivos
pesquisador = Agent(
    role="Analista Sênior de Pesquisa",
    goal="Descobrir os avanços mais recentes em IA e ciência de dados",
    backstory="""
    Você trabalha em um importante think tank de tecnologia. Sua especialidade é identificar tendências emergentes. Você tem habilidade para dissecar dados complexos e apresentar insights acionáveis.
    """,
researcher = Agent(
    role="Senior Research Analyst",
    goal="Uncover cutting-edge developments in AI and data science",
    backstory="""You work at a leading tech think tank.
    Your expertise lies in identifying emerging trends.
    You have a knack for dissecting complex data and presenting actionable insights.""",
    verbose=True,
    allow_delegation=False,
    # You can pass an optional llm attribute specifying what model you wanna use.
    # llm=ChatOpenAI(model_name="gpt-3.5", temperature=0.7),
    tools=[search_tool],
)
writer = Agent(
    role="Estrategista de Conteúdo Técnico",
    goal="Criar conteúdo envolvente sobre avanços tecnológicos",
    backstory="Você é um Estrategista de Conteúdo renomado, conhecido por seus artigos perspicazes e envolventes. Você transforma conceitos complexos em narrativas atraentes.",
    role="Tech Content Strategist",
    goal="Craft compelling content on tech advancements",
    backstory="""You are a renowned Content Strategist, known for your insightful and engaging articles.
    You transform complex concepts into compelling narratives.""",
    verbose=True,
    allow_delegation=True,
)

# Crie tarefas para seus agentes
task1 = Task(
    description="Realize uma análise abrangente dos avanços mais recentes em IA em 2024. Identifique tendências-chave, tecnologias inovadoras e impactos potenciais na indústria.",
    expected_output="Relatório analítico completo em tópicos",
    agent=pesquisador,
    description="""Conduct a comprehensive analysis of the latest advancements in AI in 2024.
    Identify key trends, breakthrough technologies, and potential industry impacts.""",
    expected_output="Full analysis report in bullet points",
    agent=researcher,
)

task2 = Task(
    description="Utilizando os insights fornecidos, desenvolva um blog envolvente destacando os avanços mais significativos em IA. O post deve ser informativo e acessível, voltado para um público técnico. Dê um tom interessante, evite palavras complexas para não soar como IA.",
    expected_output="Post de blog completo com pelo menos 4 parágrafos",
    description="""Using the insights provided, develop an engaging blog
    post that highlights the most significant AI advancements.
    Your post should be informative yet accessible, catering to a tech-savvy audience.
    Make it sound cool, avoid complex words so it doesn't sound like AI.""",
    expected_output="Full blog post of at least 4 paragraphs",
    agent=writer,
)

# Instancie seu crew com um processo sequencial
crew = Crew(
    agents=[pesquisador, writer], tasks=[task1, task2], verbose=1, process=Process.sequential
    agents=[researcher, writer], tasks=[task1, task2], verbose=1, process=Process.sequential
)

# Coloque seu crew para trabalhar!

@@ -76,20 +76,20 @@ from crewai_tools import (

web_rag_tool = WebsiteSearchTool()

escritor = Agent(
    role="Escritor",
    goal="Você torna a matemática envolvente e compreensível para crianças pequenas através de poesias",
    backstory="Você é especialista em escrever haicais mas não sabe nada de matemática.",
    tools=[web_rag_tool],
)
writer = Agent(
    role="Writer",
    goal="Você torna a matemática envolvente e compreensível para crianças pequenas através de poesias",
    backstory="Você é especialista em escrever haicais mas não sabe nada de matemática.",
    tools=[web_rag_tool],
)

tarefa = Task(description=("O que é {multiplicação}?"),
              expected_output=("Componha um haicai que inclua a resposta."),
              agent=escritor)
task = Task(description=("O que é {multiplicação}?"),
            expected_output=("Componha um haicai que inclua a resposta."),
            agent=writer)

equipe = Crew(
    agents=[escritor],
    tasks=[tarefa],
crew = Crew(
    agents=[writer],
    tasks=[task],
    share_crew=False
)
```

@@ -35,7 +35,7 @@ Essa integração permite o registro de hiperparâmetros, o monitoramento de reg

```python
from langtrace_python_sdk import langtrace
langtrace.init(api_key='<SUA_CHAVE_LANGTRACE>')
langtrace.init(api_key='<LANGTRACE_API_KEY>')

# Agora importe os módulos do CrewAI
from crewai import Agent, Task, Crew

@@ -73,24 +73,26 @@ instrument_crewai(logger)
### 4. Crie e execute sua aplicação CrewAI normalmente

```python
pesquisador = Agent(
    role='Pesquisador Sênior',
    goal='Descobrir os avanços mais recentes em IA',
    backstory="Você é um pesquisador especialista em um think tank de tecnologia...",

# Crie seu agente
researcher = Agent(
    role='Senior Research Analyst',
    goal='Uncover cutting-edge developments in AI',
    backstory="You are an expert researcher at a tech think tank...",
    verbose=True,
    llm=llm
)

# Defina a tarefa
research_task = Task(
    description="Pesquise os avanços mais recentes em IA...",
    description="Research the latest AI advancements...",
    expected_output="",
    agent=pesquisador
    agent=researcher
)

# Configure e execute a crew
crew = Crew(
    agents=[pesquisador],
    agents=[researcher],
    tasks=[research_task],
    verbose=True
)

@@ -70,19 +70,22 @@ O tracing fornece uma forma de registrar os inputs, outputs e metadados associad

class TripAgents:
    def city_selection_agent(self):
        especialista_cidades = Agent(
            role="Especialista em Seleção de Cidades",
            goal="Selecionar a melhor cidade com base no clima, estação e preços",
            backstory="Especialista em analisar dados de viagem para escolher destinos ideais",
            tools=[search_tool],
        return Agent(
            role="City Selection Expert",
            goal="Select the best city based on weather, season, and prices",
            backstory="An expert in analyzing travel data to pick ideal destinations",
            tools=[
                search_tool,
            ],
            verbose=True,
        )

    def local_expert(self):
        especialista_local = Agent(
            role="Especialista Local nesta cidade",
            goal="Fornecer as MELHORES informações sobre a cidade selecionada",
            backstory="Um guia local experiente com amplo conhecimento sobre a cidade, suas atrações e costumes",
        return Agent(
            role="Local Expert at this city",
            goal="Provide the BEST insights about the selected city",
            backstory="""A knowledgeable local guide with extensive information
            about the city, it's attractions and customs""",
            tools=[search_tool],
            verbose=True,
        )
@@ -93,36 +96,53 @@ O tracing fornece uma forma de registrar os inputs, outputs e metadados associad
        return Task(
            description=dedent(
                f"""
                Analise e selecione a melhor cidade para a viagem com base em critérios específicos como padrões climáticos, eventos sazonais e custos de viagem. Esta tarefa envolve comparar várias cidades, considerando fatores como condições climáticas atuais, eventos culturais ou sazonais e despesas gerais de viagem.
                Sua resposta final deve ser um relatório detalhado sobre a cidade escolhida e tudo o que você descobriu sobre ela, incluindo custos reais de voo, previsão do tempo e atrações.
                Analyze and select the best city for the trip based
                on specific criteria such as weather patterns, seasonal
                events, and travel costs. This task involves comparing
                multiple cities, considering factors like current weather
                conditions, upcoming cultural or seasonal events, and
                overall travel expenses.
                Your final answer must be a detailed
                report on the chosen city, and everything you found out
                about it, including the actual flight costs, weather
                forecast and attractions.

                Saindo de: {origin}
                Opções de cidades: {cities}
                Data da viagem: {range}
                Interesses do viajante: {interests}
                Traveling from: {origin}
                City Options: {cities}
                Trip Date: {range}
                Traveler Interests: {interests}
                """
            ),
            agent=agent,
            expected_output="Relatório detalhado sobre a cidade escolhida incluindo custos de voo, previsão do tempo e atrações",
            expected_output="Detailed report on the chosen city including flight costs, weather forecast, and attractions",
        )

    def gather_task(self, agent, origin, interests, range):
        return Task(
            description=dedent(
                f"""
                Como especialista local nesta cidade, você deve compilar um guia aprofundado para alguém que está viajando para lá e quer ter a MELHOR viagem possível!
                Reúna informações sobre principais atrações, costumes locais, eventos especiais e recomendações de atividades diárias.
                Encontre os melhores lugares para ir, aqueles que só um local conhece.
                Este guia deve fornecer uma visão abrangente do que a cidade tem a oferecer, incluindo joias escondidas, pontos culturais, marcos imperdíveis, previsão do tempo e custos gerais.
                A resposta final deve ser um guia completo da cidade, rico em insights culturais e dicas práticas, adaptado para aprimorar a experiência de viagem.
                As a local expert on this city you must compile an
                in-depth guide for someone traveling there and wanting
                to have THE BEST trip ever!
                Gather information about key attractions, local customs,
                special events, and daily activity recommendations.
                Find the best spots to go to, the kind of place only a
                local would know.
                This guide should provide a thorough overview of what
                the city has to offer, including hidden gems, cultural
                hotspots, must-visit landmarks, weather forecasts, and
                high level costs.
                The final answer must be a comprehensive city guide,
                rich in cultural insights and practical tips,
                tailored to enhance the travel experience.

                Data da viagem: {range}
                Saindo de: {origin}
                Interesses do viajante: {interests}
                Trip Date: {range}
                Traveling from: {origin}
                Traveler Interests: {interests}
                """
            ),
            agent=agent,
            expected_output="Guia completo da cidade incluindo joias escondidas, pontos culturais e dicas práticas",
            expected_output="Comprehensive city guide including hidden gems, cultural hotspots, and practical travel tips",
        )


@@ -169,7 +189,7 @@ O tracing fornece uma forma de registrar os inputs, outputs e metadados associad
trip_crew = TripCrew("California", "Tokyo", "Dec 12 - Dec 20", "sports")
result = trip_crew.run()

print("Resultado da equipe:", result)
print(result)
```
Consulte a [Documentação de Tracing do MLflow](https://mlflow.org/docs/latest/llms/tracing/index.html) para mais configurações e casos de uso.
</Step>

@@ -69,10 +69,10 @@ Essa configuração permite acompanhar hiperparâmetros e monitorar problemas de

openlit.init(disable_metrics=True)
# Definir seus agentes
pesquisador = Agent(
    role="Pesquisador",
    goal="Realizar pesquisas e análises aprofundadas sobre IA e agentes de IA",
    backstory="Você é um pesquisador especialista em tecnologia, engenharia de software, IA e startups. Trabalha como freelancer e está atualmente pesquisando para um novo cliente.",
researcher = Agent(
    role="Researcher",
    goal="Conduct thorough research and analysis on AI and AI agents",
    backstory="You're an expert researcher, specialized in technology, software engineering, AI, and startups. You work as a freelancer and are currently researching for a new client.",
    allow_delegation=False,
    llm='command-r'
)
@@ -80,24 +80,24 @@ Essa configuração permite acompanhar hiperparâmetros e monitorar problemas de

# Definir sua task
task = Task(
    description="Gere uma lista com 5 ideias interessantes para um artigo e escreva um parágrafo cativante para cada ideia, mostrando o potencial de um artigo completo sobre o tema. Retorne a lista de ideias com seus parágrafos e suas anotações.",
    expected_output="5 tópicos, cada um com um parágrafo e notas complementares.",
    description="Generate a list of 5 interesting ideas for an article, then write one captivating paragraph for each idea that showcases the potential of a full article on this topic. Return the list of ideas with their paragraphs and your notes.",
    expected_output="5 bullet points, each with a paragraph and accompanying notes.",
)

# Definir o agente gerente
gerente = Agent(
    role="Gerente de Projeto",
    goal="Gerenciar eficientemente a equipe e garantir a conclusão de tarefas de alta qualidade",
    backstory="Você é um gerente de projetos experiente, habilidoso em supervisionar projetos complexos e guiar equipes para o sucesso. Sua função é coordenar os esforços dos membros da equipe, garantindo que cada tarefa seja concluída no prazo e com o mais alto padrão.",
manager = Agent(
    role="Project Manager",
    goal="Efficiently manage the crew and ensure high-quality task completion",
    backstory="You're an experienced project manager, skilled in overseeing complex projects and guiding teams to success. Your role is to coordinate the efforts of the crew members, ensuring that each task is completed on time and to the highest standard.",
    allow_delegation=True,
    llm='command-r'
)

# Instanciar sua crew com um manager personalizado
crew = Crew(
    agents=[pesquisador],
    agents=[researcher],
    tasks=[task],
    manager_agent=gerente,
    manager_agent=manager,
    process=Process.hierarchical,
)

@@ -132,18 +132,18 @@ Essa configuração permite acompanhar hiperparâmetros e monitorar problemas de

# Criar um agente com execução de código habilitada
coding_agent = Agent(
    role="Analista de Dados Python",
    goal="Analisar dados e fornecer insights usando Python",
    backstory="Você é um analista de dados experiente com fortes habilidades em Python.",
    role="Python Data Analyst",
    goal="Analyze data and provide insights using Python",
    backstory="You are an experienced data analyst with strong Python skills.",
    allow_code_execution=True,
    llm="command-r"
)

# Criar uma task que exige execução de código
data_analysis_task = Task(
    description="Analise o conjunto de dados fornecido e calcule a idade média dos participantes. Idades: {ages}",
    description="Analyze the given dataset and calculate the average age of participants. Ages: {ages}",
    agent=coding_agent,
    expected_output="5 tópicos, cada um com um parágrafo e notas complementares.",
    expected_output="5 bullet points, each with a paragraph and accompanying notes.",
)

# Criar uma crew e adicionar a task

@@ -58,43 +58,43 @@ Neste guia, utilizaremos o exemplo de início rápido da CrewAI.
from crewai import Agent, Crew, Task, Process


class NomeDaEquipe:
    def agente_um(self) -> Agent:
class YourCrewName:
    def agent_one(self) -> Agent:
        return Agent(
            role="Analista de Dados",
            goal="Analisar tendências de dados no mercado",
            backstory="Analista de dados experiente com formação em economia",
            role="Data Analyst",
            goal="Analyze data trends in the market",
            backstory="An experienced data analyst with a background in economics",
            verbose=True,
        )

    def agente_dois(self) -> Agent:
    def agent_two(self) -> Agent:
        return Agent(
            role="Pesquisador de Mercado",
            goal="Coletar informações sobre a dinâmica do mercado",
            backstory="Pesquisador dedicado com olhar atento para detalhes",
            role="Market Researcher",
            goal="Gather information on market dynamics",
            backstory="A diligent researcher with a keen eye for detail",
            verbose=True,
        )

    def tarefa_um(self) -> Task:
    def task_one(self) -> Task:
        return Task(
            name="Tarefa de Coleta de Dados",
            description="Coletar dados recentes do mercado e identificar tendências.",
            expected_output="Um relatório resumindo as principais tendências do mercado.",
            agent=self.agente_um(),
            name="Collect Data Task",
            description="Collect recent market data and identify trends.",
            expected_output="A report summarizing key trends in the market.",
            agent=self.agent_one(),
        )

    def tarefa_dois(self) -> Task:
    def task_two(self) -> Task:
        return Task(
            name="Tarefa de Pesquisa de Mercado",
            description="Pesquisar fatores que afetam a dinâmica do mercado.",
            expected_output="Uma análise dos fatores que influenciam o mercado.",
            agent=self.agente_dois(),
            name="Market Research Task",
            description="Research factors affecting market dynamics.",
            expected_output="An analysis of factors influencing the market.",
            agent=self.agent_two(),
        )

    def equipe(self) -> Crew:
    def crew(self) -> Crew:
        return Crew(
            agents=[self.agente_um(), self.agente_dois()],
            tasks=[self.tarefa_um(), self.tarefa_dois()],
            agents=[self.agent_one(), self.agent_two()],
            tasks=[self.task_one(), self.task_two()],
            process=Process.sequential,
            verbose=True,
        )
@@ -108,7 +108,7 @@ Neste guia, utilizaremos o exemplo de início rápido da CrewAI.

track_crewai(project_name="crewai-integration-demo")

my_crew = NomeDaEquipe().equipe()
my_crew = YourCrewName().crew()
result = my_crew.kickoff()

print(result)

@@ -64,17 +64,17 @@ patronus_eval_tool = PatronusEvalTool()

# Define an agent that uses the tool
coding_agent = Agent(
    role="Agente de Programação",
    goal="Gerar código de alta qualidade e verificar se a saída é código",
    backstory="Um programador experiente que pode gerar código Python de alta qualidade.",
    role="Coding Agent",
    goal="Generate high quality code and verify that the output is code",
    backstory="An experienced coder who can generate high quality python code.",
    tools=[patronus_eval_tool],
    verbose=True,
)

# Example task to generate and evaluate code
generate_code_task = Task(
    description="Crie um programa simples para gerar os N primeiros números da sequência de Fibonacci. Selecione o avaliador e os critérios mais apropriados para avaliar sua saída.",
    expected_output="Programa que gera os N primeiros números da sequência de Fibonacci.",
    description="Create a simple program to generate the first N numbers in the Fibonacci sequence. Select the most appropriate evaluator and criteria for evaluating your output.",
    expected_output="Program that generates the first N numbers in the Fibonacci sequence.",
    agent=coding_agent,
)

@@ -98,17 +98,17 @@ patronus_eval_tool = PatronusPredefinedCriteriaEvalTool(

# Define an agent that uses the tool
coding_agent = Agent(
    role="Agente de Programação",
    goal="Gerar código de alta qualidade",
    backstory="Um programador experiente que pode gerar código Python de alta qualidade.",
    role="Coding Agent",
    goal="Generate high quality code",
    backstory="An experienced coder who can generate high quality python code.",
    tools=[patronus_eval_tool],
    verbose=True,
)

# Example task to generate code
generate_code_task = Task(
    description="Crie um programa simples para gerar os N primeiros números da sequência de Fibonacci.",
    expected_output="Programa que gera os N primeiros números da sequência de Fibonacci.",
    description="Create a simple program to generate the first N numbers in the Fibonacci sequence.",
    expected_output="Program that generates the first N numbers in the Fibonacci sequence.",
    agent=coding_agent,
)

@@ -149,17 +149,17 @@ patronus_eval_tool = PatronusLocalEvaluatorTool(

# Define an agent that uses the tool
coding_agent = Agent(
    role="Agente de Programação",
    goal="Gerar código de alta qualidade",
    backstory="Um programador experiente que pode gerar código Python de alta qualidade.",
    role="Coding Agent",
    goal="Generate high quality code",
    backstory="An experienced coder who can generate high quality python code.",
    tools=[patronus_eval_tool],
    verbose=True,
)

# Example task to generate code
generate_code_task = Task(
    description="Crie um programa simples para gerar os N primeiros números da sequência de Fibonacci.",
    expected_output="Programa que gera os N primeiros números da sequência de Fibonacci.",
    description="Create a simple program to generate the first N numbers in the Fibonacci sequence.",
    expected_output="Program that generates the first N numbers in the Fibonacci sequence.",
    agent=coding_agent,
)


@@ -50,48 +50,48 @@ O Weave captura automaticamente rastreamentos (traces) de suas aplicações Crew
llm = LLM(model="gpt-4o", temperature=0)

# Crie os agentes
pesquisador = Agent(
    role='Analista de Pesquisa',
    goal='Encontrar e analisar as melhores oportunidades de investimento',
    backstory='Especialista em análise financeira e pesquisa de mercado',
researcher = Agent(
    role='Research Analyst',
    goal='Find and analyze the best investment opportunities',
    backstory='Expert in financial analysis and market research',
    llm=llm,
    verbose=True,
    allow_delegation=False,
)

redator = Agent(
    role='Redator de Relatórios',
    goal='Escrever relatórios de investimento claros e concisos',
    backstory='Experiente na criação de relatórios financeiros detalhados',
writer = Agent(
    role='Report Writer',
    goal='Write clear and concise investment reports',
    backstory='Experienced in creating detailed financial reports',
    llm=llm,
    verbose=True,
    allow_delegation=False,
)

# Crie as tarefas
pesquisa = Task(
    description='Pesquisa aprofundada sobre o {tema}',
    expected_output='Dados de mercado abrangentes incluindo principais players, tamanho de mercado e tendências de crescimento.',
    agent=pesquisador
research_task = Task(
    description='Deep research on the {topic}',
    expected_output='Comprehensive market data including key players, market size, and growth trends.',
    agent=researcher
)

redacao = Task(
    description='Escreva um relatório detalhado com base na pesquisa',
    expected_output='O relatório deve ser fácil de ler e entender. Use tópicos quando aplicável.',
    agent=redator
writing_task = Task(
    description='Write a detailed report based on the research',
    expected_output='The report should be easy to read and understand. Use bullet points where applicable.',
    agent=writer
)

# Crie o crew
equipe = Crew(
    agents=[pesquisador, redator],
    tasks=[pesquisa, redacao],
crew = Crew(
    agents=[researcher, writer],
    tasks=[research_task, writing_task],
    verbose=True,
    process=Process.sequential,
)

# Execute o crew
resultado = equipe.kickoff(inputs={"tema": "IA em ciência dos materiais"})
print(resultado)
result = crew.kickoff(inputs={"topic": "AI in material science"})
print(result)
```
</Step>
<Step title="Visualize rastreamentos no Weave">

@@ -39,19 +39,23 @@ Siga os passos abaixo para começar a tripular! 🚣‍♂️
# src/latest_ai_development/config/agents.yaml
researcher:
  role: >
    Pesquisador Sênior de Dados em {topic}
    {topic} Senior Data Researcher
  goal: >
    Descobrir os avanços mais recentes em {topic}
    Uncover cutting-edge developments in {topic}
  backstory: >
    Você é um pesquisador experiente com talento para descobrir os últimos avanços em {topic}. Conhecido por sua habilidade em encontrar as informações mais relevantes e apresentá-las de forma clara e concisa.
    You're a seasoned researcher with a knack for uncovering the latest
    developments in {topic}. Known for your ability to find the most relevant
    information and present it in a clear and concise manner.

reporting_analyst:
  role: >
    Analista de Relatórios em {topic}
    {topic} Reporting Analyst
  goal: >
    Criar relatórios detalhados com base na análise de dados e descobertas de pesquisa em {topic}
    Create detailed reports based on {topic} data analysis and research findings
  backstory: >
    Você é um analista meticuloso com um olhar atento aos detalhes. É conhecido por sua capacidade de transformar dados complexos em relatórios claros e concisos, facilitando o entendimento e a tomada de decisão por parte dos outros.
    You're a meticulous analyst with a keen eye for detail. You're known for
    your ability to turn complex data into clear and concise reports, making
    it easy for others to understand and act on the information you provide.
```
</Step>
<Step title="Modifique seu arquivo `tasks.yaml`">
@@ -59,19 +63,20 @@ Siga os passos abaixo para começar a tripular! 🚣‍♂️
# src/latest_ai_development/config/tasks.yaml
research_task:
  description: >
    Realize uma pesquisa aprofundada sobre {topic}.
    Certifique-se de encontrar informações interessantes e relevantes considerando que o ano atual é 2025.
    Conduct a thorough research about {topic}
    Make sure you find any interesting and relevant information given
    the current year is 2025.
  expected_output: >
    Uma lista com 10 tópicos dos dados mais relevantes sobre {topic}
    A list with 10 bullet points of the most relevant information about {topic}
  agent: researcher

reporting_task:
  description: >
    Revise o contexto obtido e expanda cada tópico em uma seção completa para um relatório.
    Certifique-se de que o relatório seja detalhado e contenha todas as informações relevantes.
    Review the context you got and expand each topic into a full section for a report.
    Make sure the report is detailed and contains any and all relevant information.
  expected_output: >
    Um relatório completo com os principais tópicos, cada um com uma seção detalhada de informações.
    Formate como markdown sem usar '```'
    A fully fledge reports with the mains topics, each with a full section of information.
    Formatted as markdown without '```'
  agent: reporting_analyst
  output_file: report.md
```
@@ -117,15 +122,15 @@ Siga os passos abaixo para começar a tripular! 🚣‍♂️
def reporting_task(self) -> Task:
    return Task(
        config=self.tasks_config['reporting_task'],  # type: ignore[index]
        output_file='output/report.md'  # Este é o arquivo que conterá o relatório final.
        output_file='output/report.md'  # This is the file that will be contain the final report.
    )

@crew
def crew(self) -> Crew:
    """Creates the LatestAiDevelopment crew"""
    return Crew(
        agents=self.agents,  # Criado automaticamente pelo decorador @agent
        tasks=self.tasks,  # Criado automaticamente pelo decorador @task
        agents=self.agents,  # Automatically created by the @agent decorator
        tasks=self.tasks,  # Automatically created by the @task decorator
        process=Process.sequential,
        verbose=True,
    )
@@ -224,7 +229,7 @@ Siga os passos abaixo para começar a tripular! 🚣‍♂️

<CodeGroup>
```markdown output/report.md
# Relatório Abrangente sobre a Ascensão e o Impacto dos Agentes de IA em 2025
# Comprehensive Report on the Rise and Impact of AI Agents in 2025

## 1. Introduction to AI Agents
In 2025, Artificial Intelligence (AI) agents are at the forefront of innovation across various industries. As intelligent systems that can perform tasks typically requiring human cognition, AI agents are paving the way for significant advancements in operational efficiency, decision-making, and overall productivity within sectors like Human Resources (HR) and Finance. This report aims to detail the rise of AI agents, their frameworks, applications, and potential implications on the workforce.

@@ -35,18 +35,78 @@ from crewai_tools import LinkupSearchTool
from crewai import Agent
import os

# Inicialize a ferramenta com sua chave de API
linkup_ferramenta = LinkupSearchTool(api_key=os.getenv("LINKUP_API_KEY"))
# Initialize the tool with your API key
linkup_tool = LinkupSearchTool(api_key=os.getenv("LINKUP_API_KEY"))

# Defina um agente que usa a ferramenta
# Define an agent that uses the tool
@agent
def pesquisador(self) -> Agent:
def researcher(self) -> Agent:
    '''
    Este agente usa o LinkupSearchTool para recuperar informações contextuais
    da API do Linkup.
    This agent uses the LinkupSearchTool to retrieve contextual information
    from the Linkup API.
    '''
    return Agent(
        config=self.agentes_config["pesquisador"],
        tools=[linkup_ferramenta]
        config=self.agents_config["researcher"],
        tools=[linkup_tool]
    )
```
```

## Parâmetros

O `LinkupSearchTool` aceita os seguintes parâmetros:

### Parâmetros do Construtor
- **api_key**: Obrigatório. Sua chave de API do Linkup.

### Parâmetros de Execução
- **query**: Obrigatório. O termo ou frase de busca.
- **depth**: Opcional. A profundidade da busca. O padrão é "standard".
- **output_type**: Opcional. O tipo de saída. O padrão é "searchResults".

## Uso Avançado

Você pode personalizar os parâmetros de busca para resultados mais específicos:

```python Code
# Perform a search with custom parameters
results = linkup_tool.run(
    query="Women Nobel Prize Physics",
    depth="deep",
    output_type="searchResults"
)
```

## Formato de Retorno

A ferramenta retorna resultados no seguinte formato:

```json
{
  "success": true,
  "results": [
    {
      "name": "Result Title",
      "url": "https://example.com/result",
      "content": "Content of the result..."
    },
    // Additional results...
  ]
}
```

Se ocorrer um erro, a resposta será:

```json
{
  "success": false,
  "error": "Error message"
}
```

## Tratamento de Erros

A ferramenta lida com erros de API de forma amigável e fornece feedback estruturado. Se a requisição à API falhar, a ferramenta retornará um dicionário com `success: false` e uma mensagem de erro.

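A small sketch of how a caller might branch on that structure, using only the fields from the return format shown above (it assumes the tool returns this dictionary directly):

```python Code
# Hypothetical usage: inspect the structured response before consuming results.
results = linkup_tool.run(query="Women Nobel Prize Physics")
if results.get("success"):
    for item in results["results"]:
        print(item["name"], item["url"])
else:
    print("Linkup request failed:", results["error"])
```
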
## Conclusão

O `LinkupSearchTool` oferece uma forma integrada de incorporar as capacidades de busca de informações contextuais do Linkup aos seus agentes CrewAI. Ao utilizar esta ferramenta, os agentes podem acessar informações relevantes e atualizadas para aprimorar sua tomada de decisão e execução de tarefas.
@@ -1,16 +0,0 @@
|
||||
(function() {
|
||||
var clientID = 'e1256ea7e23318f';
|
||||
|
||||
var initReo = function() {
|
||||
Reo.init({
|
||||
clientID: clientID
|
||||
});
|
||||
};
|
||||
|
||||
var script = document.createElement('script');
|
||||
script.src = 'https://static.reo.dev/' + clientID + '/reo.js';
|
||||
script.defer = true;
|
||||
script.onload = initReo;
|
||||
|
||||
document.head.appendChild(script);
|
||||
})();
|
||||
@@ -11,7 +11,7 @@ dependencies = [
    # Core Dependencies
    "pydantic>=2.4.2",
    "openai>=1.13.3",
    "litellm==1.74.3",
    "litellm==1.72.0",
    "instructor>=1.3.3",
    # Text Processing
    "pdfplumber>=0.11.4",
@@ -27,19 +27,18 @@ dependencies = [
    "openpyxl>=3.1.5",
    "pyvis>=0.3.2",
    # Authentication and Security
    "auth0-python>=4.7.1",
    "python-dotenv>=1.0.0",
    "pyjwt>=2.9.0",
    # Configuration and Utils
    "click>=8.1.7",
    "appdirs>=1.4.4",
    "jsonref>=1.1.0",
    "json-repair==0.25.2",
    "json-repair>=0.25.2",
    "uv>=0.4.25",
    "tomli-w>=1.1.0",
    "tomli>=2.0.2",
    "blinker>=1.9.0",
    "json5>=0.10.0",
    "portalocker==2.7.0",
]

[project.urls]
@@ -48,11 +47,11 @@ Documentation = "https://docs.crewai.com"
Repository = "https://github.com/crewAIInc/crewAI"

[project.optional-dependencies]
tools = ["crewai-tools~=0.55.0"]
tools = ["crewai-tools~=0.48.0"]
embeddings = [
    "tiktoken~=0.8.0"
]
agentops = ["agentops==0.3.18"]
agentops = ["agentops>=0.3.0"]
pdfplumber = [
    "pdfplumber>=0.11.4",
]
@@ -84,8 +83,6 @@ dev-dependencies = [
    "pytest-recording>=0.13.2",
    "pytest-randomly>=3.16.0",
    "pytest-timeout>=2.3.1",
    "pytest-xdist>=3.6.1",
    "pytest-split>=0.9.0",
]

[project.scripts]
@@ -126,15 +123,3 @@ path = "src/crewai/__init__.py"
[build-system]
requires = ["hatchling"]
build-backend = "hatchling.build"

[tool.hatch.build.targets.wheel]
exclude = [
    "docs/**",
    "docs/",
]

[tool.hatch.build.targets.sdist]
exclude = [
    "docs/**",
    "docs/",
]

@@ -1,6 +1,4 @@
import warnings
import threading
import urllib.request

from crewai.agent import Agent
from crewai.crew import Crew
@@ -13,7 +11,6 @@ from crewai.process import Process
from crewai.task import Task
from crewai.tasks.llm_guardrail import LLMGuardrail
from crewai.tasks.task_output import TaskOutput
from crewai.telemetry.telemetry import Telemetry

warnings.filterwarnings(
    "ignore",
@@ -21,40 +18,7 @@ warnings.filterwarnings(
    category=UserWarning,
    module="pydantic.main",
)

_telemetry_submitted = False


def _track_install():
    """Track package installation/first-use via Scarf analytics."""
    global _telemetry_submitted

    if _telemetry_submitted or Telemetry._is_telemetry_disabled():
        return

    try:
        pixel_url = "https://api.scarf.sh/v2/packages/CrewAI/crewai/docs/00f2dad1-8334-4a39-934e-003b2e1146db"

        req = urllib.request.Request(pixel_url)
        req.add_header('User-Agent', f'CrewAI-Python/{__version__}')

        with urllib.request.urlopen(req, timeout=2):  # nosec B310
            _telemetry_submitted = True

    except Exception:
        pass


def _track_install_async():
    """Track installation in background thread to avoid blocking imports."""
    if not Telemetry._is_telemetry_disabled():
        thread = threading.Thread(target=_track_install, daemon=True)
        thread.start()


_track_install_async()

__version__ = "0.148.0"
__version__ = "0.134.0"
__all__ = [
    "Agent",
    "Crew",

|
||||
import shutil
|
||||
import subprocess
|
||||
import time
|
||||
from typing import (
|
||||
Any,
|
||||
Callable,
|
||||
Dict,
|
||||
List,
|
||||
Literal,
|
||||
Optional,
|
||||
Sequence,
|
||||
Tuple,
|
||||
Type,
|
||||
Union,
|
||||
)
|
||||
from typing import Any, Callable, Dict, List, Literal, Optional, Sequence, Tuple, Type, Union
|
||||
|
||||
from pydantic import Field, InstanceOf, PrivateAttr, model_validator
|
||||
|
||||
@@ -44,10 +32,6 @@ from crewai.utilities.events.agent_events import (
|
||||
AgentExecutionStartedEvent,
|
||||
)
|
||||
from crewai.utilities.events.crewai_event_bus import crewai_event_bus
|
||||
from crewai.utilities.events.memory_events import (
|
||||
MemoryRetrievalStartedEvent,
|
||||
MemoryRetrievalCompletedEvent,
|
||||
)
|
||||
from crewai.utilities.events.knowledge_events import (
|
||||
KnowledgeQueryCompletedEvent,
|
||||
KnowledgeQueryFailedEvent,
|
||||
@@ -87,12 +71,6 @@ class Agent(BaseAgent):
|
||||
"""
|
||||
|
||||
_times_executed: int = PrivateAttr(default=0)
|
||||
agent_executor: Optional[CrewAgentExecutor] = Field(
|
||||
default=None,
|
||||
init=False, # Not included in __init__ as it's created dynamically in create_agent_executor()
|
||||
exclude=True, # Excluded from serialization to avoid circular references
|
||||
description="The agent executor instance for running tasks. Created dynamically when needed.",
|
||||
)
|
||||
max_execution_time: Optional[int] = Field(
|
||||
default=None,
|
||||
description="Maximum execution time for an agent to execute a task",
|
||||
@@ -179,7 +157,7 @@ class Agent(BaseAgent):
|
||||
)
|
||||
guardrail: Optional[Union[Callable[[Any], Tuple[bool, Any]], str]] = Field(
|
||||
default=None,
|
||||
description="Function or string description of a guardrail to validate agent output",
|
||||
description="Function or string description of a guardrail to validate agent output"
|
||||
)
|
||||
guardrail_max_retries: int = Field(
|
||||
default=3, description="Maximum number of retries when guardrail fails"
|
||||
@@ -227,6 +205,7 @@ class Agent(BaseAgent):
|
||||
sources=self.knowledge_sources,
|
||||
embedder=self.embedder,
|
||||
collection_name=self.role,
|
||||
storage=self.knowledge_storage or None,
|
||||
)
|
||||
self.knowledge.add_sources()
|
||||
except (TypeError, ValueError) as e:
|
||||
@@ -323,15 +302,6 @@ class Agent(BaseAgent):
|
||||
)
|
||||
|
||||
if self._is_any_available_memory():
|
||||
crewai_event_bus.emit(
|
||||
self,
|
||||
event=MemoryRetrievalStartedEvent(
|
||||
task_id=str(task.id) if task else None,
|
||||
source_type="agent",
|
||||
),
|
||||
)
|
||||
|
||||
start_time = time.time()
|
||||
contextual_memory = ContextualMemory(
|
||||
self.crew.memory_config,
|
||||
self.crew._short_term_memory,
|
||||
@@ -343,21 +313,11 @@ class Agent(BaseAgent):
|
||||
memory = contextual_memory.build_context_for_task(task, context)
|
||||
if memory.strip() != "":
|
||||
task_prompt += self.i18n.slice("memory").format(memory=memory)
|
||||
|
||||
crewai_event_bus.emit(
|
||||
self,
|
||||
event=MemoryRetrievalCompletedEvent(
|
||||
task_id=str(task.id) if task else None,
|
||||
memory_content=memory,
|
||||
retrieval_time_ms=(time.time() - start_time) * 1000,
|
||||
source_type="agent",
|
||||
),
|
||||
)
|
||||
knowledge_config = (
|
||||
self.knowledge_config.model_dump() if self.knowledge_config else {}
|
||||
)
|
||||
|
||||
if self.knowledge or (self.crew and self.crew.knowledge):
|
||||
if self.knowledge:
|
||||
crewai_event_bus.emit(
|
||||
self,
|
||||
event=KnowledgeRetrievalStartedEvent(
|
||||
@@ -369,28 +329,25 @@ class Agent(BaseAgent):
|
||||
task_prompt
|
||||
)
|
||||
if self.knowledge_search_query:
|
||||
# Quering agent specific knowledge
|
||||
if self.knowledge:
|
||||
agent_knowledge_snippets = self.knowledge.query(
|
||||
[self.knowledge_search_query], **knowledge_config
|
||||
)
|
||||
if agent_knowledge_snippets:
|
||||
self.agent_knowledge_context = extract_knowledge_context(
|
||||
agent_knowledge_snippets
|
||||
)
|
||||
if self.agent_knowledge_context:
|
||||
task_prompt += self.agent_knowledge_context
|
||||
|
||||
# Quering crew specific knowledge
|
||||
knowledge_snippets = self.crew.query_knowledge(
|
||||
agent_knowledge_snippets = self.knowledge.query(
|
||||
[self.knowledge_search_query], **knowledge_config
|
||||
)
|
||||
if knowledge_snippets:
|
||||
self.crew_knowledge_context = extract_knowledge_context(
|
||||
knowledge_snippets
|
||||
if agent_knowledge_snippets:
|
||||
self.agent_knowledge_context = extract_knowledge_context(
|
||||
agent_knowledge_snippets
|
||||
)
|
||||
if self.crew_knowledge_context:
|
||||
task_prompt += self.crew_knowledge_context
|
||||
if self.agent_knowledge_context:
|
||||
task_prompt += self.agent_knowledge_context
|
||||
if self.crew:
|
||||
knowledge_snippets = self.crew.query_knowledge(
|
||||
[self.knowledge_search_query], **knowledge_config
|
||||
)
|
||||
if knowledge_snippets:
|
||||
self.crew_knowledge_context = extract_knowledge_context(
|
||||
knowledge_snippets
|
||||
)
|
||||
if self.crew_knowledge_context:
|
||||
task_prompt += self.crew_knowledge_context
|
||||
|
||||
crewai_event_bus.emit(
|
||||
self,
|
||||
@@ -547,11 +504,6 @@ class Agent(BaseAgent):
|
||||
Returns:
|
||||
The output of the agent.
|
||||
"""
|
||||
if not self.agent_executor:
|
||||
raise ValueError(
|
||||
"Agent executor not initialized. Call create_agent_executor() first."
|
||||
)
|
||||
|
||||
return self.agent_executor.invoke(
|
||||
{
|
||||
"input": task_prompt,
|
||||
@@ -823,7 +775,6 @@ class Agent(BaseAgent):
|
||||
LiteAgentOutput: The result of the agent execution.
|
||||
"""
|
||||
lite_agent = LiteAgent(
|
||||
id=self.id,
|
||||
role=self.role,
|
||||
goal=self.goal,
|
||||
backstory=self.backstory,
|
||||
|
||||
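The agent hunks above converge on one retrieval order: query the agent's own knowledge first, then the crew's, appending each non-empty result to the task prompt. A minimal sketch of that control flow, with stub objects standing in for the real Knowledge and Crew types (only the ordering and the None-guards come from the diff; every name below is illustrative):

```python
class StubKnowledge:
    """Stand-in for a knowledge store; query() returns snippet strings."""

    def __init__(self, snippets):
        self.snippets = snippets

    def query(self, queries, **config):
        return self.snippets


def assemble_prompt(task_prompt, agent_knowledge, crew_knowledge, search_query):
    # Agent-level knowledge first, then crew-level, mirroring the hunk above.
    if agent_knowledge is not None:
        snippets = agent_knowledge.query([search_query])
        if snippets:
            task_prompt += "\nAgent knowledge:\n" + "\n".join(snippets)
    if crew_knowledge is not None:
        snippets = crew_knowledge.query([search_query])
        if snippets:
            task_prompt += "\nCrew knowledge:\n" + "\n".join(snippets)
    return task_prompt


print(assemble_prompt("Answer X.", StubKnowledge(["fact A"]), None, "X"))
```
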
@@ -96,7 +96,7 @@ class CrewAgentExecutor(CrewAgentExecutorMixin):
            )
        )

    def invoke(self, inputs: Dict[str, Union[str, bool, None]]) -> Dict[str, Any]:
    def invoke(self, inputs: Dict[str, str]) -> Dict[str, Any]:
        if "system" in self.prompt:
            system_prompt = self._format_prompt(self.prompt.get("system", ""), inputs)
            user_prompt = self._format_prompt(self.prompt.get("user", ""), inputs)
@@ -120,7 +120,11 @@ class CrewAgentExecutor(CrewAgentExecutorMixin):
            raise
        except Exception as e:
            handle_unknown_error(self._printer, e)
            raise
            if e.__class__.__module__.startswith("litellm"):
                # Do not retry on litellm errors
                raise e
            else:
                raise e

        if self.ask_for_human_input:
            formatted_answer = self._handle_human_feedback(formatted_answer)
@@ -155,7 +159,6 @@ class CrewAgentExecutor(CrewAgentExecutorMixin):
                messages=self.messages,
                callbacks=self.callbacks,
                printer=self._printer,
                from_task=self.task,
            )
            formatted_answer = process_llm_response(answer, self.use_stop_words)

@@ -371,13 +374,10 @@ class CrewAgentExecutor(CrewAgentExecutorMixin):
                training_data[agent_id] = agent_training_data
            training_handler.save(training_data)

    def _format_prompt(
        self, prompt: str, inputs: Dict[str, Union[str, bool, None]]
    ) -> str:
        # Cast to str to satisfy type checker - these are always strings when called
        prompt = prompt.replace("{input}", str(inputs["input"]))
        prompt = prompt.replace("{tool_names}", str(inputs["tool_names"]))
        prompt = prompt.replace("{tools}", str(inputs["tools"]))
    def _format_prompt(self, prompt: str, inputs: Dict[str, str]) -> str:
        prompt = prompt.replace("{input}", inputs["input"])
        prompt = prompt.replace("{tool_names}", inputs["tool_names"])
        prompt = prompt.replace("{tools}", inputs["tools"])
        return prompt

    def _handle_human_feedback(self, formatted_answer: AgentFinish) -> AgentFinish:

@@ -2,7 +2,3 @@ ALGORITHMS = ["RS256"]
AUTH0_DOMAIN = "crewai.us.auth0.com"
AUTH0_CLIENT_ID = "DEVC5Fw6NlRoSzmDCcOhVq85EfLBjKa8"
AUTH0_AUDIENCE = "https://crewai.us.auth0.com/api/v2/"

WORKOS_DOMAIN = "login.crewai.com"
WORKOS_CLI_CONNECT_APP_ID = "client_01JYT06R59SP0NXYGD994NFXXX"
WORKOS_ENVIRONMENT_ID = "client_01JNJQWBJ4SPFN3SWJM5T7BDG8"

@@ -5,72 +5,37 @@ from typing import Any, Dict
import requests
from rich.console import Console

from .constants import (
    AUTH0_AUDIENCE,
    AUTH0_CLIENT_ID,
    AUTH0_DOMAIN,
    WORKOS_DOMAIN,
    WORKOS_CLI_CONNECT_APP_ID,
    WORKOS_ENVIRONMENT_ID,
)

from .utils import TokenManager, validate_jwt_token
from urllib.parse import quote
from crewai.cli.plus_api import PlusAPI
from crewai.cli.config import Settings
from .constants import AUTH0_AUDIENCE, AUTH0_CLIENT_ID, AUTH0_DOMAIN
from .utils import TokenManager, validate_token

console = Console()


class AuthenticationCommand:
    AUTH0_DEVICE_CODE_URL = f"https://{AUTH0_DOMAIN}/oauth/device/code"
    AUTH0_TOKEN_URL = f"https://{AUTH0_DOMAIN}/oauth/token"

    WORKOS_DEVICE_CODE_URL = f"https://{WORKOS_DOMAIN}/oauth2/device_authorization"
    WORKOS_TOKEN_URL = f"https://{WORKOS_DOMAIN}/oauth2/token"
    DEVICE_CODE_URL = f"https://{AUTH0_DOMAIN}/oauth/device/code"
    TOKEN_URL = f"https://{AUTH0_DOMAIN}/oauth/token"

    def __init__(self):
        self.token_manager = TokenManager()
        # TODO: WORKOS - This variable is temporary until migration to WorkOS is complete.
        self.user_provider = "workos"

    def login(self) -> None:
    def signup(self) -> None:
        """Sign up to CrewAI+"""

        device_code_url = self.WORKOS_DEVICE_CODE_URL
        token_url = self.WORKOS_TOKEN_URL
        client_id = WORKOS_CLI_CONNECT_APP_ID
        audience = None

        console.print("Signing in to CrewAI Enterprise...\n", style="bold blue")

        # TODO: WORKOS - Next line and conditional are temporary until migration to WorkOS is complete.
        user_provider = self._determine_user_provider()
        if user_provider == "auth0":
            device_code_url = self.AUTH0_DEVICE_CODE_URL
            token_url = self.AUTH0_TOKEN_URL
            client_id = AUTH0_CLIENT_ID
            audience = AUTH0_AUDIENCE
            self.user_provider = "auth0"
        # End of temporary code.

        device_code_data = self._get_device_code(client_id, device_code_url, audience)
        console.print("Signing Up to CrewAI+ \n", style="bold blue")
        device_code_data = self._get_device_code()
        self._display_auth_instructions(device_code_data)

        return self._poll_for_token(device_code_data, client_id, token_url)
        return self._poll_for_token(device_code_data)

    def _get_device_code(
        self, client_id: str, device_code_url: str, audience: str | None = None
    ) -> Dict[str, Any]:
    def _get_device_code(self) -> Dict[str, Any]:
        """Get the device code to authenticate the user."""

        device_code_payload = {
            "client_id": client_id,
            "client_id": AUTH0_CLIENT_ID,
            "scope": "openid",
            "audience": audience,
            "audience": AUTH0_AUDIENCE,
        }
        response = requests.post(
            url=device_code_url, data=device_code_payload, timeout=20
            url=self.DEVICE_CODE_URL, data=device_code_payload, timeout=20
        )
        response.raise_for_status()
        return response.json()
@@ -81,33 +46,38 @@ class AuthenticationCommand:
        console.print("2. Enter the following code: ", device_code_data["user_code"])
        webbrowser.open(device_code_data["verification_uri_complete"])

    def _poll_for_token(
        self, device_code_data: Dict[str, Any], client_id: str, token_poll_url: str
    ) -> None:
        """Polls the server for the token until it is received, or max attempts are reached."""

    def _poll_for_token(self, device_code_data: Dict[str, Any]) -> None:
        """Poll the server for the token."""
        token_payload = {
            "grant_type": "urn:ietf:params:oauth:grant-type:device_code",
            "device_code": device_code_data["device_code"],
            "client_id": client_id,
            "client_id": AUTH0_CLIENT_ID,
        }

        console.print("\nWaiting for authentication... ", style="bold blue", end="")

        attempts = 0
        while True and attempts < 10:
            response = requests.post(token_poll_url, data=token_payload, timeout=30)
        while True and attempts < 5:
            response = requests.post(self.TOKEN_URL, data=token_payload, timeout=30)
            token_data = response.json()

            if response.status_code == 200:
                self._validate_and_save_token(token_data)
                validate_token(token_data["id_token"])
                expires_in = 360000  # Token expiration time in seconds
                self.token_manager.save_tokens(token_data["access_token"], expires_in)

                console.print(
                    "Success!",
                    style="bold green",
                )

                self._login_to_tool_repository()
                try:
                    from crewai.cli.tools.main import ToolCommand
                    ToolCommand().login()
                except Exception:
                    console.print(
                        "\n[bold yellow]Warning:[/bold yellow] Authentication with the Tool Repository failed.",
                        style="yellow",
                    )
                    console.print(
                        "Other features will work normally, but you may experience limitations "
                        "with downloading and publishing tools."
                        "\nRun [bold]crewai login[/bold] to try logging in again.\n",
                        style="yellow",
                    )

                console.print(
                    "\n[bold green]Welcome to CrewAI Enterprise![/bold green]\n"
@@ -123,88 +93,3 @@ class AuthenticationCommand:
        console.print(
            "Timeout: Failed to get the token. Please try again.", style="bold red"
        )

    def _validate_and_save_token(self, token_data: Dict[str, Any]) -> None:
        """Validates the JWT token and saves the token to the token manager."""

        jwt_token = token_data["access_token"]
        jwt_token_data = {
            "jwt_token": jwt_token,
            "jwks_url": f"https://{WORKOS_DOMAIN}/oauth2/jwks",
            "issuer": f"https://{WORKOS_DOMAIN}",
            "audience": WORKOS_ENVIRONMENT_ID,
        }

        # TODO: WORKOS - The following conditional is temporary until migration to WorkOS is complete.
        if self.user_provider == "auth0":
            jwt_token_data["jwks_url"] = f"https://{AUTH0_DOMAIN}/.well-known/jwks.json"
            jwt_token_data["issuer"] = f"https://{AUTH0_DOMAIN}/"
            jwt_token_data["audience"] = AUTH0_AUDIENCE

        decoded_token = validate_jwt_token(**jwt_token_data)

        expires_at = decoded_token.get("exp", 0)
        self.token_manager.save_tokens(jwt_token, expires_at)

    def _login_to_tool_repository(self) -> None:
        """Login to the tool repository."""

        from crewai.cli.tools.main import ToolCommand

        try:
            console.print(
                "Now logging you in to the Tool Repository... ",
                style="bold blue",
                end="",
            )

            ToolCommand().login()

            console.print(
                "Success!\n",
                style="bold green",
            )

            settings = Settings()
            console.print(
                f"You are authenticated to the tool repository as [bold cyan]'{settings.org_name}'[/bold cyan] ({settings.org_uuid})",
                style="green",
            )
        except Exception:
            console.print(
                "\n[bold yellow]Warning:[/bold yellow] Authentication with the Tool Repository failed.",
                style="yellow",
            )
            console.print(
                "Other features will work normally, but you may experience limitations "
                "with downloading and publishing tools."
                "\nRun [bold]crewai login[/bold] to try logging in again.\n",
                style="yellow",
            )

    # TODO: WORKOS - This method is temporary until migration to WorkOS is complete.
    def _determine_user_provider(self) -> str:
        """Determine which provider to use for authentication."""

        console.print(
            "Enter your CrewAI Enterprise account email: ", style="bold blue", end=""
        )
        email = input()
        email_encoded = quote(email)

        # It's not correct to call this method directly, but it's temporary until migration is complete.
        response = PlusAPI("")._make_request(
            "GET", f"/crewai_plus/api/v1/me/provider?email={email_encoded}"
        )

        if response.status_code == 200:
            if response.json().get("provider") == "auth0":
                return "auth0"
            else:
                return "workos"
        else:
            console.print(
                "Error: Failed to authenticate with crewai enterprise. Ensure that you are using the latest crewai version and please try again. If the problem persists, contact support@crewai.com.",
                style="red",
            )
            raise SystemExit

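Both variants of AuthenticationCommand above implement the OAuth 2.0 device authorization grant (RFC 8628): request a device code, show the user a verification URL, then poll the token endpoint. A minimal, self-contained sketch of that flow; the endpoint URLs and client_id are placeholders, not real credentials:

```python
import time
import requests


def device_code_login(device_code_url, token_url, client_id, max_attempts=10):
    # Step 1: ask the server for a device code and a user-facing code.
    device = requests.post(
        device_code_url, data={"client_id": client_id, "scope": "openid"}, timeout=20
    ).json()
    print(f"Open {device['verification_uri_complete']} and enter {device['user_code']}")

    # Step 2: poll the token endpoint until the user finishes in the browser.
    for _ in range(max_attempts):
        resp = requests.post(token_url, data={
            "grant_type": "urn:ietf:params:oauth:grant-type:device_code",
            "device_code": device["device_code"],
            "client_id": client_id,
        }, timeout=30)
        data = resp.json()
        if resp.status_code == 200:
            return data  # access_token (and id_token for OIDC providers)
        if data.get("error") not in ("authorization_pending", "slow_down"):
            raise RuntimeError(data.get("error_description", "device flow failed"))
        time.sleep(device.get("interval", 5))  # server-suggested polling interval
    raise TimeoutError("Timed out waiting for the user to authorize the device")
```
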
@@ -1,72 +1,32 @@
import json
import os
import sys
from datetime import datetime
from datetime import datetime, timedelta
from pathlib import Path
from typing import Optional
import jwt
from jwt import PyJWKClient

from auth0.authentication.token_verifier import (
    AsymmetricSignatureVerifier,
    TokenVerifier,
)
from cryptography.fernet import Fernet

from .constants import AUTH0_CLIENT_ID, AUTH0_DOMAIN

def validate_jwt_token(
    jwt_token: str, jwks_url: str, issuer: str, audience: str
) -> dict:

def validate_token(id_token: str) -> None:
    """
    Verify the token's signature and claims using PyJWT.
    :param jwt_token: The JWT (JWS) string to validate.
    :param jwks_url: The URL of the JWKS endpoint.
    :param issuer: The expected issuer of the token.
    :param audience: The expected audience of the token.
    :return: The decoded token.
    :raises Exception: If the token is invalid for any reason (e.g., signature mismatch,
                       expired, incorrect issuer/audience, JWKS fetching error,
                       missing required claims).
    Verify the token and its precedence

    :param id_token:
    """

    decoded_token = None

    try:
        jwk_client = PyJWKClient(jwks_url)
        signing_key = jwk_client.get_signing_key_from_jwt(jwt_token)

        _unverified_decoded_token = jwt.decode(
            jwt_token, options={"verify_signature": False}
        )
        decoded_token = jwt.decode(
            jwt_token,
            signing_key.key,
            algorithms=["RS256"],
            audience=audience,
            issuer=issuer,
            options={
                "verify_signature": True,
                "verify_exp": True,
                "verify_nbf": True,
                "verify_iat": True,
                "require": ["exp", "iat", "iss", "aud", "sub"],
            },
        )
        return decoded_token

    except jwt.ExpiredSignatureError:
        raise Exception("Token has expired.")
    except jwt.InvalidAudienceError:
        actual_audience = _unverified_decoded_token.get("aud", "[no audience found]")
        raise Exception(
            f"Invalid token audience. Got: '{actual_audience}'. Expected: '{audience}'"
        )
    except jwt.InvalidIssuerError:
        actual_issuer = _unverified_decoded_token.get("iss", "[no issuer found]")
        raise Exception(
            f"Invalid token issuer. Got: '{actual_issuer}'. Expected: '{issuer}'"
        )
    except jwt.MissingRequiredClaimError as e:
        raise Exception(f"Token is missing required claims: {str(e)}")
    except jwt.exceptions.PyJWKClientError as e:
        raise Exception(f"JWKS or key processing error: {str(e)}")
    except jwt.InvalidTokenError as e:
        raise Exception(f"Invalid token: {str(e)}")
    jwks_url = f"https://{AUTH0_DOMAIN}/.well-known/jwks.json"
    issuer = f"https://{AUTH0_DOMAIN}/"
    signature_verifier = AsymmetricSignatureVerifier(jwks_url)
    token_verifier = TokenVerifier(
        signature_verifier=signature_verifier, issuer=issuer, audience=AUTH0_CLIENT_ID
    )
    token_verifier.verify(id_token)


class TokenManager:
@@ -96,14 +56,14 @@ class TokenManager:
            self.save_secure_file(key_filename, new_key)
            return new_key

    def save_tokens(self, access_token: str, expires_at: int) -> None:
    def save_tokens(self, access_token: str, expires_in: int) -> None:
        """
        Save the access token and its expiration time.

        :param access_token: The access token to save.
        :param expires_at: The UNIX timestamp of the expiration time.
        :param expires_in: The expiration time of the access token in seconds.
        """
        expiration_time = datetime.fromtimestamp(expires_at)
        expiration_time = datetime.now() + timedelta(seconds=expires_in)
        data = {
            "access_token": access_token,
            "expiration": expiration_time.isoformat(),

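The save_tokens change above is semantic, not just a rename: one variant receives the JWT's exp claim (an absolute UNIX timestamp), the other a relative lifetime in seconds. A small runnable sketch of the two conversions, using an invented exp value:

```python
from datetime import datetime, timedelta

exp_claim = 1767225600  # hypothetical `exp` claim from a decoded JWT

# expires_at variant: absolute UNIX timestamp -> datetime
expiration_from_at = datetime.fromtimestamp(exp_claim)

# expires_in variant: relative lifetime in seconds -> datetime
expiration_from_in = datetime.now() + timedelta(seconds=360000)

print(expiration_from_at.isoformat(), expiration_from_in.isoformat())
```
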
@@ -2,7 +2,7 @@ from importlib.metadata import version as get_version
from typing import Optional

import click
from crewai.cli.config import Settings

from crewai.cli.add_crew_to_flow import add_crew_to_flow
from crewai.cli.create_crew import create_crew
from crewai.cli.create_flow import create_flow
@@ -138,12 +138,8 @@ def log_tasks_outputs() -> None:
@click.option("-s", "--short", is_flag=True, help="Reset SHORT TERM memory")
@click.option("-e", "--entities", is_flag=True, help="Reset ENTITIES memory")
@click.option("-kn", "--knowledge", is_flag=True, help="Reset KNOWLEDGE storage")
@click.option(
    "-akn", "--agent-knowledge", is_flag=True, help="Reset AGENT KNOWLEDGE storage"
)
@click.option(
    "-k", "--kickoff-outputs", is_flag=True, help="Reset LATEST KICKOFF TASK OUTPUTS"
)
@click.option("-akn", "--agent-knowledge", is_flag=True, help="Reset AGENT KNOWLEDGE storage")
@click.option("-k","--kickoff-outputs",is_flag=True,help="Reset LATEST KICKOFF TASK OUTPUTS")
@click.option("-a", "--all", is_flag=True, help="Reset ALL memories")
def reset_memories(
    long: bool,
@@ -158,23 +154,13 @@ def reset_memories(
    Reset the crew memories (long, short, entity, latest_crew_kickoff_outputs, knowledge, agent_knowledge). This will delete all the data saved.
    """
    try:
        memory_types = [
            long,
            short,
            entities,
            knowledge,
            agent_knowledge,
            kickoff_outputs,
            all,
        ]
        memory_types = [long, short, entities, knowledge, agent_knowledge, kickoff_outputs, all]
        if not any(memory_types):
            click.echo(
                "Please specify at least one memory type to reset using the appropriate flags."
            )
            return
        reset_memories_command(
            long, short, entities, knowledge, agent_knowledge, kickoff_outputs, all
        )
        reset_memories_command(long, short, entities, knowledge, agent_knowledge, kickoff_outputs, all)
    except Exception as e:
        click.echo(f"An error occurred while resetting memories: {e}", err=True)

@@ -224,11 +210,16 @@ def update():
    update_crew()


@crewai.command()
def signup():
    """Sign Up/Login to CrewAI+."""
    AuthenticationCommand().signup()


@crewai.command()
def login():
    """Sign Up/Login to CrewAI Enterprise."""
    Settings().clear()
    AuthenticationCommand().login()
    """Sign Up/Login to CrewAI+."""
    AuthenticationCommand().signup()


# DEPLOY CREWAI+ COMMANDS

@@ -37,10 +37,6 @@ class Settings(BaseModel):
        merged_data = {**file_data, **data}
        super().__init__(config_path=config_path, **merged_data)

    def clear(self) -> None:
        """Clear all settings"""
        self.config_path.unlink(missing_ok=True)

    def dump(self) -> None:
        """Save current settings to settings.json"""
        if self.config_path.is_file():

@@ -5,7 +5,7 @@ description = "{{name}} using crewAI"
authors = [{ name = "Your Name", email = "you@example.com" }]
requires-python = ">=3.10,<3.14"
dependencies = [
    "crewai[tools]>=0.148.0,<1.0.0"
    "crewai[tools]>=0.134.0,<1.0.0"
]

[project.scripts]

@@ -5,7 +5,7 @@ description = "{{name}} using crewAI"
authors = [{ name = "Your Name", email = "you@example.com" }]
requires-python = ">=3.10,<3.14"
dependencies = [
    "crewai[tools]>=0.148.0,<1.0.0",
    "crewai[tools]>=0.134.0,<1.0.0",
]

[project.scripts]

@@ -5,7 +5,7 @@ description = "Power up your crews with {{folder_name}}"
readme = "README.md"
requires-python = ">=3.10,<3.14"
dependencies = [
    "crewai[tools]>=0.148.0"
    "crewai[tools]>=0.134.0"
]

[tool.crewai]

@@ -156,7 +156,7 @@ class ToolCommand(BaseCommand, PlusAPIMixin):

        console.print(f"Successfully installed {handle}", style="bold green")

    def login(self) -> None:
    def login(self):
        login_response = self.plus_api_client.login_to_tool_repository()

        if login_response.status_code != 200:
@@ -175,10 +175,18 @@ class ToolCommand(BaseCommand, PlusAPIMixin):
        settings.tool_repository_password = login_response_json["credential"][
            "password"
        ]
        settings.org_uuid = login_response_json["current_organization"]["uuid"]
        settings.org_name = login_response_json["current_organization"]["name"]
        settings.org_uuid = login_response_json["current_organization"][
            "uuid"
        ]
        settings.org_name = login_response_json["current_organization"][
            "name"
        ]
        settings.dump()

        console.print(
            f"Successfully authenticated to the tool repository as {settings.org_name} ({settings.org_uuid}).", style="bold green"
        )

    def _add_package(self, tool_details: dict[str, Any]):
        is_from_pypi = tool_details.get("source", None) == "pypi"
        tool_handle = tool_details["handle"]
@@ -235,15 +243,9 @@ class ToolCommand(BaseCommand, PlusAPIMixin):

        return env

    def _print_current_organization(self) -> None:
    def _print_current_organization(self):
        settings = Settings()
        if settings.org_uuid:
            console.print(
                f"Current organization: {settings.org_name} ({settings.org_uuid})",
                style="bold blue",
            )
            console.print(f"Current organization: {settings.org_name} ({settings.org_uuid})", style="bold blue")
        else:
            console.print(
                "No organization currently set. We recommend setting one before using: `crewai org switch <org_id>` command.",
                style="yellow",
            )
            console.print("No organization currently set. We recommend setting one before using: `crewai org switch <org_id>` command.", style="yellow")

@@ -18,11 +18,6 @@ from typing import (
    cast,
)

from opentelemetry import baggage
from opentelemetry.context import attach, detach

from crewai.utilities.crew.models import CrewContext

from pydantic import (
    UUID4,
    BaseModel,
@@ -161,7 +156,7 @@ class Crew(FlowTrackable, BaseModel):
    )
    user_memory: Optional[InstanceOf[UserMemory]] = Field(
        default=None,
        description="DEPRECATED: Will be removed in version 0.156.0 or on 2025-08-04, whichever comes first. Use external_memory instead.",
        description="An instance of the UserMemory to be used by the Crew to store/fetch memories of a specific user.",
    )
    external_memory: Optional[InstanceOf[ExternalMemory]] = Field(
        default=None,
@@ -327,7 +322,7 @@ class Crew(FlowTrackable, BaseModel):
            self._short_term_memory = self.short_term_memory
            self._entity_memory = self.entity_memory

            # UserMemory will be removed in version 0.156.0 or on 2025-08-04, whichever comes first
            # UserMemory is going to be deprecated in the future, but we have to initialize a default value for now
            self._user_memory = None

            if self.memory:
@@ -621,11 +616,6 @@ class Crew(FlowTrackable, BaseModel):
        self,
        inputs: Optional[Dict[str, Any]] = None,
    ) -> CrewOutput:
        ctx = baggage.set_baggage(
            "crew_context", CrewContext(id=str(self.id), key=self.key)
        )
        token = attach(ctx)

        try:
            for before_callback in self.before_kickoff_callbacks:
                if inputs is None:
@@ -686,8 +676,6 @@ class Crew(FlowTrackable, BaseModel):
                CrewKickoffFailedEvent(error=str(e), crew_name=self.name or "crew"),
            )
            raise
        finally:
            detach(token)

    def kickoff_for_each(self, inputs: List[Dict[str, Any]]) -> List[CrewOutput]:
        """Executes the Crew's workflow for each input in the list and aggregates results."""
@@ -1255,7 +1243,6 @@ class Crew(FlowTrackable, BaseModel):
        if self.external_memory:
            copied_data["external_memory"] = self.external_memory.model_copy(deep=True)
        if self.user_memory:
            # DEPRECATED: UserMemory will be removed in version 0.156.0 or on 2025-08-04
            copied_data["user_memory"] = self.user_memory.model_copy(deep=True)

        copied_data.pop("agents", None)
@@ -1332,7 +1319,6 @@ class Crew(FlowTrackable, BaseModel):
            ),
        )
        test_crew = self.copy()

        evaluator = CrewEvaluator(test_crew, llm_instance)

        for i in range(1, n_iterations + 1):

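The kickoff hunks above wrap crew execution in OpenTelemetry baggage so that spans and event handlers running inside the crew can see which crew they belong to. The attach/try/finally/detach shape in isolation, using a plain string value instead of the CrewContext model (a sketch, not the library's method):

```python
from opentelemetry import baggage
from opentelemetry.context import attach, detach


def run_with_crew_context(crew_id: str, fn):
    # attach() returns a token; detach(token) restores the previous context
    # even when fn() raises, which is why kickoff uses try/finally above.
    token = attach(baggage.set_baggage("crew_context", crew_id))
    try:
        return fn()
    finally:
        detach(token)


print(run_with_crew_context("crew-123", lambda: "done"))
```
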
@@ -1,40 +0,0 @@
from crewai.experimental.evaluation import (
    BaseEvaluator,
    EvaluationScore,
    MetricCategory,
    AgentEvaluationResult,
    SemanticQualityEvaluator,
    GoalAlignmentEvaluator,
    ReasoningEfficiencyEvaluator,
    ToolSelectionEvaluator,
    ParameterExtractionEvaluator,
    ToolInvocationEvaluator,
    EvaluationTraceCallback,
    create_evaluation_callbacks,
    AgentEvaluator,
    create_default_evaluator,
    ExperimentRunner,
    ExperimentResults,
    ExperimentResult,
)


__all__ = [
    "BaseEvaluator",
    "EvaluationScore",
    "MetricCategory",
    "AgentEvaluationResult",
    "SemanticQualityEvaluator",
    "GoalAlignmentEvaluator",
    "ReasoningEfficiencyEvaluator",
    "ToolSelectionEvaluator",
    "ParameterExtractionEvaluator",
    "ToolInvocationEvaluator",
    "EvaluationTraceCallback",
    "create_evaluation_callbacks",
    "AgentEvaluator",
    "create_default_evaluator",
    "ExperimentRunner",
    "ExperimentResults",
    "ExperimentResult"
]

@@ -1,51 +0,0 @@
from crewai.experimental.evaluation.base_evaluator import (
    BaseEvaluator,
    EvaluationScore,
    MetricCategory,
    AgentEvaluationResult
)

from crewai.experimental.evaluation.metrics import (
    SemanticQualityEvaluator,
    GoalAlignmentEvaluator,
    ReasoningEfficiencyEvaluator,
    ToolSelectionEvaluator,
    ParameterExtractionEvaluator,
    ToolInvocationEvaluator
)

from crewai.experimental.evaluation.evaluation_listener import (
    EvaluationTraceCallback,
    create_evaluation_callbacks
)

from crewai.experimental.evaluation.agent_evaluator import (
    AgentEvaluator,
    create_default_evaluator
)

from crewai.experimental.evaluation.experiment import (
    ExperimentRunner,
    ExperimentResults,
    ExperimentResult
)

__all__ = [
    "BaseEvaluator",
    "EvaluationScore",
    "MetricCategory",
    "AgentEvaluationResult",
    "SemanticQualityEvaluator",
    "GoalAlignmentEvaluator",
    "ReasoningEfficiencyEvaluator",
    "ToolSelectionEvaluator",
    "ParameterExtractionEvaluator",
    "ToolInvocationEvaluator",
    "EvaluationTraceCallback",
    "create_evaluation_callbacks",
    "AgentEvaluator",
    "create_default_evaluator",
    "ExperimentRunner",
    "ExperimentResults",
    "ExperimentResult"
]

@@ -1,245 +0,0 @@
import threading
from typing import Any

from crewai.experimental.evaluation.base_evaluator import AgentEvaluationResult, AggregationStrategy
from crewai.agent import Agent
from crewai.task import Task
from crewai.experimental.evaluation.evaluation_display import EvaluationDisplayFormatter
from crewai.utilities.events.agent_events import AgentEvaluationStartedEvent, AgentEvaluationCompletedEvent, AgentEvaluationFailedEvent
from crewai.experimental.evaluation import BaseEvaluator, create_evaluation_callbacks
from collections.abc import Sequence
from crewai.utilities.events.crewai_event_bus import crewai_event_bus
from crewai.utilities.events.utils.console_formatter import ConsoleFormatter
from crewai.utilities.events.task_events import TaskCompletedEvent
from crewai.utilities.events.agent_events import LiteAgentExecutionCompletedEvent
from crewai.experimental.evaluation.base_evaluator import AgentAggregatedEvaluationResult, EvaluationScore, MetricCategory

class ExecutionState:
    def __init__(self):
        self.traces = {}
        self.current_agent_id: str | None = None
        self.current_task_id: str | None = None
        self.iteration = 1
        self.iterations_results = {}
        self.agent_evaluators = {}

class AgentEvaluator:
    def __init__(
        self,
        agents: list[Agent],
        evaluators: Sequence[BaseEvaluator] | None = None,
    ):
        self.agents: list[Agent] = agents
        self.evaluators: Sequence[BaseEvaluator] | None = evaluators

        self.callback = create_evaluation_callbacks()
        self.console_formatter = ConsoleFormatter()
        self.display_formatter = EvaluationDisplayFormatter()

        self._thread_local: threading.local = threading.local()

        for agent in self.agents:
            self._execution_state.agent_evaluators[str(agent.id)] = self.evaluators

        self._subscribe_to_events()

    @property
    def _execution_state(self) -> ExecutionState:
        if not hasattr(self._thread_local, 'execution_state'):
            self._thread_local.execution_state = ExecutionState()
        return self._thread_local.execution_state

    def _subscribe_to_events(self) -> None:
        from typing import cast
        crewai_event_bus.register_handler(TaskCompletedEvent, cast(Any, self._handle_task_completed))
        crewai_event_bus.register_handler(LiteAgentExecutionCompletedEvent, cast(Any, self._handle_lite_agent_completed))

    def _handle_task_completed(self, source: Any, event: TaskCompletedEvent) -> None:
        assert event.task is not None
        agent = event.task.agent
        if agent and str(getattr(agent, 'id', 'unknown')) in self._execution_state.agent_evaluators:
            self.emit_evaluation_started_event(agent_role=agent.role, agent_id=str(agent.id), task_id=str(event.task.id))

            state = ExecutionState()
            state.current_agent_id = str(agent.id)
            state.current_task_id = str(event.task.id)

            assert state.current_agent_id is not None and state.current_task_id is not None
            trace = self.callback.get_trace(state.current_agent_id, state.current_task_id)

            if not trace:
                return

            result = self.evaluate(
                agent=agent,
                task=event.task,
                execution_trace=trace,
                final_output=event.output,
                state=state
            )

            current_iteration = self._execution_state.iteration
            if current_iteration not in self._execution_state.iterations_results:
                self._execution_state.iterations_results[current_iteration] = {}

            if agent.role not in self._execution_state.iterations_results[current_iteration]:
                self._execution_state.iterations_results[current_iteration][agent.role] = []

            self._execution_state.iterations_results[current_iteration][agent.role].append(result)

    def _handle_lite_agent_completed(self, source: object, event: LiteAgentExecutionCompletedEvent) -> None:
        agent_info = event.agent_info
        agent_id = str(agent_info["id"])

        if agent_id in self._execution_state.agent_evaluators:
            state = ExecutionState()
            state.current_agent_id = agent_id
            state.current_task_id = "lite_task"

            target_agent = None
            for agent in self.agents:
                if str(agent.id) == agent_id:
                    target_agent = agent
                    break

            if not target_agent:
                return

            assert state.current_agent_id is not None and state.current_task_id is not None
            trace = self.callback.get_trace(state.current_agent_id, state.current_task_id)

            if not trace:
                return

            result = self.evaluate(
                agent=target_agent,
                execution_trace=trace,
                final_output=event.output,
                state=state
            )

            current_iteration = self._execution_state.iteration
            if current_iteration not in self._execution_state.iterations_results:
                self._execution_state.iterations_results[current_iteration] = {}

            agent_role = target_agent.role
            if agent_role not in self._execution_state.iterations_results[current_iteration]:
                self._execution_state.iterations_results[current_iteration][agent_role] = []

            self._execution_state.iterations_results[current_iteration][agent_role].append(result)

    def set_iteration(self, iteration: int) -> None:
        self._execution_state.iteration = iteration

    def reset_iterations_results(self) -> None:
        self._execution_state.iterations_results = {}

    def get_evaluation_results(self) -> dict[str, list[AgentEvaluationResult]]:
        if self._execution_state.iterations_results and self._execution_state.iteration in self._execution_state.iterations_results:
            return self._execution_state.iterations_results[self._execution_state.iteration]
        return {}

    def display_results_with_iterations(self) -> None:
        self.display_formatter.display_summary_results(self._execution_state.iterations_results)

    def get_agent_evaluation(self, strategy: AggregationStrategy = AggregationStrategy.SIMPLE_AVERAGE, include_evaluation_feedback: bool = True) -> dict[str, AgentAggregatedEvaluationResult]:
        agent_results = {}
        with crewai_event_bus.scoped_handlers():
            task_results = self.get_evaluation_results()
            for agent_role, results in task_results.items():
                if not results:
                    continue

                agent_id = results[0].agent_id

                aggregated_result = self.display_formatter._aggregate_agent_results(
                    agent_id=agent_id,
                    agent_role=agent_role,
                    results=results,
                    strategy=strategy
                )

                agent_results[agent_role] = aggregated_result


        if self._execution_state.iterations_results and self._execution_state.iteration == max(self._execution_state.iterations_results.keys(), default=0):
            self.display_results_with_iterations()

        if include_evaluation_feedback:
            self.display_evaluation_with_feedback()

        return agent_results

    def display_evaluation_with_feedback(self) -> None:
        self.display_formatter.display_evaluation_with_feedback(self._execution_state.iterations_results)

    def evaluate(
        self,
        agent: Agent,
        execution_trace: dict[str, Any],
        final_output: Any,
        state: ExecutionState,
        task: Task | None = None,
    ) -> AgentEvaluationResult:
        result = AgentEvaluationResult(
            agent_id=state.current_agent_id or str(agent.id),
            task_id=state.current_task_id or (str(task.id) if task else "unknown_task")
        )

        assert self.evaluators is not None
        task_id = str(task.id) if task else None
        for evaluator in self.evaluators:
            try:
                self.emit_evaluation_started_event(agent_role=agent.role, agent_id=str(agent.id), task_id=task_id)
                score = evaluator.evaluate(
                    agent=agent,
                    task=task,
                    execution_trace=execution_trace,
                    final_output=final_output
                )
                result.metrics[evaluator.metric_category] = score
                self.emit_evaluation_completed_event(agent_role=agent.role, agent_id=str(agent.id), task_id=task_id, metric_category=evaluator.metric_category, score=score)
            except Exception as e:
                self.emit_evaluation_failed_event(agent_role=agent.role, agent_id=str(agent.id), task_id=task_id, error=str(e))
                self.console_formatter.print(f"Error in {evaluator.metric_category.value} evaluator: {str(e)}")

        return result

    def emit_evaluation_started_event(self, agent_role: str, agent_id: str, task_id: str | None = None):
        crewai_event_bus.emit(
            self,
            AgentEvaluationStartedEvent(agent_role=agent_role, agent_id=agent_id, task_id=task_id, iteration=self._execution_state.iteration)
        )

    def emit_evaluation_completed_event(self, agent_role: str, agent_id: str, task_id: str | None = None, metric_category: MetricCategory | None = None, score: EvaluationScore | None = None):
        crewai_event_bus.emit(
            self,
            AgentEvaluationCompletedEvent(agent_role=agent_role, agent_id=agent_id, task_id=task_id, iteration=self._execution_state.iteration, metric_category=metric_category, score=score)
        )

    def emit_evaluation_failed_event(self, agent_role: str, agent_id: str, error: str, task_id: str | None = None):
        crewai_event_bus.emit(
            self,
            AgentEvaluationFailedEvent(agent_role=agent_role, agent_id=agent_id, task_id=task_id, iteration=self._execution_state.iteration, error=error)
        )

def create_default_evaluator(agents: list[Agent], llm: None = None):
    from crewai.experimental.evaluation import (
        GoalAlignmentEvaluator,
        SemanticQualityEvaluator,
        ToolSelectionEvaluator,
        ParameterExtractionEvaluator,
        ToolInvocationEvaluator,
        ReasoningEfficiencyEvaluator
    )

    evaluators = [
        GoalAlignmentEvaluator(llm=llm),
        SemanticQualityEvaluator(llm=llm),
        ToolSelectionEvaluator(llm=llm),
        ParameterExtractionEvaluator(llm=llm),
        ToolInvocationEvaluator(llm=llm),
        ReasoningEfficiencyEvaluator(llm=llm),
    ]

    return AgentEvaluator(evaluators=evaluators, agents=agents)

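A hedged usage sketch for the evaluator wiring in the file above: build agents, attach the default evaluator (which subscribes itself to task-completion events on construction), run the crew, then read back aggregated per-agent scores. Names follow the module shown in the diff, which this compare deletes, so treat it as illustrative rather than a stable API:

```python
from crewai import Agent, Crew, Task
from crewai.experimental.evaluation import create_default_evaluator

researcher = Agent(role="Researcher", goal="Find facts", backstory="...")
task = Task(description="Summarize X", expected_output="A summary", agent=researcher)
crew = Crew(agents=[researcher], tasks=[task])

evaluator = create_default_evaluator(agents=[researcher])
crew.kickoff()

# {agent_role: AgentAggregatedEvaluationResult}, averaged across tasks by default
results = evaluator.get_agent_evaluation()
```
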
@@ -1,125 +0,0 @@
import abc
import enum
from enum import Enum
from typing import Any, Dict, List, Optional

from pydantic import BaseModel, Field

from crewai.agent import Agent
from crewai.task import Task
from crewai.llm import BaseLLM
from crewai.utilities.llm_utils import create_llm

class MetricCategory(enum.Enum):
    GOAL_ALIGNMENT = "goal_alignment"
    SEMANTIC_QUALITY = "semantic_quality"
    REASONING_EFFICIENCY = "reasoning_efficiency"
    TOOL_SELECTION = "tool_selection"
    PARAMETER_EXTRACTION = "parameter_extraction"
    TOOL_INVOCATION = "tool_invocation"

    def title(self):
        return self.value.replace('_', ' ').title()


class EvaluationScore(BaseModel):
    score: float | None = Field(
        default=5.0,
        description="Numeric score from 0-10 where 0 is worst and 10 is best, None if not applicable",
        ge=0.0,
        le=10.0
    )
    feedback: str = Field(
        default="",
        description="Detailed feedback explaining the evaluation score"
    )
    raw_response: str | None = Field(
        default=None,
        description="Raw response from the evaluator (e.g., LLM)"
    )

    def __str__(self) -> str:
        if self.score is None:
            return f"Score: N/A - {self.feedback}"
        return f"Score: {self.score:.1f}/10 - {self.feedback}"


class BaseEvaluator(abc.ABC):
    def __init__(self, llm: BaseLLM | None = None):
        self.llm: BaseLLM | None = create_llm(llm)

    @property
    @abc.abstractmethod
    def metric_category(self) -> MetricCategory:
        pass

    @abc.abstractmethod
    def evaluate(
        self,
        agent: Agent,
        execution_trace: Dict[str, Any],
        final_output: Any,
        task: Task | None = None,
    ) -> EvaluationScore:
        pass


class AgentEvaluationResult(BaseModel):
    agent_id: str = Field(description="ID of the evaluated agent")
    task_id: str = Field(description="ID of the task that was executed")
    metrics: Dict[MetricCategory, EvaluationScore] = Field(
        default_factory=dict,
        description="Evaluation scores for each metric category"
    )


class AggregationStrategy(Enum):
    SIMPLE_AVERAGE = "simple_average"  # Equal weight to all tasks
    WEIGHTED_BY_COMPLEXITY = "weighted_by_complexity"  # Weight by task complexity
    BEST_PERFORMANCE = "best_performance"  # Use best scores across tasks
    WORST_PERFORMANCE = "worst_performance"  # Use worst scores across tasks


class AgentAggregatedEvaluationResult(BaseModel):
    agent_id: str = Field(
        default="",
        description="ID of the agent"
    )
    agent_role: str = Field(
        default="",
        description="Role of the agent"
    )
    task_count: int = Field(
        default=0,
        description="Number of tasks included in this aggregation"
    )
    aggregation_strategy: AggregationStrategy = Field(
        default=AggregationStrategy.SIMPLE_AVERAGE,
        description="Strategy used for aggregation"
    )
    metrics: Dict[MetricCategory, EvaluationScore] = Field(
        default_factory=dict,
        description="Aggregated metrics across all tasks"
    )
    task_results: List[str] = Field(
        default_factory=list,
        description="IDs of tasks included in this aggregation"
    )
    overall_score: Optional[float] = Field(
        default=None,
        description="Overall score for this agent"
    )

    def __str__(self) -> str:
        result = f"Agent Evaluation: {self.agent_role}\n"
        result += f"Strategy: {self.aggregation_strategy.value}\n"
        result += f"Tasks evaluated: {self.task_count}\n"

        for category, score in self.metrics.items():
            result += f"\n\n- {category.value.upper()}: {score.score}/10\n"

            if score.feedback:
                detailed_feedback = "\n    ".join(score.feedback.split('\n'))
                result += f"    {detailed_feedback}\n"

        return result

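The BaseEvaluator contract above takes two overrides: a metric_category property and an evaluate method returning an EvaluationScore. A minimal custom evaluator against that contract; it is purely illustrative (it scores output length instead of calling an LLM, and reuses an existing category rather than defining a new one):

```python
class OutputLengthEvaluator(BaseEvaluator):
    @property
    def metric_category(self) -> MetricCategory:
        return MetricCategory.SEMANTIC_QUALITY  # reusing an existing category

    def evaluate(self, agent, execution_trace, final_output, task=None) -> EvaluationScore:
        text = str(final_output or "")
        # Crude proxy for richness: one point per 100 characters, capped at 10.
        score = min(10.0, len(text) / 100)
        return EvaluationScore(score=score, feedback=f"{len(text)} chars produced")
```

Note that BaseEvaluator.__init__ still calls create_llm(), so instantiating even this LLM-free subclass presumably requires a working default LLM configuration.
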
@@ -1,333 +0,0 @@
from collections import defaultdict
from typing import Dict, Any, List
from rich.table import Table
from rich.box import HEAVY_EDGE, ROUNDED
from collections.abc import Sequence
from crewai.experimental.evaluation.base_evaluator import AgentAggregatedEvaluationResult, AggregationStrategy, AgentEvaluationResult, MetricCategory
from crewai.experimental.evaluation import EvaluationScore
from crewai.utilities.events.utils.console_formatter import ConsoleFormatter
from crewai.utilities.llm_utils import create_llm

class EvaluationDisplayFormatter:
    def __init__(self):
        self.console_formatter = ConsoleFormatter()

    def display_evaluation_with_feedback(self, iterations_results: Dict[int, Dict[str, List[Any]]]):
        if not iterations_results:
            self.console_formatter.print("[yellow]No evaluation results to display[/yellow]")
            return

        all_agent_roles: set[str] = set()
        for iter_results in iterations_results.values():
            all_agent_roles.update(iter_results.keys())

        for agent_role in sorted(all_agent_roles):
            self.console_formatter.print(f"\n[bold cyan]Agent: {agent_role}[/bold cyan]")

            for iter_num, results in sorted(iterations_results.items()):
                if agent_role not in results or not results[agent_role]:
                    continue

                agent_results = results[agent_role]
                agent_id = agent_results[0].agent_id

                aggregated_result = self._aggregate_agent_results(
                    agent_id=agent_id,
                    agent_role=agent_role,
                    results=agent_results,
                )

                self.console_formatter.print(f"\n[bold]Iteration {iter_num}[/bold]")

                table = Table(box=ROUNDED)
                table.add_column("Metric", style="cyan")
                table.add_column("Score (1-10)", justify="center")
                table.add_column("Feedback", style="green")

                if aggregated_result.metrics:
                    for metric, evaluation_score in aggregated_result.metrics.items():
                        score = evaluation_score.score

                        if isinstance(score, (int, float)):
                            if score >= 8.0:
                                score_text = f"[green]{score:.1f}[/green]"
                            elif score >= 6.0:
                                score_text = f"[cyan]{score:.1f}[/cyan]"
                            elif score >= 4.0:
                                score_text = f"[yellow]{score:.1f}[/yellow]"
                            else:
                                score_text = f"[red]{score:.1f}[/red]"
                        else:
                            score_text = "[dim]N/A[/dim]"

                        table.add_section()
                        table.add_row(
                            metric.title(),
                            score_text,
                            evaluation_score.feedback or ""
                        )

                    if aggregated_result.overall_score is not None:
                        overall_score = aggregated_result.overall_score
                        if overall_score >= 8.0:
                            overall_color = "green"
                        elif overall_score >= 6.0:
                            overall_color = "cyan"
                        elif overall_score >= 4.0:
                            overall_color = "yellow"
                        else:
                            overall_color = "red"

                        table.add_section()
                        table.add_row(
                            "Overall Score",
                            f"[{overall_color}]{overall_score:.1f}[/]",
                            "Overall agent evaluation score"
                        )

                self.console_formatter.print(table)

    def display_summary_results(self, iterations_results: Dict[int, Dict[str, List[AgentAggregatedEvaluationResult]]]):
        if not iterations_results:
            self.console_formatter.print("[yellow]No evaluation results to display[/yellow]")
            return

        self.console_formatter.print("\n")

        table = Table(title="Agent Performance Scores \n (1-10 Higher is better)", box=HEAVY_EDGE)

        table.add_column("Agent/Metric", style="cyan")

        for iter_num in sorted(iterations_results.keys()):
            run_label = f"Run {iter_num}"
            table.add_column(run_label, justify="center")

        table.add_column("Avg. Total", justify="center")

        all_agent_roles: set[str] = set()
        for results in iterations_results.values():
            all_agent_roles.update(results.keys())

        for agent_role in sorted(all_agent_roles):
            agent_scores_by_iteration = {}
            agent_metrics_by_iteration = {}

            for iter_num, results in sorted(iterations_results.items()):
                if agent_role not in results or not results[agent_role]:
                    continue

                agent_results = results[agent_role]
                agent_id = agent_results[0].agent_id

                aggregated_result = self._aggregate_agent_results(
                    agent_id=agent_id,
                    agent_role=agent_role,
                    results=agent_results,
                    strategy=AggregationStrategy.SIMPLE_AVERAGE
                )

                valid_scores = [score.score for score in aggregated_result.metrics.values()
                                if score.score is not None]
                if valid_scores:
                    avg_score = sum(valid_scores) / len(valid_scores)
                    agent_scores_by_iteration[iter_num] = avg_score

                agent_metrics_by_iteration[iter_num] = aggregated_result.metrics

            if not agent_scores_by_iteration:
                continue

            avg_across_iterations = sum(agent_scores_by_iteration.values()) / len(agent_scores_by_iteration)

            row = [f"[bold]{agent_role}[/bold]"]

            for iter_num in sorted(iterations_results.keys()):
                if iter_num in agent_scores_by_iteration:
                    score = agent_scores_by_iteration[iter_num]
                    if score >= 8.0:
                        color = "green"
                    elif score >= 6.0:
                        color = "cyan"
                    elif score >= 4.0:
                        color = "yellow"
                    else:
                        color = "red"
                    row.append(f"[bold {color}]{score:.1f}[/]")
                else:
                    row.append("-")

            if avg_across_iterations >= 8.0:
                color = "green"
            elif avg_across_iterations >= 6.0:
                color = "cyan"
            elif avg_across_iterations >= 4.0:
                color = "yellow"
            else:
                color = "red"
            row.append(f"[bold {color}]{avg_across_iterations:.1f}[/]")

            table.add_row(*row)

            all_metrics: set[Any] = set()
            for metrics in agent_metrics_by_iteration.values():
                all_metrics.update(metrics.keys())

            for metric in sorted(all_metrics, key=lambda x: x.value):
                metric_scores = []

                row = [f" - {metric.title()}"]

                for iter_num in sorted(iterations_results.keys()):
                    if (iter_num in agent_metrics_by_iteration and
                            metric in agent_metrics_by_iteration[iter_num]):
                        metric_score = agent_metrics_by_iteration[iter_num][metric].score
                        if metric_score is not None:
                            metric_scores.append(metric_score)
                            if metric_score >= 8.0:
                                color = "green"
                            elif metric_score >= 6.0:
                                color = "cyan"
                            elif metric_score >= 4.0:
                                color = "yellow"
                            else:
                                color = "red"
                            row.append(f"[{color}]{metric_score:.1f}[/]")
                        else:
                            row.append("[dim]N/A[/dim]")
                    else:
                        row.append("-")

                if metric_scores:
                    avg = sum(metric_scores) / len(metric_scores)
                    if avg >= 8.0:
                        color = "green"
                    elif avg >= 6.0:
                        color = "cyan"
                    elif avg >= 4.0:
                        color = "yellow"
                    else:
                        color = "red"
                    row.append(f"[{color}]{avg:.1f}[/]")
                else:
                    row.append("-")

                table.add_row(*row)

            table.add_row(*[""] * (len(sorted(iterations_results.keys())) + 2))

        self.console_formatter.print(table)
        self.console_formatter.print("\n")

    def _aggregate_agent_results(
        self,
        agent_id: str,
        agent_role: str,
        results: Sequence[AgentEvaluationResult],
        strategy: AggregationStrategy = AggregationStrategy.SIMPLE_AVERAGE,
    ) -> AgentAggregatedEvaluationResult:
        metrics_by_category: dict[MetricCategory, list[EvaluationScore]] = defaultdict(list)

        for result in results:
            for metric_name, evaluation_score in result.metrics.items():
                metrics_by_category[metric_name].append(evaluation_score)

        aggregated_metrics: dict[MetricCategory, EvaluationScore] = {}
        for category, scores in metrics_by_category.items():
            valid_scores = [s.score for s in scores if s.score is not None]
            avg_score = sum(valid_scores) / len(valid_scores) if valid_scores else None

            feedbacks = [s.feedback for s in scores if s.feedback]

            feedback_summary = None
            if feedbacks:
                if len(feedbacks) > 1:
                    feedback_summary = self._summarize_feedbacks(
                        agent_role=agent_role,
                        metric=category.title(),
                        feedbacks=feedbacks,
                        scores=[s.score for s in scores],
                        strategy=strategy
                    )
                else:
                    feedback_summary = feedbacks[0]

            aggregated_metrics[category] = EvaluationScore(
                score=avg_score,
                feedback=feedback_summary
            )

        overall_score = None
        if aggregated_metrics:
            valid_scores = [m.score for m in aggregated_metrics.values() if m.score is not None]
            if valid_scores:
                overall_score = sum(valid_scores) / len(valid_scores)

        return AgentAggregatedEvaluationResult(
            agent_id=agent_id,
            agent_role=agent_role,
            metrics=aggregated_metrics,
            overall_score=overall_score,
            task_count=len(results),
            aggregation_strategy=strategy
        )

    def _summarize_feedbacks(
        self,
        agent_role: str,
        metric: str,
        feedbacks: List[str],
        scores: List[float | None],
        strategy: AggregationStrategy
    ) -> str:
        if len(feedbacks) <= 2 and all(len(fb) < 200 for fb in feedbacks):
            return "\n\n".join([f"Feedback {i+1}: {fb}" for i, fb in enumerate(feedbacks)])

        try:
            llm = create_llm()

            formatted_feedbacks = []
            for i, (feedback, score) in enumerate(zip(feedbacks, scores)):
                if len(feedback) > 500:
                    feedback = feedback[:500] + "..."
                score_text = f"{score:.1f}" if score is not None else "N/A"
                formatted_feedbacks.append(f"Feedback #{i+1} (Score: {score_text}):\n{feedback}")

            all_feedbacks = "\n\n" + "\n\n---\n\n".join(formatted_feedbacks)

            strategy_guidance = ""
            if strategy == AggregationStrategy.BEST_PERFORMANCE:
                strategy_guidance = "Focus on the highest-scoring aspects and strengths demonstrated."
            elif strategy == AggregationStrategy.WORST_PERFORMANCE:
                strategy_guidance = "Focus on areas that need improvement and common issues across tasks."
            else:
                strategy_guidance = "Provide a balanced analysis of strengths and weaknesses across all tasks."

            prompt = [
                {"role": "system", "content": f"""You are an expert evaluator creating a comprehensive summary of agent performance feedback.
Your job is to synthesize multiple feedback points about the same metric across different tasks.

Create a concise, insightful summary that captures the key patterns and themes from all feedback.
{strategy_guidance}

Your summary should be:
1. Specific and concrete (not vague or general)
2. Focused on actionable insights
3. Highlighting patterns across tasks
4. 150-250 words in length

The summary should be directly usable as final feedback for the agent's performance on this metric."""},
                {"role": "user", "content": f"""I need a synthesized summary of the following feedback for:

Agent Role: {agent_role}
Metric: {metric.title()}

{all_feedbacks}
"""}
            ]
            assert llm is not None
            response = llm.call(prompt)

            return response

        except Exception:
            return "Synthesized from multiple tasks: " + "\n\n".join([f"- {fb[:500]}..." for fb in feedbacks])

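The display code above repeats the same score-to-color thresholds in four places. A single helper expressing the mapping it encodes (>= 8 green, >= 6 cyan, >= 4 yellow, otherwise red), offered only as a sketch of how that duplication could be consolidated:

```python
def score_color(score: float) -> str:
    """Map a 0-10 evaluation score to the rich color used in the tables above."""
    if score >= 8.0:
        return "green"
    if score >= 6.0:
        return "cyan"
    if score >= 4.0:
        return "yellow"
    return "red"


assert score_color(9.2) == "green" and score_color(3.9) == "red"
```
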
@@ -1,234 +0,0 @@
from datetime import datetime
from typing import Any, Dict, Optional

from collections.abc import Sequence

from crewai.agent import Agent
from crewai.task import Task
from crewai.utilities.events.base_event_listener import BaseEventListener
from crewai.utilities.events.crewai_event_bus import CrewAIEventsBus
from crewai.utilities.events.agent_events import (
    AgentExecutionStartedEvent,
    AgentExecutionCompletedEvent,
    LiteAgentExecutionStartedEvent,
    LiteAgentExecutionCompletedEvent
)
from crewai.utilities.events.tool_usage_events import (
    ToolUsageFinishedEvent,
    ToolUsageErrorEvent,
    ToolExecutionErrorEvent,
    ToolSelectionErrorEvent,
    ToolValidateInputErrorEvent
)
from crewai.utilities.events.llm_events import (
    LLMCallStartedEvent,
    LLMCallCompletedEvent
)

class EvaluationTraceCallback(BaseEventListener):
    """Event listener for collecting execution traces for evaluation.

    This listener attaches to the event bus to collect detailed information
    about the execution process, including agent steps, tool uses, knowledge
    retrievals, and final output - all for use in agent evaluation.
    """

    _instance = None

    def __new__(cls):
        if cls._instance is None:
            cls._instance = super().__new__(cls)
            cls._instance._initialized = False
        return cls._instance

    def __init__(self):
        if not hasattr(self, "_initialized") or not self._initialized:
            super().__init__()
            self.traces = {}
            self.current_agent_id = None
            self.current_task_id = None
            self._initialized = True

    def setup_listeners(self, event_bus: CrewAIEventsBus):
        @event_bus.on(AgentExecutionStartedEvent)
        def on_agent_started(source, event: AgentExecutionStartedEvent):
            self.on_agent_start(event.agent, event.task)

        @event_bus.on(LiteAgentExecutionStartedEvent)
        def on_lite_agent_started(source, event: LiteAgentExecutionStartedEvent):
            self.on_lite_agent_start(event.agent_info)

        @event_bus.on(AgentExecutionCompletedEvent)
        def on_agent_completed(source, event: AgentExecutionCompletedEvent):
            self.on_agent_finish(event.agent, event.task, event.output)

        @event_bus.on(LiteAgentExecutionCompletedEvent)
        def on_lite_agent_completed(source, event: LiteAgentExecutionCompletedEvent):
            self.on_lite_agent_finish(event.output)

        @event_bus.on(ToolUsageFinishedEvent)
        def on_tool_completed(source, event: ToolUsageFinishedEvent):
            self.on_tool_use(event.tool_name, event.tool_args, event.output, success=True)

        @event_bus.on(ToolUsageErrorEvent)
        def on_tool_usage_error(source, event: ToolUsageErrorEvent):
            self.on_tool_use(event.tool_name, event.tool_args, event.error,
                             success=False, error_type="usage_error")

        @event_bus.on(ToolExecutionErrorEvent)
        def on_tool_execution_error(source, event: ToolExecutionErrorEvent):
            self.on_tool_use(event.tool_name, event.tool_args, event.error,
                             success=False, error_type="execution_error")

        @event_bus.on(ToolSelectionErrorEvent)
        def on_tool_selection_error(source, event: ToolSelectionErrorEvent):
            self.on_tool_use(event.tool_name, event.tool_args, event.error,
                             success=False, error_type="selection_error")

        @event_bus.on(ToolValidateInputErrorEvent)
        def on_tool_validate_input_error(source, event: ToolValidateInputErrorEvent):
            self.on_tool_use(event.tool_name, event.tool_args, event.error,
                             success=False, error_type="validation_error")

        @event_bus.on(LLMCallStartedEvent)
        def on_llm_call_started(source, event: LLMCallStartedEvent):
            self.on_llm_call_start(event.messages, event.tools)

        @event_bus.on(LLMCallCompletedEvent)
        def on_llm_call_completed(source, event: LLMCallCompletedEvent):
            self.on_llm_call_end(event.messages, event.response)

    def on_lite_agent_start(self, agent_info: dict[str, Any]):
        self.current_agent_id = agent_info['id']
        self.current_task_id = "lite_task"

        trace_key = f"{self.current_agent_id}_{self.current_task_id}"
        self._init_trace(
            trace_key=trace_key,
            agent_id=self.current_agent_id,
            task_id=self.current_task_id,
            tool_uses=[],
            llm_calls=[],
            start_time=datetime.now(),
            final_output=None
        )

    def _init_trace(self, trace_key: str, **kwargs: Any):
        self.traces[trace_key] = kwargs

    def on_agent_start(self, agent: Agent, task: Task):
        self.current_agent_id = agent.id
        self.current_task_id = task.id

        trace_key = f"{agent.id}_{task.id}"
        self._init_trace(
            trace_key=trace_key,
            agent_id=agent.id,
            task_id=task.id,
            tool_uses=[],
            llm_calls=[],
            start_time=datetime.now(),
            final_output=None
        )

    def on_agent_finish(self, agent: Agent, task: Task, output: Any):
        trace_key = f"{agent.id}_{task.id}"
        if trace_key in self.traces:
            self.traces[trace_key]["final_output"] = output
            self.traces[trace_key]["end_time"] = datetime.now()

        self._reset_current()

    def _reset_current(self):
        self.current_agent_id = None
        self.current_task_id = None

    def on_lite_agent_finish(self, output: Any):
        trace_key = f"{self.current_agent_id}_lite_task"
        if trace_key in self.traces:
            self.traces[trace_key]["final_output"] = output
            self.traces[trace_key]["end_time"] = datetime.now()

        self._reset_current()

    def on_tool_use(self, tool_name: str, tool_args: dict[str, Any] | str, result: Any,
                    success: bool = True, error_type: str | None = None):
        if not self.current_agent_id or not self.current_task_id:
            return

        trace_key = f"{self.current_agent_id}_{self.current_task_id}"
        if trace_key in self.traces:
            tool_use = {
                "tool": tool_name,
                "args": tool_args,
                "result": result,
                "success": success,
                "timestamp": datetime.now()
            }

            # Add error information if applicable
            if not success and error_type:
                tool_use["error"] = True
                tool_use["error_type"] = error_type

            self.traces[trace_key]["tool_uses"].append(tool_use)

    def on_llm_call_start(self, messages: str | Sequence[dict[str, Any]] | None, tools: Sequence[dict[str, Any]] | None = None):
        if not self.current_agent_id or not self.current_task_id:
            return

        trace_key = f"{self.current_agent_id}_{self.current_task_id}"
        if trace_key not in self.traces:
            return

        self.current_llm_call = {
            "messages": messages,
            "tools": tools,
            "start_time": datetime.now(),
            "response": None,
            "end_time": None
        }

    def on_llm_call_end(self, messages: str | list[dict[str, Any]] | None, response: Any):
        if not self.current_agent_id or not self.current_task_id:
            return

        trace_key = f"{self.current_agent_id}_{self.current_task_id}"
        if trace_key not in self.traces:
            return

        total_tokens = 0
        if hasattr(response, "usage") and hasattr(response.usage, "total_tokens"):
            total_tokens = response.usage.total_tokens

        current_time = datetime.now()
        start_time = None
        if hasattr(self, "current_llm_call") and self.current_llm_call:
            start_time = self.current_llm_call.get("start_time")

        if not start_time:
            start_time = current_time
        llm_call = {
            "messages": messages,
            "response": response,
            "start_time": start_time,
            "end_time": current_time,
            "total_tokens": total_tokens
        }

        self.traces[trace_key]["llm_calls"].append(llm_call)

        if hasattr(self, "current_llm_call"):
            self.current_llm_call = {}

    def get_trace(self, agent_id: str, task_id: str) -> Optional[Dict[str, Any]]:
        trace_key = f"{agent_id}_{task_id}"
        return self.traces.get(trace_key)


def create_evaluation_callbacks() -> EvaluationTraceCallback:
    from crewai.utilities.events.crewai_event_bus import crewai_event_bus

    callback = EvaluationTraceCallback()
    callback.setup_listeners(crewai_event_bus)
    return callback
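A minimal usage sketch for the listener above, assuming a crew has already been configured elsewhere; `crew`, `my_agent`, and `my_task` are placeholder objects, not part of this module:

# Register the singleton listener on the global event bus, run the crew,
# then pull the per-(agent, task) trace that the events populated.
callbacks = create_evaluation_callbacks()
crew.kickoff()  # placeholder crew; events fill callbacks.traces as they fire
trace = callbacks.get_trace(agent_id=my_agent.id, task_id=my_task.id)
if trace is not None:
    print(len(trace["tool_uses"]), "tool uses,", len(trace["llm_calls"]), "LLM calls")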
@@ -1,8 +0,0 @@
from crewai.experimental.evaluation.experiment.runner import ExperimentRunner
from crewai.experimental.evaluation.experiment.result import ExperimentResults, ExperimentResult

__all__ = [
    "ExperimentRunner",
    "ExperimentResults",
    "ExperimentResult"
]
@@ -1,122 +0,0 @@
import json
import os
from datetime import datetime, timezone
from typing import Any
from pydantic import BaseModel

class ExperimentResult(BaseModel):
    identifier: str
    inputs: dict[str, Any]
    score: int | dict[str, int | float]
    expected_score: int | dict[str, int | float]
    passed: bool
    agent_evaluations: dict[str, Any] | None = None

class ExperimentResults:
    def __init__(self, results: list[ExperimentResult], metadata: dict[str, Any] | None = None):
        self.results = results
        self.metadata = metadata or {}
        self.timestamp = datetime.now(timezone.utc)

        from crewai.experimental.evaluation.experiment.result_display import ExperimentResultsDisplay
        self.display = ExperimentResultsDisplay()

    def to_json(self, filepath: str | None = None) -> dict[str, Any]:
        data = {
            "timestamp": self.timestamp.isoformat(),
            "metadata": self.metadata,
            "results": [r.model_dump(exclude={"agent_evaluations"}) for r in self.results]
        }

        if filepath:
            with open(filepath, 'w') as f:
                json.dump(data, f, indent=2)
            self.display.console.print(f"[green]Results saved to {filepath}[/green]")

        return data

    def compare_with_baseline(self, baseline_filepath: str, save_current: bool = True, print_summary: bool = False) -> dict[str, Any]:
        baseline_runs = []

        if os.path.exists(baseline_filepath) and os.path.getsize(baseline_filepath) > 0:
            try:
                with open(baseline_filepath, 'r') as f:
                    baseline_data = json.load(f)

                if isinstance(baseline_data, dict) and "timestamp" in baseline_data:
                    baseline_runs = [baseline_data]
                elif isinstance(baseline_data, list):
                    baseline_runs = baseline_data
            except (json.JSONDecodeError, FileNotFoundError) as e:
                self.display.console.print(f"[yellow]Warning: Could not load baseline file: {str(e)}[/yellow]")

        if not baseline_runs:
            if save_current:
                current_data = self.to_json()
                with open(baseline_filepath, 'w') as f:
                    json.dump([current_data], f, indent=2)
                self.display.console.print(f"[green]Saved current results as new baseline to {baseline_filepath}[/green]")
            return {"is_baseline": True, "changes": {}}

        baseline_runs.sort(key=lambda x: x.get("timestamp", ""), reverse=True)
        latest_run = baseline_runs[0]

        comparison = self._compare_with_run(latest_run)

        if print_summary:
            self.display.comparison_summary(comparison, latest_run["timestamp"])

        if save_current:
            current_data = self.to_json()
            baseline_runs.append(current_data)
            with open(baseline_filepath, 'w') as f:
                json.dump(baseline_runs, f, indent=2)
            self.display.console.print(f"[green]Added current results to baseline file {baseline_filepath}[/green]")

        return comparison

    def _compare_with_run(self, baseline_run: dict[str, Any]) -> dict[str, Any]:
        baseline_results = baseline_run.get("results", [])

        baseline_lookup = {}
        for result in baseline_results:
            test_identifier = result.get("identifier")
            if test_identifier:
                baseline_lookup[test_identifier] = result

        improved = []
        regressed = []
        unchanged = []
        new_tests = []

        for result in self.results:
            test_identifier = result.identifier
            if not test_identifier or test_identifier not in baseline_lookup:
                new_tests.append(test_identifier)
                continue

            baseline_result = baseline_lookup[test_identifier]
            baseline_passed = baseline_result.get("passed", False)
            if result.passed and not baseline_passed:
                improved.append(test_identifier)
            elif not result.passed and baseline_passed:
                regressed.append(test_identifier)
            else:
                unchanged.append(test_identifier)

        missing_tests = []
        current_test_identifiers = {result.identifier for result in self.results}
        for result in baseline_results:
            test_identifier = result.get("identifier")
            if test_identifier and test_identifier not in current_test_identifiers:
                missing_tests.append(test_identifier)

        return {
            "improved": improved,
            "regressed": regressed,
            "unchanged": unchanged,
            "new_tests": new_tests,
            "missing_tests": missing_tests,
            "total_compared": len(improved) + len(regressed) + len(unchanged),
            "baseline_timestamp": baseline_run.get("timestamp", "unknown")
        }
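A hedged sketch of the baseline workflow above; the file name is an arbitrary placeholder:

# The first call writes the run as a new baseline; later calls diff against
# the most recent saved run and append the current one to the same file.
results = ExperimentResults([
    ExperimentResult(identifier="case-1", inputs={"topic": "ai"},
                     score=8, expected_score=7, passed=True),
])
comparison = results.compare_with_baseline("experiment_baseline.json", print_summary=True)
print(comparison.get("regressed", []))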
@@ -1,70 +0,0 @@
from typing import Dict, Any
from rich.console import Console
from rich.table import Table
from rich.panel import Panel
from crewai.experimental.evaluation.experiment.result import ExperimentResults

class ExperimentResultsDisplay:
    def __init__(self):
        self.console = Console()

    def summary(self, experiment_results: ExperimentResults):
        total = len(experiment_results.results)
        passed = sum(1 for r in experiment_results.results if r.passed)

        table = Table(title="Experiment Summary")
        table.add_column("Metric", style="cyan")
        table.add_column("Value", style="green")

        table.add_row("Total Test Cases", str(total))
        table.add_row("Passed", str(passed))
        table.add_row("Failed", str(total - passed))
        table.add_row("Success Rate", f"{(passed / total * 100):.1f}%" if total > 0 else "N/A")

        self.console.print(table)

    def comparison_summary(self, comparison: Dict[str, Any], baseline_timestamp: str):
        self.console.print(Panel(f"[bold]Comparison with baseline run from {baseline_timestamp}[/bold]",
                                 expand=False))

        table = Table(title="Results Comparison")
        table.add_column("Metric", style="cyan")
        table.add_column("Count", style="white")
        table.add_column("Details", style="dim")

        improved = comparison.get("improved", [])
        if improved:
            details = ", ".join([f"{test_identifier}" for test_identifier in improved[:3]])
            if len(improved) > 3:
                details += f" and {len(improved) - 3} more"
            table.add_row("✅ Improved", str(len(improved)), details)
        else:
            table.add_row("✅ Improved", "0", "")

        regressed = comparison.get("regressed", [])
        if regressed:
            details = ", ".join([f"{test_identifier}" for test_identifier in regressed[:3]])
            if len(regressed) > 3:
                details += f" and {len(regressed) - 3} more"
            table.add_row("❌ Regressed", str(len(regressed)), details, style="red")
        else:
            table.add_row("❌ Regressed", "0", "")

        unchanged = comparison.get("unchanged", [])
        table.add_row("⏺ Unchanged", str(len(unchanged)), "")

        new_tests = comparison.get("new_tests", [])
        if new_tests:
            details = ", ".join(new_tests[:3])
            if len(new_tests) > 3:
                details += f" and {len(new_tests) - 3} more"
            table.add_row("➕ New Tests", str(len(new_tests)), details)

        missing_tests = comparison.get("missing_tests", [])
        if missing_tests:
            details = ", ".join(missing_tests[:3])
            if len(missing_tests) > 3:
                details += f" and {len(missing_tests) - 3} more"
            table.add_row("➖ Missing Tests", str(len(missing_tests)), details)

        self.console.print(table)
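The comparison table above can be exercised standalone; this sketch hand-builds a dict with the same keys that ExperimentResults._compare_with_run produces, with an invented timestamp:

display = ExperimentResultsDisplay()
display.comparison_summary(
    {"improved": ["case-1"], "regressed": [], "unchanged": ["case-2"],
     "new_tests": ["case-3"], "missing_tests": []},
    baseline_timestamp="2025-01-01T00:00:00+00:00",  # placeholder
)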
@@ -1,125 +0,0 @@
from collections import defaultdict
from hashlib import md5
from typing import Any

from crewai import Crew, Agent
from crewai.experimental.evaluation import AgentEvaluator, create_default_evaluator
from crewai.experimental.evaluation.experiment.result_display import ExperimentResultsDisplay
from crewai.experimental.evaluation.experiment.result import ExperimentResults, ExperimentResult
from crewai.experimental.evaluation.evaluation_display import AgentAggregatedEvaluationResult

class ExperimentRunner:
    def __init__(self, dataset: list[dict[str, Any]]):
        self.dataset = dataset or []
        self.evaluator: AgentEvaluator | None = None
        self.display = ExperimentResultsDisplay()

    def run(self, crew: Crew | None = None, agents: list[Agent] | None = None, print_summary: bool = False) -> ExperimentResults:
        if crew and not agents:
            agents = crew.agents

        assert agents is not None
        self.evaluator = create_default_evaluator(agents=agents)

        results = []

        for test_case in self.dataset:
            self.evaluator.reset_iterations_results()
            result = self._run_test_case(test_case=test_case, crew=crew, agents=agents)
            results.append(result)

        experiment_results = ExperimentResults(results)

        if print_summary:
            self.display.summary(experiment_results)

        return experiment_results

    def _run_test_case(self, test_case: dict[str, Any], agents: list[Agent], crew: Crew | None = None) -> ExperimentResult:
        inputs = test_case["inputs"]
        expected_score = test_case["expected_score"]
        identifier = test_case.get("identifier") or md5(str(test_case).encode(), usedforsecurity=False).hexdigest()

        try:
            self.display.console.print(f"[dim]Running crew with input: {str(inputs)[:50]}...[/dim]")
            self.display.console.print("\n")
            if crew:
                crew.kickoff(inputs=inputs)
            else:
                for agent in agents:
                    agent.kickoff(**inputs)

            assert self.evaluator is not None
            agent_evaluations = self.evaluator.get_agent_evaluation()

            actual_score = self._extract_scores(agent_evaluations)

            passed = self._assert_scores(expected_score, actual_score)
            return ExperimentResult(
                identifier=identifier,
                inputs=inputs,
                score=actual_score,
                expected_score=expected_score,
                passed=passed,
                agent_evaluations=agent_evaluations
            )

        except Exception as e:
            self.display.console.print(f"[red]Error running test case: {str(e)}[/red]")
            return ExperimentResult(
                identifier=identifier,
                inputs=inputs,
                score=0,
                expected_score=expected_score,
                passed=False
            )

    def _extract_scores(self, agent_evaluations: dict[str, AgentAggregatedEvaluationResult]) -> float | dict[str, float]:
        all_scores: dict[str, list[float]] = defaultdict(list)
        for evaluation in agent_evaluations.values():
            for metric_name, score in evaluation.metrics.items():
                if score.score is not None:
                    all_scores[metric_name.value].append(score.score)

        avg_scores = {m: sum(s)/len(s) for m, s in all_scores.items()}

        if len(avg_scores) == 1:
            return list(avg_scores.values())[0]

        return avg_scores

    def _assert_scores(self, expected: float | dict[str, float],
                       actual: float | dict[str, float]) -> bool:
        """
        Compare expected and actual scores, and return whether the test case passed.

        The rules for comparison are as follows:
        - If both expected and actual scores are single numbers, the actual score must be >= expected.
        - If expected is a single number and actual is a dict, compare against the average of actual values.
        - If expected is a dict and actual is a single number, actual must be >= all expected values.
        - If both are dicts, actual must have matching keys with values >= expected values.
        """

        if isinstance(expected, (int, float)) and isinstance(actual, (int, float)):
            return actual >= expected

        if isinstance(expected, dict) and isinstance(actual, (int, float)):
            return all(actual >= exp_score for exp_score in expected.values())

        if isinstance(expected, (int, float)) and isinstance(actual, dict):
            if not actual:
                return False
            avg_score = sum(actual.values()) / len(actual)
            return avg_score >= expected

        if isinstance(expected, dict) and isinstance(actual, dict):
            if not expected:
                return True
            matching_keys = set(expected.keys()) & set(actual.keys())
            if not matching_keys:
                return False

            # All matching keys must have actual >= expected
            return all(actual[key] >= expected[key] for key in matching_keys)

        return False
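A sketch of a dataset in the shape _run_test_case reads, assuming `my_crew` is a configured Crew (a placeholder here). Per the _assert_scores rules above, the first case passes only if both named metrics meet their thresholds; the second compares a single number, or the average if several metrics come back:

runner = ExperimentRunner(dataset=[
    {"identifier": "research-depth", "inputs": {"topic": "llm evals"},
     "expected_score": {"goal_alignment": 7, "semantic_quality": 6}},
    {"inputs": {"topic": "agents"}, "expected_score": 7},  # identifier falls back to an md5 of the case
])
experiment = runner.run(crew=my_crew, print_summary=True)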
@@ -1,30 +0,0 @@
"""Robust JSON parsing utilities for evaluation responses."""

import json
import re
from typing import Any


def extract_json_from_llm_response(text: str) -> dict[str, Any]:
    try:
        return json.loads(text)
    except json.JSONDecodeError:
        pass

    json_patterns = [
        # Standard markdown code blocks with json
        r'```json\s*([\s\S]*?)\s*```',
        # Code blocks without language specifier
        r'```\s*([\s\S]*?)\s*```',
        # Inline code with JSON
        r'`([{\[].*[}\]])`',
    ]

    for pattern in json_patterns:
        matches = re.findall(pattern, text, re.IGNORECASE | re.DOTALL)
        for match in matches:
            try:
                return json.loads(match.strip())
            except json.JSONDecodeError:
                continue
    raise ValueError("No valid JSON found in the response")
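The fallback chain above in action on a typical fenced LLM reply:

reply = 'Here you go:\n```json\n{"score": 8, "feedback": "solid"}\n```'
data = extract_json_from_llm_response(reply)  # direct json.loads fails, the ```json pattern matches
assert data["score"] == 8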
@@ -1,26 +0,0 @@
from crewai.experimental.evaluation.metrics.reasoning_metrics import (
    ReasoningEfficiencyEvaluator
)

from crewai.experimental.evaluation.metrics.tools_metrics import (
    ToolSelectionEvaluator,
    ParameterExtractionEvaluator,
    ToolInvocationEvaluator
)

from crewai.experimental.evaluation.metrics.goal_metrics import (
    GoalAlignmentEvaluator
)

from crewai.experimental.evaluation.metrics.semantic_quality_metrics import (
    SemanticQualityEvaluator
)

__all__ = [
    "ReasoningEfficiencyEvaluator",
    "ToolSelectionEvaluator",
    "ParameterExtractionEvaluator",
    "ToolInvocationEvaluator",
    "GoalAlignmentEvaluator",
    "SemanticQualityEvaluator"
]
@@ -1,69 +0,0 @@
from typing import Any, Dict

from crewai.agent import Agent
from crewai.task import Task

from crewai.experimental.evaluation.base_evaluator import BaseEvaluator, EvaluationScore, MetricCategory
from crewai.experimental.evaluation.json_parser import extract_json_from_llm_response

class GoalAlignmentEvaluator(BaseEvaluator):
    @property
    def metric_category(self) -> MetricCategory:
        return MetricCategory.GOAL_ALIGNMENT

    def evaluate(
        self,
        agent: Agent,
        execution_trace: Dict[str, Any],
        final_output: Any,
        task: Task | None = None,
    ) -> EvaluationScore:
        task_context = ""
        if task is not None:
            task_context = f"Task description: {task.description}\nExpected output: {task.expected_output}\n"

        prompt = [
            {"role": "system", "content": """You are an expert evaluator assessing how well an AI agent's output aligns with its assigned task goal.

Score the agent's goal alignment on a scale from 0-10 where:
- 0: Complete misalignment, agent did not understand or attempt the task goal
- 5: Partial alignment, agent attempted the task but missed key requirements
- 10: Perfect alignment, agent fully satisfied all task requirements

Consider:
1. Did the agent correctly interpret the task goal?
2. Did the final output directly address the requirements?
3. Did the agent focus on relevant aspects of the task?
4. Did the agent provide all requested information or deliverables?

Return your evaluation as JSON with fields 'score' (number) and 'feedback' (string).
"""},
            {"role": "user", "content": f"""
Agent role: {agent.role}
Agent goal: {agent.goal}
{task_context}

Agent's final output:
{final_output}

Evaluate how well the agent's output aligns with the assigned task goal.
"""}
        ]
        assert self.llm is not None
        response = self.llm.call(prompt)

        try:
            evaluation_data: dict[str, Any] = extract_json_from_llm_response(response)
            assert evaluation_data is not None

            return EvaluationScore(
                score=evaluation_data.get("score", 0),
                feedback=evaluation_data.get("feedback", response),
                raw_response=response
            )
        except Exception:
            return EvaluationScore(
                score=None,
                feedback=f"Failed to parse evaluation. Raw response: {response}",
                raw_response=response
            )
@@ -1,361 +0,0 @@
"""Agent reasoning efficiency evaluators.

This module provides evaluator implementations for:
- Reasoning efficiency
- Loop detection
- Thinking-to-action ratio
"""

import logging
import re
from enum import Enum
from typing import Any, Dict, List, Tuple
import numpy as np
from collections.abc import Sequence

from crewai.agent import Agent
from crewai.task import Task

from crewai.experimental.evaluation.base_evaluator import BaseEvaluator, EvaluationScore, MetricCategory
from crewai.experimental.evaluation.json_parser import extract_json_from_llm_response
from crewai.tasks.task_output import TaskOutput

class ReasoningPatternType(Enum):
    EFFICIENT = "efficient"  # Good reasoning flow
    LOOP = "loop"  # Agent is stuck in a loop
    VERBOSE = "verbose"  # Agent is unnecessarily verbose
    INDECISIVE = "indecisive"  # Agent struggles to make decisions
    SCATTERED = "scattered"  # Agent jumps between topics without focus


class ReasoningEfficiencyEvaluator(BaseEvaluator):
    @property
    def metric_category(self) -> MetricCategory:
        return MetricCategory.REASONING_EFFICIENCY

    def evaluate(
        self,
        agent: Agent,
        execution_trace: Dict[str, Any],
        final_output: TaskOutput | str,
        task: Task | None = None,
    ) -> EvaluationScore:
        task_context = ""
        if task is not None:
            task_context = f"Task description: {task.description}\nExpected output: {task.expected_output}\n"

        llm_calls = execution_trace.get("llm_calls", [])

        if not llm_calls or len(llm_calls) < 2:
            return EvaluationScore(
                score=None,
                feedback="Insufficient LLM calls to evaluate reasoning efficiency."
            )

        total_calls = len(llm_calls)
        total_tokens = sum(call.get("total_tokens", 0) for call in llm_calls)
        avg_tokens_per_call = total_tokens / total_calls if total_calls > 0 else 0
        time_intervals = []
        has_reliable_timing = True
        for i in range(1, len(llm_calls)):
            start_time = llm_calls[i-1].get("end_time")
            end_time = llm_calls[i].get("start_time")
            if start_time and end_time and start_time != end_time:
                try:
                    interval = end_time - start_time
                    time_intervals.append(interval.total_seconds() if hasattr(interval, 'total_seconds') else 0)
                except Exception:
                    has_reliable_timing = False
            else:
                has_reliable_timing = False

        loop_detected, loop_details = self._detect_loops(llm_calls)
        pattern_analysis = self._analyze_reasoning_patterns(llm_calls)

        efficiency_metrics = {
            "total_llm_calls": total_calls,
            "total_tokens": total_tokens,
            "avg_tokens_per_call": avg_tokens_per_call,
            "reasoning_pattern": pattern_analysis["primary_pattern"].value,
            "loops_detected": loop_detected,
        }

        if has_reliable_timing and time_intervals:
            efficiency_metrics["avg_time_between_calls"] = np.mean(time_intervals)

        loop_info = f"Detected {len(loop_details)} potential reasoning loops." if loop_detected else "No significant reasoning loops detected."

        call_samples = self._get_call_samples(llm_calls)

        final_output = final_output.raw if isinstance(final_output, TaskOutput) else final_output

        prompt = [
            {"role": "system", "content": """You are an expert evaluator assessing the reasoning efficiency of an AI agent's thought process.

Evaluate the agent's reasoning efficiency across these five key subcategories:

1. Focus (0-10): How well the agent stays on topic and avoids unnecessary tangents
2. Progression (0-10): How effectively the agent builds on previous thoughts rather than repeating or circling
3. Decision Quality (0-10): How decisively and appropriately the agent makes decisions
4. Conciseness (0-10): How efficiently the agent communicates without unnecessary verbosity
5. Loop Avoidance (0-10): How well the agent avoids getting stuck in repetitive thinking patterns

For each subcategory, provide a score from 0-10 where:
- 0: Completely inefficient
- 5: Moderately efficient
- 10: Highly efficient

The overall score should be a weighted average of these subcategories.

Return your evaluation as JSON with the following structure:
{
    "overall_score": float,
    "scores": {
        "focus": float,
        "progression": float,
        "decision_quality": float,
        "conciseness": float,
        "loop_avoidance": float
    },
    "feedback": string (general feedback about overall reasoning efficiency),
    "optimization_suggestions": string (concrete suggestions for improving reasoning efficiency),
    "detected_patterns": string (describe any inefficient reasoning patterns you observe)
}"""},
            {"role": "user", "content": f"""
Agent role: {agent.role}
{task_context}

Reasoning efficiency metrics:
- Total LLM calls: {efficiency_metrics["total_llm_calls"]}
- Average tokens per call: {efficiency_metrics["avg_tokens_per_call"]:.1f}
- Primary reasoning pattern: {efficiency_metrics["reasoning_pattern"]}
- {loop_info}
{"- Average time between calls: {:.2f} seconds".format(efficiency_metrics.get("avg_time_between_calls", 0)) if "avg_time_between_calls" in efficiency_metrics else ""}

Sample of agent reasoning flow (chronological sequence):
{call_samples}

Agent's final output:
{final_output[:500]}... (truncated)

Evaluate the reasoning efficiency of this agent based on these interaction patterns.
Identify any inefficient reasoning patterns and provide specific suggestions for optimization.
"""}
        ]

        assert self.llm is not None
        response = self.llm.call(prompt)

        try:
            evaluation_data = extract_json_from_llm_response(response)

            scores = evaluation_data.get("scores", {})
            focus = scores.get("focus", 5.0)
            progression = scores.get("progression", 5.0)
            decision_quality = scores.get("decision_quality", 5.0)
            conciseness = scores.get("conciseness", 5.0)
            loop_avoidance = scores.get("loop_avoidance", 5.0)

            overall_score = evaluation_data.get("overall_score", evaluation_data.get("score", 5.0))
            feedback = evaluation_data.get("feedback", "No detailed feedback provided.")
            optimization_suggestions = evaluation_data.get("optimization_suggestions", "No specific suggestions provided.")

            detailed_feedback = "Reasoning Efficiency Evaluation:\n"
            detailed_feedback += f"• Focus: {focus}/10 - Staying on topic without tangents\n"
            detailed_feedback += f"• Progression: {progression}/10 - Building on previous thinking\n"
            detailed_feedback += f"• Decision Quality: {decision_quality}/10 - Making appropriate decisions\n"
            detailed_feedback += f"• Conciseness: {conciseness}/10 - Communicating efficiently\n"
            detailed_feedback += f"• Loop Avoidance: {loop_avoidance}/10 - Avoiding repetitive patterns\n\n"

            detailed_feedback += f"Feedback:\n{feedback}\n\n"
            detailed_feedback += f"Optimization Suggestions:\n{optimization_suggestions}"

            return EvaluationScore(
                score=float(overall_score),
                feedback=detailed_feedback,
                raw_response=response
            )
        except Exception as e:
            logging.warning(f"Failed to parse reasoning efficiency evaluation: {e}")
            return EvaluationScore(
                score=None,
                feedback=f"Failed to parse reasoning efficiency evaluation. Raw response: {response[:200]}...",
                raw_response=response
            )

    def _detect_loops(self, llm_calls: List[Dict]) -> Tuple[bool, List[Dict]]:
        loop_details = []

        messages = []
        for call in llm_calls:
            content = call.get("response", "")
            if isinstance(content, str):
                messages.append(content)
            elif isinstance(content, list) and len(content) > 0:
                # Handle message list format
                for msg in content:
                    if isinstance(msg, dict) and "content" in msg:
                        messages.append(msg["content"])

        # Simple n-gram based similarity detection
        # For a more robust implementation, consider using embedding-based similarity
        for i in range(len(messages) - 2):
            for j in range(i + 1, len(messages) - 1):
                # Check for repeated patterns (simplistic approach)
                # A more sophisticated approach would use semantic similarity
                similarity = self._calculate_text_similarity(messages[i], messages[j])
                if similarity > 0.7:  # Arbitrary threshold
                    loop_details.append({
                        "first_occurrence": i,
                        "second_occurrence": j,
                        "similarity": similarity,
                        "snippet": messages[i][:100] + "..."
                    })

        return len(loop_details) > 0, loop_details

    def _calculate_text_similarity(self, text1: str, text2: str) -> float:
        text1 = re.sub(r'\s+', ' ', text1.lower()).strip()
        text2 = re.sub(r'\s+', ' ', text2.lower()).strip()

        # Simple Jaccard similarity on word sets
        words1 = set(text1.split())
        words2 = set(text2.split())

        intersection = len(words1.intersection(words2))
        union = len(words1.union(words2))

        return intersection / union if union > 0 else 0.0

    def _analyze_reasoning_patterns(self, llm_calls: List[Dict]) -> Dict[str, Any]:
        call_lengths = []
        response_times = []

        for call in llm_calls:
            content = call.get("response", "")
            if isinstance(content, str):
                call_lengths.append(len(content))
            elif isinstance(content, list) and len(content) > 0:
                # Handle message list format
                total_length = 0
                for msg in content:
                    if isinstance(msg, dict) and "content" in msg:
                        total_length += len(msg["content"])
                call_lengths.append(total_length)

            start_time = call.get("start_time")
            end_time = call.get("end_time")
            if start_time and end_time:
                try:
                    response_times.append(end_time - start_time)
                except Exception:
                    pass

        avg_length = np.mean(call_lengths) if call_lengths else 0
        std_length = np.std(call_lengths) if call_lengths else 0
        length_trend = self._calculate_trend(call_lengths)

        primary_pattern = ReasoningPatternType.EFFICIENT
        details = "Agent demonstrates efficient reasoning patterns."

        loop_score = self._calculate_loop_likelihood(call_lengths, response_times)
        if loop_score > 0.7:
            primary_pattern = ReasoningPatternType.LOOP
            details = "Agent appears to be stuck in repetitive thinking patterns."
        elif avg_length > 1000 and std_length / avg_length < 0.3:
            primary_pattern = ReasoningPatternType.VERBOSE
            details = "Agent is consistently verbose across interactions."
        elif len(llm_calls) > 10 and length_trend > 0.5:
            primary_pattern = ReasoningPatternType.INDECISIVE
            details = "Agent shows signs of indecisiveness with increasing message lengths."
        elif std_length / avg_length > 0.8:
            primary_pattern = ReasoningPatternType.SCATTERED
            details = "Agent shows inconsistent reasoning flow with highly variable responses."

        return {
            "primary_pattern": primary_pattern,
            "details": details,
            "metrics": {
                "avg_length": avg_length,
                "std_length": std_length,
                "length_trend": length_trend,
                "loop_score": loop_score
            }
        }

    def _calculate_trend(self, values: Sequence[float | int]) -> float:
        if not values or len(values) < 2:
            return 0.0

        try:
            x = np.arange(len(values))
            y = np.array(values)

            # Simple linear regression
            slope = np.polyfit(x, y, 1)[0]

            # Normalize slope to -1 to 1 range
            max_possible_slope = max(values) - min(values)
            if max_possible_slope > 0:
                normalized_slope = slope / max_possible_slope
                return max(min(normalized_slope, 1.0), -1.0)
            return 0.0
        except Exception:
            return 0.0

    def _calculate_loop_likelihood(self, call_lengths: Sequence[float], response_times: Sequence[float]) -> float:
        if not call_lengths or len(call_lengths) < 3:
            return 0.0

        indicators = []

        if len(call_lengths) >= 4:
            repeated_lengths = 0
            for i in range(len(call_lengths) - 2):
                ratio = call_lengths[i] / call_lengths[i + 2] if call_lengths[i + 2] > 0 else 0
                if 0.85 <= ratio <= 1.15:
                    repeated_lengths += 1

            length_repetition_score = repeated_lengths / (len(call_lengths) - 2)
            indicators.append(length_repetition_score)

        if response_times and len(response_times) >= 3:
            try:
                std_time = np.std(response_times)
                mean_time = np.mean(response_times)
                if mean_time > 0:
                    time_consistency = 1.0 - (std_time / mean_time)
                    indicators.append(max(0, time_consistency - 0.3) * 1.5)
            except Exception:
                pass

        return np.mean(indicators) if indicators else 0.0

    def _get_call_samples(self, llm_calls: List[Dict]) -> str:
        samples = []

        if len(llm_calls) <= 6:
            sample_indices = list(range(len(llm_calls)))
        else:
            sample_indices = [0, 1, len(llm_calls) // 2 - 1, len(llm_calls) // 2,
                              len(llm_calls) - 2, len(llm_calls) - 1]

        for idx in sample_indices:
            call = llm_calls[idx]
            content = call.get("response", "")

            if isinstance(content, str):
                sample = content
            elif isinstance(content, list) and len(content) > 0:
                sample_parts = []
                for msg in content:
                    if isinstance(msg, dict) and "content" in msg:
                        sample_parts.append(msg["content"])
                sample = "\n".join(sample_parts)
            else:
                sample = str(content)

            truncated = sample[:200] + "..." if len(sample) > 200 else sample
            samples.append(f"Call {idx + 1}:\n{truncated}\n")

        return "\n".join(samples)
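A worked example of the word-set Jaccard similarity behind _detect_loops, inlined so no evaluator needs to be constructed: "draft the summary" and "draft the final summary" share 3 of 4 distinct words, so similarity is 0.75, which clears the 0.7 loop threshold:

words1 = set("draft the summary".split())
words2 = set("draft the final summary".split())
print(len(words1 & words2) / len(words1 | words2))  # 0.75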
@@ -1,68 +0,0 @@
from typing import Any, Dict

from crewai.agent import Agent
from crewai.task import Task

from crewai.experimental.evaluation.base_evaluator import BaseEvaluator, EvaluationScore, MetricCategory
from crewai.experimental.evaluation.json_parser import extract_json_from_llm_response

class SemanticQualityEvaluator(BaseEvaluator):
    @property
    def metric_category(self) -> MetricCategory:
        return MetricCategory.SEMANTIC_QUALITY

    def evaluate(
        self,
        agent: Agent,
        execution_trace: Dict[str, Any],
        final_output: Any,
        task: Task | None = None,
    ) -> EvaluationScore:
        task_context = ""
        if task is not None:
            task_context = f"Task description: {task.description}"
        prompt = [
            {"role": "system", "content": """You are an expert evaluator assessing the semantic quality of an AI agent's output.

Score the semantic quality on a scale from 0-10 where:
- 0: Completely incoherent, confusing, or logically flawed output
- 5: Moderately clear and logical output with some issues
- 10: Exceptionally clear, coherent, and logically sound output

Consider:
1. Is the output well-structured and organized?
2. Is the reasoning logical and well-supported?
3. Is the language clear, precise, and appropriate for the task?
4. Are claims supported by evidence when appropriate?
5. Is the output free from contradictions and logical fallacies?

Return your evaluation as JSON with fields 'score' (number) and 'feedback' (string).
"""},
            {"role": "user", "content": f"""
Agent role: {agent.role}
{task_context}

Agent's final output:
{final_output}

Evaluate the semantic quality and reasoning of this output.
"""}
        ]

        assert self.llm is not None
        response = self.llm.call(prompt)

        try:
            evaluation_data: dict[str, Any] = extract_json_from_llm_response(response)
            assert evaluation_data is not None
            return EvaluationScore(
                score=float(evaluation_data["score"]) if evaluation_data.get("score") is not None else None,
                feedback=evaluation_data.get("feedback", response),
                raw_response=response
            )
        except Exception:
            return EvaluationScore(
                score=None,
                feedback=f"Failed to parse evaluation. Raw response: {response}",
                raw_response=response
            )
@@ -1,410 +0,0 @@
|
||||
import json
|
||||
from typing import Dict, Any
|
||||
|
||||
from crewai.experimental.evaluation.base_evaluator import BaseEvaluator, EvaluationScore, MetricCategory
|
||||
from crewai.experimental.evaluation.json_parser import extract_json_from_llm_response
|
||||
from crewai.agent import Agent
|
||||
from crewai.task import Task
|
||||
|
||||
|
||||
class ToolSelectionEvaluator(BaseEvaluator):
|
||||
|
||||
@property
|
||||
def metric_category(self) -> MetricCategory:
|
||||
return MetricCategory.TOOL_SELECTION
|
||||
|
||||
def evaluate(
|
||||
self,
|
||||
agent: Agent,
|
||||
execution_trace: Dict[str, Any],
|
||||
final_output: str,
|
||||
task: Task | None = None,
|
||||
) -> EvaluationScore:
|
||||
task_context = ""
|
||||
if task is not None:
|
||||
task_context = f"Task description: {task.description}"
|
||||
|
||||
tool_uses = execution_trace.get("tool_uses", [])
|
||||
tool_count = len(tool_uses)
|
||||
unique_tool_types = set([tool.get("tool", "Unknown tool") for tool in tool_uses])
|
||||
|
||||
if tool_count == 0:
|
||||
if not agent.tools:
|
||||
return EvaluationScore(
|
||||
score=None,
|
||||
feedback="Agent had no tools available to use."
|
||||
)
|
||||
else:
|
||||
return EvaluationScore(
|
||||
score=None,
|
||||
feedback="Agent had tools available but didn't use any."
|
||||
)
|
||||
|
||||
available_tools_info = ""
|
||||
if agent.tools:
|
||||
for tool in agent.tools:
|
||||
available_tools_info += f"- {tool.name}: {tool.description}\n"
|
||||
else:
|
||||
available_tools_info = "No tools available"
|
||||
|
||||
tool_types_summary = "Tools selected by the agent:\n"
|
||||
for tool_type in sorted(unique_tool_types):
|
||||
tool_types_summary += f"- {tool_type}\n"
|
||||
|
||||
prompt = [
|
||||
{"role": "system", "content": """You are an expert evaluator assessing if an AI agent selected the most appropriate tools for a given task.
|
||||
|
||||
You must evaluate based on these 2 criteria:
|
||||
1. Relevance (0-10): Were the tools chosen directly aligned with the task's goals?
|
||||
2. Coverage (0-10): Did the agent select ALL appropriate tools from the AVAILABLE tools?
|
||||
|
||||
IMPORTANT:
|
||||
- ONLY consider tools that are listed as available to the agent
|
||||
- DO NOT suggest tools that aren't in the 'Available tools' list
|
||||
- DO NOT evaluate the quality or accuracy of tool outputs/results
|
||||
- DO NOT evaluate how many times each tool was used
|
||||
- DO NOT evaluate how the agent used the parameters
|
||||
- DO NOT evaluate whether the agent interpreted the task correctly
|
||||
|
||||
Focus ONLY on whether the correct CATEGORIES of tools were selected from what was available.
|
||||
|
||||
Return your evaluation as JSON with these fields:
|
||||
- scores: {"relevance": number, "coverage": number}
|
||||
- overall_score: number (average of all scores, 0-10)
|
||||
- feedback: string (focused ONLY on tool selection decisions from available tools)
|
||||
- improvement_suggestions: string (ONLY suggest better selection from the AVAILABLE tools list, NOT new tools)
|
||||
"""},
|
||||
{"role": "user", "content": f"""
|
||||
Agent role: {agent.role}
|
||||
{task_context}
|
||||
|
||||
Available tools for this agent:
|
||||
{available_tools_info}
|
||||
|
||||
{tool_types_summary}
|
||||
|
||||
Based ONLY on the task description and comparing the AVAILABLE tools with those that were selected (listed above), evaluate if the agent selected the appropriate tool types for this task.
|
||||
|
||||
IMPORTANT:
|
||||
- ONLY evaluate selection from tools listed as available
|
||||
- DO NOT suggest new tools that aren't in the available tools list
|
||||
- DO NOT evaluate tool usage or results
|
||||
"""}
|
||||
]
|
||||
assert self.llm is not None
|
||||
response = self.llm.call(prompt)
|
||||
|
||||
try:
|
||||
evaluation_data = extract_json_from_llm_response(response)
|
||||
assert evaluation_data is not None
|
||||
|
||||
scores = evaluation_data.get("scores", {})
|
||||
relevance = scores.get("relevance", 5.0)
|
||||
coverage = scores.get("coverage", 5.0)
|
||||
overall_score = float(evaluation_data.get("overall_score", 5.0))
|
||||
|
||||
feedback = "Tool Selection Evaluation:\n"
|
||||
feedback += f"• Relevance: {relevance}/10 - Selection of appropriate tool types for the task\n"
|
||||
feedback += f"• Coverage: {coverage}/10 - Selection of all necessary tool types\n"
|
||||
if "improvement_suggestions" in evaluation_data:
|
||||
feedback += f"Improvement Suggestions:\n{evaluation_data['improvement_suggestions']}"
|
||||
else:
|
||||
feedback += evaluation_data.get("feedback", "No detailed feedback available.")
|
||||
|
||||
return EvaluationScore(
|
||||
score=overall_score,
|
||||
feedback=feedback,
|
||||
raw_response=response
|
||||
)
|
||||
except Exception as e:
|
||||
return EvaluationScore(
|
||||
score=None,
|
||||
feedback=f"Error evaluating tool selection: {e}",
|
||||
raw_response=response
|
||||
)
|
||||
|
||||
|
||||
class ParameterExtractionEvaluator(BaseEvaluator):
|
||||
@property
|
||||
def metric_category(self) -> MetricCategory:
|
||||
return MetricCategory.PARAMETER_EXTRACTION
|
||||
|
||||
def evaluate(
|
||||
self,
|
||||
agent: Agent,
|
||||
execution_trace: Dict[str, Any],
|
||||
final_output: str,
|
||||
task: Task | None = None,
|
||||
) -> EvaluationScore:
|
||||
task_context = ""
|
||||
if task is not None:
|
||||
task_context = f"Task description: {task.description}"
|
||||
tool_uses = execution_trace.get("tool_uses", [])
|
||||
tool_count = len(tool_uses)
|
||||
|
||||
if tool_count == 0:
|
||||
return EvaluationScore(
|
||||
score=None,
|
||||
feedback="No tool usage detected. Cannot evaluate parameter extraction."
|
||||
)
|
||||
|
||||
validation_errors = []
|
||||
for tool_use in tool_uses:
|
||||
if not tool_use.get("success", True) and tool_use.get("error_type") == "validation_error":
|
||||
validation_errors.append({
|
||||
"tool": tool_use.get("tool", "Unknown tool"),
|
||||
"error": tool_use.get("result"),
|
||||
"args": tool_use.get("args", {})
|
||||
})
|
||||
|
||||
validation_error_rate = len(validation_errors) / tool_count if tool_count > 0 else 0
|
||||
|
||||
param_samples = []
|
||||
for i, tool_use in enumerate(tool_uses[:5]):
|
||||
tool_name = tool_use.get("tool", "Unknown tool")
|
||||
tool_args = tool_use.get("args", {})
|
||||
success = tool_use.get("success", True) and not tool_use.get("error", False)
|
||||
error_type = tool_use.get("error_type", "") if not success else ""
|
||||
|
||||
is_validation_error = error_type == "validation_error"
|
||||
|
||||
sample = f"Tool use #{i+1} - {tool_name}:\n"
|
||||
sample += f"- Parameters: {json.dumps(tool_args, indent=2)}\n"
|
||||
sample += f"- Success: {'No' if not success else 'Yes'}"
|
||||
|
||||
if is_validation_error:
|
||||
sample += " (PARAMETER VALIDATION ERROR)\n"
|
||||
sample += f"- Error: {tool_use.get('result', 'Unknown error')}"
|
||||
elif not success:
|
||||
sample += f" (Other error: {error_type})\n"
|
||||
|
||||
param_samples.append(sample)
|
||||
|
||||
validation_errors_info = ""
|
||||
if validation_errors:
|
||||
validation_errors_info = f"\nParameter validation errors detected: {len(validation_errors)} ({validation_error_rate:.1%} of tool uses)\n"
|
||||
for i, err in enumerate(validation_errors[:3]):
|
||||
tool_name = err.get("tool", "Unknown tool")
|
||||
error_msg = err.get("error", "Unknown error")
|
||||
args = err.get("args", {})
|
||||
validation_errors_info += f"\nValidation Error #{i+1}:\n- Tool: {tool_name}\n- Args: {json.dumps(args, indent=2)}\n- Error: {error_msg}"
|
||||
|
||||
if len(validation_errors) > 3:
|
||||
validation_errors_info += f"\n...and {len(validation_errors) - 3} more validation errors."
|
||||
param_samples_text = "\n\n".join(param_samples)
|
||||
prompt = [
|
||||
{"role": "system", "content": """You are an expert evaluator assessing how well an AI agent extracts and formats PARAMETER VALUES for tool calls.
|
||||
|
||||
Your job is to evaluate ONLY whether the agent used the correct parameter VALUES, not whether the right tools were selected or how the tools were invoked.
|
||||
|
||||
Evaluate parameter extraction based on these criteria:
|
||||
1. Accuracy (0-10): Are parameter values correctly identified from the context/task?
|
||||
2. Formatting (0-10): Are values formatted correctly for each tool's requirements?
|
||||
3. Completeness (0-10): Are all required parameter values provided, with no missing information?
|
||||
|
||||
IMPORTANT: DO NOT evaluate:
|
||||
- Whether the right tool was chosen (that's the ToolSelectionEvaluator's job)
|
||||
- How the tools were structurally invoked (that's the ToolInvocationEvaluator's job)
|
||||
- The quality of results from tools
|
||||
|
||||
Focus ONLY on the PARAMETER VALUES - whether they were correctly extracted from the context, properly formatted, and complete.
|
||||
|
||||
Validation errors are important signals that parameter values weren't properly extracted or formatted.
|
||||
|
||||
Return your evaluation as JSON with these fields:
|
||||
- scores: {"accuracy": number, "formatting": number, "completeness": number}
|
||||
- overall_score: number (average of all scores, 0-10)
|
||||
- feedback: string (focused ONLY on parameter value extraction quality)
|
||||
- improvement_suggestions: string (concrete suggestions for better parameter VALUE extraction)
|
||||
"""},
|
||||
{"role": "user", "content": f"""
|
||||
Agent role: {agent.role}
|
||||
{task_context}
|
||||
|
||||
Parameter extraction examples:
|
||||
{param_samples_text}
|
||||
{validation_errors_info}
|
||||
|
||||
Evaluate the quality of the agent's parameter extraction for this task.
|
||||
"""}
|
||||
]
|
||||
|
||||
assert self.llm is not None
|
||||
response = self.llm.call(prompt)
|
||||
|
||||
try:
|
||||
evaluation_data = extract_json_from_llm_response(response)
|
||||
assert evaluation_data is not None
|
||||
|
||||
scores = evaluation_data.get("scores", {})
|
||||
accuracy = scores.get("accuracy", 5.0)
|
||||
formatting = scores.get("formatting", 5.0)
|
||||
completeness = scores.get("completeness", 5.0)
|
||||
|
||||
overall_score = float(evaluation_data.get("overall_score", 5.0))
|
||||
|
||||
feedback = "Parameter Extraction Evaluation:\n"
|
||||
feedback += f"• Accuracy: {accuracy}/10 - Correctly identifying required parameters\n"
|
||||
feedback += f"• Formatting: {formatting}/10 - Properly formatting parameters for tools\n"
|
||||
feedback += f"• Completeness: {completeness}/10 - Including all necessary information\n\n"
|
||||
|
||||
if "improvement_suggestions" in evaluation_data:
|
||||
feedback += f"Improvement Suggestions:\n{evaluation_data['improvement_suggestions']}"
|
||||
else:
|
||||
feedback += evaluation_data.get("feedback", "No detailed feedback available.")
|
||||
|
||||
return EvaluationScore(
|
||||
score=overall_score,
|
||||
feedback=feedback,
|
||||
raw_response=response
|
||||
)
|
||||
except Exception as e:
|
||||
return EvaluationScore(
|
||||
score=None,
|
||||
feedback=f"Error evaluating parameter extraction: {e}",
|
||||
raw_response=response
|
||||
)
|
||||
|
||||
|
||||
class ToolInvocationEvaluator(BaseEvaluator):
|
||||
@property
|
||||
def metric_category(self) -> MetricCategory:
|
||||
return MetricCategory.TOOL_INVOCATION
|
||||
|
||||
def evaluate(
|
||||
self,
|
||||
agent: Agent,
|
||||
execution_trace: Dict[str, Any],
|
||||
final_output: str,
|
||||
task: Task | None = None,
|
||||
) -> EvaluationScore:
|
||||
task_context = ""
|
||||
if task is not None:
|
||||
task_context = f"Task description: {task.description}"
|
||||
tool_uses = execution_trace.get("tool_uses", [])
|
||||
tool_errors = []
|
||||
tool_count = len(tool_uses)
|
||||
|
||||
if tool_count == 0:
|
||||
return EvaluationScore(
|
||||
score=None,
|
||||
feedback="No tool usage detected. Cannot evaluate tool invocation."
|
||||
)
|
||||
|
||||
for tool_use in tool_uses:
|
||||
if not tool_use.get("success", True) or tool_use.get("error", False):
|
||||
error_info = {
|
||||
"tool": tool_use.get("tool", "Unknown tool"),
|
||||
"error": tool_use.get("result"),
|
||||
"error_type": tool_use.get("error_type", "unknown_error")
|
||||
}
|
||||
tool_errors.append(error_info)
|
||||
|
||||
error_rate = len(tool_errors) / tool_count if tool_count > 0 else 0
|
||||
|
||||
error_types = {}
|
||||
for error in tool_errors:
|
||||
error_type = error.get("error_type", "unknown_error")
|
||||
if error_type not in error_types:
|
||||
error_types[error_type] = 0
|
||||
error_types[error_type] += 1
|
||||
|
||||
invocation_samples = []
|
||||
for i, tool_use in enumerate(tool_uses[:5]):
|
||||
tool_name = tool_use.get("tool", "Unknown tool")
|
||||
tool_args = tool_use.get("args", {})
|
||||
success = tool_use.get("success", True) and not tool_use.get("error", False)
|
||||
error_type = tool_use.get("error_type", "") if not success else ""
|
||||
error_msg = tool_use.get("result", "No error") if not success else "No error"
|
||||
|
||||
sample = f"Tool invocation #{i+1}:\n"
|
||||
sample += f"- Tool: {tool_name}\n"
|
||||
sample += f"- Parameters: {json.dumps(tool_args, indent=2)}\n"
|
||||
sample += f"- Success: {'No' if not success else 'Yes'}\n"
|
||||
if not success:
|
||||
sample += f"- Error type: {error_type}\n"
|
||||
sample += f"- Error: {error_msg}"
|
||||
invocation_samples.append(sample)
|
||||
|
||||
error_type_summary = ""
|
||||
if error_types:
|
||||
error_type_summary = "Error type breakdown:\n"
|
||||
for error_type, count in error_types.items():
|
||||
error_type_summary += f"- {error_type}: {count} occurrences ({(count/tool_count):.1%})\n"
|
||||
|
||||
invocation_samples_text = "\n\n".join(invocation_samples)
|
||||
prompt = [
|
||||
{"role": "system", "content": """You are an expert evaluator assessing how correctly an AI agent's tool invocations are STRUCTURED.
|
||||
|
||||
Your job is to evaluate ONLY the structural and syntactical aspects of how the agent called tools, NOT which tools were selected or what parameter values were used.
|
||||
|
||||
Evaluate the agent's tool invocation based on these criteria:
|
||||
1. Structure (0-10): Does the tool call follow the expected syntax and format?
|
||||
2. Error Handling (0-10): Does the agent handle tool errors appropriately?
|
||||
3. Invocation Patterns (0-10): Are tool calls properly sequenced, batched, or managed?
|
||||
|
||||
Error types that indicate invocation issues:
|
||||
- execution_error: The tool was called correctly but failed during execution
|
||||
- usage_error: General errors in how the tool was used structurally
|
||||
|
||||
IMPORTANT: DO NOT evaluate:
|
||||
- Whether the right tool was chosen (that's the ToolSelectionEvaluator's job)
|
||||
- Whether the parameter values are correct (that's the ParameterExtractionEvaluator's job)
|
||||
- The quality of results from tools
|
||||
|
||||
Focus ONLY on HOW tools were invoked - the structure, format, and handling of the invocation process.
|
||||
|
||||
Return your evaluation as JSON with these fields:
|
||||
- scores: {"structure": number, "error_handling": number, "invocation_patterns": number}
|
||||
- overall_score: number (average of all scores, 0-10)
|
||||
- feedback: string (focused ONLY on structural aspects of tool invocation)
|
||||
- improvement_suggestions: string (concrete suggestions for better structuring of tool calls)
|
||||
"""},
|
||||
{"role": "user", "content": f"""
|
||||
Agent role: {agent.role}
|
||||
{task_context}
|
||||
|
||||
Tool invocation examples:
|
||||
{invocation_samples_text}
|
||||
|
||||
Tool error rate: {error_rate:.2%} ({len(tool_errors)} errors out of {tool_count} invocations)
|
||||
{error_type_summary}
|
||||
|
||||
Evaluate the quality of the agent's tool invocation structure during this task.
|
||||
"""}
|
||||
]
|
||||
|
||||
assert self.llm is not None
|
||||
response = self.llm.call(prompt)
|
||||
|
||||
try:
|
||||
evaluation_data = extract_json_from_llm_response(response)
|
||||
assert evaluation_data is not None
|
||||
scores = evaluation_data.get("scores", {})
|
||||
structure = scores.get("structure", 5.0)
|
||||
error_handling = scores.get("error_handling", 5.0)
|
||||
invocation_patterns = scores.get("invocation_patterns", 5.0)
|
||||
|
||||
overall_score = float(evaluation_data.get("overall_score", 5.0))
|
||||
|
||||
feedback = "Tool Invocation Evaluation:\n"
|
||||
feedback += f"• Structure: {structure}/10 - Following proper syntax and format\n"
|
||||
feedback += f"• Error Handling: {error_handling}/10 - Appropriately handling tool errors\n"
|
||||
feedback += f"• Invocation Patterns: {invocation_patterns}/10 - Proper sequencing and management of calls\n\n"
|
||||
|
||||
if "improvement_suggestions" in evaluation_data:
|
||||
feedback += f"Improvement Suggestions:\n{evaluation_data['improvement_suggestions']}"
|
||||
else:
|
||||
feedback += evaluation_data.get("feedback", "No detailed feedback available.")
|
||||
|
||||
return EvaluationScore(
|
||||
score=overall_score,
|
||||
feedback=feedback,
|
||||
raw_response=response
|
||||
)
|
||||
except Exception as e:
|
||||
return EvaluationScore(
|
||||
score=None,
|
||||
feedback=f"Error evaluating tool invocation: {e}",
|
||||
raw_response=response
|
||||
)
|
||||
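For orientation, the evaluator above reads only a handful of keys from each entry in execution_trace["tool_uses"]: tool, args, success, error, error_type, and result. A minimal sketch of a trace that exercises its error-rate math; the tool names and payloads are illustrative, not a documented crewAI schema:

# Hypothetical trace shaped like the entries ToolInvocationEvaluator reads.
execution_trace = {
    "tool_uses": [
        {"tool": "search", "args": {"query": "crewai"}, "success": True},
        {
            "tool": "scrape",
            "args": {"url": "https://example.com"},
            "success": False,
            "error": True,
            "error_type": "execution_error",
            "result": "timeout after 30s",
        },
    ]
}

tool_uses = execution_trace["tool_uses"]
errors = [t for t in tool_uses if not t.get("success", True) or t.get("error", False)]
print(f"{len(errors) / len(tool_uses):.2%}")  # 50.00%, matching the evaluator's error_rate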
@@ -1,52 +0,0 @@
-import inspect
-
-from typing_extensions import Any
-import warnings
-from crewai.experimental.evaluation.experiment import ExperimentResults, ExperimentRunner
-from crewai import Crew, Agent
-
-def assert_experiment_successfully(experiment_results: ExperimentResults, baseline_filepath: str | None = None) -> None:
-    failed_tests = [result for result in experiment_results.results if not result.passed]
-
-    if failed_tests:
-        detailed_failures: list[str] = []
-
-        for result in failed_tests:
-            expected = result.expected_score
-            actual = result.score
-            detailed_failures.append(f"- {result.identifier}: expected {expected}, got {actual}")
-
-        failure_details = "\n".join(detailed_failures)
-        raise AssertionError(f"The following test cases failed:\n{failure_details}")
-
-    baseline_filepath = baseline_filepath or _get_baseline_filepath_fallback()
-    comparison = experiment_results.compare_with_baseline(baseline_filepath=baseline_filepath)
-    assert_experiment_no_regression(comparison)
-
-def assert_experiment_no_regression(comparison_result: dict[str, list[str]]) -> None:
-    regressed = comparison_result.get("regressed", [])
-    if regressed:
-        raise AssertionError(f"Regression detected! The following tests that previously passed now fail: {regressed}")
-
-    missing_tests = comparison_result.get("missing_tests", [])
-    if missing_tests:
-        warnings.warn(
-            f"Warning: {len(missing_tests)} tests from the baseline are missing in the current run: {missing_tests}",
-            UserWarning
-        )
-
-def run_experiment(dataset: list[dict[str, Any]], crew: Crew | None = None, agents: list[Agent] | None = None, verbose: bool = False) -> ExperimentResults:
-    runner = ExperimentRunner(dataset=dataset)
-
-    return runner.run(agents=agents, crew=crew, print_summary=verbose)
-
-def _get_baseline_filepath_fallback() -> str:
-    test_func_name = "experiment_fallback"
-
-    try:
-        current_frame = inspect.currentframe()
-        if current_frame is not None:
-            test_func_name = current_frame.f_back.f_back.f_code.co_name  # type: ignore[union-attr]
-    except Exception:
-        ...
-    return f"{test_func_name}_results.json"
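The module above is deleted in this compare, but its signatures show how it was meant to be driven from a test. A rough usage sketch; the dataset item keys (inputs, expected_score) are guesses for illustration only, since the schema is not shown here:

# Hypothetical pytest-style usage of the removed helpers. Only the function
# signatures come from the module above; the dataset item shape is assumed.
from crewai import Agent

def test_researcher_experiment():
    agent = Agent(role="Researcher", goal="Answer questions", backstory="Veteran analyst")
    dataset = [
        {"inputs": {"query": "What is CrewAI?"}, "expected_score": 8},  # assumed shape
    ]
    results = run_experiment(dataset=dataset, agents=[agent], verbose=True)
    # Raises AssertionError on failed cases, then compares against the baseline
    # file (defaulting to "<calling function name>_results.json" via the frame
    # inspection fallback above).
    assert_experiment_successfully(results, baseline_filepath="baseline_results.json")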
@@ -18,7 +18,6 @@ from crewai.utilities.chromadb import sanitize_collection_name
 from crewai.utilities.constants import KNOWLEDGE_DIRECTORY
 from crewai.utilities.logger import Logger
 from crewai.utilities.paths import db_storage_path
-from crewai.utilities.chromadb import create_persistent_client


 @contextlib.contextmanager
@@ -85,11 +84,14 @@ class KnowledgeStorage(BaseKnowledgeStorage):
             raise Exception("Collection not initialized")

     def initialize_knowledge_storage(self):
-        self.app = create_persistent_client(
-            path=os.path.join(db_storage_path(), "knowledge"),
+        base_path = os.path.join(db_storage_path(), "knowledge")
+        chroma_client = chromadb.PersistentClient(
+            path=base_path,
             settings=Settings(allow_reset=True),
         )
+
+        self.app = chroma_client

         try:
             collection_name = (
                 f"knowledge_{self.collection_name}"
@@ -109,8 +111,9 @@ class KnowledgeStorage(BaseKnowledgeStorage):
     def reset(self):
         base_path = os.path.join(db_storage_path(), KNOWLEDGE_DIRECTORY)
         if not self.app:
-            self.app = create_persistent_client(
-                path=base_path, settings=Settings(allow_reset=True)
+            self.app = chromadb.PersistentClient(
+                path=base_path,
+                settings=Settings(allow_reset=True),
             )

         self.app.reset()
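The change above swaps the shared create_persistent_client helper for a direct chromadb.PersistentClient. A standalone sketch of that pattern; the path is illustrative rather than crewAI's db_storage_path(), and reset() only succeeds because allow_reset=True is passed in Settings:

# Minimal sketch of the direct-client pattern; the storage path is illustrative.
import chromadb
from chromadb.config import Settings

client = chromadb.PersistentClient(
    path="/tmp/knowledge-demo",
    settings=Settings(allow_reset=True),
)
collection = client.get_or_create_collection("knowledge_demo")
print(collection.count())  # 0 on a fresh store
client.reset()  # wipes persisted data; raises unless allow_reset is enabled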
@@ -15,20 +15,18 @@ from typing import (
     get_origin,
 )


 try:
     from typing import Self
 except ImportError:
     from typing_extensions import Self

 from pydantic import (
     UUID4,
     BaseModel,
     Field,
     InstanceOf,
     PrivateAttr,
     model_validator,
-    field_validator
+    field_validator,
 )

 from crewai.agents.agent_builder.base_agent import BaseAgent
@@ -40,7 +38,7 @@ from crewai.agents.parser import (
     OutputParserException,
 )
 from crewai.flow.flow_trackable import FlowTrackable
-from crewai.llm import LLM, BaseLLM
+from crewai.llm import LLM
 from crewai.tools.base_tool import BaseTool
 from crewai.tools.structured_tool import CrewStructuredTool
 from crewai.utilities import I18N
@@ -131,11 +129,10 @@ class LiteAgent(FlowTrackable, BaseModel):
     model_config = {"arbitrary_types_allowed": True}

     # Core Agent Properties
-    id: UUID4 = Field(default_factory=uuid.uuid4, frozen=True)
     role: str = Field(description="Role of the agent")
     goal: str = Field(description="Goal of the agent")
     backstory: str = Field(description="Backstory of the agent")
-    llm: Optional[Union[str, InstanceOf[BaseLLM], Any]] = Field(
+    llm: Optional[Union[str, InstanceOf[LLM], Any]] = Field(
         default=None, description="Language model that will run the agent"
     )
     tools: List[BaseTool] = Field(
@@ -209,8 +206,8 @@
     def setup_llm(self):
         """Set up the LLM and other components after initialization."""
         self.llm = create_llm(self.llm)
-        if not isinstance(self.llm, BaseLLM):
-            raise ValueError(f"Expected LLM instance of type BaseLLM, got {type(self.llm).__name__}")
+        if not isinstance(self.llm, LLM):
+            raise ValueError("Unable to create LLM instance")

         # Initialize callbacks
         token_callback = TokenCalcHandler(token_cost_process=self._token_process)
@@ -232,8 +229,7 @@
         elif isinstance(self.guardrail, str):
             from crewai.tasks.llm_guardrail import LLMGuardrail

-            if not isinstance(self.llm, BaseLLM):
-                raise TypeError(f"Guardrail requires LLM instance of type BaseLLM, got {type(self.llm).__name__}")
+            assert isinstance(self.llm, LLM)

             self._guardrail = LLMGuardrail(description=self.guardrail, llm=self.llm)

@@ -305,7 +301,6 @@
         """
         # Create agent info for event emission
         agent_info = {
-            "id": self.id,
             "role": self.role,
             "goal": self.goal,
             "backstory": self.backstory,
@@ -522,7 +517,6 @@
                     messages=self._messages,
                     tools=None,
                     callbacks=self._callbacks,
-                    from_agent=self,
                 ),
             )

@@ -532,24 +526,21 @@
                 messages=self._messages,
                 callbacks=self._callbacks,
                 printer=self._printer,
-                from_agent=self,
             )

             # Emit LLM call completed event
             crewai_event_bus.emit(
                 self,
                 event=LLMCallCompletedEvent(
-                    messages=self._messages,
                     response=answer,
                     call_type=LLMCallType.LLM_CALL,
-                    from_agent=self,
                 ),
             )
         except Exception as e:
             # Emit LLM call failed event
             crewai_event_bus.emit(
                 self,
-                event=LLMCallFailedEvent(error=str(e), from_agent=self),
+                event=LLMCallFailedEvent(error=str(e)),
             )
             raise e

@@ -622,4 +613,4 @@

     def _append_message(self, text: str, role: str = "assistant") -> None:
         """Append a message to the message list with the given role."""
-        self._messages.append(format_message_for_llm(text, role=role))
+        self._messages.append(format_message_for_llm(text, role=role))
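Several hunks above swap isinstance checks between the concrete LLM class and the abstract BaseLLM. The practical difference is that a base-class check admits any conforming implementation, while a concrete-class check rejects third-party ones. A toy demonstration with stand-in classes, not crewAI's:

# Toy re-creation (not crewAI's classes) of why the isinstance target matters.
from abc import ABC, abstractmethod

class ToyBaseLLM(ABC):
    @abstractmethod
    def call(self, messages: str) -> str: ...

class ToyLLM(ToyBaseLLM):          # stands in for the built-in concrete class
    def call(self, messages: str) -> str:
        return "built-in"

class CustomLLM(ToyBaseLLM):       # stands in for a user-provided implementation
    def call(self, messages: str) -> str:
        return "custom"

for llm in (ToyLLM(), CustomLLM()):
    print(isinstance(llm, ToyBaseLLM), isinstance(llm, ToyLLM))
# ToyLLM():    True True
# CustomLLM(): True False  -> a guard on the concrete class rejects it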
@@ -59,7 +59,6 @@ from crewai.utilities.exceptions.context_window_exceeding_exception import (

 load_dotenv()

 litellm.suppress_debug_info = True

 class FilteredStream(io.TextIOBase):
     _lock = None
@@ -77,7 +76,9 @@

         # Skip common noisy LiteLLM banners and any other lines that contain "litellm"
         if (
-            "litellm.info:" in lower_s
+            "give feedback / get help" in lower_s
+            or "litellm.info:" in lower_s
+            or "litellm" in lower_s
             or "Consider using a smaller input or implementing a text splitting strategy" in lower_s
         ):
             return 0
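FilteredStream's trick is an io.TextIOBase whose write() silently swallows lines matching noisy substrings and forwards everything else. A self-contained sketch of the same idea; class and variable names here are illustrative:

# Standalone sketch of the stdout-filtering pattern used by FilteredStream.
import io
import sys

class DemoFilteredStream(io.TextIOBase):
    """Drop writes containing any blocked substring; forward the rest."""

    def __init__(self, target, blocked):
        self._target = target
        self._blocked = [b.lower() for b in blocked]

    def write(self, s: str) -> int:
        if any(b in s.lower() for b in self._blocked):
            return 0                     # swallow the noisy line
        return self._target.write(s)

sys.stdout = DemoFilteredStream(sys.__stdout__, blocked=["litellm"])
print("LiteLLM: give feedback / get help")  # filtered: contains "litellm"
print("normal output")                      # passes through
sys.stdout = sys.__stdout__                 # restore the real stream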
@@ -418,8 +419,6 @@
         params: Dict[str, Any],
         callbacks: Optional[List[Any]] = None,
         available_functions: Optional[Dict[str, Any]] = None,
-        from_task: Optional[Any] = None,
-        from_agent: Optional[Any] = None,
     ) -> str:
         """Handle a streaming response from the LLM.

@@ -427,8 +426,6 @@
             params: Parameters for the completion call
             callbacks: Optional list of callback functions
             available_functions: Dict of available functions
-            from_task: Optional task object
-            from_agent: Optional agent object

         Returns:
             str: The complete response text
@@ -507,15 +504,13 @@
                     # Enable tool calls using streaming
                     if "tool_calls" in delta:
                         tool_calls = delta["tool_calls"]

                         if tool_calls:
                             result = self._handle_streaming_tool_calls(
                                 tool_calls=tool_calls,
                                 accumulated_tool_args=accumulated_tool_args,
                                 available_functions=available_functions,
-                                from_task=from_task,
-                                from_agent=from_agent,
                             )

                             if result is not None:
                                 chunk_content = result
@@ -532,7 +527,7 @@
                         assert hasattr(crewai_event_bus, "emit")
                         crewai_event_bus.emit(
                             self,
-                            event=LLMStreamChunkEvent(chunk=chunk_content, from_task=from_task, from_agent=from_agent),
+                            event=LLMStreamChunkEvent(chunk=chunk_content),
                         )
             # --- 4) Fallback to non-streaming if no content received
             if not full_response.strip() and chunk_count == 0:
@@ -545,7 +540,7 @@
                     "stream_options", None
                 )  # Remove stream_options for non-streaming call
                 return self._handle_non_streaming_response(
-                    non_streaming_params, callbacks, available_functions, from_task, from_agent
+                    non_streaming_params, callbacks, available_functions
                 )

             # --- 5) Handle empty response with chunks
@@ -630,7 +625,7 @@
                 # Log token usage if available in streaming mode
                 self._handle_streaming_callbacks(callbacks, usage_info, last_chunk)
                 # Emit completion event and return response
-                self._handle_emit_call_events(response=full_response, call_type=LLMCallType.LLM_CALL, from_task=from_task, from_agent=from_agent, messages=params["messages"])
+                self._handle_emit_call_events(full_response, LLMCallType.LLM_CALL)
                 return full_response

             # --- 9) Handle tool calls if present
@@ -642,7 +637,7 @@
             self._handle_streaming_callbacks(callbacks, usage_info, last_chunk)

             # --- 11) Emit completion event and return response
-            self._handle_emit_call_events(response=full_response, call_type=LLMCallType.LLM_CALL, from_task=from_task, from_agent=from_agent, messages=params["messages"])
+            self._handle_emit_call_events(full_response, LLMCallType.LLM_CALL)
             return full_response

         except ContextWindowExceededError as e:
@@ -654,14 +649,14 @@
             logging.error(f"Error in streaming response: {str(e)}")
             if full_response.strip():
                 logging.warning(f"Returning partial response despite error: {str(e)}")
-                self._handle_emit_call_events(response=full_response, call_type=LLMCallType.LLM_CALL, from_task=from_task, from_agent=from_agent, messages=params["messages"])
+                self._handle_emit_call_events(full_response, LLMCallType.LLM_CALL)
                 return full_response

             # Emit failed event and re-raise the exception
             assert hasattr(crewai_event_bus, "emit")
             crewai_event_bus.emit(
                 self,
-                event=LLMCallFailedEvent(error=str(e), from_task=from_task, from_agent=from_agent),
+                event=LLMCallFailedEvent(error=str(e)),
             )
             raise Exception(f"Failed to get streaming response: {str(e)}")

@@ -670,8 +665,6 @@
         tool_calls: List[ChatCompletionDeltaToolCall],
         accumulated_tool_args: DefaultDict[int, AccumulatedToolArgs],
         available_functions: Optional[Dict[str, Any]] = None,
-        from_task: Optional[Any] = None,
-        from_agent: Optional[Any] = None,
     ) -> None | str:
         for tool_call in tool_calls:
             current_tool_accumulator = accumulated_tool_args[tool_call.index]
@@ -689,8 +682,6 @@
                     event=LLMStreamChunkEvent(
                         tool_call=tool_call.to_dict(),
                         chunk=tool_call.function.arguments,
-                        from_task=from_task,
-                        from_agent=from_agent,
                     ),
                 )
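The streaming path above stitches tool-call arguments together chunk by chunk, keyed by the tool call's index. A self-contained sketch of that accumulation pattern; the delta format is simplified, since AccumulatedToolArgs internals are not shown in this diff:

# Simplified re-creation of per-index tool-argument accumulation.
import json
from collections import defaultdict
from dataclasses import dataclass

@dataclass
class ToolArgsAccumulator:      # stand-in for AccumulatedToolArgs
    name: str = ""
    arguments: str = ""

# Argument JSON arrives split across streamed deltas, keyed by index.
deltas = [
    {"index": 0, "name": "search", "arguments": '{"que'},
    {"index": 0, "name": "", "arguments": 'ry": "crewai"}'},
]

accumulated: dict[int, ToolArgsAccumulator] = defaultdict(ToolArgsAccumulator)
for delta in deltas:
    acc = accumulated[delta["index"]]
    acc.name = acc.name or delta["name"]   # name arrives once, args in pieces
    acc.arguments += delta["arguments"]

print(accumulated[0].name, json.loads(accumulated[0].arguments))
# search {'query': 'crewai'}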
@@ -757,17 +748,13 @@
         params: Dict[str, Any],
         callbacks: Optional[List[Any]] = None,
         available_functions: Optional[Dict[str, Any]] = None,
-        from_task: Optional[Any] = None,
-        from_agent: Optional[Any] = None,
-    ) -> str | Any:
+    ) -> str:
         """Handle a non-streaming response from the LLM.

         Args:
             params: Parameters for the completion call
             callbacks: Optional list of callback functions
             available_functions: Dict of available functions
-            from_task: Optional Task that invoked the LLM
-            from_agent: Optional Agent that invoked the LLM

         Returns:
             str: The response text
@@ -783,11 +770,13 @@
             # Convert litellm's context window error to our own exception type
             # for consistent handling in the rest of the codebase
             raise LLMContextLengthExceededException(str(e))

         # --- 2) Extract response message and content
         response_message = cast(Choices, cast(ModelResponse, response).choices)[
             0
         ].message
         text_response = response_message.content or ""

         # --- 3) Handle callbacks with usage info
         if callbacks and len(callbacks) > 0:
             for callback in callbacks:
@@ -800,23 +789,22 @@
                     start_time=0,
                     end_time=0,
                 )

         # --- 4) Check for tool calls
         tool_calls = getattr(response_message, "tool_calls", [])

-        # --- 5) If no tool calls or no available functions, return the text response directly as long as there is a text response
-        if (not tool_calls or not available_functions) and text_response:
-            self._handle_emit_call_events(response=text_response, call_type=LLMCallType.LLM_CALL, from_task=from_task, from_agent=from_agent, messages=params["messages"])
+        # --- 5) If no tool calls or no available functions, return the text response directly
+        if not tool_calls or not available_functions:
+            self._handle_emit_call_events(text_response, LLMCallType.LLM_CALL)
             return text_response
-        # --- 6) If there is no text response, no available functions, but there are tool calls, return the tool calls
-        elif tool_calls and not available_functions and not text_response:
-            return tool_calls

-        # --- 7) Handle tool calls if present
+        # --- 6) Handle tool calls if present
         tool_result = self._handle_tool_call(tool_calls, available_functions)
         if tool_result is not None:
             return tool_result
-        # --- 8) If tool call handling didn't return a result, emit completion event and return text response
-        self._handle_emit_call_events(response=text_response, call_type=LLMCallType.LLM_CALL, from_task=from_task, from_agent=from_agent, messages=params["messages"])
+
+        # --- 7) If tool call handling didn't return a result, emit completion event and return text response
+        self._handle_emit_call_events(text_response, LLMCallType.LLM_CALL)
         return text_response

     def _handle_tool_call(
@@ -859,7 +847,6 @@
                         tool_args=function_args,
                     ),
                 )

                 result = fn(**function_args)
                 crewai_event_bus.emit(
                     self,
@@ -873,7 +860,7 @@
                 )

                 # --- 3.3) Emit success event
-                self._handle_emit_call_events(response=result, call_type=LLMCallType.TOOL_CALL)
+                self._handle_emit_call_events(result, LLMCallType.TOOL_CALL)
                 return result
             except Exception as e:
                 # --- 3.4) Handle execution errors
@@ -902,8 +889,6 @@
         tools: Optional[List[dict]] = None,
         callbacks: Optional[List[Any]] = None,
         available_functions: Optional[Dict[str, Any]] = None,
-        from_task: Optional[Any] = None,
-        from_agent: Optional[Any] = None,
     ) -> Union[str, Any]:
         """High-level LLM call method.

@@ -918,8 +903,6 @@
                 during and after the LLM call.
             available_functions: Optional dict mapping function names to callables
                 that can be invoked by the LLM.
-            from_task: Optional Task that invoked the LLM
-            from_agent: Optional Agent that invoked the LLM

         Returns:
             Union[str, Any]: Either a text response from the LLM (str) or
@@ -939,8 +922,6 @@
                 tools=tools,
                 callbacks=callbacks,
                 available_functions=available_functions,
-                from_task=from_task,
-                from_agent=from_agent,
             ),
         )

@@ -950,26 +931,30 @@
         # --- 3) Convert string messages to proper format if needed
         if isinstance(messages, str):
             messages = [{"role": "user", "content": messages}]

         # --- 4) Handle O1 model special case (system messages not supported)
         if "o1" in self.model.lower():
             for message in messages:
                 if message.get("role") == "system":
                     message["role"] = "assistant"

         # --- 5) Set up callbacks if provided
         with suppress_warnings():
             if callbacks and len(callbacks) > 0:
                 self.set_callbacks(callbacks)

             try:
                 # --- 6) Prepare parameters for the completion call
                 params = self._prepare_completion_params(messages, tools)

                 # --- 7) Make the completion call and handle response
                 if self.stream:
                     return self._handle_streaming_response(
-                        params, callbacks, available_functions, from_task, from_agent
+                        params, callbacks, available_functions
                     )
                 else:
                     return self._handle_non_streaming_response(
-                        params, callbacks, available_functions, from_task, from_agent
+                        params, callbacks, available_functions
                     )

             except LLMContextLengthExceededException:
@@ -978,48 +963,25 @@
                 # whether to summarize the content or abort based on the respect_context_window flag
                 raise
             except Exception as e:
-                unsupported_stop = "Unsupported parameter" in str(e) and "'stop'" in str(e)
-
-                if unsupported_stop:
-                    if "additional_drop_params" in self.additional_params and isinstance(self.additional_params["additional_drop_params"], list):
-                        self.additional_params["additional_drop_params"].append("stop")
-                    else:
-                        self.additional_params = {"additional_drop_params": ["stop"]}
-
-                    logging.info(
-                        "Retrying LLM call without the unsupported 'stop'"
-                    )
-
-                    return self.call(
-                        messages,
-                        tools=tools,
-                        callbacks=callbacks,
-                        available_functions=available_functions,
-                        from_task=from_task,
-                        from_agent=from_agent,
-                    )
-
                 assert hasattr(crewai_event_bus, "emit")
                 crewai_event_bus.emit(
                     self,
-                    event=LLMCallFailedEvent(error=str(e), from_task=from_task, from_agent=from_agent),
+                    event=LLMCallFailedEvent(error=str(e)),
                 )
                 logging.error(f"LiteLLM call failed: {str(e)}")
                 raise

-    def _handle_emit_call_events(self, response: Any, call_type: LLMCallType, from_task: Optional[Any] = None, from_agent: Optional[Any] = None, messages: str | list[dict[str, Any]] | None = None):
+    def _handle_emit_call_events(self, response: Any, call_type: LLMCallType):
         """Handle the events for the LLM call.

         Args:
             response (str): The response from the LLM call.
             call_type (str): The type of call, either "tool_call" or "llm_call".
-            from_task: Optional task object
-            from_agent: Optional agent object
-            messages: Optional messages object
         """
         assert hasattr(crewai_event_bus, "emit")
         crewai_event_bus.emit(
             self,
-            event=LLMCallCompletedEvent(messages=messages, response=response, call_type=call_type, from_task=from_task, from_agent=from_agent),
+            event=LLMCallCompletedEvent(response=response, call_type=call_type),
         )

     def _format_messages_for_provider(
@@ -1072,15 +1034,6 @@
             messages.append({"role": "user", "content": "Please continue."})
             return messages

-        # TODO: Remove this code after merging PR https://github.com/BerriAI/litellm/pull/10917
-        # Ollama doesn't supports last message to be 'assistant'
-        if "ollama" in self.model.lower() and messages and messages[-1]["role"] == "assistant":
-            messages = messages.copy()
-            messages.append(
-                {"role": "user", "content": ""}
-            )
-            return messages
-
         # Handle Anthropic models
         if not self.is_anthropic:
             return messages
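The tool-call branch above boils down to: look up the requested function by name, parse its JSON arguments, and invoke it with keyword arguments. A self-contained sketch of that dispatch loop; the payloads mimic the OpenAI/litellm tool-call shape and the names are illustrative:

# Illustrative tool-call payloads shaped like OpenAI/litellm tool calls.
import json

tool_calls = [
    {"function": {"name": "add", "arguments": '{"a": 2, "b": 3}'}},
]
available_functions = {"add": lambda a, b: a + b}

for tool_call in tool_calls:
    function_name = tool_call["function"]["name"]
    fn = available_functions.get(function_name)
    if fn is None:
        continue  # unknown tool: fall back to the plain text response
    function_args = json.loads(tool_call["function"]["arguments"])
    result = fn(**function_args)  # mirrors `result = fn(**function_args)` above
    print(f"{function_name} -> {result}")  # add -> 5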
@@ -1,5 +1,5 @@
 from abc import ABC, abstractmethod
-from typing import Any, Dict, List, Optional, Union
+from typing import Any, Callable, Dict, List, Optional, Union


 class BaseLLM(ABC):
@@ -47,8 +47,6 @@ class BaseLLM(ABC):
         tools: Optional[List[dict]] = None,
         callbacks: Optional[List[Any]] = None,
         available_functions: Optional[Dict[str, Any]] = None,
-        from_task: Optional[Any] = None,
-        from_agent: Optional[Any] = None,
     ) -> Union[str, Any]:
         """Call the LLM with the given messages.

@@ -63,7 +61,6 @@
                 during and after the LLM call.
             available_functions: Optional dict mapping function names to callables
                 that can be invoked by the LLM.
-            from_task: Optional task caller to be used for the LLM call.

         Returns:
             Either a text response from the LLM (str) or
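BaseLLM is the extension point whose call contract is shown above. A toy implementation sketch; only the call signature is taken from this diff, and the assumption that call is the sole required method is not confirmed by the source, so this stands alone rather than subclassing crewAI's class:

# Hypothetical minimal implementation of the call contract shown above.
from typing import Any, Dict, List, Optional, Union

class EchoLLM:
    """Stand-in for a BaseLLM subclass: returns the last user message."""

    def call(
        self,
        messages: Union[str, List[Dict[str, str]]],
        tools: Optional[List[dict]] = None,
        callbacks: Optional[List[Any]] = None,
        available_functions: Optional[Dict[str, Any]] = None,
    ) -> Union[str, Any]:
        if isinstance(messages, str):
            return messages
        user_turns = [m["content"] for m in messages if m.get("role") == "user"]
        return user_turns[-1] if user_turns else ""

print(EchoLLM().call([{"role": "user", "content": "ping"}]))  # ping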
Some files were not shown because too many files have changed in this diff.