Fix issue #5736: Agent.kickoff() must honor executor_class

The two parallel agent-executor implementations (CrewAgentExecutor and the experimental AgentExecutor) had drifted enough that the Agent class silently routed kickoff() and execute_task() to different executors: * Agent.execute_task() instantiated self.executor_class (default CrewAgentExecutor). * Agent.kickoff() hard-coded AgentExecutor, ignoring executor_class. * The reasoning-gate guard 'self.executor_class is not AgentExecutor' coupled feature behavior to literal class identity, so a subclass of either executor that opted into / out of internal planning was handled incorrectly. This patch introduces two ClassVar capability flags on BaseAgentExecutor: * supports_internal_planning - whether the executor runs its own planning/replanning loop (and therefore should NOT have the external handle_reasoning step run before task execution). * supports_kickoff - whether the executor implements the Flow-based kickoff entry point. AgentExecutor sets both to True; CrewAgentExecutor leaves both False. The Agent class now consults these flags instead of testing class identity: * The reasoning gate is 'not getattr(executor_class, supports_internal_planning, False)'. * Agent.kickoff() routes through _resolve_kickoff_executor_class() which honors executor_class when it advertises supports_kickoff and otherwise emits a DeprecationWarning before falling back to AgentExecutor for backwards compatibility. A new test module lib/crewai/tests/agents/test_executor_consistency.py pins down the contract. Co-Authored-By: João <joao@crewai.com>
2026-05-07 10:12:38 +00:00 · 2026-05-07 00:17:44 +00:00
parent d165bcb65f
commit 7b586968f1
4 changed files with 411 additions and 4 deletions
--- a/lib/crewai/src/crewai/agent/core.py
+++ b/lib/crewai/src/crewai/agent/core.py
@@ -512,7 +512,7 @@ class Agent(BaseAgent):
            The task prompt after memory retrieval, ready for knowledge lookup.
        """
        get_env_context()
-        if self.executor_class is not AgentExecutor:
+        if not getattr(self.executor_class, "supports_internal_planning", False):
            handle_reasoning(self, task)

        self._inject_date_to_task(task)
@@ -1102,6 +1102,40 @@ class Agent(BaseAgent):
        self.agent_executor.tools_handler = self.tools_handler
        self.agent_executor.request_within_rpm_limit = rpm_limit_fn

+    def _resolve_kickoff_executor_class(self) -> type[AgentExecutor]:
+        """Resolve the executor class to use for ``Agent.kickoff()``.
+
+        ``Agent.kickoff()`` requires a Flow-based executor (one that sets
+        ``supports_kickoff = True`` on the class). When the configured
+        :attr:`executor_class` does not support the kickoff flow, this method
+        emits a :class:`DeprecationWarning` and falls back to
+        :class:`~crewai.experimental.agent_executor.AgentExecutor` so that
+        existing default-configured agents continue to work; the warning makes
+        the previously silent override visible to the caller.
+
+        Returns:
+            The :class:`AgentExecutor` subclass to instantiate for kickoff.
+        """
+        executor_cls = self.executor_class
+        supports_kickoff = getattr(executor_cls, "supports_kickoff", False)
+        if supports_kickoff and isinstance(executor_cls, type):
+            return cast("type[AgentExecutor]", executor_cls)
+
+        warnings.warn(
+            (
+                f"Agent.kickoff() requires a Flow-based AgentExecutor but "
+                f"executor_class={getattr(executor_cls, '__name__', executor_cls)!r} "
+                "does not advertise supports_kickoff=True. Falling back to "
+                "crewai.experimental.agent_executor.AgentExecutor for this "
+                "kickoff() call. Set executor_class=AgentExecutor explicitly "
+                "to silence this warning. The silent fallback will be removed "
+                "in a future release."
+            ),
+            DeprecationWarning,
+            stacklevel=3,
+        )
+        return AgentExecutor
+
    def get_delegation_tools(self, agents: Sequence[BaseAgent]) -> list[BaseTool]:
        agent_tools = AgentTools(agents=agents)
        return agent_tools.tools()
@@ -1399,7 +1433,8 @@ class Agent(BaseAgent):
            executor.request_within_rpm_limit = rpm_limit_fn
            executor.callbacks = [TokenCalcHandler(self._token_process)]
        else:
-            executor = AgentExecutor(
+            kickoff_executor_cls = self._resolve_kickoff_executor_class()
+            executor = kickoff_executor_cls(
                llm=cast(BaseLLM, self.llm),
                agent=self,
                prompt=prompt,
--- a/lib/crewai/src/crewai/agents/agent_builder/base_agent_executor.py
+++ b/lib/crewai/src/crewai/agents/agent_builder/base_agent_executor.py
@@ -1,6 +1,6 @@
 from __future__ import annotations

-from typing import TYPE_CHECKING
+from typing import TYPE_CHECKING, ClassVar

 from pydantic import BaseModel, Field, PrivateAttr

@@ -20,6 +20,25 @@ class BaseAgentExecutor(BaseModel):
    model_config = {"arbitrary_types_allowed": True}

    executor_type: str = "base"
+
+    supports_internal_planning: ClassVar[bool] = False
+    """Whether this executor implements its own planning/replanning loop.
+
+    When True, ``Agent`` skips the external ``handle_reasoning()`` step before
+    task execution and lets the executor drive planning itself. This is a
+    class-level capability flag so callers can query it without instantiating
+    the executor (e.g. ``self.executor_class.supports_internal_planning``).
+    """
+
+    supports_kickoff: ClassVar[bool] = False
+    """Whether this executor supports the standalone ``Agent.kickoff()`` flow.
+
+    Executors that do not implement the Flow-based kickoff loop should leave
+    this ``False``; ``Agent.kickoff()`` will then refuse to silently fall back
+    to a different executor and instead emit a ``DeprecationWarning`` so the
+    silent override is visible to the caller.
+    """
+
    crew: Crew | None = Field(default=None, exclude=True)
    agent: BaseAgent | None = Field(default=None, exclude=True)
    task: Task | None = Field(default=None, exclude=True)
--- a/lib/crewai/src/crewai/experimental/agent_executor.py
+++ b/lib/crewai/src/crewai/experimental/agent_executor.py
@@ -9,7 +9,7 @@ from datetime import datetime
 import inspect
 import json
 import threading
-from typing import TYPE_CHECKING, Any, Literal, TypeVar, cast
+from typing import TYPE_CHECKING, Any, ClassVar, Literal, TypeVar, cast
 from uuid import uuid4

 from crewai_core.printer import PRINTER
@@ -172,6 +172,10 @@ class AgentExecutor(Flow[AgentExecutorState], BaseAgentExecutor):
    _skip_auto_memory: bool = True

    executor_type: Literal["experimental"] = "experimental"
+
+    supports_internal_planning: ClassVar[bool] = True
+    supports_kickoff: ClassVar[bool] = True
+
    suppress_flow_events: bool = True  # always suppress for executor
    llm: BaseLLM = Field(exclude=True)
    prompt: SystemPromptResult | StandardPromptResult = Field(exclude=True)
--- a/lib/crewai/tests/agents/test_executor_consistency.py
+++ b/lib/crewai/tests/agents/test_executor_consistency.py
@@ -0,0 +1,349 @@
+"""Regression tests for issue #5736: parallel agent executors must be consistent.
+
+The repository has historically carried two parallel ``BaseAgentExecutor``
+subclasses — :class:`crewai.agents.crew_agent_executor.CrewAgentExecutor` and
+:class:`crewai.experimental.agent_executor.AgentExecutor`. The issue reported
+two concrete bugs caused by the split:
+
+1. ``Agent.kickoff()`` silently ignored ``Agent.executor_class`` and always
+   instantiated ``AgentExecutor``, so the user-visible default
+   (``CrewAgentExecutor``) did not match the executor that ``kickoff()``
+   actually used.
+2. The ``handle_reasoning()`` step was gated on a literal class identity check
+   (``self.executor_class is not AgentExecutor``), so reasoning was silently
+   skipped depending on the executor and could not be controlled via a
+   capability flag.
+
+These tests pin down the new contract:
+
+* Capability flags (``supports_internal_planning`` / ``supports_kickoff``) are
+  the single source of truth for executor differences.
+* ``Agent.kickoff()`` honors ``executor_class`` when it is kickoff-capable and
+  otherwise emits a ``DeprecationWarning`` instead of silently overriding.
+* ``Agent.execute_task()`` instantiates ``self.executor_class`` (not a
+  hard-coded class).
+* ``handle_reasoning()`` is gated on the capability flag, not class identity.
+"""
+
+from __future__ import annotations
+
+from typing import Any, ClassVar, Literal
+import warnings
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+from crewai import Agent, Task
+from crewai.agents.agent_builder.base_agent_executor import BaseAgentExecutor
+from crewai.agents.crew_agent_executor import CrewAgentExecutor
+from crewai.experimental.agent_executor import AgentExecutor
+from crewai.llms.base_llm import BaseLLM
+
+
+@pytest.fixture
+def mock_llm() -> MagicMock:
+    """Create a mock LLM that satisfies BaseLLM's protocol."""
+    llm = MagicMock(spec=BaseLLM)
+    llm.supports_stop_words.return_value = True
+    llm.stop = []
+    llm.model = "gpt-4o-mini"
+    return llm
+
+
+@pytest.fixture
+def test_agent(mock_llm: MagicMock) -> Agent:
+    """A plain Agent that uses default ``executor_class``."""
+    return Agent(
+        role="Test Agent",
+        goal="Verify executor consistency",
+        backstory="An agent used by issue #5736 regression tests.",
+        llm=mock_llm,
+        verbose=False,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Capability flags
+# ---------------------------------------------------------------------------
+
+
+class TestExecutorCapabilityFlags:
+    """``supports_internal_planning`` / ``supports_kickoff`` advertise the
+    differences between executors so callers don't have to ``isinstance``-check
+    against a specific class."""
+
+    def test_base_executor_has_no_capabilities(self) -> None:
+        assert BaseAgentExecutor.supports_internal_planning is False
+        assert BaseAgentExecutor.supports_kickoff is False
+
+    def test_crew_agent_executor_has_no_capabilities(self) -> None:
+        """The legacy executor neither plans internally nor handles kickoff."""
+        assert CrewAgentExecutor.supports_internal_planning is False
+        assert CrewAgentExecutor.supports_kickoff is False
+
+    def test_agent_executor_advertises_full_capabilities(self) -> None:
+        """The Flow-based executor implements both plan-and-execute and kickoff."""
+        assert AgentExecutor.supports_internal_planning is True
+        assert AgentExecutor.supports_kickoff is True
+
+
+# ---------------------------------------------------------------------------
+# Agent.kickoff() honors executor_class
+# ---------------------------------------------------------------------------
+
+
+class TestKickoffRespectsExecutorClass:
+    """Issue #5736 part 1: ``Agent.kickoff()`` must honor ``executor_class``."""
+
+    def test_kickoff_uses_explicit_agent_executor_without_warning(
+        self, mock_llm: MagicMock
+    ) -> None:
+        """When the user explicitly opts into ``AgentExecutor``, no warning fires."""
+        agent = Agent(
+            role="r",
+            goal="g",
+            backstory="b",
+            llm=mock_llm,
+            executor_class=AgentExecutor,
+        )
+        with warnings.catch_warnings(record=True) as caught:
+            warnings.simplefilter("always")
+            executor_cls = agent._resolve_kickoff_executor_class()
+
+        assert executor_cls is AgentExecutor
+        kickoff_warnings = [
+            w for w in caught if "Agent.kickoff()" in str(w.message)
+        ]
+        assert kickoff_warnings == [], (
+            f"Did not expect any kickoff warning, got: {[str(w.message) for w in kickoff_warnings]}"
+        )
+
+    def test_kickoff_uses_kickoff_capable_subclass_of_agent_executor(
+        self, mock_llm: MagicMock
+    ) -> None:
+        """A user-defined subclass that opts into kickoff is honored verbatim
+        (rather than being silently replaced with ``AgentExecutor``)."""
+
+        class CustomAgentExecutor(AgentExecutor):
+            executor_type: Literal["custom"] = "custom"  # type: ignore[assignment]
+            supports_kickoff: ClassVar[bool] = True
+            supports_internal_planning: ClassVar[bool] = True
+
+        agent = Agent(
+            role="r",
+            goal="g",
+            backstory="b",
+            llm=mock_llm,
+            executor_class=CustomAgentExecutor,
+        )
+
+        with warnings.catch_warnings(record=True) as caught:
+            warnings.simplefilter("always")
+            executor_cls = agent._resolve_kickoff_executor_class()
+
+        assert executor_cls is CustomAgentExecutor
+        kickoff_warnings = [
+            w for w in caught if "Agent.kickoff()" in str(w.message)
+        ]
+        assert kickoff_warnings == []
+
+    def test_kickoff_warns_and_falls_back_when_executor_class_is_not_kickoff_capable(
+        self, mock_llm: MagicMock
+    ) -> None:
+        """Default-configured agents (``executor_class=CrewAgentExecutor``) used
+        to silently flip to ``AgentExecutor`` on ``kickoff()``. The fix keeps
+        the fallback for backwards compatibility but emits a
+        ``DeprecationWarning`` so the silent override is now visible."""
+        agent = Agent(
+            role="r",
+            goal="g",
+            backstory="b",
+            llm=mock_llm,
+            executor_class=CrewAgentExecutor,  # the default
+        )
+
+        with pytest.warns(DeprecationWarning, match=r"Agent\.kickoff\(\)"):
+            executor_cls = agent._resolve_kickoff_executor_class()
+
+        assert executor_cls is AgentExecutor
+
+    def test_kickoff_fallback_warning_mentions_explicit_opt_in(
+        self, mock_llm: MagicMock
+    ) -> None:
+        """The deprecation message should tell users how to silence it — by
+        setting ``executor_class=AgentExecutor`` explicitly."""
+        agent = Agent(
+            role="r",
+            goal="g",
+            backstory="b",
+            llm=mock_llm,
+            executor_class=CrewAgentExecutor,
+        )
+
+        with pytest.warns(DeprecationWarning) as record:
+            agent._resolve_kickoff_executor_class()
+
+        assert any(
+            "executor_class=AgentExecutor" in str(w.message) for w in record
+        )
+
+    def test_kickoff_constructs_executor_via_resolve_helper(
+        self, test_agent: Agent
+    ) -> None:
+        """``_prepare_kickoff()`` must route through ``_resolve_kickoff_executor_class``
+        rather than instantiating ``AgentExecutor`` directly. This guards against
+        regressing back to the issue #5736 hardcoded-class behavior."""
+        sentinel = MagicMock(name="sentinel_executor_cls")
+        sentinel.return_value = MagicMock(name="sentinel_executor")
+
+        with patch.object(
+            test_agent,
+            "_resolve_kickoff_executor_class",
+            return_value=sentinel,
+        ) as mock_resolve, patch.object(
+            test_agent, "_build_execution_prompt"
+        ) as mock_build_prompt:
+            mock_build_prompt.return_value = (
+                {"system": "sys"},
+                ["Observation:"],
+                None,
+            )
+            test_agent._prepare_kickoff(messages="hello")
+
+        mock_resolve.assert_called_once_with()
+        sentinel.assert_called_once()
+
+
+# ---------------------------------------------------------------------------
+# Agent.execute_task() honors executor_class (sanity check; pre-existing
+# behavior we don't want to regress)
+# ---------------------------------------------------------------------------
+
+
+class TestExecuteTaskRespectsExecutorClass:
+    """``Agent.execute_task()`` already routed through ``self.executor_class``
+    — these tests pin that contract so future refactors keep both entry points
+    honoring the user's executor choice."""
+
+    def test_execute_task_instantiates_self_executor_class(
+        self, test_agent: Agent
+    ) -> None:
+        """The non-resuming branch of ``Agent.create_agent_executor`` should
+        call ``self.executor_class(...)``. Stubbing ``executor_class`` with a
+        factory lets us observe the instantiation without running the LLM
+        loop."""
+        captured: dict[str, Any] = {}
+
+        def fake_factory(*args: Any, **kwargs: Any) -> MagicMock:
+            captured["called"] = True
+            captured["kwargs"] = kwargs
+            return MagicMock(spec=CrewAgentExecutor)
+
+        task = Task(
+            description="d",
+            expected_output="e",
+            agent=test_agent,
+        )
+        test_agent.agent_executor = None
+        test_agent.executor_class = fake_factory  # type: ignore[assignment]
+
+        with patch.object(test_agent, "_build_execution_prompt") as mock_bp:
+            mock_bp.return_value = ({"system": "s"}, ["Obs:"], None)
+            test_agent.create_agent_executor(task=task)
+
+        assert captured.get("called") is True
+        # The agent passed itself to its executor.
+        assert captured["kwargs"].get("agent") is test_agent
+        assert captured["kwargs"].get("task") is task
+
+
+# ---------------------------------------------------------------------------
+# handle_reasoning gate: capability flag, not class identity
+# ---------------------------------------------------------------------------
+
+
+class TestReasoningGateUsesCapabilityFlag:
+    """Issue #5736 part 2: the reasoning gate must consult
+    ``supports_internal_planning`` rather than testing class identity. This
+    way a ``CrewAgentExecutor`` subclass that opts into internal planning is
+    treated correctly — and so is an ``AgentExecutor`` subclass that doesn't."""
+
+    def test_reasoning_runs_for_executor_without_internal_planning(
+        self, test_agent: Agent
+    ) -> None:
+        """Default ``executor_class`` is ``CrewAgentExecutor`` which does NOT
+        plan internally, so the legacy ``handle_reasoning`` step must run."""
+        task = Task(description="d", expected_output="e", agent=test_agent)
+
+        assert test_agent.executor_class is CrewAgentExecutor
+        assert (
+            getattr(
+                test_agent.executor_class, "supports_internal_planning", False
+            )
+            is False
+        )
+
+        with patch(
+            "crewai.agent.core.handle_reasoning"
+        ) as mock_handle_reasoning, patch.object(
+            test_agent, "_inject_date_to_task"
+        ), patch.object(
+            test_agent, "_retrieve_memory_context", return_value="prompt"
+        ):
+            test_agent._prepare_task_execution(task=task, context=None)
+
+        mock_handle_reasoning.assert_called_once_with(test_agent, task)
+
+    def test_reasoning_skipped_for_executor_with_internal_planning(
+        self, test_agent: Agent
+    ) -> None:
+        """``AgentExecutor.supports_internal_planning is True``, so the agent
+        should not invoke the external ``handle_reasoning`` step (the executor
+        runs its own ``generate_plan`` flow instead)."""
+        test_agent.executor_class = AgentExecutor  # type: ignore[assignment]
+        task = Task(description="d", expected_output="e", agent=test_agent)
+
+        assert (
+            getattr(
+                test_agent.executor_class, "supports_internal_planning", False
+            )
+            is True
+        )
+
+        with patch(
+            "crewai.agent.core.handle_reasoning"
+        ) as mock_handle_reasoning, patch.object(
+            test_agent, "_inject_date_to_task"
+        ), patch.object(
+            test_agent, "_retrieve_memory_context", return_value="prompt"
+        ):
+            test_agent._prepare_task_execution(task=task, context=None)
+
+        mock_handle_reasoning.assert_not_called()
+
+    def test_reasoning_gate_does_not_use_isinstance_or_class_identity(
+        self, test_agent: Agent
+    ) -> None:
+        """A ``CrewAgentExecutor`` subclass that opts into internal planning
+        (``supports_internal_planning = True``) must skip the legacy reasoning
+        step. This is the key behavioral promise of replacing the old
+        ``self.executor_class is not AgentExecutor`` check with a flag-based
+        check."""
+
+        class PlanningCrewExecutor(CrewAgentExecutor):
+            executor_type: Literal["crew_planning"] = "crew_planning"  # type: ignore[assignment]
+            supports_internal_planning: ClassVar[bool] = True
+
+        test_agent.executor_class = PlanningCrewExecutor  # type: ignore[assignment]
+        task = Task(description="d", expected_output="e", agent=test_agent)
+
+        with patch(
+            "crewai.agent.core.handle_reasoning"
+        ) as mock_handle_reasoning, patch.object(
+            test_agent, "_inject_date_to_task"
+        ), patch.object(
+            test_agent, "_retrieve_memory_context", return_value="prompt"
+        ):
+            test_agent._prepare_task_execution(task=task, context=None)
+
+        mock_handle_reasoning.assert_not_called()