Fix #4509: Strip markdown code-block fences from LLM JSON responses in Converter

When LLMs return JSON wrapped in markdown code blocks (e.g. ```json ... ```), the Converter.to_pydantic() method failed to parse the response, causing Pydantic validation errors when saving to long-term memory.

Changes:
- Add _strip_markdown_fences() helper to remove markdown code-block delimiters
- Apply fence stripping before model_validate_json() in both the function-calling and non-function-calling paths of Converter.to_pydantic()
- Add handle_partial_json() fallback in the function-calling path
- Apply fence stripping in convert_to_model() before json.loads()
- Add 11 tests covering the fix

Co-Authored-By: João <joao@crewai.com>
2026-04-12 22:12:37 +00:00 · 2026-02-18 13:18:51 +00:00
2 changed files with 207 additions and 5 deletions
--- a/lib/crewai/src/crewai/utilities/converter.py
+++ b/lib/crewai/src/crewai/utilities/converter.py
@@ -21,9 +21,32 @@ if TYPE_CHECKING:
    from crewai.llms.base_llm import BaseLLM

 _JSON_PATTERN: Final[re.Pattern[str]] = re.compile(r"({.*})", re.DOTALL)
+_MARKDOWN_FENCE_PATTERN: Final[re.Pattern[str]] = re.compile(
+    r"^\s*```(?:json)?\s*\n(.*)\n\s*```\s*$", re.DOTALL
+)
 _I18N = get_i18n()


+def _strip_markdown_fences(text: str) -> str:
+    """Strip markdown code-block fences that some LLMs wrap around JSON.
+
+    Handles patterns like:
+        ```json\n{...}\n```
+        ```\n{...}\n```
+
+    Args:
+        text: Raw LLM response that may contain markdown fences.
+
+    Returns:
+        The inner content with fences removed, or the original text if
+        no fences are detected.
+    """
+    match = _MARKDOWN_FENCE_PATTERN.match(text)
+    if match:
+        return match.group(1)
+    return text
+
+
 class ConverterError(Exception):
    """Error raised when Converter fails to parse the input."""

@@ -65,7 +88,25 @@ class Converter(OutputConverter):
                if isinstance(response, BaseModel):
                    result = response
                else:
-                    result = self.model.model_validate_json(response)
+                    cleaned = _strip_markdown_fences(response)
+                    try:
+                        result = self.model.model_validate_json(cleaned)
+                    except (ValidationError, ValueError):
+                        result = handle_partial_json(
+                            result=response,
+                            model=self.model,
+                            is_json_output=False,
+                            agent=None,
+                        )
+                        if not isinstance(result, BaseModel):
+                            if isinstance(result, dict):
+                                result = self.model.model_validate(result)
+                            elif isinstance(result, str):
+                                result = self.model.model_validate_json(result)
+                            else:
+                                raise ConverterError(
+                                    "handle_partial_json returned an unexpected type."
+                                ) from None
            else:
                response = self.llm.call(
                    [
@@ -74,9 +115,9 @@ class Converter(OutputConverter):
                    ]
                )
                try:
-                    # Try to directly validate the response JSON
-                    result = self.model.model_validate_json(response)
-                except ValidationError:
+                    cleaned = _strip_markdown_fences(response)
+                    result = self.model.model_validate_json(cleaned)
+                except (ValidationError, ValueError):
                    # If direct validation fails, attempt to extract valid JSON
                    result = handle_partial_json(  # type: ignore[assignment]
                        result=response,
@@ -185,7 +226,8 @@ def convert_to_model(
        )

    try:
-        escaped_result = json.dumps(json.loads(result, strict=False))
+        cleaned_result = _strip_markdown_fences(result)
+        escaped_result = json.dumps(json.loads(cleaned_result, strict=False))
        return validate_model(
            result=escaped_result, model=model, is_json_output=bool(output_json)
        )
--- a/lib/crewai/tests/utilities/test_converter.py
+++ b/lib/crewai/tests/utilities/test_converter.py
@@ -8,6 +8,7 @@ from crewai.llm import LLM
 from crewai.utilities.converter import (
    Converter,
    ConverterError,
+    _strip_markdown_fences,
    convert_to_model,
    convert_with_instructions,
    create_converter,
@@ -952,3 +953,162 @@ def test_internal_instructor_real_unsupported_provider() -> None:

    # Verify it's a configuration error about unsupported provider
    assert "Unsupported provider" in str(exc_info.value) or "unsupported" in str(exc_info.value).lower()
+
+
+# ---------------------------------------------------------------------------
+# Tests for _strip_markdown_fences  (issue #4509)
+# ---------------------------------------------------------------------------
+
+
+def test_strip_markdown_fences_with_json_tag() -> None:
+    raw = '```json\n{"name": "Alice", "age": 30}\n```'
+    assert _strip_markdown_fences(raw) == '{"name": "Alice", "age": 30}'
+
+
+def test_strip_markdown_fences_without_language_tag() -> None:
+    raw = '```\n{"name": "Bob", "age": 25}\n```'
+    assert _strip_markdown_fences(raw) == '{"name": "Bob", "age": 25}'
+
+
+def test_strip_markdown_fences_multiline_json() -> None:
+    raw = '```json\n{\n  "name": "Charlie",\n  "age": 35\n}\n```'
+    result = _strip_markdown_fences(raw)
+    parsed = json.loads(result)
+    assert parsed == {"name": "Charlie", "age": 35}
+
+
+def test_strip_markdown_fences_plain_json_unchanged() -> None:
+    raw = '{"name": "Dave", "age": 40}'
+    assert _strip_markdown_fences(raw) == raw
+
+
+def test_strip_markdown_fences_with_surrounding_whitespace() -> None:
+    raw = '  ```json\n{"key": "value"}\n```  '
+    assert json.loads(_strip_markdown_fences(raw)) == {"key": "value"}
+
+
+# ---------------------------------------------------------------------------
+# Tests for Converter.to_pydantic with markdown-wrapped JSON (issue #4509)
+# ---------------------------------------------------------------------------
+
+
+def test_converter_to_pydantic_strips_markdown_fences_function_calling() -> None:
+    """When LLM supports function calling but returns markdown-wrapped JSON string,
+    the converter should strip fences and parse successfully."""
+    llm = Mock(spec=LLM)
+    llm.supports_function_calling.return_value = True
+    llm.call.return_value = '```json\n{"name": "Alice", "age": 30}\n```'
+
+    converter = Converter(
+        llm=llm,
+        text="Name: Alice, Age: 30",
+        model=SimpleModel,
+        instructions="Convert to JSON.",
+    )
+
+    output = converter.to_pydantic()
+    assert isinstance(output, SimpleModel)
+    assert output.name == "Alice"
+    assert output.age == 30
+
+
+def test_converter_to_pydantic_strips_markdown_fences_no_function_calling() -> None:
+    """When LLM does NOT support function calling and returns markdown-wrapped JSON,
+    the converter should strip fences and parse successfully."""
+    llm = Mock(spec=LLM)
+    llm.supports_function_calling.return_value = False
+    llm.call.return_value = '```json\n{"name": "Bob", "age": 25}\n```'
+
+    converter = Converter(
+        llm=llm,
+        text="Name: Bob, Age: 25",
+        model=SimpleModel,
+        instructions="Convert to JSON.",
+    )
+
+    output = converter.to_pydantic()
+    assert isinstance(output, SimpleModel)
+    assert output.name == "Bob"
+    assert output.age == 25
+
+
+def test_converter_to_pydantic_strips_fences_multiline_function_calling() -> None:
+    """Multiline markdown-fenced JSON should be parsed correctly (function calling path)."""
+    from crewai.utilities.evaluators.task_evaluator import Entity, TaskEvaluation
+
+    evaluation_json = json.dumps({
+        "suggestions": ["Improve research depth"],
+        "quality": 8.5,
+        "entities": [
+            {
+                "name": "AI",
+                "type": "Technology",
+                "description": "Artificial Intelligence",
+                "relationships": ["Healthcare"],
+            }
+        ],
+    })
+    llm = Mock(spec=LLM)
+    llm.supports_function_calling.return_value = True
+    llm.call.return_value = f"```json\n{evaluation_json}\n```"
+
+    converter = Converter(
+        llm=llm,
+        text="Evaluate this task.",
+        model=TaskEvaluation,
+        instructions="Convert to JSON.",
+    )
+
+    output = converter.to_pydantic()
+    assert isinstance(output, TaskEvaluation)
+    assert output.quality == 8.5
+    assert len(output.suggestions) == 1
+    assert len(output.entities) == 1
+    assert output.entities[0].name == "AI"
+
+
+def test_converter_to_pydantic_strips_fences_multiline_no_function_calling() -> None:
+    """Multiline markdown-fenced JSON should be parsed correctly (non-function-calling path)."""
+    from crewai.utilities.evaluators.task_evaluator import Entity, TaskEvaluation
+
+    evaluation_json = json.dumps({
+        "suggestions": ["Better analysis needed"],
+        "quality": 7.0,
+        "entities": [],
+    })
+    llm = Mock(spec=LLM)
+    llm.supports_function_calling.return_value = False
+    llm.call.return_value = f"```json\n{evaluation_json}\n```"
+
+    converter = Converter(
+        llm=llm,
+        text="Evaluate this task.",
+        model=TaskEvaluation,
+        instructions="Convert to JSON.",
+    )
+
+    output = converter.to_pydantic()
+    assert isinstance(output, TaskEvaluation)
+    assert output.quality == 7.0
+
+
+# ---------------------------------------------------------------------------
+# Tests for convert_to_model with markdown-wrapped JSON (issue #4509)
+# ---------------------------------------------------------------------------
+
+
+def test_convert_to_model_with_markdown_fenced_json() -> None:
+    """convert_to_model should handle markdown-fenced JSON strings."""
+    result = '```json\n{"name": "Eve", "age": 28}\n```'
+    output = convert_to_model(result, SimpleModel, None, None)
+    assert isinstance(output, SimpleModel)
+    assert output.name == "Eve"
+    assert output.age == 28
+
+
+def test_convert_to_model_with_markdown_fenced_json_output() -> None:
+    """convert_to_model should handle markdown-fenced JSON when output_json is set."""
+    result = '```json\n{"name": "Frank", "age": 45}\n```'
+    output = convert_to_model(result, None, SimpleModel, None)
+    assert isinstance(output, dict)
+    assert output == {"name": "Frank", "age": 45}