Add all Patronus eval tools and update example

2026-01-30 02:28:13 +00:00 · 2024-12-26 17:37:22 -05:00
parent d94f7e03dc
commit 0ac6f915fb
2 changed files with 314 additions and 24 deletions
--- a/src/crewai_tools/tools/patronus_eval_tool/example.py
+++ b/src/crewai_tools/tools/patronus_eval_tool/example.py
@@ -1,15 +1,37 @@
 from crewai import Agent, Crew, Task
-from patronus_eval_tool import PatronusEvalTool
-
-
-patronus_eval_tool = PatronusEvalTool(
-    evaluators=[{"evaluator": "judge", "criteria": "patronus:is-code"}], tags={}
+from patronus_eval_tool import (
+    PatronusEvalTool,
+    PatronusPredifinedCriteriaEvalTool,
+    PatronusLocalEvaluatorTool,
 )
+from patronus import Client, EvaluationResult
+
+# Test the PatronusEvalTool where agent can pick the best evaluator and criteria
+patronus_eval_tool = PatronusEvalTool()
+
+# Test the PatronusPredifinedCriteriaEvalTool where agent uses the defined evaluator and criteria
+patronus_eval_tool = PatronusPredifinedCriteriaEvalTool(
+    evaluators=[{"evaluator": "judge", "criteria": "contains-code"}]
+)
+
+# Test the PatronusLocalEvaluatorTool where agent uses the local evaluator
+client = Client()
+
+
+@client.register_local_evaluator("local_evaluator_name")
+def my_evaluator(**kwargs):
+    return EvaluationResult(pass_="PASS", score=0.5, explanation="Explanation test")
+
+
+patronus_eval_tool = PatronusLocalEvaluatorTool(
+    evaluator="local_evaluator_name", evaluated_model_gold_answer="test"
+)
+

 # Create a new agent
 coding_agent = Agent(
    role="Coding Agent",
-    goal="Generate high quality code and verify that the code is correct by using Patronus AI's evaluation tool to check validity of your output code.",
+    goal="Generate high quality code and verify that the output is code by using Patronus AI's evaluation tool.",
    backstory="You are an experienced coder who can generate high quality python code. You can follow complex instructions accurately and effectively.",
    tools=[patronus_eval_tool],
    verbose=True,
@@ -17,7 +39,7 @@ coding_agent = Agent(

 # Define tasks
 generate_code = Task(
-    description="Create a simple program to generate the first N numbers in the Fibonacci sequence. Use the evaluator as `judge` from Patronus AI with the criteria `patronus:is-code` and feed your task input as input and your code as output to verify your code validity.",
+    description="Create a simple program to generate the first N numbers in the Fibonacci sequence. Select the most appropriate evaluator and criteria for evaluating your output.",
    expected_output="Program that generates the first N numbers in the Fibonacci sequence.",
    agent=coding_agent,
 )