"""Learn how to evaluate the accuracy of an Agent that uses tools."""
from typing import Optional

from agno.agent import Agent
from agno.eval.accuracy import AccuracyEval, AccuracyResult
from agno.models.openai import OpenAIChat
from agno.tools.calculator import CalculatorTools

# Model handed to AccuracyEval itself (presumably the one that grades the
# agent's answer -- confirm against the AccuracyEval documentation).
grader_model = OpenAIChat(id="o4-mini")

# Agent under evaluation: a chat model equipped with the calculator toolkit.
calculator_agent = Agent(
    model=OpenAIChat(id="gpt-5-mini"),
    tools=[CalculatorTools()],
)

# The agent is asked for 10 factorial; the expected answer is 3628800.
evaluation = AccuracyEval(
    name="Tools Evaluation",
    model=grader_model,
    agent=calculator_agent,
    input="What is 10!?",
    expected_output="3628800",
)

# run() is annotated as Optional here, so the result is checked for None
# before its score is read.
result: Optional[AccuracyResult] = evaluation.run(print_results=True)

# The example counts as passing only when a result came back and its average
# score reaches the threshold of 8.
assert result is not None
assert result.avg_score >= 8