from agno.agent import Agent
from agno.eval.accuracy import AccuracyEval
from agno.models.openai import OpenAIChat
# Set up an accuracy evaluation for one arithmetic prompt with a known answer.
evaluation = AccuracyEval(
    # NOTE(review): presumably the model that grades the agent's answer --
    # confirm against the AccuracyEval documentation.
    model=OpenAIChat(id="gpt-4o"),
    # Agent handed to the evaluation, backed by its own gpt-4o model instance.
    agent=Agent(model=OpenAIChat(id="gpt-4o")),
    input="What is 10*5 then to the power of 2? do it step by step",
    expected_output="2500",
    # Turn monitoring on for this evaluation.
    monitoring=True,
)

# With monitoring enabled, this run is tracked on the Agno platform.
result = evaluation.run(print_results=True)