GaiaAgentEvaluator / test_agent.py
davidgturner's picture
- changes for app.py
08e2c16
raw
history blame
1 kB
import os
from app import GaiaAgent
# Sample questions taken from the logs of runs that were failing.
test_questions = [
    "How many studio albums were published by Mercedes Sosa between 2000 and 2009 (included)?",
    ".rewsna eht sa \"tfel\" drow eht fo etisoppo eht etirw ,ecnetnes siht dnatsrednu uoy fI",
    "Who nominated the only Featured Article on English Wikipedia about a dinosaur that was promoted in November 2016?",
    "What is the first name of the only Malko Competition recipient from the 20th Century (after 1977) whose nationality on record is a country that no longer exists?",
    "In the video https://www.youtube.com/watch?v=L1vXCYZAYYM, what is the highest number of bird species to be on camera simultaneously?",
]


def run_questions(agent, questions):
    """Ask *agent* each question in turn and print the answer or the error.

    Args:
        agent: Callable that takes a question string and returns an answer.
        questions: Iterable of question strings.

    Returns:
        The number of questions for which the call raised an exception.
    """
    failures = 0
    for question in questions:
        print(f"\nTesting question: {question}")
        try:
            answer = agent(question)
            print(f"Agent answer: {answer}")
        except Exception as e:
            # Deliberately broad: this is a smoke-test driver, and one failing
            # question should not stop the remaining ones from being tried.
            print(f"Error: {e}")
            failures += 1
    return failures


def main():
    """Build a GaiaAgent and run it over the sample questions."""
    run_questions(GaiaAgent(), test_questions)


# Guard the entry point so that importing this module (for example during
# test collection) does not construct an agent or send any questions.
if __name__ == "__main__":
    main()