Spaces:
Sleeping
Sleeping
Test agent on question 1 only ("How many studio albums")
Browse files- simuGAIA.py +4 -3
simuGAIA.py
CHANGED
@@ -240,9 +240,10 @@ def run_simuGAIA_all( profile: gr.OAuthProfile | None, submit: Optional[bool] =
|
|
240 |
print(f"Skipping item with missing task_id or question: {item}")
|
241 |
continue
|
242 |
try:
|
243 |
-
|
244 |
-
|
245 |
-
|
|
|
246 |
except Exception as e:
|
247 |
print(f"Error running agent on task {task_id}: {e}")
|
248 |
results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": f"AGENT ERROR: {e}"})
|
|
|
240 |
print(f"Skipping item with missing task_id or question: {item}")
|
241 |
continue
|
242 |
try:
|
243 |
+
if question_text.startswith("How many studio albums"):
|
244 |
+
submitted_answer = agent(question_text)
|
245 |
+
answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
|
246 |
+
results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
|
247 |
except Exception as e:
|
248 |
print(f"Error running agent on task {task_id}: {e}")
|
249 |
results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": f"AGENT ERROR: {e}"})
|