GAIA_Agent

Sleeping

App Files Files Community

ArturoNereu committed on Jun 1

Commit

edab6f8

1 Parent(s): 8c77163

modified gitignore

Browse files

Files changed (4) hide show

app.py +2 -11
gaia_agent.py +16 -23
gaia_tools.py +22 -2
requirements.txt +2 -1

app.py CHANGED Viewed

@@ -12,17 +12,6 @@ DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 # To check if we are running locally
 running_on_hf = False
-# --- Basic Agent Definition ---
-# ----- THIS IS WERE YOU CAN BUILD WHAT YOU WANT ------
-# class BasicAgent:
-#     def __init__(self):
-#         print("BasicAgent initialized.")
-#     def __call__(self, question: str) -> str:
-#         print(f"Agent received question (first 50 chars): {question[:50]}...")
-#         fixed_answer = "This is a default answer."
-#         print(f"Agent returning fixed answer: {fixed_answer}")
-#         return fixed_answer
 def run_and_submit_all( profile: gr.OAuthProfile | None):
     """
     Fetches all questions, runs the BasicAgent on them, submits all answers,
@@ -89,6 +78,7 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
             continue
         try:
             submitted_answer = agent(question_text)
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
         except Exception as e:
@@ -156,6 +146,7 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
 # --- Build Gradio Interface using Blocks ---
 with gr.Blocks() as demo:
     gr.Markdown("# GAIA Agent")
     gr.Markdown(
         """
         **Instructions:**

 # To check if we are running locally
 running_on_hf = False
 def run_and_submit_all( profile: gr.OAuthProfile | None):
     """
     Fetches all questions, runs the BasicAgent on them, submits all answers,
             continue
         try:
             submitted_answer = agent(question_text)
+            print(type(submitted_answer))
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
         except Exception as e:
 # --- Build Gradio Interface using Blocks ---
 with gr.Blocks() as demo:
     gr.Markdown("# GAIA Agent")
+    gr.Image(value="assets/AI_Programmer.png")
     gr.Markdown(
         """
         **Instructions:**

gaia_agent.py CHANGED Viewed

@@ -1,6 +1,7 @@
 import os
 from smolagents import InferenceClientModel, ToolCallingAgent
 from smolagents import DuckDuckGoSearchTool, VisitWebpageTool
 class GaiaAgent:
     def __init__(self):
@@ -13,7 +14,8 @@ class GaiaAgent:
         self.tools = [
             DuckDuckGoSearchTool(),
-            VisitWebpageTool()
         ]
         self.agent = ToolCallingAgent(
@@ -24,33 +26,24 @@ class GaiaAgent:
     def __call__(self, question: str) -> str:
         print(f"Agent received question (first 50 chars): {question[:50]}...")
-        prompt = f""" You are an agent solving the GAIA benchmark and you are required to provide exact answers.
-        Rules to follow:
-        1. Return only the exact requested answered: no explanation and no reasoning.
-        2. For yes/no questions, return exactly "Yes" or "No".
-        3. For dates, use the exact format requested.
-        4. For numbers, use the exact number, no other format.
-        5. For names, use the exact name as found in sources.
-        6. If the question has an associated file, download the file first using the task ID
-        Examples of good responses:
-        - "42"
-        - "Arturo Nunez"
-        - "Yes"
-        - "October 5, 2001"
-        - "Buenos Aires"
-        Never include phrases like "the answer is..." or "Based on my research".
-        Only return the exact answer.
-        QUESTION:
-        {question}
-        """
-        # messages = [
-        #     {"role": "user", "content": question}
-        # ]
         try:
             result = self.agent.run(prompt)

 import os
 from smolagents import InferenceClientModel, ToolCallingAgent
 from smolagents import DuckDuckGoSearchTool, VisitWebpageTool
+from gaia_tools import RunPythonFileTool
 class GaiaAgent:
     def __init__(self):
         self.tools = [
             DuckDuckGoSearchTool(),
+            VisitWebpageTool(),
+            RunPythonFileTool
         ]
         self.agent = ToolCallingAgent(
     def __call__(self, question: str) -> str:
         print(f"Agent received question (first 50 chars): {question[:50]}...")
+        prompt = f"""
+        You are a helpful agent that must provide exact answers to questions. Do not explain or format your answer in any way.
+        If a question can be solved with reasoning, riddles, puzzles, or reversing text — solve it yourself.
+        If the query involves a known Wikipedia page, use VisitWebpageTool to open it and extract the needed info directly. Do not rely on summaries.
+        If the query requires the execution of python code, make sure the code is valid before trying to execute it.
+        Question: {question}
+        Rules:
+        - If the question is reversed, reverse it and solve it.
+        - If the answer is a single word, output only that word.
+        - Do not say anything else.
+        Only output the final answer.
+        """
         try:
             result = self.agent.run(prompt)

gaia_tools.py CHANGED Viewed

@@ -1,2 +1,22 @@
-from smolagents import Tool, DuckDuckGoSearchTool, PythonInterpreterTool, VisitWebpageTool
-import requests

+from smolagents import PythonInterpreterTool, tool
+import requests
+@tool
+def RunPythonFileTool(file_path: str) -> str:
+    """
+    Executes a Python script loaded from the specified path using the PythonInterpreterTool.
+
+    The file is read as UTF-8 text and its whole content is handed to the interpreter as one code string.
+
+    Args:
+        file_path (str): The full path to the python (.py) file containing the Python code.
+
+    Returns:
+        str: The output produced by the code execution, or a message starting with "Execution failed:" if reading or running the file raises.
+    """
+    try:
+        # Explicit encoding so the script is decoded the same way on every platform.
+        with open(file_path, "r", encoding="utf-8") as f:
+            code = f.read()
+        interpreter = PythonInterpreterTool()
+        # A Tool is invoked by calling the instance (which dispatches to forward());
+        # it has no `run` method, so `interpreter.run(...)` always raised
+        # AttributeError and every call fell into the except branch below.
+        result = interpreter(code=code)
+        return result
+    except Exception as e:
+        # Deliberate best-effort: report the failure as text so the agent can react to it.
+        return f"Execution failed: {e}"

requirements.txt CHANGED Viewed

@@ -1,4 +1,5 @@
 gradio[oauth]
 requests
 smolagents
-duckduckgo-search

 gradio[oauth]
 requests
 smolagents
+duckduckgo-search
+openai