Final_Assignment_Template

Sleeping

App Files Files Community

dlaima committed on Jun 2

Commit

c64bf2e

verified ·

1 Parent(s): 03f0224

Update app.py

Browse files

Files changed (1) hide show

app.py +40 -53

app.py CHANGED Viewed

@@ -1,22 +1,16 @@
 import os
 import requests
-from smolagents import Agent
 from audio_transcriber import AudioTranscriptionTool
 from image_analyzer import ImageAnalysisTool
 from wikipedia_searcher import WikipediaSearcher
-from openai import OpenAI
-from dotenv import load_dotenv
-load_dotenv()
-# Tools
-audio_tool = AudioTranscriptionTool()
-image_tool = ImageAnalysisTool()
-wiki_tool = WikipediaSearcher()
-# Static system prompt
-def build_prompt(question: str) -> str:
-    return f"""You are an agent solving the GAIA benchmark and you are required to provide exact answers.
 Rules to follow:
 1. Return only the exact requested answer: no explanation and no reasoning.
 2. For yes/no questions, return exactly "Yes" or "No".
@@ -30,52 +24,45 @@ Examples of good responses:
 - "October 5, 2001"
 - "Buenos Aires"
 Never include phrases like "the answer is..." or "Based on my research".
-Only return the exact answer.
-QUESTION:
-{question}
-"""
-# Main agent function
-class GAIAAgent:
     def __init__(self):
-        self.llm = OpenAI(model="gpt-4-turbo", temperature=0)
     def __call__(self, task: dict) -> str:
         question = task.get("question", "")
-        attachment_url = task.get("attachment", "")
-        # Handle audio
-        if attachment_url.endswith((".mp3", ".wav")):
-            transcript = audio_tool.forward(attachment_url)
-            question += f"\n\nTranscript of attached audio:\n{transcript}"
-        # Handle image
-        elif attachment_url.endswith((".jpg", ".jpeg", ".png")):
-            return image_tool.forward(attachment_url, question)
-        # Handle Python file
-        elif attachment_url.endswith(".py"):
-            try:
-                code_text = requests.get(attachment_url).text
-                question += f"\n\nAttached Python file content:\n{code_text}"
-            except Exception as e:
-                return f"Error retrieving Python file: {e}"
-        # Wikipedia queries (if task type or instruction indicates)
-        if "wikipedia" in question.lower():
-            return wiki_tool.search(question)
-        # Build prompt
-        prompt = build_prompt(question)
-        # Run model
-        response = self.llm.chat.completions.create(
-            messages=[{"role": "system", "content": prompt}],
-            model="gpt-4-turbo"
-        )
-        return response.choices[0].message.content.strip()
 def run_and_submit_all(profile: gr.OAuthProfile | None):

 import os
 import requests
+import gradio as gr
+import pandas as pd
+from smolagents import CodeAgent, DuckDuckGoSearchTool
+from smolagents.models import OpenAIServerModel
 from audio_transcriber import AudioTranscriptionTool
 from image_analyzer import ImageAnalysisTool
 from wikipedia_searcher import WikipediaSearcher
+# Static system prompt for all completions
+SYSTEM_PROMPT = """You are an agent solving the GAIA benchmark and you are required to provide exact answers.
 Rules to follow:
 1. Return only the exact requested answer: no explanation and no reasoning.
 2. For yes/no questions, return exactly "Yes" or "No".
 - "October 5, 2001"
 - "Buenos Aires"
 Never include phrases like "the answer is..." or "Based on my research".
+Only return the exact answer."""
+class PatchedOpenAIServerModel(OpenAIServerModel):
+    def generate(self, messages, stop_sequences=None, **kwargs):
+        if isinstance(messages, list):
+            if not any(m["role"] == "system" for m in messages):
+                messages = [{"role": "system", "content": SYSTEM_PROMPT}] + messages
+        return super().generate(messages=messages, stop_sequences=stop_sequences, **kwargs)
+class MyAgent:
     def __init__(self):
+        self.model = PatchedOpenAIServerModel(model_id="gpt-4-turbo")
+        self.agent = CodeAgent(
+            tools=[
+                DuckDuckGoSearchTool(),
+                WikipediaSearcher(),
+                AudioTranscriptionTool(),
+                ImageAnalysisTool()
+            ],
+            model=self.model
+        )
     def __call__(self, task: dict) -> str:
         question = task.get("question", "")
+        attachment = task.get("attachment")
+        if attachment:
+            if attachment.endswith((".mp3", ".wav")):
+                question += f"\n\nAudio file: {attachment}"
+            elif attachment.endswith((".jpg", ".jpeg", ".png")):
+                question += f"\n\nImage file: {attachment}"
+            elif attachment.endswith(".py"):
+                try:
+                    content = requests.get(attachment).text
+                    question += f"\n\nPython code:\n{content}"
+                except Exception as e:
+                    question += f"\n\nError loading code: {e}"
+        return self.agent.run(question)
 def run_and_submit_all(profile: gr.OAuthProfile | None):