Final_Assignment_Template

Sleeping

App Files Files Community

dawid-lorek committed 10 days ago

Commit

6e92f6f

verified ·

1 Parent(s): dc1160b

Update app.py

Browse files

Files changed (1) hide show

app.py +36 -24

app.py CHANGED Viewed

@@ -1,41 +1,57 @@
 import os
 import gradio as gr
 import requests
 import pandas as pd
-from smolagents import CodeAgent, DuckDuckGoSearchTool, OpenAIServerModel
 # Constants
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
-MAX_QUESTION_LENGTH = 4000  # Character-based limit for questions
-MAX_WEBPAGE_CONTENT = 3000  # Character limit for visited pages (GPT-4 context safe)
-# --- Agent Definition ---
 class SmartGAIAAgent:
     def __init__(self):
         self.api_key = os.getenv("OPENAI_API_KEY")
         if not self.api_key:
             raise ValueError("Missing OPENAI_API_KEY")
         self.model = OpenAIServerModel(model_id="gpt-4", api_key=self.api_key)
         self.agent = CodeAgent(
-            tools=[DuckDuckGoSearchTool()],
             model=self.model,
             add_base_tools=True
         )
-    def truncate_if_needed(self, question: str) -> str:
         return question[:MAX_QUESTION_LENGTH]
     def __call__(self, question: str) -> str:
         try:
-            clean_question = self.truncate_if_needed(question)
             result = self.agent.run(clean_question)
             return result.strip()
         except Exception as e:
             print(f"Agent error: {e}")
             return "error"
 def run_and_submit_all(profile: gr.OAuthProfile | None):
     space_id = os.getenv("SPACE_ID")
     if profile:
@@ -44,9 +60,8 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
     else:
         return "Please Login to Hugging Face with the button.", None
-    api_url = DEFAULT_API_URL
-    questions_url = f"{api_url}/questions"
-    submit_url = f"{api_url}/submit"
     try:
         agent = SmartGAIAAgent()
@@ -54,7 +69,6 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         return f"Error initializing agent: {e}", None
     agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
-    print(f"Code link: {agent_code}")
     try:
         response = requests.get(questions_url, timeout=15)
@@ -70,18 +84,16 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         task_id = item.get("task_id")
         question_text = item.get("question", "")
-        # Skip problematic questions
-        skip_keywords = [
-            'attached', '.mp3', '.wav', '.png', '.jpg', '.jpeg',
-            'youtube', '.mp4', 'video', 'listen', 'watch'
-        ]
         if not task_id or not question_text:
             continue
         if len(question_text) > MAX_QUESTION_LENGTH:
             print(f"Skipping long question: {task_id}")
             continue
-        if any(keyword in question_text.lower() for keyword in skip_keywords):
-            print(f"Skipping unsupported question ({task_id}): {question_text[:60]}...")
             continue
         try:
@@ -113,17 +125,17 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         response.raise_for_status()
         result_data = response.json()
         final_status = (
-            f"Submission Successful!\n"
-            f"User: {result_data.get('username')}\n"
             f"Score: {result_data.get('score')}% "
-            f"({result_data.get('correct_count')}/{result_data.get('total_attempted')})\n"
             f"Message: {result_data.get('message')}"
         )
         return final_status, pd.DataFrame(results_log)
     except Exception as e:
         return f"Submission failed: {e}", pd.DataFrame(results_log)
-# --- Gradio UI ---
 with gr.Blocks() as demo:
     gr.Markdown("# 🧠 GAIA Agent Evaluation")
     gr.Markdown("""

 import os
+import time
 import gradio as gr
 import requests
 import pandas as pd
+from smolagents import CodeAgent, OpenAIServerModel
+from langchain_community.tools import DuckDuckGoSearchRun
 # Constants
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
+MAX_QUESTION_LENGTH = 4000
+MAX_WEBPAGE_CONTENT = 3000
+# --- Reliable DuckDuckGo Tool with Retry ---
class ReliableDuckDuckGoTool(DuckDuckGoSearchRun):
    """DuckDuckGo search tool that retries when the search is rate limited."""

    def _run(self, query: str) -> str:
        """Run the search, retrying up to three times on rate-limit errors.

        An error counts as a rate limit when its message contains
        ``"ratelimit"`` (case-insensitive) or ``"202"``.

        Args:
            query: Search query forwarded to the parent tool's ``_run``.

        Returns:
            The parent tool's result for *query*.

        Raises:
            RuntimeError: If every attempt was rate limited. The last
                rate-limit error is attached as ``__cause__``.
            Exception: Any error that is not a rate limit is re-raised
                unchanged on the first occurrence.
        """
        max_attempts = 3
        last_error = None
        for attempt in range(1, max_attempts + 1):
            try:
                return super()._run(query)
            except Exception as e:
                message = str(e).lower()
                if "ratelimit" not in message and "202" not in message:
                    # Not a rate limit: keep the original traceback intact.
                    raise
                last_error = e
                print(f"Rate limited. Retry {attempt}/{max_attempts}...")
                # Linear backoff, but only when another attempt follows;
                # sleeping after the final failure would just delay the error.
                if attempt < max_attempts:
                    time.sleep(3 * attempt)
        raise RuntimeError("DuckDuckGo search failed after retries") from last_error
+# --- Smart GAIA Agent ---
 class SmartGAIAAgent:
     def __init__(self):
         self.api_key = os.getenv("OPENAI_API_KEY")
         if not self.api_key:
             raise ValueError("Missing OPENAI_API_KEY")
         self.model = OpenAIServerModel(model_id="gpt-4", api_key=self.api_key)
         self.agent = CodeAgent(
+            tools=[ReliableDuckDuckGoTool()],
             model=self.model,
             add_base_tools=True
         )
+    def truncate_question(self, question: str) -> str:
         return question[:MAX_QUESTION_LENGTH]
     def __call__(self, question: str) -> str:
         try:
+            clean_question = self.truncate_question(question)
             result = self.agent.run(clean_question)
             return result.strip()
         except Exception as e:
             print(f"Agent error: {e}")
             return "error"
+# --- Evaluation + Submission ---
 def run_and_submit_all(profile: gr.OAuthProfile | None):
     space_id = os.getenv("SPACE_ID")
     if profile:
     else:
         return "Please Login to Hugging Face with the button.", None
+    questions_url = f"{DEFAULT_API_URL}/questions"
+    submit_url = f"{DEFAULT_API_URL}/submit"
     try:
         agent = SmartGAIAAgent()
         return f"Error initializing agent: {e}", None
     agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
     try:
         response = requests.get(questions_url, timeout=15)
         task_id = item.get("task_id")
         question_text = item.get("question", "")
         if not task_id or not question_text:
             continue
         if len(question_text) > MAX_QUESTION_LENGTH:
             print(f"Skipping long question: {task_id}")
             continue
+        if any(keyword in question_text.lower() for keyword in [
+            'attached', '.mp3', '.wav', '.png', '.jpg', '.jpeg',
+            'youtube', '.mp4', 'video', 'listen', 'watch'
+        ]):
+            print(f"Skipping unsupported media question: {task_id}")
             continue
         try:
         response.raise_for_status()
         result_data = response.json()
         final_status = (
+            f"Submission Successful!\\n"
+            f"User: {result_data.get('username')}\\n"
             f"Score: {result_data.get('score')}% "
+            f"({result_data.get('correct_count')}/{result_data.get('total_attempted')})\\n"
             f"Message: {result_data.get('message')}"
         )
         return final_status, pd.DataFrame(results_log)
     except Exception as e:
         return f"Submission failed: {e}", pd.DataFrame(results_log)
+# --- Gradio Interface ---
 with gr.Blocks() as demo:
     gr.Markdown("# 🧠 GAIA Agent Evaluation")
     gr.Markdown("""