Final_Assignment_Template

Sleeping

App Files Files Community

IngoTB303 committed on Apr 28

Commit

1aa16a4

1 Parent(s): 81917a3

Refactor app structure: add agent and tools, enhance question fetching with attachments, and update requirements

Browse files

Files changed (7) hide show

.gitignore +96 -0
TODOs.txt +6 -0
agent.py +34 -0
agent_tools.py +71 -0
app-test.py +139 -0
app.py +33 -12
requirements.txt +6 -1

.gitignore ADDED Viewed

	@@ -0,0 +1,96 @@

+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+# C extensions
+*.so
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+*.egg-info/
+.installed.cfg
+*.egg
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+.hypothesis/
+.pytest_cache/
+# Jupyter Notebook
+.ipynb_checkpoints
+# pyenv
+.python-version
+# mypy
+.mypy_cache/
+.dmypy.json
+# Pyre type checker
+.pyre/
+# VS Code
+.vscode/
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+# IDEs
+.idea/
+*.sublime-workspace
+*.sublime-project
+# Mac
+.DS_Store
+# Windows
+Thumbs.db
+Desktop.ini
+# Logs
+*.log
+# Local config
+*.local
+# Secret files
+*.secret
+*.key
+*.pem
+# Azure
+.azure/
+app_tokens.py
+questions.json
+answers.json

TODOs.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+Notes:
+- prompt tuning
+- check existing agents
+- check existing classes for tools: video/image capabilities, audio transcription, etc.
+- check out different models
+- check out https://huggingface.co/blog/open-deep-research#using-a-codeagent and https://github.com/huggingface/smolagents/tree/main/examples/open_deep_research

agent.py ADDED Viewed

	@@ -0,0 +1,34 @@

+import agent_tools
+from smolagents import CodeAgent, FinalAnswerTool, DuckDuckGoSearchTool, AzureOpenAIServerModel
+import app_tokens
+# Azure OpenAI model shared by the agents defined in this module. The model id,
+# endpoint, API key and API version are read from the local app_tokens module.
+model = AzureOpenAIServerModel(
+    model_id = app_tokens.AZURE_OPENAI_MODEL,
+    azure_endpoint = app_tokens.AZURE_OPENAI_ENDPOINT,
+    api_key = app_tokens.AZURE_OPENAI_API_KEY,
+    api_version = app_tokens.OPENAI_API_VERSION
+)
+class BasicAgent:
+    def __init__(self):
+        self.web_agent = CodeAgent(
+            model=model,
+            tools=[agent_tools.VisitWebpageTool(), FinalAnswerTool(), DuckDuckGoSearchTool()],
+            max_steps=8,
+            name="web_agent",
+            description="Runs web searches for you."
+        )
+        self.manager_agent = CodeAgent(
+            model=model,
+            tools=[],
+            managed_agents=[self.web_agent],
+            additional_authorized_imports=["json","pandas","numpy", "regex"],
+            planning_interval=5,
+            verbosity_level=2,
+            max_steps=12,
+        )
+    def forward(self, question: str) -> str:
+        result = self.manager_agent.run(question)
+        return result

agent_tools.py ADDED Viewed

	@@ -0,0 +1,71 @@

+from smolagents import tool, Tool
+from tavily import TavilyClient
+import app_tokens
+@tool
+def web_search(query: str, proxy: bool = False) -> str:
+    """Searches the web for your query.
+    Args:
+        query: Your query.
+        proxy: An optional boolean parameter, if a local proxy should be used or not.
+    """
+    # tavily_client = TavilyClient(api_key=os.getenv("TAVILY_API_KEY"))
+    if proxy:
+        tavily_client = TavilyClient(api_key=app_tokens.get_tavily_api_key(), proxies={'http': 'http://localhost:3128', 'https': 'http://localhost:3128'}, verify=False)
+    else:
+        tavily_client = TavilyClient(api_key=app_tokens.get_tavily_api_key())
+    response = tavily_client.search(query)
+    return str(response["results"])
+class VisitWebpageTool(Tool):
+    name = "visit_webpage"
+    description = (
+        "Visits a webpage at the given url and reads its content as a markdown string. Use this to browse webpages."
+    )
+    inputs = {
+        "url": {
+            "type": "string",
+            "description": "The url of the webpage to visit.",
+        },
+        "proxy": {
+            "type": "boolean",
+            "description": "An optional boolean parameter, if a local proxy should be used or not. Should be True, if the request timed out.",
+            "nullable": "True",
+        },
+    }
+    output_type = "string"
+    def forward(self, url: str, proxy: bool = True) -> str:
+        try:
+            import re
+            import requests
+            from markdownify import markdownify
+            from requests.exceptions import RequestException
+            from smolagents.utils import truncate_content
+        except ImportError as e:
+            raise ImportError(
+                "You must install packages `markdownify` and `requests` to run this tool: for instance run `pip install markdownify requests`."
+            ) from e
+        try:
+            if proxy:
+                response = requests.get(url, timeout=20, proxies={'http': 'http://localhost:3128', 'https': 'http://localhost:3128'}, verify=False)
+            else:
+                response = requests.get(url, timeout=20)
+            response.raise_for_status()  # Raise an exception for bad status codes
+            markdown_content = markdownify(response.text).strip()
+            markdown_content = re.sub(r"\n{3,}", "\n\n", markdown_content)
+            return truncate_content(markdown_content, 40000)
+        except requests.exceptions.Timeout:
+            return "The request timed out. Please try again later or check the URL."
+        except RequestException as e:
+            return f"Error fetching the webpage: {str(e)}"
+        except Exception as e:
+            return f"An unexpected error occurred: {str(e)}"
+# test = VisitWebpageTool()
+# print(test.forward("https://www.wikipedia.de", proxy=True))

app-test.py ADDED Viewed

	@@ -0,0 +1,139 @@

+import requests
+from huggingface_hub import login
+import agent
+import json
+import base64
+# Base URL of the scoring service; the endpoint URLs below are derived from it.
+DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
+# Link to the Space's code; passed as `agent_code` when answers are submitted.
+SPACE_ID = "https://huggingface.co/spaces/IngoTB303/Final_Assignment_Template/tree/main"
+api_url = DEFAULT_API_URL
+questions_url = f"{api_url}/questions"
+# The task id is appended to this URL to download a question's attachment.
+attachments_url = f"{api_url}/files/"
+submit_url = f"{api_url}/submit"
+# NOTE: this rebinds the name `agent` from the imported module to a BasicAgent
+# instance; run_agent() uses that instance.
+agent = agent.BasicAgent()
+def fetch_questions(proxy: bool = True):
+    """Fetch questions from the API endpoint."""
+    print(f"Fetching questions from: {questions_url}")
+    try:
+        if proxy:
+            response = requests.get(questions_url, timeout=30, proxies={'http': 'http://localhost:3128', 'https': 'http://localhost:3128'}, verify=False)
+        else:
+            response = requests.get(questions_url, timeout=30)
+        response.raise_for_status()
+        questions_data = response.json()
+        if not questions_data:
+            return None
+        # Fetch attachments for questions with file_name
+        for question in questions_data:
+            file_name = question.get("file_name", "")
+            task_id = question.get("task_id")
+            if file_name and task_id:
+                try:
+                    if proxy:
+                        att_response = requests.get(f"{attachments_url}{task_id}", timeout=15, proxies={'http': 'http://localhost:3128', 'https': 'http://localhost:3128'}, verify=False)
+                    else:
+                        att_response = requests.get(f"{attachments_url}{task_id}", timeout=15)
+                    att_response.raise_for_status()
+                    # Encode binary content to base64 string
+                    question["attachment_b64"] = base64.b64encode(att_response.content).decode("utf-8")
+                except Exception as e:
+                    print(f"Error fetching attachment for task {task_id}: {e}")
+                    question["attachment_b64"] = None
+        return questions_data
+    except Exception as e:
+        print(f"Error fetching questions: {e}")
+    finally:
+        if questions_data:
+            with open("questions.json", "w", encoding="utf-8") as f:
+                json.dump(questions_data, f, ensure_ascii=False, indent=2)
+def run_agent(questions_data):
+    answers_payload = []
+    print(f"Running agent on {len(questions_data)} questions...")
+    for item in questions_data:
+        task_id = item.get("task_id")
+        question_text = item.get("question", "")
+        attachment_b64 = item.get("attachment_b64", "")
+        # Concatenate question and attachment_b64 if present
+        if attachment_b64:
+            question_text = f"{question_text}\n\n[ATTACHMENT:]\n{attachment_b64}"
+        if not task_id or question_text is None:
+            print(f"Skipping item with missing task_id or question: {item}")
+            continue
+        try:
+            submitted_answer = agent.forward(question=question_text)
+            answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
+        except Exception as e:
+             print(f"Error running agent on task {task_id}: {e}")
+    return answers_payload
+def load_questions(filename):
+    """Load questions from a local JSON file and return as questions_data."""
+    try:
+        with open(filename, "r", encoding="utf-8") as f:
+            questions_data = json.load(f)
+        return questions_data
+    except Exception as e:
+        print(f"Error loading questions from {filename}: {e}")
+        return None
+def load_answers(filename):
+    """Load answers from a local JSON file."""
+    try:
+        with open(filename, "r", encoding="utf-8") as f:
+            answers = json.load(f)
+        return answers
+    except Exception as e:
+        print(f"Error loading answers from {filename}: {e}")
+        return None
+def submit_answers_to_hf(username, agent_code, answers_payload):
+    # Prepare Submission
+    submission_data = {"username": username.strip(), "agent_code": agent_code, "answers": answers_payload}
+    status_update = f"Agent finished. Submitting {len(answers_payload)} answers for user '{username}'..."
+    print(status_update)
+    # Submit
+    print(f"Submitting {len(answers_payload)} answers to: {submit_url}")
+    try:
+        response = requests.post(submit_url, json=submission_data, timeout=60)
+        response.raise_for_status()
+        result_data = response.json()
+        final_status = (
+            f"Submission Successful!\n"
+            f"User: {result_data.get('username')}\n"
+            f"Overall Score: {result_data.get('score', 'N/A')}% "
+            f"({result_data.get('correct_count', '?')}/{result_data.get('total_attempted', '?')} correct)\n"
+            f"Message: {result_data.get('message', 'No message received.')}"
+        )
+        print("Submission successful.")
+        return final_status
+    except Exception as e:
+        status_message = f"An unexpected error occurred during submission: {e}"
+        print(status_message)
+        return status_message
+# Manual workflow: the steps below are switched on and off by (un)commenting them.
+# Step 1 (author's note: for use without proxy) - fetch the questions;
+# fetch_questions() also writes them to questions.json.
+# questions = fetch_questions()
+# Step 2 (author's note: for use with proxy) - reload the questions saved by step 1.
+questions = load_questions("questions.json")
+# Optional check: print the questions to verify that they were loaded.
+# for question in questions:
+#     print(question["question"],"\n")
+# Step 3 (author's note: for use with proxy) - run the agent on the questions.
+# answers = run_agent(questions)
+# Save the answers so that they can be submitted later without the proxy.
+# if answers:
+#     with open("answers.json", "w", encoding="utf-8") as f:
+#         json.dump(answers, f, ensure_ascii=False, indent=2)
+# Step 4 - submit the saved answers to Hugging Face and print the result.
+answers = load_answers("answers.json")
+assignment_results = submit_answers_to_hf("IngoTB303", SPACE_ID, answers)
+print(assignment_results)

app.py CHANGED Viewed

@@ -3,21 +3,25 @@ import gradio as gr
 import requests
 import inspect
 import pandas as pd
 # (Keep Constants as is)
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
-# --- Basic Agent Definition ---
-# ----- THIS IS WERE YOU CAN BUILD WHAT YOU WANT ------
-class BasicAgent:
-    def __init__(self):
-        print("BasicAgent initialized.")
-    def __call__(self, question: str) -> str:
-        print(f"Agent received question (first 50 chars): {question[:50]}...")
-        fixed_answer = "This is a default answer."
-        print(f"Agent returning fixed answer: {fixed_answer}")
-        return fixed_answer
 def run_and_submit_all( profile: gr.OAuthProfile | None):
     """
@@ -36,11 +40,12 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
     api_url = DEFAULT_API_URL
     questions_url = f"{api_url}/questions"
     submit_url = f"{api_url}/submit"
     # 1. Instantiate Agent ( modify this part to create your agent)
     try:
-        agent = BasicAgent()
     except Exception as e:
         print(f"Error instantiating agent: {e}")
         return f"Error initializing agent: {e}", None
@@ -58,6 +63,18 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
              print("Fetched questions list is empty.")
              return "Fetched questions list is empty or invalid format.", None
         print(f"Fetched {len(questions_data)} questions.")
     except requests.exceptions.RequestException as e:
         print(f"Error fetching questions: {e}")
         return f"Error fetching questions: {e}", None
@@ -75,7 +92,11 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
     print(f"Running agent on {len(questions_data)} questions...")
     for item in questions_data:
         task_id = item.get("task_id")
-        question_text = item.get("question")
         if not task_id or question_text is None:
             print(f"Skipping item with missing task_id or question: {item}")
             continue

 import requests
 import inspect
 import pandas as pd
+from smolagents import CodeAgent, HfApiModel, FinalAnswerTool, DuckDuckGoSearchTool, AzureOpenAIServerModel
+from huggingface_hub import login
+import app_tokens
+login(os.getenv('HF_API_KEY'))
 # (Keep Constants as is)
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
+model = AzureOpenAIServerModel(
+    model_id = app_tokens.AZURE_OPENAI_MODEL,
+    azure_endpoint = app_tokens.AZURE_OPENAI_ENDPOINT,
+    api_key = app_tokens.AZURE_OPENAI_API_KEY,
+    api_version = app_tokens.OPENAI_API_VERSION
+)
 def run_and_submit_all( profile: gr.OAuthProfile | None):
     """
     api_url = DEFAULT_API_URL
     questions_url = f"{api_url}/questions"
+    attachments_url = f"{api_url}/files/"
     submit_url = f"{api_url}/submit"
     # 1. Instantiate Agent ( modify this part to create your agent)
     try:
+        agent = agent.BasicAgent()
     except Exception as e:
         print(f"Error instantiating agent: {e}")
         return f"Error initializing agent: {e}", None
              print("Fetched questions list is empty.")
              return "Fetched questions list is empty or invalid format.", None
         print(f"Fetched {len(questions_data)} questions.")
+        # Fetch attachments for questions with file_name
+        for q in questions_data:
+            file_name = q.get("file_name", "")
+            task_id = q.get("task_id")
+            if file_name and task_id:
+                try:
+                    att_response = requests.get(f"{attachments_url}{task_id}", timeout=15)
+                    att_response.raise_for_status()
+                    q["attachment_b64"] = att_response.text
+                except Exception as e:
+                    print(f"Error fetching attachment for task {task_id}: {e}")
+                    q["attachment_b64"] = None
     except requests.exceptions.RequestException as e:
         print(f"Error fetching questions: {e}")
         return f"Error fetching questions: {e}", None
     print(f"Running agent on {len(questions_data)} questions...")
     for item in questions_data:
         task_id = item.get("task_id")
+        question_text = item.get("question", "")
+        attachment_b64 = item.get("attachment_b64", "")
+        # Concatenate question and attachment_b64 if present
+        if attachment_b64:
+            question_text = f"{question_text}\n\n[ATTACHMENT:]\n{attachment_b64}"
         if not task_id or question_text is None:
             print(f"Skipping item with missing task_id or question: {item}")
             continue

requirements.txt CHANGED Viewed

@@ -1,2 +1,7 @@
 gradio
-requests

 gradio
+requests
+tavily-python
+smolagents
+regex
+pandas
+numpy