HF_Agents_Final_Project

Sleeping

App Files Files Community

Yago Bolivar committed on May 23

Commit

577039e

1 Parent(s): 27568a1

recover app.py and prompts.yaml from f3d56b

Browse files

Files changed (2) hide show

app.py +104 -26
prompts.yaml +89 -27

app.py CHANGED Viewed

@@ -26,21 +26,36 @@ DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 # --- Basic Agent Definition ---
-# # Configure the Language Model. Overloaded or not available
-# model = HfApiModel(
-#     max_tokens=2096,
-#     temperature=0.5,
-# #    model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud/', # nope
-# #    model_id='Qwen/Qwen2.5-Coder-32B-Instruct',# it is possible that this model may be overloaded
-#     custom_role_conversions=None,
-# )
-# Try to use OpenAI API
-model = OpenAIServerModel(
-    model_id="gpt-4o",
-    api_base="https://api.openai.com/v1",
-    api_key=os.environ["OPENAI_API_KEY"],
-)
 # Instantiate Tools
 final_answer_tool = FinalAnswerTool()
@@ -54,24 +69,86 @@ spreadsheet_tool = SpreadsheetTool()
 text_reversal_tool = TextReversalTool()
 video_processing_tool = VideoProcessingTool()
 # Load Prompts
 try:
     with open("prompts.yaml", 'r') as stream:
         prompt_templates = yaml.safe_load(stream)
 except FileNotFoundError:
-    print("Error: prompts.yaml not found. Please ensure it is in the root project directory.")
-    prompt_templates = {} # Fallback to empty templates
 except yaml.YAMLError as e:
     print(f"Error parsing prompts.yaml: {e}")
-    prompt_templates = {}
-# Enhance the agent class to conform to the template's interface
 class EnhancedCodeAgent(CodeAgent):
     def __call__(self, question: str) -> str:
-        response = self.run(question)
-        return response
 # Create the Agent
 agent_tools = [
     final_answer_tool,
@@ -86,13 +163,14 @@ agent_tools = [
     video_processing_tool
 ]
 agent = EnhancedCodeAgent(
     model=model,
     tools=agent_tools,
-    max_steps=15,
-    verbosity_level=1,
-    name="ComprehensiveQuestionAgent",
-    description="An agent equipped with a suite of tools to answer diverse questions from the common_questions.json set.",
     prompt_templates=prompt_templates
 )

 # --- Basic Agent Definition ---
+# Enhanced Phase 1: Lightweight Model and Token Management for HF Spaces
+try:
+    # Try OpenAI first (if API key available) - Use mini version for better token management
+    model = OpenAIServerModel(
+        model_id="gpt-4o-mini",  # Use mini version for better token management
+        api_base="https://api.openai.com/v1",
+        api_key=os.environ.get("OPENAI_API_KEY"),
+        max_tokens=2000,  # Increased from 1000 for better reasoning capability
+        temperature=0.1,  # Lower temperature for more consistent outputs
+    )
+    print("Using OpenAI gpt-4o-mini model")
+except Exception as e:
+    print(f"OpenAI model initialization failed: {e}")
+    # Fallback to HF model - More capable than DialoGPT-medium
+    try:
+        model = HfApiModel(
+            model_id="microsoft/DialoGPT-large",  # Upgraded from medium for better capability
+            max_tokens=2000,
+            temperature=0.1,
+            custom_role_conversions=None,
+        )
+        print("Using fallback HF DialoGPT-large model")
+    except Exception as fallback_error:
+        print(f"Fallback model initialization failed: {fallback_error}")
+        # Final fallback to basic HF model
+        model = HfApiModel(
+            max_tokens=2000,
+            temperature=0.1,
+        )
+        print("Using basic HF model as final fallback")
 # Instantiate Tools
 final_answer_tool = FinalAnswerTool()
 text_reversal_tool = TextReversalTool()
 video_processing_tool = VideoProcessingTool()
+# Add debug prints for file paths
+print("Current directory:", os.getcwd())
+print("prompts.yaml exists:", os.path.exists("prompts.yaml"))
 # Load Prompts
 try:
     with open("prompts.yaml", 'r') as stream:
         prompt_templates = yaml.safe_load(stream)
+        print("Loaded prompts.yaml successfully. Structure:", type(prompt_templates))  # Debug
+        if isinstance(prompt_templates, dict):
+            print("Keys:", prompt_templates.keys())  # Debug
+        else:
+            print("Loaded prompt_templates is not a dictionary.")
 except FileNotFoundError:
+    print("Error: prompts.yaml not found. Using default templates.")
+    prompt_templates = {
+        "system_prompt": { # This was a single string, now a dict
+            "base": "You are an expert assistant...", # Default value
+            "with_tools": "At each step...", # Default value
+        },
+        "system": { # This section was already a dict, kept for consistency
+            "base": "You are a GAIA benchmark agent running in HF Spaces. Be concise and efficient in your responses.",
+            "with_tools": "Think briefly, act decisively. Use tools efficiently to solve GAIA benchmark tasks."
+        },
+        "human": {
+            "base": "Here is your task: {{task}}\\\\nProvide exact answer. Be concise and efficient.", # Updated base
+            "with_tools": "Here is your task: {{task}}\\\\nUse available tools strategically. Be direct and resource-conscious: {{tools}}" # Updated with_tools
+        },
+        "planning": {
+            "initial_facts": "Task: {{task}}. Identify key facts and missing information concisely.",
+            "initial_plan": "Develop an efficient 3-5 step plan for this GAIA task using available tools."
+            # etc...
+        },
+        "managed_agent": {
+            "task": "Managed agent task: {{task}}",
+            "report": "Managed agent report: {{final_answer}}"
+        },
+        "final_answer": {
+            "base": "The final answer is: {{answer}}"
+        }
+        # Include all other required sections as per your YAML structure if they exist
+    }
 except yaml.YAMLError as e:
     print(f"Error parsing prompts.yaml: {e}")
+    print("Using default templates optimized for HF Spaces")
+    prompt_templates = {
+        "system_prompt": "You are a helpful AI assistant. Please be concise and efficient.",
+        "system": {
+            "base": "You are a GAIA benchmark agent running in HF Spaces. Be concise and efficient in your responses.",
+            "with_tools": "Think briefly, act decisively. Use tools efficiently to solve GAIA benchmark tasks."
+        },
+        "human": {
+            "base": "GAIA Task: {{task}}\\\\nProvide exact answer. Be concise and efficient.",
+            "with_tools": "GAIA Task: {{task}}\\\\nUse available tools strategically. Be direct and resource-conscious: {{tools}}"
+        },
+        "planning": {
+            "initial_facts": "Task: {{task}}. Identify key facts and missing information concisely.",
+            "initial_plan": "Develop an efficient 3-5 step plan for this GAIA task using available tools."
+        },
+        "managed_agent": {
+            "task": "Managed agent task: {{task}}",
+            "report": "Managed agent report: {{final_answer}}"
+        },
+        "final_answer": { # Placeholder, structure might need refinement based on agent's specific use
+            "base": "The final answer is: {{answer}}"
+        }
+    }
+# Enhanced agent configuration for HF Spaces optimization
 class EnhancedCodeAgent(CodeAgent):
     def __call__(self, question: str) -> str:
+        try:
+            response = self.run(question)
+            return response
+        except Exception as e:
+            print(f"Agent execution error: {e}")
+            # Provide a graceful fallback response
+            return f"I encountered an issue while processing your request. Here's what I know: {str(e)}"
 # Create the Agent
 agent_tools = [
     final_answer_tool,
     video_processing_tool
 ]
+# Enhanced agent configuration for HF Spaces optimization
 agent = EnhancedCodeAgent(
     model=model,
     tools=agent_tools,
+    max_steps=8,  # Increased from 5 to handle multi-step reasoning while staying efficient
+    verbosity_level=1,  # Keep some verbosity for debugging in HF Spaces
+    name="GAIAAgent",  # Updated name to reflect GAIA benchmark focus
+    description="Efficient GAIA benchmark agent optimized for HF Spaces with enhanced token management",
     prompt_templates=prompt_templates
 )

prompts.yaml CHANGED Viewed

@@ -1,4 +1,4 @@
-system:
   base: |-
     You are an expert assistant who can solve any task using code blobs. You will be given a task to solve as best you can.
     To do so, you have been given access to a list of tools: these tools are basically Python functions which you can call with code.
@@ -9,20 +9,18 @@ system:
     During each intermediate step, you can use 'print()' to save whatever important information you will then need.
     These print outputs will then appear in the 'Observation:' field, which will be available as input for the next step.
     In the end you have to return a final answer using the `final_answer` tool.
     You have access to these tools:
-    {% raw %}{%- for tool in tools.values() %}{% endraw %}
-    - {{ tool.name }}: {{ tool.description }}
-        Takes inputs: {{tool.inputs}}
-        Returns an output of type: {{tool.output_type}}
-    {% raw %}{%- endfor %}{% endraw %}# filepath: /Users/yagoairm2/Desktop/agents/final project/HF_Agents_Final_Project/prompts.yaml
-  Current subtask: {{subtask}}
-  {% if context %}
-  Additional context: {{context}}
-  {% endif %}
-  Provide your response in a clear and structured format that the manager agent can use.
 human:
   base: |-
@@ -38,13 +36,80 @@ human:
 planning:
   initial_facts: |-
     Below I will present you a task.
     You will now build a comprehensive preparatory survey of which facts we have at our disposal and which ones we still need.
     To do so, you will have to read the task and identify things that must be discovered in order to successfully complete it.
-    Don't make any assumptions. For each item, provide a thorough reasoning.
   initial_plan: |-
     You are a world expert at making efficient plans to solve any task using a set of carefully crafted tools.
     Now for the given task, develop a step-by-step high-level plan taking into account the above inputs and list of facts.
 managed_agent:
   task: |-
@@ -54,23 +119,20 @@ managed_agent:
     Task:
     {{task}}
     ---
-    You're helping your manager solve a wider task: so make sure to not provide a one-line answer.
   report: |-
     Here is the final answer from your managed agent '{{name}}':
     {{final_answer}}
-  Current subtask: {{subtask}}
-  {% if context %}
-  Additional context: {{context}}
-  {% endif %}
-  Provide your response in a clear and structured format that the manager agent can use.
-planning: |-
-  Here's my plan to solve this task:
-  {{plan}}
 manager_prompt: |
   Task: {{task_description}}
   {% if file_url %}
@@ -88,4 +150,4 @@ manager_prompt: |
   Based on the task and any provided file, devise a plan and call the appropriate agent(s) to gather information and formulate an answer.
   Generate the Python code to call these agents and produce the final answer.
-  Your final response should be the answer to the task.

+system_prompt:
   base: |-
     You are an expert assistant who can solve any task using code blobs. You will be given a task to solve as best you can.
     To do so, you have been given access to a list of tools: these tools are basically Python functions which you can call with code.
     During each intermediate step, you can use 'print()' to save whatever important information you will then need.
     These print outputs will then appear in the 'Observation:' field, which will be available as input for the next step.
     In the end you have to return a final answer using the `final_answer` tool.
     You have access to these tools:
+    - WebSearchAgent: Call this agent for web browsing and fetching URL content.
+    - FileProcessorAgent: Call this agent for identifying file types, parsing spreadsheets, transcribing audio, and parsing markdown tables.
+    - VisionAgent: Call this agent for image processing, OCR, and chess image analysis.
+    - VideoAgent: Call this agent for video processing tasks.
+    - CodeInterpreterAgent: Call this agent to execute Python code.
+    - TextToolAgent: Call this agent for simple text manipulations like reversing text.
+final_answer: |-
+  Here is the final answer to the task:
+  {{answer}}
 human:
   base: |-
 planning:
   initial_facts: |-
     Below I will present you a task.
     You will now build a comprehensive preparatory survey of which facts we have at our disposal and which ones we still need.
     To do so, you will have to read the task and identify things that must be discovered in order to successfully complete it.
+    Don't make any assumptions. For each item, provide a thorough reasoning. Here is how you will structure this survey:
+    ---
+    ### 1. Facts given in the task
+    List here the specific facts given in the task that could help you (there might be nothing here).
+    ### 2. Facts to look up
+    List here any facts that we may need to look up.
+    Also list where to find each of these, for instance a website, a file... - maybe the task contains some sources that you should re-use here.
+    ### 3. Facts to derive
+    List here anything that we want to derive from the above by logical reasoning, for instance computation or simulation.
   initial_plan: |-
     You are a world expert at making efficient plans to solve any task using a set of carefully crafted tools.
     Now for the given task, develop a step-by-step high-level plan taking into account the above inputs and list of facts.
+    This plan should involve individual tasks based on the available tools, that if executed correctly will yield the correct answer.
+    Do not skip steps, do not add any superfluous steps. Only write the high-level plan, DO NOT DETAIL INDIVIDUAL TOOL CALLS.
+    After writing the final step of the plan, write the '\n<end_plan>' tag and stop there.
+  update_facts_pre_messages: |-
+    You are a world expert at gathering known and unknown facts based on a conversation.
+    Below you will find a task, and a history of attempts made to solve the task. You will have to produce a list of these:
+    ### 1. Facts given in the task
+    ### 2. Facts that we have learned
+    ### 3. Facts still to look up
+    ### 4. Facts still to derive
+    Find the task and history below:
+  update_facts_post_messages: |-
+    Earlier we've built a list of facts.
+    But in your previous steps you may have learned useful new facts or invalidated some false ones.
+    Please update your list of facts based on the previous history, and provide these headings:
+    ### 1. Facts given in the task
+    ### 2. Facts that we have learned
+    ### 3. Facts still to look up
+    ### 4. Facts still to derive
+    Now write your new list of facts below.
+  update_plan_pre_messages: |-
+    You are a world expert at making efficient plans to solve any task using a set of carefully crafted tools.
+    You have been given a task:
+    ```
+    {{task}}
+    ```
+    Find below the record of what has been tried so far to solve it. Then you will be asked to make an updated plan to solve the task.
+    If the previous tries so far have met some success, you can make an updated plan based on these actions.
+    If you are stalled, you can make a completely new plan starting from scratch.
+  update_plan_post_messages: |-
+    You're still working towards solving this task:
+    ```
+    {{task}}
+    ```
+    You can leverage these tools:
+    {{tools}}
+    Here is the up to date list of facts that you know:
+    ```
+    {{facts_update}}
+    ```
+    Now for the given task, develop a step-by-step high-level plan taking into account the above inputs and list of facts.
+    This plan should involve individual tasks based on the available tools, that if executed correctly will yield the correct answer.
+    Beware that you have {{remaining_steps}} steps remaining.
+    Do not skip steps, do not add any superfluous steps. Only write the high-level plan, DO NOT DETAIL INDIVIDUAL TOOL CALLS.
+    After writing the final step of the plan, write the '\n<end_plan>' tag and stop there.
 managed_agent:
   task: |-
     Task:
     {{task}}
     ---
+    You're helping your manager solve a wider task: so make sure to not provide a one-line answer, but give as much information as possible to give them a clear understanding of the answer.
+    Your final_answer WILL HAVE to contain these parts:
+    ### 1. Task outcome (short version):
+    ### 2. Task outcome (extremely detailed version):
+    ### 3. Additional context (if relevant):
+    Put all these in your final_answer tool, everything that you do not pass as an argument to final_answer will be lost.
+    And even if your task resolution is not successful, please return as much context as possible, so that your manager can act upon this feedback.
   report: |-
     Here is the final answer from your managed agent '{{name}}':
     {{final_answer}}
 manager_prompt: |
   Task: {{task_description}}
   {% if file_url %}
   Based on the task and any provided file, devise a plan and call the appropriate agent(s) to gather information and formulate an answer.
   Generate the Python code to call these agents and produce the final answer.
+  Your final response should be the answer to the task.