Final_Assignment_AWorld

Sleeping

App Files Files Community

Jofthomas commited on Apr 22

Commit

e80aab9

verified ·

1 Parent(s): fa7d846

Update app.py

Browse files

Files changed (1) hide show

app.py +416 -81

app.py CHANGED Viewed

@@ -1,16 +1,21 @@
 import os
 import gradio as gr
-# Keep using gradio.ChatMessage for type hints if needed, but not for yielding complex structures directly to ChatInterface
-# from gradio import ChatMessage # Maybe remove this import if not used elsewhere
 import requests
-from typing import Dict, List, AsyncGenerator, Union, Tuple
-from langchain_core.messages import HumanMessage, AIMessage, ToolMessage # Use LangChain messages internally
 from langchain_core.tools import tool
 from langchain_openai import ChatOpenAI
 from langgraph.checkpoint.memory import MemorySaver
 from langgraph.prebuilt import create_react_agent
-# --- Tools remain the same ---
 @tool
 def get_lat_lng(location_description: str) -> dict[str, float]:
     """Get the latitude and longitude of a location."""
@@ -30,7 +35,6 @@ def get_weather(lat: float, lng: float) -> dict[str, str]:
     """Get the weather at a location."""
     print(f"Tool: Getting weather for lat={lat}, lng={lng}")
     # Replace with actual API call in a real app
-    # Dummy logic based on lat
     if lat > 45: # Northern locations
         return {"temperature": "15°C", "description": "Cloudy"}
     elif lat > 30: # Mid locations
@@ -38,81 +42,412 @@ def get_weather(lat: float, lng: float) -> dict[str, str]:
     else: # Southern locations
         return {"temperature": "30°C", "description": "Very Sunny"}
-async def Answer_from_agent(message: str, history: List[List[str]]) -> AsyncGenerator[str, None]:
-    """Processes message through LangChain agent, yielding intermediate steps as strings."""
-    # Convert Gradio history to LangChain messages
-    lc_messages = []
-    for user_msg, ai_msg in history:
-        if user_msg:
-            lc_messages.append(HumanMessage(content=user_msg))
-        if ai_msg:
-            # Important: Handle potential previous intermediate strings from AI
-            # If the ai_msg contains markers like "🛠️ Using", it was an intermediate step.
-            # For simplicity here, we assume full AI responses were stored previously.
-            # A more robust solution might involve storing message types in history.
-            if not ai_msg.startswith("🛠️ Using") and not ai_msg.startswith("Result:"):
-                 lc_messages.append(AIMessage(content=ai_msg))
-    lc_messages.append(HumanMessage(content=message))
-    llm = ChatOpenAI(temperature=0, model="gpt-4")
-    memory = MemorySaver() # Be mindful of memory state if agent is re-initialized every time
-    tools = [get_lat_lng, get_weather]
-    agent_executor = create_react_agent(llm, tools, checkpointer=memory)
-    # Use a unique thread_id per session if needed, or manage state differently
-    # Using a fixed one like "abc123" means all users share the same memory if server restarts aren't frequent
-    thread_id = "user_session_" + str(os.urandom(4).hex()) # Example: generate unique ID
-    full_response = ""
-    async for chunk in agent_executor.astream_events(
-        {"messages": lc_messages},
-        config={"configurable": {"thread_id": thread_id}},
-        version="v1" # Use v1 for events streaming
-    ):
-        event = chunk["event"]
-        data = chunk["data"]
-        if event == "on_chat_model_stream":
-            content = data["chunk"].content
-            if content:
-                full_response += content
-                yield full_response
-        elif event == "on_tool_start":
-            tool_input_str = str(data.get('input', ''))
-            yield f"🛠️ Using tool: **{data['name']}** with input: `{tool_input_str}`"
-        elif event == "on_tool_end":
-             tool_output_str = str(data.get('output', ''))
-             yield f"Tool **{data['name']}** finished.\nResult: `{tool_output_str}`"
-             if full_response:
-                 yield full_response
-    if full_response and (not chunk or chunk["event"] != "on_chat_model_stream"):
-         yield full_response
-# --- Gradio Interface (mostly unchanged) ---
-demo = gr.ChatInterface(
-    fn=Answer_from_agent,
-    type="messages",
-    title="🤖 AGent template",
-    description="Ask about the weather anywhere! Watch as I gather the information step by step.",
-    cache_examples=False,
-    save_history=True,
-    editable=True,
-)
-if __name__ == "__main__":
-    # Load environment variables
     try:
-        openai_api_key = os.getenv("OPENAI_API_KEY")
-        if openai_api_key:
-            print("OPENAI_API_KEY found.")
-    except:
-        alert("Warning: OPENAI_API_KEY not found in environment variables.")
-    demo.launch(debug=True, server_name="0.0.0.0")

 import os
 import gradio as gr
 import requests
+import inspect # To get source code for __repr__
+import asyncio
+from typing import Dict, List, AsyncGenerator, Union, Tuple, Optional
+# --- LangChain Specific Imports ---
+from langchain_core.messages import HumanMessage, AIMessage, BaseMessage
 from langchain_core.tools import tool
 from langchain_openai import ChatOpenAI
 from langgraph.checkpoint.memory import MemorySaver
 from langgraph.prebuilt import create_react_agent
+# --- Constants ---
+DEFAULT_API_URL = "http://127.0.0.1:8000" # Default URL for your FastAPI app
+# --- Tools (Keep these defined globally or ensure they are included in __repr__) ---
 @tool
 def get_lat_lng(location_description: str) -> dict[str, float]:
     """Get the latitude and longitude of a location."""
     """Get the weather at a location."""
     print(f"Tool: Getting weather for lat={lat}, lng={lng}")
     # Replace with actual API call in a real app
     if lat > 45: # Northern locations
         return {"temperature": "15°C", "description": "Cloudy"}
     elif lat > 30: # Mid locations
     else: # Southern locations
         return {"temperature": "30°C", "description": "Very Sunny"}
+# --- Agent Class Definition ---
+class MyLangChainAgent:
+    """
+    A sample LangChain agent class designed for interaction and submission.
+    NOTE: The current tools (weather/location) are placeholders and WILL NOT
+          correctly answer GAIA benchmark questions. This class structure
+          demonstrates how to integrate an agent with the submission API.
+          Replace LLM, tools, and potentially the agent type for actual GAIA tasks.
+    """
+    def __init__(self, model_name="gpt-4", temperature=0):
+        # Ensure API key is available
+        if not os.getenv("OPENAI_API_KEY"):
+            raise ValueError("OPENAI_API_KEY environment variable not set.")
+        self.llm = ChatOpenAI(temperature=temperature, model=model_name)
+        self.tools = [get_lat_lng, get_weather] # Use the globally defined tools
+        self.memory = MemorySaver()
+        # Create the agent executor
+        self.agent_executor = create_react_agent(self.llm, self.tools, checkpointer=self.memory)
+        print("MyLangChainAgent initialized.")
+    async def __call__(self, question: str, thread_id: str) -> AsyncGenerator[Union[str, Dict[str, str]], str]:
+        """
+        Runs the agent asynchronously, yielding intermediate steps and returning the final answer.
+        Args:
+            question: The input question string.
+            thread_id: A unique identifier for the conversation thread.
+        Yields:
+            Intermediate steps (tool calls/results) as strings or dicts.
+        Returns:
+            The final AI answer as a string.
+        """
+        print(f"Agent executing for thread_id: {thread_id} on question: {question[:50]}...")
+        lc_messages: List[BaseMessage] = [HumanMessage(content=question)]
+        final_answer = ""
+        full_response_content = "" # Store the complete AI response chunks
+        async for chunk in self.agent_executor.astream_events(
+            {"messages": lc_messages},
+            config={"configurable": {"thread_id": thread_id}},
+            version="v1"
+        ):
+            event = chunk["event"]
+            data = chunk["data"]
+            # print(f"DEBUG: Event: {event}, Data Keys: {data.keys()}") # Debugging line
+            if event == "on_chat_model_stream":
+                content = data["chunk"].content
+                if content:
+                    # print(f"DEBUG: AI Chunk: {content}") # Debugging line
+                    full_response_content += content
+                    # Yield potentially incomplete response for live typing effect if needed
+                    # yield {"type": "stream", "content": content }
+            elif event == "on_tool_start":
+                tool_input_str = str(data.get('input', ''))
+                yield f"🛠️ Using tool: **{data['name']}** with input: `{tool_input_str}`"
+            elif event == "on_tool_end":
+                 tool_output_str = str(data.get('output', ''))
+                 yield f"✅ Tool **{data['name']}** finished.\nResult: `{tool_output_str}`"
+            # Detect the end of the conversation turn (heuristic)
+            # The 'on_chain_end' event for the top-level graph might signal the end.
+            # Or check the 'messages' list in the final state if available.
+            # For create_react_agent, the final AIMessage is often the last main event.
+            # We will capture the last full AI message content after the loop.
+        # After iterating through all chunks, the final answer should be in full_response_content
+        final_answer = full_response_content.strip()
+        print(f"Agent execution finished. Final Answer: {final_answer[:100]}...")
+        # Yield the complete final answer distinctly if needed
+        # yield {"type": "final_answer_marker", "content": final_answer} # Example marker
+        return final_answer # Return the final answer
+    def __repr__(self) -> str:
+        """
+        Return the source code required to reconstruct this agent, including
+        the class definition, tool functions, and necessary imports.
+        """
+        imports = [
+            "import os",
+            "from typing import Dict, List, AsyncGenerator, Union, Tuple, Optional",
+            "from langchain_core.messages import HumanMessage, AIMessage, BaseMessage",
+            "from langchain_core.tools import tool",
+            "from langchain_openai import ChatOpenAI",
+            "from langgraph.checkpoint.memory import MemorySaver",
+            "from langgraph.prebuilt import create_react_agent",
+            "import inspect", # Needed if repr itself uses inspect dynamically
+            "import asyncio", # Needed for async call
+            "\n"
+        ]
+        # Get source code of tool functions
+        tool_sources = []
+        for t in self.tools:
+             try:
+                 tool_sources.append(inspect.getsource(t))
+             except (TypeError, OSError) as e:
+                  print(f"Warning: Could not get source for tool {t.__name__}: {e}")
+                  tool_sources.append(f"# Could not automatically get source for tool: {t.__name__}\n")
+        # Get source code of the class itself
+        class_source = inspect.getsource(MyLangChainAgent)
+        # Combine imports, tools, and class definition
+        full_source = "\n".join(imports) + "\n\n" + \
+                      "\n\n".join(tool_sources) + "\n\n" + \
+                      class_source
+        return full_source
+# --- Gradio UI and Logic ---
+# Initialize the agent (do this once outside the request functions)
+# Handle potential API key error during initialization
+try:
+    agent_instance = MyLangChainAgent()
+except ValueError as e:
+    print(f"ERROR initializing agent: {e}")
+    # Provide a dummy agent or exit if critical
+    agent_instance = None # Or raise SystemExit("Agent initialization failed")
+def format_chat_history(history: List[List[Optional[str]]]) -> List[Tuple[Optional[str], Optional[str]]]:
+    """Helper to format Gradio history for display."""
+    # Gradio's history format is List[List[user_msg | None, ai_msg | None]]
+    # We want List[Tuple[user_msg | None, ai_msg | None]] for Chatbot
+    formatted = []
+    for turn in history:
+        formatted.append(tuple(turn))
+    return formatted
+async def fetch_and_display_question(api_url: str):
+    """Calls the backend to get a random question."""
+    if not api_url:
+        return "Please enter the API URL.", "", "", gr.update(value=""), gr.update(value="") # Clear chat too
+    question_url = f"{api_url.strip('/')}/random-question"
+    print(f"Fetching question from: {question_url}")
     try:
+        response = requests.get(question_url, timeout=10)
+        response.raise_for_status() # Raise HTTPError for bad responses (4xx or 5xx)
+        data = response.json()
+        task_id = data.get("task_id")
+        question_text = data.get("question")
+        if task_id and question_text:
+            print(f"Fetched Task ID: {task_id}")
+            # Return updates for Gradio components: Status, Task ID, Question Text, Clear Agent Answer, Clear Chat
+            return "Question fetched successfully!", task_id, question_text, "", [] # Clears answer and chat history
+        else:
+            return "Error: Invalid data format received from API.", "", "", "", []
+    except requests.exceptions.RequestException as e:
+        print(f"Error fetching question: {e}")
+        return f"Error fetching question: {e}", "", "", "", []
+    except Exception as e:
+        print(f"An unexpected error occurred: {e}")
+        return f"An unexpected error occurred: {e}", "", "", "", []
+async def run_agent_interaction(
+    message: str,
+    history: List[List[Optional[str]]],
+    current_task_id: str,
+    # agent_instance: MyLangChainAgent # Agent passed via state potentially
+):
+    """Handles the chat interaction, runs the agent, yields steps, updates final answer state."""
+    if agent_instance is None:
+         yield "Agent not initialized. Please check API keys and restart."
+         return
+    if not current_task_id:
+        yield "Please fetch a question first using the button above."
+        return
+    # The 'message' here is the user's latest input in the chat.
+    # For this workflow, we assume the main input is the fetched question.
+    # We'll use the fetched question (implicitly stored) to run the agent.
+    # If you want interactive chat *about* the question, the logic needs adjustment.
+    # For simplicity, let's assume the user's message *is* the question or a prompt related to it.
+    # In the GAIA context, usually, the agent just runs on the provided question directly.
+    # We'll use the `current_task_id` to generate a unique thread_id for LangGraph memory.
+    thread_id = f"gaia_task_{current_task_id}_{os.urandom(4).hex()}"
+    print(f"Running agent for user message: {message[:50]}...")
+    history.append([message, None]) # Add user message to history
+    final_agent_answer = None
+    full_yielded_response = ""
+    # Use the agent's __call__ method
+    async for step in agent_instance(message, thread_id=thread_id):
+        if isinstance(step, str):
+            # Intermediate step (tool call, result, maybe stream chunk)
+            history[-1][1] = step # Update the AI's response in the last turn
+            yield format_chat_history(history) # Update chatbot UI
+            full_yielded_response = step # Track last yielded message
+        # If __call__ yielded dicts for streaming, handle here:
+        # elif isinstance(step, dict) and step.get("type") == "stream":
+        #     history[-1][1] = (history[-1][1] or "") + step["content"]
+        #     yield format_chat_history(history)
+    # After the loop, the `step` variable holds the return value (final answer)
+    final_agent_answer = step
+    print(f"Agent final answer received: {final_agent_answer[:100]}...")
+    # Update the history with the definitive final answer
+    if final_agent_answer:
+        history[-1][1] = final_agent_answer # Replace intermediate steps with final one
+    elif full_yielded_response:
+        # Fallback if final answer wasn't returned correctly but we yielded something
+         history[-1][1] = full_yielded_response
+         final_agent_answer = full_yielded_response # Use the last yielded message as answer
+    else:
+         history[-1][1] = "Agent did not produce a final answer."
+         final_agent_answer = "" # Ensure it's a string
+    # Yield the final state of the history and update the hidden state for the final answer
+    yield format_chat_history(history), final_agent_answer
+def submit_to_leaderboard(
+    api_url: str,
+    username: str,
+    task_id: str,
+    agent_answer: str,
+    # agent_instance: MyLangChainAgent # Pass agent via state if needed
+):
+    """Submits the agent's answer and code to the FastAPI backend."""
+    if agent_instance is None:
+        return "Agent not initialized. Cannot submit."
+    if not api_url:
+        return "Please enter the API URL."
+    if not username:
+        return "Please enter your Hugging Face username."
+    if not task_id:
+        return "No task ID available. Please fetch a question first."
+    if agent_answer is None or agent_answer.strip() == "": # Check if None or empty
+        # Maybe allow submission of empty answer? Depends on requirements.
+        print("Warning: Submitting empty answer.")
+        # return "Agent has not provided an answer yet."
+    submit_url = f"{api_url.strip('/')}/submit"
+    print(f"Submitting to: {submit_url}")
+    # Get agent code
+    try:
+        agent_code = agent_instance.__repr__()
+        # print(f"Agent Code (first 200 chars):\n{agent_code[:200]}...") # Debug
+    except Exception as e:
+        print(f"Error getting agent representation: {e}")
+        return f"Error generating agent code for submission: {e}"
+    # Prepare submission data according to Pydantic model in FastAPI
+    submission_data = {
+        "username": username.strip(),
+        "agent_code": agent_code,
+        "answers": [
+            {
+                "task_id": task_id,
+                "submitted_answer": agent_answer # Use the stored final answer
+            }
+            # Add more answers here if submitting a batch
+        ]
+    }
+    try:
+        response = requests.post(submit_url, json=submission_data, timeout=30)
+        response.raise_for_status()
+        result_data = response.json()
+        # Format the result nicely for display
+        result_message = (
+            f"Submission Successful!\n"
+            f"User: {result_data.get('username')}\n"
+            f"Score: {result_data.get('score')}\n"
+            f"Correct: {result_data.get('correct_count')}/{result_data.get('total_attempted')}\n"
+            f"Message: {result_data.get('message')}\n"
+            f"Timestamp: {result_data.get('timestamp')}"
+        )
+        print("Submission successful.")
+        return result_message
+    except requests.exceptions.HTTPError as e:
+        # Try to get detail from response body if available
+        error_detail = e.response.text
+        try:
+            error_json = e.response.json()
+            error_detail = error_json.get('detail', error_detail)
+        except requests.exceptions.JSONDecodeError:
+            pass # Keep the raw text if not JSON
+        print(f"HTTP Error during submission: {e.response.status_code} - {error_detail}")
+        return f"Submission Failed (HTTP {e.response.status_code}): {error_detail}"
+    except requests.exceptions.RequestException as e:
+        print(f"Network error during submission: {e}")
+        return f"Submission Failed: Network error - {e}"
+    except Exception as e:
+        print(f"An unexpected error occurred during submission: {e}")
+        return f"Submission Failed: An unexpected error occurred - {e}"
+# --- Build Gradio Interface using Blocks ---
+with gr.Blocks() as demo:
+    gr.Markdown("# Agent Evaluation Interface")
+    gr.Markdown(
+        "Fetch a random question from the evaluation API, interact with the agent "
+        "(Note: the default agent answers weather questions, not GAIA), "
+        "and submit the agent's final answer to the leaderboard."
+    )
+    # --- State Variables ---
+    # Store current task info, agent's final answer, and the agent instance
+    current_task_id = gr.State("")
+    current_question_text = gr.State("")
+    current_agent_answer = gr.State("") # Stores the final answer string from the agent
+    # agent_state = gr.State(agent_instance) # Pass agent instance via state
+    with gr.Row():
+        api_url_input = gr.Textbox(label="FastAPI API URL", value=DEFAULT_API_URL)
+        hf_username_input = gr.Textbox(label="Hugging Face Username")
+    with gr.Row():
+        fetch_button = gr.Button("Get Random Question")
+        submission_status_display = gr.Textbox(label="Status", interactive=False) # For fetch status
+    with gr.Row():
+        question_display = gr.Textbox(label="Current Question", lines=3, interactive=False)
+    gr.Markdown("---")
+    gr.Markdown("## Agent Interaction")
+    chatbot = gr.Chatbot(label="Agent Conversation", height=400)
+    msg_input = gr.Textbox(label="Send a message to the Agent (or just observe)") # Input for chat
+    # Hidden Textbox to display the final extracted answer (optional, for clarity)
+    final_answer_display = gr.Textbox(label="Agent's Final Answer (Extracted)", interactive=False)
+    gr.Markdown("---")
+    gr.Markdown("## Submission")
+    with gr.Row():
+         submit_button = gr.Button("Submit Current Answer to Leaderboard")
+    submission_result_display = gr.Markdown(label="Submission Result", value="*Submit an answer to see the result here.*") # Use Markdown for better formatting
+    # --- Component Interactions ---
+    # Fetch Button Action
+    fetch_button.click(
+        fn=fetch_and_display_question,
+        inputs=[api_url_input],
+        outputs=[
+            submission_status_display, # Shows fetch status
+            current_task_id,           # Updates hidden state
+            question_display,          # Updates question text box
+            final_answer_display,      # Clears old final answer
+            chatbot                    # Clears chat history
+        ]
+    )
+    # Chat Submission Action (when user sends message in chat)
+    msg_input.submit(
+        fn=run_agent_interaction,
+        inputs=[
+            msg_input,                  # User message from chat input
+            chatbot,                    # Current chat history
+            current_task_id,            # Current task ID from state
+            # agent_state               # Pass agent instance state
+        ],
+        outputs=[
+            chatbot,                    # Updated chat history
+            current_agent_answer        # Update the hidden state holding the final answer
+        ]
+    ).then(
+        # After agent runs, update the visible "Final Answer" box from the state
+        lambda answer_state: answer_state,
+        inputs=[current_agent_answer],
+        outputs=[final_answer_display]
+    )
+    # Clear message input after submission
+    msg_input.submit(lambda: "", None, msg_input, queue=False)
+    # Submit Button Action
+    submit_button.click(
+        fn=submit_to_leaderboard,
+        inputs=[
+            api_url_input,
+            hf_username_input,
+            current_task_id,
+            current_agent_answer,       # Use the stored final answer state
+            # agent_state               # Pass agent instance state
+        ],
+        outputs=[submission_result_display] # Display result message
+    )
+if __name__ == "__main__":
+    if agent_instance is None:
+        print("\nFATAL: Agent could not be initialized. Gradio app will not run correctly.")
+        print("Please ensure OPENAI_API_KEY is set and valid.\n")
+        # Optionally exit here if agent is critical
+        # exit(1)
+    else:
+        print("Launching Gradio Interface...")
+        demo.launch(debug=True, server_name="0.0.0.0") # Share=False by default for security