naman1102 commited on
Commit
51b14d9
·
1 Parent(s): 7dbc634
Files changed (2):
  1. app.py +25 -9
  2. tools.py +1 -0
app.py CHANGED
@@ -95,15 +95,16 @@ def plan_node(state: AgentState) -> AgentState:
95
  # ─── 3) Revised finalize_node ───
96
  def finalize_node(state: AgentState) -> AgentState:
97
  if state.get("final_answer") is not None:
98
- print(">>> finalize_node: returning existing final_answer:", state["final_answer"])
99
  return {"final_answer": state["final_answer"]}
100
 
 
101
  question = ""
102
  for msg in reversed(state.get("messages", [])):
103
  if isinstance(msg, HumanMessage):
104
  question = msg.content
105
  break
106
 
 
107
  combined = f"USER_QUESTION: {question}\n"
108
  if sr := state.get("web_search_result"):
109
  combined += f"WEB_SEARCH_RESULT: {sr}\n"
@@ -111,20 +112,35 @@ def finalize_node(state: AgentState) -> AgentState:
111
  combined += f"OCR_RESULT: {orc}\n"
112
  if exr := state.get("excel_result"):
113
  combined += f"EXCEL_RESULT: {exr}\n"
114
- audio_transcript = state.get("audio_transcript") or state.get("transcript")
115
- if audio_transcript:
116
- combined += f"AUDIO_TRANSCRIPT: {audio_transcript}\n"
117
 
 
118
  combined += (
119
- "Based on the above, provide ONLY the final answer. "
120
- "…(rest of your instructions)…"
 
 
 
 
 
121
  )
122
 
123
- # DEBUG: show exactly what we're sending to GPT-4 for final answer
124
- print("\n>>> finalize_node prompt to LLM:\n" + combined + "\n<<< end prompt >>>\n")
125
 
126
  llm_response = llm([SystemMessage(content=combined)])
127
- return {"final_answer": llm_response.content.strip()}
 
 
 
 
 
 
 
 
 
128
 
129
  # ─── 4) Wrap tools in a ToolNode ───
130
  def tool_node(state: AgentState) -> AgentState:
 
95
# ─── 3) Revised finalize_node ───
def finalize_node(state: AgentState) -> AgentState:
    """Produce the final answer for the conversation.

    Reads any tool results accumulated in ``state`` (web search, OCR,
    Excel, audio transcript), builds one combined context prompt, and
    asks the LLM for a strict-JSON reply of the form
    ``{"final_answer": "..."}``.

    Returns a partial state update: ``{"final_answer": <str>}``. On a
    malformed LLM reply the error is surfaced in the answer string
    rather than raised, so the graph keeps running.
    """
    # Short-circuit if a final answer was already produced upstream.
    if state.get("final_answer") is not None:
        return {"final_answer": state["final_answer"]}

    # Re-extract the last user question from the message history.
    question = ""
    for msg in reversed(state.get("messages", [])):
        if isinstance(msg, HumanMessage):
            question = msg.content
            break

    # Build one monolithic context from every tool result present.
    combined = f"USER_QUESTION: {question}\n"
    if sr := state.get("web_search_result"):
        combined += f"WEB_SEARCH_RESULT: {sr}\n"
    # NOTE(review): this guard line was elided in the diff context;
    # reconstructed from the walrus usage of `orc` below — confirm.
    if orc := state.get("ocr_result"):
        combined += f"OCR_RESULT: {orc}\n"
    if exr := state.get("excel_result"):
        combined += f"EXCEL_RESULT: {exr}\n"
    # The audio transcription is stored under the "transcript" key.
    if tr := state.get("transcript"):
        combined += f"AUDIO_TRANSCRIPT: {tr}\n"

    # Demand a JSON response with a single key "final_answer".
    combined += (
        "Based on the above, respond with exactly one JSON object, and nothing else. "
        "The JSON object must have exactly one key: \"final_answer\". "
        "For example:\n"
        "{\"final_answer\":\"42\"}\n"
        "Do NOT include any explanation, markdown, or any extra whitespace outside the JSON object. "
        "If the answer is multiple words, put them in a comma-separated string, e.g. \"red,green,blue\". "
        "If the answer is a number, it must be digits only—e.g. \"725.00\".\n"
    )

    # Debug print
    print("\n>>> finalize_node JSON‐strict prompt:\n" + combined + "\n<<< end prompt >>>\n")

    llm_response = llm([SystemMessage(content=combined)])
    raw = llm_response.content.strip()
    print(">>> finalize_node got raw response:", raw)

    # Models sometimes wrap JSON in markdown code fences despite the
    # instructions; strip a surrounding fence before parsing.
    if raw.startswith("```"):
        raw = raw.strip("`").strip()
        if raw.lower().startswith("json"):
            raw = raw[4:].strip()

    try:
        parsed = json.loads(raw)
        return {"final_answer": parsed["final_answer"]}
    # Narrowed from a bare `except Exception`: only the failures the
    # parse/lookup can actually produce (bad JSON, missing key, or a
    # non-dict top-level value) are treated as "invalid JSON".
    except (json.JSONDecodeError, KeyError, TypeError) as e:
        # Surface the failure in the state instead of crashing the graph.
        print(">>> finalize_node JSON parse error:", e, "raw was:", raw)
        return {"final_answer": f"ERROR: invalid JSON from finalize_node: {raw}"}
145
  # ─── 4) Wrap tools in a ToolNode ───
146
  def tool_node(state: AgentState) -> AgentState:
tools.py CHANGED
@@ -6,6 +6,7 @@ from pathlib import Path
6
  from PIL import Image
7
  import pytesseract
8
  from state import AgentState
 
9
  def web_search_tool(state: AgentState) -> AgentState:
10
  """
11
  Expects: state["web_search_query"] is a non‐empty string.
 
6
  from PIL import Image
7
  import pytesseract
8
  from state import AgentState
9
+ from langchain.schema import HumanMessage
10
  def web_search_tool(state: AgentState) -> AgentState:
11
  """
12
  Expects: state["web_search_query"] is a non‐empty string.