Final_Assignment_Project

Sleeping

wt002 committed on May 15

Commit

57de9d7

verified ·

1 Parent(s): 7f0bbf2

Update agent.py

Files changed (1) hide show

agent.py CHANGED Viewed

@@ -368,18 +368,23 @@ class MyVectorStore:
 import json
 from langchain.schema import Document
-def get_question(raw_question) -> str:
-    """Convert list to string and fix reversed text"""
-    # Handle lists (join with spaces)
-    if isinstance(raw_question, list):
-        text = " ".join(raw_question)
-    else:
-        text = str(raw_question)
-    # Fix reversed text like ".rewsna..."
     if text.startswith(('.', ',')):
-        return text[::-1].replace("\\", "").strip()
     return text
 with open("questions.json", "r", encoding="utf-8") as f:
@@ -387,15 +392,15 @@ with open("questions.json", "r", encoding="utf-8") as f:
 docs = [
     Document(
-        page_content=get_question(item["question"]),
         metadata={
             "task_id": item["task_id"],
-            "level": item.get("Level", "unknown"),
-            "file_name": item.get("file_name", "")
         }
     )
     for item in data
-    if "question" in item and item["question"]  # Skip missing/empty
 ]
 texts = [doc.page_content for doc in docs]

 import json
 from langchain.schema import Document
+from typing import Any
+def process_content(raw_content: Any) -> str:
+    """Convert any input to a clean string, handling lists and reversed text"""
+    # Flatten nested lists
+    def flatten(nested):
+        if isinstance(nested, list):
+            return " ".join(flatten(e) for e in nested)
+        return str(nested)
+    # Convert to string and clean
+    text = flatten(raw_content)
+    # Fix reversed text patterns like ".rewsna..."
     if text.startswith(('.', ',')):
+        text = text[::-1].replace("\\", "").strip()
     return text
 with open("questions.json", "r", encoding="utf-8") as f:
 docs = [
     Document(
+        page_content=process_content(item["question"]),
         metadata={
             "task_id": item["task_id"],
+            "level": str(item.get("Level", "")),  # Force string conversion
+            "file_name": str(item.get("file_name", ""))
         }
     )
     for item in data
+    if "question" in item  # Skip items without questions
 ]
 texts = [doc.page_content for doc in docs]