Final_Assignment_Project

Sleeping

App Files Community

wt002 committed on May 15

Commit

59d0991

verified ·

1 Parent(s): bd864cc

Update agent.py

Browse files

Files changed (1) hide show

agent.py +22 -8

agent.py CHANGED Viewed

@@ -368,18 +368,18 @@ def reverse_text(text: str) -> str:
     return text[::-1].replace("\\", "").strip() if text.startswith(('.', ',')) else text
 # 3. Unified Document Creation
-def create_documents(data_source: str, data: List[dict]) -> List[Document]:
     """Handle both Gradio chat and JSON questions"""
     docs = []
     for item in data:
         # Process different data sources
-        if data_source == "gradio":
-            content = "\n".join(item["messages"])
-        elif data_source == "json":
             raw_question = item.get("question", "")
-            content = reverse_text(process_content(raw_question))
         else:
             continue
         # Ensure metadata type safety
@@ -389,14 +389,28 @@ def create_documents(data_source: str, data: List[dict]) -> List[Document]:
             "file_name": str(item.get("file_name", ""))
         }
-        # Make sure that the content and metadata are valid
         if content.strip():  # Only append non-empty content
             docs.append(Document(page_content=content, metadata=metadata))
         else:
-            print(f"Skipping invalid entry: {item}")
     return docs
@@ -420,7 +434,7 @@ class MyVector_Store:
 # -----------------------------
 # Process JSON data and create documents
 # -----------------------------
-file_path = "/home/wendy/my_hf_agent_course_projects/src/data.json"
 try:
     with open(file_path, "r", encoding="utf-8") as f:

     return text[::-1].replace("\\", "").strip() if text.startswith(('.', ',')) else text
 # 3. Unified Document Creation
+def create_documents(data_source: str, data: list) -> list:
     """Handle both Gradio chat and JSON questions"""
     docs = []
     for item in data:
+        content = ""
         # Process different data sources
+        if data_source == "json":
             raw_question = item.get("question", "")
+            content = raw_question  # Adjust as per your content processing logic
         else:
+            print(f"Skipping invalid data source: {data_source}")
             continue
         # Ensure metadata type safety
             "file_name": str(item.get("file_name", ""))
         }
+        # Check if content is non-empty
         if content.strip():  # Only append non-empty content
             docs.append(Document(page_content=content, metadata=metadata))
         else:
+            print(f"Skipping invalid entry with empty content: {item}")
     return docs
+# Path to your data.json
+file_path = "/home/wendy/my_hf_agent_course_projects/src/data.json"
+# Check if the file exists
+if os.path.exists(file_path):
+    # Load the data from the JSON file
+    with open(file_path, "r", encoding="utf-8") as f:
+        data = json.load(f)
+    # Create documents from the loaded data
+    docs = create_documents("json", data)
+    print(f"Documents created: {len(docs)}")
+else:
+    print(f"Error: File {file_path} not found.")
 # -----------------------------
 # Process JSON data and create documents
 # -----------------------------
+file_path = "/home/wendy/Downloads/questions.json"
 try:
     with open(file_path, "r", encoding="utf-8") as f: