Spaces:

TeamTonic
/

HereChatBackend

Runtime error

App Files Community

Tonic committed on Nov 15, 2023

Commit

a13c2af

1 Parent(s): 4d5f35d

Update app.py

Browse files

Files changed (1) hide show

app.py +20 -5

app.py CHANGED Viewed

@@ -132,6 +132,9 @@ def embed_pdf(file, filename, collection_name, file_type):
             return {"error": f"Error downloading file from URL: {e}"}
     elif file_type == "Binary":
         # Handle binary file
         file_content = file
         file_path = os.path.join('./', filename)
         with open(file_path, 'wb') as f:
@@ -139,6 +142,7 @@ def embed_pdf(file, filename, collection_name, file_type):
     else:
         return {"error": "Invalid file type"}
     # Checking filetype for document parsing
     mime_type = mimetypes.guess_type(file_path)[0]
     loader = UnstructuredFileLoader(file_path)
@@ -218,20 +222,31 @@ def combined_interface(query, file, collection_name):
         article_info = retrieve_info(query)
         return article_info
     elif file is not None and collection_name:
-        # Extract filename and content from the file object
-        filename = file[1]  # file[1] contains the filename
-        file_content = file[0]  # file[0] contains the file content
-        # Determine if the file is a binary or a URL
         if isinstance(file_content, str) and file_content.startswith("http"):
             file_type = "URL"
         else:
             file_type = "Binary"
-        return embed_pdf(file_content, filename, collection_name, file_type)
     else:
         return "Please enter a query or upload a PDF file and specify a collection name."
 iface = gr.Interface(
     fn=combined_interface,
     inputs=[

             return {"error": f"Error downloading file from URL: {e}"}
     elif file_type == "Binary":
         # Handle binary file
+        if isinstance(file, str):
+            # Convert string to bytes if necessary
+            file = file.encode()
         file_content = file
         file_path = os.path.join('./', filename)
         with open(file_path, 'wb') as f:
     else:
         return {"error": "Invalid file type"}
     # Checking filetype for document parsing
     mime_type = mimetypes.guess_type(file_path)[0]
     loader = UnstructuredFileLoader(file_path)
         article_info = retrieve_info(query)
         return article_info
     elif file is not None and collection_name:
+        filename = file[1]  # Extract filename
+        file_content = file[0]  # Extract file content
+        # Check if file_content is a URL or binary data
         if isinstance(file_content, str) and file_content.startswith("http"):
             file_type = "URL"
+            # Handle URL case (if needed)
         else:
             file_type = "Binary"
+            # Write binary data to a temporary file
+            with tempfile.NamedTemporaryFile(delete=False, suffix=os.path.splitext(filename)[1]) as temp_file:
+                temp_file.write(file_content)
+                temp_filepath = temp_file.name
+            # Pass the file path to embed_pdf
+            result = embed_pdf(temp_filepath, collection_name)
+            # Clean up the temporary file
+            os.remove(temp_filepath)
+            return result
     else:
         return "Please enter a query or upload a PDF file and specify a collection name."
 iface = gr.Interface(
     fn=combined_interface,
     inputs=[