Spaces:

Nymbo
/

data-boards

Sleeping

prithivMLmods committed on Dec 20, 2024

Commit

a5f8478

verified ·

1 Parent(s): a9bbdc9

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,6 +9,7 @@ title_and_description = """
 # PDF to Word and Word to PDF Converter
 This tool allows you to convert PDF files to Word documents and Word documents to PDF files.
 """
 def pdf_to_word(pdf_file):
@@ -16,6 +17,12 @@ def pdf_to_word(pdf_file):
     Converts a PDF file to a Word document.
     """
     try:
         # Create a temporary directory to store the output file
         with tempfile.TemporaryDirectory() as temp_dir:
             docx_filename = os.path.join(temp_dir, os.path.basename(pdf_file.name).replace('.pdf', '.docx'))
@@ -90,4 +97,4 @@ with gr.Blocks() as app:
                 convert_word_to_pdf.click(word_to_pdf, inputs=[word_input], outputs=[pdf_output])
-app.launch()

 # PDF to Word and Word to PDF Converter
 This tool allows you to convert PDF files to Word documents and Word documents to PDF files.
+Note: Scanned PDFs (image-based PDFs) are not supported.
 """
 def pdf_to_word(pdf_file):
     Converts a PDF file to a Word document.
     """
     try:
+        # Check if the PDF is scanned (image-based)
+        with open(pdf_file.name, 'rb') as f:
+            first_page = f.read(1024)  # Read the first 1024 bytes of the PDF
+            if b"/Image" in first_page or b"/XObject" in first_page:
+                return "Error: Scanned PDFs (image-based PDFs) are not supported."
         # Create a temporary directory to store the output file
         with tempfile.TemporaryDirectory() as temp_dir:
             docx_filename = os.path.join(temp_dir, os.path.basename(pdf_file.name).replace('.pdf', '.docx'))
                 convert_word_to_pdf.click(word_to_pdf, inputs=[word_input], outputs=[pdf_output])
+app.launch(share=True)