Spaces:

albhu
/

legalgeek

Runtime error

albhu committed on Apr 25, 2024

Commit

eec0661

verified ·

1 Parent(s): 01da382

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -29,16 +29,19 @@ if document_file is not None:
         st.error("A dokumentum mérete túl nagy. Kérlek válassz egy kisebb méretű dokumentumot!")
     else:
         if document_file.type == "application/pdf":
             with pdfplumber.open(document_file) as pdf:
                 document_text = ""
                 for page in pdf.pages:
                     document_text += page.extract_text()
         elif document_file.type == "application/vnd.openxmlformats-officedocument.wordprocessingml.document":
             docx_file = docx.Document(document_file)
             document_text = ""
             for paragraph in docx_file.paragraphs:
                 document_text += paragraph.text
         elif document_file.type == "application/msword":
             doc_file = docx.Document(document_file)
             document_text = ""
             for paragraph in doc_file.paragraphs:

         st.error("A dokumentum mérete túl nagy. Kérlek válassz egy kisebb méretű dokumentumot!")
     else:
         if document_file.type == "application/pdf":
+            # PDF fájl feldolgozása lapozás útján
             with pdfplumber.open(document_file) as pdf:
                 document_text = ""
                 for page in pdf.pages:
                     document_text += page.extract_text()
         elif document_file.type == "application/vnd.openxmlformats-officedocument.wordprocessingml.document":
+            # DOCX fájl feldolgozása részletekben
             docx_file = docx.Document(document_file)
             document_text = ""
             for paragraph in docx_file.paragraphs:
                 document_text += paragraph.text
         elif document_file.type == "application/msword":
+            # DOC fájl feldolgozása részletekben
             doc_file = docx.Document(document_file)
             document_text = ""
             for paragraph in doc_file.paragraphs: