Pdf-Processing / app.py
Rivalcoder
Add application file
6928eef
raw
history blame contribute delete
762 Bytes
import fitz # PyMuPDF
import gradio as gr
def extract_text_from_pdf(file):
if file is None:
return "No file uploaded."
try:
doc = fitz.open(file.name) # Use file path directly
full_text = ""
for page_num in range(len(doc)):
page = doc.load_page(page_num)
text = page.get_text()
full_text += f"\n\n--- Page {page_num + 1} ---\n\n{text}"
return full_text
except Exception as e:
return f"Error: {str(e)}"
gr.Interface(
fn=extract_text_from_pdf,
inputs=gr.File(label="Upload PDF", file_types=[".pdf"]),
outputs="text",
title="PDF to Text Extractor",
description="Upload a PDF file and get all the extracted text from each page.",
).launch()