Spaces:
Sleeping
Sleeping
import os | |
import fitz # PyMuPDF | |
def extract_text_from_file(file_obj):
    """Return the text content of an uploaded ``.pdf`` or ``.txt`` file.

    The file type is chosen from the extension of ``file_obj.name``,
    compared case-insensitively so ``REPORT.PDF`` is treated like
    ``report.pdf``.

    Args:
        file_obj: A file-like object exposing a ``name`` attribute and a
            ``read()`` method.

    Returns:
        For PDFs, the text of every page joined with newlines. For text
        files, the content decoded as UTF-8 (or returned unchanged when
        ``read()`` already yields ``str``). An empty string for any other
        extension.

    Raises:
        UnicodeDecodeError: If a ``.txt`` file is not valid UTF-8.
    """
    # Normalise case once so upper/mixed-case extensions are recognised.
    name = file_obj.name.lower()

    if name.endswith(".pdf"):
        doc = fitz.open(stream=file_obj.read(), filetype="pdf")
        try:
            # join() fully consumes the generator before the document closes.
            return "\n".join(page.get_text() for page in doc)
        finally:
            # Always release the document, even if text extraction fails.
            doc.close()

    if name.endswith(".txt"):
        data = file_obj.read()
        # A file opened in text mode already returns str; only bytes need decoding.
        if isinstance(data, str):
            return data
        return data.decode("utf-8")

    # Unsupported extension: callers receive an empty string, as before.
    return ""