EvoPlatformV3 / utils.py
HemanM's picture
Create utils.py
b6e3c51 verified
raw
history blame contribute delete
356 Bytes
import os
import fitz # PyMuPDF
def extract_text_from_file(file_obj):
    """Return the text content of an uploaded ``.pdf`` or ``.txt`` file.

    Args:
        file_obj: A file-like object exposing a ``name`` attribute (used
            only to pick the parser from its extension) and a ``read()``
            method that returns the file's content.

    Returns:
        The extracted text. For PDFs, the text of every page joined with
        newlines. For any other extension, an empty string.

    Raises:
        UnicodeDecodeError: If a ``.txt`` file's bytes are not valid UTF-8.
    """
    # Compare case-insensitively so "REPORT.PDF" / "Notes.TXT" are recognised
    # instead of silently falling through to the empty-string branch.
    name = str(file_obj.name).lower()

    if name.endswith(".pdf"):
        doc = fitz.open(stream=file_obj.read(), filetype="pdf")
        try:
            # Pages must be read before the document is closed.
            return "\n".join(page.get_text() for page in doc)
        finally:
            # Release the underlying MuPDF document even if extraction fails.
            doc.close()

    if name.endswith(".txt"):
        data = file_obj.read()
        # A file opened in text mode already yields str; only bytes need
        # decoding.
        if isinstance(data, str):
            return data
        return data.decode("utf-8")

    # Unsupported extension: nothing to extract.
    return ""