studymate / ocr.py
saranya19b's picture
Upload 5 files
3f7f9d9 verified
raw
history blame contribute delete
211 Bytes
import fitz # PyMuPDF
def extract_text_from_pdf(file) -> str:
    """Return the concatenated text of every page in a PDF.

    Args:
        file: An object whose ``read()`` method returns the PDF content;
            the result is handed to ``fitz.open`` as an in-memory stream
            with ``filetype="pdf"``. Presumably a binary file handle or
            an upload object -- confirm against the callers.

    Returns:
        The output of ``page.get_text()`` for each page, joined in page
        order with no separator, with leading and trailing whitespace
        stripped.
    """
    # Open the document in a ``with`` block so it is closed even if text
    # extraction raises part-way through.
    with fitz.open(stream=file.read(), filetype="pdf") as doc:
        # Join once instead of growing a string with ``+=`` per page.
        text = "".join(page.get_text() for page in doc)
    return text.strip()