File size: 356 Bytes
b6e3c51
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
import os
import fitz  # PyMuPDF

def extract_text_from_file(file_obj):
    """Return the text content of an uploaded ``.pdf`` or ``.txt`` file.

    The file type is chosen from the extension of ``file_obj.name``,
    compared case-insensitively.

    Args:
        file_obj: A file-like object exposing ``read()`` and, normally, a
            ``name`` attribute holding the file name.

    Returns:
        For PDFs, the text of every page joined with newlines. For text
        files, the content decoded as UTF-8. An empty string when the
        extension is unsupported or the object has no usable name.

    Raises:
        UnicodeDecodeError: If a ``.txt`` file is not valid UTF-8.
    """
    # Some file-like objects have no name (or name=None); treat those as an
    # unsupported type rather than failing with AttributeError.
    name = str(getattr(file_obj, "name", None) or "").lower()

    if name.endswith(".pdf"):
        # Close the document deterministically so the parsed PDF buffer is
        # released even if text extraction raises part-way through.
        with fitz.open(stream=file_obj.read(), filetype="pdf") as doc:
            return "\n".join(page.get_text() for page in doc)

    if name.endswith(".txt"):
        data = file_obj.read()
        # A file opened in text mode already yields str; only bytes need
        # decoding.
        if isinstance(data, str):
            return data
        return data.decode("utf-8")

    return ""