ai_systems / src /file_loader.py
amiguel's picture
Upload 5 files
d765c07 verified
raw
history blame contribute delete
595 Bytes
import pandas as pd
import pdfplumber
def load_file(uploaded_file):
ext = uploaded_file.name.split(".")[-1].lower()
if ext == "pdf":
with pdfplumber.open(uploaded_file) as pdf:
return [page.extract_text() for page in pdf.pages if page.extract_text()]
elif ext == "csv":
df = pd.read_csv(uploaded_file)
return df.astype(str).apply(" ".join, axis=1).tolist()
elif ext == "xlsx":
df = pd.read_excel(uploaded_file)
return df.astype(str).apply(" ".join, axis=1).tolist()
else:
raise ValueError("Unsupported file type")