Spaces:
Sleeping
Sleeping
import pandas as pd | |
import pdfplumber | |
def load_file(uploaded_file):
    """Load an uploaded PDF, CSV or XLSX file as a list of text chunks.

    The file type is chosen from the text after the last "." in
    ``uploaded_file.name``, compared case-insensitively.

    Args:
        uploaded_file: An object with a ``name`` attribute that is also
            accepted by ``pdfplumber.open``, ``pd.read_csv`` or
            ``pd.read_excel`` (depending on the extension).

    Returns:
        A list of strings. For a PDF, one entry per page that yields
        non-empty text. For CSV/XLSX, one entry per row, built by converting
        every cell to ``str`` and joining the cells with a single space.

    Raises:
        ValueError: If the extension is not ``pdf``, ``csv`` or ``xlsx``.
    """
    ext = uploaded_file.name.split(".")[-1].lower()

    if ext == "pdf":
        with pdfplumber.open(uploaded_file) as pdf:
            # Extract each page's text exactly once; calling extract_text()
            # for both the filter and the value would repeat the work.
            # The generator is consumed before the PDF is closed.
            page_texts = (page.extract_text() for page in pdf.pages)
            return [text for text in page_texts if text]

    if ext == "csv":
        df = pd.read_csv(uploaded_file)
    elif ext == "xlsx":
        df = pd.read_excel(uploaded_file)
    else:
        raise ValueError("Unsupported file type")

    # Flatten every row into one space-separated string.
    return df.astype(str).apply(" ".join, axis=1).tolist()