Spaces: Running
Update app.py
Browse files
app.py
CHANGED
@@ -8,7 +8,7 @@ import requests
|
|
8 |
from typing import List, Dict, Union
|
9 |
import pandas as pd
|
10 |
import wikipediaapi
|
11 |
-
import
|
12 |
from docx import Document
|
13 |
|
14 |
load_dotenv()
|
@@ -82,7 +82,7 @@ class BasicAgent:
|
|
82 |
try:
|
83 |
if ext == '.pdf':
|
84 |
with open(file_path, 'rb') as f:
|
85 |
-
reader =
|
86 |
return "\n".join([page.extract_text() for page in reader.pages])
|
87 |
elif ext in ('.doc', '.docx'):
|
88 |
doc = Document(file_path)
|
|
|
8 |
from typing import List, Dict, Union
|
9 |
import pandas as pd
|
10 |
import wikipediaapi
|
11 |
+
import PyPDF
|
12 |
from docx import Document
|
13 |
|
14 |
load_dotenv()
|
|
|
82 |
try:
|
83 |
if ext == '.pdf':
|
84 |
with open(file_path, 'rb') as f:
|
85 |
+
reader = PyPDF.PdfReader(f)
|
86 |
return "\n".join([page.extract_text() for page in reader.pages])
|
87 |
elif ext in ('.doc', '.docx'):
|
88 |
doc = Document(file_path)
|