Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -1683,6 +1683,7 @@ def extract_images_from_pdf(pdf_path: Path):
|
|
1683 |
filename=str(pdf_path), # partition_pdf might expect a string
|
1684 |
strategy="hi_res",
|
1685 |
extract_image_block_types=["Image"],
|
|
|
1686 |
extract_image_block_to_payload=True,
|
1687 |
)
|
1688 |
print(f"ELEMENTS")
|
@@ -2306,6 +2307,7 @@ def process_pdf():
|
|
2306 |
# logger.info(f"Created project folder: {project_folder}")
|
2307 |
logger.info(f"Saved uploaded PDF to: {saved_pdf_path}")
|
2308 |
logger.info(f"Saved uploaded PDF to: {pdf_file}")
|
|
|
2309 |
# Extract & process
|
2310 |
# output_path, result = extract_images_from_pdf(saved_pdf_path, json_path)
|
2311 |
output_path, result = extract_images_from_pdf(saved_pdf_path)
|
|
|
1683 |
filename=str(pdf_path), # partition_pdf might expect a string
|
1684 |
strategy="hi_res",
|
1685 |
extract_image_block_types=["Image"],
|
1686 |
+
hi_res_model_name="yolox",
|
1687 |
extract_image_block_to_payload=True,
|
1688 |
)
|
1689 |
print(f"ELEMENTS")
|
|
|
2307 |
# logger.info(f"Created project folder: {project_folder}")
|
2308 |
logger.info(f"Saved uploaded PDF to: {saved_pdf_path}")
|
2309 |
logger.info(f"Saved uploaded PDF to: {pdf_file}")
|
2310 |
+
print("--------------------------------pdf_file_path---------------------",pdf_file,saved_pdf_path)
|
2311 |
# Extract & process
|
2312 |
# output_path, result = extract_images_from_pdf(saved_pdf_path, json_path)
|
2313 |
output_path, result = extract_images_from_pdf(saved_pdf_path)
|