Update app.py
Browse files
app.py
CHANGED
|
@@ -1683,6 +1683,7 @@ def extract_images_from_pdf(pdf_path: Path):
|
|
| 1683 |
filename=str(pdf_path), # partition_pdf might expect a string
|
| 1684 |
strategy="hi_res",
|
| 1685 |
extract_image_block_types=["Image"],
|
|
|
|
| 1686 |
extract_image_block_to_payload=True,
|
| 1687 |
)
|
| 1688 |
print(f"ELEMENTS")
|
|
@@ -2306,6 +2307,7 @@ def process_pdf():
|
|
| 2306 |
# logger.info(f"Created project folder: {project_folder}")
|
| 2307 |
logger.info(f"Saved uploaded PDF to: {saved_pdf_path}")
|
| 2308 |
logger.info(f"Saved uploaded PDF to: {pdf_file}")
|
|
|
|
| 2309 |
# Extract & process
|
| 2310 |
# output_path, result = extract_images_from_pdf(saved_pdf_path, json_path)
|
| 2311 |
output_path, result = extract_images_from_pdf(saved_pdf_path)
|
|
|
|
| 1683 |
filename=str(pdf_path), # partition_pdf might expect a string
|
| 1684 |
strategy="hi_res",
|
| 1685 |
extract_image_block_types=["Image"],
|
| 1686 |
+
hi_res_model_name="yolox",
|
| 1687 |
extract_image_block_to_payload=True,
|
| 1688 |
)
|
| 1689 |
print(f"ELEMENTS")
|
|
|
|
| 2307 |
# logger.info(f"Created project folder: {project_folder}")
|
| 2308 |
logger.info(f"Saved uploaded PDF to: {saved_pdf_path}")
|
| 2309 |
logger.info(f"Saved uploaded PDF to: {pdf_file}")
|
| 2310 |
+
print("--------------------------------pdf_file_path---------------------",pdf_file,saved_pdf_path)
|
| 2311 |
# Extract & process
|
| 2312 |
# output_path, result = extract_images_from_pdf(saved_pdf_path, json_path)
|
| 2313 |
output_path, result = extract_images_from_pdf(saved_pdf_path)
|