Spaces:

1oscon
/

PaddleOCR

Runtime error

App Files Community

1oscon committed 16 days ago

Commit

bb6244a

verified ·

1 Parent(s): a7822df

Update app.py

Browse files

Files changed (1) hide show

app.py +6 -7

app.py CHANGED Viewed

@@ -10,10 +10,10 @@ import os
 OUTPUT_DIR = "output_results"
 os.makedirs(OUTPUT_DIR, exist_ok=True)
-# --- 模型加载器 ---
 def load_gpu_model():
-    print("正在加载经过版本锁定的PaddleOCR GPU模型...")
-    # 使用与锁定版本兼容的参数：use_gpu=True是必需的
     ocr_model = PaddleOCR(use_angle_cls=True, lang='ch', use_gpu=True)
     print("GPU模型加载成功。")
     return ocr_model
@@ -33,7 +33,7 @@ def process_pdf_max_speed(pdf_file, progress=gr.Progress(track_tqdm=True)):
         doc = fitz.open(pdf_file.name)
         total_pages = len(doc)
-        batch_size = 4  # 批处理大小
         full_text_result = []
         for i in progress.tqdm(range(0, total_pages, batch_size), desc="🚀 批处理中..."):
@@ -46,7 +46,6 @@ def process_pdf_max_speed(pdf_file, progress=gr.Progress(track_tqdm=True)):
                 batch_images.append(np.array(img))
             if batch_images:
-                # 使用与锁定版本兼容的调用方式：需要 cls=True
                 results = ocr.ocr(batch_images, cls=True)
                 for page_index, page_result in enumerate(results):
@@ -77,7 +76,7 @@ def process_pdf_max_speed(pdf_file, progress=gr.Progress(track_tqdm=True)):
 with gr.Blocks(title="极速PDF识别器", theme=gr.themes.Soft()) as demo:
     gr.Markdown(
         """
-        # 🔥 极速PDF识别器 (GPU加速稳定版) 🔥
         **速度拉满！实时进度显示，处理期间请勿关闭页面。**
         """
     )
@@ -93,7 +92,7 @@ with gr.Blocks(title="极速PDF识别器", theme=gr.themes.Soft()) as demo:
     submit_btn.click(
         fn=process_pdf_max_speed,
         inputs=[pdf_input],
-        outputs=[result_display, download_link]
     )
 demo.queue().launch()

 OUTPUT_DIR = "output_results"
 os.makedirs(OUTPUT_DIR, exist_ok=True)
+# --- 模型加载器 (这个函数将在GPU容器中被安全调用) ---
 def load_gpu_model():
+    print("正在Docker容器中加载PaddleOCR GPU模型...")
+    # 使用与2.7.3版本兼容的参数
     ocr_model = PaddleOCR(use_angle_cls=True, lang='ch', use_gpu=True)
     print("GPU模型加载成功。")
     return ocr_model
         doc = fitz.open(pdf_file.name)
         total_pages = len(doc)
+        batch_size = 4
         full_text_result = []
         for i in progress.tqdm(range(0, total_pages, batch_size), desc="🚀 批处理中..."):
                 batch_images.append(np.array(img))
             if batch_images:
                 results = ocr.ocr(batch_images, cls=True)
                 for page_index, page_result in enumerate(results):
 with gr.Blocks(title="极速PDF识别器", theme=gr.themes.Soft()) as demo:
     gr.Markdown(
         """
+        # ✅ 极速PDF识别器 (终极稳定版) ✅
         **速度拉满！实时进度显示，处理期间请勿关闭页面。**
         """
     )
     submit_btn.click(
         fn=process_pdf_max_speed,
         inputs=[pdf_input],
+        outputs=[display, download_link]
     )
 demo.queue().launch()