Spaces:

Mageia
/

GOT-OCR-Optimize

Sleeping

App Files Community

Mageia committed on Oct 16, 2024

Commit

d0f2987

unverified ·

1 Parent(s): 2a61207

fix: process pdf once

Browse files

Files changed (1) hide show

app.py +10 -2

app.py CHANGED Viewed

@@ -1,5 +1,6 @@
 import base64
 import os
 import gradio as gr
 import spaces
@@ -15,7 +16,7 @@ model = model.eval().to(device)
 @spaces.GPU()
-def ocr_process(image, got_mode, ocr_color="", ocr_box=""):
     if image is None:
         return "错误:未提供图片"
@@ -23,18 +24,24 @@ def ocr_process(image, got_mode, ocr_color="", ocr_box=""):
         image_path = image
         result_path = f"{os.path.splitext(image_path)[0]}_result.html"
         if "plain" in got_mode:
             if "multi-crop" in got_mode:
                 res = model.chat_crop(tokenizer, image_path, ocr_type="ocr")
             else:
                 res = model.chat(tokenizer, image_path, ocr_type="ocr", ocr_box=ocr_box, ocr_color=ocr_color)
             return res
         elif "format" in got_mode:
             if "multi-crop" in got_mode:
                 res = model.chat_crop(tokenizer, image_path, ocr_type="format", render=True, save_render_file=result_path)
             else:
                 res = model.chat(tokenizer, image_path, ocr_type="format", ocr_box=ocr_box, ocr_color=ocr_color, render=True, save_render_file=result_path)
             if os.path.exists(result_path):
                 with open(result_path, "r", encoding="utf-8") as f:
                     html_content = f.read()
@@ -42,7 +49,8 @@ def ocr_process(image, got_mode, ocr_color="", ocr_box=""):
                 data_uri = f"data:text/html;charset=utf-8;base64,{encoded_html}"
                 preview = f'<iframe src="{data_uri}" width="100%" height="600px"></iframe>'
                 download_link = f'<a href="{data_uri}" download="result.html">下载完整结果</a>'
-                return f"{download_link}\n\n{preview}\n\n识别结果：\n"
         return "错误: 未知的OCR模式"
     except Exception as e:

 import base64
 import os
+import time
 import gradio as gr
 import spaces
 @spaces.GPU()
+def ocr_process(image, got_mode, ocr_color="", ocr_box="", progress=gr.Progress()):
     if image is None:
         return "错误:未提供图片"
         image_path = image
         result_path = f"{os.path.splitext(image_path)[0]}_result.html"
+        progress(0, desc="开始处理...")
         if "plain" in got_mode:
+            progress(0.3, desc="执行OCR识别...")
             if "multi-crop" in got_mode:
                 res = model.chat_crop(tokenizer, image_path, ocr_type="ocr")
             else:
                 res = model.chat(tokenizer, image_path, ocr_type="ocr", ocr_box=ocr_box, ocr_color=ocr_color)
+            progress(1, desc="处理完成")
             return res
         elif "format" in got_mode:
+            progress(0.3, desc="执行OCR识别...")
             if "multi-crop" in got_mode:
                 res = model.chat_crop(tokenizer, image_path, ocr_type="format", render=True, save_render_file=result_path)
             else:
                 res = model.chat(tokenizer, image_path, ocr_type="format", ocr_box=ocr_box, ocr_color=ocr_color, render=True, save_render_file=result_path)
+            progress(0.7, desc="生成结果...")
             if os.path.exists(result_path):
                 with open(result_path, "r", encoding="utf-8") as f:
                     html_content = f.read()
                 data_uri = f"data:text/html;charset=utf-8;base64,{encoded_html}"
                 preview = f'<iframe src="{data_uri}" width="100%" height="600px"></iframe>'
                 download_link = f'<a href="{data_uri}" download="result.html">下载完整结果</a>'
+                progress(1, desc="处理完成")
+                return f"{download_link}\n\n{preview}"
         return "错误: 未知的OCR模式"
     except Exception as e: