OCR-DEMO

Running on Zero

erow committed on Oct 23

Commit

f0568ad

1 Parent(s): 51c0d3d

fix error

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,3 +1,4 @@
 import gradio as gr
 import torch
 from transformers import AutoModel, AutoTokenizer
@@ -34,7 +35,7 @@ def find_result_image(path):
 # --- 2. Main Processing Function (UPDATED for multi-bbox drawing) ---
 @spaces.GPU
-def process_ocr_task(image, model_size, ref_text, task_type="📝 Free OCR"):
     """
     Processes an image with DeepSeek-OCR for all supported tasks.
     Now draws ALL detected bounding boxes for ANY task.
@@ -151,7 +152,8 @@ with gr.Blocks(title="Text Extraction Demo", theme=gr.themes.Soft()) as demo:
                     free_output_image = gr.Image(label="🖼️ Image Result (if any)", type="pil")
             # Wire Free OCR button
-            free_btn.click(fn=process_ocr_task, inputs=[free_image, free_model_size, gr.Textbox(value="", visible=False), "Free OCR"], outputs=[free_output_text, free_output_image])
         with gr.TabItem("Locate"):
             with gr.Row():
@@ -167,7 +169,8 @@ with gr.Blocks(title="Text Extraction Demo", theme=gr.themes.Soft()) as demo:
                     loc_output_image = gr.Image(label="🖼️ Image Result (if any)", type="pil")
             # Wire Locate button
-            loc_btn.click(fn=process_ocr_task, inputs=[loc_image, loc_model_size, ref_text_input, "🔍 Locate Object by Reference"], outputs=[loc_output_text, loc_output_image])
     # Keep examples (they'll run process_ocr_task directly) - provide a compact examples widget pointing to the free tab inputs
     gr.Examples(

+from functools import partial
 import gradio as gr
 import torch
 from transformers import AutoModel, AutoTokenizer
 # --- 2. Main Processing Function (UPDATED for multi-bbox drawing) ---
 @spaces.GPU
+def process_ocr_task(image, model_size, ref_text, task_type):
     """
     Processes an image with DeepSeek-OCR for all supported tasks.
     Now draws ALL detected bounding boxes for ANY task.
                     free_output_image = gr.Image(label="🖼️ Image Result (if any)", type="pil")
             # Wire Free OCR button
+            free_ocr = partial(process_ocr_task, task_type="📝 Free OCR", ref_text="")
+            free_btn.click(fn=free_ocr, inputs=[free_image, free_model_size], outputs=[free_output_text, free_output_image])
         with gr.TabItem("Locate"):
             with gr.Row():
                     loc_output_image = gr.Image(label="🖼️ Image Result (if any)", type="pil")
             # Wire Locate button
+            pets_detection = partial(process_ocr_task, task_type="🔍 Locate Object by Reference", ref_text="pets")
+            loc_btn.click(fn=pets_detection, inputs=[loc_image, loc_model_size], outputs=[loc_output_text, loc_output_image])
     # Keep examples (they'll run process_ocr_task directly) - provide a compact examples widget pointing to the free tab inputs
     gr.Examples(