Spaces:

mrinalcs
/

deepseek-ocr-api

Runtime error

mrinalcs committed on Nov 20, 2025

Commit

68f50cf

verified ·

1 Parent(s): ddefe9c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -13,15 +13,13 @@ print("Loading model...")
 model = AutoModel.from_pretrained(
     model_name,
     trust_remote_code=True,
-    _attn_implementation="flash_attention_2",
-    use_safetensors=True
-).cuda().to(torch.bfloat16).eval()
 def ocr_infer(image):
-    # Save temporary image
     image.save("input.png")
-    # Standard OCR prompt
     prompt = "<image>\nFree OCR."
     result = model.infer(
@@ -29,20 +27,18 @@ def ocr_infer(image):
         prompt=prompt,
         image_file="input.png",
         output_path=".",
-        base_size=1024,
         image_size=640,
-        crop_mode=True,
-        save_results=False
     )
     return result["text"]
 demo = gr.Interface(
     fn=ocr_infer,
     inputs=gr.Image(type="pil"),
     outputs="text",
-    title="DeepSeek-OCR API (HuggingFace)",
-    description="Upload an image and get OCR text using DeepSeek-OCR"
 )
 demo.launch()

 model = AutoModel.from_pretrained(
     model_name,
     trust_remote_code=True,
+    use_safetensors=True,
+    low_cpu_mem_usage=True
+).cuda().eval()
 def ocr_infer(image):
     image.save("input.png")
     prompt = "<image>\nFree OCR."
     result = model.infer(
         prompt=prompt,
         image_file="input.png",
         output_path=".",
         image_size=640,
+        crop_mode=True
     )
     return result["text"]
 demo = gr.Interface(
     fn=ocr_infer,
     inputs=gr.Image(type="pil"),
     outputs="text",
+    title="DeepSeek-OCR (HF Space)",
+    description="GPU OCR API"
 )
 demo.launch()