README.md CHANGED

@@ -8,6 +8,7 @@ sdk_version: 5.49.1
 app_file: app.py
 pinned: false
 license: mit
+short_description: Multilingual document layout parsing with OCR
 models:
 - rednote-hilab/DotsOCR
 tags:
|
app.py CHANGED

@@ -27,13 +27,23 @@ def load_model():
     global model, processor
     if model is None:
         print(f"Loading model weights from {MODEL_PATH}...")
+
+        # Try to use FlashAttention2 if available, otherwise use default attention
+        try:
+            import flash_attn
+            attn_implementation = "flash_attention_2"
+            print("Using FlashAttention2 for faster inference")
+        except ImportError:
+            attn_implementation = "eager"
+            print("FlashAttention2 not available, using default attention")
+
         model = AutoModelForCausalLM.from_pretrained(
             MODEL_PATH,
-
-            torch_dtype=torch.bfloat16,
+            dtype=torch.bfloat16,
             device_map="auto",
             trust_remote_code=True,
-            token=HF_TOKEN
+            token=HF_TOKEN,
+            attn_implementation=attn_implementation
         )
         print("Model loaded successfully.")
 
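For reference, a minimal sketch of what `load_model()` looks like after this change. The `MODEL_PATH` and `HF_TOKEN` values shown here are placeholders standing in for whatever app.py defines elsewhere, and the module-level `model`/`processor` globals are assumed from the surrounding code:

```python
import os

import torch
from transformers import AutoModelForCausalLM

# Placeholders: the actual MODEL_PATH and HF_TOKEN are defined elsewhere in app.py.
MODEL_PATH = "rednote-hilab/DotsOCR"
HF_TOKEN = os.environ.get("HF_TOKEN")

model = None
processor = None


def load_model():
    global model, processor
    if model is None:
        print(f"Loading model weights from {MODEL_PATH}...")

        # Prefer FlashAttention2 when the flash_attn package is installed,
        # otherwise fall back to the default ("eager") attention implementation.
        try:
            import flash_attn  # noqa: F401
            attn_implementation = "flash_attention_2"
            print("Using FlashAttention2 for faster inference")
        except ImportError:
            attn_implementation = "eager"
            print("FlashAttention2 not available, using default attention")

        model = AutoModelForCausalLM.from_pretrained(
            MODEL_PATH,
            dtype=torch.bfloat16,
            device_map="auto",
            trust_remote_code=True,
            token=HF_TOKEN,
            attn_implementation=attn_implementation,
        )
        print("Model loaded successfully.")
```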