longjava2024 committed on
Commit
1edb9b1
·
verified ·
1 Parent(s): ddd807c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -6
app.py CHANGED
@@ -28,8 +28,9 @@ app = FastAPI(title="CCCD OCR with Vintern-1B-v2")
28
 
29
 
30
  MODEL_NAME = "5CD-AI/Vintern-1B-v2"
31
- DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
32
- DTYPE = torch.bfloat16 if DEVICE == "cuda" else torch.float32
 
33
 
34
 
35
  print(f"Loading model `{MODEL_NAME}` on {DEVICE} ...")
@@ -237,10 +238,7 @@ def normalize_base64(image_base64: str) -> str:
237
 
238
  def ocr_by_llm(image_base64: str, prompt: str) -> str:
239
  pixel_values = load_image_from_base64(image_base64, max_num=6)
240
- if DEVICE == "cuda":
241
- pixel_values = pixel_values.to(dtype=torch.bfloat16, device=DEVICE)
242
- else:
243
- pixel_values = pixel_values.to(dtype=torch.float32, device=DEVICE)
244
  with torch.no_grad():
245
  response_message = model.chat(
246
  tokenizer,
 
28
 
29
 
30
  MODEL_NAME = "5CD-AI/Vintern-1B-v2"
31
+ # Force CPU-only to avoid NVIDIA driver / CUDA issues on Spaces
32
+ DEVICE = "cpu"
33
+ DTYPE = torch.float32
34
 
35
 
36
  print(f"Loading model `{MODEL_NAME}` on {DEVICE} ...")
 
238
 
239
  def ocr_by_llm(image_base64: str, prompt: str) -> str:
240
  pixel_values = load_image_from_base64(image_base64, max_num=6)
241
+ pixel_values = pixel_values.to(dtype=torch.float32, device=DEVICE)
 
 
 
242
  with torch.no_grad():
243
  response_message = model.chat(
244
  tokenizer,