Spaces:

ivanhoang
/

email-order-extractor

Build error

ivanhoang committed on Sep 19

Commit

62477e6

verified ·

1 Parent(s): 1ad2e0c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -13,21 +13,21 @@ print(f"Đang sử dụng thiết bị: {device}")
 # 1. Tải mô hình OCR (Sử dụng phiên bản 'base' thay vì 'large')
 print("Đang tải mô hình OCR (Florence-2-base)...")
-ocr_model_id = "microsoft/Florence-2-base" # THAY ĐỔI 1: Dùng model base nhỏ hơn
 ocr_processor = AutoProcessor.from_pretrained(ocr_model_id, trust_remote_code=True)
 quantization_config = BitsAndBytesConfig(load_in_4bit=True)
 ocr_model = AutoModelForCausalLM.from_pretrained(
     ocr_model_id,
-    device_map="auto", # Để transformers tự quyết định device map
     torch_dtype=torch.bfloat16,
     quantization_config=quantization_config,
-    trust_remote_code=True
 )
 print("Tải xong mô hình OCR.")
 # 2. Tải mô hình LLM (Sử dụng phiên bản đã được nén sẵn)
 print("Đang tải mô hình LLM (Unsloth Llama 3 8B 4-bit)...")
-# THAY ĐỔI 2: Dùng phiên bản Llama-3 đã được nén sẵn của Unsloth, rất hiệu quả về bộ nhớ
 llm_model_id = "unsloth/llama-3-8b-Instruct-bnb-4bit"
 llm_pipeline = pipeline(
     "text-generation",

 # 1. Tải mô hình OCR (Sử dụng phiên bản 'base' thay vì 'large')
 print("Đang tải mô hình OCR (Florence-2-base)...")
+ocr_model_id = "microsoft/Florence-2-base"
 ocr_processor = AutoProcessor.from_pretrained(ocr_model_id, trust_remote_code=True)
 quantization_config = BitsAndBytesConfig(load_in_4bit=True)
 ocr_model = AutoModelForCausalLM.from_pretrained(
     ocr_model_id,
+    device_map="auto",
     torch_dtype=torch.bfloat16,
     quantization_config=quantization_config,
+    trust_remote_code=True,
+    attn_implementation="eager" # <-- THÊM DÒNG NÀY ĐỂ SỬA LỖI
 )
 print("Tải xong mô hình OCR.")
 # 2. Tải mô hình LLM (Sử dụng phiên bản đã được nén sẵn)
 print("Đang tải mô hình LLM (Unsloth Llama 3 8B 4-bit)...")
 llm_model_id = "unsloth/llama-3-8b-Instruct-bnb-4bit"
 llm_pipeline = pipeline(
     "text-generation",