Spaces:

ranbac
/

PaddleOCR

Sleeping

App Files Community

ranbac committed 23 days ago

Commit

14d33c0

verified ·

1 Parent(s): d77ca99

Update app.py

Browse files

Files changed (1) hide show

app.py +33 -48

app.py CHANGED Viewed

@@ -3,60 +3,45 @@ from paddleocr import PaddleOCR
 from PIL import Image
 import numpy as np
-# 1. Khởi tạo PaddleOCR
 # use_gpu=False: BẮT BUỘC cho CPU Basic
-# lang='ch': Hỗ trợ tiếng Trung và tiếng Anh
-# use_angle_cls=True: Tự động xoay ảnh nếu văn bản bị nghiêng
-ocr = PaddleOCR(use_angle_cls=True, lang='ch')
-def inference(img):
-    if img is None:
-        return None, "Vui lòng tải ảnh lên."
-    # Chuyển đổi ảnh sang numpy array nếu cần thiết
-    if isinstance(img, Image.Image):
-        img = np.array(img)
-    # 2. Thực hiện OCR
-    # result trả về danh sách các hộp (box), văn bản (text), và độ tin cậy (score)
-    result = ocr.ocr(img, cls=True)
     txts = []
     if result and result[0]:
-        # Trích xuất chỉ phần văn bản để hiển thị
-        txts = [line[1][0] for line in result[0]]
     else:
-        return img, "Không tìm thấy văn bản nào."
-    # 3. Vẽ kết quả lên ảnh (Optional - dùng hàm có sẵn của Paddle)
-    from paddleocr import draw_ocr
-    boxes = [line[0] for line in result[0]]
-    scores = [line[1][1] for line in result[0]]
-    # Cần font tiếng Trung để vẽ lên ảnh, nếu không sẽ bị lỗi ô vuông
-    # PaddleOCR tự động tải font mặc định, nhưng để an toàn ta trả về text trước
-    im_show = draw_ocr(img, boxes, txts, scores, font_path='./fonts/simfang.ttf')
-    im_show = Image.fromarray(im_show)
-    return im_show, "\n".join(txts)
-# 4. Giao diện Gradio
-title = "PaddleOCR Chinese - CPU Optimized"
-description = "Nhận diện tiếng Trung/Anh sử dụng PaddleOCR v4 chạy trên Hugging Face CPU Basic."
-with gr.Blocks() as demo:
-    gr.Markdown(f"# {title}")
-    gr.Markdown(description)
-    with gr.Row():
-        with gr.Column():
-            img_input = gr.Image(label="Tải ảnh lên", type="pil")
-            submit_btn = gr.Button("Chạy OCR")
-        with gr.Column():
-            img_output = gr.Image(label="Kết quả Visualized", type="pil")
-            text_output = gr.Textbox(label="Văn bản trích xuất", lines=10)
-    submit_btn.click(fn=inference, inputs=img_input, outputs=[img_output, text_output])
-# Launch
-demo.launch()

 from PIL import Image
 import numpy as np
+# Khởi tạo PaddleOCR
+# use_angle_cls=True: Tự động xoay ảnh nếu bị nghiêng
+# lang='vi': Hỗ trợ tiếng Việt (và tiếng Anh)
 # use_gpu=False: BẮT BUỘC cho CPU Basic
+print("Đang tải model PaddleOCR...")
+ocr = PaddleOCR(use_angle_cls=True, lang='vi', use_gpu=False)
+print("Đã tải model thành công!")
+def predict(image):
+    if image is None:
+        return "Vui lòng tải ảnh lên."
+    # Chuyển đổi ảnh sang numpy array nếu cần
+    if isinstance(image, Image.Image):
+        image = np.array(image)
+    # Thực hiện OCR
+    result = ocr.ocr(image, cls=True)
+    # Xử lý kết quả trả về
     txts = []
     if result and result[0]:
+        for line in result[0]:
+            # line cấu trúc: [[box], [text, confidence]]
+            text = line[1][0]
+            txts.append(text)
+        return "\n".join(txts)
     else:
+        return "Không tìm thấy văn bản nào."
+# Tạo giao diện Gradio
+iface = gr.Interface(
+    fn=predict,
+    inputs=gr.Image(type="pil", label="Tải ảnh lên"),
+    outputs=gr.Textbox(label="Kết quả nhận dạng", lines=10),
+    title="PaddleOCR Tiếng Việt - CPU Basic",
+    description="Demo nhận dạng văn bản tiếng Việt chạy trên Hugging Face Spaces (Docker CPU).",
+    examples=[] # Bạn có thể thêm đường dẫn ảnh mẫu vào đây nếu muốn
+)
+if __name__ == "__main__":
+    iface.launch(server_name="0.0.0.0", server_port=7860)