Spaces:

ranbac
/

PaddleOCR

Running

App Files Files Community

ranbac committed 24 days ago

Commit

e8fb7a1

verified ·

1 Parent(s): f286775

Create app.py

Browse files

Files changed (1) hide show

app.py +62 -0

app.py ADDED Viewed

	@@ -0,0 +1,62 @@

+import gradio as gr
+from paddleocr import PaddleOCR
+from PIL import Image
+import numpy as np
+# 1. Khởi tạo PaddleOCR
+# use_gpu=False: BẮT BUỘC cho CPU Basic
+# lang='ch': Hỗ trợ tiếng Trung và tiếng Anh
+# use_angle_cls=True: Tự động xoay ảnh nếu văn bản bị nghiêng
+ocr = PaddleOCR(use_angle_cls=True, lang='ch', use_gpu=False)
+def inference(img):
+    if img is None:
+        return None, "Vui lòng tải ảnh lên."
+    # Chuyển đổi ảnh sang numpy array nếu cần thiết
+    if isinstance(img, Image.Image):
+        img = np.array(img)
+    # 2. Thực hiện OCR
+    # result trả về danh sách các hộp (box), văn bản (text), và độ tin cậy (score)
+    result = ocr.ocr(img, cls=True)
+    txts = []
+    if result and result[0]:
+        # Trích xuất chỉ phần văn bản để hiển thị
+        txts = [line[1][0] for line in result[0]]
+    else:
+        return img, "Không tìm thấy văn bản nào."
+    # 3. Vẽ kết quả lên ảnh (Optional - dùng hàm có sẵn của Paddle)
+    from paddleocr import draw_ocr
+    boxes = [line[0] for line in result[0]]
+    scores = [line[1][1] for line in result[0]]
+    # Cần font tiếng Trung để vẽ lên ảnh, nếu không sẽ bị lỗi ô vuông
+    # PaddleOCR tự động tải font mặc định, nhưng để an toàn ta trả về text trước
+    im_show = draw_ocr(img, boxes, txts, scores, font_path='./fonts/simfang.ttf')
+    im_show = Image.fromarray(im_show)
+    return im_show, "\n".join(txts)
+# 4. Gradio interface
+# Heading and description text rendered at the top of the page.
+title = "PaddleOCR Chinese - CPU Optimized"
+description = "Nhận diện tiếng Trung/Anh sử dụng PaddleOCR v4 chạy trên Hugging Face CPU Basic."
+with gr.Blocks() as demo:
+    gr.Markdown(f"# {title}")
+    gr.Markdown(description)
+    # Two-column layout: upload + trigger button on the left, results on the right.
+    with gr.Row():
+        with gr.Column():
+            # type="pil" makes Gradio hand the upload to the callback as a PIL image.
+            img_input = gr.Image(label="Tải ảnh lên", type="pil")
+            submit_btn = gr.Button("Chạy OCR")
+        with gr.Column():
+            img_output = gr.Image(label="Kết quả Visualized", type="pil")
+            text_output = gr.Textbox(label="Văn bản trích xuất", lines=10)
+    # Wire the button to `inference`; its (image, text) return value fills
+    # the two output components in that order.
+    submit_btn.click(fn=inference, inputs=img_input, outputs=[img_output, text_output])
+# Launch the app (runs at import time; there is no __main__ guard).
+demo.launch()