Spaces:

minhvh
/

ocr

Sleeping

App Files Community

minhvh committed on Sep 5, 2025

Commit

6a009c3

verified ·

1 Parent(s): 9fb3717

Update app.py

Browse files

Files changed (1) hide show

app.py +60 -52

app.py CHANGED Viewed

@@ -1,69 +1,77 @@
 import gradio as gr
-import cv2
 import numpy as np
-import easyocr
-from paddleocr import PaddleOCR
-# Khởi tạo EasyOCR cho English, Japanese
-readers = {
-    "English": easyocr.Reader(['en'], gpu=False),
-    "Japanese": easyocr.Reader(['ja', 'en'], gpu=False),
 }
-# Khởi tạo PaddleOCR cho Chinese (Simplified)
-paddle_reader = PaddleOCR(
-    use_doc_orientation_classify=False,
-    use_doc_unwarping=False,
-    use_textline_orientation=False
-)
-def preprocess_image(image, max_width=1024):
     """
-    Resize ảnh nếu quá lớn, convert sang RGB.
     """
-    if image.shape[2] == 4:
-        image = cv2.cvtColor(image, cv2.COLOR_RGBA2RGB)
-    h, w = image.shape[:2]
-    if w > max_width:
-        ratio = max_width / w
-        image = cv2.resize(image, (max_width, int(h * ratio)))
-    return image
-def ocr_image(image, lang_choice):
-    """
-    OCR với EasyOCR (English/Japanese) hoặc PaddleOCR (Chinese).
-    """
-    # image = preprocess_image(image)
-    if lang_choice == "Chinese (Simplified)":
-        # PaddleOCR: input có thể là numpy array
-        results = paddle_reader.ocr(image, cls=False)
-        texts = []
-        for res in results:
-            for line in res:
-                texts.append(line[1][0])  # line[1] = (text, confidence)
-        return "\n".join(texts) if texts else "Không nhận diện được văn bản"
-    else:
-        # EasyOCR
-        reader = readers[lang_choice]
-        results = reader.readtext(image)
-        texts = [res[1] for res in results]
-        return "\n".join(texts) if texts else "Không nhận diện được văn bản"
-# Giao diện Gradio
 demo = gr.Interface(
-    fn=ocr_image,
     inputs=[
-        gr.Image(type="numpy", label="Upload ảnh"),
-        gr.Dropdown(
-            choices=["English", "Chinese (Simplified)", "Japanese"],
-            value="English",
-            label="Chọn ngôn ngữ OCR"
-        )
     ],
-    outputs="text",
-    title="OCR Đa Ngôn Ngữ (EasyOCR + PaddleOCR)",
-    description="English & Japanese dùng EasyOCR, Chinese Simplified dùng PaddleOCR"
 )
 if __name__ == "__main__":

 import gradio as gr
+from paddleocr import PaddleOCR, draw_ocr
+from PIL import Image
 import numpy as np
+# ===== Khởi tạo model OCR cho từng ngôn ngữ =====
+LANG_CONFIG = {
+    "ch": "Chinese (Simplified)",
+    "en": "English",
+    "japan": "Japanese",
+    "korean": "Korean",
+    "fr": "French",
+    "german": "German",
 }
+# Load toàn bộ model sẵn (startup lâu nhưng inference nhanh)
+ocr_models = {
+    lang: PaddleOCR(lang=lang, use_angle_cls=True, use_gpu=False)
+    for lang in LANG_CONFIG.keys()
+}
+def inference(img, lang):
     """
+    Nhận diện text bằng PaddleOCR và vẽ kết quả ra ảnh.
     """
+    # OCR
+    ocr = ocr_models[lang]
+    result = ocr.ocr(img, cls=True)[0]
+    # Load ảnh gốc bằng PIL
+    image = Image.open(img).convert("RGB")
+    # Lấy bbox, text, confidence
+    boxes = [line[0] for line in result]
+    txts = [line[1][0] for line in result]
+    scores = [line[1][1] for line in result]
+    # Vẽ kết quả OCR
+    im_show = draw_ocr(image, boxes, txts, scores, font_path="./simfang.ttf")
+    im_show = Image.fromarray(im_show.astype(np.uint8))  # từ numpy -> PIL
+    # Trả về text + ảnh
+    text_out = "\n".join([f"{t} (conf={s:.2f})" for t, s in zip(txts, scores)])
+    return im_show, text_out
+# ===== Giao diện Gradio =====
+title = "PaddleOCR Multi-language"
+description = """
+PaddleOCR hỗ trợ Chinese, English, Japanese, Korean, French, German.
+- Upload ảnh + chọn ngôn ngữ để nhận diện.
+- Model load sẵn toàn bộ, inference nhanh.
+"""
+examples = [
+    ["en_example.jpg", "en"],
+    ["cn_example.jpg", "ch"],
+    ["jp_example.jpg", "japan"],
+]
 demo = gr.Interface(
+    fn=inference,
     inputs=[
+        gr.Image(type="filepath", label="Upload ảnh"),
+        gr.Dropdown(choices=list(LANG_CONFIG.keys()), value="ch", label="Ngôn ngữ OCR")
+    ],
+    outputs=[
+        gr.Image(type="pil", label="Ảnh kết quả"),
+        gr.Textbox(label="Kết quả nhận diện")
     ],
+    title=title,
+    description=description,
+    examples=examples,
+    cache_examples=False,
 )
 if __name__ == "__main__":