Spaces:

ranbac
/

PaddleOCR

Sleeping

App Files Files Community

ranbac committed on Feb 13

Commit

b722821

verified ·

1 Parent(s): a018f41

Update app.py

Browse files

Files changed (1) hide show

app.py +48 -37

app.py CHANGED Viewed

@@ -2,65 +2,77 @@ import gradio as gr
 import logging
 import os
 import re
-# Set the environment variables BEFORE importing paddle so MKLDNN is fully disabled at the OS level
-os.environ["FLAGS_use_mkldnn"] = "0"
-os.environ["FLAGS_enable_mkldnn"] = "0"
-os.environ["CPP_MIN_LOG_LEVEL"] = "3"
 from paddleocr import PaddleOCR
 from PIL import Image
 import numpy as np
-# Silence Python-side logging
 logging.getLogger("ppocr").setLevel(logging.WARNING)
-print("Đang khởi tạo PaddleOCR (Safe Mode - No MKLDNN)...")
 try:
-    # --- ABSOLUTELY SAFE CONFIGURATION ---
-    # enable_mkldnn=False: must be disabled to avoid the std::exception error
-    # use_angle_cls=True: legacy parameter kept for compatibility (or use_textline_orientation=True)
-    # lang='ch': Chinese
     ocr = PaddleOCR(
-        use_angle_cls=True,
-        lang='ch',
-        use_gpu=False,
-        enable_mkldnn=False, # MOST IMPORTANT: turn off the hardware acceleration that triggers the error
-        show_log=False
     )
 except Exception as e:
-    print(f"Lỗi khởi tạo: {e}. Thử lại chế độ tối giản...")
-    # Fallback mode
-    ocr = PaddleOCR(lang='ch', enable_mkldnn=False)
 print("Model đã sẵn sàng!")
-# --- RECURSIVE SCAN FUNCTION: collects every non-blank string found in nested lists/tuples/dicts/objects ---
 def deep_extract_text(data):
     found_texts = []
     if isinstance(data, str):
-        if len(data.strip()) > 0: return [data]
         return []
     if isinstance(data, (list, tuple)):
         for item in data:
             found_texts.extend(deep_extract_text(item))
     elif isinstance(data, dict):
         for val in data.values():
             found_texts.extend(deep_extract_text(val))
     elif hasattr(data, '__dict__'):
         found_texts.extend(deep_extract_text(data.__dict__))
     return found_texts
-# --- NOISE FILTER FUNCTION: strips each string and drops short, file-name-like, keyword, or symbol-only entries ---
 def clean_text_result(text_list):
     cleaned = []
     block_list = ['min', 'max', 'general', 'header', 'footer', 'structure']
     for t in text_list:
         t = t.strip()
-        if len(t) < 2 and not any(u'\u4e00' <= c <= u'\u9fff' for c in t): continue
-        if t.lower().endswith(('.ttf', '.json', '.pdparams', '.yml')): continue
-        if t.lower() in block_list: continue
-        if not re.search(r'[\w\u4e00-\u9fff]', t): continue
         cleaned.append(t)
     return cleaned
@@ -69,18 +81,16 @@ def predict(image):
         return "请上传图片 / Vui lòng tải ảnh lên."
     try:
-        # --- CHUẨN HÓA ẢNH (FIX LỖI C++ CRASH) ---
-        # Paddle C++ rất ghét ảnh RGBA (trong suốt), bắt buộc convert về RGB
         if isinstance(image, Image.Image):
-            if image.mode != 'RGB':
-                image = image.convert('RGB')
             image = np.array(image)
-        # Gọi OCR
         raw_result = ocr.ocr(image)
-        # Xử lý kết quả
         all_texts = deep_extract_text(raw_result)
         final_texts = clean_text_result(all_texts)
         if len(final_texts) > 0:
@@ -91,15 +101,16 @@ def predict(image):
     except Exception as e:
         import traceback
         traceback.print_exc()
-        return f"Lỗi hệ thống: {str(e)}"
-# User interface
 iface = gr.Interface(
     fn=predict,
     inputs=gr.Image(type="pil", label="Input Image"),
-    outputs=gr.Textbox(label="Kết quả", lines=15),
-    title="PaddleOCR Chinese (Safe Mode)",
-    description="Phiên bản đã tắt MKLDNN để sửa lỗi std::exception.",
     examples=[]
 )

 import logging
 import os
 import re
 from paddleocr import PaddleOCR
 from PIL import Image
 import numpy as np
+# Silence system-level logging (NOTE(review): set after the paddleocr import here - confirm it still takes effect)
+os.environ["CPP_MIN_LOG_LEVEL"] = "3"
 logging.getLogger("ppocr").setLevel(logging.WARNING)
+print("Đang khởi tạo PaddleOCR (PaddleX 3.0)...")
+# --- IMPORTANT BUG-FIX SECTION ---
+# 'use_gpu=False' has been removed entirely to avoid a ValueError
 try:
     ocr = PaddleOCR(
+        use_textline_orientation=True,
+        lang='ch'
     )
 except Exception as e:
+    print(f"Lỗi khởi tạo tham số: {e}. Chuyển sang chế độ mặc định.")
+    ocr = PaddleOCR(lang='ch')
 print("Model đã sẵn sàng!")
+# --- RECURSIVE SCAN FUNCTION (pulls text out of arbitrarily nested structures) ---
 def deep_extract_text(data):
     found_texts = []
+    # A string -> take it as-is (blank / whitespace-only strings yield nothing)
     if isinstance(data, str):
+        if len(data.strip()) > 0:
+            return [data]
         return []
+    # A list/tuple -> scan each element
     if isinstance(data, (list, tuple)):
         for item in data:
             found_texts.extend(deep_extract_text(item))
+    # A dict -> scan its values (keys are not inspected)
     elif isinstance(data, dict):
         for val in data.values():
             found_texts.extend(deep_extract_text(val))
+    # Any other object exposing __dict__ -> scan its attributes
     elif hasattr(data, '__dict__'):
         found_texts.extend(deep_extract_text(data.__dict__))
     return found_texts
+# --- NOISE FILTER FUNCTION (drops entries such as min, general, .ttf) ---
 def clean_text_result(text_list):
     cleaned = []
+    # Junk keywords to block (compared against the lower-cased, stripped string)
     block_list = ['min', 'max', 'general', 'header', 'footer', 'structure']
     for t in text_list:
         t = t.strip()
+        # 1. Skip strings that are too short (unless they are Chinese characters)
+        if len(t) < 2:
+            # Check against the U+4E00-U+9FFF Unicode range for Chinese characters
+            if not any(u'\u4e00' <= c <= u'\u9fff' for c in t):
+                continue
+        # 2. Skip system file names
+        if t.lower().endswith(('.ttf', '.json', '.pdparams', '.yml', '.yaml')):
+            continue
+        # 3. Skip system keywords
+        if t.lower() in block_list:
+            continue
+        # 4. Keep only lines with real content (at least one word or Chinese character)
+        if not re.search(r'[\w\u4e00-\u9fff]', t):
+            continue
         cleaned.append(t)
     return cleaned
         return "请上传图片 / Vui lòng tải ảnh lên."
     try:
         if isinstance(image, Image.Image):
             image = np.array(image)
+        # Gọi OCR (Không truyền tham số nào khác)
         raw_result = ocr.ocr(image)
+        # Trích xuất toàn bộ text
         all_texts = deep_extract_text(raw_result)
+        # Lọc sạch kết quả
         final_texts = clean_text_result(all_texts)
         if len(final_texts) > 0:
     except Exception as e:
         import traceback
         traceback.print_exc()
+        return f"Lỗi xử lý: {str(e)}"
+# Gradio interface
 iface = gr.Interface(
     fn=predict,
     inputs=gr.Image(type="pil", label="Input Image"),
+    # show_copy_button=True is left out to avoid errors on older Gradio versions
+    outputs=gr.Textbox(label="Kết quả (Đã lọc nhiễu)", lines=15),
+    title="PaddleOCR Tiếng Trung (PaddleX 3.0 Clean)",
+    description="Phiên bản đã Fix lỗi use_gpu và tích hợp bộ lọc rác thông minh.",
     examples=[]
 )