Spaces:

HoagMin
/

FoodDetection

Sleeping

App Files Community

HoagMin committed on Feb 27

Commit

751fef8

1 Parent(s): b29d4b3

update ocr service

Browse files

Files changed (1) hide show

services/ocr_service.py +23 -34

services/ocr_service.py CHANGED Viewed

@@ -10,11 +10,9 @@ logging.getLogger("paddle").setLevel(logging.ERROR)
 class OCRService:
     def __init__(self):
-        """Khởi tạo PaddleOCR cho phiên bản Pipeline mới."""
-        # Với bản mới, các tham số cấu hình thường được nhận tự động hoặc qua config file.
-        # Ta khởi tạo đơn giản nhất để tránh lỗi tham số lạ.
-        self.ocr = PaddleOCR(lang='vi', use_textline_orientation=False, use_doc_orientation_classify=False,
-    use_doc_unwarping=False)
     def extract_text(self, img_path: str) -> List[str]:
         """
@@ -25,27 +23,19 @@ class OCRService:
             return []
         try:
-            # --- 1. CHẠY OCR (Dùng .predict theo yêu cầu của thư viện) ---
-            # KHÔNG truyền cls=True vào đây nữa
-            results = self.ocr.predict(img_path)
             raw_texts = []
-            # --- 2. XỬ LÝ KẾT QUẢ (Structure mới) ---
-            # Kết quả trả về là một list các object, mỗi object chứa thông tin nhận diện
-            for res in results:
-                # Kiểm tra xem object có thuộc tính 'rec_texts' không (đây là đặc trưng bản mới)
-                if hasattr(res, 'rec_texts'):
-                    if res.rec_texts:
-                        for text in res.rec_texts:
-                            if text:
-                                raw_texts.append(str(text))
-                # Dự phòng: Nếu nó trả về Dictionary (một số version khác)
-                elif isinstance(res, dict) and 'rec_texts' in res:
-                    raw_texts.extend(res['rec_texts'])
-            # --- 3. BỘ LỌC RÁC (Giữ nguyên logic cũ) ---
             clean_texts = []
             for text in raw_texts:
                 text = text.strip()
@@ -72,15 +62,14 @@ class OCRService:
             traceback.print_exc()
             return []
- #--- TEST CODE ---
-#if __name__ == "__main__":
- #   service = OCRService()
-  #  test_path = r"static/debug/bunbohue.png"
-  #  print(f"🔍 Đang đọc: {test_path}")
-  #  texts = service.extract_text(test_path)
-  #
-  #  print("-" * 30)
-  #  print(f"✅ KẾT QUẢ ({len(texts)} dòng):")
-  #  for t in texts:
-  #      print(f"  - {t}") ##

 class OCRService:
     def __init__(self):
+        """Khởi tạo PaddleOCR cho phiên bản 2.8.1 ổn định."""
+        # Tham số use_angle_cls thay thế cho các cấu hình doc orientation bản mới
+        self.ocr = PaddleOCR(lang='vi', use_angle_cls=False)
     def extract_text(self, img_path: str) -> List[str]:
         """
             return []
         try:
+            # --- 1. CHẠY OCR (Dùng .ocr thay vì .predict) ---
+            results = self.ocr.ocr(img_path, cls=False)
             raw_texts = []
+            # --- 2. XỬ LÝ KẾT QUẢ (Structure của bản 2.x) ---
+            # Kết quả trả về là list các dòng, mỗi dòng có dạng: [tọa_độ_box, (text, độ_tự_tin)]
+            if results and len(results) > 0 and results[0] is not None:
+                for line in results[0]:
+                    text = line[1][0] # line[1] là tuple (text, score), lấy phần tử đầu tiên
+                    raw_texts.append(text)
+            # --- 3. BỘ LỌC RÁC (Giữ nguyên logic cực kỳ xịn của bạn) ---
             clean_texts = []
             for text in raw_texts:
                 text = text.strip()
             traceback.print_exc()
             return []
+# --- TEST CODE ---
+# if __name__ == "__main__":
+#     service = OCRService()
+#     test_path = r"static/debug/bunbohue.png"
+#     print(f"🔍 Đang đọc: {test_path}")
+#     texts = service.extract_text(test_path)
+#
+#     print("-" * 30)
+#     print(f"✅ KẾT QUẢ ({len(texts)} dòng):")
+#     for t in texts:
+#         print(f"  - {t}")