Spaces:

eoeooe
/

OcrBroTest

Sleeping

App Files Community

eoeooe committed on Sep 1, 2025

Commit

400665c

verified ·

1 Parent(s): 259b92e

Update app.py

Browse files

Files changed (1) hide show

app.py +19 -7

app.py CHANGED Viewed

@@ -11,11 +11,23 @@ def ocr_with_boxes(image):
     # แปลงจาก PIL → OpenCV
     img = cv2.cvtColor(np.array(image), cv2.COLOR_RGB2BGR)
-    # config ไทย + อังกฤษ
-    custom_config = r'-l tha+eng --oem 3 --psm 6'
     # OCR with bounding boxes
-    data = pytesseract.image_to_data(img, config=custom_config, output_type=Output.DICT)
     totalBox = len(data['text'])
     lines = defaultdict(list)
@@ -37,7 +49,7 @@ def ocr_with_boxes(image):
     extracted_texts = [" ".join(words) for _, words in sorted(lines.items())]
     final_text = "\n".join(extracted_texts)
-    # 🔧 แก้เว้นวรรคภาษาไทยตรงนี้เลย
     final_text = re.sub(r'([\u0E00-\u0E7F])\s+([\u0E00-\u0E7F])', r'\1\2', final_text)
     # แปลงกลับเป็น PIL
@@ -51,8 +63,8 @@ demo = gr.Interface(
     fn=ocr_with_boxes,
     inputs=gr.Image(type="pil", label="อัปโหลดภาพ"),
     outputs=[gr.Image(label="ผลลัพธ์พร้อมกรอบข้อความ"), gr.Textbox(label="ข้อความ OCR")],
-    title="OCR ไทย + อังกฤษ (Tesseract + Fix Spacing)",
-    description="อัปโหลดภาพ ระบบจะ OCR ไทย+อังกฤษ วาดกรอบ และแก้เว้นวรรคภาษาไทยอัตโนมัติ"
 )
 if __name__ == "__main__":

     # แปลงจาก PIL → OpenCV
     img = cv2.cvtColor(np.array(image), cv2.COLOR_RGB2BGR)
+    # --- Preprocessing เพื่อให้ OCR อ่านโลโก้แม่นขึ้น ---
+    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)  # เป็น grayscale
+    gray = cv2.adaptiveThreshold(
+        gray, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
+        cv2.THRESH_BINARY, 11, 2
+    )
+    kernel = np.ones((2, 2), np.uint8)
+    gray = cv2.dilate(gray, kernel, iterations=1)
+    gray = cv2.erode(gray, kernel, iterations=1)
+    # --- Tesseract config ---
+    # oem 3 = default engine mode (based on what is available; --oem 1 is LSTM only), psm 6 = assume a single uniform block of text
+    # whitelist สำหรับตัวอักษรอังกฤษ + ตัวเลข
+    custom_config = r'-l tha+eng --oem 3 --psm 6 -c tessedit_char_whitelist=ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789'
     # OCR with bounding boxes
+    data = pytesseract.image_to_data(gray, config=custom_config, output_type=Output.DICT)
     totalBox = len(data['text'])
     lines = defaultdict(list)
     extracted_texts = [" ".join(words) for _, words in sorted(lines.items())]
     final_text = "\n".join(extracted_texts)
+    # 🔧 แก้เว้นวรรคภาษาไทย
     final_text = re.sub(r'([\u0E00-\u0E7F])\s+([\u0E00-\u0E7F])', r'\1\2', final_text)
     # แปลงกลับเป็น PIL
     fn=ocr_with_boxes,
     inputs=gr.Image(type="pil", label="อัปโหลดภาพ"),
     outputs=[gr.Image(label="ผลลัพธ์พร้อมกรอบข้อความ"), gr.Textbox(label="ข้อความ OCR")],
+    title="OCR ไทย + อังกฤษ (Tesseract + Logo Fix)",
+    description="อัปโหลดภาพ ระบบจะ OCR ไทย+อังกฤษ วาดกรอบ และแก้เว้นวรรคภาษาไทยอัตโนมัติ พร้อมปรับให้โลโก้ภาษาอังกฤษอ่านแม่นขึ้น"
 )
 if __name__ == "__main__":