Spaces:

eoeooe
/

OcrBroTest

Sleeping

eoeooe committed on Sep 1, 2025

Commit

4d37a12

verified ·

1 Parent(s): df312e5

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,40 +1,45 @@
-import gradio as gr
 import cv2
 import numpy as np
-from paddleocr import PaddleOCR, draw_ocr
 from PIL import Image
-# Load the PaddleOCR model (Thai + English)
-ocr = PaddleOCR(use_angle_cls=True, lang='th')
-def ocr_with_paddle(image):  # returns (annotated PIL image, newline-joined recognized text)
-    # Convert from PIL → OpenCV
-    img = cv2.cvtColor(np.array(image), cv2.COLOR_RGB2BGR)
     # OCR
-    result = ocr.ocr(img, cls=True)
-    # Extract boxes + text
-    boxes = [line[0] for line in result[0]]  # NOTE(review): assumes result[0] is iterable even when nothing is detected — confirm
-    texts = [line[1][0] for line in result[0]]
-    scores = [line[1][1] for line in result[0]]
-    # Draw the bounding boxes
-    im_show = draw_ocr(img, boxes, texts, scores, font_path='th_font.ttf')
-    im_show = Image.fromarray(im_show)
-    # Join the text lines
-    extracted_text = "\n".join(texts)
-    return im_show, extracted_text
-demo = gr.Interface(  # Gradio UI wired to ocr_with_paddle: one PIL image in, image + textbox out
-    fn=ocr_with_paddle,
     inputs=gr.Image(type="pil"),
-    outputs=[gr.Image(type="pil", label="Detected Image"), gr.Textbox(label="Extracted Text")],
-    title="Fast OCR (Thai+English) with PaddleOCR",
-    description="OCR ภาษาไทย-อังกฤษ ที่เร็วกว่า EasyOCR"
 )
-if __name__ == "__main__":
-    demo.launch()  # launch only when executed as a script

 import cv2
+import pytesseract
+from pytesseract import Output
+import gradio as gr
 import numpy as np
 from PIL import Image
+def preprocess_image(img):
+    """Preprocess the image so that Thai+English OCR is more accurate."""
+    gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)  # img is interpreted as BGR here
+    # Reduce noise
+    gray = cv2.medianBlur(gray, 3)  # median filter with aperture size 3
+    # Thresholding (adaptive) to make the text stand out
+    thresh = cv2.adaptiveThreshold(
+        gray, 255, cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
+        cv2.THRESH_BINARY, 11, 2  # blockSize=11, C=2
+    )
+    return thresh
+def ocr_image(img_pil):  # Gradio callback: returns the text Tesseract reads from the image
+    # Convert PIL -> OpenCV
+    img = cv2.cvtColor(np.array(img_pil), cv2.COLOR_RGB2BGR)  # NOTE(review): assumes img_pil is a non-None RGB image — confirm
+    # Preprocessing
+    processed_img = preprocess_image(img)
+    # Config for Thai + English
+    custom_config = r'-l tha+eng --oem 3 --psm 6 -c language_model_ngram_space_delimited_language=1'
     # OCR
+    text = pytesseract.image_to_string(processed_img, config=custom_config)
+    return text
+# Gradio interface: one PIL image in, plain text out
+iface = gr.Interface(
+    fn=ocr_image,
     inputs=gr.Image(type="pil"),
+    outputs="text",
+    title="OCR ไทย + อังกฤษ (Preprocessed)",
+    description="อัปโหลดรูปเพื่ออ่านข้อความภาษาไทยและอังกฤษ พร้อมปรับภาพให้แม่นยำขึ้น"
 )
+iface.launch()  # NOTE(review): runs at import time; the removed version guarded launch() with __name__ == "__main__"