Spaces:

YOUKKASS
/

manga01

Runtime error

App Files Files Community

YOUKKASS committed on Sep 10, 2025

Commit

b1ff060

verified ·

1 Parent(s): ea01e9d

Update modules/ocr.py

Browse files

Files changed (1) hide show

modules/ocr.py +75 -120

modules/ocr.py CHANGED Viewed

@@ -2,141 +2,96 @@ from paddleocr import PaddleOCR
 import cv2
 import numpy as np
 import os
-import uuid
# Cache of PaddleOCR engines keyed by language code, so each language is
# initialised at most once per process.
_OCR_ENGINES = {}


def _get_engine(lang='en'):
    """Return the PaddleOCR engine for ``lang``, building it on first use.

    Args:
        lang: Language code forwarded to ``PaddleOCR(lang=...)``.

    Returns:
        The engine stored in ``_OCR_ENGINES`` for ``lang``.

    Raises:
        Exception: Whatever ``PaddleOCR(...)`` raised; the failure is
            printed first and then re-raised unchanged.
    """
    if lang in _OCR_ENGINES:
        return _OCR_ENGINES[lang]

    # Lowered detection thresholds; ``rec_thresh`` is deliberately not
    # passed because the installed PaddleOCR does not accept it.
    settings = dict(
        use_angle_cls=True,
        lang=lang,
        show_log=False,
        det_db_thresh=0.3,
        det_db_box_thresh=0.3,
    )
    try:
        _OCR_ENGINES[lang] = PaddleOCR(**settings)
        print("✅ تم تهيئة محرك PaddleOCR بنجاح")
    except Exception as err:
        print(f"❌ فشل في تهيئة PaddleOCR: {err}")
        raise
    return _OCR_ENGINES[lang]
def preprocess_for_ocr(input_path, upscale=2):
    """Write enhanced variants of an image to temp files for OCR retries.

    The image is upscaled, converted to grayscale, contrast-boosted with
    CLAHE, denoised, blurred and Otsu-thresholded. Two variants are saved:
    the binarised image and its inverse (for light text on a dark
    background), each after a morphological close.

    Args:
        input_path: Path of the image to read with ``cv2.imread``.
        upscale: Scale factor applied to both dimensions before processing.

    Returns:
        A list of paths to the PNG files that were actually written. The
        list is empty when the image cannot be read. The caller is
        responsible for deleting the returned files.
    """
    import tempfile  # local import: not among the module-level imports

    img = cv2.imread(input_path)
    if img is None:
        return []

    # Upscale to make glyphs clearer. cv2.resize needs integer sizes, so a
    # fractional ``upscale`` is rounded rather than passed through as float.
    height, width = img.shape[:2]
    target_size = (
        max(1, int(round(width * upscale))),
        max(1, int(round(height * upscale))),
    )
    img_up = cv2.resize(img, target_size, interpolation=cv2.INTER_CUBIC)

    # Grayscale + contrast enhancement (CLAHE).
    gray = cv2.cvtColor(img_up, cv2.COLOR_BGR2GRAY)
    clahe = cv2.createCLAHE(clipLimit=3.0, tileGridSize=(8, 8))
    gray = clahe.apply(gray)

    # Light denoising.
    gray = cv2.fastNlMeansDenoising(
        gray, None, h=3, templateWindowSize=7, searchWindowSize=21
    )

    # Slight blur followed by Otsu binarisation.
    blur = cv2.GaussianBlur(gray, (3, 3), 0)
    _, th = cv2.threshold(blur, 0, 255, cv2.THRESH_BINARY + cv2.THRESH_OTSU)

    # Inverted copy, for white text on a dark background.
    inv = cv2.bitwise_not(th)

    # Morphological close to strengthen the strokes.
    kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (3, 3))
    th = cv2.morphologyEx(th, cv2.MORPH_CLOSE, kernel, iterations=1)
    inv = cv2.morphologyEx(inv, cv2.MORPH_CLOSE, kernel, iterations=1)

    # Save the variants under the platform temp directory instead of a
    # hard-coded "/tmp".
    tmp_dir = tempfile.gettempdir()
    out_paths = []
    for mat in (th, inv):
        temp_name = os.path.join(tmp_dir, f"ink_{uuid.uuid4().hex}.png")
        # Only report files that were written, so callers never receive a
        # path that does not exist.
        if cv2.imwrite(temp_name, mat):
            out_paths.append(temp_name)
    return out_paths
def _run_ocr(image_path, lang='en'):
    """Run OCR on one image and return ``(texts, boxes, scores)``.

    Args:
        image_path: Path handed to ``ocr.ocr(..., cls=True)``.
        lang: Language code used to pick the engine via ``_get_engine``.

    Returns:
        Three parallel lists: recognised strings, their boxes, and their
        scores as floats. All three are empty when nothing was recognised.
    """
    ocr = _get_engine(lang)
    result = ocr.ocr(image_path, cls=True)

    texts, boxes, scores = [], [], []

    # The first element holds the lines for the (single) input image. It is
    # guarded against None as well as an empty result, because iterating
    # None would raise TypeError.
    # NOTE(review): some PaddleOCR releases appear to return [None] when no
    # text is detected; confirm against the installed version.
    page = result[0] if result else None
    for line in page or []:
        if not line or len(line) < 2:
            continue
        try:
            box = line[0]
            text = line[1][0]
            raw_score = line[1][1]
        except (IndexError, KeyError, TypeError) as e:
            # Malformed entry: report it and keep the remaining lines.
            print(f"⚠️ خطأ في معالجة نتيجة OCR: {e}")
            continue

        # Convert instead of isinstance-checking so NumPy scalar scores are
        # kept rather than silently replaced by 0.0.
        try:
            score = float(raw_score)
        except (TypeError, ValueError):
            score = 0.0

        if text is not None and box is not None:
            texts.append(text)
            boxes.append(box)
            scores.append(score)
    return texts, boxes, scores
def extract_texts(image_path: str, ocr_lang: str = 'en', preprocess: bool = True, min_score: float = 0.35):
    """Extract text from an image, keeping the best of several OCR passes.

    OCR is first run on the original image. When ``preprocess`` is true it
    is run again on each enhanced variant from ``preprocess_for_ocr``. A
    variant replaces the current best when it yields more lines, or the
    same number of lines with a higher mean score.

    Args:
        image_path: Path of the image to read.
        ocr_lang: Language code passed to ``_run_ocr``.
        preprocess: Whether to also try the enhanced variants.
        min_score: Lines with a score below this value are discarded.

    Returns:
        ``(texts, boxes)``: two parallel lists for the winning pass.
    """

    def _confident(texts, boxes, scores):
        # Keep only the (text, box, score) triples that meet ``min_score``.
        return [
            (t, b, s) for t, b, s in zip(texts, boxes, scores) if s >= min_score
        ]

    # 1) Attempt on the original image.
    best = _confident(*_run_ocr(image_path, lang=ocr_lang))
    print(f"📊 النتائج الأصلية: {len(best)} نصوص")

    # 2) Attempts on the enhanced variants.
    if preprocess:
        variant_paths = preprocess_for_ocr(image_path)
        print(f"🔄 معالجة {len(variant_paths)} نسخة محسنة")
        try:
            for i, p in enumerate(variant_paths):
                candidate = _confident(*_run_ocr(p, lang=ocr_lang))
                if not candidate:
                    continue
                candidate_mean = np.mean([s for _, _, s in candidate])
                best_mean = np.mean([s for _, _, s in best]) if best else 0
                more_lines = len(candidate) > len(best)
                same_lines_better = (
                    len(candidate) == len(best) and candidate_mean > best_mean
                )
                if more_lines or same_lines_better:
                    best = candidate
                    print(f"✅ النسخة المحسنة {i+1}: وجدت {len(candidate)} نصوص بجودة أفضل")
        finally:
            # Remove every temp variant, including those not yet processed
            # when an OCR pass raised.
            for p in variant_paths:
                try:
                    os.remove(p)
                except OSError:
                    pass

    print(f"🎯 النتائج النهائية: {len(best)} نصوص")
    return [t for t, _, _ in best], [b for _, b, _ in best]

 import cv2
 import numpy as np
 import os
+import tempfile
# The OCR engine is initialised only once and then reused.
ocr_engine = None


def get_ocr_engine():
    """Return the shared PaddleOCR engine, creating it on the first call.

    Returns:
        The engine held in the module-level ``ocr_engine`` variable.

    Raises:
        Exception: Whatever ``PaddleOCR(...)`` raised; the failure is
            printed first and then re-raised unchanged.
    """
    global ocr_engine
    if ocr_engine is not None:
        return ocr_engine

    # Settings chosen for compatibility with PaddleOCR 2.7.0; ``rec_thresh``
    # is not supported by that release and is therefore not passed.
    settings = dict(
        use_angle_cls=True,
        lang='en',
        show_log=False,
        det_db_thresh=0.3,
        det_db_box_thresh=0.3,
        use_space_char=True,
    )
    try:
        ocr_engine = PaddleOCR(**settings)
        print("✅ تم تهيئة محرك PaddleOCR بنجاح (الإصدار 2.7.0)")
    except Exception as err:
        print(f"❌ فشل في تهيئة PaddleOCR: {err}")
        raise
    return ocr_engine
def preprocess_image(image_path):
    """Write a contrast-boosted grayscale copy of an image to a temp file.

    Args:
        image_path: Path of the image to read with ``cv2.imread``.

    Returns:
        The path of the temporary PNG on success; the caller must delete
        it. If the image cannot be read or any step fails, ``image_path``
        is returned unchanged and no temp file is left behind.
    """
    temp_path = None
    try:
        img = cv2.imread(image_path)
        if img is None:
            return image_path

        # Convert to grayscale, then apply a simple contrast/brightness boost.
        gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
        enhanced = cv2.convertScaleAbs(gray, alpha=1.3, beta=40)

        # mkstemp returns an open descriptor. Close it right away, since
        # cv2.imwrite reopens the file by path and the descriptor would
        # otherwise leak on every call.
        fd, temp_path = tempfile.mkstemp(suffix='.png')
        os.close(fd)

        # Treat a False return from imwrite as a failure, so an empty temp
        # file is never handed to the OCR step.
        if not cv2.imwrite(temp_path, enhanced):
            raise OSError(f"cv2.imwrite failed for {temp_path}")
        return temp_path
    except Exception as e:
        # Best effort: any failure falls back to the original image.
        print(f"⚠️ خطأ في معالجة الصورة: {e}")
        if temp_path is not None:
            try:
                os.remove(temp_path)
            except OSError:
                pass
        return image_path
def extract_texts(image_path: str, preprocess: bool = True, min_score: float = 0.3):
    """Extract text lines and their boxes from an image.

    Args:
        image_path: Path of the image to read.
        preprocess: When true, OCR runs on the copy produced by
            ``preprocess_image`` instead of the original file.
        min_score: Lines are kept only when their confidence is strictly
            greater than this value. The default matches the previously
            hard-coded cut-off.

    Returns:
        ``(texts, boxes)``: two parallel lists. Both are empty when nothing
        was recognised or when any step raised; errors are printed with a
        traceback and never propagated.
    """
    import traceback

    # Bound before the try so the cleanup in ``finally`` can always tell
    # whether a temp file was created.
    processed_path = image_path
    try:
        ocr = get_ocr_engine()

        # Optional preprocessing.
        if preprocess:
            processed_path = preprocess_image(image_path)

        result = ocr.ocr(processed_path, cls=True)

        texts = []
        boxes = []
        if result and result[0]:
            for line in result[0]:
                if not line or len(line) < 2:
                    continue
                text = line[1][0]
                confidence = line[1][1] if len(line[1]) > 1 else 0.5
                # Manually filter out low-confidence and blank lines.
                if confidence > min_score and text.strip():
                    texts.append(text)
                    boxes.append(line[0])
                    print(f"📝 تم استخراج: '{text}' (ثقة: {confidence:.2f})")

        print(f"✅ تم استخراج {len(texts)} نصاً من الصورة")
        return texts, boxes
    except Exception as e:
        print(f"❌ خطأ في استخراج النصوص: {e}")
        traceback.print_exc()
        return [], []
    finally:
        # Delete the temp copy on both the success and the error path.
        # The paths differ only when preprocessing created a new file.
        if processed_path != image_path:
            try:
                os.remove(processed_path)
            except OSError:
                pass