Spaces:

mohamed12ahmed
/

full_ocr

Sleeping

mohamed12ahmed committed on Sep 14, 2025

Commit

ee00213

verified ·

1 Parent(s): 816321e

Update ocr_processing.py

Files changed (1) hide show

ocr_processing.py CHANGED Viewed

@@ -1,7 +1,7 @@
 import cv2
 import numpy as np
 from PIL import Image
-import pytesseract
 # Skew Correction
 def deskew(image):
@@ -30,13 +30,15 @@ def correct_lighting(image):
     final = cv2.cvtColor(limg, cv2.COLOR_LAB2BGR)
     return final
-# OCR Extraction (Multi-language)
-def extract_text(image, langs="eng+ara"):  # pytesseract-based version (removed side of this diff); langs is forwarded as the lang argument
-    text = pytesseract.image_to_string(image, lang=langs)  # run OCR on the image with the requested language string
    return text
-# Full Pipeline
-def process_image(file, langs="eng+ara"):
     img = Image.open(file).convert('RGB')
     img_cv = np.array(img)
     img_cv = deskew(img_cv)

 import cv2
 import numpy as np
 from PIL import Image
+import easyocr
 # Skew Correction
 def deskew(image):
     final = cv2.cvtColor(limg, cv2.COLOR_LAB2BGR)
     return final
+# OCR Extraction using EasyOCR
+def extract_text(image, langs=['en']):  # langs is handed to easyocr.Reader; NOTE(review): mutable default list (not mutated here)
+    reader = easyocr.Reader(langs, gpu=False)  # set gpu=True if you have CUDA support; NOTE(review): a new Reader is built on every call - consider reusing one
+    results = reader.readtext(image, detail=0)  # presumably detail=0 yields plain text strings (they are joined below) - confirm against EasyOCR docs
+    text = "\n".join(results)  # one recognized entry per output line
    return text
+# Full pipeline
+def process_image(file, langs=['en']):
     img = Image.open(file).convert('RGB')
     img_cv = np.array(img)
     img_cv = deskew(img_cv)