Spaces:

gabai-capstone
/

GabAI

Sleeping

Arjooohn committed on Mar 15

Commit

b1b53ca

verified ·

1 Parent(s): 8efeaf2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,21 +6,37 @@ from PIL import Image
 from gtts import gTTS
 import os
 def preprocess(image):
     """
-    Preprocess the image for OCR:
     - Convert to grayscale
-    - Apply Gaussian blur
-    - Apply Otsu threshold
     """
     img = np.array(image)
     gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
-    blur = cv2.GaussianBlur(gray, (5, 5), 0)
-    thresh = cv2.threshold(
-        blur, 0, 255,
-        cv2.THRESH_BINARY + cv2.THRESH_OTSU
-    )[1]
     return thresh
 def extract_and_speak(image):
     """

 from gtts import gTTS
 import os
+# --- Image preprocessing for OCR (replaces the earlier blur + Otsu version) ---
 def preprocess(image):
     """
+    Preprocess the image for better OCR results:
     - Convert to grayscale
+    - Sharpen edges
+    - Denoise
+    - Adaptive thresholding for better contrast
+
+    `image` is converted with ``np.array``; the return value is the output
+    of ``cv2.adaptiveThreshold`` called with maxValue=255 and THRESH_BINARY.
     """
     img = np.array(image)
+    # Convert to grayscale
+    # NOTE(review): COLOR_BGR2GRAY assumes BGR channel order. If `image` is a
+    # PIL image (the file imports PIL), its array is presumably RGB, so
+    # COLOR_RGB2GRAY may be what is intended -- confirm against the caller.
     gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+    # Sharpen image with a 3x3 kernel: centre weight 5, the four direct
+    # neighbours -1 (weights sum to 1). ddepth=-1 keeps the source depth.
+    kernel = np.array([[0,-1,0], [-1,5,-1], [0,-1,0]])
+    gray = cv2.filter2D(gray, -1, kernel)
+    # Denoise (positional args: dst=None, h=30, templateWindowSize=7,
+    # searchWindowSize=21)
+    gray = cv2.fastNlMeansDenoising(gray, None, 30, 7, 21)
+    # Adaptive threshold: Gaussian-weighted neighbourhood, blockSize=31, C=10
+    thresh = cv2.adaptiveThreshold(
+        gray, 255,
+        cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
+        cv2.THRESH_BINARY,
+        31, 10
+    )
     return thresh
+# --- End of preprocess function ---
 def extract_and_speak(image):
     """