Spaces:

gabai-capstone
/

GabAI

Sleeping

Arjooohn committed about 1 month ago

Commit

6516b6c

verified ·

1 Parent(s): 3b3a60d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,10 +2,11 @@ import gradio as gr
 import pytesseract
 import cv2
 import numpy as np
 from gtts import gTTS
 def preprocess(image):
-    # Convert to grayscale, blur, threshold; no flipping
     img = np.array(image)
     gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
     blur = cv2.GaussianBlur(gray, (5,5), 0)
@@ -17,6 +18,7 @@ def preprocess(image):
 def extract_and_speak(image):
     processed = preprocess(image)
     text = pytesseract.image_to_string(processed, lang="eng")
     if text.strip() == "":
@@ -29,13 +31,13 @@ def extract_and_speak(image):
 interface = gr.Interface(
     fn=extract_and_speak,
-    inputs=gr.Image(type="pil", sources=["webcam"]),  # Webcam preview mirrored by default
     outputs=[
         gr.Textbox(label="Extracted Text"),
         gr.Audio(label="Text-to-Speech Output")
     ],
     title="GabAI - AI Assistive Reading System",
-    description="Use your webcam to capture printed text. Preview is mirrored, but captured image is normal for OCR."
 )
 interface.launch()

 import pytesseract
 import cv2
 import numpy as np
+from PIL import Image
 from gtts import gTTS
+import os
 def preprocess(image):
     img = np.array(image)
     gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
     blur = cv2.GaussianBlur(gray, (5,5), 0)
 def extract_and_speak(image):
     processed = preprocess(image)
     text = pytesseract.image_to_string(processed, lang="eng")
     if text.strip() == "":
 interface = gr.Interface(
     fn=extract_and_speak,
+    inputs=gr.Image(type="pil", source="webcam", tool=None),  # Only webcam, no upload/paste
     outputs=[
         gr.Textbox(label="Extracted Text"),
         gr.Audio(label="Text-to-Speech Output")
     ],
     title="GabAI - AI Assistive Reading System",
+    description="Use your webcam to capture printed text. The system extracts the text and converts it into speech."
 )
 interface.launch()