Spaces:

gopichandra
/

Duplicate

Runtime error

App Files Files Community

gopichandra committed on Jan 25, 2025

Commit

319a527

verified ·

1 Parent(s): ae6ccdc

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -27

app.py CHANGED Viewed

@@ -2,34 +2,20 @@ import gradio as gr
 from paddleocr import PaddleOCR
 from PIL import Image, ImageOps
 import numpy as np
-import cv2
-import io
 # Initialize PaddleOCR
 ocr = PaddleOCR(use_angle_cls=True, lang='en')
-# Function to extract an image from video and process it
-def process_video_frame(video_data, camera_type="rear"):
-    if video_data is None:
-        return "No video feed provided."
-    # Decode video bytes
-    video_stream = io.BytesIO(video_data)
-    video_stream.seek(0)
-    video_array = np.frombuffer(video_stream.read(), np.uint8)
-    video_frame = cv2.imdecode(video_array, cv2.IMREAD_COLOR)
-    if video_frame is None:
-        return "Failed to decode video feed."
-    # Convert frame to PIL Image
-    image = Image.fromarray(cv2.cvtColor(video_frame, cv2.COLOR_BGR2RGB))
-    # Flip the image horizontally for rear camera
     if camera_type == "rear":
         image = ImageOps.mirror(image)
-    # Perform OCR
     result = ocr.ocr(np.array(image))
     extracted_text = []
     for line in result[0]:
@@ -41,9 +27,9 @@ def create_app():
     with gr.Blocks() as app:
         gr.Markdown("## OCR Processor with Rear Camera Fix")
-        # Inputs for video feed and camera type
         with gr.Row():
-            video_input = gr.Video(label="Capture Video Feed")
             camera_type = gr.Dropdown(
                 choices=["rear", "front"],
                 value="rear",
@@ -53,11 +39,11 @@ def create_app():
         # Output for extracted text
         extracted_text = gr.Textbox(label="Extracted Text")
-        # Button to process the video feed
-        process_button = gr.Button("Process Frame for OCR")
         process_button.click(
-            fn=process_video_frame,
-            inputs=[video_input, camera_type],
             outputs=extracted_text
         )

 from paddleocr import PaddleOCR
 from PIL import Image, ImageOps
 import numpy as np
 # Initialize PaddleOCR
 ocr = PaddleOCR(use_angle_cls=True, lang='en')
+# Function to process captured images
+def process_image(image, camera_type="rear"):
+    if image is None:
+        return "No image captured."
+    # Flip the image horizontally for the rear camera
     if camera_type == "rear":
         image = ImageOps.mirror(image)
+    # Perform OCR on the corrected image
     result = ocr.ocr(np.array(image))
     extracted_text = []
     for line in result[0]:
     with gr.Blocks() as app:
         gr.Markdown("## OCR Processor with Rear Camera Fix")
+        # Inputs for image capture and camera type selection
         with gr.Row():
+            image_input = gr.Image(type="pil", label="Capture Image")  # For image capture
             camera_type = gr.Dropdown(
                 choices=["rear", "front"],
                 value="rear",
         # Output for extracted text
         extracted_text = gr.Textbox(label="Extracted Text")
+        # Button to process the captured image
+        process_button = gr.Button("Process Image")
         process_button.click(
+            fn=process_image,
+            inputs=[image_input, camera_type],
             outputs=extracted_text
         )