Spaces:

shayansjm
/

ocr2

Sleeping

App Files Files Community

shayansjm committed on Jan 7

Commit

1210071

verified ·

1 Parent(s): 26fdeb9

Update app.py

Browse files

Files changed (1) hide show

app.py +34 -41

app.py CHANGED Viewed

@@ -1,74 +1,67 @@
 import gradio as gr
 from paddleocr import PaddleOCR
-from PIL import Image, ImageOps, ImageEnhance
 import numpy as np
-# 1. Clean Initialization for 2026 (PaddleOCR 3.0+)
 try:
     ocr = PaddleOCR(
         lang='en',
-        ocr_version='PP-OCRv4', # Stable & accurate for handwriting
-        use_angle_cls=True
     )
 except Exception as e:
-    print(f"Initialization Error: {e}")
-def process_bank_form(image):
     if image is None:
         return "Please upload an image."
     try:
-        # 2. ENHANCE HANDWRITING (Pre-processing)
-        # We sharpen and increase contrast to help the AI see light pen marks
         img = image.convert("RGB")
-        img = ImageOps.exif_transpose(img) # Fix auto-rotation from phones
-        enhancer = ImageEnhance.Contrast(img)
-        img = enhancer.enhance(1.5) # Boost contrast by 50%
         img_array = np.array(img)
-        # 3. RUN OCR
         result = ocr.ocr(img_array)
-        # 4. SAFE PARSING (Fixes 'string index out of range')
-        if not result or result[0] is None:
-            return "No text detected. Try a closer photo or darker ink."
         extracted_text = []
         for line in result[0]:
-            # Each 'line' is [[box_coords], [text, confidence]]
-            # We must verify the text content exists before accessing it
-            if len(line) > 1 and len(line[1]) > 0:
-                text_str = str(line[1][0]).strip()
-                confidence = float(line[1][1])
-                # If the string is empty, skip it to avoid the index error
-                if text_str and confidence > 0.30:
-                    extracted_text.append(text_str)
         if not extracted_text:
-            return "AI found text boxes but couldn't read the words. Try more light."
         return "\n".join(extracted_text)
     except Exception as e:
-        return f"Processing Error: {str(e)}\nTip: If the error persists, try a smaller/cropped image."
-# 5. UI Setup
-with gr.Blocks(theme=gr.themes.Soft()) as demo:
-    gr.Markdown("# 🏦 English Bank Form Reader (Stable v3.0)")
-    gr.Markdown("Optimized for handwriting and noisy document scans.")
-    with gr.Row():
-        with gr.Column():
-            input_img = gr.Image(type="pil", label="Bank Form Photo")
-            submit_btn = gr.Button("Extract All Text", variant="primary")
-        with gr.Column():
-            #output_text = gr.Textbox(label="Extracted Content", lines=20, show_copy_button=True)
-            output_text = gr.Textbox(label="Result", lines=20)
-    submit_btn.click(fn=process_bank_form, inputs=input_img, outputs=output_text)
 if __name__ == "__main__":
-    # max_threads=1 prevents memory overlap on free CPU tiers
     demo.launch(max_threads=1)

 import gradio as gr
 from paddleocr import PaddleOCR
+from PIL import Image, ImageOps
 import numpy as np
+# Initializing with explicit CPU settings for Hugging Face
 try:
     ocr = PaddleOCR(
         lang='en',
+        ocr_version='PP-OCRv4',
+        use_angle_cls=True,
+        use_gpu=False  # Force CPU to prevent memory-related runtime errors
     )
 except Exception as e:
+    print(f"Startup error: {e}")
+def safe_ocr_process(image):
     if image is None:
         return "Please upload an image."
     try:
+        # 1. Correct image orientation (common phone photo fix)
         img = image.convert("RGB")
+        img = ImageOps.exif_transpose(img)
         img_array = np.array(img)
+        # 2. Run OCR
         result = ocr.ocr(img_array)
+        # 3. Defensive Parsing (The Fix for 'Index Out of Range')
+        if not result or not isinstance(result, list) or result[0] is None:
+            return "No text detected. Try a closer, clearer photo."
         extracted_text = []
+        # PaddleOCR result is a list of lists: result[0] contains the lines
         for line in result[0]:
+            # Each 'line' is [[box], [text, confidence]]
+            # We check that 'line' has at least two elements and that the text part is valid
+            if isinstance(line, list) and len(line) >= 2:
+                text_data = line[1] # This is [text_string, confidence_score]
+                if isinstance(text_data, (list, tuple)) and len(text_data) >= 1:
+                    raw_string = text_data[0]
+                    confidence = text_data[1]
+                    # Ensure it's a non-empty string and confidence is okay
+                    if raw_string and isinstance(raw_string, str) and confidence > 0.3:
+                        extracted_text.append(raw_string.strip())
         if not extracted_text:
+            return "Detection found boxes, but couldn't read the words. Try more light."
         return "\n".join(extracted_text)
     except Exception as e:
+        return f"Final Stability Error: {str(e)}\nTip: This usually happens if the image is too large for the CPU. Try cropping the form."
+# Simple, reliable UI
+demo = gr.Interface(
+    fn=safe_ocr_process,
+    inputs=gr.Image(type="pil", label="Bank Form Image"),
+    outputs=gr.Textbox(label="Extracted Text", lines=20),
+    title="🏦 Stable Bank OCR"
+)
 if __name__ == "__main__":
     demo.launch(max_threads=1)