Spaces:

mrrtmob
/

kiri-ocr

Running

mrrtmob committed on Jan 24

Commit

f948409

verified ·

1 Parent(s): b112477

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,11 +2,13 @@ import gradio as gr
 from kiri_ocr import OCR
 from PIL import Image, ImageDraw
 import numpy as np
 # Initialize OCR
 try:
     print("Loading Kiri OCR model...")
-    ocr = OCR()
     print("Model loaded successfully")
 except Exception as e:
     print(f"Error loading model: {e}")
@@ -20,8 +22,11 @@ def process_image(image_path):
         return None, "Please upload an image."
     try:
         # extract_text returns (text, results)
-        text, results = ocr.extract_text(image_path)
         # Open image for drawing
         img = Image.open(image_path)
@@ -34,11 +39,15 @@ def process_image(image_path):
         for item in results:
             if 'box' in item:
                 x, y, w, h = item['box']
                 draw.rectangle([x, y, x + w, y + h], outline="red", width=3)
         return np.array(img), text
     except Exception as e:
         return None, f"Error during extraction: {str(e)}"
 # Build the interface
@@ -51,8 +60,8 @@ demo = gr.Interface(
     ],
     title="Kiri OCR Demo",
     description="Upload an image to extract English and Khmer text. Detected regions are highlighted in red.",
-    examples=[["images/demo1.png"]]
 )
 if __name__ == "__main__":
-    demo.launch()

 from kiri_ocr import OCR
 from PIL import Image, ImageDraw
 import numpy as np
+import os
 # Initialize OCR
 try:
     print("Loading Kiri OCR model...")
+    # Use verbose=True to see what's happening
+    ocr = OCR(verbose=True)
     print("Model loaded successfully")
 except Exception as e:
     print(f"Error loading model: {e}")
         return None, "Please upload an image."
     try:
+        print(f"Processing image: {image_path}")
         # extract_text returns (text, results)
+        text, results = ocr.extract_text(image_path, verbose=True)
+        print(f"Extracted {len(results)} regions.")
         # Open image for drawing
         img = Image.open(image_path)
         for item in results:
             if 'box' in item:
                 x, y, w, h = item['box']
+                # Ensure coordinates are ints
+                x, y, w, h = int(x), int(y), int(w), int(h)
                 draw.rectangle([x, y, x + w, y + h], outline="red", width=3)
         return np.array(img), text
     except Exception as e:
+        import traceback
+        traceback.print_exc()
         return None, f"Error during extraction: {str(e)}"
 # Build the interface
     ],
     title="Kiri OCR Demo",
     description="Upload an image to extract English and Khmer text. Detected regions are highlighted in red.",
+    examples=[]
 )
 if __name__ == "__main__":
+    demo.launch(server_name="0.0.0.0", server_port=7860, share=False)