first version
Browse files
app.py
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import gradio as gr
|
| 2 |
+
import paddle
|
| 3 |
+
from paddleocr import PaddleOCR, draw_ocr
|
| 4 |
+
import cv2
|
| 5 |
+
from PIL import Image
|
| 6 |
+
import numpy as np
|
| 7 |
+
|
| 8 |
+
# Initialize PaddleOCR for Arabic
|
| 9 |
+
ocr = PaddleOCR(use_angle_cls=True, lang='ar')
|
| 10 |
+
|
| 11 |
+
def ocr_extract_text(image, font_path="path/to/arabic/font.ttf"):
    """Run Arabic OCR on *image* and return the text plus an annotated image.

    Args:
        image: The uploaded image (a PIL.Image, per ``gr.Image(type="pil")``).
        font_path: TrueType font used by ``draw_ocr`` to render the recognized
            Arabic text. NOTE(review): the default is a placeholder path — point
            it at a real Arabic-capable ``.ttf`` before deploying.

    Returns:
        tuple: ``(text, annotated_image)`` — the newline-joined recognized
        text and a PIL image with boxes and text drawn on it.
    """
    # PaddleOCR and draw_ocr expect a numpy array (or file path), not a
    # PIL image — convert once up front.
    img_array = np.array(image)

    result = ocr.ocr(img_array, cls=True)

    # PaddleOCR returns [None] when nothing is detected; the original code
    # would raise TypeError iterating it. Return the untouched image instead.
    if not result or result[0] is None:
        return "", image

    # Each detected line is [box, (text, score)] — unpack all three fields
    # in one pass instead of re-scanning result[0] per field.
    boxes = [line[0] for line in result[0]]   # bounding-box coordinates
    texts = [line[1][0] for line in result[0]]  # recognized text
    scores = [line[1][1] for line in result[0]]  # confidence scores

    annotated = draw_ocr(img_array, boxes, texts, scores, font_path=font_path)

    # draw_ocr returns an ndarray; convert back to PIL for Gradio display.
    annotated_image = Image.fromarray(np.uint8(annotated))

    return "\n".join(texts), annotated_image
|
| 35 |
+
|
| 36 |
+
# Define Gradio interface with the button to trigger OCR
|
| 37 |
+
def start_ocr(image):
    """Gradio callback: run OCR extraction on the uploaded image.

    Thin wrapper around :func:`ocr_extract_text`, invoked when the user
    submits an image through the interface.
    """
    extracted_text, annotated_image = ocr_extract_text(image)
    return extracted_text, annotated_image
|
| 40 |
+
|
| 41 |
+
# Wire up the Gradio app: one image input, two outputs (text + annotated image).
iface = gr.Interface(
    fn=start_ocr,  # callback that performs the OCR extraction
    inputs=gr.Image(type="pil"),
    outputs=[
        gr.Textbox(label="Extracted Text"),
        gr.Image(label="Annotated Image"),
    ],
    live=False,  # run only on submit, not on every input change
    title="Arabic OCR Extractor",
    description="Upload an Arabic document or image, and click 'Start Extracting Text' to extract the text using OCR.",
    # NOTE(review): `allow_flagging` is deprecated in newer Gradio releases
    # (renamed `flagging_mode`) — confirm against the pinned Gradio version.
    allow_flagging="never",
)

if __name__ == "__main__":
    # Enable queueing and debug mode for easier local troubleshooting.
    iface.queue().launch(debug=True)
|