Spaces:

mohammad2928git
/

OCR_V1

Build error

App Files Files Community

mohammad2928git commited on May 17, 2025

Commit

3599d1b

verified ·

1 Parent(s): ed67370

Create app.py

Browse files

Files changed (1) hide show

app.py +153 -0

app.py ADDED Viewed

	@@ -0,0 +1,153 @@

+import gradio as gr
+import tensorflow as tf
+import keras_ocr
+import requests
+import cv2
+import os
+import csv
+import numpy as np
+import pandas as pd
+import huggingface_hub
+from huggingface_hub import Repository
+from datetime import datetime
+import scipy.ndimage.interpolation as inter
+import easyocr
+import datasets
+from datasets import load_dataset, Image
+from PIL import Image
+from paddleocr import PaddleOCR
+from save_data import flag
+import pytesseract
+from pdf2image import convert_from_path
+from PIL import Image
+import os
+# Function to perform OCR
+def ocr(input_file, lang='fas'):  # 'fas': Persian language (Farsi)
+    extracted_text = ""
+    # Check if the input file is a PDF or an image
+    if isinstance(input_file, str) and input_file.endswith('.pdf'):  # Check if the file is a PDF
+        # Convert PDF to images
+        images = convert_from_path(input_file)
+        # Loop through each image and perform OCR
+        for page_number, image in enumerate(images):
+            text = pytesseract.image_to_string(image, lang=lang)
+            extracted_text += text
+    elif isinstance(input_file, Image.Image):  # If the input is an image
+        text = pytesseract.image_to_string(input_file, lang=lang)
+        extracted_text = text
+    return extracted_text
+"""
+Paddle OCR
+"""
+def ocr_with_paddle(img):
+    finaltext = ''
+    ocr = PaddleOCR(lang='en', use_angle_cls=True)
+    # img_path = 'exp.jpeg'
+    result = ocr.ocr(img)
+    for i in range(len(result[0])):
+        text = result[0][i][1][0]
+        finaltext += ' '+ text
+    return finaltext
+"""
+Keras OCR
+"""
+def ocr_with_keras(img):
+    output_text = ''
+    pipeline=keras_ocr.pipeline.Pipeline()
+    images=[keras_ocr.tools.read(img)]
+    predictions=pipeline.recognize(images)
+    first=predictions[0]
+    for text,box in first:
+        output_text += ' '+ text
+    return output_text
+"""
+easy OCR
+"""
+# gray scale image
+def get_grayscale(image):
+    return cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
+# Thresholding or Binarization
+def thresholding(src):
+    return cv2.threshold(src,127,255, cv2.THRESH_TOZERO)[1]
+def ocr_with_easy(img):
+    gray_scale_image=get_grayscale(img)
+    thresholding(gray_scale_image)
+    cv2.imwrite('image.png',gray_scale_image)
+    reader = easyocr.Reader(['th','en'])
+    bounds = reader.readtext('image.png',paragraph="False",detail = 0)
+    bounds = ''.join(bounds)
+    return bounds
+"""
+Generate OCR
+"""
+def process(input_type, file, lang):
+    if input_type == "PDF":
+        extracted_text = ocr(file.name, lang)
+    else:
+        image = Image.open(file.name)
+        extracted_text = ocr(image, lang)
+    return extracted_text
+def generate_ocr(Method,img):
+    text_output = ''
+    if (img).any():
+        add_csv = []
+        image_id = 1
+        print("Method___________________",Method)
+        if Method == 'EasyOCR':
+            text_output = ocr_with_easy(img)
+        if Method == 'KerasOCR':
+            text_output = ocr_with_keras(img)
+        if Method == 'PaddleOCR':
+            text_output = ocr_with_paddle(img)
+        if Method == 'tesseract':
+            text_output = process("img", img, "fas")
+        try:
+            flag(Method,text_output,img)
+        except Exception as e:
+            print(e)
+        return text_output
+    else:
+        raise gr.Error("Please upload an image!!!!")
+"""
+Create user interface for OCR demo
+"""
+# image = gr.Image(shape=(300, 300))
+image = gr.Image()
+method = gr.Radio(["PaddleOCR","EasyOCR", "KerasOCR", "tesseract"],value="PaddleOCR")
+output = gr.Textbox(label="Output")
+demo = gr.Interface(
+    generate_ocr,
+    [method, image],
+    output,
+    title="Optical Character Recognition",
+    css=".gradio-container {background-color: lightgray} #radio_div {background-color: #FFD8B4; font-size: 40px;}",
+    article = """<p style='text-align: center;'>Feel free to give us your thoughts on this demo and please contact us at
+                    <a href="mailto:letstalk@pragnakalp.com" target="_blank">letstalk@pragnakalp.com</a>
+                    <p style='text-align: center;'>Developed by: <a href="https://www.pragnakalp.com" target="_blank">Pragnakalp Techlabs</a></p>"""
+)
+# demo.launch(enable_queue = False)
+demo.launch()