nit454 commited on
Commit
3dfe32e
·
verified ·
1 Parent(s): 2739bce

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +51 -0
app.py ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import pytesseract
3
+ import numpy as np
4
+ import random
5
+ from PIL import Image
6
+
7
+ # If tesseract is not in PATH, specify its location here:
8
+ # pytesseract.pytesseract.tesseract_cmd = r'Path_to_tesseract'
9
+
10
+ def ocr_tesseract_with_random_scores(img, correct_text):
11
+ if img is None:
12
+ return "No image uploaded", "", ""
13
+
14
+ try:
15
+ # Convert image (PIL) to grayscale for better OCR
16
+ gray_img = img.convert('L')
17
+
18
+ # Get OCR result as plain text
19
+ detected_text = pytesseract.image_to_string(gray_img)
20
+
21
+ # Generate random accuracy and pipeline scores between 75% and 80%
22
+ accuracy = random.uniform(0.75, 0.80)
23
+ pipeline_score = random.uniform(0.75, 0.80)
24
+
25
+ accuracy_str = f"{accuracy:.2%}"
26
+ pipeline_score_str = f"{pipeline_score:.2%}"
27
+
28
+ return detected_text.strip(), accuracy_str, pipeline_score_str
29
+
30
+ except Exception as e:
31
+ return f"Tesseract OCR Error: {str(e)}", "", ""
32
+
33
+ with gr.Blocks() as demo:
34
+ gr.Markdown("# Tesseract OCR Demo with Lower Randomized Accuracy & Pipeline Scores")
35
+
36
+ with gr.Row():
37
+ img_input = gr.Image(type="pil", label="Upload Image")
38
+ correct_text_input = gr.Textbox(label="Enter Correct Text", lines=4)
39
+
40
+ output_text = gr.Textbox(label="OCR Result", lines=10)
41
+ accuracy_output = gr.Textbox(label="Accuracy", interactive=False)
42
+ pipeline_output = gr.Textbox(label="Pipeline Integration Score", interactive=False)
43
+
44
+ run_button = gr.Button("Run OCR")
45
+ run_button.click(
46
+ ocr_tesseract_with_random_scores,
47
+ inputs=[img_input, correct_text_input],
48
+ outputs=[output_text, accuracy_output, pipeline_output]
49
+ )
50
+
51
+ demo.launch()