Spaces:

nit454
/

EasyOCR_test

Sleeping

App Files Files Community

nit454 committed on Oct 28, 2025

Commit

80dce17

verified ·

1 Parent(s): 5b364e7

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -8

app.py CHANGED Viewed

@@ -4,11 +4,14 @@ import easyocr
 import numpy as np
 import pytesseract
-# Initialize EasyOCR model once
 easyocr_reader = easyocr.Reader(['en'])
 def get_metrics(model):
-    # Simulated fixed metrics for demo
     if model == "EasyOCR":
         return {"Accuracy": "95%", "Precision": "94%", "Pipeline": "Easy Integration (90%)"}
     elif model == "Tesseract":
@@ -19,7 +22,9 @@ def get_metrics(model):
 def ocr_all(img, ground_truth):
     if img is None:
         return "No image provided", "No image provided"
     img_array = np.array(img)
     try:
         easyocr_result = easyocr_reader.readtext(img_array, detail=0, paragraph=True)
         text_easy = "\n".join(easyocr_result)
@@ -33,19 +38,19 @@ def ocr_all(img, ground_truth):
         text_tess = f"Tesseract Error: {str(e)}"
     metrics_tess = get_metrics("Tesseract")
-    output_easy = f"**Output:**\n{text_easy}\n\n" + "\n".join([f"{k}: {v}" for k,v in metrics_easy.items()])
-    output_tess = f"**Output:**\n{text_tess}\n\n" + "\n".join([f"{k}: {v}" for k,v in metrics_tess.items()])
     return output_easy, output_tess
 with gr.Blocks() as demo:
-    gr.Markdown("# OCR Demo with EasyOCR and Tesseract")
     img_in = gr.Image(type="pil", label="Upload Screenshot")
-    txt_in = gr.Textbox(lines=4, label="Optional Ground Truth Text")
     btn = gr.Button("Run OCR")
     out_easy = gr.Markdown(label="EasyOCR Output")
     out_tess = gr.Markdown(label="Tesseract Output")
     btn.click(ocr_all, inputs=[img_in, txt_in], outputs=[out_easy, out_tess])
 demo.launch()

 import numpy as np
 import pytesseract
+# Initialize EasyOCR reader
 easyocr_reader = easyocr.Reader(['en'])
+# Explicitly set Tesseract command path for Hugging Face Spaces
+pytesseract.pytesseract.tesseract_cmd = '/usr/bin/tesseract'
 def get_metrics(model):
+    # Hardcoded metrics for demonstration
     if model == "EasyOCR":
         return {"Accuracy": "95%", "Precision": "94%", "Pipeline": "Easy Integration (90%)"}
     elif model == "Tesseract":
 def ocr_all(img, ground_truth):
     if img is None:
         return "No image provided", "No image provided"
     img_array = np.array(img)
     try:
         easyocr_result = easyocr_reader.readtext(img_array, detail=0, paragraph=True)
         text_easy = "\n".join(easyocr_result)
         text_tess = f"Tesseract Error: {str(e)}"
     metrics_tess = get_metrics("Tesseract")
+    output_easy = f"**Output:**\n{text_easy}\n\n" + "\n".join([f"{k}: {v}" for k, v in metrics_easy.items()])
+    output_tess = f"**Output:**\n{text_tess}\n\n" + "\n".join([f"{k}: {v}" for k, v in metrics_tess.items()])
     return output_easy, output_tess
 with gr.Blocks() as demo:
+    gr.Markdown("# OCR Demo on Hugging Face Spaces\nUpload an image and paste optional ground truth text.")
     img_in = gr.Image(type="pil", label="Upload Screenshot")
+    txt_in = gr.Textbox(lines=3, label="Paste Ground Truth Text")
     btn = gr.Button("Run OCR")
     out_easy = gr.Markdown(label="EasyOCR Output")
     out_tess = gr.Markdown(label="Tesseract Output")
     btn.click(ocr_all, inputs=[img_in, txt_in], outputs=[out_easy, out_tess])
 demo.launch()