Spaces:

TungDuong
/

Scene_Text_Recognization

Runtime error

TungDuong committed on Feb 6, 2025

Commit

1bf80f3

verified ·

1 Parent(s): 06142a4

adding function to print text to screen

Files changed (1) hide show

app.py CHANGED Viewed

@@ -28,17 +28,33 @@ def pipeline(image):
     # Filter low conf boxes
     filter_predictions = []
     for bbox, cls, conf, text, encoded_text in predictions:
         if conf > 0.7:
             filter_predictions.append([bbox, cls, conf, text, encoded_text])
     image = visualize_image(image, filter_predictions)
-    return image
 demo = gr.Interface(
     fn=pipeline,
     inputs=gr.Image(type="pil", label="Input Image"),
-    outputs="image",
     title="Scene Text Recognization",
     description="Recognize text in scene images"
 )

     # Filter low conf boxes
     filter_predictions = []
+    dict_predictions = {}
+    num_textbox = 1
     for bbox, cls, conf, text, encoded_text in predictions:
         if conf > 0.7:
             filter_predictions.append([bbox, cls, conf, text, encoded_text])
+            xmin, ymin, xmax, ymax = bbox
+            xmin, ymin, xmax, ymax = int(xmin), int(ymin), int(xmax), int(ymax)
+            dict_predictions.update({
+                f"textbox {num_textbox}":{
+                    "bounding box": str([xmin, ymin, xmax, ymax]),
+                    "conf": np.round(conf, 2),
+                    "text": text
+                }
+            })
+            num_textbox += 1
     image = visualize_image(image, filter_predictions)
+    return image, json.dumps(dict_predictions, indent=5)
 demo = gr.Interface(
     fn=pipeline,
     inputs=gr.Image(type="pil", label="Input Image"),
+    outputs=[
+            gr.Image(type="pil", label="Output Image"),
+            gr.Textbox(type="text", label="Recognized Text")
+        ],
     title="Scene Text Recognization",
     description="Recognize text in scene images"
 )