Spaces:

pluniak
/

ocrd

Sleeping

App Files Files Community

pluniak committed on May 16, 2024

Commit

6470dc2

verified ·

1 Parent(s): 7bdb729

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -3

app.py CHANGED Viewed

@@ -3,7 +3,7 @@ from helpers import OCRD
-def run_ocrd_pipeline(img_path, status=gr.Progress(), binarize_mode='detailed', min_pixel_sum=30, median_bounds=(None, None), font_size=30):
     """
     Executes the OCRD pipeline on an image from file loading to text overlay creation. This function orchestrates
     the calling of various OCRD class methods to process the image, extract and recognize text, and then overlay
@@ -11,12 +11,12 @@ def run_ocrd_pipeline(img_path, status=gr.Progress(), binarize_mode='detailed',
     Parameters:
         img_path (str): Path to the image file.
         binarize_mode (str): Mode to be used for image binarization. Can be 'detailed', 'fast', or 'no'.
         min_pixel_sum (int, optional): Minimum sum of pixels to consider a text line segmentation for extraction.
             If 'default', default values are applied.
         median_bounds (tuple, optional): Bounds to filter text line segmentations based on size relative to the median.
             If 'default', default values are applied.
-        font_size (int, optional): Font size to be used in text overlay. If 'default', a default size or scaling logic is applied.
     Returns:
         Image: An image with overlay text, where text is extracted and recognized from the original image.
@@ -29,6 +29,16 @@ def run_ocrd_pipeline(img_path, status=gr.Progress(), binarize_mode='detailed',
     - Creating an image overlay with recognized text.
     """
     # prepare kwargs
     efadt_kwargs = {}
     if min_pixel_sum != 'default':
@@ -41,7 +51,6 @@ def run_ocrd_pipeline(img_path, status=gr.Progress(), binarize_mode='detailed',
         ctoi_kwargs['font_size'] = font_size
     # run pipeline
-    #status(0, desc="\nReading image...\n")
     ocrd = OCRD(img_path)
     status(0, desc='\nStep 1/5: Binarizing image...\n')
     binarized = ocrd.binarize_image(ocrd.image, binarize_mode)

+def run_ocrd_pipeline(img_path, font_size=30, binarize_mode='detailed', min_pixel_sum=30, median_bounds=(None, None), status=gr.Progress()):
     """
     Executes the OCRD pipeline on an image from file loading to text overlay creation. This function orchestrates
     the calling of various OCRD class methods to process the image, extract and recognize text, and then overlay
     Parameters:
         img_path (str): Path to the image file.
+        font_size (int, optional): Font size to be used in text overlay. If 'default', a default size or scaling logic is applied.
         binarize_mode (str): Mode to be used for image binarization. Can be 'detailed', 'fast', or 'no'.
         min_pixel_sum (int, optional): Minimum sum of pixels to consider a text line segmentation for extraction.
             If 'default', default values are applied.
         median_bounds (tuple, optional): Bounds to filter text line segmentations based on size relative to the median.
             If 'default', default values are applied.
     Returns:
         Image: An image with overlay text, where text is extracted and recognized from the original image.
     - Creating an image overlay with recognized text.
     """
+    # convert gradio app dropdown options
+    if font_size == 'small':
+        font_size = 30
+    if font_size == 'medium':
+        font_size = 50
+    if font_size == 'large':
+        font_size = 70
+    elif font_size == 'adjusted':
+        font_size = -1
     # prepare kwargs
     efadt_kwargs = {}
     if min_pixel_sum != 'default':
         ctoi_kwargs['font_size'] = font_size
     # run pipeline
     ocrd = OCRD(img_path)
     status(0, desc='\nStep 1/5: Binarizing image...\n')
     binarized = ocrd.binarize_image(ocrd.image, binarize_mode)