Spaces:

RWTHMaterials
/

DP800_DamageClassification

Sleeping

App Files Files Community

kerzel committed on Jun 26, 2025

Commit

7b779c6

1 Parent(s): e360db8

try to fix utils.py with all the gradio fixes

Browse files

Files changed (1) hide show

utils.py +86 -35

utils.py CHANGED Viewed

@@ -1,5 +1,5 @@
 """
-Collection of various utils
 """
 import numpy as np
@@ -12,16 +12,15 @@ Image.MAX_IMAGE_PIXELS = 933120000
 import matplotlib.pyplot as plt
 import matplotlib.patches as patches
 from matplotlib.lines import Line2D
 import math
 ###
-### load SEM images
-###
 def load_image(filename : str) -> np.ndarray :
-    """Load an SEM image
     Args:
         filename (str): full path and name of the image file to be loaded
@@ -34,38 +33,66 @@ def load_image(filename : str) -> np.ndarray :
     return image
 ###
 ### show SEM image with boxes in various colours around each damage site
 ###
 def show_boxes(image : np.ndarray, damage_sites : dict, box_size = [250,250],
                save_image = False, image_path : str = None) :
-    """_summary_
     Args:
-        image (np.ndarray): SEM image to be shown
-        damage_sites (dict): python dictionary using the coordinates as key (x,y), and the label as value
-        box_size (list, optional): size of the rectangle drawn around each centroid. Defaults to [250,250].
-        save_image (bool, optional): save the image with the boxes or not. Defaults to False.
-        image_path (str, optional) : Full path and name of the output file to be saved
     """
     _, ax = plt.subplots(1)
-    ax.imshow(image, cmap='gray')  # show image on correct axis
     ax.set_xticks([])
     ax.set_yticks([])
     for key, label in damage_sites.items():
-        position = [key[0], key[1]]
         edgecolor = {
             'Inclusion': 'b',
             'Interface': 'g',
             'Martensite': 'r',
             'Notch': 'y',
-            'Shadowing': 'm'
         }.get(label, 'k')  # default: black
-        rect = patches.Rectangle((position[1] - box_size[1] / 2., position[0] - box_size[0] / 2),
                                  box_size[1], box_size[0],
                                  linewidth=1, edgecolor=edgecolor, facecolor='none')
         ax.add_patch(rect)
@@ -95,13 +122,13 @@ def show_boxes(image : np.ndarray, damage_sites : dict, box_size = [250,250],
     plt.close(fig)
-    return data
 ###
 ### cut out small images from panorama, append colour information
 ###
-def prepare_classifier_input(panorama: np.ndarray, centroids: list, window_size=[250, 250]) -> list:
     """
     Extracts square image patches centered at each given centroid from a grayscale panoramic SEM image.
@@ -110,8 +137,9 @@ def prepare_classifier_input(panorama: np.ndarray, centroids: list, window_size=
     Parameters
     ----------
-    panorama : np.ndarray
-        Input SEM image. Should be a 2D array (H, W) or a 3D array (H, W, 1) representing grayscale data.
     centroids : list of [int, int]
         List of (y, x) coordinates marking the centers of regions of interest. These are typically damage sites
@@ -126,14 +154,44 @@ def prepare_classifier_input(panorama: np.ndarray, centroids: list, window_size=
         List of extracted and normalized 3-channel image patches, each with shape (height, width, 3). Only
         centroids that allow full window extraction within image bounds are used.
     """
-    if panorama.ndim == 2:
-        panorama = np.expand_dims(panorama, axis=-1)  # (H, W, 1)
-    H, W, _ = panorama.shape
     win_h, win_w = window_size
     images = []
     for (cy, cx) in centroids:
         x1 = int(cx - win_w / 2)
         y1 = int(cy - win_h / 2)
         x2 = x1 + win_w
@@ -141,11 +199,12 @@ def prepare_classifier_input(panorama: np.ndarray, centroids: list, window_size=
         # Skip if patch would go out of bounds
         if x1 < 0 or y1 < 0 or x2 > W or y2 > H:
             continue
         # Extract and normalize patch
-        patch = panorama[y1:y2, x1:x2, 0].astype(np.float32)
-        patch = patch * 2. / 255. - 1.
         # Replicate grayscale channel to simulate RGB
         patch_color = np.repeat(patch[:, :, np.newaxis], 3, axis=2)
@@ -153,11 +212,3 @@ def prepare_classifier_input(panorama: np.ndarray, centroids: list, window_size=
     return images

 """
+Collection of various utils
 """
 import numpy as np
 import matplotlib.pyplot as plt
 import matplotlib.patches as patches
 from matplotlib.lines import Line2D
+import logging # ADDED for logging
 import math
 ###
+### load SEM images (Note: Not directly used with Gradio gr.Image(type="pil"))
+###
 def load_image(filename : str) -> np.ndarray :
+    """Load an SEM image
     Args:
         filename (str): full path and name of the image file to be loaded
     return image
 ###
 ### show SEM image with boxes in various colours around each damage site
 ###
 def show_boxes(image : np.ndarray, damage_sites : dict, box_size = [250,250],
                save_image = False, image_path : str = None) :
+    """
+    Shows an SEM image with colored boxes around identified damage sites.
     Args:
+        image (np.ndarray): SEM image to be shown.
+        damage_sites (dict): Python dictionary using the centroid coordinates as key (y, x), i.e. (row, column), and the label as value.
+        box_size (list, optional): Size of the rectangle drawn around each centroid. Defaults to [250,250].
+        save_image (bool, optional): Save the image with the boxes or not. Defaults to False.
+        image_path (str, optional) : Full path and name of the output file to be saved.
     """
+    logging.info(f"show_boxes: Input image type: {type(image)}") # Added logging
+    # Ensure image is a NumPy array of appropriate type for matplotlib
+    if isinstance(image, Image.Image):
+        image_to_plot = np.array(image.convert('L')) # Convert to grayscale NumPy array
+        logging.info("show_boxes: Converted PIL Image to grayscale NumPy array for plotting.")
+    elif isinstance(image, np.ndarray):
+        if image.ndim == 3 and image.shape[2] in [3,4]: # RGB or RGBA NumPy array
+            image_to_plot = np.mean(image, axis=2).astype(image.dtype) # Convert to grayscale
+            logging.info("show_boxes: Converted multi-channel NumPy array to grayscale for plotting.")
+        else: # Assume grayscale already
+            image_to_plot = image
+            logging.info("show_boxes: Image is already a grayscale NumPy array.")
+    else:
+        logging.error("show_boxes: Unsupported image format received.")
+        image_to_plot = np.zeros((100,100), dtype=np.uint8) # Fallback to black image
     _, ax = plt.subplots(1)
+    ax.imshow(image_to_plot, cmap='gray')  # show image on correct axis
     ax.set_xticks([])
     ax.set_yticks([])
     for key, label in damage_sites.items():
+        position = [key[0], key[1]] # Assuming key[0] is y (row) and key[1] is x (column)
         edgecolor = {
             'Inclusion': 'b',
             'Interface': 'g',
             'Martensite': 'r',
             'Notch': 'y',
+            'Shadowing': 'm',
+            'Not Classified': 'k' # Added Not Classified for completeness
         }.get(label, 'k')  # default: black
+        # Ensure box_size elements are floats for division
+        half_box_w = box_size[1] / 2.0
+        half_box_h = box_size[0] / 2.0
+        # x-coordinate of the bottom-left corner
+        rect_x = position[1] - half_box_w
+        # y-coordinate of the rectangle's anchor corner (smallest row index); ax.imshow defaults to origin='upper', so this edge is drawn at the top
+        rect_y = position[0] - half_box_h
+        rect = patches.Rectangle((rect_x, rect_y),
                                  box_size[1], box_size[0],
                                  linewidth=1, edgecolor=edgecolor, facecolor='none')
         ax.add_patch(rect)
     plt.close(fig)
+    return data
 ###
 ### cut out small images from panorama, append colour information
 ###
+def prepare_classifier_input(panorama, centroids: list, window_size=[250, 250]) -> list: # Removed np.ndarray type hint for panorama
     """
     Extracts square image patches centered at each given centroid from a grayscale panoramic SEM image.
     Parameters
     ----------
+    panorama : PIL.Image.Image or np.ndarray
+        Input SEM image. Should be a 2D array (H, W) or a 3D array (H, W, 1) representing grayscale data,
+        or a PIL Image object.
     centroids : list of [int, int]
         List of (y, x) coordinates marking the centers of regions of interest. These are typically damage sites
         List of extracted and normalized 3-channel image patches, each with shape (height, width, 3). Only
         centroids that allow full window extraction within image bounds are used.
     """
+    logging.info(f"prepare_classifier_input: Input panorama type: {type(panorama)}") # Added logging
+    # --- MINIMAL FIX START ---
+    # Convert PIL Image to NumPy array if necessary
+    if isinstance(panorama, Image.Image):
+        # Convert to grayscale NumPy array as your original code expects this structure for processing
+        if panorama.mode == 'RGB':
+            panorama_array = np.array(panorama.convert('L'))
+            logging.info("prepare_classifier_input: Converted RGB PIL Image to grayscale NumPy array.")
+        else:
+            panorama_array = np.array(panorama)
+            logging.info("prepare_classifier_input: Converted PIL Image to grayscale NumPy array.")
+    elif isinstance(panorama, np.ndarray):
+        # Ensure it's treated as a grayscale array for consistency with original logic
+        if panorama.ndim == 3 and panorama.shape[2] in [3, 4]: # RGB or RGBA NumPy array
+            panorama_array = np.mean(panorama, axis=2).astype(panorama.dtype) # Convert to grayscale
+            logging.info("prepare_classifier_input: Converted multi-channel NumPy array to grayscale.")
+        else:
+            panorama_array = panorama # Assume it's already grayscale 2D or (H,W,1)
+            logging.info("prepare_classifier_input: Panorama is already a suitable NumPy array.")
+    else:
+        logging.error("prepare_classifier_input: Unsupported panorama format received. Expected PIL Image or NumPy array.")
+        raise ValueError("Unsupported panorama format for classifier input.")
+    # Now, ensure panorama_array has a channel dimension if it's 2D for consistency
+    if panorama_array.ndim == 2:
+        panorama_array = np.expand_dims(panorama_array, axis=-1)  # (H, W, 1)
+        logging.info("prepare_classifier_input: Expanded 2D panorama to 3D (H,W,1).")
+    # --- MINIMAL FIX END ---
+    H, W, _ = panorama_array.shape # Use panorama_array here
     win_h, win_w = window_size
     images = []
     for (cy, cx) in centroids:
+        # Ensure coordinates are integers
+        cy, cx = int(round(cy)), int(round(cx))
         x1 = int(cx - win_w / 2)
         y1 = int(cy - win_h / 2)
         x2 = x1 + win_w
         # Skip if patch would go out of bounds
         if x1 < 0 or y1 < 0 or x2 > W or y2 > H:
+            logging.warning(f"prepare_classifier_input: Skipping centroid ({cy},{cx}) as patch is out of bounds.") # Added warning
             continue
         # Extract and normalize patch
+        patch = panorama_array[y1:y2, x1:x2, 0].astype(np.float32) # Use panorama_array
+        patch = patch * 2. / 255. - 1. # Keep your original normalization
         # Replicate grayscale channel to simulate RGB
         patch_color = np.repeat(patch[:, :, np.newaxis], 3, axis=2)
     return images