Spaces:

RWTHMaterials
/

DP800_DamageClassification

Sleeping

App Files Files Community

kerzel committed on Jun 26, 2025

Commit

e360db8

1 Parent(s): da6b0fd

fix in clustering to operate on image

Browse files

Files changed (2) hide show

app.py +1 -1
clustering.py +63 -37

app.py CHANGED Viewed

@@ -147,7 +147,7 @@ with gr.Blocks() as app:
     gr.Markdown('Setareh Medghalchi, Ehsan Karimi, Sang-Hyeok Lee, Benjamin Berkels, Ulrich Kerzel, Sandra Korte-Kerzel, Three-dimensional characterisation of deformation-induced damage in dual phase steel using deep learning, Materials & Design, Volume 232, 2023, 112108, ISSN 0264-1275, [link] (https://doi.org/10.1016/j.matdes.2023.112108')
     gr.Markdown('Original data and code, including the network weights,  can be found at Zenodo [link](https://zenodo.org/records/8065752)')
-    image_input = gr.Image(value='data/X4-Aligned_cropped_upperleft_small.png', label='Example SEM Image (DP800 steel)',)
     with gr.Row():
         with gr.Column(scale=1):
             image_input = gr.Image(type="pil", label="Upload SEM Image")

     gr.Markdown('Setareh Medghalchi, Ehsan Karimi, Sang-Hyeok Lee, Benjamin Berkels, Ulrich Kerzel, Sandra Korte-Kerzel, Three-dimensional characterisation of deformation-induced damage in dual phase steel using deep learning, Materials & Design, Volume 232, 2023, 112108, ISSN 0264-1275, [link] (https://doi.org/10.1016/j.matdes.2023.112108')
     gr.Markdown('Original data and code, including the network weights,  can be found at Zenodo [link](https://zenodo.org/records/8065752)')
+    #image_input = gr.Image(value='data/X4-Aligned_cropped_upperleft_small.png', label='Example SEM Image (DP800 steel)',)
     with gr.Row():
         with gr.Column(scale=1):
             image_input = gr.Image(type="pil", label="Upload SEM Image")

clustering.py CHANGED Viewed

@@ -5,21 +5,19 @@
 """
 import numpy as np
 import scipy.ndimage as ndi
 from scipy.spatial import KDTree
 from sklearn.cluster import DBSCAN
 import logging
-def get_centroids(image : np.ndarray, image_threshold = 20,
                   eps=1, min_samples=5, metric='euclidean',
-                  min_size = 20, fill_holes = False,
-                  filter_close_centroids = False, filter_radius = 50) -> list:
-    """    Determine centroids of clusters corresponding to potential damage sites.
     In a first step, a threshold is applied to the input image to identify areas of potential damage sites.
     Using DBSCAN, these agglomerations of pixels are fitted into clusters. Then, the mean x/y values are determined
     from pixels belonging to one cluster. If the number of pixels in a given cluster exceeds the threshold given by min_size, this cluster is added
@@ -31,27 +29,50 @@ def get_centroids(image : np.ndarray, image_threshold = 20,
     DBScan documentation: https://scikit-learn.org/stable/modules/generated/sklearn.cluster.DBSCAN.html
     Args:
-        image (np.ndarray): Input SEM image
         image_threshold (int, optional): Threshold to be applied to the image to identify candidates for damage sites. Defaults to 20.
         eps (int, optional): parameter eps of DBSCAN: The maximum distance between two samples for one to be considered as in the neighborhood of the other. Defaults to 1.
         min_samples (int, optional): parameter min_samples of DBSCAN: The number of samples (or total weight) in a neighborhood for a point to be considered as a core point. Defaults to 5.
         metric (str, optional): parameter metric of DBSCAN. Defaults to 'euclidean'.
         min_size (int, optional): Minimum number of pixels in a cluster for the damage site candidate to be considered in the final list. Defaults to 20.
         fill_holes (bool, optional): Fill small holes in damage sites clusters using binary_fill_holes. Defaults to False.
-        filter_close_centroids (book optional): Filter cluster centroids within a given radius. Defaults to False
         filter_radius (float, optional): Radius within which centroids are considered to be the same. Defaults to 50
     Returns:
         list: list of (x,y) coordinates of the centroids of the clusters of accepted damage site candidates.
     """
     centroids = []
-    #print('Threshold: ', image_threshold)
     # apply the threshold to identify regions of "dark" pixels
-    # the result is a binary mask (true/false) whether a given pixel is above or below the threshold
-    cluster_candidates = image < image_threshold
     # sometimes the clusters have small holes in them, for example, individual pixels
     # inside a region below the threshold. This may confuse the clustering algorithm later on
@@ -59,20 +80,21 @@ def get_centroids(image : np.ndarray, image_threshold = 20,
     # https://docs.scipy.org/doc/scipy/reference/generated/scipy.ndimage.binary_fill_holes.html
     # N.B. the algorithm only works on binary data
     if fill_holes:
-        cluster_candidates = ndi.binary_fill_holes(cluster_candidates)
-    # apply the treshold to the image to identify regions of "dark" pixels
-    #cluster_candidates = np.asarray(image < image_threshold).nonzero()
     # transform image format into a numpy array to pass on to DBSCAN clustering
-    cluster_candidates = np.asarray(cluster_candidates).nonzero()
     cluster_candidates = np.transpose(cluster_candidates)
     # run the DBSCAN clustering algorithm, candidate sites that are not attributed to a cluster are labelled as "-1", i.e. "noise"
     # (e.g. they are too small, etc)
     # For the remaining pixels, a label is assigned to each pixel, indicating to which cluster (or noise) they belong to.
-    dbscan = DBSCAN(eps=eps, min_samples=min_samples, metric='euclidean')
     dbscan.fit(cluster_candidates)
@@ -87,25 +109,29 @@ def get_centroids(image : np.ndarray, image_threshold = 20,
     # we use "set" here, as the labels are attributed to individual pixels, i.e. they appear as often as we have pixels
     # in the cluster candidates
     for i in set(labels):
-        if i>-1:
             # all points belonging to a given cluster
-            cluster_points = cluster_candidates[labels==i, :]
             if len(cluster_points) > min_size:
-                x_mean=np.mean(cluster_points, axis=0)[0]
-                y_mean=np.mean(cluster_points, axis=0)[1]
-                centroids.append([x_mean,y_mean])
-    if filter_close_centroids:
         proximity_tree = KDTree(centroids)
         pairs = proximity_tree.query_pairs(filter_radius)
-        for p in pairs:
-            #print('pair: ', p, ' p[0]: ', p[0], ' p[1]:', p[1])
-            #print('coords: ', proximity_tree.data[p[0]], '  ', proximity_tree.data[p[1]])
-            coords_to_remove = [proximity_tree.data[p[0]][0], proximity_tree.data[p[0]][1]]
-            try:
-                idx = centroids.index(coords_to_remove)
-                centroids.pop(idx)
-            except ValueError:
-                pass
-    return centroids

 """
 import numpy as np
 import scipy.ndimage as ndi
 from scipy.spatial import KDTree
 from sklearn.cluster import DBSCAN
 import logging
+from PIL import Image # ADDED: Import PIL for image type checking/conversion
+def get_centroids(image, image_threshold=20, # Removed type hint np.ndarray as it can also be PIL.Image.Image initially
                   eps=1, min_samples=5, metric='euclidean',
+                  min_size=20, fill_holes=False,
+                  filter_close_centroids=False, filter_radius=50) -> list:
+    """
+    Determine centroids of clusters corresponding to potential damage sites.
     In a first step, a threshold is applied to the input image to identify areas of potential damage sites.
     Using DBSCAN, these agglomerations of pixels are fitted into clusters. Then, the mean x/y values are determined
     from pixels belonging to one cluster. If the number of pixels in a given cluster exceeds the threshold given by min_size, this cluster is added
     DBScan documentation: https://scikit-learn.org/stable/modules/generated/sklearn.cluster.DBSCAN.html
     Args:
+        image: Input SEM image (PIL Image or NumPy array).
         image_threshold (int, optional): Threshold to be applied to the image to identify candidates for damage sites. Defaults to 20.
         eps (int, optional): parameter eps of DBSCAN: The maximum distance between two samples for one to be considered as in the neighborhood of the other. Defaults to 1.
         min_samples (int, optional): parameter min_samples of DBSCAN: The number of samples (or total weight) in a neighborhood for a point to be considered as a core point. Defaults to 5.
         metric (str, optional): parameter metric of DBSCAN. Defaults to 'euclidean'.
         min_size (int, optional): Minimum number of pixels in a cluster for the damage site candidate to be considered in the final list. Defaults to 20.
         fill_holes (bool, optional): Fill small holes in damage sites clusters using binary_fill_holes. Defaults to False.
+        filter_close_centroids (bool, optional): Filter cluster centroids within a given radius. Defaults to False
         filter_radius (float, optional): Radius within which centroids are considered to be the same. Defaults to 50
     Returns:
         list: list of (x,y) coordinates of the centroids of the clusters of accepted damage site candidates.
     """
     centroids = []
+    logging.info(f"get_centroids: Input image type: {type(image)}") # Added logging
+    # --- MINIMAL FIX START ---
+    # Convert PIL Image to NumPy array if necessary
+    if isinstance(image, Image.Image):
+        # Convert to grayscale first for thresholding, assuming it's a single-channel operation
+        if image.mode == 'RGB': # Handle RGB images by converting to grayscale 'L' mode
+            image_array = np.array(image.convert('L'))
+            logging.info("get_centroids: Converted RGB PIL Image to grayscale NumPy array.") # Added logging
+        else: # Handle other PIL modes (like 'L' for grayscale)
+            image_array = np.array(image)
+            logging.info("get_centroids: Converted PIL Image to NumPy array.") # Added logging
+    elif isinstance(image, np.ndarray):
+        # If it's already a NumPy array, ensure it's grayscale if it was multi-channel
+        if image.ndim == 3 and image.shape[2] in [3, 4]: # RGB or RGBA NumPy array
+            image_array = np.mean(image, axis=2).astype(image.dtype) # Convert to grayscale by averaging channels
+            logging.info("get_centroids: Converted multi-channel NumPy array to grayscale NumPy array.") # Added logging
+        else: # Assume it's already a suitable grayscale NumPy array
+            image_array = image
+            logging.info("get_centroids: Image is already a suitable NumPy array.") # Added logging
+    else:
+        logging.error("get_centroids: Unsupported image format received. Expected PIL Image or NumPy array.") # Added logging
+        raise ValueError("Unsupported image format. Expected PIL Image or NumPy array for thresholding.")
     # apply the threshold to identify regions of "dark" pixels
+    # The result is a binary mask (true/false) whether a given pixel is above or below the threshold
+    # Now using 'image_array' instead of 'image'
+    cluster_candidates_mask = image_array < image_threshold
+    # --- MINIMAL FIX END ---
     # sometimes the clusters have small holes in them, for example, individual pixels
     # inside a region below the threshold. This may confuse the clustering algorithm later on
     # https://docs.scipy.org/doc/scipy/reference/generated/scipy.ndimage.binary_fill_holes.html
     # N.B. the algorithm only works on binary data
     if fill_holes:
+        cluster_candidates_mask = ndi.binary_fill_holes(cluster_candidates_mask)
     # transform image format into a numpy array to pass on to DBSCAN clustering
+    cluster_candidates = np.asarray(cluster_candidates_mask).nonzero()
     cluster_candidates = np.transpose(cluster_candidates)
+    # Handle case where no candidates are found after thresholding
+    if cluster_candidates.size == 0: # Added check for empty array
+        logging.warning("No cluster candidates found after thresholding. Returning empty centroids list.")
+        return []
     # run the DBSCAN clustering algorithm, candidate sites that are not attributed to a cluster are labelled as "-1", i.e. "noise"
     # (e.g. they are too small, etc)
     # For the remaining pixels, a label is assigned to each pixel, indicating to which cluster (or noise) they belong to.
+    dbscan = DBSCAN(eps=eps, min_samples=min_samples, metric=metric) # Used 'metric' parameter
     dbscan.fit(cluster_candidates)
     # we use "set" here, as the labels are attributed to individual pixels, i.e. they appear as often as we have pixels
     # in the cluster candidates
     for i in set(labels):
+        if i > -1: # Ensure it's not noise
             # all points belonging to a given cluster
+            cluster_points = cluster_candidates[labels == i, :]
             if len(cluster_points) > min_size:
+                x_mean = np.mean(cluster_points, axis=0)[0]
+                y_mean = np.mean(cluster_points, axis=0)[1]
+                centroids.append([x_mean, y_mean])
+    if filter_close_centroids and len(centroids) > 1: # Only filter if there's more than one centroid
         proximity_tree = KDTree(centroids)
         pairs = proximity_tree.query_pairs(filter_radius)
+        # Use a set to mark indices for removal to avoid modifying list during iteration
+        indices_to_remove = set()
+        for p1_idx, p2_idx in pairs:
+            # Decide which one to remove. For simplicity, remove the one with the higher index
+            # This ensures you don't try to remove an index that might have already been removed
+            indices_to_remove.add(max(p1_idx, p2_idx))
+        # Rebuild the centroids list, excluding the marked ones
+        filtered_centroids = [centroid for i, centroid in enumerate(centroids) if i not in indices_to_remove]
+        centroids = filtered_centroids
+        logging.info(f"Filtered {len(indices_to_remove)} close centroids. Remaining: {len(centroids)}")
+    return centroids