Spaces:

Prathush21
/

test

Runtime error

File size: 14,858 Bytes

bd3e8b6

import cv2
import torch
import torch.nn as nn
import numpy as np
import torchvision
import os
import copy
from sklearn.mixture import GaussianMixture as GMM
from sklearn.cluster import KMeans
from simple_lama_inpainting import SimpleLama
from PIL import Image
from matplotlib.colors import ListedColormap
import matplotlib.pyplot as plt
import matplotlib
import csv

matplotlib.use("Agg")

import base64

from utils import (
    select_sample_images,
    create_cell_descriptors_table,
    calculate_cell_descriptors,
)

preprocessed_folder = "uploads/"
intermediate_folder = "heatmaps/"
segmentation_folder = "segmentations/"
tables_folder = "tables/"
cell_descriptors_path = "cell_descriptors/cell_descriptors.csv"
imgclasses = {0: "abnormal", 1: "normal"}


def toconv(layers):
    newlayers = []
    for i, layer in enumerate(layers):
        if isinstance(layer, nn.Linear):
            newlayer = None
            if i == 0:
                m, n = 512, layer.weight.shape[0]
                newlayer = nn.Conv2d(m, n, 4)
                newlayer.weight = nn.Parameter(layer.weight.reshape(n, m, 4, 4))
            else:
                m, n = layer.weight.shape[1], layer.weight.shape[0]
                newlayer = nn.Conv2d(m, n, 1)
                newlayer.weight = nn.Parameter(layer.weight.reshape(n, m, 1, 1))
            newlayer.bias = nn.Parameter(layer.bias)
            newlayers += [newlayer]
        else:
            newlayers += [layer]
    return newlayers


def newlayer(layer, g):
    layer = copy.deepcopy(layer)
    try:
        layer.weight = nn.Parameter(g(layer.weight))
    except AttributeError:
        pass
    try:
        layer.bias = nn.Parameter(g(layer.bias))
    except AttributeError:
        pass
    return layer


def heatmap(R, sx, sy, intermediate_path):
    b = 10 * ((np.abs(R) ** 3.0).mean() ** (1.0 / 3))
    my_cmap = plt.cm.seismic(np.arange(plt.cm.seismic.N))
    my_cmap[:, 0:3] *= 0.85
    my_cmap = ListedColormap(my_cmap)
    plt.figure(figsize=(sx, sy))
    plt.subplots_adjust(left=0, right=1, bottom=0, top=1)
    plt.axis("off")
    plt.imshow(R, cmap=my_cmap, vmin=-b, vmax=b, interpolation="nearest")
    # plt.show()
    plt.savefig(intermediate_path, bbox_inches="tight", pad_inches=0)
    plt.close()


def get_LRP_heatmap(image, L, layers, imgclasses, intermediate_path):
    img = np.array(image)[..., ::-1] / 255.0
    mean = torch.FloatTensor([0.485, 0.456, 0.406]).reshape(1, -1, 1, 1)  # torch.cuda
    std = torch.FloatTensor([0.229, 0.224, 0.225]).reshape(1, -1, 1, 1)  # torch.cuda
    X = (torch.FloatTensor(img[np.newaxis].transpose([0, 3, 1, 2]) * 1) - mean) / std

    A = [X] + [None] * L
    for l in range(L):
        A[l + 1] = layers[l].forward(A[l])

    scores = np.array(A[-1].cpu().data.view(-1))
    ind = np.argsort(-scores)
    for i in ind[:2]:
        print("%20s (%3d): %6.3f" % (imgclasses[i], i, scores[i]))

    T = torch.FloatTensor(
        (1.0 * (np.arange(2) == ind[0]).reshape([1, 2, 1, 1]))
    )  # SET FOR THE HIGHEST SCORE CLASS
    R = [None] * L + [(A[-1] * T).data]
    for l in range(1, L)[::-1]:
        A[l] = (A[l].data).requires_grad_(True)
        if isinstance(layers[l], torch.nn.MaxPool2d):
            layers[l] = torch.nn.AvgPool2d(2)
        if isinstance(layers[l], torch.nn.Conv2d) or isinstance(
            layers[l], torch.nn.AvgPool2d
        ):
            rho = lambda p: p + 0.25 * p.clamp(min=0)
            incr = lambda z: z + 1e-9  # USE ONLY THE GAMMA RULE FOR ALL LAYERS

            z = incr(newlayer(layers[l], rho).forward(A[l]))  # step 1
            # adding epsilon
            epsilon = 1e-9
            z_nonzero = torch.where(z == 0, torch.tensor(epsilon, device=z.device), z)
            s = (R[l + 1] / z_nonzero).data
            # s = (R[l+1]/z).data                                    # step 2
            (z * s).sum().backward()
            c = A[l].grad  # step 3
            R[l] = (A[l] * c).data  # step 4
        else:
            R[l] = R[l + 1]

    A[0] = (A[0].data).requires_grad_(True)
    lb = (A[0].data * 0 + (0 - mean) / std).requires_grad_(True)
    hb = (A[0].data * 0 + (1 - mean) / std).requires_grad_(True)

    z = layers[0].forward(A[0]) + 1e-9  # step 1 (a)
    z -= newlayer(layers[0], lambda p: p.clamp(min=0)).forward(lb)  # step 1 (b)
    z -= newlayer(layers[0], lambda p: p.clamp(max=0)).forward(hb)  # step 1 (c)

    # adding epsilon
    epsilon = 1e-9
    z_nonzero = torch.where(z == 0, torch.tensor(epsilon, device=z.device), z)
    s = (R[1] / z_nonzero).data  # step 2

    (z * s).sum().backward()
    c, cp, cm = A[0].grad, lb.grad, hb.grad  # step 3
    R[0] = (A[0] * c + lb * cp + hb * cm).data  # step 4
    heatmap(
        np.array(R[0][0].cpu()).sum(axis=0), 2, 2, intermediate_path
    )  # HEATMAPPING TO SEE LRP MAPS WITH NEW RULE
    return R[0][0].cpu()


def get_nucleus_mask_for_graphcut(R):
    res = np.array(R).sum(axis=0)
    # Reshape the data to a 1D array
    data_1d = res.flatten().reshape(-1, 1)
    n_clusters = 2
    kmeans = KMeans(n_clusters=n_clusters, random_state=0)
    # kmeans.fit(data_1d)
    kmeans.fit(data_1d)
    # Step 4: Assign data points to clusters
    cluster_assignments = kmeans.labels_
    # Step 5: Reshape cluster assignments into a 2D binary matrix
    binary_matrix = cluster_assignments.reshape(128, 128)
    # Now, binary_matrix contains 0s and 1s, separating the data into two classes using K-Means clustering
    rel_grouping = np.zeros((128, 128, 3), dtype=np.uint8)
    rel_grouping[binary_matrix == 1] = [255, 0, 0]  # Main object (Blue)
    rel_grouping[binary_matrix == 2] = [128, 0, 0]  # Second label (Dark Blue)
    rel_grouping[binary_matrix == 0] = [0, 0, 255]  # Background (Red)
    return rel_grouping


def segment_nucleus(image, rel_grouping):  # clustered = rel_grouping

    # GET THE BOUNDING BOX FROM CLUSTERED
    blue_pixels = np.sum(np.all(rel_grouping == [255, 0, 0], axis=-1))
    red_pixels = np.sum(np.all(rel_grouping == [0, 0, 255], axis=-1))
    if red_pixels > blue_pixels:
        color = np.array([255, 0, 0])
    else:
        color = np.array([0, 0, 255])
    mask = cv2.inRange(rel_grouping, color, color)
    contours, _ = cv2.findContours(mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
    contour_areas = []
    for contour in contours:
        x, y, w, h = cv2.boundingRect(contour)
        contour_areas.append(cv2.contourArea(contour))
    contour_areas.sort()
    contour_areas = np.array(contour_areas)
    quartile_50 = np.percentile(contour_areas, 50)
    selected_contours = [
        contour for contour in contours if cv2.contourArea(contour) >= quartile_50
    ]
    x, y, w, h = cv2.boundingRect(np.concatenate(selected_contours))

    # APPLY GRABCUT
    fgModel = np.zeros((1, 65), dtype="float")
    bgModel = np.zeros((1, 65), dtype="float")
    mask = np.zeros(image.shape[:2], np.uint8)
    rect = (x, y, x + w, y + h)

    # IF BOUNDING BOX IS THE WHOLE IMAGE, THEN BOUNDING BOX METHOD WONT'T WORK -> SO USE INIT WITH MASK METHOD ITSELF
    if (x, y, x + w, y + h) == (0, 0, 128, 128):

        if (
            red_pixels > blue_pixels
        ):  # red is the dominant color and thus the background
            mask[(rel_grouping == [255, 0, 0]).all(axis=2)] = (
                cv2.GC_PR_FGD
            )  # Probable Foreground
            mask[(rel_grouping == [0, 0, 255]).all(axis=2)] = (
                cv2.GC_PR_BGD
            )  # Probable Background
        else:  # blue is the dominant color and thus the background
            mask[(rel_grouping == [0, 0, 255]).all(axis=2)] = (
                cv2.GC_PR_FGD
            )  # Probable Foreground
            mask[(rel_grouping == [255, 0, 0]).all(axis=2)] = (
                cv2.GC_PR_BGD
            )  # Probable Background

        (mask, bgModel, fgModel) = cv2.grabCut(
            image,
            mask,
            rect,
            bgModel,
            fgModel,
            iterCount=10,
            mode=cv2.GC_INIT_WITH_MASK,
        )

    # ELSE PASS THE BOUNDING BOX FOR GRABCUT
    else:
        (mask, bgModel, fgModel) = cv2.grabCut(
            image,
            mask,
            rect,
            bgModel,
            fgModel,
            iterCount=10,
            mode=cv2.GC_INIT_WITH_RECT,
        )

    # FORM THE COLORED SEGMENTATION MASK
    clean_binary_mask = np.where(
        (mask == cv2.GC_FGD) | (mask == cv2.GC_PR_FGD), 1, 0
    ).astype("uint8")
    nucleus_segment = np.zeros((128, 128, 3), dtype=np.uint8)
    nucleus_segment[clean_binary_mask == 1] = [255, 0, 0]  # Main object (Blue)
    nucleus_segment[clean_binary_mask == 0] = [0, 0, 255]  # Background (Red)
    return nucleus_segment, clean_binary_mask


def remove_nucleus(image1, blue_mask1):  # image, blue_mask, x, y
    # expand the nucleus mask
    # image1 = cv2.resize(image, (128,128))
    # blue_mask1 = cv2.resize(blue_mask, (128,128))
    kernel = np.ones((5, 5), np.uint8)  # Adjust the kernel size as needed
    expandedmask = cv2.dilate(blue_mask1, kernel, iterations=1)
    simple_lama = SimpleLama()
    image_pil = Image.fromarray(cv2.cvtColor(image1, cv2.COLOR_BGR2RGB))
    mask_pil = Image.fromarray(expandedmask)
    result = simple_lama(image_pil, mask_pil)
    result_cv2 = np.array(result)
    result_cv2 = cv2.cvtColor(result_cv2, cv2.COLOR_RGB2BGR)
    # result_cv2 = cv2.resize(result_cv2, (x,y))
    return expandedmask, result_cv2


def get_final_mask(nucleus_removed_img, blue_mask, expanded_mask):
    # apply graphcut - init with rectangle (not mask approximation mask)
    fgModel = np.zeros((1, 65), dtype="float")
    bgModel = np.zeros((1, 65), dtype="float")

    rect = (1, 1, nucleus_removed_img.shape[1], nucleus_removed_img.shape[0])

    (mask, bgModel, fgModel) = cv2.grabCut(
        nucleus_removed_img,
        expanded_mask,
        rect,
        bgModel,
        fgModel,
        iterCount=20,
        mode=cv2.GC_INIT_WITH_RECT,
    )

    clean_binary_mask = np.where(
        (mask == cv2.GC_FGD) | (mask == cv2.GC_PR_FGD), 1, 0
    ).astype("uint8")
    colored_segmentation_mask = np.zeros((128, 128, 3), dtype=np.uint8)
    colored_segmentation_mask[clean_binary_mask == 1] = [
        128,
        0,
        0,
    ]  # Main object (Blue)
    colored_segmentation_mask[clean_binary_mask == 0] = [0, 0, 255]  # Background (Red)
    colored_segmentation_mask[blue_mask > 0] = [255, 0, 0]
    return colored_segmentation_mask


def lrp_main(pixel_conversion):
    i = 0
    return_dict_count = 1
    return_dict = {}
    selected_indices = select_sample_images()
    resized_shape = (128, 128)
    cell_descriptors = [
        ["Image Name", "Nucleus Area", "Cytoplasm Area", "Nucleus to Cytoplasm Ratio"]
    ]

    for imagefile in os.listdir(preprocessed_folder):
        if (
            "MACOSX".lower() in imagefile.lower()
            or "." == imagefile[0]
            or "_" == imagefile[0]
        ):
            print(imagefile)
            continue
        image_path = (
            preprocessed_folder + os.path.splitext(imagefile)[0].lower() + ".png"
        )
        intermediate_path = (
            intermediate_folder
            + os.path.splitext(imagefile)[0].lower()
            + "_heatmap.png"
        )
        save_path = (
            segmentation_folder + os.path.splitext(imagefile)[0].lower() + "_mask.png"
        )
        table_path = (
            tables_folder + os.path.splitext(imagefile)[0].lower() + "_table.png"
        )

        # print(i, imagefile)
        image = cv2.imread(image_path)
        original_shape = image.shape

        image = cv2.resize(image, (128, 128))

        # MODEL SECTION STARTS FOR NEW MODEL
        vgg16 = torchvision.models.vgg16(pretrained=True)
        new_avgpool = nn.AdaptiveAvgPool2d(output_size=(4, 4))
        vgg16.avgpool = new_avgpool
        classifier_list = [
            nn.Linear(8192, vgg16.classifier[0].out_features)
        ]  # vgg16.classifier[0].out_features = 4096
        classifier_list += list(vgg16.classifier.children())[
            1:-1
        ]  # Remove the first and last layers
        classifier_list += [
            nn.Linear(vgg16.classifier[6].in_features, 2)
        ]  # vgg16.classifier[6].in_features = 4096
        vgg16.classifier = nn.Sequential(
            *classifier_list
        )  # Replace the model classifier

        PATH = "herlev_best_adam_vgg16_modified12_final.pth"
        checkpoint = torch.load(PATH, map_location=torch.device("cpu"))
        vgg16.load_state_dict(checkpoint)
        # vgg16.to(torch.device('cuda'))
        vgg16.eval()

        layers = list(vgg16._modules["features"]) + toconv(
            list(vgg16._modules["classifier"])
        )
        L = len(layers)
        # MODEL SECTION ENDS

        R = get_LRP_heatmap(image, L, layers, imgclasses, intermediate_path)

        rel_grouping = get_nucleus_mask_for_graphcut(R)

        nucleus_segment, clean_binary_mask = segment_nucleus(image, rel_grouping)

        expanded_mask, nucleus_removed_image = remove_nucleus(image, clean_binary_mask)

        colored_segmentation_mask = get_final_mask(
            nucleus_removed_image, clean_binary_mask, expanded_mask
        )

        cv2.imwrite(save_path, colored_segmentation_mask)

        nucleus_area, cytoplasm_area, ratio = calculate_cell_descriptors(
            original_shape, resized_shape, pixel_conversion, colored_segmentation_mask
        )
        cell_descriptors.append(
            [
                os.path.splitext(imagefile)[0].lower(),
                nucleus_area,
                cytoplasm_area,
                ratio,
            ]
        )

        create_cell_descriptors_table(table_path, nucleus_area, cytoplasm_area, ratio)

        if i in selected_indices:
            return_dict[f"image{return_dict_count}"] = str(
                base64.b64encode(open(image_path, "rb").read()).decode("utf-8")
            )
            return_dict[f"inter{return_dict_count}"] = str(
                base64.b64encode(open(intermediate_path, "rb").read()).decode("utf-8")
            )
            return_dict[f"mask{return_dict_count}"] = str(
                base64.b64encode(open(save_path, "rb").read()).decode("utf-8")
            )
            return_dict[f"table{return_dict_count}"] = str(
                base64.b64encode(open(table_path, "rb").read()).decode("utf-8")
            )
            return_dict_count += 1

        i += 1

        # Visualization
        # for im in [image, gt2, rel_grouping, nucleus_segment, clean_binary_mask*255, nucleus_removed_image, colored_segmentation_mask]:
        #   cv2_imshow(im)

    # write cell_descriptors list to csv file
    with open(cell_descriptors_path, "w", newline="") as csv_file:
        writer = csv.writer(csv_file)
        writer.writerows(cell_descriptors)

    return return_dict