File size: 15,430 Bytes

ae29340

import numpy as np
from tensorflow.keras import backend as K
import tensorflow.keras as keras
import math
from matplotlib import pyplot as plt
import cv2
import time
import scipy
from os import listdir
from IPython.display import clear_output
import segmentation_models as sm
from PIL import Image
import images_toolkit as tlk


def dice_coef(y_true, y_pred, smooth=1):
    y_true_f = K.flatten(y_true)
    y_pred_f = K.flatten(y_pred)
    intersection = K.sum(y_true_f * y_pred_f)
    return (2.0 * intersection + smooth) / (K.sum(y_true_f) + K.sum(y_pred_f) + smooth)


def dice_loss(alpha=1):
    def dice_coef_loss(y_true, y_pred):
        return 1 - alpha * dice_coef(y_true, y_pred)

    return dice_coef_loss


def categorical_loss():
    def categorical(y_true, y_pred):
        return keras.losses.CategoricalCrossentropy()(y_true, y_pred)

    return categorical


def bce_loss():
    def bce(y_true, y_pred):
        return keras.losses.BinaryCrossentropy()(y_true, y_pred)

    return bce


def tversky(y_true, y_pred, smooth=1, alpha=0.7):
    y_true_pos = K.flatten(y_true)
    y_pred_pos = K.flatten(y_pred)
    true_pos = K.sum(y_true_pos * y_pred_pos)
    false_neg = K.sum(y_true_pos * (1 - y_pred_pos))
    false_pos = K.sum((1 - y_true_pos) * y_pred_pos)
    return (true_pos + smooth) / (
        true_pos + alpha * false_neg + (1 - alpha) * false_pos + smooth
    )


def tversky_loss(y_true, y_pred):
    return 1 - tversky(y_true, y_pred)


# def focal_tversky_loss(y_true, y_pred, gamma=0.75):
#    tv = tversky(y_true, y_pred)
#    return K.pow((1 - tv), gamma)


def categorical_focal_loss(gamma=2.0, alpha=0.25):
    def cate_focal_loss(y_true, y_pred):
        CAT_FL = sm.losses.categorical_focal_loss
        CAT_FL.gamma = gamma
        CAT_FL.alpha = alpha
        return CAT_FL(y_true, y_pred)

    return cate_focal_loss


def focal_loss(gamma=2.0, alpha=0.7):
    def focal_tversky_loss(y_true, y_pred):
        tv = tversky(y_true, y_pred, alpha)
        return K.pow((1 - tv), gamma)

    return focal_tversky_loss


def single_iou(y_true, y_pred, label: int):
    """
    Return the Intersection over Union (IoU) for a given label.
    Args:
        y_true: the expected y values as a one-hot
        y_pred: the predicted y values as a one-hot or softmax output
        label: the label to return the IoU for
    Returns:
        the IoU for the given label
    """
    # extract the label values using the argmax operator then
    # calculate equality of the predictions and truths to the label
    y_true = K.cast(K.equal(K.argmax(y_true), label), K.floatx())
    y_pred = K.cast(K.equal(K.argmax(y_pred), label), K.floatx())

    # y_true = K.cast(K.equal(K.argmax(y_true), 1), K.floatx())
    # y_pred = K.cast(K.equal(K.argmax(y_pred), 1), K.floatx())
    # calculate the |intersection| (AND) of the labels
    intersection = K.sum(y_true * y_pred)
    # calculate the |union| (OR) of the labels
    union = K.sum(y_true) + K.sum(y_pred) - intersection
    # avoid divide by zero - if the union is zero, return 1
    # otherwise, return the intersection over union
    a = K.switch(K.equal(union, 0), 1.0, intersection / union)
    return K.switch(K.equal(union, 0), 1.0, intersection / union)


def iou(y_true, y_pred):
    """
    Return the Intersection over Union (IoU) score.
    Args:
        y_true: the expected y values as a one-hot
        y_pred: the predicted y values as a one-hot or softmax output
    Returns:
        the scalar IoU value (mean over all labels)
    """
    # get number of labels to calculate IoU for
    num_labels = K.int_shape(y_pred)[-1]
    # initialize a variable to store total IoU in
    total_iou = K.variable(0)
    # iterate over labels to calculate IoU for
    for label in range(num_labels):
        total_iou = total_iou + single_iou(y_true, y_pred, label)
    # divide total IoU by number of labels to get mean IoU
    a = total_iou / num_labels
    return total_iou / num_labels


def simple_iou(gt, pred):
    """Computes IoU for a binary classified image. Input shapes: (h, w)"""
    return np.nan_to_num(
        np.sum((gt == 1) & (pred == 1)) / np.sum((gt == 1) | (pred == 1)), 0
    )


def simple_iou_for_multiple_classes(gt, pred, n_classes):
    """Computes IoU for a categorically classified image. Input shapes: (h, w)
    If n_classes > 3, then it will also compute the IoU of the union of all classes
    that are >= 3 (i.e., the IoU of objects as one).
    Returns: array of (h, w, n_classes) if n_classes <= 3
             array of (h, w, n_classes+1) if n_classes > 3
    """
    assert gt.shape == pred.shape and gt.ndim == 2
    assert np.max(gt) < n_classes and np.max(pred) < n_classes

    f_gt = gt.flatten()
    f_pred = pred.flatten()
    gt_matrix = np.zeros((f_gt.size, n_classes), dtype=int)
    pred_matrix = gt_matrix.copy()
    gt_matrix[np.arange(f_gt.size), f_gt] = 1
    pred_matrix[np.arange(f_gt.size), f_pred] = 1
    intersections = np.sum((gt_matrix == 1) & (pred_matrix == 1), axis=0)
    unions = np.sum((gt_matrix == 1) | (pred_matrix == 1), axis=0)
    ious = intersections / unions
    if n_classes > 3:
        gt_as_one = f_gt >= 2
        pred_as_one = f_pred >= 2
        iou_as_one = np.sum(gt_as_one & pred_as_one) / np.sum(gt_as_one | pred_as_one)
        return np.append(ious, iou_as_one)
    else:
        return ious


def add_mask(image, mask):
    b_channel, g_channel, r_channel = cv2.split(image)
    alpha_channel = mask * 255

    alpha_channel = alpha_channel.astype(np.float64)

    g_channel_out = np.clip(np.add(alpha_channel, g_channel), 0, 255)
    g_channel_out = g_channel_out.astype(np.uint8)

    alpha_channel = alpha_channel.astype(np.uint8)
    img_BGRA = cv2.merge((b_channel, g_channel_out, r_channel, alpha_channel))
    image_RGBA = cv2.cvtColor(img_BGRA, cv2.COLOR_BGRA2RGBA)

    return image_RGBA, alpha_channel


def resolution2framesize3cha(resolution):
    if resolution == "640x240":
        framesize = (240, 640, 3)
    if resolution == "640x480":
        framesize = (480, 640, 3)
    if resolution == "1280x480":
        framesize = (480, 1280, 3)
    if resolution == "1280x720":
        framesize = (720, 1280, 3)
    if resolution == "960x540":
        framesize = (540, 960, 3)
    if resolution == "320x240":
        framesize = (240, 320, 3)
    if resolution == "1024x768":
        framesize = (768, 1024, 3)
    if resolution == "2560x960":
        framesize = (960, 2560, 3)
    if resolution == "2560x720":
        framesize = (720, 2560, 3)
    return framesize


def resolution2framesize(resolution):
    if resolution == "640x240":
        framesize = (240, 640)
    if resolution == "640x480":
        framesize = (480, 640)
    if resolution == "1280x480":
        framesize = (480, 1280)
    if resolution == "1280x720":
        framesize = (720, 1280)
    if resolution == "960x540":
        framesize = (540, 960)
    if resolution == "320x240":
        framesize = (240, 320)
    if resolution == "1024x768":
        framesize = (768, 1024)
    if resolution == "2560x960":
        framesize = (960, 2560)
    if resolution == "2560x720":
        framesize = (720, 2560)
    return framesize


def webcam_test(model):

    cap = cv2.VideoCapture(2)
    cont = True

    while cont:

        # Capture a frame from camera

        ret, frame = cap.read()
        print(frame.shape)

        if not ret:
            break

        # x = [frame]
        frame = np.array(frame) / 255.0
        x = np.reshape(frame, (1, 480, 640, 3))

        # frame = cv2.resize(frame, (720,720))
        # x = np.reshape(frame,(1,720,720,3))
        start_t = time.time()
        pred = model.predict(x)
        duration = time.time() - start_t
        pred = pred[0, :, :, :]
        pred = np.argmax(pred, 2)

        print(pred.shape)
        overlap = add_mask(frame, pred)

        print(duration)

        cv2.imshow("Overlap", overlap)
        if cv2.waitKey(1) & 0xFF == ord("q"):
            break


def image_test(model, img_dir, img_num, label_dir=None):

    list_IDs = [f[:-4] for f in listdir(img_dir) if f[-4:] == ".jpg"]
    img_path = img_dir + list_IDs[img_num] + ".jpg"
    test_img = cv2.imread(img_path) / 255.0
    test_img = np.reshape(test_img, (1, test_img.shape[0], test_img.shape[1], 3))

    pred = model.predict(test_img)
    pred = pred[0, :, :, :]
    predict = np.argmax(pred, 2)

    overlapping = add_mask(test_img[0, :, :, :], predict)

    cv2.imshow("Prediction", overlapping)
    cv2.imwrite(
        "./models_repo/frozen_resnet/Trial11/prediction_" + str(img_num) + ".png",
        overlapping,
    )

    if label_dir != None:
        lab = label_dir + list_IDs[img_num] + ".png"

        lab_img = cv2.imread(lab) * 255
        lab_img = np.array(lab_img)
        cv2.imshow("Label", lab_img)
        cv2.imwrite(
            "./models_repo/frozen_resnet/Trial10/label_" + str(img_num) + ".png",
            lab_img,
        )

    cv2.waitKey(0)


class PlotLosses(keras.callbacks.Callback):
    def __init__(self, out_dir):
        self.out_dir = out_dir

    def on_train_begin(self, logs={}):
        self.i = 0
        self.x = []
        self.losses = []
        self.val_losses = []
        # self.fig_loss = plt.figure()
        self.train_iou = []
        self.val_iou = []
        # self.fig_iou = plt.figure()

        self.live_loss = []
        self.fig_livel = plt.figure()

        self.live_iou = []
        self.fig_livei = plt.figure()

        self.logs = []
        self.live_logs = []
        self.b = 0
        self.x_b = []
        self.loss = 0
        self.iou = 0
        self.num = 0

    def on_batch_end(self, batch, logs={}):
        self.iou += logs.get("iou")
        self.loss += logs.get("loss")
        self.num += 1
        if self.b % 50 == 0:
            self.x_b.append(self.num)
            self.live_loss.append(self.loss / float(self.b + 1))
            self.live_iou.append(self.iou / float(self.b + 1))
            clear_output(wait=True)
            plt.ioff()
            fig1 = plt.figure(1)
            plt.ioff()
            plt.plot(self.x_b, self.live_loss, label="Training loss")
            plt.title("Training loss")
            plt.xlabel("Iteration")
            plt.ylabel("Loss")
            plt.savefig(self.out_dir + "training_loss.png")
            plt.close(fig1)
            clear_output(wait=True)
            fig2 = plt.figure(2)
            plt.plot(self.x_b, self.live_iou, label="Training iou")
            plt.title("Training IoU")
            plt.xlabel("Iteration")
            plt.ylabel("IoU")
            plt.savefig(self.out_dir + "training_iou.png")
            plt.close(fig2)
        self.b += 1

    def on_epoch_end(self, epoch, logs={}):
        self.loss = 0
        self.iou = 0
        self.b = 0
        self.logs.append(logs)
        self.x.append(self.i)
        self.losses.append(logs.get("loss"))
        self.val_losses.append(logs.get("val_loss"))
        self.i += 1
        self.train_iou.append(logs.get("iou"))
        self.val_iou.append(logs.get("val_iou"))
        plt.ioff()
        fig3 = plt.figure(3)
        clear_output(wait=True)
        plt.plot(self.x, self.losses, label="loss")
        plt.plot(self.x, self.val_losses, label="val_loss")
        plt.title("Loss curve")
        plt.xlabel("Epoch")
        plt.ylabel("Loss")
        plt.legend()
        plt.savefig(self.out_dir + "loss_curve.png")
        plt.close(fig3)
        fig4 = plt.figure(4)
        clear_output(wait=True)
        plt.plot(self.x, self.train_iou, label="train_iou")
        plt.plot(self.x, self.val_iou, label="val_iou")
        plt.title("IoU curve")
        plt.xlabel("Epoch")
        plt.ylabel("IoU")
        plt.legend()
        plt.savefig(self.out_dir + "mean_iou_curve.png")
        plt.close(fig4)


def step_decay(epoch):
    initial_lrate = 0.1
    drop = 0.5
    epochs_drop = 10.0
    lrate = initial_lrate * math.pow(drop, math.floor((epoch) / epochs_drop))
    return lrate


label_colours = [
    (0, 0, 0),  # 0=background
    # 1=wall,       2=floor,   3=cabinet,     4=bed,       5=chair
    (128, 0, 0),
    (0, 128, 0),
    (128, 128, 0),
    (0, 0, 128),
    (128, 0, 128),
    # 6=sofa,       7=table,           8=door,   9=window, 10=bookshelf
    (0, 128, 128),
    (128, 128, 128),
    (255, 200, 180),
    (192, 0, 0),
    (192, 192, 192),
    # 11=picture,      12=counter,  13=blinds,      14=desk,         15=shelves
    (192, 128, 0),
    (64, 0, 128),
    (192, 0, 128),
    (255, 128, 0),
    (192, 128, 128),
    # 16=curtain, 17=dresser, 18=pillow,    19=mirror,    20=floor_mat,    21=clothes
    (0, 64, 0),
    (128, 64, 0),
    (0, 192, 0),
    (153, 153, 255),
    (0, 64, 128),
    (255, 255, 0),
    # 22=ceiling,     23=books,        24=fridge,       25=tv,         26=paper,      27=towel
    (250, 250, 250),
    (0, 192, 128),
    (250, 102, 250),
    (102, 250, 250),
    (44, 166, 44),
    (44, 44, 166),
    # 28=shower_curtain, 29=box, 30=whiteboard, 31=person, 32=night_stand, 33=toilet
    (166, 44, 44),
    (0, 250, 0),
    (250, 0, 0),
    (0, 0, 250),
    (206, 219, 156),
    (219, 156, 206),
    # 34=sink         #35=lamp         #36=bathtub     #37=bag         #38=Unknown
    (156, 206, 219),
    (23, 190, 207),
    (207, 23, 190),
    (190, 207, 23),
    (153, 0, 76),
]
# #
# label_colours = [(0, 0, 0),  # 0=background
#                  #1=hand,
#                 (128, 0, 0)]


def decode_labels(mask, num_classes=38):
    """Decode batch of segmentation masks.

    Args:
      mask: result of inference after taking argmax.
      num_images: number of images to decode from the batch.
      num_classes: number of classes to predict (including background).

    Returns:
      A batch with num_images RGB images of the same size as the input.
    """
    n, h, w, c = mask.shape
    outputs = np.zeros((h, w, 3), dtype=np.uint8)
    binary = np.zeros((h, w), dtype=np.uint8)
    R = np.zeros((h, w), dtype=np.uint8)
    G = np.zeros((h, w), dtype=np.uint8)
    B = np.zeros((h, w), dtype=np.uint8)

    for i in range(0, num_classes):

        # print("i is",i)
        # tlk.show_image(mask[0,:,:,i])
        binary[mask[0, :, :, i] >= 0.5] = 1
        binary[mask[0, :, :, i] < 0.5] = 0
        # tlk.show_image(binary)
        color_R = label_colours[i][0] * np.ones([h, w])
        color_G = label_colours[i][1] * np.ones([h, w])
        color_B = label_colours[i][2] * np.ones([h, w])
        # print("colour_R.shape",color_R.shape)

        R_aux = np.multiply(binary, color_R)
        R_aux_int = R_aux.astype(np.uint8)
        G_aux = np.multiply(binary, color_G)
        G_aux_int = G_aux.astype(np.uint8)
        B_aux = np.multiply(binary, color_B)
        B_aux_int = B_aux.astype(np.uint8)

        R += R_aux_int
        G += G_aux_int
        B += B_aux_int

        R_ = R.reshape(*R.shape, 1)
        G_ = G.reshape(*G.shape, 1)
        B_ = B.reshape(*B.shape, 1)

        outputs = np.concatenate((R_, G_, B_), axis=2)
        # outputs[:, :,:] = (np.multiply(binary, label_colours[i]))

    # tlk.show_image(outputs)

    # img = Image.new('RGB', (len(mask[0, 0]), len(mask[0])))
    # pixels = img.load()
    # for j_, j in enumerate(mask[0, :, :, 0]):
    #     for k_, k in enumerate(j):
    #       if k < num_classes:
    #         pixels[k_, j_] = label_colours[k]
    #
    # outputs = np.array(img)
    return outputs