jaiyeshchahar's picture
Upload 11 files
5d3cdc9
import torch
import torch.optim as optim
import lightning.pytorch as pl
from lightning.pytorch.tuner import Tuner
from tqdm import tqdm
from torch.optim.lr_scheduler import OneCycleLR
import matplotlib.pyplot as plt
import matplotlib.patches as patches
import albumentations as A
from pytorch_grad_cam.utils.image import show_cam_on_image
from albumentations.pytorch import ToTensorV2
import config
from yolo_lightning import YOLOv3Lightning
import torch
import cv2
import numpy as np
import gradio as gr
import os
from utils_app import *
model = YOLOv3Lightning (config)
model.load_state_dict(torch.load("custom_yolo_model.pth", map_location=torch.device('cpu')), strict=False)
model.setup(stage="test")
IMAGE_SIZE = 416
ANCHORS = [
[(0.28, 0.22), (0.38, 0.48), (0.9, 0.78)],
[(0.07, 0.15), (0.15, 0.11), (0.14, 0.29)],
[(0.02, 0.03), (0.04, 0.07), (0.08, 0.06)],
] # Note these have been rescaled to be between [0, 1]
S = [IMAGE_SIZE // 32, IMAGE_SIZE // 16, IMAGE_SIZE // 8]
scaled_anchors = (
torch.tensor(config.ANCHORS)
* torch.tensor(config.S).unsqueeze(1).unsqueeze(1).repeat(1, 3, 2)
)
def process_image_and_plot(image, model, scaled_anchors):
transformed_image = config.transforms(image=image)["image"].unsqueeze(0)
output = model(transformed_image)
bboxes = [[] for _ in range(1)]
for i in range(3):
batch_size, A, S, _, _ = output[i].shape
anchor = scaled_anchors[i]
boxes_scale_i = cells_to_bboxes(output[i], anchor, S=S, is_preds=True)
for idx, box in enumerate(boxes_scale_i):
bboxes[idx] += box
nms_boxes = non_max_suppression(
bboxes[0], iou_threshold=0.5, threshold=0.4, box_format="midpoint",
)
fig = plot_image(transformed_image[0].permute(1, 2, 0), nms_boxes)
cam = YoloCAM(model=model, target_layers=[model.model.layers[-2]], use_cuda=False)
grayscale_cam = cam(transformed_image, scaled_anchors)[0, :, :]
img = cv2.resize(image, (416, 416))
img = np.float32(img) / 255
cam_image = show_cam_on_image(img, grayscale_cam, use_rgb=True)
return fig,cam_image
examples = [
["images/2012_004288.jpg"],
["images/2012_004314.jpg"],
["images/car.jpg"],
]
def processed_image(image):
figure,gradcam = process_image_and_plot(image, model, scaled_anchors)
return figure,gradcam
title = "YoloV3 on Pascal VOC Dataset (GradCAM)"
description = f"Pytorch Implemetation of YoloV3 trained from scratch on Pascal VOC dataset with GradCAM \n Class in pascol voc: {', '.join(config.PASCAL_CLASSES)}"
demo = gr.Interface(processed_image,
inputs=[
gr.Image(label="Input Image"),
],
outputs=[gr.Plot(),gr.Image(shape=(32, 32), label="GradCAM Prediction")],
title=title,
description=description,
examples=examples,
)
demo.launch()