Spaces:

Arekku21
/

Cub_200_2011_Resnet

Build error

App Files Files Community

Cub_200_2011_Resnet / app.py

Arekku21

Update app.py

c956a74 verified about 2 years ago

raw

history blame contribute delete

3.89 kB

	import gradio as gr
	import torch
	import numpy as np

	import torch
	import torchvision.models as models
	from torch import nn

	from albumentations import (
	HorizontalFlip, VerticalFlip, IAAPerspective, ShiftScaleRotate, CLAHE, RandomRotate90,
	Transpose, ShiftScaleRotate, Blur, OpticalDistortion, GridDistortion, HueSaturationValue,
	IAAAdditiveGaussianNoise, GaussNoise, MotionBlur, MedianBlur, IAAPiecewiseAffine, RandomResizedCrop,
	IAASharpen, IAAEmboss, RandomBrightnessContrast, Flip, OneOf, Compose, Normalize, Cutout, CoarseDropout, ShiftScaleRotate, CenterCrop, Resize, Rotate,
	ShiftScaleRotate, CenterCrop, Crop, Resize, Rotate, RandomShadow, RandomSizedBBoxSafeCrop,
	ChannelShuffle, MotionBlur,Lambda,SmallestMaxSize
	)

	from albumentations.pytorch import ToTensorV2

	# Your Albumentations transformations
	test_transforms = Compose([
	Resize(224, 224),
	Normalize(mean=(0.485, 0.456, 0.406), std=(0.229, 0.224, 0.225)),
	ToTensorV2(),
	])

	def load_cub200_classes():
	"""
	This function loads the classes from the classes.txt file and returns a dictionary
	"""
	with open("classes.txt", encoding="utf-8") as f:
	classes = f.read().splitlines()

	# convert classes to dictionary separating the lines by the first space
	classes = {int(line.split(" ")[0]) : line.split(" ")[1] for line in classes}

	# return the classes dictionary
	return classes

	def load_model():
	"""
	This function loads the trained model and returns it
	"""
	model = models.resnet50(pretrained=True)

	# Freeze the initial layers up to a certain point (e.g., layer 4)
	freeze_layers = 4
	for idx, (name, param) in enumerate(model.named_parameters()):
	if idx < freeze_layers:
	param.requires_grad = False

	# Replace the final fully connected layer for the new task
	num_ftrs = model.fc.in_features
	model.fc = nn.Linear(num_ftrs, 200)

	# Add dropout layers
	model = nn.Sequential(
	model,
	nn.Dropout(0.8), # Adjust the dropout rate as needed
	nn.Linear(200, 200) # Add additional fully connected layer
	)

	# Load the state dictionary from the file
	state_dict = torch.load("resnet50_7511.pt",map_location=torch.device('cpu'))

	# Load the state dictionary into the model object
	model.load_state_dict(state_dict)

	# # Load actual model
	# model = torch.load("resnet18.pth", map_location=torch.device('cpu'))

	# set the model to evaluation mode
	model.eval()

	# return the model
	return model

	def predict_image(image):
	"""
	This function takes an image as input and returns the class label
	"""
	# load the model
	model = load_model()
	# model.eval()
	# load the classes
	classes = load_cub200_classes()

	# Apply Albumentations transformations
	transformed_image = test_transforms(image=image)['image']

	# Convert the image to a PyTorch tensor
	tensor_image = transformed_image.unsqueeze(0)

	# Make prediction
	with torch.no_grad():
	output = model(tensor_image)

	# Assuming the output is a tensor representing class probabilities
	probabilities = torch.nn.functional.softmax(output[0], dim=0).numpy()

	conf_threshold = 0.8

	# Get the class with the highest probability
	predicted_class = np.argmax(probabilities)

	# If the probability is less than the threshold, return unknown else return the class
	if probabilities[predicted_class] < conf_threshold:
	string_to_return = "Predicted Class: Unknown"

	else:
	# Return the class label
	string_to_return = f"Predicted Class: {classes[predicted_class+1]} with probability: {probabilities[predicted_class] * 100:.2f}%"

	# Return the class label
	return string_to_return

	# create a gradio interface
	gr.Interface(fn=predict_image, inputs="image", outputs="text").launch()