Spaces:

ma4389
/

Car_Classification_Brands

Sleeping

App Files Files Community

Car_Classification_Brands / app.py

ma4389

Update app.py

f726feb verified 6 months ago

raw

history blame contribute delete

2.95 kB

	import torch
	import torch.nn as nn
	import torchvision.models as models
	import torchvision.transforms as transforms
	from PIL import Image
	import gradio as gr

	# --------------------
	# Class Mapping
	# --------------------
	class_to_idx = {
	'Acura': 0, 'Alfa Romeo': 1, 'Aston Martin': 2, 'Audi': 3, 'BMW': 4,
	'Bentley': 5, 'Bugatti': 6, 'Buick': 7, 'Cadillac': 8, 'Chevrolet': 9,
	'Chrysler': 10, 'Citroen': 11, 'Daewoo': 12, 'Dodge': 13, 'Ferrari': 14,
	'Fiat': 15, 'Ford': 16, 'GMC': 17, 'Genesis': 18, 'Honda': 19,
	'Hudson': 20, 'Hyundai': 21, 'Infiniti': 22, 'Jaguar': 23, 'Jeep': 24,
	'Kia': 25, 'Land Rover': 26, 'Lexus': 27, 'Lincoln': 28, 'MG': 29,
	'Maserati': 30, 'Mazda': 31, 'Mercedes-Benz': 32, 'Mini': 33,
	'Mitsubishi': 34, 'Nissan': 35, 'Oldsmobile': 36, 'Peugeot': 37,
	'Pontiac': 38, 'Porsche': 39, 'Ram Trucks': 40, 'Renault': 41,
	'Saab': 42, 'Studebaker': 43, 'Subaru': 44, 'Suzuki': 45, 'Tesla': 46,
	'Toyota': 47, 'Volkswagen': 48, 'Volvo': 49
	}
	idx_to_class = {v: k for k, v in class_to_idx.items()}

	# --------------------
	# Image Transform
	# --------------------
	transform = transforms.Compose([
	transforms.Lambda(lambda x: x.convert("RGB")),
	transforms.Resize((224,224)),
	transforms.RandomHorizontalFlip(p=0.5),
	transforms.RandomVerticalFlip(p=0.2),
	transforms.RandomRotation(20),
	transforms.ColorJitter(brightness=0.3, contrast=0.3, saturation=0.3),
	transforms.RandomResizedCrop(224, scale=(0.7, 1.0)),
	transforms.ToTensor(),
	transforms.Normalize([0.5]3, [0.5]3)
	])

	# --------------------
	# Load Model
	# --------------------
	device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

	# Load pretrained ResNet50 correctly
	base_model = models.resnet50(weights=models.ResNet50_Weights.DEFAULT)

	# Replace final fully connected layer (your head)
	in_features = base_model.fc.in_features # 2048 for ResNet50
	base_model.fc = nn.Sequential(
	nn.Linear(in_features, 512),
	nn.ReLU(),
	nn.Dropout(0.5),
	nn.Linear(512, 50) # 50 classes
	)

	# Load state dict
	state_dict = torch.load("best_model.pth", map_location=device)
	base_model.load_state_dict(state_dict)
	base_model = base_model.to(device)
	base_model.eval()

	# --------------------
	# Prediction Function
	# --------------------
	def predict(img):
	img = transform(img).unsqueeze(0).to(device)

	with torch.no_grad():
	outputs = base_model(img)
	probs = torch.softmax(outputs, dim=1)[0]

	top5_prob, top5_idx = torch.topk(probs, 5)
	result = {idx_to_class[idx.item()]: float(top5_prob[i]) for i, idx in enumerate(top5_idx)}
	return result

	# --------------------
	# Gradio UI
	# --------------------
	demo = gr.Interface(
	fn=predict,
	inputs=gr.Image(type="pil"),
	outputs=gr.Label(num_top_classes=5),
	title="Car Brand Classifier",
	description="Upload a car image to predict its brand."
	)

	if __name__ == "__main__":
	demo.launch()