Spaces:

faranbutt789
/

TrafficSignNet

Sleeping

App Files Files Community

TrafficSignNet / app.py

faranbutt789

Update app.py

8663de3 verified 4 months ago

raw

history blame contribute delete

2.69 kB

	import gradio as gr
	import torch
	import torch.nn as nn
	import torchvision.transforms as T
	import cv2
	import numpy as np
	import pandas as pd

	# ----------------------------
	# Load class names
	# ----------------------------
	df = pd.read_csv("signnames.csv")
	df.set_index("ClassId", inplace=True)
	class_ids = df.to_dict()["SignName"]
	id2int = {v: i for i, (k, v) in enumerate(class_ids.items())}
	int2id = {v: k for k, v in id2int.items()}

	# ----------------------------
	# Define Model
	# ----------------------------
	def conv_func(in_channels, out_channels):
	return nn.Sequential(
	nn.Dropout(0.2),
	nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1),
	nn.ReLU(),
	nn.BatchNorm2d(out_channels),
	nn.MaxPool2d(2),
	)

	class RoadSignClassifierModel(nn.Module):
	def __init__(self, num_classes=len(id2int)):
	super().__init__()
	self.model = nn.Sequential(
	conv_func(3, 64),
	conv_func(64, 64),
	conv_func(64, 128),
	conv_func(128, 256),
	nn.Flatten(),
	nn.Linear(256 * 2 * 2, 256),
	nn.Dropout(0.2),
	nn.ReLU(),
	nn.Linear(256, num_classes),
	)

	def forward(self, x):
	return self.model(x)

	# ----------------------------
	# Load trained model
	# ----------------------------
	device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
	model = RoadSignClassifierModel()
	model.load_state_dict(torch.load("traffic_sign_model.pth", map_location=device))
	model = model.to(device)
	model.eval()

	# ----------------------------
	# Preprocessing
	# ----------------------------
	val_tf = T.Compose([
	T.ToPILImage(),
	T.Resize(32),
	T.CenterCrop(32),
	T.ToTensor(),
	T.Normalize(mean=[0.485, 0.456, 0.406],
	std=[0.229, 0.224, 0.225])
	])

	# ----------------------------
	# Prediction Function
	# ----------------------------
	def predict(img):
	# Convert from Gradio (PIL.Image) to OpenCV
	img = np.array(img.convert("RGB"))
	img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
	img_input = val_tf(cv2.cvtColor(img, cv2.COLOR_BGR2RGB)).unsqueeze(0).to(device)

	with torch.no_grad():
	output = model(img_input)
	pred_class = torch.argmax(output, dim=1).item()

	return {class_ids[pred_class]: 1.0}
	# ----------------------------
	# Gradio UI
	# ----------------------------
	demo = gr.Interface(
	fn=predict,
	inputs=gr.Image(type="pil"),
	outputs=gr.Label(num_top_classes=1),
	title="🚦 Traffic Sign Classifier",
	description="Upload a traffic sign image and the model will predict its category."
	)

	if __name__ == "__main__":
	demo.launch()