Spaces:

LittleMonkeyLab
/

totes-emosh

Sleeping

drdeception

feat: six-emotion replication challenge — totes-emosh EmotionMap build

0d27c43 25 days ago

1.88 kB

	"""
	File: model.py
	Author: Dr. Gordon Wright
	Description: Loads the static ResNet50 face-emotion classifier and sets up
	Grad-CAM. The dynamic LSTM model has been moved to the
	separate video app and is no longer loaded here.
	License: MIT License
	"""

	import torch
	import requests
	from PIL import Image
	from torchvision import transforms
	from pytorch_grad_cam import GradCAM

	from app.config import config_data
	from app.model_architectures import ResNet50


	def load_model(model_url, model_path):
	    """Download a model checkpoint from ``model_url`` and store it at ``model_path``.

	    The response is streamed in 8 KiB chunks into a temporary sibling file
	    (``<model_path>.part``) which is moved over ``model_path`` only after the
	    whole download succeeded, so a failed or interrupted download never leaves
	    a truncated file (or an HTTP error page) where the checkpoint is expected.

	    Args:
	        model_url: HTTP(S) URL of the checkpoint file.
	        model_path: Destination path on local disk.

	    Returns:
	        ``model_path`` on success; ``None`` if the request or the file write
	        failed (the error is printed).
	    """
	    import os  # local import so this block does not depend on the file header

	    partial_path = f"{model_path}.part"
	    try:
	        # (connect, read) timeouts: a stalled server must not hang start-up forever.
	        with requests.get(model_url, stream=True, timeout=(10, 60)) as response:
	            # Fail on 4xx/5xx instead of saving the error body as if it were weights.
	            response.raise_for_status()
	            with open(partial_path, "wb") as file:
	                for chunk in response.iter_content(chunk_size=8192):
	                    file.write(chunk)
	        # Publish the finished download in one step.
	        os.replace(partial_path, model_path)
	    except (requests.RequestException, OSError) as e:
	        print(f"Error loading model: {e}")
	        try:
	            os.remove(partial_path)
	        except OSError:
	            # Nothing to clean up (the partial file was never created or is already gone).
	            pass
	        return None
	    return model_path


	# Fetch the static-model checkpoint configured in config_data.
	path_static = load_model(config_data.model_static_url, config_data.model_static_path)
	if path_static is None:
	    # load_model() returns None when the download failed; stop with a clear
	    # message instead of letting torch.load(None) fail with an obscure error.
	    raise RuntimeError("Static model checkpoint could not be downloaded")

	# NOTE(review): 7 is presumably the number of output classes — confirm against
	# app.model_architectures.ResNet50.
	pth_model_static = ResNet50(7, channels=3)
	# map_location="cpu" lets a checkpoint saved from a GPU load on a CPU-only host;
	# load_state_dict copies the values into the freshly built model's own parameters.
	# NOTE(review): torch.load unpickles a file downloaded from the network — consider
	# weights_only=True if the minimum supported torch version allows it.
	pth_model_static.load_state_dict(torch.load(path_static, map_location="cpu"))
	pth_model_static.eval()  # inference mode

	# Grad-CAM is attached to the model's layer4.
	target_layers = [pth_model_static.layer4]
	cam = GradCAM(model=pth_model_static, target_layers=target_layers)


	# Constants subtracted from channels 0, 1, 2 *after* the channel axis is reversed.
	# NOTE(review): presumably per-channel (B, G, R) training-set means — confirm.
	_CHANNEL_OFFSETS = (91.4953, 103.8827, 131.0912)


	class _PreprocessInput(torch.nn.Module):
	    """Turn a (C, H, W) image tensor into the float layout fed to the model."""

	    def forward(self, x):
	        x = x.to(torch.float32)
	        # Reverse the channel axis (RGB -> BGR for RGB input). torch.flip returns
	        # a new tensor, so the in-place subtraction below never touches the input.
	        x = torch.flip(x, dims=(0,))
	        for channel, offset in enumerate(_CHANNEL_OFFSETS):
	            x[channel, :, :] -= offset
	        return x


	# Built once at import time instead of on every call.
	_TO_MODEL_INPUT = transforms.Compose([transforms.PILToTensor(), _PreprocessInput()])


	def pth_processing(fp, target_size=(224, 224)):
	    """Convert a PIL image into a batched input tensor for the static model.

	    Args:
	        fp: A ``PIL.Image.Image``. Images that are not in RGB mode (grayscale,
	            RGBA, palette, ...) are converted to RGB first so that exactly three
	            channels reach the per-channel offset subtraction.
	        target_size: ``(width, height)`` the image is resized to with
	            nearest-neighbour resampling. Defaults to ``(224, 224)``.

	    Returns:
	        A ``torch.float32`` tensor of shape ``(1, 3, height, width)`` with the
	        channel order reversed and the per-channel offsets subtracted.
	    """
	    img = fp if fp.mode == "RGB" else fp.convert("RGB")
	    img = img.resize(target_size, Image.Resampling.NEAREST)
	    # Add the leading batch dimension expected by the model.
	    return torch.unsqueeze(_TO_MODEL_INPUT(img), 0)