|
|
|
|
|
|
|
|
|
|
|
import torch |
|
|
import torch.nn as nn |
|
|
from typing import Dict, Union |
|
|
|
|
|
|
|
|
|
|
|
# Nested label container: outer key (eg. 'labels') -> {label_name: tensor},
# as used by the criterion classes below via labels['labels'][label_name].
LabelDict = Dict[str, Dict[str, Union[torch.IntTensor, torch.FloatTensor]]]
|
|
|
|
|
|
|
|
class RMSELoss(nn.Module): |
|
|
""" |
|
|
Class to calculate RMSE. |
|
|
""" |
|
|
def __init__(self, eps: float = 1e-7) -> None: |
|
|
""" |
|
|
Args: |
|
|
eps (float, optional): value to avoid 0. Defaults to 1e-7. |
|
|
""" |
|
|
super().__init__() |
|
|
self.mse = nn.MSELoss() |
|
|
self.eps = eps |
|
|
|
|
|
def forward(self, yhat: float, y: float) -> torch.FloatTensor: |
|
|
""" |
|
|
Calculate RMSE. |
|
|
|
|
|
Args: |
|
|
yhat (float): prediction value |
|
|
y (float): ground truth value |
|
|
|
|
|
Returns: |
|
|
float: RMSE |
|
|
""" |
|
|
_loss = self.mse(yhat, y) + self.eps |
|
|
return torch.sqrt(_loss) |
|
|
|
|
|
|
|
|
class Regularization: |
|
|
""" |
|
|
Class to calculate regularization loss. |
|
|
|
|
|
Args: |
|
|
object (object): object |
|
|
""" |
|
|
def __init__(self, order: int, weight_decay: float) -> None: |
|
|
""" |
|
|
The initialization of Regularization class. |
|
|
|
|
|
Args: |
|
|
order: (int) norm order number |
|
|
weight_decay: (float) weight decay rate |
|
|
""" |
|
|
super().__init__() |
|
|
self.order = order |
|
|
self.weight_decay = weight_decay |
|
|
|
|
|
def __call__(self, network: nn.Module) -> torch.FloatTensor: |
|
|
"""" |
|
|
Calculates regularization(self.order) loss for network. |
|
|
|
|
|
Args: |
|
|
model: (torch.nn.Module object) |
|
|
|
|
|
Returns: |
|
|
torch.FloatTensor: the regularization(self.order) loss |
|
|
""" |
|
|
reg_loss = 0 |
|
|
for name, w in network.named_parameters(): |
|
|
if 'weight' in name: |
|
|
reg_loss = reg_loss + torch.norm(w, p=self.order) |
|
|
reg_loss = self.weight_decay * reg_loss |
|
|
return reg_loss |
|
|
|
|
|
|
|
|
class NegativeLogLikelihood(nn.Module): |
|
|
""" |
|
|
Class to calculate RMSE. |
|
|
""" |
|
|
def __init__(self, device: torch.device) -> None: |
|
|
""" |
|
|
Args: |
|
|
device (torch.device): device |
|
|
""" |
|
|
super().__init__() |
|
|
self.L2_reg = 0.05 |
|
|
self.reg = Regularization(order=2, weight_decay=self.L2_reg) |
|
|
self.device = device |
|
|
|
|
|
def forward( |
|
|
self, |
|
|
output: torch.FloatTensor, |
|
|
label: torch.IntTensor, |
|
|
periods: torch.FloatTensor, |
|
|
network: nn.Module |
|
|
) -> torch.FloatTensor: |
|
|
""" |
|
|
Calculates Negative Log Likelihood. |
|
|
|
|
|
Args: |
|
|
output (torch.FloatTensor): prediction value, ie risk prediction |
|
|
label (torch.IntTensor): occurrence of event |
|
|
periods (torch.FloatTensor): period |
|
|
network (nn.Network): network |
|
|
|
|
|
Returns: |
|
|
torch.FloatTensor: Negative Log Likelihood |
|
|
""" |
|
|
mask = torch.ones(periods.shape[0], periods.shape[0]).to(self.device) |
|
|
mask[(periods.T - periods) > 0] = 0 |
|
|
|
|
|
_loss = torch.exp(output) * mask |
|
|
|
|
|
_loss = torch.sum(_loss, dim=0) / torch.sum(mask, dim=0) |
|
|
_loss = torch.log(_loss).reshape(-1, 1) |
|
|
num_occurs = torch.sum(label) |
|
|
|
|
|
if num_occurs.item() == 0.0: |
|
|
loss = torch.tensor([1e-7], requires_grad=True).to(self.device) |
|
|
return loss |
|
|
else: |
|
|
neg_log_loss = -torch.sum((output - _loss) * label) / num_occurs |
|
|
l2_loss = self.reg(network) |
|
|
loss = neg_log_loss + l2_loss |
|
|
return loss |
|
|
|
|
|
|
|
|
class ClsCriterion: |
|
|
""" |
|
|
Class of criterion for classification. |
|
|
""" |
|
|
def __init__(self, device: torch.device = None) -> None: |
|
|
""" |
|
|
Set CrossEntropyLoss. |
|
|
|
|
|
Args: |
|
|
device (torch.device): device |
|
|
""" |
|
|
self.device = device |
|
|
self.criterion = nn.CrossEntropyLoss() |
|
|
|
|
|
def __call__( |
|
|
self, |
|
|
outputs: Dict[str, torch.FloatTensor], |
|
|
labels: Dict[str, LabelDict] |
|
|
) -> Dict[str, torch.FloatTensor]: |
|
|
""" |
|
|
Calculate loss. |
|
|
|
|
|
Args: |
|
|
outputs (Dict[str, torch.FloatTensor], optional): output |
|
|
labels (Dict[str, LabelDict]): labels |
|
|
|
|
|
Returns: |
|
|
Dict[str, torch.FloatTensor]: loss for each label and their total loss |
|
|
|
|
|
# No reshape and no cast: |
|
|
output: [64, 2]: torch.float32 |
|
|
label: [64] : torch.int64 |
|
|
label.dtype should be torch.int64, otherwise nn.CrossEntropyLoss() causes error. |
|
|
|
|
|
eg. |
|
|
outputs = {'label_A': [[0.8, 0.2], ...] 'label_B': [[0.7, 0.3]], ...} |
|
|
labels = { 'labels': {'label_A: 1: [1, 1, 0, ...], 'label_B': [0, 0, 1, ...], ...} } |
|
|
|
|
|
-> losses = {total: loss_total, label_A: loss_A, label_B: loss_B, ... } |
|
|
""" |
|
|
_labels = labels['labels'] |
|
|
|
|
|
|
|
|
losses = dict() |
|
|
losses['total'] = torch.tensor([0.0], requires_grad=True).to(self.device) |
|
|
for label_name in labels['labels'].keys(): |
|
|
_output = outputs[label_name] |
|
|
_label = _labels[label_name] |
|
|
_label_loss = self.criterion(_output, _label) |
|
|
losses[label_name] = _label_loss |
|
|
losses['total'] = torch.add(losses['total'], _label_loss) |
|
|
return losses |
|
|
|
|
|
|
|
|
class RegCriterion: |
|
|
""" |
|
|
Class of criterion for regression. |
|
|
""" |
|
|
def __init__(self, criterion_name: str = None, device: torch.device = None) -> None: |
|
|
""" |
|
|
Set MSE, RMSE or MAE. |
|
|
|
|
|
Args: |
|
|
criterion_name (str): 'MSE', 'RMSE', or 'MAE' |
|
|
device (torch.device): device |
|
|
""" |
|
|
self.device = device |
|
|
|
|
|
if criterion_name == 'MSE': |
|
|
self.criterion = nn.MSELoss() |
|
|
elif criterion_name == 'RMSE': |
|
|
self.criterion = RMSELoss() |
|
|
elif criterion_name == 'MAE': |
|
|
self.criterion = nn.L1Loss() |
|
|
else: |
|
|
raise ValueError(f"Invalid criterion for regression: {criterion_name}.") |
|
|
|
|
|
def __call__( |
|
|
self, |
|
|
outputs: Dict[str, torch.FloatTensor], |
|
|
labels: Dict[str, LabelDict] |
|
|
) -> Dict[str, torch.FloatTensor]: |
|
|
""" |
|
|
Calculate loss. |
|
|
|
|
|
Args: |
|
|
Args: |
|
|
outputs (Dict[str, torch.FloatTensor], optional): output |
|
|
labels (Dict[str, LabelDict]): labels |
|
|
|
|
|
Returns: |
|
|
Dict[str, torch.FloatTensor]: loss for each label and their total loss |
|
|
|
|
|
# Reshape and cast |
|
|
output: [64, 1] -> [64]: torch.float32 |
|
|
label: [64]: torch.float64 -> torch.float32 |
|
|
# label.dtype should be torch.float32, otherwise cannot backward. |
|
|
|
|
|
eg. |
|
|
outputs = {'label_A': [[10.8], ...] 'label_B': [[15.7]], ...} |
|
|
labels = {'labels': {'label_A: 1: [10, 9, ...], 'label_B': [12, 17,], ...}} |
|
|
-> losses = {total: loss_total, label_A: loss_A, label_B: loss_B, ... } |
|
|
""" |
|
|
_outputs = {label_name: _output.squeeze() for label_name, _output in outputs.items()} |
|
|
_labels = {label_name: _label.to(torch.float32) for label_name, _label in labels['labels'].items()} |
|
|
|
|
|
|
|
|
losses = dict() |
|
|
losses['total'] = torch.tensor([0.0], requires_grad=True).to(self.device) |
|
|
for label_name in labels['labels'].keys(): |
|
|
_output = _outputs[label_name] |
|
|
_label = _labels[label_name] |
|
|
_label_loss = self.criterion(_output, _label) |
|
|
losses[label_name] = _label_loss |
|
|
losses['total'] = torch.add(losses['total'], _label_loss) |
|
|
return losses |
|
|
|
|
|
|
|
|
class DeepSurvCriterion: |
|
|
""" |
|
|
Class of criterion for deepsurv. |
|
|
""" |
|
|
def __init__(self, device: torch.device = None) -> None: |
|
|
""" |
|
|
Set NegativeLogLikelihood. |
|
|
|
|
|
Args: |
|
|
device (torch.device, optional): device |
|
|
""" |
|
|
self.device = device |
|
|
self.criterion = NegativeLogLikelihood(self.device).to(self.device) |
|
|
|
|
|
def __call__( |
|
|
self, |
|
|
outputs: Dict[str, torch.FloatTensor], |
|
|
labels: Dict[str, Union[LabelDict, torch.IntTensor, nn.Module]] |
|
|
) -> Dict[str, torch.FloatTensor]: |
|
|
""" |
|
|
Calculate loss. |
|
|
|
|
|
Args: |
|
|
outputs (Dict[str, torch.FloatTensor], optional): output |
|
|
labels (Dict[str, Union[LabelDict, torch.IntTensor, nn.Module]]): labels, periods, and network |
|
|
|
|
|
Returns: |
|
|
Dict[str, torch.FloatTensor]: loss for each label and their total loss |
|
|
|
|
|
# Reshape and no cast |
|
|
output: [64, 1]: torch.float32 |
|
|
label: [64] -> [64, 1]: torch.int64 |
|
|
period: [64] -> [64, 1]: torch.float32 |
|
|
|
|
|
eg. |
|
|
outputs = {'label_A': [[10.8], ...] 'label_B': [[15.7]], ...} |
|
|
labels = { |
|
|
'labels': {'label_A: 1: [1, 0, 1, ...] }, |
|
|
'periods': [5, 10, 7, ...], |
|
|
'network': network |
|
|
} |
|
|
-> losses = {total: loss_total, label_A: loss_A, label_B: loss_B, ... } |
|
|
""" |
|
|
_labels = {label_name: _label.reshape(-1, 1) for label_name, _label in labels['labels'].items()} |
|
|
_periods = labels['periods'].reshape(-1, 1) |
|
|
_network = labels['network'] |
|
|
|
|
|
|
|
|
losses = dict() |
|
|
losses['total'] = torch.tensor([0.0], requires_grad=True).to(self.device) |
|
|
for label_name in labels['labels'].keys(): |
|
|
_output = outputs[label_name] |
|
|
_label = _labels[label_name] |
|
|
_label_loss = self.criterion(_output, _label, _periods, _network) |
|
|
losses[label_name] = _label_loss |
|
|
losses['total'] = torch.add(losses['total'], _label_loss) |
|
|
return losses |
|
|
|
|
|
|
|
|
def set_criterion( |
|
|
criterion_name: str, |
|
|
device: torch.device |
|
|
) -> Union[ClsCriterion, RegCriterion, DeepSurvCriterion]: |
|
|
""" |
|
|
Return criterion class |
|
|
|
|
|
Args: |
|
|
criterion_name (str): criterion name |
|
|
device (torch.device): device |
|
|
|
|
|
Returns: |
|
|
Union[ClsCriterion, RegCriterion, DeepSurvCriterion]: criterion class |
|
|
""" |
|
|
|
|
|
if criterion_name == 'CEL': |
|
|
return ClsCriterion(device=device) |
|
|
|
|
|
elif criterion_name in ['MSE', 'RMSE', 'MAE']: |
|
|
return RegCriterion(criterion_name=criterion_name, device=device) |
|
|
|
|
|
elif criterion_name == 'NLL': |
|
|
return DeepSurvCriterion(device=device) |
|
|
|
|
|
else: |
|
|
raise ValueError(f"Invalid criterion: {criterion_name}.") |
|
|
|