import os
import copy

import torch
import torch.nn as nn


class EMA:
    """
    Exponential moving average (EMA) of a model's weights.
    Modified version of class fairseq.models.ema.EMAModule.

    Args:
        model (nn.Module): Model whose weights are tracked by the EMA copy.
        skip_keys (list): The keys to skip assigning averaged weights to.
    """

    def __init__(self, model: nn.Module, skip_keys=None):
        # Keep a frozen copy of the model; its weights hold the moving average.
        self.model = self.deepcopy_model(model)
        self.model.requires_grad_(False)

        self.device = 'cpu'
        self.model.to(self.device)
        self.skip_keys = skip_keys or set()
        self.decay = 0.999
        self.num_updates = 0

    @staticmethod
    def deepcopy_model(model):
        try:
            return copy.deepcopy(model)
        except RuntimeError:
            # Fall back to round-tripping through disk when deepcopy fails.
            tmp_path = 'tmp_model_for_ema_deepcopy.pt'
            torch.save(model, tmp_path)
            model = torch.load(tmp_path)
            os.remove(tmp_path)
            return model

    def step(self, new_model: nn.Module):
        """
        One EMA step.

        Args:
            new_model (nn.Module): Online model to fetch new weights from.
        """
        ema_state_dict = {}
        ema_params = self.model.state_dict()
        for key, param in new_model.state_dict().items():
            ema_param = ema_params[key].float()
            if key in self.skip_keys:
                # Skipped keys take the online weights directly.
                ema_param = param.to(dtype=ema_param.dtype).clone()
            else:
                # ema = decay * ema + (1 - decay) * param
                ema_param.mul_(self.decay)
                ema_param.add_(param.to(dtype=ema_param.dtype), alpha=1 - self.decay)
            ema_state_dict[key] = ema_param
        self.model.load_state_dict(ema_state_dict, strict=False)
        self.num_updates += 1

    def restore(self, model: nn.Module):
        """Copy the averaged weights into the given model and return it."""
        d = self.model.state_dict()
        model.load_state_dict(d, strict=False)
        return model

    def state_dict(self):
        return self.model.state_dict()

    @staticmethod
    def get_annealed_rate(start, end, curr_step, total_steps):
        """
        Calculate the EMA decay rate, annealed linearly from start
        at step 0 to end at total_steps.
        """
        r = end - start
        pct_remaining = 1 - curr_step / total_steps
        return end - r * pct_remaining
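

# A minimal usage sketch (not part of the original module): how this EMA class
# is typically driven from a training loop, with the decay annealed via
# get_annealed_rate. The model and step counts below are hypothetical
# placeholders.
if __name__ == '__main__':
    online_model = nn.Linear(4, 2)  # stand-in for a real model
    ema = EMA(online_model)

    total_steps = 10
    for step in range(total_steps):
        # ... forward/backward/optimizer.step() on online_model would go here ...

        # Anneal the decay from 0.9 up to 0.999 over the course of training.
        ema.decay = EMA.get_annealed_rate(0.9, 0.999, step, total_steps)
        ema.step(online_model)

    # Copy the averaged weights back into a fresh model for evaluation.
    eval_model = ema.restore(copy.deepcopy(online_model))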