Spaces:
Sleeping
Sleeping
| # from pix2pix | |
| import os | |
| import torch | |
| import torch.nn as nn | |
| from torch.nn import init | |
| class BaseModel(nn.Module): | |
| def __init__(self, opt): | |
| super(BaseModel, self).__init__() | |
| self.opt = opt | |
| self.total_steps = 0 | |
| self.isTrain = opt.isTrain | |
| self.save_dir = os.path.join(opt.checkpoints_dir, opt.name) | |
| self.device = ( | |
| torch.device('cuda:{}'.format(opt.gpu_ids[0])) | |
| if opt.gpu_ids | |
| else torch.device('cpu') | |
| ) | |
| def save_networks(self, epoch): | |
| save_filename = 'model_epoch_%s.pth' % epoch | |
| save_path = os.path.join(self.save_dir, save_filename) | |
| # serialize model and optimizer to dict | |
| state_dict = { | |
| 'model': self.model.state_dict(), | |
| 'optimizer': self.optimizer.state_dict(), | |
| 'total_steps': self.total_steps, | |
| } | |
| torch.save(state_dict, save_path) | |
| # load models from the disk | |
| def load_networks(self, epoch): | |
| load_filename = 'model_epoch_%s.pth' % epoch | |
| load_path = os.path.join(self.save_dir, load_filename) | |
| print('loading the model from %s' % load_path) | |
| # if you are using PyTorch newer than 0.4 (e.g., built from | |
| # GitHub source), you can remove str() on self.device | |
| state_dict = torch.load(load_path, map_location=self.device) | |
| if hasattr(state_dict, '_metadata'): | |
| del state_dict._metadata | |
| self.model.load_state_dict(state_dict['model']) | |
| self.total_steps = state_dict['total_steps'] | |
| if self.isTrain and not self.opt.new_optim: | |
| self.optimizer.load_state_dict(state_dict['optimizer']) | |
| ### move optimizer state to GPU | |
| for state in self.optimizer.state.values(): | |
| for k, v in state.items(): | |
| if torch.is_tensor(v): | |
| state[k] = v.to(self.device) | |
| for g in self.optimizer.param_groups: | |
| g['lr'] = self.opt.lr | |
| def eval(self): | |
| self.model.eval() | |
| def test(self): | |
| with torch.no_grad(): | |
| self.forward() | |
| def init_weights(net, init_type='normal', gain=0.02): | |
| def init_func(m): | |
| classname = m.__class__.__name__ | |
| if hasattr(m, 'weight') and ( | |
| classname.find('Conv') != -1 or classname.find('Linear') != -1 | |
| ): | |
| if init_type == 'normal': | |
| init.normal_(m.weight.data, 0.0, gain) | |
| elif init_type == 'xavier': | |
| init.xavier_normal_(m.weight.data, gain=gain) | |
| elif init_type == 'kaiming': | |
| init.kaiming_normal_(m.weight.data, a=0, mode='fan_in') | |
| elif init_type == 'orthogonal': | |
| init.orthogonal_(m.weight.data, gain=gain) | |
| else: | |
| raise NotImplementedError( | |
| 'initialization method [%s] is not implemented' % init_type | |
| ) | |
| if hasattr(m, 'bias') and m.bias is not None: | |
| init.constant_(m.bias.data, 0.0) | |
| elif classname.find('BatchNorm2d') != -1: | |
| init.normal_(m.weight.data, 1.0, gain) | |
| init.constant_(m.bias.data, 0.0) | |
| print('initialize network with %s' % init_type) | |
| net.apply(init_func) | |