TheKernel01's picture
Sync from GitHub via hub-sync
0788e19 verified
import functools
import torch
import torch.nn as nn
from models.clip_models import CLIPModel
from networks.base_model import BaseModel, init_weights
class Trainer(BaseModel):
def name(self):
return 'Trainer'
def __init__(self, opt):
super(Trainer, self).__init__(opt)
if self.isTrain and not opt.continue_train:
self.model = CLIPModel()
if not self.isTrain or opt.continue_train:
self.model = CLIPModel()
params = []
for name, p in self.model.named_parameters():
if name == "fc.weight" or name == "fc.bias":
params.append(p)
else:
p.requires_grad = False
if self.isTrain:
self.loss_fn = nn.BCEWithLogitsLoss()
# initialize optimizers
if opt.optim == 'adam':
self.optimizer = torch.optim.Adam(filter(lambda p: p.requires_grad, self.model.parameters()),
lr=opt.lr, betas=(opt.beta1, 0.999))
elif opt.optim == 'sgd':
self.optimizer = torch.optim.SGD(filter(lambda p: p.requires_grad, self.model.parameters()),
lr=opt.lr, momentum=0.0, weight_decay=0)
else:
raise ValueError("optim should be [adam, sgd]")
if not self.isTrain or opt.continue_train:
self.load_networks(opt.epoch)
self.model.to(opt.gpu_ids[0])
def adjust_learning_rate(self, min_lr=1e-6):
for param_group in self.optimizer.param_groups:
param_group['lr'] *= 0.9
if param_group['lr'] < min_lr:
return False
self.lr = param_group['lr']
print('*'*25)
print(f'Changing lr from {param_group["lr"]/0.9} to {param_group["lr"]}')
print('*'*25)
return True
def set_input(self, input):
self.input = input[0].to(self.device)
self.label = input[1].to(self.device).float()
def forward(self):
self.output = self.model(self.input)
def get_loss(self):
return self.loss_fn(self.output.squeeze(1), self.label)
def optimize_parameters(self):
self.forward()
self.loss = self.loss_fn(self.output.squeeze(1), self.label)
self.optimizer.zero_grad()
self.loss.backward()
self.optimizer.step()