AbstractPhil committed on
Commit
ad77ff7
·
verified ·
1 Parent(s): b6d45f7

Update trainer.py

Browse files
Files changed (1) hide show
  1. trainer.py +2 -5
trainer.py CHANGED
@@ -16,9 +16,6 @@ from tqdm import tqdm
16
  from torchvision import datasets, transforms
17
  from torch.utils.tensorboard import SummaryWriter
18
 
19
- from tri_stream_vit import (
20
- create_tri_stream_vit, MasteryQueue, SimplexBuffer)
21
-
22
  DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
23
  torch.backends.cuda.matmul.allow_tf32 = True
24
  torch.backends.cudnn.allow_tf32 = True
@@ -170,10 +167,10 @@ print(f" GAL Procrustes: every {GAL_UPDATE_INTERVAL} batches, "
170
  f"lr={GAL_LR}, whiten={USE_WHITENED_PROCRUSTES}")
171
  print(f" Mastery: patience={MASTERY_PATIENCE}, queue adaptive "
172
  f"[{MASTERY_MIN_SIZE}–{MASTERY_MAX_SIZE}]")
173
- print(f" Optimizer: AdamW (wd=0.01)")
174
  print(f"{'='*60}")
175
 
176
- optimizer = torch.optim.AdamW(model.parameters(), lr=LR, weight_decay=0.01)
177
 
178
  total_steps = len(train_loader) * EPOCHS
179
  warmup_steps = len(train_loader) * WARMUP
 
16
  from torchvision import datasets, transforms
17
  from torch.utils.tensorboard import SummaryWriter
18
 
 
 
 
19
  DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
20
  torch.backends.cuda.matmul.allow_tf32 = True
21
  torch.backends.cudnn.allow_tf32 = True
 
167
  f"lr={GAL_LR}, whiten={USE_WHITENED_PROCRUSTES}")
168
  print(f" Mastery: patience={MASTERY_PATIENCE}, queue adaptive "
169
  f"[{MASTERY_MIN_SIZE}–{MASTERY_MAX_SIZE}]")
170
+ print(f" Optimizer: Adam")
171
  print(f"{'='*60}")
172
 
173
+ optimizer = torch.optim.Adam(model.parameters(), lr=LR)
174
 
175
  total_steps = len(train_loader) * EPOCHS
176
  warmup_steps = len(train_loader) * WARMUP