File size: 1,441 Bytes
0b0baee
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
{
  "adamw_lr": null,
  "adamw_weight_decay": null,
  "autoencoder_rae_pretrained_name": "nyu-visionx/RAE-dinov2-wReg-base-ViTXL-n08",
  "batch_size": 128,
  "checkpoint_dir": "checkpoints/train_2026-05-06_14-11-11",
  "checkpoint_every": 2000,
  "cls_register_loss_weight": 0.1,
  "decoder_head_dim": 64,
  "decoder_intermediate_size": 3072,
  "decoder_num_heads": 12,
  "decoder_num_layers": 8,
  "decoder_pos_embed_side": 16,
  "disable_wandb": false,
  "dropout": 0.1,
  "grad_accum_steps": 1,
  "image_size": 224,
  "log_every": 10,
  "lr": 0.0001,
  "max_grad_norm": 1.0,
  "max_steps": 50000,
  "mixed_precision": "bf16",
  "mixture_name": "default",
  "muon_lr": null,
  "muon_weight_decay": null,
  "num_proc": 16,
  "num_shards": null,
  "num_vis": 16,
  "num_workers": 4,
  "pretrained_backbone_name": "facebook/dinov2-with-registers-base",
  "pretrained_path": null,
  "recon_loss_weight": 1.0,
  "redistributor_latent_size": 64,
  "refiner_head_dim": 64,
  "refiner_intermediate_size": 3072,
  "refiner_num_heads": 12,
  "refiner_num_layers": 12,
  "resume": "checkpoints/train_2026-05-06_12-27-28/step_14000",
  "seed": 43,
  "shuffle_buffer": 10000,
  "steps_per_epoch": null,
  "train_encoder": true,
  "uncertainty_loss_weight": 0.001,
  "use_muon": true,
  "val_every": 500,
  "val_steps": 100,
  "wandb_mode": null,
  "wandb_project": "finevit-ae",
  "wandb_run_name": null,
  "warmup_steps": 500,
  "weight_decay": 0.01
}