| arch: mambar_base_patch16_224 | |
| batch_size_per_gpu: 64 | |
| clip_grad: 3.0 | |
| drop_path_rate: 0.1 | |
| epochs: 400 | |
| freeze_last_layer: 3 | |
| global_crops_scale: (0.25, 1.0) | |
| gpu: 0 | |
| local_crops_number: 10 | |
| local_crops_scale: (0.05, 0.25) | |
| local_rank: 0 | |
| lr: 0.00075 | |
| min_lr: 1e-06 | |
| momentum_teacher: 0.996 | |
| ngpus: 8 | |
| nodes: 2 | |
| norm_last_layer: True | |
| num_workers: 10 | |
| optimizer: adamw | |
| out_dim: 65536 | |
| patch_size: 16 | |
| rank: 0 | |
| saveckp_freq: 5 | |
| seed: 0 | |
| teacher_temp: 0.07 | |
| use_bn_in_head: False | |
| use_fp16: True | |
| use_volta32: False | |
| warmup_epochs: 10 | |
| warmup_teacher_temp: 0.04 | |
| warmup_teacher_temp_epochs: 50 | |
| weight_decay: 0.04 | |
| weight_decay_end: 0.4 | |
| world_size: 16 | |