AbstractPhil committed on
Commit
8a272c4
·
verified ·
1 Parent(s): b06cd14

Upload runs/cifar100_weighted_ADAMW_WarmRestart_20251119_200313/config.yaml with huggingface_hub

Browse files
runs/cifar100_weighted_ADAMW_WarmRestart_20251119_200313/config.yaml ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adamw_betas:
2
+ - 0.9
3
+ - 0.999
4
+ adamw_eps: 1.0e-08
5
+ batch_size: 128
6
+ beatrix_tau: 0.25
7
+ checkpoint_upload_interval: 25
8
+ cutout_length: 16
9
+ dataset: cifar100
10
+ device: cuda
11
+ drop_path_rate: 0.1
12
+ dropout: 0.1
13
+ embed_dim: 512
14
+ fusion_mode: weighted
15
+ fusion_window: 32
16
+ grad_clip: 1.0
17
+ hf_repo_name: vit-beans-v3
18
+ hf_token: null
19
+ hf_username: AbstractPhil
20
+ image_size: 32
21
+ k_simplex: 4
22
+ label_smoothing: 0.1
23
+ learning_rate: 0.0003
24
+ log_interval: 50
25
+ lr_gamma: 0.2
26
+ lr_milestones:
27
+ - 60
28
+ - 120
29
+ - 160
30
+ min_lr: 1.0e-07
31
+ model_name: vit-beans-v3
32
+ num_classes: 100
33
+ num_epochs: 300
34
+ num_fusion_blocks: 6
35
+ num_heads: 8
36
+ num_workers: 4
37
+ optimizer_type: adamw
38
+ patch_size: 4
39
+ precompute_geometric: true
40
+ restart_mult: 2
41
+ restart_period: 20
42
+ run_name: cifar100_weighted_ADAMW_WarmRestart_20251119_200313
43
+ save_interval: 10
44
+ scheduler_type: cosine_restarts
45
+ seed: 42
46
+ sgd_momentum: 0.9
47
+ sgd_nesterov: true
48
+ upload_to_hf: true
49
+ use_augmentation: true
50
+ use_autoaugment: true
51
+ use_beatrix: true
52
+ use_cutout: false
53
+ use_mixed_precision: false
54
+ use_torch_compile: true
55
+ warmup_epochs: 10
56
+ weight_decay: 0.05
57
+ weights_dir: weights