| model_name: vit-b16-224-in21k | |
| optimizer: sgd | |
| lr: 0.01 | |
| betas: | |
| - 0.9 | |
| - 0.999 | |
| momentum: 0.9 | |
| weight_decay: 0.0 | |
| scheduler: cosine | |
| warmup_steps: 500 | |
| n_classes: 10 | |
| mixup_alpha: 0.0 | |
| cutmix_alpha: 0.0 | |
| mix_prob: 1.0 | |
| label_smoothing: 0.0 | |
| image_size: 224 | |
| weights: null | |
| training_mode: full | |
| lora_r: 16 | |
| lora_alpha: 16 | |
| lora_target_modules: | |
| - query | |
| - value | |
| lora_dropout: 0.0 | |
| lora_bias: none | |
| from_scratch: false | |
| dataset: custom | |
| root: data/ | |
| num_classes: 10 | |
| size: 224 | |
| min_scale: 0.08 | |
| max_scale: 1.0 | |
| flip_prob: 0.5 | |
| rand_aug_n: 0 | |
| rand_aug_m: 9 | |
| erase_prob: 0.0 | |
| use_trivial_aug: false | |
| mean: | |
| - 0.5 | |
| - 0.5 | |
| - 0.5 | |
| std: | |
| - 0.5 | |
| - 0.5 | |
| - 0.5 | |
| batch_size: 128 | |
| workers: 8 | |