{
"checkpoint_freq": 1,
"dataloader_num_workers": 0,
"gradient_accumulation_steps": 1,
"keep_checkpoints": -1,
"learning_rate": 0.0001,
"logging_dir": "logs",
"mixed_precision": "bf16",
"model": {
"type": "vlmpar",
"model_name": "google/siglip2-base-patch16-224",
"num_classes_dict": {
"upper_body_color": 11,
"lower_body_color": 11,
"gender": 2,
"bag": 2,
"hat": 2
}
},
"num_train_epochs": 10000,
"optimizer": {
"type": "AdamW",
"lr": 0.0001,
"weight_decay": 0.01
},
"project_dir": "outputs",
"scheduler": {
"type": "LinearLR",
"start_factor": 1.0,
"end_factor": 0.0,
"total_iters": 10000
},
"train_batch_size": 32,
"train_dataset": {
"type": "mivia_par_kd_2025",
"root_dir": "/mnt/dati/homes/zsellam/datasets/par2025",
"split": "training",
"processor": "google/siglip2-base-patch16-224"
},
"val_dataset": {
"type": "mivia_par_kd_2025",
"root_dir": "/mnt/dati/homes/zsellam/datasets/par2025",
"split": "validation",
"processor": "google/siglip2-base-patch16-224"
},
"valid_batch_size": 32,
"warmup_ratio": 0.1,
"weight_decay": 0.01,
"config": "./configs/siglip_par_train_config.py",
"seed": null,
"dtype": null,
"report_to": "tensorboard",
"max_grad_norm": 1.0,
"max_train_steps": null,
"validation_split": 0.25
}