VLM-PAR / config.json
Bekhouche's picture
Upload folder using huggingface_hub
ff30837 verified
{
"checkpoint_freq": 1,
"dataloader_num_workers": 0,
"gradient_accumulation_steps": 1,
"keep_checkpoints": -1,
"learning_rate": 0.0001,
"logging_dir": "logs",
"mixed_precision": "bf16",
"model": {
"type": "vlmpar",
"model_name": "google/siglip2-base-patch16-224",
"num_classes_dict": {
"upper_body_color": 11,
"lower_body_color": 11,
"gender": 2,
"bag": 2,
"hat": 2
}
},
"num_train_epochs": 10000,
"optimizer": {
"type": "AdamW",
"lr": 0.0001,
"weight_decay": 0.01
},
"project_dir": "outputs",
"scheduler": {
"type": "LinearLR",
"start_factor": 1.0,
"end_factor": 0.0,
"total_iters": 10000
},
"train_batch_size": 32,
"train_dataset": {
"type": "mivia_par_kd_2025",
"root_dir": "/mnt/dati/homes/zsellam/datasets/par2025",
"split": "training",
"processor": "google/siglip2-base-patch16-224"
},
"val_dataset": {
"type": "mivia_par_kd_2025",
"root_dir": "/mnt/dati/homes/zsellam/datasets/par2025",
"split": "validation",
"processor": "google/siglip2-base-patch16-224"
},
"valid_batch_size": 32,
"warmup_ratio": 0.1,
"weight_decay": 0.01,
"config": "./configs/siglip_par_train_config.py",
"seed": null,
"dtype": null,
"report_to": "tensorboard",
"max_grad_norm": 1.0,
"max_train_steps": null,
"validation_split": 0.25
}