{
  "checkpoint_freq": 1,
  "dataloader_num_workers": 0,
  "gradient_accumulation_steps": 1,
  "keep_checkpoints": -1,
  "learning_rate": 0.0001,
  "logging_dir": "logs",
  "mixed_precision": "bf16",
  "model": {
    "type": "vlmpar",
    "model_name": "google/siglip2-base-patch16-224",
    "num_classes_dict": {
      "upper_body_color": 11,
      "lower_body_color": 11,
      "gender": 2,
      "bag": 2,
      "hat": 2
    }
  },
  "num_train_epochs": 10000,
  "optimizer": {
    "type": "AdamW",
    "lr": 0.0001,
    "weight_decay": 0.01
  },
  "project_dir": "outputs",
  "scheduler": {
    "type": "LinearLR",
    "start_factor": 1.0,
    "end_factor": 0.0,
    "total_iters": 10000
  },
  "train_batch_size": 32,
  "train_dataset": {
    "type": "mivia_par_kd_2025",
    "root_dir": "/mnt/dati/homes/zsellam/datasets/par2025",
    "split": "training",
    "processor": "google/siglip2-base-patch16-224"
  },
  "val_dataset": {
    "type": "mivia_par_kd_2025",
    "root_dir": "/mnt/dati/homes/zsellam/datasets/par2025",
    "split": "validation",
    "processor": "google/siglip2-base-patch16-224"
  },
  "valid_batch_size": 32,
  "warmup_ratio": 0.1,
  "weight_decay": 0.01,
  "config": "./configs/siglip_par_train_config.py",
  "seed": null,
  "dtype": null,
  "report_to": "tensorboard",
  "max_grad_norm": 1.0,
  "max_train_steps": null,
  "validation_split": 0.25
}