# Training configuration for the run named 'clsclip_test'
# (model 'CLS-ViT-L-16', webdataset input, bfloat16 AMP).
# Keys are consumed by the training script; the notes marked NOTE(review)
# flag settings whose intent cannot be confirmed from this file alone.

save_frequency: 1
name: 'clsclip_test'

# Shard pattern uses brace-range expansion over the .tar files.
train_data: '/datasets/datacomp_1b/data/{00000..140089}.tar'  # please modify to your own path
# Written without digit-group underscores so that YAML 1.2 parsers also
# read it as an integer (1.28 billion samples).
train_num_samples: 1280000000
dataset_type: webdataset

precision: 'amp_bfloat16'
warmup: 10000
global_batch_size: 8000
# NOTE(review): 0 here alongside global_batch_size presumably means the
# per-device batch size is derived from the global one - confirm in the
# training script.
batch_size: 0
epochs: 10

# Optimizer hyper-parameters.
lr: 1.0e-3
beta1: 0.9
beta2: 0.95
eps: 1.0e-6

workers: 6
model: 'CLS-ViT-L-16'
seed: 0

ddp_static_graph: true
local_loss: true
gather_with_grad: true
force_image_size: 224
grad_checkpointing: true
coca_caption_loss_weight: 0.5

logs: './logs'
imagenet_val: './imagenet1k/val'  # please modify to your own path
report_to: 'tensorboard'
log_every_n_steps: 32

# Step-based evaluation / checkpoint cadence; all three share the same
# interval (3052 steps).
zeroshot_steps: 3052
val_steps: 3052
save_every_n_steps: 3052
delete_prev_step_ckpt: true

# Image augmentation settings.
aug_cfg:
  scale: [0.4, 1.0]
  color_jitter: [0.32, 0.32, 0.32, 0.08]
  color_jitter_prob: 0.8
  gray_scale_prob: 0.2

# NOTE(review): both zeroshot_frequency and zeroshot_steps (and likewise
# save_frequency and save_every_n_steps) are set - confirm how the training
# script combines the two cadences.
zeroshot_frequency: 1
resume: 'latest'