| accum_freq: 1 | |
| aug_cfg: {} | |
| batch_size: 32 | |
| beta1: 0.9 | |
| beta2: 0.999 | |
| cache_dir: None | |
| checkpoint_path: ./logs/2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16/checkpoints | |
| coca_caption_loss_weight: 2.0 | |
| coca_contrastive_loss_weight: 1.0 | |
| copy_codebase: False | |
| csv_caption_key: title | |
| csv_img_key: filepath | |
| csv_separator: | |
| dataset_resampled: False | |
| dataset_type: hf | |
| ddp_static_graph: False | |
| debug: False | |
| delete_previous_checkpoint: False | |
| device: cuda | |
| dist_backend: None | |
| dist_url: None | |
| distill: False | |
| distill_model: None | |
| distill_pretrained: None | |
| distributed: False | |
| epochs: 30 | |
| epochs_cooldown: None | |
| eps: 1e-08 | |
| force_custom_text: False | |
| force_image_size: None | |
| force_patch_dropout: None | |
| force_quick_gelu: False | |
| gather_with_grad: False | |
| grad_checkpointing: False | |
| grad_clip_norm: None | |
| hf_dataset: photonmz/opi_function_packed | |
| horovod: False | |
| image_interpolation: None | |
| image_mean: None | |
| image_resize_mode: None | |
| image_std: None | |
| imagenet_v2: None | |
| imagenet_val: None | |
| local_loss: False | |
| local_rank: 0 | |
| lock_image: False | |
| lock_image_freeze_bn_stats: False | |
| lock_image_unlocked_groups: 0 | |
| lock_text: False | |
| lock_text_freeze_layer_norm: False | |
| lock_text_unlocked_layers: 0 | |
| log_every_n_steps: 100 | |
| log_level: 20 | |
| log_local: False | |
| log_path: ./logs/2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16/out.log | |
| logs: ./logs/ | |
| loss_dist_impl: None | |
| lr: 0.0002 | |
| lr_cooldown_end: 0.0 | |
| lr_cooldown_power: 1.0 | |
| lr_scheduler: cosine | |
| model: crisp_1 | |
| momentum: None | |
| name: 2025_03_18-18_35_55-model_crisp_1-lr_0.0002-b_32-j_1-p_amp_bfloat16 | |
| no_set_device_rank: False | |
| opt: adamw | |
| precision: amp_bfloat16 | |
| pretrained: | |
| pretrained_image: False | |
| rank: 0 | |
| remote_sync: None | |
| remote_sync_frequency: 300 | |
| remote_sync_protocol: s3 | |
| report_to: wandb | |
| resume: None | |
| save_frequency: 1 | |
| save_most_recent: True | |
| seed: 0 | |
| siglip: False | |
| skip_scheduler: False | |
| tensorboard: False | |
| tensorboard_path: | |
| torchcompile: False | |
| torchscript: False | |
| trace: False | |
| train_data: stub | |
| train_data_upsampling_factors: None | |
| train_num_samples: None | |
| use_bn_sync: False | |
| use_bnb_linear: None | |
| val_data: stub | |
| val_frequency: 1 | |
| val_num_samples: None | |
| wandb: True | |
| wandb_notes: | |
| wandb_project_name: open-clip | |
| warmup: 10000 | |
| wd: 0.1 | |
| workers: 1 | |
| world_size: 1 | |
| zeroshot_frequency: 1 | |