---
# Training run configuration: one hyperparameter/setting per line.
# Key names and key order are unchanged from the original dump, which had
# every pair collapsed onto a single line and therefore did not parse as a
# YAML mapping.
#
# Normalisations applied to the values:
#   * Python-style True/False/None are written as YAML true/false/null.
#   * Strings containing ':' or '{', or starting with a digit, are quoted so
#     no loader can re-type them.
#   * All other values are copied verbatim.

DTP: false
accum_freq: 1
aug_cfg: {}
batch_size: 1024
beta1: 0.9
beta2: 0.98
checkpoint_path: '/fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_15-10_59_47-model_ViT-B-16-lr_0.0001-b_1024-j_8-p_amp/checkpoints'
coca_caption_loss_weight: 2.0
coca_contrastive_loss_weight: 1.0
copy_codebase: false
csv_caption_key: title
csv_img_key: filepath
# NOTE(review): the value was blank in the original dump. Presumably it was a
# tab character lost to whitespace collapsing — TODO confirm against the
# training tool's default before relying on it.
csv_separator: "\t"
dataset_resampled: true
dataset_type: webdataset
ddp_static_graph: false
debug: false
delete_previous_checkpoint: false
device: 'cuda:0'
dist_backend: nccl
dist_url: 'env://'
distill: false
distill_model: null
distill_pretrained: null
distributed: true
epochs: 30
epochs_cooldown: null
# Written with an explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML) read
# the dot-less form "1e-06" as a string, not a float.
eps: 1.0e-06
force_custom_text: false
force_image_size: null
force_patch_dropout: null
force_quick_gelu: false
gather_with_grad: true
grad_checkpointing: true
grad_clip_norm: null
horovod: false
image_mean: [0.485, 0.456, 0.406]
image_std: [0.229, 0.224, 0.225]
imagenet_v2: null
imagenet_val: null
local_loss: true
local_rank: 0
lock_image: false
lock_image_freeze_bn_stats: false
lock_image_unlocked_groups: 0
lock_text: false
lock_text_freeze_layer_norm: false
lock_text_unlocked_layers: 0
log_every_n_steps: 1
log_level: 20
log_local: false
log_path: '/fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_15-10_59_47-model_ViT-B-16-lr_0.0001-b_1024-j_8-p_amp/out.log'
logs: '/fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP'
lr: 0.0001
lr_cooldown_end: 0.0
lr_cooldown_power: 1.0
lr_scheduler: cosine
model: ViT-B-16
name: '2025_10_15-10_59_47-model_ViT-B-16-lr_0.0001-b_1024-j_8-p_amp'
no_set_device_rank: false
precision: amp
pretrained: '/fs/scratch/PAS2836/yusenpeng_checkpoint/CLIP/ViT_B_16/checkpoints/epoch_15.pt'
pretrained_image: false
rank: 0
remote_sync: null
remote_sync_frequency: 300
remote_sync_protocol: s3
report_to: tensorboard
resume: null
save_frequency: 1
save_most_recent: false
seed: 0
skip_scheduler: false
tensorboard: true
tensorboard_path: '/fs/scratch/PAS2836/yusenpeng_checkpoint/BioCLIP/2025_10_15-10_59_47-model_ViT-B-16-lr_0.0001-b_1024-j_8-p_amp/tensorboard'
text_type: random
torchscript: false
trace: false
# The {000000..000164} part is kept literally inside the quoted string.
train_data: '/fs/scratch/PAS2836/yusenpeng_dataset/bioclip/data/TreeOfLife-10M/dataset/evobio10m-CVPR-2024/224x224/train/shard-{000000..000164}.tar'
train_data_upsampling_factors: null
train_num_samples: 10000000
use_bn_sync: false
val_data: '/fs/scratch/PAS2836/yusenpeng_dataset/bioclip/data/TreeOfLife-10M/dataset/evobio10m-CVPR-2024/224x224/val/shard-{000000..000034}.tar'
val_frequency: 1
val_num_samples: 500000
wandb: false
# NOTE(review): blank in the original dump; written as an explicit empty
# string rather than a bare (null) value — confirm that is the intent.
wandb_notes: ''
wandb_project_name: open-clip
warmup: 1000
wd: 0.2
workers: 8
world_size: 4
zeroshot_frequency: 2