File size: 2,990 Bytes
78276df
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
accum_freq: 1
audio_ext: flac
audio_fill: repeatpad
audio_fusion: False
audio_int16_normalize: False
audio_trunc: rand_trunc
audio_zeroshot_audio_key: audio
audio_zeroshot_class_key: category
audio_zeroshot_dataset: None
audio_zeroshot_multiprocessing_context: forkserver
audio_zeroshot_split: train
audio_zeroshot_target_key: target
audio_zeroshot_templates: None
audio_zeroshot_workers: 0
aug_cfg: {}
batch_size: 4096
beta1: 0.9
beta2: 0.98
cache_dir: None
checkpoint_path: ./logs/ViT-B-32-Vanilla-resume/checkpoints
coca_caption_loss_weight: 2.0
coca_contrastive_loss_weight: 1.0
copy_codebase: False
csv_caption_key: title
csv_img_key: filepath
csv_separator: 	
dataset_resampled: False
dataset_type: webdataset
ddp_static_graph: False
debug: False
delete_previous_checkpoint: False
device: cuda:0
dist_backend: None
dist_url: None
distill: False
distill_model: None
distill_pretrained: None
distributed: True
epochs: 32
epochs_cooldown: None
eps: 1e-06
force_context_length: None
force_custom_text: False
force_image_size: None
force_naflex_vision: False
force_patch_dropout: None
force_quick_gelu: False
fsdp: False
fsdp_checkpoint: full
fsdp_no_reshard_after_forward: False
fsdp_offload_cpu: False
gather_with_grad: True
grad_checkpointing: False
grad_clip_norm: None
image_interpolation: None
image_mean: None
image_resize_mode: None
image_std: None
imagenet_v2: None
imagenet_val: None
local_loss: True
local_rank: 0
lock_image: False
lock_image_freeze_bn_stats: False
lock_image_unlocked_groups: 0
lock_text: False
lock_text_freeze_layer_norm: False
lock_text_unlocked_layers: 0
log_every_n_steps: 100
log_level: 20
log_local: False
log_path: ./logs/ViT-B-32-Vanilla-resume/out.log
logs: ./logs/
loss_dist_impl: None
lr: 0.0005
lr_cooldown_end: 0.0
lr_cooldown_power: 1.0
lr_scheduler: cosine
model: ViT-B-32
momentum: None
naflex_batch_divisor: 8
naflex_loss_scale: none
naflex_max_image_tokens_per_batch: 16384
naflex_num_train_image_tokens: None
naflex_patch_size_probs: None
naflex_patch_sizes: None
naflex_seq_lens: None
name: ViT-B-32-Vanilla-resume
no_set_device_rank: False
opt: adamw
precision: amp_bfloat16
pretrained: 
pretrained_audio: None
pretrained_image: False
rank: 0
remote_sync: None
remote_sync_frequency: 300
remote_sync_protocol: s3
report_to: wandb
resume: /scratch/work/zhul2/code/open_clip/logs/ViT-B-32-Vanilla/checkpoints/epoch_24.pt
save_frequency: 1
save_most_recent: False
seed: 0
siglip: False
skip_scheduler: False
tensorboard: False
tensorboard_path: 
torchcompile: True
torchcompile_backend: None
torchcompile_mode: None
torchcompile_strategy: task
train_data: /scratch/shareddata/dldata/laion400M/img2dataset/laion400m-data/{00000..41407}.tar
train_data_upsampling_factors: None
train_num_samples: 268836185
use_bn_sync: False
use_bnb_linear: None
use_naflex: False
val_data: None
val_frequency: 1
val_num_samples: None
wandb: True
wandb_notes: 
wandb_project_name: open-clip
warmup: 2000
wd: 0.2
workers: 12
world_size: 8
zeroshot_frequency: 2