Philipp Allgeuer committed on
Commit
8bffec3
·
1 Parent(s): e9f95b5

Add novic checkpoint

Browse files
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  sample_images/*.jpg filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  sample_images/*.jpg filter=lfs diff=lfs merge=lfs -text
37
+ *.train filter=lfs diff=lfs merge=lfs -text
checkpoints/ovod_20240628_142131/hydra/config.yaml ADDED
@@ -0,0 +1,209 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ action: train
2
+ device: cuda
3
+ allow_tf32: true
4
+ cudnn_bench: true
5
+ determ: false
6
+ determ_seed: 1
7
+ dry_run: false
8
+ wandb: true
9
+ wandb_project: ovod
10
+ wandb_entity: null
11
+ wandb_group: null
12
+ wandb_job_type: null
13
+ wandb_name: null
14
+ wandb_tags: null
15
+ embedder_spec: openclip:apple/DFN5B-CLIP-ViT-H-14-378
16
+ embedder_amp: true
17
+ embedder_amp_bf16: false
18
+ embedder_compile: false
19
+ embedder_optimum: false
20
+ batch_size_token: 2048
21
+ batch_size_embed: 512
22
+ batch_size_image: 256
23
+ embedding_dataset: dfn5bl_multiset3c2_cache_vt0.bin
24
+ embedding_datasets: []
25
+ batch_size: 512
26
+ dataset_workers: 8
27
+ vocab_path: $SOURCE/data/object_nouns.json
28
+ vocab_thres: 0
29
+ prompt_path: $SOURCE/data/prompts.json
30
+ prompt_collection: ImageNet1K | CIFAR
31
+ hypernym_collection: None
32
+ noun_cache: true
33
+ noun_recache: false
34
+ noun_cache_dir: $SOURCE/cache/noun_dataset
35
+ embedding_cache_dir: $SOURCE/cache/embedding_cache
36
+ strict_embedder: true
37
+ save_embedding_cache: ''
38
+ cls_dataset: ImageNet1K
39
+ cls_datasets: []
40
+ cls_dataset_root: ~/Datasets
41
+ cls_split: valid
42
+ load_model: ''
43
+ load_models: []
44
+ load_models_dirnum: 1
45
+ model: PrefixedIterDecoder
46
+ with_start_token: false
47
+ with_end_token: true
48
+ compact_ids: true
49
+ fixed_token_length: false
50
+ auto_fixed_token_length: true
51
+ use_masks: true
52
+ use_weights: true
53
+ multi_target: true
54
+ multi_first: false
55
+ fixed_multi_length: false
56
+ amp: false
57
+ amp_bf16: true
58
+ vocab_quant: false
59
+ num_end_loss: 1
60
+ label_smoothing: 0.0
61
+ hidden_dim: 512
62
+ feedfwd_scale: 1/4
63
+ mlp_hidden_layer: none
64
+ mlp_hidden_bias: false
65
+ mlp_hidden_norm: false
66
+ mlp_hidden_activation: gelu
67
+ input_dropout: 0.1
68
+ num_layers: 6
69
+ num_heads: 8
70
+ layer_dropout: 0.1
71
+ layer_activation: gelu
72
+ layer_norm_first: true
73
+ layer_bias: false
74
+ logits_bias: false
75
+ init_bias_zero: true
76
+ init_mlp_mode: balanced
77
+ init_mlp_unit_norm: false
78
+ init_tfrm_mode: balanced
79
+ init_tfrm_unit_norm: false
80
+ init_tfrm_unit_postnorm: true
81
+ init_tfrm_proj_layers: true
82
+ init_zero_norm: false
83
+ init_rezero_mode: none
84
+ mlp_seq_len: 4
85
+ weight_tying: true
86
+ strictly_causal: false
87
+ enable_nested: false
88
+ cross_encoder: true
89
+ num_encoder_layers: 6
90
+ gencfg: ''
91
+ gencfgs: []
92
+ gencfgs_grid: false
93
+ gencfg_method:
94
+ - greedy
95
+ - beam
96
+ gencfg_topk:
97
+ - 3
98
+ - 5
99
+ - 10
100
+ gencfg_prior:
101
+ - none
102
+ - tgt0.25
103
+ - tgt0.5
104
+ - tok0.25
105
+ - tok0.5
106
+ gencfg_guide:
107
+ - plain
108
+ gencfg_tau:
109
+ - 0.5
110
+ - 1
111
+ - 2
112
+ gencfg_alpha:
113
+ - -0.2
114
+ - 0
115
+ - 0.2
116
+ - 0.5
117
+ test_training: true
118
+ test_device: true
119
+ test_patch: true
120
+ test_consistent: false
121
+ test_print: 0
122
+ clip_prompts: true
123
+ measure_gap: false
124
+ multi_target_freq:
125
+ - 1
126
+ - 1
127
+ captions_path: ''
128
+ template_multiplier: 10
129
+ sample_multiplier: 20
130
+ captions_print: 0
131
+ class_names_variant: clip
132
+ images: []
133
+ save_targets: null
134
+ multi_mode: max
135
+ load_train_state: true
136
+ load_lr_state: true
137
+ chunk_scale: 50
138
+ save_every_min: 12
139
+ save_every_max: 48
140
+ save_top1_min: 95.0
141
+ save_top1_delta: 0.5
142
+ max_epochs: 18
143
+ max_chunks: 0
144
+ accum_factor: 16
145
+ optimizer: AdamW
146
+ init_lr: 0.0015
147
+ final_lr: 0.0
148
+ lr_scheduler: cosine
149
+ lr_warmup: 0
150
+ beta1: 0.9
151
+ beta2: 0.95
152
+ weight_decay: 0.1
153
+ weight_decay_1d: false
154
+ nesterov: true
155
+ compile: false
156
+ gradient_clip: 1.0
157
+ loss_ewa_halflife: 4
158
+ last_dropout_chunks: 0
159
+ last_dropout_factor: 0.0
160
+ mean_shift: false
161
+ mean_shift_path: $SOURCE/data/modality_gap_$EMBEDDER.json
162
+ noise_scheme: GaussElemUniformAngle
163
+ noise_vec_norm: 3.25
164
+ noise_angle_min: 45
165
+ noise_angle_max: 75
166
+ noise_angle_std: 0.0
167
+ noise_mix_ratio: 0.15
168
+ fix_force_vtx: false
169
+ eval_train: false
170
+ eval_guided: false
171
+ eval_debug: false
172
+ eval_samples_max: 0
173
+ eval_images: ''
174
+ eval_images_dir: $SOURCE/extras/eval_images
175
+ infer_log: true
176
+ infer_texts: []
177
+ infer_images: []
178
+ infer_image_dir: $SOURCE/extras/infer_images
179
+ infer_all_images_dir: ''
180
+ infer_ann_json: $IMAGEDIR/_class_annotations.json
181
+ infer_ann_json_update: false
182
+ infer_guided: false
183
+ infer_guide_dataset: ''
184
+ infer_guide_targets: []
185
+ infer_debug: false
186
+ infer_pred_json: false
187
+ load_pred_jsons: []
188
+ pred_image_dir: $SOURCE/extras/infer_images
189
+ pred_ann_json: $IMAGEDIR/_class_annotations.json
190
+ pfmt_type: model_topk_v1
191
+ pfmt_topk: 3
192
+ pfmt_model_spec: true
193
+ pfmt_sort: ''
194
+ fmt_type: all_v2
195
+ fmt_models: ''
196
+ fmt_model_hosts: ''
197
+ fmt_hosts: ''
198
+ fmt_min_ago: ''
199
+ fmt_max_ago: ''
200
+ fmt_min_stamp: ''
201
+ fmt_max_stamp: ''
202
+ fmt_sort: ''
203
+ wiki_collect_dir: $SOURCE/extras/wiki_images
204
+ sample_input_dir: ''
205
+ sample_output_dir: $SOURCE/extras/sampled_images
206
+ sample_count: 100
207
+ sample_special: []
208
+ sample_special_mean: 0.05
209
+ sample_special_factor: []
checkpoints/ovod_20240628_142131/hydra/hydra.yaml ADDED
@@ -0,0 +1,135 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ hydra:
2
+ run:
3
+ dir: outputs/ovod_${now:%Y%m%d_%H%M%S}
4
+ sweep:
5
+ dir: outputs/ovod_${now:%Y%m%d_%H%M%S}
6
+ subdir: ${hydra.job.num}
7
+ launcher:
8
+ _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
9
+ sweeper:
10
+ _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
11
+ max_batch_size: null
12
+ params: null
13
+ help:
14
+ app_name: ${hydra.job.name}
15
+ header: '${hydra.help.app_name} is powered by Hydra.
16
+
17
+ '
18
+ footer: 'Powered by Hydra (https://hydra.cc)
19
+
20
+ Use --hydra-help to view Hydra specific help
21
+
22
+ '
23
+ template: '${hydra.help.header}
24
+
25
+ == Configuration groups ==
26
+
27
+ Compose your configuration from those groups (group=option)
28
+
29
+
30
+ $APP_CONFIG_GROUPS
31
+
32
+
33
+ == Config ==
34
+
35
+ Override anything in the config (foo.bar=value)
36
+
37
+
38
+ $CONFIG
39
+
40
+
41
+ ${hydra.help.footer}
42
+
43
+ '
44
+ hydra_help:
45
+ template: 'Hydra (${hydra.runtime.version})
46
+
47
+ See https://hydra.cc for more info.
48
+
49
+
50
+ == Flags ==
51
+
52
+ $FLAGS_HELP
53
+
54
+
55
+ == Configuration groups ==
56
+
57
+ Compose your configuration from those groups (For example, append hydra/job_logging=disabled
58
+ to command line)
59
+
60
+
61
+ $HYDRA_CONFIG_GROUPS
62
+
63
+
64
+ Use ''--cfg hydra'' to Show the Hydra config.
65
+
66
+ '
67
+ hydra_help: ???
68
+ hydra_logging:
69
+ version: 1
70
+ root: null
71
+ disable_existing_loggers: false
72
+ job_logging:
73
+ version: 1
74
+ root: null
75
+ disable_existing_loggers: false
76
+ env: {}
77
+ mode: RUN
78
+ searchpath: []
79
+ callbacks: {}
80
+ output_subdir: hydra
81
+ overrides:
82
+ hydra:
83
+ - hydra.mode=RUN
84
+ task:
85
+ - action=train
86
+ - embedder_spec=openclip:apple/DFN5B-CLIP-ViT-H-14-378
87
+ - embedding_dataset=dfn5bl_multiset3c2_cache_vt0.bin
88
+ - multi_target=True
89
+ - use_weights=True
90
+ - noise_scheme=GaussElemUniformAngle
91
+ - noise_vec_norm=3.25
92
+ - noise_angle_min=45
93
+ - noise_angle_max=75
94
+ - noise_mix_ratio=0.15
95
+ - accum_factor=16
96
+ job:
97
+ name: train
98
+ chdir: null
99
+ override_dirname: accum_factor=16,action=train,embedder_spec=openclip:apple/DFN5B-CLIP-ViT-H-14-378,embedding_dataset=dfn5bl_multiset3c2_cache_vt0.bin,multi_target=True,noise_angle_max=75,noise_angle_min=45,noise_mix_ratio=0.15,noise_scheme=GaussElemUniformAngle,noise_vec_norm=3.25,use_weights=True
100
+ id: ???
101
+ num: ???
102
+ config_name: train
103
+ env_set: {}
104
+ env_copy: []
105
+ config:
106
+ override_dirname:
107
+ kv_sep: '='
108
+ item_sep: ','
109
+ exclude_keys: []
110
+ runtime:
111
+ version: 1.3.2
112
+ version_base: '1.3'
113
+ cwd: /data/strahl/Code/ovod
114
+ config_sources:
115
+ - path: hydra.conf
116
+ schema: pkg
117
+ provider: hydra
118
+ - path: /data/strahl/Code/ovod/config
119
+ schema: file
120
+ provider: main
121
+ - path: ''
122
+ schema: structured
123
+ provider: schema
124
+ output_dir: /data/strahl/Code/ovod/outputs/ovod_20240628_142131
125
+ choices:
126
+ hydra/env: default
127
+ hydra/callbacks: null
128
+ hydra/job_logging: none
129
+ hydra/hydra_logging: none
130
+ hydra/hydra_help: default
131
+ hydra/help: default
132
+ hydra/sweeper: basic
133
+ hydra/launcher: basic
134
+ hydra/output: default
135
+ verbose: false
checkpoints/ovod_20240628_142131/hydra/overrides.yaml ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - action=train
2
+ - embedder_spec=openclip:apple/DFN5B-CLIP-ViT-H-14-378
3
+ - embedding_dataset=dfn5bl_multiset3c2_cache_vt0.bin
4
+ - multi_target=True
5
+ - use_weights=True
6
+ - noise_scheme=GaussElemUniformAngle
7
+ - noise_vec_norm=3.25
8
+ - noise_angle_min=45
9
+ - noise_angle_max=75
10
+ - noise_mix_ratio=0.15
11
+ - accum_factor=16
checkpoints/ovod_20240628_142131/ovod_chunk0433_20240630_235415.train ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01ade7136b777e111a0cc3e08e0800143332beb81bf412ffac6fd1cd066612e8
3
+ size 188603970
checkpoints/ovod_20240628_142131/train.log ADDED
The diff for this file is too large to render. See raw diff