ramdrop committed on
Commit
32c539a
·
1 Parent(s): 06322d3

first commit

Browse files
datt_scannet/wandb/latest-run/files/config.yaml ADDED
@@ -0,0 +1,262 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ CONFIG:
4
+ desc: null
5
+ value: datt_mix_ctrs.yaml
6
+ MODEL:
7
+ desc: null
8
+ value:
9
+ TYPE: dat
10
+ NAME: dat_plus_plus
11
+ PRETRAINED: pretrained_weights/dat_pp_tiny_in1k_224.pth
12
+ DAT:
13
+ img_size: 224
14
+ patch_size: 4
15
+ num_classes: 1000
16
+ expansion: 4
17
+ dim_stem: 64
18
+ dims:
19
+ - 64
20
+ - 128
21
+ - 256
22
+ - 512
23
+ depths:
24
+ - 2
25
+ - 4
26
+ - 18
27
+ - 2
28
+ stage_spec:
29
+ - - N
30
+ - D
31
+ - - N
32
+ - D
33
+ - N
34
+ - D
35
+ - - N
36
+ - D
37
+ - N
38
+ - D
39
+ - N
40
+ - D
41
+ - N
42
+ - D
43
+ - N
44
+ - D
45
+ - N
46
+ - D
47
+ - N
48
+ - D
49
+ - N
50
+ - D
51
+ - N
52
+ - D
53
+ - - D
54
+ - D
55
+ heads:
56
+ - 2
57
+ - 4
58
+ - 8
59
+ - 16
60
+ window_sizes:
61
+ - 7
62
+ - 7
63
+ - 7
64
+ - 7
65
+ groups:
66
+ - 1
67
+ - 2
68
+ - 4
69
+ - 8
70
+ use_pes:
71
+ - true
72
+ - true
73
+ - true
74
+ - true
75
+ dwc_pes:
76
+ - false
77
+ - false
78
+ - false
79
+ - false
80
+ strides:
81
+ - 8
82
+ - 4
83
+ - 2
84
+ - 1
85
+ offset_range_factor:
86
+ - -1
87
+ - -1
88
+ - -1
89
+ - -1
90
+ no_offs:
91
+ - false
92
+ - false
93
+ - false
94
+ - false
95
+ fixed_pes:
96
+ - false
97
+ - false
98
+ - false
99
+ - false
100
+ use_dwc_mlps:
101
+ - true
102
+ - true
103
+ - true
104
+ - true
105
+ use_lpus:
106
+ - true
107
+ - true
108
+ - true
109
+ - true
110
+ use_conv_patches: true
111
+ ksizes:
112
+ - 9
113
+ - 7
114
+ - 5
115
+ - 3
116
+ nat_ksizes:
117
+ - 7
118
+ - 7
119
+ - 7
120
+ - 7
121
+ drop_rate: 0.0
122
+ attn_drop_rate: 0.0
123
+ drop_path_rate: 0.2
124
+ clip_dim: 1024
125
+ quantization:
126
+ method: jacob
127
+ weight:
128
+ num_bits: 8
129
+ axis: per_channel
130
+ calib_method: max
131
+ activation:
132
+ num_bits: 8
133
+ axis: per_tensor
134
+ calib_method: max
135
+ calibration:
136
+ num_batch: 2
137
+ modal: rgbd
138
+ TRAIN:
139
+ desc: null
140
+ value:
141
+ EPOCHS: 120
142
+ WARMUP_EPOCHS: 0
143
+ BASE_LR: 1.0e-06
144
+ WEIGHT_DECAY: 0.05
145
+ WARMUP_LR: 5.0e-07
146
+ MIN_LR: 5.0e-07
147
+ CLIP_GRAD: 5.0
148
+ LR_SCHEDULER:
149
+ NAME: cosine
150
+ DECAY_EPOCHS: 30
151
+ DECAY_RATE: 0.1
152
+ OPTIMIZER:
153
+ NAME: adamw
154
+ EPS: 1.0e-08
155
+ BETAS:
156
+ - 0.9
157
+ - 0.999
158
+ MOMENTUM: 0.9
159
+ CRETERION:
160
+ NAME: TripletMarginLoss
161
+ TRIPLET_MARGIN: 0.3
162
+ MINING_METHOD:
163
+ POSITIVE: easy
164
+ NEGATIVE: random
165
+ TOTAL: semihard
166
+ NEG_NUM: 3
167
+ KD:
168
+ ENABLE: false
169
+ WEIGHT: 10
170
+ WEIGHT: 0.05
171
+ DATA:
172
+ desc: null
173
+ value:
174
+ DATASET: scannet
175
+ ROOT: dbs
176
+ BATCH_SIZE: 4
177
+ VAL_BATCH_SIZE: 32
178
+ EMBEDDING_BATCH_SIZE: 32
179
+ DEPTH_TRANSFORM: rgb
180
+ IS_SUBSET: true
181
+ LABEL_TYPE: pseudo_labels
182
+ DATASET_THRESHOLD: 0.25
183
+ GPU:
184
+ desc: null
185
+ value: 0
186
+ SEED:
187
+ desc: null
188
+ value: 1
189
+ CLIP_MODEL:
190
+ desc: null
191
+ value:
192
+ NAME: ViT-g-14
193
+ PRETRAINED: laion2b_s34b_b88k
194
+ MODAL:
195
+ desc: null
196
+ value: depth
197
+ PHASE:
198
+ desc: null
199
+ value: train_ctrs
200
+ CKPT:
201
+ desc: null
202
+ value: logs/datt_0215_215348/wandb/latest-run/files/src/best_model.pth
203
+ MIX_INPUT:
204
+ desc: null
205
+ value:
206
+ ENABLE: true
207
+ NUM_MIX: 2
208
+ WEIGHTED: false
209
+ ATTENTION:
210
+ desc: null
211
+ value:
212
+ ENABLE: false
213
+ WEIGHTED_SAMPLE:
214
+ desc: null
215
+ value:
216
+ ENABLE: false
217
+ cmd:
218
+ desc: null
219
+ value: run.py --phase=train_ctrs --config=configs/scannet/datt_mix_ctrs.yaml --quant_config=quantization_configs/d2_jacob.yaml
220
+ _wandb:
221
+ desc: null
222
+ value:
223
+ code_path: code/run.py
224
+ python_version: 3.10.13
225
+ cli_version: 0.16.3
226
+ framework: huggingface
227
+ huggingface_version: 4.37.2
228
+ is_jupyter_run: false
229
+ is_kaggle_kernel: false
230
+ start_time: 1708266273.066213
231
+ t:
232
+ 1:
233
+ - 1
234
+ - 5
235
+ - 11
236
+ - 41
237
+ - 49
238
+ - 53
239
+ - 55
240
+ - 63
241
+ - 80
242
+ 2:
243
+ - 1
244
+ - 5
245
+ - 11
246
+ - 41
247
+ - 49
248
+ - 53
249
+ - 55
250
+ - 63
251
+ - 80
252
+ 3:
253
+ - 3
254
+ - 13
255
+ - 16
256
+ - 23
257
+ 4: 3.10.13
258
+ 5: 0.16.3
259
+ 6: 4.37.2
260
+ 8:
261
+ - 5
262
+ 13: linux-x86_64
datt_scannet/wandb/latest-run/files/src/best_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dc2a4016a949a2a9cad3ffd68eccbb99b3d5e389d67896ee40e4671a7a4a837
3
+ size 98227739
datt_scannet/wandb/latest-run/files/src/datt_mix_ctrs.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CONFIG: datt_mix_ctrs.yaml
2
+ MODEL:
3
+ TYPE: dat
4
+ NAME: dat_plus_plus
5
+ PRETRAINED: "pretrained_weights/dat_pp_tiny_in1k_224.pth"
6
+ DAT:
7
+ img_size: 224
8
+ patch_size: 4
9
+ num_classes: 1000
10
+ expansion: 4
11
+ dim_stem: 64
12
+ dims: [64, 128, 256, 512]
13
+ depths: [2, 4, 18, 2]
14
+ stage_spec: [[N, D], [N, D, N, D], [N, D, N, D, N, D, N, D, N, D, N, D, N, D, N, D, N, D], [D, D]]
15
+ heads: [2, 4, 8, 16]
16
+ window_sizes: [7, 7, 7, 7]
17
+ groups: [1, 2, 4, 8]
18
+ use_pes: [True, True, True, True]
19
+ dwc_pes: [False, False, False, False]
20
+ strides: [8, 4, 2, 1]
21
+ offset_range_factor: [-1, -1, -1, -1]
22
+ no_offs: [False, False, False, False]
23
+ fixed_pes: [False, False, False, False]
24
+ use_dwc_mlps: [True, True, True, True]
25
+ use_lpus: [True, True, True, True]
26
+ use_conv_patches: True
27
+ ksizes: [9, 7, 5, 3]
28
+ nat_ksizes: [7, 7, 7, 7]
29
+ drop_rate: 0.0
30
+ attn_drop_rate: 0.0
31
+ drop_path_rate: 0.2
32
+ # quant_bit: 8
33
+ clip_dim: 1024
34
+
35
+
36
+ TRAIN:
37
+ EPOCHS: 120
38
+ WARMUP_EPOCHS: 0
39
+ BASE_LR: 1e-6
40
+ WEIGHT_DECAY: 0.05
41
+ WARMUP_LR: 5e-7
42
+ MIN_LR: 5e-7
43
+ CLIP_GRAD: 5.0
44
+ LR_SCHEDULER:
45
+ NAME: "cosine"
46
+ DECAY_EPOCHS: 30
47
+ DECAY_RATE: 0.1
48
+ OPTIMIZER:
49
+ NAME: "adamw"
50
+ EPS: 1e-8
51
+ BETAS: [0.9, 0.999]
52
+ MOMENTUM: 0.9
53
+ CRETERION:
54
+ NAME: "TripletMarginLoss" # MSE
55
+ TRIPLET_MARGIN: 0.3
56
+ MINING_METHOD:
57
+ POSITIVE: "easy" # easy, hard, random
58
+ NEGATIVE: "random" # easy, hard, random
59
+ TOTAL: "semihard" # all, semihard, hard
60
+ NEG_NUM: 3
61
+ KD:
62
+ ENABLE: False
63
+ WEIGHT: 10
64
+ WEIGHT: 5e-2
65
+
66
+ DATA:
67
+ DATASET: "scannet"
68
+ ROOT: "dbs"
69
+ BATCH_SIZE: 4
70
+ VAL_BATCH_SIZE: 32
71
+ EMBEDDING_BATCH_SIZE: 32
72
+ DEPTH_TRANSFORM: "rgb"
73
+ IS_SUBSET: True
74
+ LABEL_TYPE: "pseudo_labels" # "gt" or "clip_vitb32"
75
+ DATASET_THRESHOLD: 0.25
76
+
77
+
78
+ GPU: 0
79
+ SEED: 1
80
+
81
+ CLIP_MODEL:
82
+ NAME: "ViT-g-14" # "ViT-B/32"
83
+ PRETRAINED: "laion2b_s34b_b88k"
84
+ MODAL: "depth" # "rgb" or "depth"
85
+ PHASE: "train_ctrs" # "train_ctrs" or "test"
86
+ CKPT: "logs/datt_0215_215348/wandb/latest-run/files/src/best_model.pth"
87
+
88
+ # [] Mix Input
89
+ MIX_INPUT:
90
+ ENABLE: True
91
+ NUM_MIX: 2
92
+ WEIGHTED: False
93
+
94
+ # [] Attention
95
+ ATTENTION:
96
+ ENABLE: False
97
+
98
+ # [] Weighted samples
99
+ WEIGHTED_SAMPLE:
100
+ ENABLE: False