TensorBoard
karimknaebel commited on
Commit
f38adb4
·
verified ·
1 Parent(s): 5859ae5

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -43,3 +43,4 @@ semantic_kitti/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
43
  scannet200/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
44
  scannet200/semseg-ptv3_dinov3-L/train.log filter=lfs diff=lfs merge=lfs -text
45
  scannet200/distill-ptv3_scannet200+structured3d_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
 
 
43
  scannet200/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
44
  scannet200/semseg-ptv3_dinov3-L/train.log filter=lfs diff=lfs merge=lfs -text
45
  scannet200/distill-ptv3_scannet200+structured3d_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
46
+ scannet200/distill-ptv3_scannet200_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
scannet200/distill-ptv3_scannet200_dino-L/config.py ADDED
@@ -0,0 +1,395 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ weight = None
2
+ resume = False
3
+ evaluate = True
4
+ test_only = False
5
+ seed = 25001282
6
+ save_path = 'exp/scannet200/2025-03-01_214736'
7
+ wandb_project = 'pointcept_distill_scannet'
8
+ num_worker = 24
9
+ batch_size = 12
10
+ batch_size_val = None
11
+ batch_size_test = None
12
+ epoch = 800
13
+ eval_epoch = 100
14
+ clip_grad = None
15
+ sync_bn = False
16
+ enable_amp = True
17
+ empty_cache = False
18
+ empty_cache_per_epoch = False
19
+ find_unused_parameters = False
20
+ mix_prob = 0.8
21
+ param_dicts = [dict(keyword='img_enc|block', lr=0.0006)]
22
+ hooks = [
23
+ dict(type='CheckpointLoader'),
24
+ dict(type='IterationTimer', warmup_iter=2),
25
+ dict(type='InformationWriter'),
26
+ dict(type='LossEvaluator'),
27
+ dict(type='CheckpointSaver', save_freq=None)
28
+ ]
29
+ train = dict(type='DefaultTrainer')
30
+ test = dict()
31
+ CLASS_LABELS_200 = (
32
+ 'wall', 'chair', 'floor', 'table', 'door', 'couch', 'cabinet', 'shelf',
33
+ 'desk', 'office chair', 'bed', 'pillow', 'sink', 'picture', 'window',
34
+ 'toilet', 'bookshelf', 'monitor', 'curtain', 'book', 'armchair',
35
+ 'coffee table', 'box', 'refrigerator', 'lamp', 'kitchen cabinet', 'towel',
36
+ 'clothes', 'tv', 'nightstand', 'counter', 'dresser', 'stool', 'cushion',
37
+ 'plant', 'ceiling', 'bathtub', 'end table', 'dining table', 'keyboard',
38
+ 'bag', 'backpack', 'toilet paper', 'printer', 'tv stand', 'whiteboard',
39
+ 'blanket', 'shower curtain', 'trash can', 'closet', 'stairs', 'microwave',
40
+ 'stove', 'shoe', 'computer tower', 'bottle', 'bin', 'ottoman', 'bench',
41
+ 'board', 'washing machine', 'mirror', 'copier', 'basket', 'sofa chair',
42
+ 'file cabinet', 'fan', 'laptop', 'shower', 'paper', 'person',
43
+ 'paper towel dispenser', 'oven', 'blinds', 'rack', 'plate', 'blackboard',
44
+ 'piano', 'suitcase', 'rail', 'radiator', 'recycling bin', 'container',
45
+ 'wardrobe', 'soap dispenser', 'telephone', 'bucket', 'clock', 'stand',
46
+ 'light', 'laundry basket', 'pipe', 'clothes dryer', 'guitar',
47
+ 'toilet paper holder', 'seat', 'speaker', 'column', 'bicycle', 'ladder',
48
+ 'bathroom stall', 'shower wall', 'cup', 'jacket', 'storage bin',
49
+ 'coffee maker', 'dishwasher', 'paper towel roll', 'machine', 'mat',
50
+ 'windowsill', 'bar', 'toaster', 'bulletin board', 'ironing board',
51
+ 'fireplace', 'soap dish', 'kitchen counter', 'doorframe',
52
+ 'toilet paper dispenser', 'mini fridge', 'fire extinguisher', 'ball',
53
+ 'hat', 'shower curtain rod', 'water cooler', 'paper cutter', 'tray',
54
+ 'shower door', 'pillar', 'ledge', 'toaster oven', 'mouse',
55
+ 'toilet seat cover dispenser', 'furniture', 'cart', 'storage container',
56
+ 'scale', 'tissue box', 'light switch', 'crate', 'power outlet',
57
+ 'decoration', 'sign', 'projector', 'closet door', 'vacuum cleaner',
58
+ 'candle', 'plunger', 'stuffed animal', 'headphones', 'dish rack', 'broom',
59
+ 'guitar case', 'range hood', 'dustpan', 'hair dryer', 'water bottle',
60
+ 'handicap bar', 'purse', 'vent', 'shower floor', 'water pitcher',
61
+ 'mailbox', 'bowl', 'paper bag', 'alarm clock', 'music stand',
62
+ 'projector screen', 'divider', 'laundry detergent', 'bathroom counter',
63
+ 'object', 'bathroom vanity', 'closet wall', 'laundry hamper',
64
+ 'bathroom stall door', 'ceiling light', 'trash bin', 'dumbbell',
65
+ 'stair rail', 'tube', 'bathroom cabinet', 'cd case', 'closet rod',
66
+ 'coffee kettle', 'structure', 'shower head', 'keyboard piano',
67
+ 'case of water bottles', 'coat rack', 'storage organizer', 'folded chair',
68
+ 'fire alarm', 'power strip', 'calendar', 'poster', 'potted plant',
69
+ 'luggage', 'mattress')
70
+ model = dict(
71
+ type='DefaultDistiller',
72
+ backbone_out_channels=64,
73
+ dinov2='large',
74
+ with_cls_tokens=None,
75
+ backbone_bottleneck_channels=512,
76
+ backbone=dict(
77
+ type='PT-v3m1',
78
+ in_channels=6,
79
+ order=('z', 'z-trans', 'hilbert', 'hilbert-trans'),
80
+ stride=(2, 2, 2, 2),
81
+ enc_depths=(2, 2, 2, 6, 2),
82
+ enc_channels=(32, 64, 128, 256, 512),
83
+ enc_num_head=(2, 4, 8, 16, 32),
84
+ enc_patch_size=(1024, 1024, 1024, 1024, 1024),
85
+ dec_depths=(2, 2, 2, 2),
86
+ dec_channels=(64, 64, 128, 256),
87
+ dec_num_head=(4, 4, 8, 16),
88
+ dec_patch_size=(1024, 1024, 1024, 1024),
89
+ mlp_ratio=4,
90
+ qkv_bias=True,
91
+ qk_scale=None,
92
+ attn_drop=0.0,
93
+ proj_drop=0.0,
94
+ drop_path=0.3,
95
+ shuffle_orders=True,
96
+ pre_norm=True,
97
+ enable_rpe=False,
98
+ enable_flash=True,
99
+ upcast_attention=False,
100
+ upcast_softmax=False,
101
+ cls_mode=False,
102
+ pdnorm_bn=False,
103
+ pdnorm_ln=False,
104
+ pdnorm_decouple=True,
105
+ pdnorm_adaptive=False,
106
+ pdnorm_affine=True,
107
+ pdnorm_conditions=('ScanNet', 'S3DIS', 'Structured3D')),
108
+ criteria=[dict(type='CosineLoss', loss_weight=1.0)])
109
+ optimizer = dict(type='AdamW', lr=0.006, weight_decay=0.05)
110
+ scheduler = dict(
111
+ type='OneCycleLR',
112
+ max_lr=[0.006, 0.0006],
113
+ pct_start=0.05,
114
+ anneal_strategy='cos',
115
+ div_factor=10.0,
116
+ final_div_factor=1000.0)
117
+ dataset_type = 'ScanNet200Dataset'
118
+ data_root = 'data/scannet'
119
+ data = dict(
120
+ num_classes=200,
121
+ ignore_index=-1,
122
+ names=(
123
+ 'wall', 'chair', 'floor', 'table', 'door', 'couch', 'cabinet', 'shelf',
124
+ 'desk', 'office chair', 'bed', 'pillow', 'sink', 'picture', 'window',
125
+ 'toilet', 'bookshelf', 'monitor', 'curtain', 'book', 'armchair',
126
+ 'coffee table', 'box', 'refrigerator', 'lamp', 'kitchen cabinet',
127
+ 'towel', 'clothes', 'tv', 'nightstand', 'counter', 'dresser', 'stool',
128
+ 'cushion', 'plant', 'ceiling', 'bathtub', 'end table', 'dining table',
129
+ 'keyboard', 'bag', 'backpack', 'toilet paper', 'printer', 'tv stand',
130
+ 'whiteboard', 'blanket', 'shower curtain', 'trash can', 'closet',
131
+ 'stairs', 'microwave', 'stove', 'shoe', 'computer tower', 'bottle',
132
+ 'bin', 'ottoman', 'bench', 'board', 'washing machine', 'mirror',
133
+ 'copier', 'basket', 'sofa chair', 'file cabinet', 'fan', 'laptop',
134
+ 'shower', 'paper', 'person', 'paper towel dispenser', 'oven', 'blinds',
135
+ 'rack', 'plate', 'blackboard', 'piano', 'suitcase', 'rail', 'radiator',
136
+ 'recycling bin', 'container', 'wardrobe', 'soap dispenser',
137
+ 'telephone', 'bucket', 'clock', 'stand', 'light', 'laundry basket',
138
+ 'pipe', 'clothes dryer', 'guitar', 'toilet paper holder', 'seat',
139
+ 'speaker', 'column', 'bicycle', 'ladder', 'bathroom stall',
140
+ 'shower wall', 'cup', 'jacket', 'storage bin', 'coffee maker',
141
+ 'dishwasher', 'paper towel roll', 'machine', 'mat', 'windowsill',
142
+ 'bar', 'toaster', 'bulletin board', 'ironing board', 'fireplace',
143
+ 'soap dish', 'kitchen counter', 'doorframe', 'toilet paper dispenser',
144
+ 'mini fridge', 'fire extinguisher', 'ball', 'hat',
145
+ 'shower curtain rod', 'water cooler', 'paper cutter', 'tray',
146
+ 'shower door', 'pillar', 'ledge', 'toaster oven', 'mouse',
147
+ 'toilet seat cover dispenser', 'furniture', 'cart',
148
+ 'storage container', 'scale', 'tissue box', 'light switch', 'crate',
149
+ 'power outlet', 'decoration', 'sign', 'projector', 'closet door',
150
+ 'vacuum cleaner', 'candle', 'plunger', 'stuffed animal', 'headphones',
151
+ 'dish rack', 'broom', 'guitar case', 'range hood', 'dustpan',
152
+ 'hair dryer', 'water bottle', 'handicap bar', 'purse', 'vent',
153
+ 'shower floor', 'water pitcher', 'mailbox', 'bowl', 'paper bag',
154
+ 'alarm clock', 'music stand', 'projector screen', 'divider',
155
+ 'laundry detergent', 'bathroom counter', 'object', 'bathroom vanity',
156
+ 'closet wall', 'laundry hamper', 'bathroom stall door',
157
+ 'ceiling light', 'trash bin', 'dumbbell', 'stair rail', 'tube',
158
+ 'bathroom cabinet', 'cd case', 'closet rod', 'coffee kettle',
159
+ 'structure', 'shower head', 'keyboard piano', 'case of water bottles',
160
+ 'coat rack', 'storage organizer', 'folded chair', 'fire alarm',
161
+ 'power strip', 'calendar', 'poster', 'potted plant', 'luggage',
162
+ 'mattress'),
163
+ train=dict(
164
+ type='ScanNet200Dataset',
165
+ split='train',
166
+ data_root='data/scannet',
167
+ with_images=10,
168
+ transform=[
169
+ dict(type='ImageResize', size=[420, 560]),
170
+ dict(
171
+ type='ImageColorJitter',
172
+ brightness=0.4,
173
+ contrast=0.4,
174
+ saturation=0.2,
175
+ hue=0.1),
176
+ dict(type='ImageRandomHorizontalFlip'),
177
+ dict(type='ImageNormalize'),
178
+ dict(type='CenterShift', apply_z=True),
179
+ dict(
180
+ type='RandomDropout',
181
+ dropout_ratio=0.2,
182
+ dropout_application_ratio=0.2),
183
+ dict(
184
+ type='RandomRotate',
185
+ angle=[-1, 1],
186
+ axis='z',
187
+ center=[0, 0, 0],
188
+ p=0.5),
189
+ dict(
190
+ type='RandomRotate',
191
+ angle=[-0.015625, 0.015625],
192
+ axis='x',
193
+ p=0.5),
194
+ dict(
195
+ type='RandomRotate',
196
+ angle=[-0.015625, 0.015625],
197
+ axis='y',
198
+ p=0.5),
199
+ dict(type='RandomScale', scale=[0.9, 1.1]),
200
+ dict(type='RandomFlip', p=0.5),
201
+ dict(type='RandomJitter', sigma=0.005, clip=0.02),
202
+ dict(
203
+ type='ElasticDistortion',
204
+ distortion_params=[[0.2, 0.4], [0.8, 1.6]]),
205
+ dict(type='ChromaticAutoContrast', p=0.2, blend_factor=None),
206
+ dict(type='ChromaticTranslation', p=0.95, ratio=0.05),
207
+ dict(type='ChromaticJitter', p=0.95, std=0.05),
208
+ dict(
209
+ type='GridSample',
210
+ grid_size=0.02,
211
+ hash_type='fnv',
212
+ mode='train',
213
+ keys=('coord', 'color', 'normal', 'segment', 'image_coord',
214
+ 'image_mask'),
215
+ return_grid_coord=True),
216
+ dict(type='SphereCrop', point_max=102400, mode='random'),
217
+ dict(type='CenterShift', apply_z=False),
218
+ dict(type='NormalizeColor'),
219
+ dict(type='ToTensor'),
220
+ dict(
221
+ type='Collect',
222
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
223
+ 'image_mask'),
224
+ feat_keys=('color', 'normal'))
225
+ ],
226
+ test_mode=False,
227
+ loop=8),
228
+ val=dict(
229
+ type='ScanNet200Dataset',
230
+ split='val',
231
+ data_root='data/scannet',
232
+ with_images=10,
233
+ transform=[
234
+ dict(type='ImageResize', size=[420, 560]),
235
+ dict(type='ImageNormalize'),
236
+ dict(type='CenterShift', apply_z=True),
237
+ dict(
238
+ type='GridSample',
239
+ grid_size=0.02,
240
+ hash_type='fnv',
241
+ mode='train',
242
+ keys=('coord', 'color', 'normal', 'segment', 'image_coord',
243
+ 'image_mask'),
244
+ return_grid_coord=True),
245
+ dict(type='CenterShift', apply_z=False),
246
+ dict(type='NormalizeColor'),
247
+ dict(type='ToTensor'),
248
+ dict(
249
+ type='Collect',
250
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
251
+ 'image_mask'),
252
+ feat_keys=('color', 'normal'))
253
+ ],
254
+ test_mode=False),
255
+ test=dict(
256
+ type='ScanNet200Dataset',
257
+ split='val',
258
+ data_root='data/scannet',
259
+ with_images=10,
260
+ transform=[
261
+ dict(type='CenterShift', apply_z=True),
262
+ dict(type='NormalizeColor')
263
+ ],
264
+ test_mode=True,
265
+ test_cfg=dict(
266
+ voxelize=dict(
267
+ type='GridSample',
268
+ grid_size=0.02,
269
+ hash_type='fnv',
270
+ mode='test',
271
+ keys=('coord', 'color', 'normal', 'image_coord', 'image_mask'),
272
+ return_grid_coord=True),
273
+ crop=None,
274
+ post_transform=[
275
+ dict(type='ImageResize', size=[420, 560]),
276
+ dict(type='ImageNormalize'),
277
+ dict(type='CenterShift', apply_z=False),
278
+ dict(type='ToTensor'),
279
+ dict(
280
+ type='Collect',
281
+ keys=('coord', 'grid_coord', 'index', 'image',
282
+ 'image_coord', 'image_mask'),
283
+ feat_keys=('color', 'normal'))
284
+ ],
285
+ aug_transform=[[{
286
+ 'type': 'RandomRotateTargetAngle',
287
+ 'angle': [0],
288
+ 'axis': 'z',
289
+ 'center': [0, 0, 0],
290
+ 'p': 1
291
+ }],
292
+ [{
293
+ 'type': 'RandomRotateTargetAngle',
294
+ 'angle': [0.5],
295
+ 'axis': 'z',
296
+ 'center': [0, 0, 0],
297
+ 'p': 1
298
+ }],
299
+ [{
300
+ 'type': 'RandomRotateTargetAngle',
301
+ 'angle': [1],
302
+ 'axis': 'z',
303
+ 'center': [0, 0, 0],
304
+ 'p': 1
305
+ }],
306
+ [{
307
+ 'type': 'RandomRotateTargetAngle',
308
+ 'angle': [1.5],
309
+ 'axis': 'z',
310
+ 'center': [0, 0, 0],
311
+ 'p': 1
312
+ }],
313
+ [{
314
+ 'type': 'RandomRotateTargetAngle',
315
+ 'angle': [0],
316
+ 'axis': 'z',
317
+ 'center': [0, 0, 0],
318
+ 'p': 1
319
+ }, {
320
+ 'type': 'RandomScale',
321
+ 'scale': [0.95, 0.95]
322
+ }],
323
+ [{
324
+ 'type': 'RandomRotateTargetAngle',
325
+ 'angle': [0.5],
326
+ 'axis': 'z',
327
+ 'center': [0, 0, 0],
328
+ 'p': 1
329
+ }, {
330
+ 'type': 'RandomScale',
331
+ 'scale': [0.95, 0.95]
332
+ }],
333
+ [{
334
+ 'type': 'RandomRotateTargetAngle',
335
+ 'angle': [1],
336
+ 'axis': 'z',
337
+ 'center': [0, 0, 0],
338
+ 'p': 1
339
+ }, {
340
+ 'type': 'RandomScale',
341
+ 'scale': [0.95, 0.95]
342
+ }],
343
+ [{
344
+ 'type': 'RandomRotateTargetAngle',
345
+ 'angle': [1.5],
346
+ 'axis': 'z',
347
+ 'center': [0, 0, 0],
348
+ 'p': 1
349
+ }, {
350
+ 'type': 'RandomScale',
351
+ 'scale': [0.95, 0.95]
352
+ }],
353
+ [{
354
+ 'type': 'RandomRotateTargetAngle',
355
+ 'angle': [0],
356
+ 'axis': 'z',
357
+ 'center': [0, 0, 0],
358
+ 'p': 1
359
+ }, {
360
+ 'type': 'RandomScale',
361
+ 'scale': [1.05, 1.05]
362
+ }],
363
+ [{
364
+ 'type': 'RandomRotateTargetAngle',
365
+ 'angle': [0.5],
366
+ 'axis': 'z',
367
+ 'center': [0, 0, 0],
368
+ 'p': 1
369
+ }, {
370
+ 'type': 'RandomScale',
371
+ 'scale': [1.05, 1.05]
372
+ }],
373
+ [{
374
+ 'type': 'RandomRotateTargetAngle',
375
+ 'angle': [1],
376
+ 'axis': 'z',
377
+ 'center': [0, 0, 0],
378
+ 'p': 1
379
+ }, {
380
+ 'type': 'RandomScale',
381
+ 'scale': [1.05, 1.05]
382
+ }],
383
+ [{
384
+ 'type': 'RandomRotateTargetAngle',
385
+ 'angle': [1.5],
386
+ 'axis': 'z',
387
+ 'center': [0, 0, 0],
388
+ 'p': 1
389
+ }, {
390
+ 'type': 'RandomScale',
391
+ 'scale': [1.05, 1.05]
392
+ }], [{
393
+ 'type': 'RandomFlip',
394
+ 'p': 1
395
+ }]])))
scannet200/distill-ptv3_scannet200_dino-L/events.out.tfevents.1740862155.n23g0009.hpc.itc.rwth-aachen.de ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:432e0e29cdae50129131f1864c6f7aa34dc62abe303674453f204d35fe83c279
3
+ size 12765310
scannet200/distill-ptv3_scannet200_dino-L/model/model_best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf42deadbbe513457be851b3e641e167793e9d8369e3870fd9d8d0ed687a46a0
3
+ size 555366056
scannet200/distill-ptv3_scannet200_dino-L/model/model_last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e2f32723283fb1f8ab5c85127d09f5e1109ca9b11b18f69c63a655ec33a452d
3
+ size 555366056
scannet200/distill-ptv3_scannet200_dino-L/train.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:989821007580b0ac14ddb95b3557b0012011de0a477a98eb58ecd0f572c73201
3
+ size 15758304