TensorBoard
karimknaebel commited on
Commit
fc49bf8
·
verified ·
1 Parent(s): f38adb4

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -44,3 +44,4 @@ scannet200/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
44
  scannet200/semseg-ptv3_dinov3-L/train.log filter=lfs diff=lfs merge=lfs -text
45
  scannet200/distill-ptv3_scannet200+structured3d_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
46
  scannet200/distill-ptv3_scannet200_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
 
 
44
  scannet200/semseg-ptv3_dinov3-L/train.log filter=lfs diff=lfs merge=lfs -text
45
  scannet200/distill-ptv3_scannet200+structured3d_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
46
  scannet200/distill-ptv3_scannet200_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
47
+ scannet200/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
scannet200/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/config.py ADDED
@@ -0,0 +1,381 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ weight = 'exp/scannet200/2025-03-01_221653/model/model_last.pth'
2
+ resume = False
3
+ evaluate = True
4
+ test_only = False
5
+ seed = 40737252
6
+ save_path = 'exp/scannet200/2025-03-03_021916'
7
+ wandb_project = 'semseg_scannet200'
8
+ num_worker = 24
9
+ batch_size = 12
10
+ batch_size_val = None
11
+ batch_size_test = None
12
+ epoch = 800
13
+ eval_epoch = 100
14
+ clip_grad = None
15
+ sync_bn = False
16
+ enable_amp = True
17
+ empty_cache = False
18
+ empty_cache_per_epoch = False
19
+ find_unused_parameters = True
20
+ mix_prob = 0.8
21
+ param_dicts = [dict(keyword='block', lr=0.0006)]
22
+ hooks = [
23
+ dict(type='CheckpointLoader'),
24
+ dict(type='IterationTimer', warmup_iter=2),
25
+ dict(type='InformationWriter'),
26
+ dict(type='SemSegEvaluator'),
27
+ dict(type='CheckpointSaver', save_freq=None),
28
+ dict(type='PreciseEvaluator', test_last=False)
29
+ ]
30
+ train = dict(type='DefaultTrainer')
31
+ test = dict(type='SemSegTester', verbose=True)
32
+ CLASS_LABELS_200 = (
33
+ 'wall', 'chair', 'floor', 'table', 'door', 'couch', 'cabinet', 'shelf',
34
+ 'desk', 'office chair', 'bed', 'pillow', 'sink', 'picture', 'window',
35
+ 'toilet', 'bookshelf', 'monitor', 'curtain', 'book', 'armchair',
36
+ 'coffee table', 'box', 'refrigerator', 'lamp', 'kitchen cabinet', 'towel',
37
+ 'clothes', 'tv', 'nightstand', 'counter', 'dresser', 'stool', 'cushion',
38
+ 'plant', 'ceiling', 'bathtub', 'end table', 'dining table', 'keyboard',
39
+ 'bag', 'backpack', 'toilet paper', 'printer', 'tv stand', 'whiteboard',
40
+ 'blanket', 'shower curtain', 'trash can', 'closet', 'stairs', 'microwave',
41
+ 'stove', 'shoe', 'computer tower', 'bottle', 'bin', 'ottoman', 'bench',
42
+ 'board', 'washing machine', 'mirror', 'copier', 'basket', 'sofa chair',
43
+ 'file cabinet', 'fan', 'laptop', 'shower', 'paper', 'person',
44
+ 'paper towel dispenser', 'oven', 'blinds', 'rack', 'plate', 'blackboard',
45
+ 'piano', 'suitcase', 'rail', 'radiator', 'recycling bin', 'container',
46
+ 'wardrobe', 'soap dispenser', 'telephone', 'bucket', 'clock', 'stand',
47
+ 'light', 'laundry basket', 'pipe', 'clothes dryer', 'guitar',
48
+ 'toilet paper holder', 'seat', 'speaker', 'column', 'bicycle', 'ladder',
49
+ 'bathroom stall', 'shower wall', 'cup', 'jacket', 'storage bin',
50
+ 'coffee maker', 'dishwasher', 'paper towel roll', 'machine', 'mat',
51
+ 'windowsill', 'bar', 'toaster', 'bulletin board', 'ironing board',
52
+ 'fireplace', 'soap dish', 'kitchen counter', 'doorframe',
53
+ 'toilet paper dispenser', 'mini fridge', 'fire extinguisher', 'ball',
54
+ 'hat', 'shower curtain rod', 'water cooler', 'paper cutter', 'tray',
55
+ 'shower door', 'pillar', 'ledge', 'toaster oven', 'mouse',
56
+ 'toilet seat cover dispenser', 'furniture', 'cart', 'storage container',
57
+ 'scale', 'tissue box', 'light switch', 'crate', 'power outlet',
58
+ 'decoration', 'sign', 'projector', 'closet door', 'vacuum cleaner',
59
+ 'candle', 'plunger', 'stuffed animal', 'headphones', 'dish rack', 'broom',
60
+ 'guitar case', 'range hood', 'dustpan', 'hair dryer', 'water bottle',
61
+ 'handicap bar', 'purse', 'vent', 'shower floor', 'water pitcher',
62
+ 'mailbox', 'bowl', 'paper bag', 'alarm clock', 'music stand',
63
+ 'projector screen', 'divider', 'laundry detergent', 'bathroom counter',
64
+ 'object', 'bathroom vanity', 'closet wall', 'laundry hamper',
65
+ 'bathroom stall door', 'ceiling light', 'trash bin', 'dumbbell',
66
+ 'stair rail', 'tube', 'bathroom cabinet', 'cd case', 'closet rod',
67
+ 'coffee kettle', 'structure', 'shower head', 'keyboard piano',
68
+ 'case of water bottles', 'coat rack', 'storage organizer', 'folded chair',
69
+ 'fire alarm', 'power strip', 'calendar', 'poster', 'potted plant',
70
+ 'luggage', 'mattress')
71
+ model = dict(
72
+ type='DefaultSegmentorV2',
73
+ num_classes=200,
74
+ backbone_out_channels=64,
75
+ backbone=dict(
76
+ type='PT-v3m1',
77
+ in_channels=6,
78
+ order=('z', 'z-trans', 'hilbert', 'hilbert-trans'),
79
+ stride=(2, 2, 2, 2),
80
+ enc_depths=(2, 2, 2, 6, 2),
81
+ enc_channels=(32, 64, 128, 256, 512),
82
+ enc_num_head=(2, 4, 8, 16, 32),
83
+ enc_patch_size=(1024, 1024, 1024, 1024, 1024),
84
+ dec_depths=(2, 2, 2, 2),
85
+ dec_channels=(64, 64, 128, 256),
86
+ dec_num_head=(4, 4, 8, 16),
87
+ dec_patch_size=(1024, 1024, 1024, 1024),
88
+ mlp_ratio=4,
89
+ qkv_bias=True,
90
+ qk_scale=None,
91
+ attn_drop=0.0,
92
+ proj_drop=0.0,
93
+ drop_path=0.3,
94
+ shuffle_orders=True,
95
+ pre_norm=True,
96
+ enable_rpe=False,
97
+ enable_flash=True,
98
+ upcast_attention=False,
99
+ upcast_softmax=False,
100
+ cls_mode=False,
101
+ pdnorm_bn=True,
102
+ pdnorm_ln=True,
103
+ pdnorm_decouple=True,
104
+ pdnorm_adaptive=False,
105
+ pdnorm_affine=True,
106
+ pdnorm_conditions=('ScanNet', 'S3DIS', 'Structured3D')),
107
+ criteria=[
108
+ dict(type='CrossEntropyLoss', loss_weight=1.0, ignore_index=-1),
109
+ dict(
110
+ type='LovaszLoss',
111
+ mode='multiclass',
112
+ loss_weight=1.0,
113
+ ignore_index=-1)
114
+ ])
115
+ optimizer = dict(type='AdamW', lr=0.006, weight_decay=0.05)
116
+ scheduler = dict(
117
+ type='OneCycleLR',
118
+ max_lr=[0.006, 0.0006],
119
+ pct_start=0.05,
120
+ anneal_strategy='cos',
121
+ div_factor=10.0,
122
+ final_div_factor=1000.0)
123
+ dataset_type = 'ScanNet200Dataset'
124
+ data_root = 'data/scannet'
125
+ data = dict(
126
+ num_classes=200,
127
+ ignore_index=-1,
128
+ names=(
129
+ 'wall', 'chair', 'floor', 'table', 'door', 'couch', 'cabinet', 'shelf',
130
+ 'desk', 'office chair', 'bed', 'pillow', 'sink', 'picture', 'window',
131
+ 'toilet', 'bookshelf', 'monitor', 'curtain', 'book', 'armchair',
132
+ 'coffee table', 'box', 'refrigerator', 'lamp', 'kitchen cabinet',
133
+ 'towel', 'clothes', 'tv', 'nightstand', 'counter', 'dresser', 'stool',
134
+ 'cushion', 'plant', 'ceiling', 'bathtub', 'end table', 'dining table',
135
+ 'keyboard', 'bag', 'backpack', 'toilet paper', 'printer', 'tv stand',
136
+ 'whiteboard', 'blanket', 'shower curtain', 'trash can', 'closet',
137
+ 'stairs', 'microwave', 'stove', 'shoe', 'computer tower', 'bottle',
138
+ 'bin', 'ottoman', 'bench', 'board', 'washing machine', 'mirror',
139
+ 'copier', 'basket', 'sofa chair', 'file cabinet', 'fan', 'laptop',
140
+ 'shower', 'paper', 'person', 'paper towel dispenser', 'oven', 'blinds',
141
+ 'rack', 'plate', 'blackboard', 'piano', 'suitcase', 'rail', 'radiator',
142
+ 'recycling bin', 'container', 'wardrobe', 'soap dispenser',
143
+ 'telephone', 'bucket', 'clock', 'stand', 'light', 'laundry basket',
144
+ 'pipe', 'clothes dryer', 'guitar', 'toilet paper holder', 'seat',
145
+ 'speaker', 'column', 'bicycle', 'ladder', 'bathroom stall',
146
+ 'shower wall', 'cup', 'jacket', 'storage bin', 'coffee maker',
147
+ 'dishwasher', 'paper towel roll', 'machine', 'mat', 'windowsill',
148
+ 'bar', 'toaster', 'bulletin board', 'ironing board', 'fireplace',
149
+ 'soap dish', 'kitchen counter', 'doorframe', 'toilet paper dispenser',
150
+ 'mini fridge', 'fire extinguisher', 'ball', 'hat',
151
+ 'shower curtain rod', 'water cooler', 'paper cutter', 'tray',
152
+ 'shower door', 'pillar', 'ledge', 'toaster oven', 'mouse',
153
+ 'toilet seat cover dispenser', 'furniture', 'cart',
154
+ 'storage container', 'scale', 'tissue box', 'light switch', 'crate',
155
+ 'power outlet', 'decoration', 'sign', 'projector', 'closet door',
156
+ 'vacuum cleaner', 'candle', 'plunger', 'stuffed animal', 'headphones',
157
+ 'dish rack', 'broom', 'guitar case', 'range hood', 'dustpan',
158
+ 'hair dryer', 'water bottle', 'handicap bar', 'purse', 'vent',
159
+ 'shower floor', 'water pitcher', 'mailbox', 'bowl', 'paper bag',
160
+ 'alarm clock', 'music stand', 'projector screen', 'divider',
161
+ 'laundry detergent', 'bathroom counter', 'object', 'bathroom vanity',
162
+ 'closet wall', 'laundry hamper', 'bathroom stall door',
163
+ 'ceiling light', 'trash bin', 'dumbbell', 'stair rail', 'tube',
164
+ 'bathroom cabinet', 'cd case', 'closet rod', 'coffee kettle',
165
+ 'structure', 'shower head', 'keyboard piano', 'case of water bottles',
166
+ 'coat rack', 'storage organizer', 'folded chair', 'fire alarm',
167
+ 'power strip', 'calendar', 'poster', 'potted plant', 'luggage',
168
+ 'mattress'),
169
+ train=dict(
170
+ type='ScanNet200Dataset',
171
+ split='train',
172
+ data_root='data/scannet',
173
+ transform=[
174
+ dict(type='CenterShift', apply_z=True),
175
+ dict(
176
+ type='RandomDropout',
177
+ dropout_ratio=0.2,
178
+ dropout_application_ratio=0.2),
179
+ dict(
180
+ type='RandomRotate',
181
+ angle=[-1, 1],
182
+ axis='z',
183
+ center=[0, 0, 0],
184
+ p=0.5),
185
+ dict(
186
+ type='RandomRotate',
187
+ angle=[-0.015625, 0.015625],
188
+ axis='x',
189
+ p=0.5),
190
+ dict(
191
+ type='RandomRotate',
192
+ angle=[-0.015625, 0.015625],
193
+ axis='y',
194
+ p=0.5),
195
+ dict(type='RandomScale', scale=[0.9, 1.1]),
196
+ dict(type='RandomFlip', p=0.5),
197
+ dict(type='RandomJitter', sigma=0.005, clip=0.02),
198
+ dict(
199
+ type='ElasticDistortion',
200
+ distortion_params=[[0.2, 0.4], [0.8, 1.6]]),
201
+ dict(type='ChromaticAutoContrast', p=0.2, blend_factor=None),
202
+ dict(type='ChromaticTranslation', p=0.95, ratio=0.05),
203
+ dict(type='ChromaticJitter', p=0.95, std=0.05),
204
+ dict(
205
+ type='GridSample',
206
+ grid_size=0.02,
207
+ hash_type='fnv',
208
+ mode='train',
209
+ return_grid_coord=True),
210
+ dict(type='SphereCrop', point_max=102400, mode='random'),
211
+ dict(type='CenterShift', apply_z=False),
212
+ dict(type='NormalizeColor'),
213
+ dict(type='Add', keys_dict=dict(condition='ScanNet')),
214
+ dict(type='ToTensor'),
215
+ dict(
216
+ type='Collect',
217
+ keys=('coord', 'grid_coord', 'segment', 'condition'),
218
+ feat_keys=('color', 'normal'))
219
+ ],
220
+ test_mode=False,
221
+ loop=8),
222
+ val=dict(
223
+ type='ScanNet200Dataset',
224
+ split='val',
225
+ data_root='data/scannet',
226
+ transform=[
227
+ dict(type='CenterShift', apply_z=True),
228
+ dict(
229
+ type='GridSample',
230
+ grid_size=0.02,
231
+ hash_type='fnv',
232
+ mode='train',
233
+ return_grid_coord=True),
234
+ dict(type='CenterShift', apply_z=False),
235
+ dict(type='NormalizeColor'),
236
+ dict(type='Add', keys_dict=dict(condition='ScanNet')),
237
+ dict(type='ToTensor'),
238
+ dict(
239
+ type='Collect',
240
+ keys=('coord', 'grid_coord', 'segment', 'condition'),
241
+ feat_keys=('color', 'normal'))
242
+ ],
243
+ test_mode=False),
244
+ test=dict(
245
+ type='ScanNet200Dataset',
246
+ split='val',
247
+ data_root='data/scannet',
248
+ transform=[
249
+ dict(type='CenterShift', apply_z=True),
250
+ dict(type='NormalizeColor')
251
+ ],
252
+ test_mode=True,
253
+ test_cfg=dict(
254
+ voxelize=dict(
255
+ type='GridSample',
256
+ grid_size=0.02,
257
+ hash_type='fnv',
258
+ mode='test',
259
+ keys=('coord', 'color', 'normal'),
260
+ return_grid_coord=True),
261
+ crop=None,
262
+ post_transform=[
263
+ dict(type='CenterShift', apply_z=False),
264
+ dict(type='Add', keys_dict=dict(condition='ScanNet')),
265
+ dict(type='ToTensor'),
266
+ dict(
267
+ type='Collect',
268
+ keys=('coord', 'grid_coord', 'index', 'condition'),
269
+ feat_keys=('color', 'normal'))
270
+ ],
271
+ aug_transform=[[{
272
+ 'type': 'RandomRotateTargetAngle',
273
+ 'angle': [0],
274
+ 'axis': 'z',
275
+ 'center': [0, 0, 0],
276
+ 'p': 1
277
+ }],
278
+ [{
279
+ 'type': 'RandomRotateTargetAngle',
280
+ 'angle': [0.5],
281
+ 'axis': 'z',
282
+ 'center': [0, 0, 0],
283
+ 'p': 1
284
+ }],
285
+ [{
286
+ 'type': 'RandomRotateTargetAngle',
287
+ 'angle': [1],
288
+ 'axis': 'z',
289
+ 'center': [0, 0, 0],
290
+ 'p': 1
291
+ }],
292
+ [{
293
+ 'type': 'RandomRotateTargetAngle',
294
+ 'angle': [1.5],
295
+ 'axis': 'z',
296
+ 'center': [0, 0, 0],
297
+ 'p': 1
298
+ }],
299
+ [{
300
+ 'type': 'RandomRotateTargetAngle',
301
+ 'angle': [0],
302
+ 'axis': 'z',
303
+ 'center': [0, 0, 0],
304
+ 'p': 1
305
+ }, {
306
+ 'type': 'RandomScale',
307
+ 'scale': [0.95, 0.95]
308
+ }],
309
+ [{
310
+ 'type': 'RandomRotateTargetAngle',
311
+ 'angle': [0.5],
312
+ 'axis': 'z',
313
+ 'center': [0, 0, 0],
314
+ 'p': 1
315
+ }, {
316
+ 'type': 'RandomScale',
317
+ 'scale': [0.95, 0.95]
318
+ }],
319
+ [{
320
+ 'type': 'RandomRotateTargetAngle',
321
+ 'angle': [1],
322
+ 'axis': 'z',
323
+ 'center': [0, 0, 0],
324
+ 'p': 1
325
+ }, {
326
+ 'type': 'RandomScale',
327
+ 'scale': [0.95, 0.95]
328
+ }],
329
+ [{
330
+ 'type': 'RandomRotateTargetAngle',
331
+ 'angle': [1.5],
332
+ 'axis': 'z',
333
+ 'center': [0, 0, 0],
334
+ 'p': 1
335
+ }, {
336
+ 'type': 'RandomScale',
337
+ 'scale': [0.95, 0.95]
338
+ }],
339
+ [{
340
+ 'type': 'RandomRotateTargetAngle',
341
+ 'angle': [0],
342
+ 'axis': 'z',
343
+ 'center': [0, 0, 0],
344
+ 'p': 1
345
+ }, {
346
+ 'type': 'RandomScale',
347
+ 'scale': [1.05, 1.05]
348
+ }],
349
+ [{
350
+ 'type': 'RandomRotateTargetAngle',
351
+ 'angle': [0.5],
352
+ 'axis': 'z',
353
+ 'center': [0, 0, 0],
354
+ 'p': 1
355
+ }, {
356
+ 'type': 'RandomScale',
357
+ 'scale': [1.05, 1.05]
358
+ }],
359
+ [{
360
+ 'type': 'RandomRotateTargetAngle',
361
+ 'angle': [1],
362
+ 'axis': 'z',
363
+ 'center': [0, 0, 0],
364
+ 'p': 1
365
+ }, {
366
+ 'type': 'RandomScale',
367
+ 'scale': [1.05, 1.05]
368
+ }],
369
+ [{
370
+ 'type': 'RandomRotateTargetAngle',
371
+ 'angle': [1.5],
372
+ 'axis': 'z',
373
+ 'center': [0, 0, 0],
374
+ 'p': 1
375
+ }, {
376
+ 'type': 'RandomScale',
377
+ 'scale': [1.05, 1.05]
378
+ }], [{
379
+ 'type': 'RandomFlip',
380
+ 'p': 1
381
+ }]])))
scannet200/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/events.out.tfevents.1740964812.n23g0010.hpc.itc.rwth-aachen.de ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ee2708e3b54dda898bbc9e79f924a9e2904e7304c4e43a1cebc1972950dcaf9
3
+ size 7830557
scannet200/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/model/model_best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:687c113e79c3334325ded4316eedf0b24a5c34e236d51a3037517be7f0e212f6
3
+ size 555120740
scannet200/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/model/model_last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64e4e7277e258c2a832bf7e6e36756e0f6fa44956f269db31bf7a7534f28f87d
3
+ size 555120740
scannet200/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/train.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7330d6b0c5426a8d36e3a922389523fc45926dec4d55774e19dd66902b16cbfd
3
+ size 18457010