TensorBoard
karimknaebel commited on
Commit
a46f8a7
·
verified ·
1 Parent(s): 0ba4b81

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -40,3 +40,4 @@ nuscenes/semseg-ptv3_dino-B/train.log filter=lfs diff=lfs merge=lfs -text
40
  nuscenes/semseg-ptv3_dino-S/test.log filter=lfs diff=lfs merge=lfs -text
41
  nuscenes/semseg-ptv3_dino-S/train.log filter=lfs diff=lfs merge=lfs -text
42
  semantic_kitti/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
 
 
40
  nuscenes/semseg-ptv3_dino-S/test.log filter=lfs diff=lfs merge=lfs -text
41
  nuscenes/semseg-ptv3_dino-S/train.log filter=lfs diff=lfs merge=lfs -text
42
  semantic_kitti/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
43
+ scannet200/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
scannet200/semseg-ptv3_dino-L/config.py ADDED
@@ -0,0 +1,403 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ weight = 'exp/scannet200/2025-02-28_175612/model/model_best.pth'
2
+ resume = False
3
+ evaluate = True
4
+ test_only = False
5
+ seed = 23761834
6
+ save_path = 'exp/scannet200/2025-02-28_175612'
7
+ wandb_project = 'semseg_scannet200'
8
+ num_worker = 24
9
+ batch_size = 12
10
+ batch_size_val = None
11
+ batch_size_test = None
12
+ epoch = 800
13
+ eval_epoch = 100
14
+ clip_grad = None
15
+ sync_bn = False
16
+ enable_amp = True
17
+ empty_cache = False
18
+ empty_cache_per_epoch = False
19
+ find_unused_parameters = False
20
+ mix_prob = 0.8
21
+ param_dicts = [dict(keyword='img_enc|block', lr=0.0006)]
22
+ hooks = [
23
+ dict(type='CheckpointLoader'),
24
+ dict(type='IterationTimer', warmup_iter=2),
25
+ dict(type='InformationWriter'),
26
+ dict(type='SemSegEvaluator'),
27
+ dict(type='CheckpointSaver', save_freq=None),
28
+ dict(type='PreciseEvaluator', test_last=False)
29
+ ]
30
+ train = dict(type='DefaultTrainer')
31
+ test = dict(type='SemSegTester', verbose=True)
32
+ CLASS_LABELS_200 = (
33
+ 'wall', 'chair', 'floor', 'table', 'door', 'couch', 'cabinet', 'shelf',
34
+ 'desk', 'office chair', 'bed', 'pillow', 'sink', 'picture', 'window',
35
+ 'toilet', 'bookshelf', 'monitor', 'curtain', 'book', 'armchair',
36
+ 'coffee table', 'box', 'refrigerator', 'lamp', 'kitchen cabinet', 'towel',
37
+ 'clothes', 'tv', 'nightstand', 'counter', 'dresser', 'stool', 'cushion',
38
+ 'plant', 'ceiling', 'bathtub', 'end table', 'dining table', 'keyboard',
39
+ 'bag', 'backpack', 'toilet paper', 'printer', 'tv stand', 'whiteboard',
40
+ 'blanket', 'shower curtain', 'trash can', 'closet', 'stairs', 'microwave',
41
+ 'stove', 'shoe', 'computer tower', 'bottle', 'bin', 'ottoman', 'bench',
42
+ 'board', 'washing machine', 'mirror', 'copier', 'basket', 'sofa chair',
43
+ 'file cabinet', 'fan', 'laptop', 'shower', 'paper', 'person',
44
+ 'paper towel dispenser', 'oven', 'blinds', 'rack', 'plate', 'blackboard',
45
+ 'piano', 'suitcase', 'rail', 'radiator', 'recycling bin', 'container',
46
+ 'wardrobe', 'soap dispenser', 'telephone', 'bucket', 'clock', 'stand',
47
+ 'light', 'laundry basket', 'pipe', 'clothes dryer', 'guitar',
48
+ 'toilet paper holder', 'seat', 'speaker', 'column', 'bicycle', 'ladder',
49
+ 'bathroom stall', 'shower wall', 'cup', 'jacket', 'storage bin',
50
+ 'coffee maker', 'dishwasher', 'paper towel roll', 'machine', 'mat',
51
+ 'windowsill', 'bar', 'toaster', 'bulletin board', 'ironing board',
52
+ 'fireplace', 'soap dish', 'kitchen counter', 'doorframe',
53
+ 'toilet paper dispenser', 'mini fridge', 'fire extinguisher', 'ball',
54
+ 'hat', 'shower curtain rod', 'water cooler', 'paper cutter', 'tray',
55
+ 'shower door', 'pillar', 'ledge', 'toaster oven', 'mouse',
56
+ 'toilet seat cover dispenser', 'furniture', 'cart', 'storage container',
57
+ 'scale', 'tissue box', 'light switch', 'crate', 'power outlet',
58
+ 'decoration', 'sign', 'projector', 'closet door', 'vacuum cleaner',
59
+ 'candle', 'plunger', 'stuffed animal', 'headphones', 'dish rack', 'broom',
60
+ 'guitar case', 'range hood', 'dustpan', 'hair dryer', 'water bottle',
61
+ 'handicap bar', 'purse', 'vent', 'shower floor', 'water pitcher',
62
+ 'mailbox', 'bowl', 'paper bag', 'alarm clock', 'music stand',
63
+ 'projector screen', 'divider', 'laundry detergent', 'bathroom counter',
64
+ 'object', 'bathroom vanity', 'closet wall', 'laundry hamper',
65
+ 'bathroom stall door', 'ceiling light', 'trash bin', 'dumbbell',
66
+ 'stair rail', 'tube', 'bathroom cabinet', 'cd case', 'closet rod',
67
+ 'coffee kettle', 'structure', 'shower head', 'keyboard piano',
68
+ 'case of water bottles', 'coat rack', 'storage organizer', 'folded chair',
69
+ 'fire alarm', 'power strip', 'calendar', 'poster', 'potted plant',
70
+ 'luggage', 'mattress')
71
+ model = dict(
72
+ type='DefaultSegmentorV2',
73
+ num_classes=200,
74
+ backbone_out_channels=64,
75
+ backbone=dict(
76
+ type='PT-v3m1-image',
77
+ in_channels=6,
78
+ order=('z', 'z-trans', 'hilbert', 'hilbert-trans'),
79
+ stride=(2, 2, 2, 2),
80
+ enc_depths=(2, 2, 2, 6, 2),
81
+ enc_channels=(32, 64, 128, 256, 512),
82
+ enc_num_head=(2, 4, 8, 16, 32),
83
+ enc_patch_size=(1024, 1024, 1024, 1024, 1024),
84
+ dec_depths=(2, 2, 2, 2),
85
+ dec_channels=(64, 64, 128, 256),
86
+ dec_num_head=(4, 4, 8, 16),
87
+ dec_patch_size=(1024, 1024, 1024, 1024),
88
+ mlp_ratio=4,
89
+ qkv_bias=True,
90
+ qk_scale=None,
91
+ init_values=None,
92
+ attn_drop=0.0,
93
+ proj_drop=0.0,
94
+ drop_path=0.3,
95
+ shuffle_orders=True,
96
+ pre_norm=True,
97
+ enable_rpe=False,
98
+ enable_flash=True,
99
+ upcast_attention=False,
100
+ upcast_softmax=False,
101
+ cls_mode=False,
102
+ pdnorm_bn=False,
103
+ pdnorm_ln=False,
104
+ pdnorm_decouple=True,
105
+ pdnorm_adaptive=False,
106
+ pdnorm_affine=True,
107
+ pdnorm_conditions=('ScanNet', 'S3DIS', 'Structured3D'),
108
+ dinov2='large'),
109
+ criteria=[
110
+ dict(type='CrossEntropyLoss', loss_weight=1.0, ignore_index=-1),
111
+ dict(
112
+ type='LovaszLoss',
113
+ mode='multiclass',
114
+ loss_weight=1.0,
115
+ ignore_index=-1)
116
+ ])
117
+ optimizer = dict(type='AdamW', lr=0.006, weight_decay=0.05)
118
+ scheduler = dict(
119
+ type='OneCycleLR',
120
+ max_lr=[0.006, 0.0006],
121
+ pct_start=0.05,
122
+ anneal_strategy='cos',
123
+ div_factor=10.0,
124
+ final_div_factor=1000.0)
125
+ dataset_type = 'ScanNet200Dataset'
126
+ data_root = 'data/scannet'
127
+ data = dict(
128
+ num_classes=200,
129
+ ignore_index=-1,
130
+ names=(
131
+ 'wall', 'chair', 'floor', 'table', 'door', 'couch', 'cabinet', 'shelf',
132
+ 'desk', 'office chair', 'bed', 'pillow', 'sink', 'picture', 'window',
133
+ 'toilet', 'bookshelf', 'monitor', 'curtain', 'book', 'armchair',
134
+ 'coffee table', 'box', 'refrigerator', 'lamp', 'kitchen cabinet',
135
+ 'towel', 'clothes', 'tv', 'nightstand', 'counter', 'dresser', 'stool',
136
+ 'cushion', 'plant', 'ceiling', 'bathtub', 'end table', 'dining table',
137
+ 'keyboard', 'bag', 'backpack', 'toilet paper', 'printer', 'tv stand',
138
+ 'whiteboard', 'blanket', 'shower curtain', 'trash can', 'closet',
139
+ 'stairs', 'microwave', 'stove', 'shoe', 'computer tower', 'bottle',
140
+ 'bin', 'ottoman', 'bench', 'board', 'washing machine', 'mirror',
141
+ 'copier', 'basket', 'sofa chair', 'file cabinet', 'fan', 'laptop',
142
+ 'shower', 'paper', 'person', 'paper towel dispenser', 'oven', 'blinds',
143
+ 'rack', 'plate', 'blackboard', 'piano', 'suitcase', 'rail', 'radiator',
144
+ 'recycling bin', 'container', 'wardrobe', 'soap dispenser',
145
+ 'telephone', 'bucket', 'clock', 'stand', 'light', 'laundry basket',
146
+ 'pipe', 'clothes dryer', 'guitar', 'toilet paper holder', 'seat',
147
+ 'speaker', 'column', 'bicycle', 'ladder', 'bathroom stall',
148
+ 'shower wall', 'cup', 'jacket', 'storage bin', 'coffee maker',
149
+ 'dishwasher', 'paper towel roll', 'machine', 'mat', 'windowsill',
150
+ 'bar', 'toaster', 'bulletin board', 'ironing board', 'fireplace',
151
+ 'soap dish', 'kitchen counter', 'doorframe', 'toilet paper dispenser',
152
+ 'mini fridge', 'fire extinguisher', 'ball', 'hat',
153
+ 'shower curtain rod', 'water cooler', 'paper cutter', 'tray',
154
+ 'shower door', 'pillar', 'ledge', 'toaster oven', 'mouse',
155
+ 'toilet seat cover dispenser', 'furniture', 'cart',
156
+ 'storage container', 'scale', 'tissue box', 'light switch', 'crate',
157
+ 'power outlet', 'decoration', 'sign', 'projector', 'closet door',
158
+ 'vacuum cleaner', 'candle', 'plunger', 'stuffed animal', 'headphones',
159
+ 'dish rack', 'broom', 'guitar case', 'range hood', 'dustpan',
160
+ 'hair dryer', 'water bottle', 'handicap bar', 'purse', 'vent',
161
+ 'shower floor', 'water pitcher', 'mailbox', 'bowl', 'paper bag',
162
+ 'alarm clock', 'music stand', 'projector screen', 'divider',
163
+ 'laundry detergent', 'bathroom counter', 'object', 'bathroom vanity',
164
+ 'closet wall', 'laundry hamper', 'bathroom stall door',
165
+ 'ceiling light', 'trash bin', 'dumbbell', 'stair rail', 'tube',
166
+ 'bathroom cabinet', 'cd case', 'closet rod', 'coffee kettle',
167
+ 'structure', 'shower head', 'keyboard piano', 'case of water bottles',
168
+ 'coat rack', 'storage organizer', 'folded chair', 'fire alarm',
169
+ 'power strip', 'calendar', 'poster', 'potted plant', 'luggage',
170
+ 'mattress'),
171
+ train=dict(
172
+ type='ScanNet200Dataset',
173
+ split='train',
174
+ data_root='data/scannet',
175
+ with_images=10,
176
+ transform=[
177
+ dict(type='ImageResize', size=[420, 560]),
178
+ dict(
179
+ type='ImageColorJitter',
180
+ brightness=0.4,
181
+ contrast=0.4,
182
+ saturation=0.2,
183
+ hue=0.1),
184
+ dict(type='ImageRandomHorizontalFlip'),
185
+ dict(type='ImageNormalize'),
186
+ dict(type='CenterShift', apply_z=True),
187
+ dict(
188
+ type='RandomDropout',
189
+ dropout_ratio=0.2,
190
+ dropout_application_ratio=0.2),
191
+ dict(
192
+ type='RandomRotate',
193
+ angle=[-1, 1],
194
+ axis='z',
195
+ center=[0, 0, 0],
196
+ p=0.5),
197
+ dict(
198
+ type='RandomRotate',
199
+ angle=[-0.015625, 0.015625],
200
+ axis='x',
201
+ p=0.5),
202
+ dict(
203
+ type='RandomRotate',
204
+ angle=[-0.015625, 0.015625],
205
+ axis='y',
206
+ p=0.5),
207
+ dict(type='RandomScale', scale=[0.9, 1.1]),
208
+ dict(type='RandomFlip', p=0.5),
209
+ dict(type='RandomJitter', sigma=0.005, clip=0.02),
210
+ dict(
211
+ type='ElasticDistortion',
212
+ distortion_params=[[0.2, 0.4], [0.8, 1.6]]),
213
+ dict(type='ChromaticAutoContrast', p=0.2, blend_factor=None),
214
+ dict(type='ChromaticTranslation', p=0.95, ratio=0.05),
215
+ dict(type='ChromaticJitter', p=0.95, std=0.05),
216
+ dict(
217
+ type='GridSample',
218
+ grid_size=0.02,
219
+ hash_type='fnv',
220
+ mode='train',
221
+ keys=('coord', 'color', 'normal', 'segment', 'image_coord',
222
+ 'image_mask'),
223
+ return_grid_coord=True),
224
+ dict(type='SphereCrop', point_max=102400, mode='random'),
225
+ dict(type='CenterShift', apply_z=False),
226
+ dict(type='NormalizeColor'),
227
+ dict(type='ToTensor'),
228
+ dict(
229
+ type='Collect',
230
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
231
+ 'image_mask'),
232
+ feat_keys=('color', 'normal'))
233
+ ],
234
+ test_mode=False,
235
+ loop=8),
236
+ val=dict(
237
+ type='ScanNet200Dataset',
238
+ split='val',
239
+ data_root='data/scannet',
240
+ with_images=10,
241
+ transform=[
242
+ dict(type='ImageResize', size=[420, 560]),
243
+ dict(type='ImageNormalize'),
244
+ dict(type='CenterShift', apply_z=True),
245
+ dict(
246
+ type='GridSample',
247
+ grid_size=0.02,
248
+ hash_type='fnv',
249
+ mode='train',
250
+ keys=('coord', 'color', 'normal', 'segment', 'image_coord',
251
+ 'image_mask'),
252
+ return_grid_coord=True),
253
+ dict(type='CenterShift', apply_z=False),
254
+ dict(type='NormalizeColor'),
255
+ dict(type='ToTensor'),
256
+ dict(
257
+ type='Collect',
258
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
259
+ 'image_mask'),
260
+ feat_keys=('color', 'normal'))
261
+ ],
262
+ test_mode=False),
263
+ test=dict(
264
+ type='ScanNet200Dataset',
265
+ split='val',
266
+ data_root='data/scannet',
267
+ with_images=10,
268
+ transform=[
269
+ dict(type='CenterShift', apply_z=True),
270
+ dict(type='NormalizeColor')
271
+ ],
272
+ test_mode=True,
273
+ test_cfg=dict(
274
+ voxelize=dict(
275
+ type='GridSample',
276
+ grid_size=0.02,
277
+ hash_type='fnv',
278
+ mode='test',
279
+ keys=('coord', 'color', 'normal', 'image_coord', 'image_mask'),
280
+ return_grid_coord=True),
281
+ crop=None,
282
+ post_transform=[
283
+ dict(type='ImageResize', size=[420, 560]),
284
+ dict(type='ImageNormalize'),
285
+ dict(type='CenterShift', apply_z=False),
286
+ dict(type='ToTensor'),
287
+ dict(
288
+ type='Collect',
289
+ keys=('coord', 'grid_coord', 'index', 'image',
290
+ 'image_coord', 'image_mask'),
291
+ feat_keys=('color', 'normal'))
292
+ ],
293
+ aug_transform=[[{
294
+ 'type': 'RandomRotateTargetAngle',
295
+ 'angle': [0],
296
+ 'axis': 'z',
297
+ 'center': [0, 0, 0],
298
+ 'p': 1
299
+ }],
300
+ [{
301
+ 'type': 'RandomRotateTargetAngle',
302
+ 'angle': [0.5],
303
+ 'axis': 'z',
304
+ 'center': [0, 0, 0],
305
+ 'p': 1
306
+ }],
307
+ [{
308
+ 'type': 'RandomRotateTargetAngle',
309
+ 'angle': [1],
310
+ 'axis': 'z',
311
+ 'center': [0, 0, 0],
312
+ 'p': 1
313
+ }],
314
+ [{
315
+ 'type': 'RandomRotateTargetAngle',
316
+ 'angle': [1.5],
317
+ 'axis': 'z',
318
+ 'center': [0, 0, 0],
319
+ 'p': 1
320
+ }],
321
+ [{
322
+ 'type': 'RandomRotateTargetAngle',
323
+ 'angle': [0],
324
+ 'axis': 'z',
325
+ 'center': [0, 0, 0],
326
+ 'p': 1
327
+ }, {
328
+ 'type': 'RandomScale',
329
+ 'scale': [0.95, 0.95]
330
+ }],
331
+ [{
332
+ 'type': 'RandomRotateTargetAngle',
333
+ 'angle': [0.5],
334
+ 'axis': 'z',
335
+ 'center': [0, 0, 0],
336
+ 'p': 1
337
+ }, {
338
+ 'type': 'RandomScale',
339
+ 'scale': [0.95, 0.95]
340
+ }],
341
+ [{
342
+ 'type': 'RandomRotateTargetAngle',
343
+ 'angle': [1],
344
+ 'axis': 'z',
345
+ 'center': [0, 0, 0],
346
+ 'p': 1
347
+ }, {
348
+ 'type': 'RandomScale',
349
+ 'scale': [0.95, 0.95]
350
+ }],
351
+ [{
352
+ 'type': 'RandomRotateTargetAngle',
353
+ 'angle': [1.5],
354
+ 'axis': 'z',
355
+ 'center': [0, 0, 0],
356
+ 'p': 1
357
+ }, {
358
+ 'type': 'RandomScale',
359
+ 'scale': [0.95, 0.95]
360
+ }],
361
+ [{
362
+ 'type': 'RandomRotateTargetAngle',
363
+ 'angle': [0],
364
+ 'axis': 'z',
365
+ 'center': [0, 0, 0],
366
+ 'p': 1
367
+ }, {
368
+ 'type': 'RandomScale',
369
+ 'scale': [1.05, 1.05]
370
+ }],
371
+ [{
372
+ 'type': 'RandomRotateTargetAngle',
373
+ 'angle': [0.5],
374
+ 'axis': 'z',
375
+ 'center': [0, 0, 0],
376
+ 'p': 1
377
+ }, {
378
+ 'type': 'RandomScale',
379
+ 'scale': [1.05, 1.05]
380
+ }],
381
+ [{
382
+ 'type': 'RandomRotateTargetAngle',
383
+ 'angle': [1],
384
+ 'axis': 'z',
385
+ 'center': [0, 0, 0],
386
+ 'p': 1
387
+ }, {
388
+ 'type': 'RandomScale',
389
+ 'scale': [1.05, 1.05]
390
+ }],
391
+ [{
392
+ 'type': 'RandomRotateTargetAngle',
393
+ 'angle': [1.5],
394
+ 'axis': 'z',
395
+ 'center': [0, 0, 0],
396
+ 'p': 1
397
+ }, {
398
+ 'type': 'RandomScale',
399
+ 'scale': [1.05, 1.05]
400
+ }], [{
401
+ 'type': 'RandomFlip',
402
+ 'p': 1
403
+ }]])))
scannet200/semseg-ptv3_dino-L/events.out.tfevents.1740761874.n23g0025.hpc.itc.rwth-aachen.de ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:549b47fa5842b31458814bbb1accee76c81dcb5ffa7e7fe8513bec379273d894
3
+ size 7830557
scannet200/semseg-ptv3_dino-L/model/model_best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8088636a8365054af12def50e23ba4db3c8fcc0bae2f3e4da357ded513de95c
3
+ size 561061040
scannet200/semseg-ptv3_dino-L/model/model_last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73c47946da58b9b9032a03a4b9d21e344ef5d219896330fe2403d99ead474ce9
3
+ size 561061040
scannet200/semseg-ptv3_dino-L/test.log ADDED
The diff for this file is too large to render. See raw diff
 
scannet200/semseg-ptv3_dino-L/train.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2ae21a9ea0d2747a75322f20873be6d1ae373f7b5adf271d1396bce854fad2
3
+ size 18577380