TensorBoard
karimknaebel commited on
Commit
beb24c1
·
verified ·
1 Parent(s): 0a84ac1

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -35,3 +35,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  nuscenes/semseg-ptv3_dino-g/train.log filter=lfs diff=lfs merge=lfs -text
37
  nuscenes/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
 
 
 
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  nuscenes/semseg-ptv3_dino-g/train.log filter=lfs diff=lfs merge=lfs -text
37
  nuscenes/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
38
+ nuscenes/semseg-ptv3_dino-B/test.log filter=lfs diff=lfs merge=lfs -text
39
+ nuscenes/semseg-ptv3_dino-B/train.log filter=lfs diff=lfs merge=lfs -text
nuscenes/semseg-ptv3_dino-B/config.py ADDED
@@ -0,0 +1,260 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ weight = 'exp/nuscenes/semseg-ptv3_dino-B/model/model_best.pth'
2
+ resume = False
3
+ evaluate = True
4
+ test_only = False
5
+ seed = 4895131
6
+ save_path = 'exp/nuscenes/semseg-ptv3_dino-B'
7
+ wandb_project = 'semseg_nuscenes'
8
+ num_worker = 16
9
+ batch_size = 12
10
+ batch_size_val = None
11
+ batch_size_test = None
12
+ epoch = 50
13
+ eval_epoch = 50
14
+ clip_grad = None
15
+ sync_bn = False
16
+ enable_amp = True
17
+ empty_cache = False
18
+ empty_cache_per_epoch = False
19
+ find_unused_parameters = False
20
+ mix_prob = 0.8
21
+ param_dicts = [dict(keyword='img_enc|block', lr=0.0002)]
22
+ hooks = [
23
+ dict(type='CheckpointLoader'),
24
+ dict(type='IterationTimer', warmup_iter=2),
25
+ dict(type='InformationWriter'),
26
+ dict(type='SemSegEvaluator'),
27
+ dict(type='CheckpointSaver', save_freq=None)
28
+ ]
29
+ train = dict(type='DefaultTrainer')
30
+ test = dict(type='SemSegTester', verbose=True)
31
+ model = dict(
32
+ type='DefaultSegmentorV2',
33
+ num_classes=16,
34
+ backbone_out_channels=64,
35
+ backbone=dict(
36
+ type='PT-v3m1-image',
37
+ in_channels=4,
38
+ order=['z', 'z-trans', 'hilbert', 'hilbert-trans'],
39
+ stride=(2, 2, 2, 2),
40
+ enc_depths=(2, 2, 2, 6, 2),
41
+ enc_channels=(32, 64, 128, 256, 512),
42
+ enc_num_head=(2, 4, 8, 16, 32),
43
+ enc_patch_size=(1024, 1024, 1024, 1024, 1024),
44
+ dec_depths=(2, 2, 2, 2),
45
+ dec_channels=(64, 64, 128, 256),
46
+ dec_num_head=(4, 4, 8, 16),
47
+ dec_patch_size=(1024, 1024, 1024, 1024),
48
+ mlp_ratio=4,
49
+ qkv_bias=True,
50
+ qk_scale=None,
51
+ init_values=None,
52
+ attn_drop=0.0,
53
+ proj_drop=0.0,
54
+ drop_path=0.3,
55
+ shuffle_orders=True,
56
+ pre_norm=True,
57
+ enable_rpe=False,
58
+ enable_flash=True,
59
+ upcast_attention=False,
60
+ upcast_softmax=False,
61
+ cls_mode=False,
62
+ pdnorm_bn=False,
63
+ pdnorm_ln=False,
64
+ pdnorm_decouple=True,
65
+ pdnorm_adaptive=False,
66
+ pdnorm_affine=True,
67
+ pdnorm_conditions=('nuScenes', 'SemanticKITTI', 'Waymo'),
68
+ dinov2='base',
69
+ dinov2_missing_embedding=False,
70
+ dinov2_drop=0.0,
71
+ dinov2_lora=0,
72
+ dinov2_frozen=True),
73
+ criteria=[
74
+ dict(type='CrossEntropyLoss', loss_weight=1.0, ignore_index=-1),
75
+ dict(
76
+ type='LovaszLoss',
77
+ mode='multiclass',
78
+ loss_weight=1.0,
79
+ ignore_index=-1)
80
+ ])
81
+ optimizer = dict(type='AdamW', lr=0.002, weight_decay=0.005)
82
+ scheduler = dict(
83
+ type='OneCycleLR',
84
+ max_lr=[0.002, 0.0002],
85
+ pct_start=0.04,
86
+ anneal_strategy='cos',
87
+ div_factor=10.0,
88
+ final_div_factor=100.0)
89
+ dataset_type = 'NuScenesDataset'
90
+ data_root = 'data/nuscenes'
91
+ ignore_index = -1
92
+ names = [
93
+ 'barrier', 'bicycle', 'bus', 'car', 'construction_vehicle', 'motorcycle',
94
+ 'pedestrian', 'traffic_cone', 'trailer', 'truck', 'driveable_surface',
95
+ 'other_flat', 'sidewalk', 'terrain', 'manmade', 'vegetation'
96
+ ]
97
+ data = dict(
98
+ num_classes=16,
99
+ ignore_index=-1,
100
+ names=[
101
+ 'barrier', 'bicycle', 'bus', 'car', 'construction_vehicle',
102
+ 'motorcycle', 'pedestrian', 'traffic_cone', 'trailer', 'truck',
103
+ 'driveable_surface', 'other_flat', 'sidewalk', 'terrain', 'manmade',
104
+ 'vegetation'
105
+ ],
106
+ train=dict(
107
+ type='NuScenesDataset',
108
+ split='train',
109
+ data_root='data/nuscenes',
110
+ with_images=True,
111
+ transform=[
112
+ dict(type='ImageResize', size=[378, 672]),
113
+ dict(
114
+ type='ImageColorJitter',
115
+ brightness=0.4,
116
+ contrast=0.4,
117
+ saturation=0.2,
118
+ hue=0.1),
119
+ dict(type='ImageRandomHorizontalFlip'),
120
+ dict(type='ImageNormalize'),
121
+ dict(
122
+ type='RandomRotate',
123
+ angle=[-1, 1],
124
+ axis='z',
125
+ center=[0, 0, 0],
126
+ p=0.5),
127
+ dict(type='RandomScale', scale=[0.9, 1.1]),
128
+ dict(type='RandomFlip', p=0.5),
129
+ dict(type='RandomJitter', sigma=0.005, clip=0.02),
130
+ dict(
131
+ type='GridSample',
132
+ grid_size=0.05,
133
+ hash_type='fnv',
134
+ mode='train',
135
+ keys=('coord', 'strength', 'segment', 'image_coord',
136
+ 'image_mask'),
137
+ return_grid_coord=True),
138
+ dict(type='ToTensor'),
139
+ dict(
140
+ type='Collect',
141
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
142
+ 'image_mask'),
143
+ feat_keys=('coord', 'strength'))
144
+ ],
145
+ test_mode=False,
146
+ ignore_index=-1,
147
+ loop=1),
148
+ val=dict(
149
+ type='NuScenesDataset',
150
+ split='val',
151
+ data_root='data/nuscenes',
152
+ with_images=True,
153
+ transform=[
154
+ dict(type='ImageResize', size=[378, 672]),
155
+ dict(type='ImageNormalize'),
156
+ dict(
157
+ type='GridSample',
158
+ grid_size=0.05,
159
+ hash_type='fnv',
160
+ mode='train',
161
+ keys=('coord', 'strength', 'segment', 'image_coord',
162
+ 'image_mask'),
163
+ return_grid_coord=True),
164
+ dict(type='ToTensor'),
165
+ dict(
166
+ type='Collect',
167
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
168
+ 'image_mask'),
169
+ feat_keys=('coord', 'strength'))
170
+ ],
171
+ test_mode=False,
172
+ ignore_index=-1),
173
+ test=dict(
174
+ type='NuScenesDataset',
175
+ split='val',
176
+ data_root='data/nuscenes',
177
+ with_images=True,
178
+ transform=[
179
+ dict(type='ImageResize', size=[378, 672]),
180
+ dict(type='Copy', keys_dict=dict(segment='origin_segment')),
181
+ dict(
182
+ type='GridSample',
183
+ grid_size=0.025,
184
+ hash_type='fnv',
185
+ mode='train',
186
+ keys=('coord', 'strength', 'segment', 'image_coord',
187
+ 'image_mask'),
188
+ return_inverse=True)
189
+ ],
190
+ test_mode=True,
191
+ test_cfg=dict(
192
+ voxelize=dict(
193
+ type='GridSample',
194
+ grid_size=0.05,
195
+ hash_type='fnv',
196
+ mode='test',
197
+ return_grid_coord=True,
198
+ keys=('coord', 'strength', 'image_coord', 'image_mask')),
199
+ crop=None,
200
+ post_transform=[
201
+ dict(type='ImageNormalize'),
202
+ dict(type='ToTensor'),
203
+ dict(
204
+ type='Collect',
205
+ keys=('coord', 'grid_coord', 'index', 'image',
206
+ 'image_coord', 'image_mask'),
207
+ feat_keys=('coord', 'strength'))
208
+ ],
209
+ aug_transform=[[{
210
+ 'type': 'RandomScale',
211
+ 'scale': [0.9, 0.9]
212
+ }], [{
213
+ 'type': 'RandomScale',
214
+ 'scale': [0.95, 0.95]
215
+ }], [{
216
+ 'type': 'RandomScale',
217
+ 'scale': [1, 1]
218
+ }], [{
219
+ 'type': 'RandomScale',
220
+ 'scale': [1.05, 1.05]
221
+ }], [{
222
+ 'type': 'RandomScale',
223
+ 'scale': [1.1, 1.1]
224
+ }],
225
+ [{
226
+ 'type': 'RandomScale',
227
+ 'scale': [0.9, 0.9]
228
+ }, {
229
+ 'type': 'RandomFlip',
230
+ 'p': 1
231
+ }],
232
+ [{
233
+ 'type': 'RandomScale',
234
+ 'scale': [0.95, 0.95]
235
+ }, {
236
+ 'type': 'RandomFlip',
237
+ 'p': 1
238
+ }],
239
+ [{
240
+ 'type': 'RandomScale',
241
+ 'scale': [1, 1]
242
+ }, {
243
+ 'type': 'RandomFlip',
244
+ 'p': 1
245
+ }],
246
+ [{
247
+ 'type': 'RandomScale',
248
+ 'scale': [1.05, 1.05]
249
+ }, {
250
+ 'type': 'RandomFlip',
251
+ 'p': 1
252
+ }],
253
+ [{
254
+ 'type': 'RandomScale',
255
+ 'scale': [1.1, 1.1]
256
+ }, {
257
+ 'type': 'RandomFlip',
258
+ 'p': 1
259
+ }]]),
260
+ ignore_index=-1))
nuscenes/semseg-ptv3_dino-B/events.out.tfevents.1731234639.w23g0013.hpc.itc.rwth-aachen.de ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:290aa19b38a1a37eb11cc79969c53d06e58cbfc86a6b62eb3dc73e7e4f90f693
3
+ size 11464320
nuscenes/semseg-ptv3_dino-B/model/model_best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0927905c25fbbc392d981fc46962e18eb27f41b20685b8949e2717c93fcf8997
3
+ size 559248752
nuscenes/semseg-ptv3_dino-B/model/model_last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:561300a648bcfa64bd95ae82081212888fb60919f80f1786968472a3ea3640c6
3
+ size 559248752
nuscenes/semseg-ptv3_dino-B/test.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9f40f784a5ea9e53e31ac488df131639aeefb3d7b9436a0564c820ba52b5803
3
+ size 16687931
nuscenes/semseg-ptv3_dino-B/train.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a0a78c8acd8145a70c21775c017541452d19e865e07cbd793187f9566425edb
3
+ size 32320993