TensorBoard
karimknaebel commited on
Commit
035d482
·
verified ·
1 Parent(s): 43fbf00

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ nuscenes/semseg-ptv3_dino-g/train.log filter=lfs diff=lfs merge=lfs -text
nuscenes/semseg-ptv3_dino-g/config.py ADDED
@@ -0,0 +1,261 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ weight = None
2
+ resume = False
3
+ evaluate = True
4
+ test_only = False
5
+ seed = 38690432
6
+ save_path = 'exp/nuscenes/semseg-ptv3_dino-g'
7
+ wandb_project = 'semseg_nuscenes'
8
+ num_worker = 16
9
+ batch_size = 12
10
+ batch_size_val = None
11
+ batch_size_test = None
12
+ epoch = 50
13
+ eval_epoch = 50
14
+ clip_grad = None
15
+ sync_bn = False
16
+ enable_amp = True
17
+ empty_cache = False
18
+ empty_cache_per_epoch = False
19
+ find_unused_parameters = False
20
+ mix_prob = 0.8
21
+ param_dicts = [dict(keyword='img_enc|block', lr=0.0002)]
22
+ hooks = [
23
+ dict(type='CheckpointLoader'),
24
+ dict(type='IterationTimer', warmup_iter=2),
25
+ dict(type='InformationWriter'),
26
+ dict(type='SemSegEvaluator'),
27
+ dict(type='CheckpointSaver', save_freq=None),
28
+ dict(type='PreciseEvaluator', test_last=False)
29
+ ]
30
+ train = dict(type='DefaultTrainer')
31
+ test = dict(type='SemSegTester', verbose=True)
32
+ model = dict(
33
+ type='DefaultSegmentorV2',
34
+ num_classes=16,
35
+ backbone_out_channels=64,
36
+ backbone=dict(
37
+ type='PT-v3m1-image',
38
+ in_channels=4,
39
+ order=['z', 'z-trans', 'hilbert', 'hilbert-trans'],
40
+ stride=(2, 2, 2, 2),
41
+ enc_depths=(2, 2, 2, 6, 2),
42
+ enc_channels=(32, 64, 128, 256, 512),
43
+ enc_num_head=(2, 4, 8, 16, 32),
44
+ enc_patch_size=(1024, 1024, 1024, 1024, 1024),
45
+ dec_depths=(2, 2, 2, 2),
46
+ dec_channels=(64, 64, 128, 256),
47
+ dec_num_head=(4, 4, 8, 16),
48
+ dec_patch_size=(1024, 1024, 1024, 1024),
49
+ mlp_ratio=4,
50
+ qkv_bias=True,
51
+ qk_scale=None,
52
+ init_values=None,
53
+ attn_drop=0.0,
54
+ proj_drop=0.0,
55
+ drop_path=0.3,
56
+ shuffle_orders=True,
57
+ pre_norm=True,
58
+ enable_rpe=False,
59
+ enable_flash=True,
60
+ upcast_attention=False,
61
+ upcast_softmax=False,
62
+ cls_mode=False,
63
+ pdnorm_bn=False,
64
+ pdnorm_ln=False,
65
+ pdnorm_decouple=True,
66
+ pdnorm_adaptive=False,
67
+ pdnorm_affine=True,
68
+ pdnorm_conditions=('nuScenes', 'SemanticKITTI', 'Waymo'),
69
+ dinov2='giant',
70
+ dinov2_missing_embedding=False,
71
+ dinov2_drop=0.0,
72
+ dinov2_lora=0,
73
+ dinov2_frozen=True),
74
+ criteria=[
75
+ dict(type='CrossEntropyLoss', loss_weight=1.0, ignore_index=-1),
76
+ dict(
77
+ type='LovaszLoss',
78
+ mode='multiclass',
79
+ loss_weight=1.0,
80
+ ignore_index=-1)
81
+ ])
82
+ optimizer = dict(type='AdamW', lr=0.002, weight_decay=0.005)
83
+ scheduler = dict(
84
+ type='OneCycleLR',
85
+ max_lr=[0.002, 0.0002],
86
+ pct_start=0.04,
87
+ anneal_strategy='cos',
88
+ div_factor=10.0,
89
+ final_div_factor=100.0)
90
+ dataset_type = 'NuScenesDataset'
91
+ data_root = 'data/nuscenes'
92
+ ignore_index = -1
93
+ names = [
94
+ 'barrier', 'bicycle', 'bus', 'car', 'construction_vehicle', 'motorcycle',
95
+ 'pedestrian', 'traffic_cone', 'trailer', 'truck', 'driveable_surface',
96
+ 'other_flat', 'sidewalk', 'terrain', 'manmade', 'vegetation'
97
+ ]
98
+ data = dict(
99
+ num_classes=16,
100
+ ignore_index=-1,
101
+ names=[
102
+ 'barrier', 'bicycle', 'bus', 'car', 'construction_vehicle',
103
+ 'motorcycle', 'pedestrian', 'traffic_cone', 'trailer', 'truck',
104
+ 'driveable_surface', 'other_flat', 'sidewalk', 'terrain', 'manmade',
105
+ 'vegetation'
106
+ ],
107
+ train=dict(
108
+ type='NuScenesDataset',
109
+ split='train',
110
+ data_root='data/nuscenes',
111
+ with_images=True,
112
+ transform=[
113
+ dict(type='ImageResize', size=[378, 672]),
114
+ dict(
115
+ type='ImageColorJitter',
116
+ brightness=0.4,
117
+ contrast=0.4,
118
+ saturation=0.2,
119
+ hue=0.1),
120
+ dict(type='ImageRandomHorizontalFlip'),
121
+ dict(type='ImageNormalize'),
122
+ dict(
123
+ type='RandomRotate',
124
+ angle=[-1, 1],
125
+ axis='z',
126
+ center=[0, 0, 0],
127
+ p=0.5),
128
+ dict(type='RandomScale', scale=[0.9, 1.1]),
129
+ dict(type='RandomFlip', p=0.5),
130
+ dict(type='RandomJitter', sigma=0.005, clip=0.02),
131
+ dict(
132
+ type='GridSample',
133
+ grid_size=0.05,
134
+ hash_type='fnv',
135
+ mode='train',
136
+ keys=('coord', 'strength', 'segment', 'image_coord',
137
+ 'image_mask'),
138
+ return_grid_coord=True),
139
+ dict(type='ToTensor'),
140
+ dict(
141
+ type='Collect',
142
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
143
+ 'image_mask'),
144
+ feat_keys=('coord', 'strength'))
145
+ ],
146
+ test_mode=False,
147
+ ignore_index=-1,
148
+ loop=1),
149
+ val=dict(
150
+ type='NuScenesDataset',
151
+ split='val',
152
+ data_root='data/nuscenes',
153
+ with_images=True,
154
+ transform=[
155
+ dict(type='ImageResize', size=[378, 672]),
156
+ dict(type='ImageNormalize'),
157
+ dict(
158
+ type='GridSample',
159
+ grid_size=0.05,
160
+ hash_type='fnv',
161
+ mode='train',
162
+ keys=('coord', 'strength', 'segment', 'image_coord',
163
+ 'image_mask'),
164
+ return_grid_coord=True),
165
+ dict(type='ToTensor'),
166
+ dict(
167
+ type='Collect',
168
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
169
+ 'image_mask'),
170
+ feat_keys=('coord', 'strength'))
171
+ ],
172
+ test_mode=False,
173
+ ignore_index=-1),
174
+ test=dict(
175
+ type='NuScenesDataset',
176
+ split='val',
177
+ data_root='data/nuscenes',
178
+ with_images=True,
179
+ transform=[
180
+ dict(type='ImageResize', size=[378, 672]),
181
+ dict(type='Copy', keys_dict=dict(segment='origin_segment')),
182
+ dict(
183
+ type='GridSample',
184
+ grid_size=0.025,
185
+ hash_type='fnv',
186
+ mode='train',
187
+ keys=('coord', 'strength', 'segment', 'image_coord',
188
+ 'image_mask'),
189
+ return_inverse=True)
190
+ ],
191
+ test_mode=True,
192
+ test_cfg=dict(
193
+ voxelize=dict(
194
+ type='GridSample',
195
+ grid_size=0.05,
196
+ hash_type='fnv',
197
+ mode='test',
198
+ return_grid_coord=True,
199
+ keys=('coord', 'strength', 'image_coord', 'image_mask')),
200
+ crop=None,
201
+ post_transform=[
202
+ dict(type='ImageNormalize'),
203
+ dict(type='ToTensor'),
204
+ dict(
205
+ type='Collect',
206
+ keys=('coord', 'grid_coord', 'index', 'image',
207
+ 'image_coord', 'image_mask'),
208
+ feat_keys=('coord', 'strength'))
209
+ ],
210
+ aug_transform=[[{
211
+ 'type': 'RandomScale',
212
+ 'scale': [0.9, 0.9]
213
+ }], [{
214
+ 'type': 'RandomScale',
215
+ 'scale': [0.95, 0.95]
216
+ }], [{
217
+ 'type': 'RandomScale',
218
+ 'scale': [1, 1]
219
+ }], [{
220
+ 'type': 'RandomScale',
221
+ 'scale': [1.05, 1.05]
222
+ }], [{
223
+ 'type': 'RandomScale',
224
+ 'scale': [1.1, 1.1]
225
+ }],
226
+ [{
227
+ 'type': 'RandomScale',
228
+ 'scale': [0.9, 0.9]
229
+ }, {
230
+ 'type': 'RandomFlip',
231
+ 'p': 1
232
+ }],
233
+ [{
234
+ 'type': 'RandomScale',
235
+ 'scale': [0.95, 0.95]
236
+ }, {
237
+ 'type': 'RandomFlip',
238
+ 'p': 1
239
+ }],
240
+ [{
241
+ 'type': 'RandomScale',
242
+ 'scale': [1, 1]
243
+ }, {
244
+ 'type': 'RandomFlip',
245
+ 'p': 1
246
+ }],
247
+ [{
248
+ 'type': 'RandomScale',
249
+ 'scale': [1.05, 1.05]
250
+ }, {
251
+ 'type': 'RandomFlip',
252
+ 'p': 1
253
+ }],
254
+ [{
255
+ 'type': 'RandomScale',
256
+ 'scale': [1.1, 1.1]
257
+ }, {
258
+ 'type': 'RandomFlip',
259
+ 'p': 1
260
+ }]]),
261
+ ignore_index=-1))
nuscenes/semseg-ptv3_dino-g/events.out.tfevents.1731419596.n23g0016.hpc.itc.rwth-aachen.de ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57a9b7d94e4fbee4a5103bff83c776e29e45a2061c36a7feede432a2ac035196
3
+ size 11464457
nuscenes/semseg-ptv3_dino-g/model/model_best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ac78b93852fb8444498a473a6ea91e91616dd222a620fb49ba2e7d2912e0a99
3
+ size 563967344
nuscenes/semseg-ptv3_dino-g/model/model_last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18431860100702507669d418d34d2913c513cd5c81b579d1ceb17543afe8bfd6
3
+ size 563967344
nuscenes/semseg-ptv3_dino-g/train.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9be3187a6a54ab2963a102e73c85b8fd7bc9e47f530ca4208473780ab64b5ae
3
+ size 41951454