TensorBoard
karimknaebel commited on
Commit
054f3ed
·
verified ·
1 Parent(s): aad5a45

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -39,3 +39,4 @@ nuscenes/semseg-ptv3_dino-B/test.log filter=lfs diff=lfs merge=lfs -text
39
  nuscenes/semseg-ptv3_dino-B/train.log filter=lfs diff=lfs merge=lfs -text
40
  nuscenes/semseg-ptv3_dino-S/test.log filter=lfs diff=lfs merge=lfs -text
41
  nuscenes/semseg-ptv3_dino-S/train.log filter=lfs diff=lfs merge=lfs -text
 
 
39
  nuscenes/semseg-ptv3_dino-B/train.log filter=lfs diff=lfs merge=lfs -text
40
  nuscenes/semseg-ptv3_dino-S/test.log filter=lfs diff=lfs merge=lfs -text
41
  nuscenes/semseg-ptv3_dino-S/train.log filter=lfs diff=lfs merge=lfs -text
42
+ semantic_kitti/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
semantic_kitti/semseg-ptv3_dino-L/config.py ADDED
@@ -0,0 +1,244 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ weight = 'exp/semantic_kitti/semseg-ptv3_dino-L/model/model_best.pth'
2
+ resume = False
3
+ evaluate = True
4
+ test_only = False
5
+ seed = 32226192
6
+ save_path = 'exp/semantic_kitti/semseg-ptv3_dino-L'
7
+ wandb_project = 'semseg_kitti'
8
+ num_worker = 16
9
+ batch_size = 8
10
+ batch_size_val = None
11
+ batch_size_test = None
12
+ epoch = 50
13
+ eval_epoch = 50
14
+ clip_grad = None
15
+ sync_bn = False
16
+ enable_amp = True
17
+ empty_cache = False
18
+ empty_cache_per_epoch = False
19
+ find_unused_parameters = False
20
+ mix_prob = 0.8
21
+ param_dicts = [dict(keyword='block', lr=0.0002)]
22
+ hooks = [
23
+ dict(type='CheckpointLoader'),
24
+ dict(type='IterationTimer', warmup_iter=2),
25
+ dict(type='InformationWriter'),
26
+ dict(type='SemSegEvaluator'),
27
+ dict(type='CheckpointSaver', save_freq=None)
28
+ ]
29
+ train = dict(type='DefaultTrainer')
30
+ test = dict(type='SemSegTester', verbose=True)
31
+ model = dict(
32
+ type='DefaultSegmentorV2',
33
+ num_classes=19,
34
+ backbone_out_channels=64,
35
+ backbone=dict(
36
+ type='PT-v3m1-image',
37
+ in_channels=4,
38
+ order=['z', 'z-trans', 'hilbert', 'hilbert-trans'],
39
+ stride=(2, 2, 2, 2),
40
+ enc_depths=(2, 2, 2, 6, 2),
41
+ enc_channels=(32, 64, 128, 256, 512),
42
+ enc_num_head=(2, 4, 8, 16, 32),
43
+ enc_patch_size=(1024, 1024, 1024, 1024, 1024),
44
+ dec_depths=(2, 2, 2, 2),
45
+ dec_channels=(64, 64, 128, 256),
46
+ dec_num_head=(4, 4, 8, 16),
47
+ dec_patch_size=(1024, 1024, 1024, 1024),
48
+ mlp_ratio=4,
49
+ qkv_bias=True,
50
+ qk_scale=None,
51
+ attn_drop=0.0,
52
+ proj_drop=0.0,
53
+ drop_path=0.3,
54
+ shuffle_orders=True,
55
+ pre_norm=True,
56
+ enable_rpe=False,
57
+ enable_flash=True,
58
+ upcast_attention=False,
59
+ upcast_softmax=False,
60
+ cls_mode=False,
61
+ pdnorm_bn=False,
62
+ pdnorm_ln=False,
63
+ pdnorm_decouple=True,
64
+ pdnorm_adaptive=False,
65
+ pdnorm_affine=True,
66
+ pdnorm_conditions=('nuScenes', 'SemanticKITTI', 'Waymo'),
67
+ dinov2='large',
68
+ dinov2_missing_embedding=False,
69
+ dinov2_drop=0.0),
70
+ criteria=[
71
+ dict(
72
+ type='CrossEntropyLoss',
73
+ weight=[
74
+ 3.1557, 8.7029, 7.8281, 6.1354, 6.3161, 7.9937, 8.9704,
75
+ 10.1922, 1.6155, 4.2187, 1.9385, 5.5455, 2.0198, 2.6261,
76
+ 1.3212, 5.1102, 2.5492, 5.8585, 7.3929
77
+ ],
78
+ loss_weight=1.0,
79
+ ignore_index=-1),
80
+ dict(
81
+ type='LovaszLoss',
82
+ mode='multiclass',
83
+ loss_weight=1.0,
84
+ ignore_index=-1)
85
+ ])
86
+ optimizer = dict(type='AdamW', lr=0.002, weight_decay=0.005)
87
+ scheduler = dict(
88
+ type='OneCycleLR',
89
+ max_lr=[0.002, 0.0002],
90
+ pct_start=0.04,
91
+ anneal_strategy='cos',
92
+ div_factor=10.0,
93
+ final_div_factor=100.0)
94
+ dataset_type = 'SemanticKITTIDataset'
95
+ data_root = 'data/semantic_kitti'
96
+ ignore_index = -1
97
+ names = [
98
+ 'car', 'bicycle', 'motorcycle', 'truck', 'other-vehicle', 'person',
99
+ 'bicyclist', 'motorcyclist', 'road', 'parking', 'sidewalk', 'other-ground',
100
+ 'building', 'fence', 'vegetation', 'trunk', 'terrain', 'pole',
101
+ 'traffic-sign'
102
+ ]
103
+ data = dict(
104
+ num_classes=19,
105
+ ignore_index=-1,
106
+ names=[
107
+ 'car', 'bicycle', 'motorcycle', 'truck', 'other-vehicle', 'person',
108
+ 'bicyclist', 'motorcyclist', 'road', 'parking', 'sidewalk',
109
+ 'other-ground', 'building', 'fence', 'vegetation', 'trunk', 'terrain',
110
+ 'pole', 'traffic-sign'
111
+ ],
112
+ train=dict(
113
+ type='SemanticKITTIDataset',
114
+ split='train',
115
+ data_root='data/semantic_kitti',
116
+ with_images=True,
117
+ transform=[
118
+ dict(type='ImageResize', size=[378, 1246]),
119
+ dict(
120
+ type='ImageColorJitter',
121
+ brightness=0.4,
122
+ contrast=0.4,
123
+ saturation=0.2,
124
+ hue=0.1),
125
+ dict(type='ImageRandomHorizontalFlip'),
126
+ dict(type='ImageNormalize'),
127
+ dict(
128
+ type='RandomRotate',
129
+ angle=[-1, 1],
130
+ axis='z',
131
+ center=[0, 0, 0],
132
+ p=0.5),
133
+ dict(type='RandomScale', scale=[0.9, 1.1]),
134
+ dict(type='RandomFlip', p=0.5),
135
+ dict(type='RandomJitter', sigma=0.005, clip=0.02),
136
+ dict(
137
+ type='GridSample',
138
+ grid_size=0.05,
139
+ hash_type='fnv',
140
+ mode='train',
141
+ keys=('coord', 'strength', 'segment', 'image_coord',
142
+ 'image_mask'),
143
+ return_grid_coord=True),
144
+ dict(
145
+ type='PointClip',
146
+ point_cloud_range=(-35.2, -35.2, -4, 35.2, 35.2, 2)),
147
+ dict(type='SphereCrop', sample_rate=0.8, mode='random'),
148
+ dict(type='SphereCrop', point_max=120000, mode='random'),
149
+ dict(type='ToTensor'),
150
+ dict(
151
+ type='Collect',
152
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
153
+ 'image_mask'),
154
+ feat_keys=('coord', 'strength'))
155
+ ],
156
+ test_mode=False,
157
+ ignore_index=-1,
158
+ loop=1),
159
+ val=dict(
160
+ type='SemanticKITTIDataset',
161
+ split='val',
162
+ data_root='data/semantic_kitti',
163
+ with_images=True,
164
+ transform=[
165
+ dict(type='ImageResize', size=[378, 1246]),
166
+ dict(type='ImageNormalize'),
167
+ dict(
168
+ type='GridSample',
169
+ grid_size=0.05,
170
+ hash_type='fnv',
171
+ mode='train',
172
+ keys=('coord', 'strength', 'segment', 'image_coord',
173
+ 'image_mask'),
174
+ return_grid_coord=True),
175
+ dict(
176
+ type='PointClip',
177
+ point_cloud_range=(-35.2, -35.2, -4, 35.2, 35.2, 2)),
178
+ dict(type='ToTensor'),
179
+ dict(
180
+ type='Collect',
181
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
182
+ 'image_mask'),
183
+ feat_keys=('coord', 'strength'))
184
+ ],
185
+ test_mode=False,
186
+ ignore_index=-1),
187
+ test=dict(
188
+ type='SemanticKITTIDataset',
189
+ split='val',
190
+ data_root='data/semantic_kitti',
191
+ with_images=True,
192
+ transform=[dict(type='ImageResize', size=[378, 1246])],
193
+ test_mode=True,
194
+ test_cfg=dict(
195
+ voxelize=dict(
196
+ type='GridSample',
197
+ grid_size=0.05,
198
+ hash_type='fnv',
199
+ mode='test',
200
+ return_grid_coord=True,
201
+ keys=('coord', 'strength', 'segment', 'image_coord',
202
+ 'image_mask')),
203
+ crop=None,
204
+ post_transform=[
205
+ dict(type='ImageNormalize'),
206
+ dict(
207
+ type='PointClip',
208
+ point_cloud_range=(-35.2, -35.2, -4, 35.2, 35.2, 2)),
209
+ dict(type='ToTensor'),
210
+ dict(
211
+ type='Collect',
212
+ keys=('coord', 'grid_coord', 'index', 'image',
213
+ 'image_coord', 'image_mask'),
214
+ feat_keys=('coord', 'strength'))
215
+ ],
216
+ aug_transform=[[{
217
+ 'type': 'RandomRotateTargetAngle',
218
+ 'angle': [0],
219
+ 'axis': 'z',
220
+ 'center': [0, 0, 0],
221
+ 'p': 1
222
+ }],
223
+ [{
224
+ 'type': 'RandomRotateTargetAngle',
225
+ 'angle': [0.5],
226
+ 'axis': 'z',
227
+ 'center': [0, 0, 0],
228
+ 'p': 1
229
+ }],
230
+ [{
231
+ 'type': 'RandomRotateTargetAngle',
232
+ 'angle': [1],
233
+ 'axis': 'z',
234
+ 'center': [0, 0, 0],
235
+ 'p': 1
236
+ }],
237
+ [{
238
+ 'type': 'RandomRotateTargetAngle',
239
+ 'angle': [1.5],
240
+ 'axis': 'z',
241
+ 'center': [0, 0, 0],
242
+ 'p': 1
243
+ }]]),
244
+ ignore_index=-1))
semantic_kitti/semseg-ptv3_dino-L/events.out.tfevents.1730404883.penguin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b7b89074a12dcbf5002c2d31e32d17d991d63e2198650649badef8abc40dcb5
3
+ size 11694620
semantic_kitti/semseg-ptv3_dino-L/model/model_best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef5d5cb30a974f775cf29837a3c406a30e40a1654dffca3cf64dd8504d0d3764
3
+ size 560860208
semantic_kitti/semseg-ptv3_dino-L/model/model_last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef5d5cb30a974f775cf29837a3c406a30e40a1654dffca3cf64dd8504d0d3764
3
+ size 560860208
semantic_kitti/semseg-ptv3_dino-L/train.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4ba267cb2d092f3f6d1f39b5206b247775809179cd5cf8709b8501ee3da32f2
3
+ size 28774255