TensorBoard
karimknaebel commited on
Commit
0a84ac1
·
verified ·
1 Parent(s): 035d482

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  nuscenes/semseg-ptv3_dino-g/train.log filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  nuscenes/semseg-ptv3_dino-g/train.log filter=lfs diff=lfs merge=lfs -text
37
+ nuscenes/semseg-ptv3_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
nuscenes/semseg-ptv3_dino-L/config.py ADDED
@@ -0,0 +1,211 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ weight = 'exp/nuscenes/semseg-ptv3_dino-L/model/model_best.pth'
2
+ resume = False
3
+ evaluate = True
4
+ test_only = False
5
+ seed = 24549500
6
+ save_path = 'exp/nuscenes/semseg-ptv3_dino-L'
7
+ num_worker = 16
8
+ batch_size = 12
9
+ batch_size_val = None
10
+ batch_size_test = None
11
+ epoch = 50
12
+ eval_epoch = 50
13
+ clip_grad = None
14
+ sync_bn = False
15
+ enable_amp = True
16
+ empty_cache = False
17
+ empty_cache_per_epoch = False
18
+ find_unused_parameters = False
19
+ mix_prob = 0.8
20
+ param_dicts = [dict(keyword='^(?!.*img_enc).*block', lr=0.0002)]
21
+ hooks = [
22
+ dict(type='CheckpointLoader'),
23
+ dict(type='IterationTimer', warmup_iter=2),
24
+ dict(type='InformationWriter'),
25
+ dict(type='SemSegEvaluator'),
26
+ dict(type='CheckpointSaver', save_freq=None),
27
+ dict(type='PreciseEvaluator', test_last=False)
28
+ ]
29
+ train = dict(type='DefaultTrainer')
30
+ test = dict(type='SemSegTester', verbose=True)
31
+ model = dict(
32
+ type='DefaultSegmentorV2',
33
+ num_classes=16,
34
+ backbone_out_channels=64,
35
+ backbone=dict(
36
+ type='PT-v3m1-image',
37
+ in_channels=4,
38
+ order=['z', 'z-trans', 'hilbert', 'hilbert-trans'],
39
+ stride=(2, 2, 2, 2),
40
+ enc_depths=(2, 2, 2, 6, 2),
41
+ enc_channels=(32, 64, 128, 256, 512),
42
+ enc_num_head=(2, 4, 8, 16, 32),
43
+ enc_patch_size=(1024, 1024, 1024, 1024, 1024),
44
+ dec_depths=(2, 2, 2, 2),
45
+ dec_channels=(64, 64, 128, 256),
46
+ dec_num_head=(4, 4, 8, 16),
47
+ dec_patch_size=(1024, 1024, 1024, 1024),
48
+ mlp_ratio=4,
49
+ qkv_bias=True,
50
+ qk_scale=None,
51
+ attn_drop=0.0,
52
+ proj_drop=0.0,
53
+ drop_path=0.3,
54
+ shuffle_orders=True,
55
+ pre_norm=True,
56
+ enable_rpe=False,
57
+ enable_flash=True,
58
+ upcast_attention=False,
59
+ upcast_softmax=False,
60
+ cls_mode=False,
61
+ pdnorm_bn=False,
62
+ pdnorm_ln=False,
63
+ pdnorm_decouple=True,
64
+ pdnorm_adaptive=False,
65
+ pdnorm_affine=True,
66
+ pdnorm_conditions=('nuScenes', 'SemanticKITTI', 'Waymo'),
67
+ dinov2='large'),
68
+ criteria=[
69
+ dict(type='CrossEntropyLoss', loss_weight=1.0, ignore_index=-1),
70
+ dict(
71
+ type='LovaszLoss',
72
+ mode='multiclass',
73
+ loss_weight=1.0,
74
+ ignore_index=-1)
75
+ ])
76
+ optimizer = dict(type='AdamW', lr=0.002, weight_decay=0.005)
77
+ scheduler = dict(
78
+ type='OneCycleLR',
79
+ max_lr=[0.002, 0.0002],
80
+ pct_start=0.04,
81
+ anneal_strategy='cos',
82
+ div_factor=10.0,
83
+ final_div_factor=100.0)
84
+ dataset_type = 'NuScenesDataset'
85
+ data_root = 'data/nuscenes'
86
+ ignore_index = -1
87
+ names = [
88
+ 'barrier', 'bicycle', 'bus', 'car', 'construction_vehicle', 'motorcycle',
89
+ 'pedestrian', 'traffic_cone', 'trailer', 'truck', 'driveable_surface',
90
+ 'other_flat', 'sidewalk', 'terrain', 'manmade', 'vegetation'
91
+ ]
92
+ data = dict(
93
+ num_classes=16,
94
+ ignore_index=-1,
95
+ names=[
96
+ 'barrier', 'bicycle', 'bus', 'car', 'construction_vehicle',
97
+ 'motorcycle', 'pedestrian', 'traffic_cone', 'trailer', 'truck',
98
+ 'driveable_surface', 'other_flat', 'sidewalk', 'terrain', 'manmade',
99
+ 'vegetation'
100
+ ],
101
+ train=dict(
102
+ type='NuScenesDataset',
103
+ split='train',
104
+ data_root='data/nuscenes',
105
+ with_images=True,
106
+ transform=[
107
+ dict(type='ImageResize', size=[378, 672]),
108
+ dict(
109
+ type='ImageColorJitter',
110
+ brightness=0.4,
111
+ contrast=0.4,
112
+ saturation=0.2,
113
+ hue=0.1),
114
+ dict(type='ImageRandomHorizontalFlip'),
115
+ dict(type='ImageNormalize'),
116
+ dict(
117
+ type='RandomRotate',
118
+ angle=[-1, 1],
119
+ axis='z',
120
+ center=[0, 0, 0],
121
+ p=0.5),
122
+ dict(type='RandomScale', scale=[0.9, 1.1]),
123
+ dict(type='RandomFlip', p=0.5),
124
+ dict(type='RandomJitter', sigma=0.005, clip=0.02),
125
+ dict(
126
+ type='GridSample',
127
+ grid_size=0.05,
128
+ hash_type='fnv',
129
+ mode='train',
130
+ keys=('coord', 'strength', 'segment', 'image_coord',
131
+ 'image_mask'),
132
+ return_grid_coord=True),
133
+ dict(type='ToTensor'),
134
+ dict(
135
+ type='Collect',
136
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
137
+ 'image_mask'),
138
+ feat_keys=('coord', 'strength'))
139
+ ],
140
+ test_mode=False,
141
+ ignore_index=-1,
142
+ loop=1),
143
+ val=dict(
144
+ type='NuScenesDataset',
145
+ split='val',
146
+ data_root='data/nuscenes',
147
+ with_images=True,
148
+ transform=[
149
+ dict(type='ImageResize', size=[378, 672]),
150
+ dict(type='ImageNormalize'),
151
+ dict(
152
+ type='GridSample',
153
+ grid_size=0.05,
154
+ hash_type='fnv',
155
+ mode='train',
156
+ keys=('coord', 'strength', 'segment', 'image_coord',
157
+ 'image_mask'),
158
+ return_grid_coord=True),
159
+ dict(type='ToTensor'),
160
+ dict(
161
+ type='Collect',
162
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
163
+ 'image_mask'),
164
+ feat_keys=('coord', 'strength'))
165
+ ],
166
+ test_mode=False,
167
+ ignore_index=-1),
168
+ test=dict(
169
+ type='NuScenesDataset',
170
+ split='val',
171
+ data_root='data/nuscenes',
172
+ with_images=True,
173
+ transform=[
174
+ dict(type='ImageResize', size=[378, 672]),
175
+ dict(type='Copy', keys_dict=dict(segment='origin_segment')),
176
+ dict(
177
+ type='GridSample',
178
+ grid_size=0.025,
179
+ hash_type='fnv',
180
+ mode='train',
181
+ keys=('coord', 'strength', 'segment', 'image_coord',
182
+ 'image_mask'),
183
+ return_inverse=True)
184
+ ],
185
+ test_mode=True,
186
+ test_cfg=dict(
187
+ voxelize=dict(
188
+ type='GridSample',
189
+ grid_size=0.05,
190
+ hash_type='fnv',
191
+ mode='test',
192
+ return_grid_coord=True,
193
+ keys=('coord', 'strength', 'image_coord', 'image_mask')),
194
+ crop=None,
195
+ post_transform=[
196
+ dict(type='ImageNormalize'),
197
+ dict(type='ToTensor'),
198
+ dict(
199
+ type='Collect',
200
+ keys=('coord', 'grid_coord', 'index', 'image',
201
+ 'image_coord', 'image_mask'),
202
+ feat_keys=('coord', 'strength'))
203
+ ],
204
+ aug_transform=[[{
205
+ 'type': 'RandomRotateTargetAngle',
206
+ 'angle': [0],
207
+ 'axis': 'z',
208
+ 'center': [0, 0, 0],
209
+ 'p': 1
210
+ }]]),
211
+ ignore_index=-1))
nuscenes/semseg-ptv3_dino-L/events.out.tfevents.1729779943.n23g0020.hpc.itc.rwth-aachen.de ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62010b45d3f19d5168c57c228fcffeed6c0f2c92536cb64139d667e35ab507ad
3
+ size 11464320
nuscenes/semseg-ptv3_dino-L/model/model_best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9e002b7a360a04e7cc98db52d110ec1f1342d4c5b7b0cd4152db937abb21247
3
+ size 1778497018
nuscenes/semseg-ptv3_dino-L/model/model_last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c35d3e4ecb6d92d8be3fbf1057328e6b8425e8d4225a9eb1e3383af4c4aace17
3
+ size 1778497018
nuscenes/semseg-ptv3_dino-L/train.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:388f8ab322059fefb0ea8c824dbf1d04f9acad09cdd67de25836848370347568
3
+ size 65235469