DempseyWen commited on
Commit
f66b011
·
verified ·
1 Parent(s): c8cfb4d

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. SiMO_AF/config.yaml +339 -0
  2. SiMO_PF/config.yaml +309 -0
SiMO_AF/config.yaml ADDED
@@ -0,0 +1,339 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ add_data_extension:
2
+ - bev_visibility.png
3
+ cav_lidar_range: &id002
4
+ - -51.2
5
+ - -51.2
6
+ - -3
7
+ - 51.2
8
+ - 51.2
9
+ - 1
10
+ comm_range: 70
11
+ comment: ''
12
+ data_augment:
13
+ - ALONG_AXIS_LIST:
14
+ - x
15
+ NAME: random_world_flip
16
+ - NAME: random_world_rotation
17
+ WORLD_ROT_ANGLE:
18
+ - -0.78539816
19
+ - 0.78539816
20
+ - NAME: random_world_scaling
21
+ WORLD_SCALE_RANGE:
22
+ - 0.95
23
+ - 1.05
24
+ fusion:
25
+ args:
26
+ data_aug_conf: &id004
27
+ H: 600
28
+ Ncams: 4
29
+ W: 800
30
+ bot_pct_lim:
31
+ - 0.0
32
+ - 0.05
33
+ cams:
34
+ - camera0
35
+ - camera1
36
+ - camera2
37
+ - camera3
38
+ final_dim:
39
+ - 384
40
+ - 512
41
+ rand_flip: false
42
+ resize_lim:
43
+ - 0.65
44
+ - 0.7
45
+ rot_lim:
46
+ - -3.6
47
+ - 3.6
48
+ grid_conf: &id003
49
+ ddiscr:
50
+ - 2
51
+ - 50
52
+ - 48
53
+ mode: LID
54
+ xbound:
55
+ - -51.2
56
+ - 51.2
57
+ - 0.4
58
+ ybound:
59
+ - -51.2
60
+ - 51.2
61
+ - 0.4
62
+ zbound:
63
+ - -10
64
+ - 10
65
+ - 20.0
66
+ proj_first: false
67
+ core_method: intermediate
68
+ dataset: opv2v
69
+ heter:
70
+ modality_setting:
71
+ m1:
72
+ core_method: point_pillar
73
+ freeze: true
74
+ model_dir: opencood/logs/HeterBaseline_opv2v_lidar_attfuse_2024_12_02_22_07_35
75
+ sensor_type: lidar
76
+ m2:
77
+ core_method: lift_splat_shoot
78
+ freeze: true
79
+ model_dir: opencood/logs/official_checkpoints/HeterBaseline_opv2v_camera_attfuse_2023_08_08_16_50_01
80
+ sensor_type: camera
81
+ input_source:
82
+ - lidar
83
+ - camera
84
+ - depth
85
+ label_type: lidar
86
+ loss:
87
+ args:
88
+ cls:
89
+ alpha: 0.25
90
+ gamma: 2.0
91
+ type: SigmoidFocalLoss
92
+ weight: 1.0
93
+ depth:
94
+ weight: 1.0
95
+ dir:
96
+ args: &id001
97
+ anchor_yaw: &id006
98
+ - 0
99
+ - 90
100
+ dir_offset: 0.7853
101
+ num_bins: 2
102
+ type: WeightedSoftmaxClassificationLoss
103
+ weight: 0.2
104
+ pos_cls_weight: 2.0
105
+ reg:
106
+ codewise: true
107
+ sigma: 3.0
108
+ type: WeightedSmoothL1Loss
109
+ weight: 2.0
110
+ core_method: point_pillar_loss
111
+ lr_scheduler:
112
+ core_method: multistep
113
+ gamma: 0.1
114
+ step_size:
115
+ - 10
116
+ - 40
117
+ model:
118
+ args:
119
+ anchor_number: 2
120
+ att:
121
+ feat_dim: 256
122
+ dir_args: *id001
123
+ head_freeze: true
124
+ in_head: 256
125
+ lamma:
126
+ dim: 256
127
+ feat_dim: 256
128
+ feature_stride: 2
129
+ freeze: false
130
+ heads: 2
131
+ lidar_drop_ratio: 0.5
132
+ random_drop: false
133
+ single_mode: 'camera'
134
+ lidar_range: *id002
135
+ m1:
136
+ aligner_args:
137
+ args:
138
+ dim: 256
139
+ num_of_blocks: 3
140
+ core_method: convnext
141
+ freeze: true
142
+ spatial_align: false
143
+ backbone_args:
144
+ freeze: true
145
+ layer_nums:
146
+ - 3
147
+ - 5
148
+ - 8
149
+ layer_strides:
150
+ - 2
151
+ - 2
152
+ - 2
153
+ num_filters:
154
+ - 64
155
+ - 128
156
+ - 256
157
+ num_upsample_filter:
158
+ - 128
159
+ - 128
160
+ - 128
161
+ upsample_strides:
162
+ - 1
163
+ - 2
164
+ - 4
165
+ core_method: point_pillar
166
+ encoder_args:
167
+ freeze: true
168
+ lidar_range: *id002
169
+ pillar_vfe:
170
+ num_filters:
171
+ - 64
172
+ use_absolute_xyz: true
173
+ use_norm: true
174
+ with_distance: false
175
+ point_pillar_scatter:
176
+ grid_size: !!python/object/apply:numpy.core.multiarray._reconstruct
177
+ args:
178
+ - !!python/name:numpy.ndarray ''
179
+ - !!python/tuple
180
+ - 0
181
+ - !!binary |
182
+ Yg==
183
+ state: !!python/tuple
184
+ - 1
185
+ - !!python/tuple
186
+ - 3
187
+ - !!python/object/apply:numpy.dtype
188
+ args:
189
+ - i8
190
+ - false
191
+ - true
192
+ state: !!python/tuple
193
+ - 3
194
+ - <
195
+ - null
196
+ - null
197
+ - null
198
+ - -1
199
+ - -1
200
+ - 0
201
+ - false
202
+ - !!binary |
203
+ AAEAAAAAAAAAAQAAAAAAAAEAAAAAAAAA
204
+ num_features: 64
205
+ voxel_size: &id005
206
+ - 0.4
207
+ - 0.4
208
+ - 4
209
+ freeze: true
210
+ model_dir: opencood/logs/HeterBaseline_opv2v_lidar_attfuse_2024_12_02_22_07_35
211
+ sensor_type: lidar
212
+ shrink_header:
213
+ dim:
214
+ - 256
215
+ freeze: true
216
+ input_dim: 384
217
+ kernal_size:
218
+ - 3
219
+ padding:
220
+ - 1
221
+ stride:
222
+ - 1
223
+ m2:
224
+ aligner_args:
225
+ args:
226
+ dim: 256
227
+ num_of_blocks: 3
228
+ core_method: convnext
229
+ freeze: true
230
+ spatial_align: false
231
+ backbone_args:
232
+ freeze: true
233
+ inplanes: 128
234
+ layer_nums:
235
+ - 3
236
+ - 5
237
+ - 8
238
+ layer_strides:
239
+ - 2
240
+ - 2
241
+ - 2
242
+ num_filters:
243
+ - 64
244
+ - 128
245
+ - 256
246
+ num_upsample_filter:
247
+ - 128
248
+ - 128
249
+ - 128
250
+ upsample_strides:
251
+ - 1
252
+ - 2
253
+ - 4
254
+ camera_mask_args:
255
+ cav_lidar_range: *id002
256
+ grid_conf: *id003
257
+ core_method: lift_splat_shoot
258
+ encoder_args:
259
+ anchor_number: 2
260
+ camera_encoder: EfficientNet
261
+ data_aug_conf: *id004
262
+ depth_supervision: true
263
+ freeze: true
264
+ grid_conf: *id003
265
+ img_downsample: 8
266
+ img_features: 128
267
+ use_depth_gt: false
268
+ freeze: true
269
+ model_dir: opencood/logs/official_checkpoints/HeterBaseline_opv2v_camera_attfuse_2023_08_08_16_50_01
270
+ sensor_type: camera
271
+ shrink_header:
272
+ dim:
273
+ - 256
274
+ freeze: true
275
+ input_dim: 384
276
+ kernal_size:
277
+ - 3
278
+ padding:
279
+ - 1
280
+ stride:
281
+ - 1
282
+ ma_fusion_method: att
283
+ mm_fusion_method: lamma3
284
+ single_modality: 'camera'
285
+ voxel_size: *id005
286
+ core_method: point_pillar_lss_lamma2_attfuse
287
+ name: opv2v_lidarcamera_lamma3_attfuse
288
+ noise_setting: !!python/object/apply:collections.OrderedDict
289
+ - - - add_noise
290
+ - false
291
+ optimizer:
292
+ args:
293
+ eps: 1.0e-10
294
+ weight_decay: 0.0001
295
+ core_method: Adam
296
+ lr: 0.0002
297
+ postprocess:
298
+ anchor_args:
299
+ D: 1
300
+ H: 256
301
+ W: 256
302
+ cav_lidar_range: *id002
303
+ feature_stride: 2
304
+ h: 1.56
305
+ l: 3.9
306
+ num: 2
307
+ r: *id006
308
+ vd: 4
309
+ vh: 0.4
310
+ vw: 0.4
311
+ w: 1.6
312
+ core_method: VoxelPostprocessor
313
+ dir_args: *id001
314
+ gt_range: *id002
315
+ max_num: 150
316
+ nms_thresh: 0.15
317
+ order: hwl
318
+ target_args:
319
+ neg_threshold: 0.45
320
+ pos_threshold: 0.6
321
+ score_threshold: 0.2
322
+ preprocess:
323
+ args:
324
+ max_points_per_voxel: 32
325
+ max_voxel_test: 70000
326
+ max_voxel_train: 32000
327
+ voxel_size: *id005
328
+ cav_lidar_range: *id002
329
+ core_method: SpVoxelPreprocessor
330
+ root_dir: data/OPV2V/train
331
+ test_dir: data/OPV2V/test
332
+ train_params:
333
+ batch_size: 1
334
+ epoches: 40
335
+ eval_freq: 2
336
+ max_cav: 5
337
+ save_freq: 2
338
+ validate_dir: data/OPV2V/validate
339
+ yaml_parser: load_general_params
SiMO_PF/config.yaml ADDED
@@ -0,0 +1,309 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ add_data_extension:
2
+ - bev_visibility.png
3
+ cav_lidar_range: &id002
4
+ - -51.2
5
+ - -51.2
6
+ - -3
7
+ - 51.2
8
+ - 51.2
9
+ - 1
10
+ comm_range: 70
11
+ comment: ''
12
+ data_augment:
13
+ - ALONG_AXIS_LIST:
14
+ - x
15
+ NAME: random_world_flip
16
+ - NAME: random_world_rotation
17
+ WORLD_ROT_ANGLE:
18
+ - -0.78539816
19
+ - 0.78539816
20
+ - NAME: random_world_scaling
21
+ WORLD_SCALE_RANGE:
22
+ - 0.95
23
+ - 1.05
24
+ fusion:
25
+ args:
26
+ data_aug_conf: &id004
27
+ H: 600
28
+ Ncams: 4
29
+ W: 800
30
+ bot_pct_lim:
31
+ - 0.0
32
+ - 0.05
33
+ cams:
34
+ - camera0
35
+ - camera1
36
+ - camera2
37
+ - camera3
38
+ final_dim:
39
+ - 384
40
+ - 512
41
+ rand_flip: false
42
+ resize_lim:
43
+ - 0.65
44
+ - 0.7
45
+ rot_lim:
46
+ - -3.6
47
+ - 3.6
48
+ grid_conf: &id003
49
+ ddiscr:
50
+ - 2
51
+ - 50
52
+ - 48
53
+ mode: LID
54
+ xbound:
55
+ - -51.2
56
+ - 51.2
57
+ - 0.4
58
+ ybound:
59
+ - -51.2
60
+ - 51.2
61
+ - 0.4
62
+ zbound:
63
+ - -10
64
+ - 10
65
+ - 20.0
66
+ proj_first: false
67
+ core_method: intermediate
68
+ dataset: opv2v
69
+ heter:
70
+ modality_setting:
71
+ m1:
72
+ core_method: point_pillar
73
+ sensor_type: lidar
74
+ m2:
75
+ core_method: lift_splat_shoot
76
+ sensor_type: camera
77
+ input_source:
78
+ - lidar
79
+ - camera
80
+ - depth
81
+ label_type: lidar
82
+ loss:
83
+ args:
84
+ cls:
85
+ alpha: 0.25
86
+ gamma: 2.0
87
+ type: SigmoidFocalLoss
88
+ weight: 1.0
89
+ depth:
90
+ weight: 1.0
91
+ dir:
92
+ args: &id001
93
+ anchor_yaw: &id006
94
+ - 0
95
+ - 90
96
+ dir_offset: 0.7853
97
+ num_bins: 2
98
+ type: WeightedSoftmaxClassificationLoss
99
+ weight: 0.2
100
+ pos_cls_weight: 2.0
101
+ reg:
102
+ codewise: true
103
+ sigma: 3.0
104
+ type: WeightedSmoothL1Loss
105
+ weight: 2.0
106
+ core_method: point_pillar_loss
107
+ lr_scheduler:
108
+ core_method: multistep
109
+ gamma: 0.1
110
+ step_size:
111
+ - 15
112
+ - 40
113
+ model:
114
+ args:
115
+ anchor_number: 2
116
+ dir_args: *id001
117
+ fusion_backbone:
118
+ anchor_number: 2
119
+ freeze: true
120
+ layer_nums:
121
+ - 3
122
+ - 5
123
+ - 8
124
+ layer_strides:
125
+ - 1
126
+ - 2
127
+ - 2
128
+ num_filters:
129
+ - 64
130
+ - 128
131
+ - 256
132
+ num_upsample_filter:
133
+ - 128
134
+ - 128
135
+ - 128
136
+ resnext: true
137
+ upsample_strides:
138
+ - 1
139
+ - 2
140
+ - 4
141
+ head_freeze: true
142
+ in_head: 256
143
+ lamma:
144
+ dim: 128
145
+ feat_dim: 64
146
+ feature_stride: 2
147
+ freeze: false
148
+ heads: 2
149
+ lidar_drop_ratio: 0.5
150
+ random_drop: false
151
+ single_mode: false
152
+ lidar_range: *id002
153
+ m1:
154
+ aligner_args:
155
+ core_method: identity
156
+ freeze: true
157
+ backbone_args:
158
+ freeze: true
159
+ layer_nums:
160
+ - 3
161
+ layer_strides:
162
+ - 2
163
+ num_filters:
164
+ - 64
165
+ core_method: point_pillar
166
+ encoder_args:
167
+ freeze: true
168
+ lidar_range: *id002
169
+ pillar_vfe:
170
+ num_filters:
171
+ - 64
172
+ use_absolute_xyz: true
173
+ use_norm: true
174
+ with_distance: false
175
+ point_pillar_scatter:
176
+ grid_size: !!python/object/apply:numpy.core.multiarray._reconstruct
177
+ args:
178
+ - !!python/name:numpy.ndarray ''
179
+ - !!python/tuple
180
+ - 0
181
+ - !!binary |
182
+ Yg==
183
+ state: !!python/tuple
184
+ - 1
185
+ - !!python/tuple
186
+ - 3
187
+ - !!python/object/apply:numpy.dtype
188
+ args:
189
+ - i8
190
+ - false
191
+ - true
192
+ state: !!python/tuple
193
+ - 3
194
+ - <
195
+ - null
196
+ - null
197
+ - null
198
+ - -1
199
+ - -1
200
+ - 0
201
+ - false
202
+ - !!binary |
203
+ AAEAAAAAAAAAAQAAAAAAAAEAAAAAAAAA
204
+ num_features: 64
205
+ voxel_size: &id005
206
+ - 0.4
207
+ - 0.4
208
+ - 4
209
+ sensor_type: lidar
210
+ m2:
211
+ aligner_args:
212
+ args:
213
+ dim: 64
214
+ num_of_blocks: 3
215
+ core_method: convnext
216
+ freeze: true
217
+ spatial_align: false
218
+ backbone_args:
219
+ freeze: true
220
+ inplanes: 128
221
+ layer_nums:
222
+ - 3
223
+ layer_strides:
224
+ - 2
225
+ num_filters:
226
+ - 64
227
+ camera_mask_args:
228
+ cav_lidar_range: *id002
229
+ grid_conf: *id003
230
+ core_method: lift_splat_shoot
231
+ encoder_args:
232
+ anchor_number: 2
233
+ camera_encoder: EfficientNet
234
+ data_aug_conf: *id004
235
+ depth_supervision: true
236
+ freeze: true
237
+ grid_conf: *id003
238
+ img_downsample: 8
239
+ img_features: 128
240
+ use_depth_gt: false
241
+ sensor_type: camera
242
+ mm_fusion_method: lamma3
243
+ shrink_header:
244
+ dim:
245
+ - 256
246
+ freeze: true
247
+ input_dim: 384
248
+ kernal_size:
249
+ - 3
250
+ padding:
251
+ - 1
252
+ stride:
253
+ - 1
254
+ single_modality: false
255
+ voxel_size: *id005
256
+ core_method: point_pillar_lss_lamma2_pyramid_fusion
257
+ name: opv2v_lidarcamera_lamma2_pyramid_fusion
258
+ noise_setting: !!python/object/apply:collections.OrderedDict
259
+ - - - add_noise
260
+ - false
261
+ optimizer:
262
+ args:
263
+ eps: 1.0e-10
264
+ weight_decay: 0.0001
265
+ core_method: Adam
266
+ lr: 0.0002
267
+ postprocess:
268
+ anchor_args:
269
+ D: 1
270
+ H: 256
271
+ W: 256
272
+ cav_lidar_range: *id002
273
+ feature_stride: 2
274
+ h: 1.56
275
+ l: 3.9
276
+ num: 2
277
+ r: *id006
278
+ vd: 4
279
+ vh: 0.4
280
+ vw: 0.4
281
+ w: 1.6
282
+ core_method: VoxelPostprocessor
283
+ dir_args: *id001
284
+ gt_range: *id002
285
+ max_num: 150
286
+ nms_thresh: 0.15
287
+ order: hwl
288
+ target_args:
289
+ neg_threshold: 0.45
290
+ pos_threshold: 0.6
291
+ score_threshold: 0.2
292
+ preprocess:
293
+ args:
294
+ max_points_per_voxel: 32
295
+ max_voxel_test: 70000
296
+ max_voxel_train: 32000
297
+ voxel_size: *id005
298
+ cav_lidar_range: *id002
299
+ core_method: SpVoxelPreprocessor
300
+ root_dir: data/OPV2V/train
301
+ test_dir: data/OPV2V/test
302
+ train_params:
303
+ batch_size: 1
304
+ epoches: 50
305
+ eval_freq: 2
306
+ max_cav: 5
307
+ save_freq: 2
308
+ validate_dir: data/OPV2V/validate
309
+ yaml_parser: load_general_params