xiangbog commited on
Commit
a6c87ca
·
1 Parent(s): 514e4a7

Add AirV2X perception model checkpoints

Browse files
airv2x_intermediate_cobevt/release/best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51f291b499b2b432a795f24148487aa582652789959b03d299256f1ca54f922b
3
+ size 39692890
airv2x_intermediate_cobevt/release/config.yaml ADDED
@@ -0,0 +1,443 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ active_sensors: &id001
2
+ - lidar
3
+ bevcam_fov: 110
4
+ collaborators: &id002
5
+ - vehicle
6
+ - rsu
7
+ - drone
8
+ data_augment:
9
+ - ALONG_AXIS_LIST:
10
+ - x
11
+ NAME: random_world_flip
12
+ - NAME: random_world_rotation
13
+ WORLD_ROT_ANGLE:
14
+ - -0.78539816
15
+ - 0.78539816
16
+ - NAME: random_world_scaling
17
+ WORLD_SCALE_RANGE:
18
+ - 0.95
19
+ - 1.05
20
+ device: cuda
21
+ dynamic_class: 7
22
+ ego_type: vehicle
23
+ fusion:
24
+ args:
25
+ drone_data_aug_conf: &id003
26
+ H: 720
27
+ W: 1280
28
+ bot_pct_lim:
29
+ - 0.0
30
+ - 0.05
31
+ final_dim:
32
+ - 360
33
+ - 640
34
+ rand_flip: false
35
+ resize_lim:
36
+ - 0.65
37
+ - 0.7
38
+ rot_lim:
39
+ - -3.6
40
+ - 3.6
41
+ drone_grid_conf: &id004
42
+ ddiscr:
43
+ - 6
44
+ - 150
45
+ - 144
46
+ mode: UD
47
+ xbound:
48
+ - -140.8
49
+ - 140.8
50
+ - 0.4
51
+ ybound:
52
+ - -40
53
+ - 40
54
+ - 0.4
55
+ zbound:
56
+ - -150
57
+ - -6
58
+ - 144
59
+ proj_first: true
60
+ rsu_data_aug_conf: &id005
61
+ H: 720
62
+ W: 1280
63
+ bot_pct_lim:
64
+ - 0.0
65
+ - 0.05
66
+ final_dim:
67
+ - 360
68
+ - 640
69
+ rand_flip: false
70
+ resize_lim:
71
+ - 0.65
72
+ - 0.7
73
+ rot_lim:
74
+ - 0
75
+ - 0
76
+ rsu_grid_conf: &id006
77
+ ddiscr:
78
+ - 2
79
+ - 50
80
+ - 48
81
+ mode: LID
82
+ xbound:
83
+ - -140.8
84
+ - 140.8
85
+ - 0.4
86
+ ybound:
87
+ - -40
88
+ - 40
89
+ - 0.4
90
+ zbound:
91
+ - -30
92
+ - 30
93
+ - 60.0
94
+ veh_data_aug_conf: &id008
95
+ H: 720
96
+ W: 1280
97
+ bot_pct_lim:
98
+ - 0.0
99
+ - 0.05
100
+ final_dim:
101
+ - 360
102
+ - 640
103
+ rand_flip: false
104
+ resize_lim:
105
+ - 0.65
106
+ - 0.7
107
+ rot_lim:
108
+ - 0
109
+ - 0
110
+ veh_grid_conf: &id009
111
+ ddiscr:
112
+ - 2
113
+ - 50
114
+ - 48
115
+ mode: LID
116
+ xbound:
117
+ - -140.8
118
+ - 140.8
119
+ - 0.4
120
+ ybound:
121
+ - -40
122
+ - 40
123
+ - 0.4
124
+ zbound:
125
+ - -10
126
+ - 10
127
+ - 20.0
128
+ core_method: IntermediateFusionDatasetAirv2x
129
+ loss:
130
+ det:
131
+ args:
132
+ cls_weight: 1.0
133
+ num_class: 7
134
+ reg: 2.0
135
+ core_method: point_pillar_loss_multiclass
136
+ seg:
137
+ args:
138
+ d_coe: 2.0
139
+ d_weights:
140
+ - 200.0
141
+ - 200.0
142
+ - 75.0
143
+ - 200.0
144
+ - 200.0
145
+ - 200.0
146
+ l_weights: 8.0
147
+ s_coe: 0.0
148
+ s_weights: 50.0
149
+ seg_branch: both
150
+ core_method: vanilla_seg_loss
151
+ lr_scheduler:
152
+ core_method: multistep
153
+ gamma: 0.1
154
+ step_size:
155
+ - 10
156
+ - 15
157
+ model:
158
+ args:
159
+ active_sensors: *id001
160
+ anchor_number: 2
161
+ backbone_fix: false
162
+ base_bev_backbone:
163
+ layer_nums:
164
+ - 3
165
+ - 5
166
+ - 8
167
+ layer_strides:
168
+ - 2
169
+ - 2
170
+ - 2
171
+ num_filters:
172
+ - 64
173
+ - 128
174
+ - 256
175
+ num_upsample_filter:
176
+ - 128
177
+ - 128
178
+ - 128
179
+ upsample_strides:
180
+ - 1
181
+ - 2
182
+ - 4
183
+ cav_range: &id012
184
+ - -140.8
185
+ - -40
186
+ - -3
187
+ - 140.8
188
+ - 40
189
+ - 1
190
+ collaborators: *id002
191
+ compression: 0
192
+ device: cuda
193
+ drone:
194
+ cam:
195
+ bevout_feature: 64
196
+ camera_encoder: EfficientNet
197
+ data_aug_conf: *id003
198
+ depth_supervision: false
199
+ grid_conf: *id004
200
+ img_downsample: 8
201
+ img_features: 64
202
+ use_depth_gt: true
203
+ lidar:
204
+ backbone_fix: false
205
+ compression: 0
206
+ lidar_range:
207
+ - -140.8
208
+ - -40
209
+ - -150
210
+ - 140.8
211
+ - 40
212
+ - -6
213
+ pillar_vfe:
214
+ num_filters:
215
+ - 64
216
+ use_absolute_xyz: true
217
+ use_norm: true
218
+ with_distance: false
219
+ point_pillar_scatter:
220
+ grid_size: &id007 !!python/object/apply:numpy.core.multiarray._reconstruct
221
+ args:
222
+ - &id010 !!python/name:numpy.ndarray ''
223
+ - !!python/tuple
224
+ - 0
225
+ - !!binary |
226
+ Yg==
227
+ state: !!python/tuple
228
+ - 1
229
+ - !!python/tuple
230
+ - 3
231
+ - &id011 !!python/object/apply:numpy.dtype
232
+ args:
233
+ - i8
234
+ - false
235
+ - true
236
+ state: !!python/tuple
237
+ - 3
238
+ - <
239
+ - null
240
+ - null
241
+ - null
242
+ - -1
243
+ - -1
244
+ - 0
245
+ - false
246
+ - !!binary |
247
+ wAIAAAAAAADIAAAAAAAAAAEAAAAAAAAA
248
+ num_features: 64
249
+ voxel_size:
250
+ - 0.4
251
+ - 0.4
252
+ - 144
253
+ modalities:
254
+ - lidar
255
+ dynamic_class: 7
256
+ fax_fusion:
257
+ agent_size: 7
258
+ depth: 3
259
+ dim_head: 32
260
+ drop_out: 0.1
261
+ input_dim: 256
262
+ mask: true
263
+ mlp_dim: 256
264
+ window_size: 4
265
+ head_dim: 256
266
+ max_cav: &id013
267
+ drone: 2
268
+ rsu: 2
269
+ vehicle: 3
270
+ max_cav_num: 7
271
+ num_class: 7
272
+ obj_head: true
273
+ outC: 256
274
+ proj_first: true
275
+ rsu:
276
+ cam:
277
+ bevout_feature: 64
278
+ camera_encoder: EfficientNet
279
+ data_aug_conf: *id005
280
+ depth_supervision: false
281
+ grid_conf: *id006
282
+ img_downsample: 8
283
+ img_features: 64
284
+ use_depth_gt: true
285
+ lidar:
286
+ backbone_fix: false
287
+ compression: 0
288
+ lidar_range:
289
+ - -140.8
290
+ - -40
291
+ - -30
292
+ - 140.8
293
+ - 40
294
+ - 30
295
+ pillar_vfe:
296
+ num_filters:
297
+ - 64
298
+ use_absolute_xyz: true
299
+ use_norm: true
300
+ with_distance: false
301
+ point_pillar_scatter:
302
+ grid_size: *id007
303
+ num_features: 64
304
+ voxel_size:
305
+ - 0.4
306
+ - 0.4
307
+ - 60
308
+ modalities:
309
+ - lidar
310
+ seg_branch: both
311
+ seg_hw: 512
312
+ seg_res: 0.25
313
+ shrink_header:
314
+ dim:
315
+ - 256
316
+ input_dim: 384
317
+ kernal_size:
318
+ - 1
319
+ padding:
320
+ - 0
321
+ stride:
322
+ - 1
323
+ use: true
324
+ static_class: 3
325
+ supervise_single: false
326
+ task: det
327
+ train: true
328
+ vehicle:
329
+ cam:
330
+ bevout_feature: 64
331
+ camera_encoder: EfficientNet
332
+ data_aug_conf: *id008
333
+ depth_supervision: false
334
+ grid_conf: *id009
335
+ img_downsample: 8
336
+ img_features: 64
337
+ use_depth_gt: true
338
+ lidar:
339
+ backbone_fix: false
340
+ compression: 0
341
+ lidar_range:
342
+ - -140.8
343
+ - -40
344
+ - -3
345
+ - 140.8
346
+ - 40
347
+ - 1
348
+ pillar_vfe:
349
+ num_filters:
350
+ - 64
351
+ use_absolute_xyz: true
352
+ use_norm: true
353
+ with_distance: false
354
+ point_pillar_scatter:
355
+ grid_size: !!python/object/apply:numpy.core.multiarray._reconstruct
356
+ args:
357
+ - *id010
358
+ - !!python/tuple
359
+ - 0
360
+ - !!binary |
361
+ Yg==
362
+ state: !!python/tuple
363
+ - 1
364
+ - !!python/tuple
365
+ - 3
366
+ - *id011
367
+ - false
368
+ - !!binary |
369
+ wAIAAAAAAADIAAAAAAAAAAEAAAAAAAAA
370
+ num_features: 64
371
+ voxel_size:
372
+ - 0.4
373
+ - 0.4
374
+ - 4
375
+ modalities:
376
+ - lidar
377
+ core_method: airv2x_cobevt
378
+ name: airv2x_intermediate_cobevt
379
+ num_anchor: 2
380
+ num_class: 7
381
+ optimizer:
382
+ args:
383
+ eps: 1.0e-10
384
+ weight_decay: 0.0001
385
+ core_method: Adam
386
+ lr: 0.002
387
+ postprocess:
388
+ anchor_args:
389
+ D: 1
390
+ H: 200
391
+ W: 704
392
+ cav_lidar_range: *id012
393
+ feature_stride: 2
394
+ h: 1.56
395
+ l: 3.9
396
+ num: 2
397
+ r:
398
+ - 0
399
+ - 90
400
+ vd: 4
401
+ vh: 0.4
402
+ vw: 0.4
403
+ w: 1.6
404
+ core_method: VoxelPostprocessor
405
+ ego_type: vehicle
406
+ max_num: 300
407
+ nms_thresh: 0.15
408
+ order: hwl
409
+ target_args:
410
+ neg_threshold: 0.45
411
+ obj_threshold: 0.2
412
+ pos_threshold: 0.6
413
+ score_threshold: 0.2
414
+ preprocess:
415
+ args:
416
+ max_points_per_voxel: 32
417
+ max_voxel_test: 70000
418
+ max_voxel_train: 32000
419
+ voxel_size:
420
+ - 0.4
421
+ - 0.4
422
+ - 4
423
+ cav_lidar_range: *id012
424
+ core_method: SpVoxelPreprocessor
425
+ ego_type: vehicle
426
+ root_dir: dataset/airv2x/train
427
+ seg_branch: both
428
+ seg_hw: 512
429
+ seg_res: 0.25
430
+ static_class: 3
431
+ tag: default
432
+ task: det
433
+ test_dir: dataset/airv2x/test
434
+ train: true
435
+ train_params:
436
+ batch_size: 1
437
+ epoches: 50
438
+ eval_freq: 2
439
+ max_cav: *id013
440
+ max_cav_num: 7
441
+ save_freq: 1
442
+ validate_dir: dataset/airv2x/val
443
+ yaml_parser: load_airv2x_params
airv2x_intermediate_v2xvit/release/best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ba8fa2beab363cdca4de80f793679902e4e2e48bdb40a24ea2c0102daaccbc7
3
+ size 51188692
airv2x_intermediate_v2xvit/release/config.yaml ADDED
@@ -0,0 +1,475 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ active_sensors: &id001
2
+ - lidar
3
+ bevcam_fov: 110
4
+ collaborators: &id002
5
+ - vehicle
6
+ - rsu
7
+ - drone
8
+ data_augment:
9
+ - ALONG_AXIS_LIST:
10
+ - x
11
+ NAME: random_world_flip
12
+ - NAME: random_world_rotation
13
+ WORLD_ROT_ANGLE:
14
+ - -0.78539816
15
+ - 0.78539816
16
+ - NAME: random_world_scaling
17
+ WORLD_SCALE_RANGE:
18
+ - 0.95
19
+ - 1.05
20
+ device: cuda
21
+ dynamic_class: 7
22
+ ego_type: vehicle
23
+ fusion:
24
+ args:
25
+ drone_data_aug_conf: &id003
26
+ H: 720
27
+ W: 1280
28
+ bot_pct_lim:
29
+ - 0.0
30
+ - 0.05
31
+ final_dim:
32
+ - 360
33
+ - 640
34
+ rand_flip: false
35
+ resize_lim:
36
+ - 0.65
37
+ - 0.7
38
+ rot_lim:
39
+ - -3.6
40
+ - 3.6
41
+ drone_grid_conf: &id004
42
+ ddiscr:
43
+ - 6
44
+ - 150
45
+ - 144
46
+ mode: UD
47
+ xbound:
48
+ - -140.8
49
+ - 140.8
50
+ - 0.4
51
+ ybound:
52
+ - -40
53
+ - 40
54
+ - 0.4
55
+ zbound:
56
+ - -150
57
+ - -6
58
+ - 144
59
+ proj_first: true
60
+ rsu_data_aug_conf: &id005
61
+ H: 720
62
+ W: 1280
63
+ bot_pct_lim:
64
+ - 0.0
65
+ - 0.05
66
+ final_dim:
67
+ - 360
68
+ - 640
69
+ rand_flip: false
70
+ resize_lim:
71
+ - 0.65
72
+ - 0.7
73
+ rot_lim:
74
+ - 0
75
+ - 0
76
+ rsu_grid_conf: &id006
77
+ ddiscr:
78
+ - 2
79
+ - 50
80
+ - 48
81
+ mode: LID
82
+ xbound:
83
+ - -140.8
84
+ - 140.8
85
+ - 0.4
86
+ ybound:
87
+ - -40
88
+ - 40
89
+ - 0.4
90
+ zbound:
91
+ - -30
92
+ - 30
93
+ - 60.0
94
+ veh_data_aug_conf: &id008
95
+ H: 720
96
+ W: 1280
97
+ bot_pct_lim:
98
+ - 0.0
99
+ - 0.05
100
+ final_dim:
101
+ - 360
102
+ - 640
103
+ rand_flip: false
104
+ resize_lim:
105
+ - 0.65
106
+ - 0.7
107
+ rot_lim:
108
+ - 0
109
+ - 0
110
+ veh_grid_conf: &id009
111
+ ddiscr:
112
+ - 2
113
+ - 50
114
+ - 48
115
+ mode: LID
116
+ xbound:
117
+ - -140.8
118
+ - 140.8
119
+ - 0.4
120
+ ybound:
121
+ - -40
122
+ - 40
123
+ - 0.4
124
+ zbound:
125
+ - -10
126
+ - 10
127
+ - 20.0
128
+ core_method: IntermediateFusionDatasetAirv2x
129
+ loss:
130
+ det:
131
+ args:
132
+ cls_weight: 1.0
133
+ num_class: 7
134
+ reg: 2.0
135
+ core_method: point_pillar_loss_multiclass
136
+ seg:
137
+ args:
138
+ d_coe: 2.0
139
+ d_weights:
140
+ - 200.0
141
+ - 200.0
142
+ - 75.0
143
+ - 200.0
144
+ - 200.0
145
+ - 200.0
146
+ l_weights: 8.0
147
+ s_coe: 0.0
148
+ s_weights: 50.0
149
+ seg_branch: both
150
+ core_method: vanilla_seg_loss
151
+ lr_scheduler:
152
+ core_method: multistep
153
+ gamma: 0.1
154
+ step_size:
155
+ - 10
156
+ - 25
157
+ - 40
158
+ model:
159
+ args:
160
+ active_sensors: *id001
161
+ anchor_number: 2
162
+ backbone_fix: false
163
+ cav_range: &id012
164
+ - -140.8
165
+ - -40
166
+ - -3
167
+ - 140.8
168
+ - 40
169
+ - 1
170
+ collaborators: *id002
171
+ device: cuda
172
+ drone:
173
+ cam:
174
+ bevout_feature: 64
175
+ camera_encoder: EfficientNet
176
+ data_aug_conf: *id003
177
+ depth_supervision: false
178
+ grid_conf: *id004
179
+ img_downsample: 8
180
+ img_features: 64
181
+ use_depth_gt: true
182
+ lidar:
183
+ backbone_fix: false
184
+ compression: 0
185
+ lidar_range:
186
+ - -140.8
187
+ - -40
188
+ - -150
189
+ - 140.8
190
+ - 40
191
+ - -6
192
+ pillar_vfe:
193
+ num_filters:
194
+ - 64
195
+ use_absolute_xyz: true
196
+ use_norm: true
197
+ with_distance: false
198
+ point_pillar_scatter:
199
+ grid_size: &id007 !!python/object/apply:numpy.core.multiarray._reconstruct
200
+ args:
201
+ - &id010 !!python/name:numpy.ndarray ''
202
+ - !!python/tuple
203
+ - 0
204
+ - !!binary |
205
+ Yg==
206
+ state: !!python/tuple
207
+ - 1
208
+ - !!python/tuple
209
+ - 3
210
+ - &id011 !!python/object/apply:numpy.dtype
211
+ args:
212
+ - i8
213
+ - false
214
+ - true
215
+ state: !!python/tuple
216
+ - 3
217
+ - <
218
+ - null
219
+ - null
220
+ - null
221
+ - -1
222
+ - -1
223
+ - 0
224
+ - false
225
+ - !!binary |
226
+ wAIAAAAAAADIAAAAAAAAAAEAAAAAAAAA
227
+ num_features: 64
228
+ voxel_size:
229
+ - 0.4
230
+ - 0.4
231
+ - 144
232
+ modalities:
233
+ - lidar
234
+ dynamic_class: 7
235
+ ego_type: vehicle
236
+ head_dim: 256
237
+ max_cav: &id014
238
+ drone: 2
239
+ rsu: 2
240
+ vehicle: 3
241
+ max_cav_num: 7
242
+ modality_fusion:
243
+ base_bev_backbone:
244
+ layer_nums:
245
+ - 3
246
+ - 5
247
+ - 8
248
+ layer_strides:
249
+ - 2
250
+ - 2
251
+ - 2
252
+ num_filters:
253
+ - 64
254
+ - 128
255
+ - 256
256
+ num_upsample_filter:
257
+ - 128
258
+ - 128
259
+ - 128
260
+ upsample_strides:
261
+ - 1
262
+ - 2
263
+ - 4
264
+ compression: 0
265
+ shrink_header:
266
+ dim:
267
+ - 256
268
+ input_dim: 384
269
+ kernal_size:
270
+ - 1
271
+ padding:
272
+ - 0
273
+ stride:
274
+ - 1
275
+ use: true
276
+ num_class: 7
277
+ obj_head: true
278
+ outC: 256
279
+ proj_first: true
280
+ rsu:
281
+ cam:
282
+ bevout_feature: 64
283
+ camera_encoder: EfficientNet
284
+ data_aug_conf: *id005
285
+ depth_supervision: false
286
+ grid_conf: *id006
287
+ img_downsample: 8
288
+ img_features: 64
289
+ use_depth_gt: true
290
+ lidar:
291
+ backbone_fix: false
292
+ compression: 0
293
+ lidar_range:
294
+ - -140.8
295
+ - -40
296
+ - -30
297
+ - 140.8
298
+ - 40
299
+ - 30
300
+ pillar_vfe:
301
+ num_filters:
302
+ - 64
303
+ use_absolute_xyz: true
304
+ use_norm: true
305
+ with_distance: false
306
+ point_pillar_scatter:
307
+ grid_size: *id007
308
+ num_features: 64
309
+ voxel_size:
310
+ - 0.4
311
+ - 0.4
312
+ - 60
313
+ modalities:
314
+ - lidar
315
+ seg_branch: both
316
+ seg_hw: 512
317
+ seg_res: 0.25
318
+ static_class: 3
319
+ supervise_single: false
320
+ task: det
321
+ train: true
322
+ transformer:
323
+ encoder:
324
+ RTE_ratio: 2
325
+ cav_att_config:
326
+ RTE_ratio: 2
327
+ dim: 256
328
+ dim_head: 32
329
+ dropout: 0.3
330
+ heads: 8
331
+ use_RTE: true
332
+ use_hetero: true
333
+ depth: 3
334
+ feed_forward:
335
+ dropout: 0.3
336
+ mlp_dim: 256
337
+ num_blocks: 1
338
+ pwindow_att_config:
339
+ dim: 256
340
+ dim_head:
341
+ - 16
342
+ - 32
343
+ - 64
344
+ dropout: 0.3
345
+ fusion_method: split_attn
346
+ heads:
347
+ - 16
348
+ - 8
349
+ - 4
350
+ relative_pos_embedding: true
351
+ window_size:
352
+ - 2
353
+ - 4
354
+ - 4
355
+ sttf:
356
+ downsample_rate: 4
357
+ voxel_size: &id013
358
+ - 0.4
359
+ - 0.4
360
+ - 4
361
+ use_RTE: true
362
+ use_roi_mask: true
363
+ vehicle:
364
+ cam:
365
+ bevout_feature: 64
366
+ camera_encoder: EfficientNet
367
+ data_aug_conf: *id008
368
+ depth_supervision: false
369
+ grid_conf: *id009
370
+ img_downsample: 8
371
+ img_features: 64
372
+ use_depth_gt: true
373
+ lidar:
374
+ backbone_fix: false
375
+ compression: 0
376
+ lidar_range:
377
+ - -140.8
378
+ - -40
379
+ - -3
380
+ - 140.8
381
+ - 40
382
+ - 1
383
+ pillar_vfe:
384
+ num_filters:
385
+ - 64
386
+ use_absolute_xyz: true
387
+ use_norm: true
388
+ with_distance: false
389
+ point_pillar_scatter:
390
+ grid_size: !!python/object/apply:numpy.core.multiarray._reconstruct
391
+ args:
392
+ - *id010
393
+ - !!python/tuple
394
+ - 0
395
+ - !!binary |
396
+ Yg==
397
+ state: !!python/tuple
398
+ - 1
399
+ - !!python/tuple
400
+ - 3
401
+ - *id011
402
+ - false
403
+ - !!binary |
404
+ wAIAAAAAAADIAAAAAAAAAAEAAAAAAAAA
405
+ num_features: 64
406
+ voxel_size:
407
+ - 0.4
408
+ - 0.4
409
+ - 4
410
+ modalities:
411
+ - lidar
412
+ core_method: airv2x_v2xvit
413
+ name: airv2x_intermediate_v2xvit
414
+ num_anchor: 2
415
+ num_class: 7
416
+ optimizer:
417
+ args:
418
+ eps: 1.0e-10
419
+ weight_decay: 0.0001
420
+ core_method: Adam
421
+ lr: 0.002
422
+ postprocess:
423
+ anchor_args:
424
+ D: 1
425
+ H: 200
426
+ W: 704
427
+ cav_lidar_range: *id012
428
+ feature_stride: 2
429
+ h: 1.56
430
+ l: 3.9
431
+ num: 2
432
+ r:
433
+ - 0
434
+ - 90
435
+ vd: 4
436
+ vh: 0.4
437
+ vw: 0.4
438
+ w: 1.6
439
+ core_method: VoxelPostprocessor
440
+ ego_type: vehicle
441
+ max_num: 300
442
+ nms_thresh: 0.15
443
+ order: hwl
444
+ target_args:
445
+ neg_threshold: 0.45
446
+ obj_threshold: 0.2
447
+ pos_threshold: 0.6
448
+ score_threshold: 0.2
449
+ preprocess:
450
+ args:
451
+ max_points_per_voxel: 32
452
+ max_voxel_test: 70000
453
+ max_voxel_train: 32000
454
+ voxel_size: *id013
455
+ cav_lidar_range: *id012
456
+ core_method: SpVoxelPreprocessor
457
+ ego_type: vehicle
458
+ root_dir: dataset/airv2x/train
459
+ seg_branch: both
460
+ seg_hw: 512
461
+ seg_res: 0.25
462
+ static_class: 3
463
+ tag: default
464
+ task: det
465
+ train: true
466
+ train_params:
467
+ batch_size: 1
468
+ epoches: 50
469
+ eval_freq: 2
470
+ max_cav: *id014
471
+ max_cav_num: 7
472
+ save_freq: 1
473
+ validate_dir: dataset/airv2x/val
474
+ test_dir: dataset/airv2x/test
475
+ yaml_parser: load_airv2x_params
airv2x_intermediate_where2comm/release/config.yaml ADDED
@@ -0,0 +1,449 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ active_sensors: &id001
2
+ - lidar
3
+ bevcam_fov: 110
4
+ collaborators: &id002
5
+ - vehicle
6
+ - rsu
7
+ - drone
8
+ data_augment:
9
+ - ALONG_AXIS_LIST:
10
+ - x
11
+ NAME: random_world_flip
12
+ - NAME: random_world_rotation
13
+ WORLD_ROT_ANGLE:
14
+ - -0.78539816
15
+ - 0.78539816
16
+ - NAME: random_world_scaling
17
+ WORLD_SCALE_RANGE:
18
+ - 0.95
19
+ - 1.05
20
+ device: cuda
21
+ dynamic_class: 7
22
+ ego_type: vehicle
23
+ fusion:
24
+ args:
25
+ drone_data_aug_conf: &id003
26
+ H: 720
27
+ W: 1280
28
+ bot_pct_lim:
29
+ - 0.0
30
+ - 0.05
31
+ final_dim:
32
+ - 360
33
+ - 640
34
+ rand_flip: false
35
+ resize_lim:
36
+ - 0.65
37
+ - 0.7
38
+ rot_lim:
39
+ - -3.6
40
+ - 3.6
41
+ drone_grid_conf: &id004
42
+ ddiscr:
43
+ - 6
44
+ - 150
45
+ - 144
46
+ mode: UD
47
+ xbound:
48
+ - -140.8
49
+ - 140.8
50
+ - 0.4
51
+ ybound:
52
+ - -40
53
+ - 40
54
+ - 0.4
55
+ zbound:
56
+ - -150
57
+ - -6
58
+ - 144
59
+ proj_first: true
60
+ rsu_data_aug_conf: &id005
61
+ H: 720
62
+ W: 1280
63
+ bot_pct_lim:
64
+ - 0.0
65
+ - 0.05
66
+ final_dim:
67
+ - 360
68
+ - 640
69
+ rand_flip: false
70
+ resize_lim:
71
+ - 0.65
72
+ - 0.7
73
+ rot_lim:
74
+ - 0
75
+ - 0
76
+ rsu_grid_conf: &id006
77
+ ddiscr:
78
+ - 2
79
+ - 50
80
+ - 48
81
+ mode: LID
82
+ xbound:
83
+ - -140.8
84
+ - 140.8
85
+ - 0.4
86
+ ybound:
87
+ - -40
88
+ - 40
89
+ - 0.4
90
+ zbound:
91
+ - -30
92
+ - 30
93
+ - 60.0
94
+ veh_data_aug_conf: &id008
95
+ H: 720
96
+ W: 1280
97
+ bot_pct_lim:
98
+ - 0.0
99
+ - 0.05
100
+ final_dim:
101
+ - 360
102
+ - 640
103
+ rand_flip: false
104
+ resize_lim:
105
+ - 0.65
106
+ - 0.7
107
+ rot_lim:
108
+ - 0
109
+ - 0
110
+ veh_grid_conf: &id009
111
+ ddiscr:
112
+ - 2
113
+ - 50
114
+ - 48
115
+ mode: LID
116
+ xbound:
117
+ - -140.8
118
+ - 140.8
119
+ - 0.4
120
+ ybound:
121
+ - -40
122
+ - 40
123
+ - 0.4
124
+ zbound:
125
+ - -10
126
+ - 10
127
+ - 20.0
128
+ core_method: IntermediateFusionDatasetAirv2x
129
+ loss:
130
+ det:
131
+ args:
132
+ cls_weight: 1.0
133
+ num_class: 7
134
+ reg: 2.0
135
+ core_method: point_pillar_loss_multiclass
136
+ seg:
137
+ args:
138
+ d_coe: 2.0
139
+ d_weights:
140
+ - 200.0
141
+ - 200.0
142
+ - 75.0
143
+ - 200.0
144
+ - 200.0
145
+ - 200.0
146
+ l_weights: 8.0
147
+ s_coe: 0.0
148
+ s_weights: 50.0
149
+ seg_branch: both
150
+ core_method: vanilla_seg_loss
151
+ lr_scheduler:
152
+ core_method: multistep
153
+ gamma: 0.1
154
+ step_size:
155
+ - 10
156
+ - 25
157
+ - 40
158
+ model:
159
+ args:
160
+ active_sensors: *id001
161
+ anchor_number: 2
162
+ backbone_fix: false
163
+ cav_range: &id014
164
+ - -140.8
165
+ - -40
166
+ - -3
167
+ - 140.8
168
+ - 40
169
+ - 1
170
+ collaborators: *id002
171
+ device: cuda
172
+ drone:
173
+ cam:
174
+ bevout_feature: 64
175
+ camera_encoder: EfficientNet
176
+ data_aug_conf: *id003
177
+ depth_supervision: false
178
+ grid_conf: *id004
179
+ img_downsample: 8
180
+ img_features: 64
181
+ use_depth_gt: true
182
+ lidar:
183
+ backbone_fix: false
184
+ compression: 0
185
+ lidar_range:
186
+ - -140.8
187
+ - -40
188
+ - -150
189
+ - 140.8
190
+ - 40
191
+ - -6
192
+ pillar_vfe:
193
+ num_filters:
194
+ - 64
195
+ use_absolute_xyz: true
196
+ use_norm: true
197
+ with_distance: false
198
+ point_pillar_scatter:
199
+ grid_size: &id007 !!python/object/apply:numpy.core.multiarray._reconstruct
200
+ args:
201
+ - &id010 !!python/name:numpy.ndarray ''
202
+ - !!python/tuple
203
+ - 0
204
+ - !!binary |
205
+ Yg==
206
+ state: !!python/tuple
207
+ - 1
208
+ - !!python/tuple
209
+ - 3
210
+ - &id011 !!python/object/apply:numpy.dtype
211
+ args:
212
+ - i8
213
+ - false
214
+ - true
215
+ state: !!python/tuple
216
+ - 3
217
+ - <
218
+ - null
219
+ - null
220
+ - null
221
+ - -1
222
+ - -1
223
+ - 0
224
+ - false
225
+ - !!binary |
226
+ wAIAAAAAAADIAAAAAAAAAAEAAAAAAAAA
227
+ num_features: 64
228
+ voxel_size:
229
+ - 0.4
230
+ - 0.4
231
+ - 144
232
+ modalities:
233
+ - lidar
234
+ dynamic_class: 7
235
+ ego_type: vehicle
236
+ head_dim: 256
237
+ max_cav: &id016
238
+ drone: 5
239
+ rsu: 5
240
+ vehicle: 5
241
+ modality_fusion:
242
+ base_bev_backbone:
243
+ layer_nums: &id012
244
+ - 3
245
+ - 5
246
+ - 8
247
+ layer_strides:
248
+ - 2
249
+ - 2
250
+ - 2
251
+ num_filters: &id013
252
+ - 64
253
+ - 128
254
+ - 256
255
+ num_upsample_filter:
256
+ - 128
257
+ - 128
258
+ - 128
259
+ upsample_strides:
260
+ - 1
261
+ - 2
262
+ - 4
263
+ compression: 0
264
+ shrink_header:
265
+ dim:
266
+ - 256
267
+ input_dim: 384
268
+ kernal_size:
269
+ - 1
270
+ padding:
271
+ - 0
272
+ stride:
273
+ - 1
274
+ use: true
275
+ num_class: 7
276
+ obj_head: true
277
+ outC: 256
278
+ proj_first: true
279
+ rsu:
280
+ cam:
281
+ bevout_feature: 64
282
+ camera_encoder: EfficientNet
283
+ data_aug_conf: *id005
284
+ depth_supervision: false
285
+ grid_conf: *id006
286
+ img_downsample: 8
287
+ img_features: 64
288
+ use_depth_gt: true
289
+ lidar:
290
+ backbone_fix: false
291
+ compression: 0
292
+ lidar_range:
293
+ - -140.8
294
+ - -40
295
+ - -30
296
+ - 140.8
297
+ - 40
298
+ - 30
299
+ pillar_vfe:
300
+ num_filters:
301
+ - 64
302
+ use_absolute_xyz: true
303
+ use_norm: true
304
+ with_distance: false
305
+ point_pillar_scatter:
306
+ grid_size: *id007
307
+ num_features: 64
308
+ voxel_size:
309
+ - 0.4
310
+ - 0.4
311
+ - 60
312
+ modalities:
313
+ - lidar
314
+ seg_branch: both
315
+ seg_hw: 512
316
+ seg_res: 0.25
317
+ static_class: 3
318
+ supervise_single: false
319
+ task: det
320
+ train: true
321
+ vehicle:
322
+ cam:
323
+ bevout_feature: 64
324
+ camera_encoder: EfficientNet
325
+ data_aug_conf: *id008
326
+ depth_supervision: false
327
+ grid_conf: *id009
328
+ img_downsample: 8
329
+ img_features: 64
330
+ use_depth_gt: true
331
+ lidar:
332
+ backbone_fix: false
333
+ compression: 0
334
+ lidar_range:
335
+ - -140.8
336
+ - -40
337
+ - -3
338
+ - 140.8
339
+ - 40
340
+ - 1
341
+ pillar_vfe:
342
+ num_filters:
343
+ - 64
344
+ use_absolute_xyz: true
345
+ use_norm: true
346
+ with_distance: false
347
+ point_pillar_scatter:
348
+ grid_size: !!python/object/apply:numpy.core.multiarray._reconstruct
349
+ args:
350
+ - *id010
351
+ - !!python/tuple
352
+ - 0
353
+ - !!binary |
354
+ Yg==
355
+ state: !!python/tuple
356
+ - 1
357
+ - !!python/tuple
358
+ - 3
359
+ - *id011
360
+ - false
361
+ - !!binary |
362
+ wAIAAAAAAADIAAAAAAAAAAEAAAAAAAAA
363
+ num_features: 64
364
+ voxel_size:
365
+ - 0.4
366
+ - 0.4
367
+ - 4
368
+ modalities:
369
+ - lidar
370
+ where2com_fusion:
371
+ communication:
372
+ gaussian_smooth:
373
+ c_sigma: 1.0
374
+ k_size: 5
375
+ round: 1
376
+ threshold: 0.01
377
+ downsample_rate: 4
378
+ fully: false
379
+ in_channels: 256
380
+ layer_nums: *id012
381
+ multi_scale: true
382
+ num_filters: *id013
383
+ voxel_size: &id015
384
+ - 0.4
385
+ - 0.4
386
+ - 4
387
+ core_method: airv2x_where2com
388
+ name: airv2x_intermediate_where2comm
389
+ num_anchor: 2
390
+ num_class: 7
391
+ optimizer:
392
+ args:
393
+ eps: 1.0e-10
394
+ weight_decay: 0.0001
395
+ core_method: Adam
396
+ lr: 0.002
397
+ postprocess:
398
+ anchor_args:
399
+ D: 1
400
+ H: 200
401
+ W: 704
402
+ cav_lidar_range: *id014
403
+ feature_stride: 2
404
+ h: 1.56
405
+ l: 3.9
406
+ num: 2
407
+ r:
408
+ - 0
409
+ - 90
410
+ vd: 4
411
+ vh: 0.4
412
+ vw: 0.4
413
+ w: 1.6
414
+ core_method: VoxelPostprocessor
415
+ ego_type: vehicle
416
+ max_num: 300
417
+ nms_thresh: 0.15
418
+ order: hwl
419
+ target_args:
420
+ neg_threshold: 0.45
421
+ obj_threshold: 0.2
422
+ pos_threshold: 0.6
423
+ score_threshold: 0.2
424
+ preprocess:
425
+ args:
426
+ max_points_per_voxel: 32
427
+ max_voxel_test: 70000
428
+ max_voxel_train: 32000
429
+ voxel_size: *id015
430
+ cav_lidar_range: *id014
431
+ core_method: SpVoxelPreprocessor
432
+ ego_type: vehicle
433
+ root_dir: dataset/airv2x/train
434
+ seg_branch: both
435
+ seg_hw: 512
436
+ seg_res: 0.25
437
+ static_class: 3
438
+ tag: default
439
+ task: det
440
+ train: true
441
+ train_params:
442
+ batch_size: 1
443
+ epoches: 50
444
+ eval_freq: 2
445
+ max_cav: *id016
446
+ save_freq: 1
447
+ validate_dir: dataset/airv2x/val
448
+ test_dir: dataset/airv2x/test
449
+ yaml_parser: load_airv2x_params
airv2x_intermediate_where2comm/release/net_epoch16.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f0ce7c234489d6a1540944e6f656e0668e2917eea8d29b1da03885c638ceb2b
3
+ size 29195398