yuyang-cloud commited on
Commit
6bf726b
·
verified ·
1 Parent(s): 5ab3b69

Upload folder using huggingface_hub

Browse files
Files changed (20) hide show
  1. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/adapter/config.json +7 -0
  2. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/adapter/diffusion_pytorch_model.bin +3 -0
  3. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/optimizer.bin +3 -0
  4. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/pytorch_model.bin +3 -0
  5. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/pytorch_model_1.bin +3 -0
  6. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/pytorch_model_2.bin +3 -0
  7. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/random_states_0.pkl +3 -0
  8. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/random_states_1.pkl +3 -0
  9. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/random_states_2.pkl +3 -0
  10. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/random_states_3.pkl +3 -0
  11. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/scaler.pt +3 -0
  12. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/scheduler.bin +3 -0
  13. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/hydra/config.yaml +495 -0
  14. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/hydra/hydra.yaml +162 -0
  15. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/hydra/overrides.yaml +2 -0
  16. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/lora_text.pt +3 -0
  17. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/tb-occ/events.out.tfevents.1745161677.cvrp-gpu-5.2144986.0 +3 -0
  18. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/train.log +0 -0
  19. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/unet_occ/config.json +107 -0
  20. occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/unet_occ/diffusion_pytorch_model.bin +3 -0
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/adapter/config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "TextAdapter",
3
+ "_diffusers_version": "0.17.1",
4
+ "in_dim": 1024,
5
+ "int_dim": 896,
6
+ "out_dim": 1024
7
+ }
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/adapter/diffusion_pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01c9018495bd23c6b7cbf80ad5032ced9ad9d837bc912ef2c977a68e26682ffc
3
+ size 88693665
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10f786eab56c17adc60bac922fddad5f19bb8aa74e949dfead5c5316f034cb5d
3
+ size 3881234331
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a863133b3f74977a18ad98d697da8515d45b267096f4694b4f22ac6f3f01a1f3
3
+ size 1854200581
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/pytorch_model_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:977f8e0133b3f2502a75f512e8638b5122bc7ff21a9fcbf3869d6a8acc9a828f
3
+ size 1496717673
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/pytorch_model_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6475eaebf9a7aee9314e6e88218fb8362d2bef34180b91d7e902d51128aaf69f
3
+ size 88693425
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d63cb9fb2a5f56837756cebaa3a8cb947b660ff1d88428755d04973021213b9e
3
+ size 17747
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/random_states_1.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dcf56463be636fe6a38ff30440cca6e268506c184e1a4e5ea2dfb623d47341b
3
+ size 17747
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/random_states_2.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6eb45d91195bdc76d1ec2f0d7d9fbac7179b9dbbf4cd4e53db7a087eb9dedf1
3
+ size 17747
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/random_states_3.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3345b5d76cb40ea8ee98f22e921fbebfc6053aa1f7b08ab4951a0f0897ec65ef
3
+ size 17747
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fce4e8b2846330e7f90197e8f3876452f5224d090d9fa143a17219be96966945
3
+ size 557
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/checkpoint-75000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09292b540a5bd17f70e67cef5ca61cc55788c0b633bfc767f117a92550659161
3
+ size 627
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/hydra/config.yaml ADDED
@@ -0,0 +1,495 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ task_id: occ
2
+ log_root_prefix: work_dirs/debug
3
+ projname: ${model.name}
4
+ try_run: true
5
+ debug: false
6
+ log_root: ./work_dirs
7
+ init_method: env://
8
+ seed: 100
9
+ fix_seed_within_batch: false
10
+ resume_from_checkpoint: work_dirs/occ_rawbox_2025-04-17_22-56_occ/checkpoint-740000
11
+ resume_reset_scheduler: false
12
+ validation_only: false
13
+ model:
14
+ name: occ_rawbox
15
+ pretrained_model_name_or_path: pretrained/stable-diffusion-v2-1/
16
+ pretrained_t5_path: pretrained/t5-large/
17
+ pretrained_lavi_bridge_path: pretrained/LaVi-Bridge/t5_unet/
18
+ bbox_mode: all-xyz
19
+ bbox_view_shared: true
20
+ condition_embed_dim: 1024
21
+ train_with_same_noise: false
22
+ runner_module: magicdrive.runner.occ_runner.OccRunner
23
+ pipe_module: magicdrive.pipeline.pipeline_occ_unet.StableDiffusionOccUNetPipeline
24
+ vae_module: magicdrive.occ_vae.networks.networks.AutoEncoderGroupSkip
25
+ vae_ckpt: work_dirs/vae/best_model
26
+ vae:
27
+ num_class: 17
28
+ geo_feat_channels: 16
29
+ feat_channel_up: 64
30
+ mlp_hidden_channels: 256
31
+ mlp_hidden_layers: 4
32
+ z_down: false
33
+ padding_mode: replicate
34
+ voxel_fea: false
35
+ triplane: true
36
+ pos: true
37
+ dataset: Occ3D-nuScenes
38
+ unet_module: magicdrive.networks.unet_2d_condition_occ.UNet2DConditionModelOcc
39
+ use_fp32_for_unet_trainable: true
40
+ unet_dir: unet_occ
41
+ unet:
42
+ sample_size: 116
43
+ in_channels: 16
44
+ out_channels: 16
45
+ down_block_types:
46
+ - CrossAttnDownBlock2D
47
+ - CrossAttnDownBlock2D
48
+ - CrossAttnDownBlock2D
49
+ - DownBlock2D
50
+ up_block_types:
51
+ - UpBlock2D
52
+ - CrossAttnUpBlock2D
53
+ - CrossAttnUpBlock2D
54
+ - CrossAttnUpBlock2D
55
+ block_out_channels:
56
+ - 64
57
+ - 128
58
+ - 256
59
+ - 512
60
+ layers_per_block: 2
61
+ cross_attention_dim: ${model.condition_embed_dim}
62
+ tri_size: ${dataset.tri_size}
63
+ is_rollout: true
64
+ conv_down: true
65
+ conv_up: true
66
+ tri_z_down: false
67
+ map_with_aux_box: ${runner.triplane_aux_box}
68
+ map_size_wo_aux_box:
69
+ - 16
70
+ - 216
71
+ - 216
72
+ map_size_w_aux_box:
73
+ - 24
74
+ - 216
75
+ - 216
76
+ conditioning_embedding_out_channels:
77
+ - 16
78
+ - 32
79
+ - 96
80
+ - 256
81
+ use_uncond_map: zero
82
+ drop_cond_ratio: 0.25
83
+ bbox_embedder_cls: magicdrive.networks.bbox_embedder.ContinuousBBoxWithTextEmbedding
84
+ bbox_embedder_param:
85
+ n_classes: 10
86
+ class_token_dim: ${model.condition_embed_dim}
87
+ trainable_class_token: false
88
+ use_text_encoder_init: true
89
+ embedder_num_freq: 4
90
+ proj_dims:
91
+ - 1024
92
+ - 512
93
+ - 512
94
+ - 1024
95
+ mode: ${...bbox_mode}
96
+ minmax_normalize: false
97
+ dataset:
98
+ dataset_type: NuScenesDatasetM
99
+ occ_dataset_type: Occ3D-nuScenes
100
+ dataset_root: data/nuscenes/
101
+ triplane_root: data/nuscenes/nuscenes_triplane_100_100_16
102
+ dataset_process_root: data/nuscenes/nuscenes_mmdet3d_2/
103
+ dataset_cache_file_tag: 26x200x200_map_aux_full_16x216x216_triplane_map
104
+ dataset_cache_file:
105
+ - ${dataset.dataset_process_root}../nuscenes_map_aux/train_${dataset.dataset_cache_file_tag}.h5
106
+ - ${dataset.dataset_process_root}../nuscenes_map_aux/val_${dataset.dataset_cache_file_tag}.h5
107
+ template_clip: A driving scene image at {location}. {description}.
108
+ template_t5: A driving scene at {location}. {description}. {detailed_description}
109
+ image_size:
110
+ - 224
111
+ - 400
112
+ map_bound:
113
+ x:
114
+ - -40.0
115
+ - 40.0
116
+ - 0.4
117
+ 'y':
118
+ - -40.0
119
+ - 40.0
120
+ - 0.4
121
+ z:
122
+ - -1.0
123
+ - 5.4
124
+ - 0.4
125
+ tri_size:
126
+ - 100
127
+ - 100
128
+ - 16
129
+ view_order:
130
+ - CAM_FRONT_LEFT
131
+ - CAM_FRONT
132
+ - CAM_FRONT_RIGHT
133
+ - CAM_BACK_RIGHT
134
+ - CAM_BACK
135
+ - CAM_BACK_LEFT
136
+ neighboring_view_pair:
137
+ 0:
138
+ - 5
139
+ - 1
140
+ 1:
141
+ - 0
142
+ - 2
143
+ 2:
144
+ - 1
145
+ - 3
146
+ 3:
147
+ - 2
148
+ - 4
149
+ 4:
150
+ - 3
151
+ - 5
152
+ 5:
153
+ - 4
154
+ - 0
155
+ back_resize:
156
+ - 896
157
+ - 1600
158
+ back_pad:
159
+ - 0
160
+ - 4
161
+ - 0
162
+ - 0
163
+ augment2d:
164
+ resize:
165
+ - - 0.25
166
+ - 0.25
167
+ rotate: null
168
+ aux_data:
169
+ - visibility
170
+ - center_offset
171
+ - center_ohw
172
+ - height
173
+ augment3d:
174
+ scale:
175
+ - 1.0
176
+ - 1.0
177
+ rotate:
178
+ - 0.0
179
+ - 0.0
180
+ translate: 0
181
+ flip_ratio: 0.0
182
+ flip_direction: null
183
+ object_classes:
184
+ - barrier
185
+ - bicycle
186
+ - bus
187
+ - car
188
+ - construction_vehicle
189
+ - motorcycle
190
+ - pedestrian
191
+ - traffic_cone
192
+ - trailer
193
+ - truck
194
+ map_classes:
195
+ - drivable_area
196
+ - ped_crossing
197
+ - walkway
198
+ - stop_line
199
+ - carpark_area
200
+ - road_divider
201
+ - lane_divider
202
+ - road_block
203
+ input_modality:
204
+ use_lidar: false
205
+ use_camera: true
206
+ use_radar: false
207
+ use_map: false
208
+ use_external: false
209
+ train_pipeline:
210
+ - type: LoadMultiViewImageFromFiles
211
+ to_float32: true
212
+ - type: LoadAnnotations3D
213
+ with_bbox_3d: true
214
+ with_label_3d: true
215
+ with_attr_label: false
216
+ - type: ImageAug3D
217
+ final_dim: ${...image_size}
218
+ resize_lim: ${...augment2d.resize[0]}
219
+ bot_pct_lim:
220
+ - 0.0
221
+ - 0.0
222
+ rot_lim: ${...augment2d.rotate}
223
+ rand_flip: false
224
+ is_train: false
225
+ - type: GlobalRotScaleTrans
226
+ resize_lim: ${...augment3d.scale}
227
+ rot_lim: ${...augment3d.rotate}
228
+ trans_lim: ${...augment3d.translate}
229
+ is_train: true
230
+ - type: ObjectNameFilterM
231
+ classes: ${...object_classes}
232
+ - type: LoadBEVSegmentationM
233
+ dataset_root: ${...dataset_root}
234
+ xbound: ${...map_bound.x}
235
+ ybound: ${...map_bound.y}
236
+ classes: ${...map_classes}
237
+ object_classes: ${...object_classes}
238
+ aux_data: ${...aux_data}
239
+ cache_file: ${...dataset_cache_file.0}
240
+ - type: LoadBEVHDMap
241
+ dataset_root: ${...dataset_root}
242
+ xbound: ${...map_bound.x}
243
+ ybound: ${...map_bound.y}
244
+ image_size: ${...image_size}
245
+ object_classes: ${...object_classes}
246
+ - type: LoadTriPlane
247
+ dataset_root: ${...triplane_root}
248
+ dataset_type: ${...occ_dataset_type}
249
+ - type: LoadTriPlaneSegmentation
250
+ dataset_root: ${...dataset_root}
251
+ xbound: ${...map_bound.x}
252
+ ybound: ${...map_bound.y}
253
+ zbound: ${...map_bound.z}
254
+ cache_file: ${...dataset_cache_file.0}
255
+ dataset_type: ${...occ_dataset_type}
256
+ - type: LoadOccRenderMap
257
+ dataset_root: ${occ_render_path}
258
+ num_classes: 20
259
+ - type: RandomFlip3DwithViews
260
+ flip_ratio: ${...augment3d.flip_ratio}
261
+ direction: ${...augment3d.flip_direction}
262
+ - type: LoadDescription
263
+ dataset_root: ${...dataset_root}
264
+ dataset_type: ${...occ_dataset_type}
265
+ - type: ReorderMultiViewImagesM
266
+ order: ${...view_order}
267
+ safe: false
268
+ - type: ImageNormalize
269
+ mean:
270
+ - 0.5
271
+ - 0.5
272
+ - 0.5
273
+ std:
274
+ - 0.5
275
+ - 0.5
276
+ - 0.5
277
+ - type: DefaultFormatBundle3D
278
+ classes: ${...object_classes}
279
+ - type: Collect3D
280
+ keys:
281
+ - img
282
+ - triplane
283
+ - gt_bboxes_3d
284
+ - gt_labels_3d
285
+ - gt_masks_bev
286
+ - gt_aux_bev
287
+ - bev_hdmap
288
+ - layout_canvas
289
+ - gt_masks_triplane
290
+ - occ_render_image
291
+ - occ_render_depth
292
+ meta_keys:
293
+ - camera_intrinsics
294
+ - lidar2ego
295
+ - lidar2camera
296
+ - camera2lidar
297
+ - lidar2image
298
+ - img_aug_matrix
299
+ meta_lis_keys:
300
+ - timeofday
301
+ - location
302
+ - description
303
+ - detailed_description
304
+ - filename
305
+ - token
306
+ test_pipeline:
307
+ - type: LoadMultiViewImageFromFiles
308
+ to_float32: true
309
+ - type: LoadAnnotations3D
310
+ with_bbox_3d: true
311
+ with_label_3d: true
312
+ with_attr_label: false
313
+ - type: ImageAug3D
314
+ final_dim: ${...image_size}
315
+ resize_lim: ${...augment2d.resize[0]}
316
+ bot_pct_lim:
317
+ - 0.0
318
+ - 0.0
319
+ rot_lim:
320
+ - 0.0
321
+ - 0.0
322
+ rand_flip: false
323
+ is_train: false
324
+ - type: GlobalRotScaleTrans
325
+ resize_lim: ${...augment3d.scale}
326
+ rot_lim: ${...augment3d.rotate}
327
+ trans_lim: ${...augment3d.translate}
328
+ is_train: true
329
+ - type: ObjectNameFilterM
330
+ classes: ${...object_classes}
331
+ - type: LoadBEVSegmentationM
332
+ dataset_root: ${...dataset_root}
333
+ xbound: ${...map_bound.x}
334
+ ybound: ${...map_bound.y}
335
+ classes: ${...map_classes}
336
+ object_classes: ${...object_classes}
337
+ aux_data: ${...aux_data}
338
+ cache_file: ${...dataset_cache_file.1}
339
+ - type: LoadBEVHDMap
340
+ dataset_root: ${...dataset_root}
341
+ xbound: ${...map_bound.x}
342
+ ybound: ${...map_bound.y}
343
+ image_size: ${...image_size}
344
+ object_classes: ${...object_classes}
345
+ - type: LoadTriPlane
346
+ dataset_root: ${...triplane_root}
347
+ dataset_type: ${...occ_dataset_type}
348
+ - type: LoadTriPlaneSegmentation
349
+ dataset_root: ${...dataset_root}
350
+ xbound: ${...map_bound.x}
351
+ ybound: ${...map_bound.y}
352
+ zbound: ${...map_bound.z}
353
+ cache_file: ${...dataset_cache_file.1}
354
+ dataset_type: ${...occ_dataset_type}
355
+ - type: LoadOccRenderMap
356
+ dataset_root: ${occ_render_path}
357
+ num_classes: 20
358
+ - type: LoadDescription
359
+ dataset_root: ${...dataset_root}
360
+ dataset_type: ${...occ_dataset_type}
361
+ - type: ReorderMultiViewImagesM
362
+ order: ${...view_order}
363
+ safe: false
364
+ - type: ImageNormalize
365
+ mean:
366
+ - 0.5
367
+ - 0.5
368
+ - 0.5
369
+ std:
370
+ - 0.5
371
+ - 0.5
372
+ - 0.5
373
+ - type: DefaultFormatBundle3D
374
+ classes: ${...object_classes}
375
+ - type: Collect3D
376
+ keys:
377
+ - img
378
+ - triplane
379
+ - gt_bboxes_3d
380
+ - gt_labels_3d
381
+ - gt_masks_bev
382
+ - gt_aux_bev
383
+ - bev_hdmap
384
+ - layout_canvas
385
+ - gt_masks_triplane
386
+ - occ_render_image
387
+ - occ_render_depth
388
+ meta_keys:
389
+ - camera_intrinsics
390
+ - lidar2ego
391
+ - lidar2camera
392
+ - camera2lidar
393
+ - lidar2image
394
+ - img_aug_matrix
395
+ meta_lis_keys:
396
+ - timeofday
397
+ - location
398
+ - description
399
+ - detailed_description
400
+ - filename
401
+ - token
402
+ data:
403
+ train:
404
+ type: ${...dataset_type}
405
+ dataset_root: ${...dataset_root}
406
+ ann_file: ${...dataset_process_root}nuscenes_infos_train.pkl
407
+ pipeline: ${...train_pipeline}
408
+ object_classes: ${...object_classes}
409
+ map_classes: ${...map_classes}
410
+ modality: ${...input_modality}
411
+ test_mode: false
412
+ force_all_boxes: true
413
+ box_type_3d: LiDAR
414
+ filter_empty_gt: false
415
+ val:
416
+ type: ${...dataset_type}
417
+ dataset_root: ${...dataset_root}
418
+ ann_file: ${...dataset_process_root}nuscenes_infos_val.pkl
419
+ pipeline: ${...test_pipeline}
420
+ object_classes: ${...object_classes}
421
+ map_classes: ${...map_classes}
422
+ modality: ${...input_modality}
423
+ test_mode: false
424
+ force_all_boxes: true
425
+ box_type_3d: LiDAR
426
+ filter_empty_gt: false
427
+ test:
428
+ type: ${...dataset_type}
429
+ dataset_root: ${...dataset_root}
430
+ ann_file: ${...dataset_process_root}nuscenes_infos_val.pkl
431
+ pipeline: ${...test_pipeline}
432
+ object_classes: ${...object_classes}
433
+ map_classes: ${...map_classes}
434
+ modality: ${...input_modality}
435
+ test_mode: true
436
+ force_all_boxes: true
437
+ box_type_3d: LiDAR
438
+ filter_empty_gt: false
439
+ accelerator:
440
+ gradient_accumulation_steps: 1
441
+ mixed_precision: fp16
442
+ report_to: tensorboard
443
+ runner:
444
+ foreground_loss_weight: 0.0
445
+ bbox_drop_ratio: 0
446
+ bbox_add_ratio: 0
447
+ bbox_add_num: 3
448
+ triplane_aux_box: false
449
+ num_train_epochs: 800
450
+ train_batch_size: 1
451
+ max_train_steps: 7
452
+ num_workers: 8
453
+ prefetch_factor: 4
454
+ display_per_epoch: 3125
455
+ display_per_n_min: 10
456
+ max_grad_norm: 1.0
457
+ set_grads_to_none: true
458
+ enable_xformers_memory_efficient_attention: true
459
+ unet_in_fp16: false
460
+ enable_unet_checkpointing: true
461
+ enable_controlnet_checkpointing: false
462
+ noise_offset: 0.0
463
+ train_with_same_offset: true
464
+ use_8bit_adam: false
465
+ adam_beta1: 0.9
466
+ adam_beta2: 0.999
467
+ adam_weight_decay: 0.01
468
+ adam_epsilon: 1.0e-08
469
+ learning_rate: 0.0001
470
+ lr_scheduler: constant
471
+ gradient_accumulation_steps: 1
472
+ lr_num_cycles: 1
473
+ lr_power: 1.0
474
+ lr_warmup_steps: 3000
475
+ checkpointing_steps: 5
476
+ validation_steps: 5
477
+ save_model_per_epoch: null
478
+ validation_before_run: false
479
+ validation_index:
480
+ - 204
481
+ - 912
482
+ - 1828
483
+ validation_times: 2
484
+ validation_batch_size: 1
485
+ validation_show_box: true
486
+ validation_seed_global: false
487
+ pipeline_param:
488
+ guidance_scale: 2
489
+ num_inference_steps: 20
490
+ eta: 0.0
491
+ controlnet_conditioning_scale: 1.0
492
+ guess_mode: false
493
+ use_zero_map_as_unconditional: false
494
+ bbox_max_length: null
495
+ occ_render_path: data/nuscenes/occ_render_map/
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/hydra/hydra.yaml ADDED
@@ -0,0 +1,162 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ hydra:
2
+ run:
3
+ dir: ${log_root_prefix}/${projname}_${now:%Y-%m-%d}_${now:%H-%M}_${task_id}
4
+ sweep:
5
+ dir: multirun/${now:%Y-%m-%d}/${now:%H-%M-%S}
6
+ subdir: ${hydra.job.num}
7
+ launcher:
8
+ _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
9
+ sweeper:
10
+ _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
11
+ max_batch_size: null
12
+ params: null
13
+ help:
14
+ app_name: ${hydra.job.name}
15
+ header: '${hydra.help.app_name} is powered by Hydra.
16
+
17
+ '
18
+ footer: 'Powered by Hydra (https://hydra.cc)
19
+
20
+ Use --hydra-help to view Hydra specific help
21
+
22
+ '
23
+ template: '${hydra.help.header}
24
+
25
+ == Configuration groups ==
26
+
27
+ Compose your configuration from those groups (group=option)
28
+
29
+
30
+ $APP_CONFIG_GROUPS
31
+
32
+
33
+ == Config ==
34
+
35
+ Override anything in the config (foo.bar=value)
36
+
37
+
38
+ $CONFIG
39
+
40
+
41
+ ${hydra.help.footer}
42
+
43
+ '
44
+ hydra_help:
45
+ template: 'Hydra (${hydra.runtime.version})
46
+
47
+ See https://hydra.cc for more info.
48
+
49
+
50
+ == Flags ==
51
+
52
+ $FLAGS_HELP
53
+
54
+
55
+ == Configuration groups ==
56
+
57
+ Compose your configuration from those groups (For example, append hydra/job_logging=disabled
58
+ to command line)
59
+
60
+
61
+ $HYDRA_CONFIG_GROUPS
62
+
63
+
64
+ Use ''--cfg hydra'' to Show the Hydra config.
65
+
66
+ '
67
+ hydra_help: ???
68
+ hydra_logging:
69
+ version: 1
70
+ formatters:
71
+ simple:
72
+ format: '[%(asctime)s][HYDRA] %(message)s'
73
+ handlers:
74
+ console:
75
+ class: logging.StreamHandler
76
+ formatter: simple
77
+ stream: ext://sys.stdout
78
+ root:
79
+ level: INFO
80
+ handlers:
81
+ - console
82
+ loggers:
83
+ logging_example:
84
+ level: DEBUG
85
+ disable_existing_loggers: false
86
+ job_logging:
87
+ version: 1
88
+ formatters:
89
+ simple:
90
+ format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
91
+ handlers:
92
+ console:
93
+ class: logging.StreamHandler
94
+ formatter: simple
95
+ stream: ext://sys.stdout
96
+ file:
97
+ class: logging.FileHandler
98
+ formatter: simple
99
+ filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
100
+ root:
101
+ level: INFO
102
+ handlers:
103
+ - console
104
+ - file
105
+ disable_existing_loggers: false
106
+ env: {}
107
+ mode: RUN
108
+ searchpath: []
109
+ callbacks: {}
110
+ output_subdir: hydra
111
+ overrides:
112
+ hydra:
113
+ - hydra.mode=RUN
114
+ task:
115
+ - +exp=occ
116
+ - runner=debug
117
+ job:
118
+ name: train
119
+ chdir: null
120
+ override_dirname: +exp=occ,runner=debug
121
+ id: ???
122
+ num: ???
123
+ config_name: config_occ
124
+ env_set: {}
125
+ env_copy: []
126
+ config:
127
+ override_dirname:
128
+ kv_sep: '='
129
+ item_sep: ','
130
+ exclude_keys: []
131
+ runtime:
132
+ version: 1.3.0
133
+ version_base: '1.3'
134
+ cwd: /data/yyang/workspace/MagicDrive
135
+ config_sources:
136
+ - path: hydra.conf
137
+ schema: pkg
138
+ provider: hydra
139
+ - path: /data/yyang/workspace/MagicDrive/configs
140
+ schema: file
141
+ provider: main
142
+ - path: ''
143
+ schema: structured
144
+ provider: schema
145
+ output_dir: /data/yyang/workspace/MagicDrive/work_dirs/debug/occ_rawbox_2025-04-20_23-06_occ
146
+ choices:
147
+ exp: occ
148
+ exp/model@model: ../../model/occ_rawbox
149
+ runner: debug
150
+ accelerator: default
151
+ dataset: Nuscenes_cache
152
+ model: occ_rawbox
153
+ hydra/env: default
154
+ hydra/callbacks: null
155
+ hydra/job_logging: default
156
+ hydra/hydra_logging: default
157
+ hydra/hydra_help: default
158
+ hydra/help: default
159
+ hydra/sweeper: basic
160
+ hydra/launcher: basic
161
+ hydra/output: default
162
+ verbose: false
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/hydra/overrides.yaml ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ - +exp=occ
2
+ - runner=debug
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/lora_text.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:402ee064d71b49e9b98f586a03197407685aa975abac0b10ecc3e2cd424570dd
3
+ size 12634373
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/tb-occ/events.out.tfevents.1745161677.cvrp-gpu-5.2144986.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97fca8d2dc7d80e10817b95cbff822e645a76304787ef6ceeddb40b3ab5c57a2
3
+ size 40
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/train.log ADDED
The diff for this file is too large to render. See raw diff
 
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/unet_occ/config.json ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModelOcc",
3
+ "_diffusers_version": "0.17.1",
4
+ "act_fn": "silu",
5
+ "addition_embed_type": null,
6
+ "addition_embed_type_num_heads": 64,
7
+ "attention_head_dim": 8,
8
+ "bbox_embedder_cls": "magicdrive.networks.bbox_embedder.ContinuousBBoxWithTextEmbedding",
9
+ "bbox_embedder_param": {
10
+ "class_token_dim": 1024,
11
+ "embedder_num_freq": 4,
12
+ "minmax_normalize": false,
13
+ "mode": "all-xyz",
14
+ "n_classes": 10,
15
+ "proj_dims": [
16
+ 1024,
17
+ 512,
18
+ 512,
19
+ 1024
20
+ ],
21
+ "trainable_class_token": false,
22
+ "use_text_encoder_init": true
23
+ },
24
+ "block_out_channels": [
25
+ 64,
26
+ 128,
27
+ 256,
28
+ 512
29
+ ],
30
+ "center_input_sample": false,
31
+ "class_embed_type": null,
32
+ "class_embeddings_concat": false,
33
+ "conditioning_embedding_out_channels": [
34
+ 16,
35
+ 32,
36
+ 96,
37
+ 256
38
+ ],
39
+ "conv_down": true,
40
+ "conv_in_kernel": 3,
41
+ "conv_out_kernel": 3,
42
+ "conv_up": true,
43
+ "cross_attention_dim": 1024,
44
+ "cross_attention_norm": null,
45
+ "down_block_types": [
46
+ "CrossAttnDownBlock2D",
47
+ "CrossAttnDownBlock2D",
48
+ "CrossAttnDownBlock2D",
49
+ "DownBlock2D"
50
+ ],
51
+ "downsample_padding": 1,
52
+ "drop_cond_ratio": 0.25,
53
+ "dual_cross_attention": false,
54
+ "encoder_hid_dim": null,
55
+ "encoder_hid_dim_type": null,
56
+ "flip_sin_to_cos": true,
57
+ "freq_shift": 0,
58
+ "in_channels": 16,
59
+ "is_rollout": true,
60
+ "layers_per_block": 2,
61
+ "map_embedder_cls": null,
62
+ "map_embedder_param": null,
63
+ "map_size_w_aux_box": [
64
+ 24,
65
+ 216,
66
+ 216
67
+ ],
68
+ "map_size_wo_aux_box": [
69
+ 16,
70
+ 216,
71
+ 216
72
+ ],
73
+ "map_with_aux_box": false,
74
+ "mid_block_only_cross_attention": null,
75
+ "mid_block_scale_factor": 1,
76
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
77
+ "norm_eps": 1e-05,
78
+ "norm_num_groups": 32,
79
+ "num_class_embeds": null,
80
+ "only_cross_attention": false,
81
+ "out_channels": 16,
82
+ "projection_class_embeddings_input_dim": null,
83
+ "resnet_out_scale_factor": 1.0,
84
+ "resnet_skip_time_act": false,
85
+ "resnet_time_scale_shift": "default",
86
+ "sample_size": 116,
87
+ "time_cond_proj_dim": null,
88
+ "time_embedding_act_fn": null,
89
+ "time_embedding_dim": null,
90
+ "time_embedding_type": "positional",
91
+ "timestep_post_act": null,
92
+ "tri_size": [
93
+ 100,
94
+ 100,
95
+ 16
96
+ ],
97
+ "tri_z_down": false,
98
+ "up_block_types": [
99
+ "UpBlock2D",
100
+ "CrossAttnUpBlock2D",
101
+ "CrossAttnUpBlock2D",
102
+ "CrossAttnUpBlock2D"
103
+ ],
104
+ "upcast_attention": false,
105
+ "use_linear_projection": false,
106
+ "use_uncond_map": "zero"
107
+ }
occ_rawbox_100_100_16_v3_hdmapv2_t5_epoch630/unet_occ/diffusion_pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c254bb79844033c32503a381c7648c27a480e17edd0a6b0b67c003110ffd6dd
3
+ size 1854967641