weleen committed on
Commit
5f61144
·
verified ·
1 Parent(s): 4bd1d93

Upload folder using huggingface_hub

Browse files
l10_4tasks/config.yaml ADDED
@@ -0,0 +1,523 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ callbacks:
2
+ rollout_lh:
3
+ tasks:
4
+ _target_: calvin_env.envs.tasks.Tasks
5
+ tasks:
6
+ rotate_red_block_right:
7
+ - rotate_object
8
+ - block_red
9
+ - -60
10
+ rotate_red_block_left:
11
+ - rotate_object
12
+ - block_red
13
+ - 60
14
+ rotate_blue_block_right:
15
+ - rotate_object
16
+ - block_blue
17
+ - -60
18
+ rotate_blue_block_left:
19
+ - rotate_object
20
+ - block_blue
21
+ - 60
22
+ rotate_pink_block_right:
23
+ - rotate_object
24
+ - block_pink
25
+ - -60
26
+ rotate_pink_block_left:
27
+ - rotate_object
28
+ - block_pink
29
+ - 60
30
+ push_red_block_right:
31
+ - push_object
32
+ - block_red
33
+ - 0.1
34
+ - 0
35
+ push_red_block_left:
36
+ - push_object
37
+ - block_red
38
+ - -0.1
39
+ - 0
40
+ push_blue_block_right:
41
+ - push_object
42
+ - block_blue
43
+ - 0.1
44
+ - 0
45
+ push_blue_block_left:
46
+ - push_object
47
+ - block_blue
48
+ - -0.1
49
+ - 0
50
+ push_pink_block_right:
51
+ - push_object
52
+ - block_pink
53
+ - 0.1
54
+ - 0
55
+ push_pink_block_left:
56
+ - push_object
57
+ - block_pink
58
+ - -0.1
59
+ - 0
60
+ move_slider_left:
61
+ - move_door_rel
62
+ - base__slide
63
+ - 0.15
64
+ move_slider_right:
65
+ - move_door_rel
66
+ - base__slide
67
+ - -0.15
68
+ open_drawer:
69
+ - move_door_rel
70
+ - base__drawer
71
+ - 0.12
72
+ close_drawer:
73
+ - move_door_rel
74
+ - base__drawer
75
+ - -0.12
76
+ lift_red_block_table:
77
+ - lift_object
78
+ - block_red
79
+ - 0.05
80
+ - table
81
+ - base_link
82
+ lift_red_block_slider:
83
+ - lift_object
84
+ - block_red
85
+ - 0.03
86
+ - table
87
+ - plank_link
88
+ lift_red_block_drawer:
89
+ - lift_object
90
+ - block_red
91
+ - 0.05
92
+ - table
93
+ - drawer_link
94
+ lift_blue_block_table:
95
+ - lift_object
96
+ - block_blue
97
+ - 0.05
98
+ - table
99
+ - base_link
100
+ lift_blue_block_slider:
101
+ - lift_object
102
+ - block_blue
103
+ - 0.03
104
+ - table
105
+ - plank_link
106
+ lift_blue_block_drawer:
107
+ - lift_object
108
+ - block_blue
109
+ - 0.05
110
+ - table
111
+ - drawer_link
112
+ lift_pink_block_table:
113
+ - lift_object
114
+ - block_pink
115
+ - 0.05
116
+ - table
117
+ - base_link
118
+ lift_pink_block_slider:
119
+ - lift_object
120
+ - block_pink
121
+ - 0.03
122
+ - table
123
+ - plank_link
124
+ lift_pink_block_drawer:
125
+ - lift_object
126
+ - block_pink
127
+ - 0.05
128
+ - table
129
+ - drawer_link
130
+ place_in_slider:
131
+ - place_object
132
+ - table
133
+ - plank_link
134
+ place_in_drawer:
135
+ - place_object
136
+ - table
137
+ - drawer_link
138
+ stack_block:
139
+ - stack_objects
140
+ unstack_block:
141
+ - unstack_objects
142
+ turn_on_lightbulb:
143
+ - toggle_light
144
+ - lightbulb
145
+ - 0
146
+ - 1
147
+ turn_off_lightbulb:
148
+ - toggle_light
149
+ - lightbulb
150
+ - 1
151
+ - 0
152
+ turn_on_led:
153
+ - toggle_light
154
+ - led
155
+ - 0
156
+ - 1
157
+ turn_off_led:
158
+ - toggle_light
159
+ - led
160
+ - 1
161
+ - 0
162
+ push_into_drawer:
163
+ - push_object_into
164
+ - - block_red
165
+ - block_blue
166
+ - block_pink
167
+ - table
168
+ - base_link
169
+ - table
170
+ - drawer_link
171
+ val_annotations:
172
+ rotate_red_block_right:
173
+ - take the red block and rotate it to the right
174
+ rotate_red_block_left:
175
+ - take the red block and rotate it to the left
176
+ rotate_blue_block_right:
177
+ - take the blue block and rotate it to the right
178
+ rotate_blue_block_left:
179
+ - take the blue block and rotate it to the left
180
+ rotate_pink_block_right:
181
+ - take the pink block and rotate it to the right
182
+ rotate_pink_block_left:
183
+ - take the pink block and rotate it to the left
184
+ push_red_block_right:
185
+ - go push the red block right
186
+ push_red_block_left:
187
+ - go push the red block left
188
+ push_blue_block_right:
189
+ - go push the blue block right
190
+ push_blue_block_left:
191
+ - go push the blue block left
192
+ push_pink_block_right:
193
+ - go push the pink block right
194
+ push_pink_block_left:
195
+ - go push the pink block left
196
+ move_slider_left:
197
+ - push the sliding door to the left side
198
+ move_slider_right:
199
+ - push the sliding door to the right side
200
+ open_drawer:
201
+ - pull the handle to open the drawer
202
+ close_drawer:
203
+ - push the handle to close the drawer
204
+ lift_red_block_table:
205
+ - grasp and lift the red block
206
+ lift_blue_block_table:
207
+ - grasp and lift the blue block
208
+ lift_pink_block_table:
209
+ - grasp and lift the pink block
210
+ lift_red_block_slider:
211
+ - lift the red block from the sliding cabinet
212
+ lift_blue_block_slider:
213
+ - lift the blue block from the sliding cabinet
214
+ lift_pink_block_slider:
215
+ - lift the pink block from the sliding cabinet
216
+ lift_red_block_drawer:
217
+ - Take the red block from the drawer
218
+ lift_blue_block_drawer:
219
+ - Take the blue block from the drawer
220
+ lift_pink_block_drawer:
221
+ - Take the pink block from the drawer
222
+ place_in_slider:
223
+ - store the grasped block in the sliding cabinet
224
+ place_in_drawer:
225
+ - store the grasped block in the drawer
226
+ push_into_drawer:
227
+ - slide the block that it falls into the drawer
228
+ stack_block:
229
+ - stack the grasped block
230
+ unstack_block:
231
+ - remove the stacked block
232
+ turn_on_lightbulb:
233
+ - use the switch to turn on the light bulb
234
+ turn_off_lightbulb:
235
+ - use the switch to turn off the light bulb
236
+ turn_on_led:
237
+ - press the button to turn on the led light
238
+ turn_off_led:
239
+ - press the button to turn off the led light
240
+ _target_: mode.rollout.rollout_long_horizon.RolloutLongHorizon
241
+ _recursive_: false
242
+ env_cfg:
243
+ _target_: mode.wrappers.hulc_wrapper.HulcWrapper
244
+ skip_epochs: ${rollout_lh_skip_epochs}
245
+ rollout_freq: 5
246
+ num_videos: 0
247
+ num_sequences: 1000
248
+ replan_freq: 30
249
+ ep_len: 360
250
+ empty_cache: false
251
+ log_video_to_file: false
252
+ save_dir: ./videos
253
+ lang_folder: ${lang_folder}
254
+ debug: false
255
+ ema:
256
+ _target_: mode.callbacks.ema.EMA
257
+ decay: 0.999
258
+ start_step: 0
259
+ save_ema_weights_in_callback_state: true
260
+ evaluate_ema_weights_instead: true
261
+ power: 0.6666666666666666
262
+ inv_gamma: 1.0
263
+ min_value: 0.0
264
+ max_value: 0.9999
265
+ checkpoint:
266
+ _target_: pytorch_lightning.callbacks.ModelCheckpoint
267
+ verbose: true
268
+ dirpath: saved_models
269
+ filename: '{epoch:02d}'
270
+ every_n_epochs: ${callbacks.rollout_lh.rollout_freq}
271
+ datamodule:
272
+ transforms:
273
+ train:
274
+ rgb_static:
275
+ - _target_: torchvision.transforms.Resize
276
+ size: 224
277
+ antialias: true
278
+ - _target_: mode.utils.transforms.RandomShiftsAug
279
+ pad: 10
280
+ - _target_: mode.utils.transforms.ScaleImageTensor
281
+ - _target_: torchvision.transforms.Normalize
282
+ mean:
283
+ - 0.48145466
284
+ - 0.4578275
285
+ - 0.40821073
286
+ std:
287
+ - 0.26862954
288
+ - 0.26130258
289
+ - 0.27577711
290
+ rgb_gripper:
291
+ - _target_: torchvision.transforms.Resize
292
+ size: 224
293
+ antialias: true
294
+ - _target_: mode.utils.transforms.RandomShiftsAug
295
+ pad: 4
296
+ - _target_: mode.utils.transforms.ScaleImageTensor
297
+ - _target_: torchvision.transforms.Normalize
298
+ mean:
299
+ - 0.48145466
300
+ - 0.4578275
301
+ - 0.40821073
302
+ std:
303
+ - 0.26862954
304
+ - 0.26130258
305
+ - 0.27577711
306
+ robot_obs:
307
+ - _target_: mode.utils.transforms.NormalizeVector
308
+ scene_obs:
309
+ - _target_: mode.utils.transforms.NormalizeVector
310
+ val:
311
+ rgb_static:
312
+ - _target_: torchvision.transforms.Resize
313
+ size: 224
314
+ antialias: true
315
+ - _target_: mode.utils.transforms.ScaleImageTensor
316
+ - _target_: torchvision.transforms.Normalize
317
+ mean:
318
+ - 0.48145466
319
+ - 0.4578275
320
+ - 0.40821073
321
+ std:
322
+ - 0.26862954
323
+ - 0.26130258
324
+ - 0.27577711
325
+ rgb_gripper:
326
+ - _target_: torchvision.transforms.Resize
327
+ size: 224
328
+ antialias: true
329
+ - _target_: mode.utils.transforms.ScaleImageTensor
330
+ - _target_: torchvision.transforms.Normalize
331
+ mean:
332
+ - 0.48145466
333
+ - 0.4578275
334
+ - 0.40821073
335
+ std:
336
+ - 0.26862954
337
+ - 0.26130258
338
+ - 0.27577711
339
+ robot_obs:
340
+ - _target_: mode.utils.transforms.NormalizeVector
341
+ scene_obs:
342
+ - _target_: mode.utils.transforms.NormalizeVector
343
+ _target_: mode.datasets.hulc_data_module.HulcDataModule
344
+ _recursive_: false
345
+ root_data_dir: ${root_data_dir}
346
+ action_space: 7
347
+ action_max:
348
+ - 1.0
349
+ - 1.0
350
+ - 1.0
351
+ - 1.0
352
+ - 1.0
353
+ - 1.0
354
+ - 1.0
355
+ action_min:
356
+ - -1.0
357
+ - -1.0
358
+ - -1.0
359
+ - -1.0
360
+ - -1.0
361
+ - -1.0
362
+ - -1
363
+ shuffle_val: false
364
+ observation_space:
365
+ rgb_obs:
366
+ - rgb_static
367
+ - rgb_gripper
368
+ depth_obs: []
369
+ state_obs:
370
+ - robot_obs
371
+ actions:
372
+ - rel_actions
373
+ language:
374
+ - language
375
+ proprioception_dims:
376
+ n_state_obs: 8
377
+ keep_indices:
378
+ - - 0
379
+ - 7
380
+ - - 14
381
+ - 15
382
+ robot_orientation_idx:
383
+ - 3
384
+ - 6
385
+ normalize: true
386
+ normalize_robot_orientation: true
387
+ datasets:
388
+ lang_dataset:
389
+ _target_: mode.datasets.disk_dataset.ExtendedDiskDataset
390
+ key: lang
391
+ save_format: npz
392
+ batch_size: ${batch_size}
393
+ min_window_size: ${act_seq_len}
394
+ max_window_size: ${act_seq_len}
395
+ proprio_state: ${datamodule.proprioception_dims}
396
+ obs_space: ${datamodule.observation_space}
397
+ skip_frames: 1
398
+ pad: false
399
+ lang_folder: ${lang_folder}
400
+ aux_lang_loss_window: 8
401
+ num_workers: ${num_workers}
402
+ action_seq_len: ${act_seq_len}
403
+ obs_seq_len: ${obs_seq_len}
404
+ future_range: 1
405
+ use_extracted_rel_actions: ${use_extracted_rel_actions}
406
+ model:
407
+ _target_: mode.models.mode_agent.MoDEAgent
408
+ _recursive_: false
409
+ multistep: ${multistep}
410
+ use_lr_scheduler: true
411
+ entropy_gamma: 0.01
412
+ router_z_delta: 0.0
413
+ use_proprio: false
414
+ seed: ${seed}
415
+ sampler_type: ddim
416
+ num_sampling_steps: 10
417
+ sigma_data: 0.5
418
+ sigma_min: 0.001
419
+ sigma_max: 80
420
+ noise_scheduler: exponential
421
+ sigma_sample_density_type: loglogistic
422
+ ckpt_path: /home/yiming/pretrained_models/MoDE/MoDE_Pretrained
423
+ start_from_pretrained: true
424
+ act_window_size: ${act_seq_len}
425
+ latent_dim: 1024
426
+ obs_enc_dim: ${obs_dim}
427
+ cond_dim: 512
428
+ resnet_type: '50'
429
+ optimizer:
430
+ _target_: torch.optim.AdamW
431
+ transformer_weight_decay: 0.05
432
+ obs_encoder_weight_decay: 0.05
433
+ learning_rate: 0.0001
434
+ betas:
435
+ - 0.9
436
+ - 0.95
437
+ lr_scheduler:
438
+ lr_scheduler:
439
+ init_lr: 0.0001
440
+ init_lr_scale: 0.1
441
+ final_lr_scale: 1.0e-06
442
+ total_steps: 45000
443
+ phase_ratio: (0.02, 0.08, 0.9)
444
+ lr: 0.0001
445
+ model:
446
+ _target_: mode.models.edm_diffusion.score_wrappers.GCDenoiser
447
+ _recursive_: false
448
+ sigma_data: ${model.sigma_data}
449
+ inner_model:
450
+ _target_: mode.models.networks.modedit.MoDeDiT
451
+ action_dim: ${datamodule.action_space}
452
+ goal_dim: ${model.cond_dim}
453
+ obs_dim: 2048
454
+ goal_conditioned: true
455
+ causal: true
456
+ use_custom_attn_mask: false
457
+ use_proprio: ${model.use_proprio}
458
+ state_dim: ${proprio_dims}
459
+ embed_dim: ${model.latent_dim}
460
+ n_layers: 10
461
+ goal_seq_len: 1
462
+ obs_seq_len: ${obs_seq_len}
463
+ action_seq_len: ${act_seq_len}
464
+ embed_pdrob: 0
465
+ goal_drop: 0.1
466
+ attn_pdrop: 0.3
467
+ mlp_pdrop: 0.1
468
+ n_heads: 8
469
+ device: ${device}
470
+ linear_output: true
471
+ cond_router: true
472
+ num_experts: 4
473
+ top_k: 2
474
+ router_normalize: true
475
+ use_goal_in_routing: false
476
+ use_argmax: false
477
+ use_shared_expert: false
478
+ use_noise_token_as_input: true
479
+ init_style: olmoe
480
+ language_goal:
481
+ _target_: mode.models.networks.clip_lang_encoder.LangClip
482
+ _recursive_: false
483
+ model_name: ${clip_lang_model_name}
484
+ root_data_dir: data/lebai
485
+ lang_folder: lang_clip_resnet50
486
+ vis_clip_model_name: ViT-B/16
487
+ clip_lang_model_name: ViT-B/32
488
+ log_dir: ./logs
489
+ slurm: false
490
+ seed: 421
491
+ device: cuda
492
+ batch_size: 64
493
+ devices: 4
494
+ act_dim: 7
495
+ proprio_dims: 7
496
+ obs_dim: 512
497
+ goal_dim: 512
498
+ obs_seq_len: 1
499
+ act_seq_len: 32
500
+ multistep: 32
501
+ p_last_state: 0
502
+ gen_img_res: 112
503
+ max_epochs: 100
504
+ rollout_lh_skip_epochs: 9
505
+ num_workers: 12
506
+ benchmark_name: lebai_mode
507
+ use_extracted_rel_actions: true
508
+ trainer:
509
+ devices: ${devices}
510
+ precision: bf16
511
+ max_epochs: ${max_epochs}
512
+ sync_batchnorm: true
513
+ accelerator: gpu
514
+ strategy: ddp
515
+ logger:
516
+ _target_: pytorch_lightning.loggers.WandbLogger
517
+ save_dir: .
518
+ name: logger
519
+ group: mode
520
+ log_model: false
521
+ project: ${benchmark_name}
522
+ entity: yimingwu0
523
+ id: ???
l10_4tasks/model_cleaned.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:202a4f0edcff5ea0733939d018dc7edd587862a0dcfc37f3b2384b176b08d271
3
+ size 3115403448
l10_ds1_only/config.yaml ADDED
@@ -0,0 +1,523 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ callbacks:
2
+ rollout_lh:
3
+ tasks:
4
+ _target_: calvin_env.envs.tasks.Tasks
5
+ tasks:
6
+ rotate_red_block_right:
7
+ - rotate_object
8
+ - block_red
9
+ - -60
10
+ rotate_red_block_left:
11
+ - rotate_object
12
+ - block_red
13
+ - 60
14
+ rotate_blue_block_right:
15
+ - rotate_object
16
+ - block_blue
17
+ - -60
18
+ rotate_blue_block_left:
19
+ - rotate_object
20
+ - block_blue
21
+ - 60
22
+ rotate_pink_block_right:
23
+ - rotate_object
24
+ - block_pink
25
+ - -60
26
+ rotate_pink_block_left:
27
+ - rotate_object
28
+ - block_pink
29
+ - 60
30
+ push_red_block_right:
31
+ - push_object
32
+ - block_red
33
+ - 0.1
34
+ - 0
35
+ push_red_block_left:
36
+ - push_object
37
+ - block_red
38
+ - -0.1
39
+ - 0
40
+ push_blue_block_right:
41
+ - push_object
42
+ - block_blue
43
+ - 0.1
44
+ - 0
45
+ push_blue_block_left:
46
+ - push_object
47
+ - block_blue
48
+ - -0.1
49
+ - 0
50
+ push_pink_block_right:
51
+ - push_object
52
+ - block_pink
53
+ - 0.1
54
+ - 0
55
+ push_pink_block_left:
56
+ - push_object
57
+ - block_pink
58
+ - -0.1
59
+ - 0
60
+ move_slider_left:
61
+ - move_door_rel
62
+ - base__slide
63
+ - 0.15
64
+ move_slider_right:
65
+ - move_door_rel
66
+ - base__slide
67
+ - -0.15
68
+ open_drawer:
69
+ - move_door_rel
70
+ - base__drawer
71
+ - 0.12
72
+ close_drawer:
73
+ - move_door_rel
74
+ - base__drawer
75
+ - -0.12
76
+ lift_red_block_table:
77
+ - lift_object
78
+ - block_red
79
+ - 0.05
80
+ - table
81
+ - base_link
82
+ lift_red_block_slider:
83
+ - lift_object
84
+ - block_red
85
+ - 0.03
86
+ - table
87
+ - plank_link
88
+ lift_red_block_drawer:
89
+ - lift_object
90
+ - block_red
91
+ - 0.05
92
+ - table
93
+ - drawer_link
94
+ lift_blue_block_table:
95
+ - lift_object
96
+ - block_blue
97
+ - 0.05
98
+ - table
99
+ - base_link
100
+ lift_blue_block_slider:
101
+ - lift_object
102
+ - block_blue
103
+ - 0.03
104
+ - table
105
+ - plank_link
106
+ lift_blue_block_drawer:
107
+ - lift_object
108
+ - block_blue
109
+ - 0.05
110
+ - table
111
+ - drawer_link
112
+ lift_pink_block_table:
113
+ - lift_object
114
+ - block_pink
115
+ - 0.05
116
+ - table
117
+ - base_link
118
+ lift_pink_block_slider:
119
+ - lift_object
120
+ - block_pink
121
+ - 0.03
122
+ - table
123
+ - plank_link
124
+ lift_pink_block_drawer:
125
+ - lift_object
126
+ - block_pink
127
+ - 0.05
128
+ - table
129
+ - drawer_link
130
+ place_in_slider:
131
+ - place_object
132
+ - table
133
+ - plank_link
134
+ place_in_drawer:
135
+ - place_object
136
+ - table
137
+ - drawer_link
138
+ stack_block:
139
+ - stack_objects
140
+ unstack_block:
141
+ - unstack_objects
142
+ turn_on_lightbulb:
143
+ - toggle_light
144
+ - lightbulb
145
+ - 0
146
+ - 1
147
+ turn_off_lightbulb:
148
+ - toggle_light
149
+ - lightbulb
150
+ - 1
151
+ - 0
152
+ turn_on_led:
153
+ - toggle_light
154
+ - led
155
+ - 0
156
+ - 1
157
+ turn_off_led:
158
+ - toggle_light
159
+ - led
160
+ - 1
161
+ - 0
162
+ push_into_drawer:
163
+ - push_object_into
164
+ - - block_red
165
+ - block_blue
166
+ - block_pink
167
+ - table
168
+ - base_link
169
+ - table
170
+ - drawer_link
171
+ val_annotations:
172
+ rotate_red_block_right:
173
+ - take the red block and rotate it to the right
174
+ rotate_red_block_left:
175
+ - take the red block and rotate it to the left
176
+ rotate_blue_block_right:
177
+ - take the blue block and rotate it to the right
178
+ rotate_blue_block_left:
179
+ - take the blue block and rotate it to the left
180
+ rotate_pink_block_right:
181
+ - take the pink block and rotate it to the right
182
+ rotate_pink_block_left:
183
+ - take the pink block and rotate it to the left
184
+ push_red_block_right:
185
+ - go push the red block right
186
+ push_red_block_left:
187
+ - go push the red block left
188
+ push_blue_block_right:
189
+ - go push the blue block right
190
+ push_blue_block_left:
191
+ - go push the blue block left
192
+ push_pink_block_right:
193
+ - go push the pink block right
194
+ push_pink_block_left:
195
+ - go push the pink block left
196
+ move_slider_left:
197
+ - push the sliding door to the left side
198
+ move_slider_right:
199
+ - push the sliding door to the right side
200
+ open_drawer:
201
+ - pull the handle to open the drawer
202
+ close_drawer:
203
+ - push the handle to close the drawer
204
+ lift_red_block_table:
205
+ - grasp and lift the red block
206
+ lift_blue_block_table:
207
+ - grasp and lift the blue block
208
+ lift_pink_block_table:
209
+ - grasp and lift the pink block
210
+ lift_red_block_slider:
211
+ - lift the red block from the sliding cabinet
212
+ lift_blue_block_slider:
213
+ - lift the blue block from the sliding cabinet
214
+ lift_pink_block_slider:
215
+ - lift the pink block from the sliding cabinet
216
+ lift_red_block_drawer:
217
+ - Take the red block from the drawer
218
+ lift_blue_block_drawer:
219
+ - Take the blue block from the drawer
220
+ lift_pink_block_drawer:
221
+ - Take the pink block from the drawer
222
+ place_in_slider:
223
+ - store the grasped block in the sliding cabinet
224
+ place_in_drawer:
225
+ - store the grasped block in the drawer
226
+ push_into_drawer:
227
+ - slide the block that it falls into the drawer
228
+ stack_block:
229
+ - stack the grasped block
230
+ unstack_block:
231
+ - remove the stacked block
232
+ turn_on_lightbulb:
233
+ - use the switch to turn on the light bulb
234
+ turn_off_lightbulb:
235
+ - use the switch to turn off the light bulb
236
+ turn_on_led:
237
+ - press the button to turn on the led light
238
+ turn_off_led:
239
+ - press the button to turn off the led light
240
+ _target_: mode.rollout.rollout_long_horizon.RolloutLongHorizon
241
+ _recursive_: false
242
+ env_cfg:
243
+ _target_: mode.wrappers.hulc_wrapper.HulcWrapper
244
+ skip_epochs: ${rollout_lh_skip_epochs}
245
+ rollout_freq: 5
246
+ num_videos: 0
247
+ num_sequences: 1000
248
+ replan_freq: 30
249
+ ep_len: 360
250
+ empty_cache: false
251
+ log_video_to_file: false
252
+ save_dir: ./videos
253
+ lang_folder: ${lang_folder}
254
+ debug: false
255
+ ema:
256
+ _target_: mode.callbacks.ema.EMA
257
+ decay: 0.999
258
+ start_step: 0
259
+ save_ema_weights_in_callback_state: true
260
+ evaluate_ema_weights_instead: true
261
+ power: 0.6666666666666666
262
+ inv_gamma: 1.0
263
+ min_value: 0.0
264
+ max_value: 0.9999
265
+ checkpoint:
266
+ _target_: pytorch_lightning.callbacks.ModelCheckpoint
267
+ verbose: true
268
+ dirpath: saved_models
269
+ filename: '{epoch:02d}'
270
+ every_n_epochs: ${callbacks.rollout_lh.rollout_freq}
271
+ datamodule:
272
+ transforms:
273
+ train:
274
+ rgb_static:
275
+ - _target_: torchvision.transforms.Resize
276
+ size: 224
277
+ antialias: true
278
+ - _target_: mode.utils.transforms.RandomShiftsAug
279
+ pad: 10
280
+ - _target_: mode.utils.transforms.ScaleImageTensor
281
+ - _target_: torchvision.transforms.Normalize
282
+ mean:
283
+ - 0.48145466
284
+ - 0.4578275
285
+ - 0.40821073
286
+ std:
287
+ - 0.26862954
288
+ - 0.26130258
289
+ - 0.27577711
290
+ rgb_gripper:
291
+ - _target_: torchvision.transforms.Resize
292
+ size: 224
293
+ antialias: true
294
+ - _target_: mode.utils.transforms.RandomShiftsAug
295
+ pad: 4
296
+ - _target_: mode.utils.transforms.ScaleImageTensor
297
+ - _target_: torchvision.transforms.Normalize
298
+ mean:
299
+ - 0.48145466
300
+ - 0.4578275
301
+ - 0.40821073
302
+ std:
303
+ - 0.26862954
304
+ - 0.26130258
305
+ - 0.27577711
306
+ robot_obs:
307
+ - _target_: mode.utils.transforms.NormalizeVector
308
+ scene_obs:
309
+ - _target_: mode.utils.transforms.NormalizeVector
310
+ val:
311
+ rgb_static:
312
+ - _target_: torchvision.transforms.Resize
313
+ size: 224
314
+ antialias: true
315
+ - _target_: mode.utils.transforms.ScaleImageTensor
316
+ - _target_: torchvision.transforms.Normalize
317
+ mean:
318
+ - 0.48145466
319
+ - 0.4578275
320
+ - 0.40821073
321
+ std:
322
+ - 0.26862954
323
+ - 0.26130258
324
+ - 0.27577711
325
+ rgb_gripper:
326
+ - _target_: torchvision.transforms.Resize
327
+ size: 224
328
+ antialias: true
329
+ - _target_: mode.utils.transforms.ScaleImageTensor
330
+ - _target_: torchvision.transforms.Normalize
331
+ mean:
332
+ - 0.48145466
333
+ - 0.4578275
334
+ - 0.40821073
335
+ std:
336
+ - 0.26862954
337
+ - 0.26130258
338
+ - 0.27577711
339
+ robot_obs:
340
+ - _target_: mode.utils.transforms.NormalizeVector
341
+ scene_obs:
342
+ - _target_: mode.utils.transforms.NormalizeVector
343
+ _target_: mode.datasets.hulc_data_module.HulcDataModule
344
+ _recursive_: false
345
+ root_data_dir: ${root_data_dir}
346
+ action_space: 7
347
+ action_max:
348
+ - 1.0
349
+ - 1.0
350
+ - 1.0
351
+ - 1.0
352
+ - 1.0
353
+ - 1.0
354
+ - 1.0
355
+ action_min:
356
+ - -1.0
357
+ - -1.0
358
+ - -1.0
359
+ - -1.0
360
+ - -1.0
361
+ - -1.0
362
+ - -1
363
+ shuffle_val: false
364
+ observation_space:
365
+ rgb_obs:
366
+ - rgb_static
367
+ - rgb_gripper
368
+ depth_obs: []
369
+ state_obs:
370
+ - robot_obs
371
+ actions:
372
+ - rel_actions
373
+ language:
374
+ - language
375
+ proprioception_dims:
376
+ n_state_obs: 8
377
+ keep_indices:
378
+ - - 0
379
+ - 7
380
+ - - 14
381
+ - 15
382
+ robot_orientation_idx:
383
+ - 3
384
+ - 6
385
+ normalize: true
386
+ normalize_robot_orientation: true
387
+ datasets:
388
+ lang_dataset:
389
+ _target_: mode.datasets.disk_dataset.ExtendedDiskDataset
390
+ key: lang
391
+ save_format: npz
392
+ batch_size: ${batch_size}
393
+ min_window_size: ${act_seq_len}
394
+ max_window_size: ${act_seq_len}
395
+ proprio_state: ${datamodule.proprioception_dims}
396
+ obs_space: ${datamodule.observation_space}
397
+ skip_frames: 1
398
+ pad: false
399
+ lang_folder: ${lang_folder}
400
+ aux_lang_loss_window: 8
401
+ num_workers: ${num_workers}
402
+ action_seq_len: ${act_seq_len}
403
+ obs_seq_len: ${obs_seq_len}
404
+ future_range: 1
405
+ use_extracted_rel_actions: ${use_extracted_rel_actions}
406
+ model:
407
+ _target_: mode.models.mode_agent.MoDEAgent
408
+ _recursive_: false
409
+ multistep: ${multistep}
410
+ use_lr_scheduler: true
411
+ entropy_gamma: 0.01
412
+ router_z_delta: 0.0
413
+ use_proprio: false
414
+ seed: ${seed}
415
+ sampler_type: ddim
416
+ num_sampling_steps: 10
417
+ sigma_data: 0.5
418
+ sigma_min: 0.001
419
+ sigma_max: 80
420
+ noise_scheduler: exponential
421
+ sigma_sample_density_type: loglogistic
422
+ ckpt_path: /home/yiming/pretrained_models/MoDE/MoDE_Pretrained
423
+ start_from_pretrained: true
424
+ act_window_size: ${act_seq_len}
425
+ latent_dim: 1024
426
+ obs_enc_dim: ${obs_dim}
427
+ cond_dim: 512
428
+ resnet_type: '50'
429
+ optimizer:
430
+ _target_: torch.optim.AdamW
431
+ transformer_weight_decay: 0.05
432
+ obs_encoder_weight_decay: 0.05
433
+ learning_rate: 0.0001
434
+ betas:
435
+ - 0.9
436
+ - 0.95
437
+ lr_scheduler:
438
+ lr_scheduler:
439
+ init_lr: 0.0001
440
+ init_lr_scale: 0.1
441
+ final_lr_scale: 1.0e-06
442
+ total_steps: 45000
443
+ phase_ratio: (0.02, 0.08, 0.9)
444
+ lr: 0.0001
445
+ model:
446
+ _target_: mode.models.edm_diffusion.score_wrappers.GCDenoiser
447
+ _recursive_: false
448
+ sigma_data: ${model.sigma_data}
449
+ inner_model:
450
+ _target_: mode.models.networks.modedit.MoDeDiT
451
+ action_dim: ${datamodule.action_space}
452
+ goal_dim: ${model.cond_dim}
453
+ obs_dim: 2048
454
+ goal_conditioned: true
455
+ causal: true
456
+ use_custom_attn_mask: false
457
+ use_proprio: ${model.use_proprio}
458
+ state_dim: ${proprio_dims}
459
+ embed_dim: ${model.latent_dim}
460
+ n_layers: 10
461
+ goal_seq_len: 1
462
+ obs_seq_len: ${obs_seq_len}
463
+ action_seq_len: ${act_seq_len}
464
+ embed_pdrob: 0
465
+ goal_drop: 0.1
466
+ attn_pdrop: 0.3
467
+ mlp_pdrop: 0.1
468
+ n_heads: 8
469
+ device: ${device}
470
+ linear_output: true
471
+ cond_router: true
472
+ num_experts: 4
473
+ top_k: 2
474
+ router_normalize: true
475
+ use_goal_in_routing: false
476
+ use_argmax: false
477
+ use_shared_expert: false
478
+ use_noise_token_as_input: true
479
+ init_style: olmoe
480
+ language_goal:
481
+ _target_: mode.models.networks.clip_lang_encoder.LangClip
482
+ _recursive_: false
483
+ model_name: ${clip_lang_model_name}
484
+ root_data_dir: data/lebai
485
+ lang_folder: lang_clip_resnet50
486
+ vis_clip_model_name: ViT-B/16
487
+ clip_lang_model_name: ViT-B/32
488
+ log_dir: ./logs
489
+ slurm: false
490
+ seed: 421
491
+ device: cuda
492
+ batch_size: 64
493
+ devices: 4
494
+ act_dim: 7
495
+ proprio_dims: 7
496
+ obs_dim: 512
497
+ goal_dim: 512
498
+ obs_seq_len: 1
499
+ act_seq_len: 32
500
+ multistep: 32
501
+ p_last_state: 0
502
+ gen_img_res: 112
503
+ max_epochs: 200
504
+ rollout_lh_skip_epochs: 9
505
+ num_workers: 12
506
+ benchmark_name: lebai_mode
507
+ use_extracted_rel_actions: true
508
+ trainer:
509
+ devices: ${devices}
510
+ precision: bf16
511
+ max_epochs: ${max_epochs}
512
+ sync_batchnorm: true
513
+ accelerator: gpu
514
+ strategy: ddp
515
+ logger:
516
+ _target_: pytorch_lightning.loggers.WandbLogger
517
+ save_dir: .
518
+ name: logger
519
+ group: mode
520
+ log_model: false
521
+ project: ${benchmark_name}
522
+ entity: yimingwu0
523
+ id: ???
l10_ds1_only/model_cleaned.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a54ed8b02ac954e16a881ed7ab9aca568f551c7fc03e54f178e355c3a74d2e0a
3
+ size 3115403448
l10_ds2_only/config.yaml ADDED
@@ -0,0 +1,523 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ callbacks:
2
+ rollout_lh:
3
+ tasks:
4
+ _target_: calvin_env.envs.tasks.Tasks
5
+ tasks:
6
+ rotate_red_block_right:
7
+ - rotate_object
8
+ - block_red
9
+ - -60
10
+ rotate_red_block_left:
11
+ - rotate_object
12
+ - block_red
13
+ - 60
14
+ rotate_blue_block_right:
15
+ - rotate_object
16
+ - block_blue
17
+ - -60
18
+ rotate_blue_block_left:
19
+ - rotate_object
20
+ - block_blue
21
+ - 60
22
+ rotate_pink_block_right:
23
+ - rotate_object
24
+ - block_pink
25
+ - -60
26
+ rotate_pink_block_left:
27
+ - rotate_object
28
+ - block_pink
29
+ - 60
30
+ push_red_block_right:
31
+ - push_object
32
+ - block_red
33
+ - 0.1
34
+ - 0
35
+ push_red_block_left:
36
+ - push_object
37
+ - block_red
38
+ - -0.1
39
+ - 0
40
+ push_blue_block_right:
41
+ - push_object
42
+ - block_blue
43
+ - 0.1
44
+ - 0
45
+ push_blue_block_left:
46
+ - push_object
47
+ - block_blue
48
+ - -0.1
49
+ - 0
50
+ push_pink_block_right:
51
+ - push_object
52
+ - block_pink
53
+ - 0.1
54
+ - 0
55
+ push_pink_block_left:
56
+ - push_object
57
+ - block_pink
58
+ - -0.1
59
+ - 0
60
+ move_slider_left:
61
+ - move_door_rel
62
+ - base__slide
63
+ - 0.15
64
+ move_slider_right:
65
+ - move_door_rel
66
+ - base__slide
67
+ - -0.15
68
+ open_drawer:
69
+ - move_door_rel
70
+ - base__drawer
71
+ - 0.12
72
+ close_drawer:
73
+ - move_door_rel
74
+ - base__drawer
75
+ - -0.12
76
+ lift_red_block_table:
77
+ - lift_object
78
+ - block_red
79
+ - 0.05
80
+ - table
81
+ - base_link
82
+ lift_red_block_slider:
83
+ - lift_object
84
+ - block_red
85
+ - 0.03
86
+ - table
87
+ - plank_link
88
+ lift_red_block_drawer:
89
+ - lift_object
90
+ - block_red
91
+ - 0.05
92
+ - table
93
+ - drawer_link
94
+ lift_blue_block_table:
95
+ - lift_object
96
+ - block_blue
97
+ - 0.05
98
+ - table
99
+ - base_link
100
+ lift_blue_block_slider:
101
+ - lift_object
102
+ - block_blue
103
+ - 0.03
104
+ - table
105
+ - plank_link
106
+ lift_blue_block_drawer:
107
+ - lift_object
108
+ - block_blue
109
+ - 0.05
110
+ - table
111
+ - drawer_link
112
+ lift_pink_block_table:
113
+ - lift_object
114
+ - block_pink
115
+ - 0.05
116
+ - table
117
+ - base_link
118
+ lift_pink_block_slider:
119
+ - lift_object
120
+ - block_pink
121
+ - 0.03
122
+ - table
123
+ - plank_link
124
+ lift_pink_block_drawer:
125
+ - lift_object
126
+ - block_pink
127
+ - 0.05
128
+ - table
129
+ - drawer_link
130
+ place_in_slider:
131
+ - place_object
132
+ - table
133
+ - plank_link
134
+ place_in_drawer:
135
+ - place_object
136
+ - table
137
+ - drawer_link
138
+ stack_block:
139
+ - stack_objects
140
+ unstack_block:
141
+ - unstack_objects
142
+ turn_on_lightbulb:
143
+ - toggle_light
144
+ - lightbulb
145
+ - 0
146
+ - 1
147
+ turn_off_lightbulb:
148
+ - toggle_light
149
+ - lightbulb
150
+ - 1
151
+ - 0
152
+ turn_on_led:
153
+ - toggle_light
154
+ - led
155
+ - 0
156
+ - 1
157
+ turn_off_led:
158
+ - toggle_light
159
+ - led
160
+ - 1
161
+ - 0
162
+ push_into_drawer:
163
+ - push_object_into
164
+ - - block_red
165
+ - block_blue
166
+ - block_pink
167
+ - table
168
+ - base_link
169
+ - table
170
+ - drawer_link
171
+ val_annotations:
172
+ rotate_red_block_right:
173
+ - take the red block and rotate it to the right
174
+ rotate_red_block_left:
175
+ - take the red block and rotate it to the left
176
+ rotate_blue_block_right:
177
+ - take the blue block and rotate it to the right
178
+ rotate_blue_block_left:
179
+ - take the blue block and rotate it to the left
180
+ rotate_pink_block_right:
181
+ - take the pink block and rotate it to the right
182
+ rotate_pink_block_left:
183
+ - take the pink block and rotate it to the left
184
+ push_red_block_right:
185
+ - go push the red block right
186
+ push_red_block_left:
187
+ - go push the red block left
188
+ push_blue_block_right:
189
+ - go push the blue block right
190
+ push_blue_block_left:
191
+ - go push the blue block left
192
+ push_pink_block_right:
193
+ - go push the pink block right
194
+ push_pink_block_left:
195
+ - go push the pink block left
196
+ move_slider_left:
197
+ - push the sliding door to the left side
198
+ move_slider_right:
199
+ - push the sliding door to the right side
200
+ open_drawer:
201
+ - pull the handle to open the drawer
202
+ close_drawer:
203
+ - push the handle to close the drawer
204
+ lift_red_block_table:
205
+ - grasp and lift the red block
206
+ lift_blue_block_table:
207
+ - grasp and lift the blue block
208
+ lift_pink_block_table:
209
+ - grasp and lift the pink block
210
+ lift_red_block_slider:
211
+ - lift the red block from the sliding cabinet
212
+ lift_blue_block_slider:
213
+ - lift the blue block from the sliding cabinet
214
+ lift_pink_block_slider:
215
+ - lift the pink block from the sliding cabinet
216
+ lift_red_block_drawer:
217
+ - Take the red block from the drawer
218
+ lift_blue_block_drawer:
219
+ - Take the blue block from the drawer
220
+ lift_pink_block_drawer:
221
+ - Take the pink block from the drawer
222
+ place_in_slider:
223
+ - store the grasped block in the sliding cabinet
224
+ place_in_drawer:
225
+ - store the grasped block in the drawer
226
+ push_into_drawer:
227
+ - slide the block that it falls into the drawer
228
+ stack_block:
229
+ - stack the grasped block
230
+ unstack_block:
231
+ - remove the stacked block
232
+ turn_on_lightbulb:
233
+ - use the switch to turn on the light bulb
234
+ turn_off_lightbulb:
235
+ - use the switch to turn off the light bulb
236
+ turn_on_led:
237
+ - press the button to turn on the led light
238
+ turn_off_led:
239
+ - press the button to turn off the led light
240
+ _target_: mode.rollout.rollout_long_horizon.RolloutLongHorizon
241
+ _recursive_: false
242
+ env_cfg:
243
+ _target_: mode.wrappers.hulc_wrapper.HulcWrapper
244
+ skip_epochs: ${rollout_lh_skip_epochs}
245
+ rollout_freq: 5
246
+ num_videos: 0
247
+ num_sequences: 1000
248
+ replan_freq: 30
249
+ ep_len: 360
250
+ empty_cache: false
251
+ log_video_to_file: false
252
+ save_dir: ./videos
253
+ lang_folder: ${lang_folder}
254
+ debug: false
255
+ ema:
256
+ _target_: mode.callbacks.ema.EMA
257
+ decay: 0.999
258
+ start_step: 0
259
+ save_ema_weights_in_callback_state: true
260
+ evaluate_ema_weights_instead: true
261
+ power: 0.6666666666666666
262
+ inv_gamma: 1.0
263
+ min_value: 0.0
264
+ max_value: 0.9999
265
+ checkpoint:
266
+ _target_: pytorch_lightning.callbacks.ModelCheckpoint
267
+ verbose: true
268
+ dirpath: saved_models
269
+ filename: '{epoch:02d}'
270
+ every_n_epochs: ${callbacks.rollout_lh.rollout_freq}
271
+ datamodule:
272
+ transforms:
273
+ train:
274
+ rgb_static:
275
+ - _target_: torchvision.transforms.Resize
276
+ size: 224
277
+ antialias: true
278
+ - _target_: mode.utils.transforms.RandomShiftsAug
279
+ pad: 10
280
+ - _target_: mode.utils.transforms.ScaleImageTensor
281
+ - _target_: torchvision.transforms.Normalize
282
+ mean:
283
+ - 0.48145466
284
+ - 0.4578275
285
+ - 0.40821073
286
+ std:
287
+ - 0.26862954
288
+ - 0.26130258
289
+ - 0.27577711
290
+ rgb_gripper:
291
+ - _target_: torchvision.transforms.Resize
292
+ size: 224
293
+ antialias: true
294
+ - _target_: mode.utils.transforms.RandomShiftsAug
295
+ pad: 4
296
+ - _target_: mode.utils.transforms.ScaleImageTensor
297
+ - _target_: torchvision.transforms.Normalize
298
+ mean:
299
+ - 0.48145466
300
+ - 0.4578275
301
+ - 0.40821073
302
+ std:
303
+ - 0.26862954
304
+ - 0.26130258
305
+ - 0.27577711
306
+ robot_obs:
307
+ - _target_: mode.utils.transforms.NormalizeVector
308
+ scene_obs:
309
+ - _target_: mode.utils.transforms.NormalizeVector
310
+ val:
311
+ rgb_static:
312
+ - _target_: torchvision.transforms.Resize
313
+ size: 224
314
+ antialias: true
315
+ - _target_: mode.utils.transforms.ScaleImageTensor
316
+ - _target_: torchvision.transforms.Normalize
317
+ mean:
318
+ - 0.48145466
319
+ - 0.4578275
320
+ - 0.40821073
321
+ std:
322
+ - 0.26862954
323
+ - 0.26130258
324
+ - 0.27577711
325
+ rgb_gripper:
326
+ - _target_: torchvision.transforms.Resize
327
+ size: 224
328
+ antialias: true
329
+ - _target_: mode.utils.transforms.ScaleImageTensor
330
+ - _target_: torchvision.transforms.Normalize
331
+ mean:
332
+ - 0.48145466
333
+ - 0.4578275
334
+ - 0.40821073
335
+ std:
336
+ - 0.26862954
337
+ - 0.26130258
338
+ - 0.27577711
339
+ robot_obs:
340
+ - _target_: mode.utils.transforms.NormalizeVector
341
+ scene_obs:
342
+ - _target_: mode.utils.transforms.NormalizeVector
343
+ _target_: mode.datasets.hulc_data_module.HulcDataModule
344
+ _recursive_: false
345
+ root_data_dir: ${root_data_dir}
346
+ action_space: 7
347
+ action_max:
348
+ - 1.0
349
+ - 1.0
350
+ - 1.0
351
+ - 1.0
352
+ - 1.0
353
+ - 1.0
354
+ - 1.0
355
+ action_min:
356
+ - -1.0
357
+ - -1.0
358
+ - -1.0
359
+ - -1.0
360
+ - -1.0
361
+ - -1.0
362
+ - -1
363
+ shuffle_val: false
364
+ observation_space:
365
+ rgb_obs:
366
+ - rgb_static
367
+ - rgb_gripper
368
+ depth_obs: []
369
+ state_obs:
370
+ - robot_obs
371
+ actions:
372
+ - rel_actions
373
+ language:
374
+ - language
375
+ proprioception_dims:
376
+ n_state_obs: 8
377
+ keep_indices:
378
+ - - 0
379
+ - 7
380
+ - - 14
381
+ - 15
382
+ robot_orientation_idx:
383
+ - 3
384
+ - 6
385
+ normalize: true
386
+ normalize_robot_orientation: true
387
+ datasets:
388
+ lang_dataset:
389
+ _target_: mode.datasets.disk_dataset.ExtendedDiskDataset
390
+ key: lang
391
+ save_format: npz
392
+ batch_size: ${batch_size}
393
+ min_window_size: ${act_seq_len}
394
+ max_window_size: ${act_seq_len}
395
+ proprio_state: ${datamodule.proprioception_dims}
396
+ obs_space: ${datamodule.observation_space}
397
+ skip_frames: 1
398
+ pad: false
399
+ lang_folder: ${lang_folder}
400
+ aux_lang_loss_window: 8
401
+ num_workers: ${num_workers}
402
+ action_seq_len: ${act_seq_len}
403
+ obs_seq_len: ${obs_seq_len}
404
+ future_range: 1
405
+ use_extracted_rel_actions: ${use_extracted_rel_actions}
406
+ model:
407
+ _target_: mode.models.mode_agent.MoDEAgent
408
+ _recursive_: false
409
+ multistep: ${multistep}
410
+ use_lr_scheduler: true
411
+ entropy_gamma: 0.01
412
+ router_z_delta: 0.0
413
+ use_proprio: false
414
+ seed: ${seed}
415
+ sampler_type: ddim
416
+ num_sampling_steps: 10
417
+ sigma_data: 0.5
418
+ sigma_min: 0.001
419
+ sigma_max: 80
420
+ noise_scheduler: exponential
421
+ sigma_sample_density_type: loglogistic
422
+ ckpt_path: /home/yiming/pretrained_models/MoDE/MoDE_Pretrained
423
+ start_from_pretrained: true
424
+ act_window_size: ${act_seq_len}
425
+ latent_dim: 1024
426
+ obs_enc_dim: ${obs_dim}
427
+ cond_dim: 512
428
+ resnet_type: '50'
429
+ optimizer:
430
+ _target_: torch.optim.AdamW
431
+ transformer_weight_decay: 0.05
432
+ obs_encoder_weight_decay: 0.05
433
+ learning_rate: 0.0001
434
+ betas:
435
+ - 0.9
436
+ - 0.95
437
+ lr_scheduler:
438
+ lr_scheduler:
439
+ init_lr: 0.0001
440
+ init_lr_scale: 0.1
441
+ final_lr_scale: 1.0e-06
442
+ total_steps: 45000
443
+ phase_ratio: (0.02, 0.08, 0.9)
444
+ lr: 0.0001
445
+ model:
446
+ _target_: mode.models.edm_diffusion.score_wrappers.GCDenoiser
447
+ _recursive_: false
448
+ sigma_data: ${model.sigma_data}
449
+ inner_model:
450
+ _target_: mode.models.networks.modedit.MoDeDiT
451
+ action_dim: ${datamodule.action_space}
452
+ goal_dim: ${model.cond_dim}
453
+ obs_dim: 2048
454
+ goal_conditioned: true
455
+ causal: true
456
+ use_custom_attn_mask: false
457
+ use_proprio: ${model.use_proprio}
458
+ state_dim: ${proprio_dims}
459
+ embed_dim: ${model.latent_dim}
460
+ n_layers: 10
461
+ goal_seq_len: 1
462
+ obs_seq_len: ${obs_seq_len}
463
+ action_seq_len: ${act_seq_len}
464
+ embed_pdrob: 0
465
+ goal_drop: 0.1
466
+ attn_pdrop: 0.3
467
+ mlp_pdrop: 0.1
468
+ n_heads: 8
469
+ device: ${device}
470
+ linear_output: true
471
+ cond_router: true
472
+ num_experts: 4
473
+ top_k: 2
474
+ router_normalize: true
475
+ use_goal_in_routing: false
476
+ use_argmax: false
477
+ use_shared_expert: false
478
+ use_noise_token_as_input: true
479
+ init_style: olmoe
480
+ language_goal:
481
+ _target_: mode.models.networks.clip_lang_encoder.LangClip
482
+ _recursive_: false
483
+ model_name: ${clip_lang_model_name}
484
+ root_data_dir: data/lebai
485
+ lang_folder: lang_clip_resnet50
486
+ vis_clip_model_name: ViT-B/16
487
+ clip_lang_model_name: ViT-B/32
488
+ log_dir: ./logs
489
+ slurm: false
490
+ seed: 421
491
+ device: cuda
492
+ batch_size: 64
493
+ devices: 4
494
+ act_dim: 7
495
+ proprio_dims: 7
496
+ obs_dim: 512
497
+ goal_dim: 512
498
+ obs_seq_len: 1
499
+ act_seq_len: 32
500
+ multistep: 32
501
+ p_last_state: 0
502
+ gen_img_res: 112
503
+ max_epochs: 200
504
+ rollout_lh_skip_epochs: 9
505
+ num_workers: 12
506
+ benchmark_name: lebai_mode
507
+ use_extracted_rel_actions: true
508
+ trainer:
509
+ devices: ${devices}
510
+ precision: bf16
511
+ max_epochs: ${max_epochs}
512
+ sync_batchnorm: true
513
+ accelerator: gpu
514
+ strategy: ddp
515
+ logger:
516
+ _target_: pytorch_lightning.loggers.WandbLogger
517
+ save_dir: .
518
+ name: logger
519
+ group: mode
520
+ log_model: false
521
+ project: ${benchmark_name}
522
+ entity: yimingwu0
523
+ id: ???
l10_ds2_only/model_cleaned.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:423414d6b17475736239742ddd7d6c9ecab7df933c9e91a26b01289fa37e7e05
3
+ size 3115403448
l10_ds3_only/config.yaml ADDED
@@ -0,0 +1,523 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ callbacks:
2
+ rollout_lh:
3
+ tasks:
4
+ _target_: calvin_env.envs.tasks.Tasks
5
+ tasks:
6
+ rotate_red_block_right:
7
+ - rotate_object
8
+ - block_red
9
+ - -60
10
+ rotate_red_block_left:
11
+ - rotate_object
12
+ - block_red
13
+ - 60
14
+ rotate_blue_block_right:
15
+ - rotate_object
16
+ - block_blue
17
+ - -60
18
+ rotate_blue_block_left:
19
+ - rotate_object
20
+ - block_blue
21
+ - 60
22
+ rotate_pink_block_right:
23
+ - rotate_object
24
+ - block_pink
25
+ - -60
26
+ rotate_pink_block_left:
27
+ - rotate_object
28
+ - block_pink
29
+ - 60
30
+ push_red_block_right:
31
+ - push_object
32
+ - block_red
33
+ - 0.1
34
+ - 0
35
+ push_red_block_left:
36
+ - push_object
37
+ - block_red
38
+ - -0.1
39
+ - 0
40
+ push_blue_block_right:
41
+ - push_object
42
+ - block_blue
43
+ - 0.1
44
+ - 0
45
+ push_blue_block_left:
46
+ - push_object
47
+ - block_blue
48
+ - -0.1
49
+ - 0
50
+ push_pink_block_right:
51
+ - push_object
52
+ - block_pink
53
+ - 0.1
54
+ - 0
55
+ push_pink_block_left:
56
+ - push_object
57
+ - block_pink
58
+ - -0.1
59
+ - 0
60
+ move_slider_left:
61
+ - move_door_rel
62
+ - base__slide
63
+ - 0.15
64
+ move_slider_right:
65
+ - move_door_rel
66
+ - base__slide
67
+ - -0.15
68
+ open_drawer:
69
+ - move_door_rel
70
+ - base__drawer
71
+ - 0.12
72
+ close_drawer:
73
+ - move_door_rel
74
+ - base__drawer
75
+ - -0.12
76
+ lift_red_block_table:
77
+ - lift_object
78
+ - block_red
79
+ - 0.05
80
+ - table
81
+ - base_link
82
+ lift_red_block_slider:
83
+ - lift_object
84
+ - block_red
85
+ - 0.03
86
+ - table
87
+ - plank_link
88
+ lift_red_block_drawer:
89
+ - lift_object
90
+ - block_red
91
+ - 0.05
92
+ - table
93
+ - drawer_link
94
+ lift_blue_block_table:
95
+ - lift_object
96
+ - block_blue
97
+ - 0.05
98
+ - table
99
+ - base_link
100
+ lift_blue_block_slider:
101
+ - lift_object
102
+ - block_blue
103
+ - 0.03
104
+ - table
105
+ - plank_link
106
+ lift_blue_block_drawer:
107
+ - lift_object
108
+ - block_blue
109
+ - 0.05
110
+ - table
111
+ - drawer_link
112
+ lift_pink_block_table:
113
+ - lift_object
114
+ - block_pink
115
+ - 0.05
116
+ - table
117
+ - base_link
118
+ lift_pink_block_slider:
119
+ - lift_object
120
+ - block_pink
121
+ - 0.03
122
+ - table
123
+ - plank_link
124
+ lift_pink_block_drawer:
125
+ - lift_object
126
+ - block_pink
127
+ - 0.05
128
+ - table
129
+ - drawer_link
130
+ place_in_slider:
131
+ - place_object
132
+ - table
133
+ - plank_link
134
+ place_in_drawer:
135
+ - place_object
136
+ - table
137
+ - drawer_link
138
+ stack_block:
139
+ - stack_objects
140
+ unstack_block:
141
+ - unstack_objects
142
+ turn_on_lightbulb:
143
+ - toggle_light
144
+ - lightbulb
145
+ - 0
146
+ - 1
147
+ turn_off_lightbulb:
148
+ - toggle_light
149
+ - lightbulb
150
+ - 1
151
+ - 0
152
+ turn_on_led:
153
+ - toggle_light
154
+ - led
155
+ - 0
156
+ - 1
157
+ turn_off_led:
158
+ - toggle_light
159
+ - led
160
+ - 1
161
+ - 0
162
+ push_into_drawer:
163
+ - push_object_into
164
+ - - block_red
165
+ - block_blue
166
+ - block_pink
167
+ - table
168
+ - base_link
169
+ - table
170
+ - drawer_link
171
+ val_annotations:
172
+ rotate_red_block_right:
173
+ - take the red block and rotate it to the right
174
+ rotate_red_block_left:
175
+ - take the red block and rotate it to the left
176
+ rotate_blue_block_right:
177
+ - take the blue block and rotate it to the right
178
+ rotate_blue_block_left:
179
+ - take the blue block and rotate it to the left
180
+ rotate_pink_block_right:
181
+ - take the pink block and rotate it to the right
182
+ rotate_pink_block_left:
183
+ - take the pink block and rotate it to the left
184
+ push_red_block_right:
185
+ - go push the red block right
186
+ push_red_block_left:
187
+ - go push the red block left
188
+ push_blue_block_right:
189
+ - go push the blue block right
190
+ push_blue_block_left:
191
+ - go push the blue block left
192
+ push_pink_block_right:
193
+ - go push the pink block right
194
+ push_pink_block_left:
195
+ - go push the pink block left
196
+ move_slider_left:
197
+ - push the sliding door to the left side
198
+ move_slider_right:
199
+ - push the sliding door to the right side
200
+ open_drawer:
201
+ - pull the handle to open the drawer
202
+ close_drawer:
203
+ - push the handle to close the drawer
204
+ lift_red_block_table:
205
+ - grasp and lift the red block
206
+ lift_blue_block_table:
207
+ - grasp and lift the blue block
208
+ lift_pink_block_table:
209
+ - grasp and lift the pink block
210
+ lift_red_block_slider:
211
+ - lift the red block from the sliding cabinet
212
+ lift_blue_block_slider:
213
+ - lift the blue block from the sliding cabinet
214
+ lift_pink_block_slider:
215
+ - lift the pink block from the sliding cabinet
216
+ lift_red_block_drawer:
217
+ - Take the red block from the drawer
218
+ lift_blue_block_drawer:
219
+ - Take the blue block from the drawer
220
+ lift_pink_block_drawer:
221
+ - Take the pink block from the drawer
222
+ place_in_slider:
223
+ - store the grasped block in the sliding cabinet
224
+ place_in_drawer:
225
+ - store the grasped block in the drawer
226
+ push_into_drawer:
227
+ - slide the block that it falls into the drawer
228
+ stack_block:
229
+ - stack the grasped block
230
+ unstack_block:
231
+ - remove the stacked block
232
+ turn_on_lightbulb:
233
+ - use the switch to turn on the light bulb
234
+ turn_off_lightbulb:
235
+ - use the switch to turn off the light bulb
236
+ turn_on_led:
237
+ - press the button to turn on the led light
238
+ turn_off_led:
239
+ - press the button to turn off the led light
240
+ _target_: mode.rollout.rollout_long_horizon.RolloutLongHorizon
241
+ _recursive_: false
242
+ env_cfg:
243
+ _target_: mode.wrappers.hulc_wrapper.HulcWrapper
244
+ skip_epochs: ${rollout_lh_skip_epochs}
245
+ rollout_freq: 5
246
+ num_videos: 0
247
+ num_sequences: 1000
248
+ replan_freq: 30
249
+ ep_len: 360
250
+ empty_cache: false
251
+ log_video_to_file: false
252
+ save_dir: ./videos
253
+ lang_folder: ${lang_folder}
254
+ debug: false
255
+ ema:
256
+ _target_: mode.callbacks.ema.EMA
257
+ decay: 0.999
258
+ start_step: 0
259
+ save_ema_weights_in_callback_state: true
260
+ evaluate_ema_weights_instead: true
261
+ power: 0.6666666666666666
262
+ inv_gamma: 1.0
263
+ min_value: 0.0
264
+ max_value: 0.9999
265
+ checkpoint:
266
+ _target_: pytorch_lightning.callbacks.ModelCheckpoint
267
+ verbose: true
268
+ dirpath: saved_models
269
+ filename: '{epoch:02d}'
270
+ every_n_epochs: ${callbacks.rollout_lh.rollout_freq}
271
+ datamodule:
272
+ transforms:
273
+ train:
274
+ rgb_static:
275
+ - _target_: torchvision.transforms.Resize
276
+ size: 224
277
+ antialias: true
278
+ - _target_: mode.utils.transforms.RandomShiftsAug
279
+ pad: 10
280
+ - _target_: mode.utils.transforms.ScaleImageTensor
281
+ - _target_: torchvision.transforms.Normalize
282
+ mean:
283
+ - 0.48145466
284
+ - 0.4578275
285
+ - 0.40821073
286
+ std:
287
+ - 0.26862954
288
+ - 0.26130258
289
+ - 0.27577711
290
+ rgb_gripper:
291
+ - _target_: torchvision.transforms.Resize
292
+ size: 224
293
+ antialias: true
294
+ - _target_: mode.utils.transforms.RandomShiftsAug
295
+ pad: 4
296
+ - _target_: mode.utils.transforms.ScaleImageTensor
297
+ - _target_: torchvision.transforms.Normalize
298
+ mean:
299
+ - 0.48145466
300
+ - 0.4578275
301
+ - 0.40821073
302
+ std:
303
+ - 0.26862954
304
+ - 0.26130258
305
+ - 0.27577711
306
+ robot_obs:
307
+ - _target_: mode.utils.transforms.NormalizeVector
308
+ scene_obs:
309
+ - _target_: mode.utils.transforms.NormalizeVector
310
+ val:
311
+ rgb_static:
312
+ - _target_: torchvision.transforms.Resize
313
+ size: 224
314
+ antialias: true
315
+ - _target_: mode.utils.transforms.ScaleImageTensor
316
+ - _target_: torchvision.transforms.Normalize
317
+ mean:
318
+ - 0.48145466
319
+ - 0.4578275
320
+ - 0.40821073
321
+ std:
322
+ - 0.26862954
323
+ - 0.26130258
324
+ - 0.27577711
325
+ rgb_gripper:
326
+ - _target_: torchvision.transforms.Resize
327
+ size: 224
328
+ antialias: true
329
+ - _target_: mode.utils.transforms.ScaleImageTensor
330
+ - _target_: torchvision.transforms.Normalize
331
+ mean:
332
+ - 0.48145466
333
+ - 0.4578275
334
+ - 0.40821073
335
+ std:
336
+ - 0.26862954
337
+ - 0.26130258
338
+ - 0.27577711
339
+ robot_obs:
340
+ - _target_: mode.utils.transforms.NormalizeVector
341
+ scene_obs:
342
+ - _target_: mode.utils.transforms.NormalizeVector
343
+ _target_: mode.datasets.hulc_data_module.HulcDataModule
344
+ _recursive_: false
345
+ root_data_dir: ${root_data_dir}
346
+ action_space: 7
347
+ action_max:
348
+ - 1.0
349
+ - 1.0
350
+ - 1.0
351
+ - 1.0
352
+ - 1.0
353
+ - 1.0
354
+ - 1.0
355
+ action_min:
356
+ - -1.0
357
+ - -1.0
358
+ - -1.0
359
+ - -1.0
360
+ - -1.0
361
+ - -1.0
362
+ - -1
363
+ shuffle_val: false
364
+ observation_space:
365
+ rgb_obs:
366
+ - rgb_static
367
+ - rgb_gripper
368
+ depth_obs: []
369
+ state_obs:
370
+ - robot_obs
371
+ actions:
372
+ - rel_actions
373
+ language:
374
+ - language
375
+ proprioception_dims:
376
+ n_state_obs: 8
377
+ keep_indices:
378
+ - - 0
379
+ - 7
380
+ - - 14
381
+ - 15
382
+ robot_orientation_idx:
383
+ - 3
384
+ - 6
385
+ normalize: true
386
+ normalize_robot_orientation: true
387
+ datasets:
388
+ lang_dataset:
389
+ _target_: mode.datasets.disk_dataset.ExtendedDiskDataset
390
+ key: lang
391
+ save_format: npz
392
+ batch_size: ${batch_size}
393
+ min_window_size: ${act_seq_len}
394
+ max_window_size: ${act_seq_len}
395
+ proprio_state: ${datamodule.proprioception_dims}
396
+ obs_space: ${datamodule.observation_space}
397
+ skip_frames: 1
398
+ pad: false
399
+ lang_folder: ${lang_folder}
400
+ aux_lang_loss_window: 8
401
+ num_workers: ${num_workers}
402
+ action_seq_len: ${act_seq_len}
403
+ obs_seq_len: ${obs_seq_len}
404
+ future_range: 1
405
+ use_extracted_rel_actions: ${use_extracted_rel_actions}
406
+ model:
407
+ _target_: mode.models.mode_agent.MoDEAgent
408
+ _recursive_: false
409
+ multistep: ${multistep}
410
+ use_lr_scheduler: true
411
+ entropy_gamma: 0.01
412
+ router_z_delta: 0.0
413
+ use_proprio: false
414
+ seed: ${seed}
415
+ sampler_type: ddim
416
+ num_sampling_steps: 10
417
+ sigma_data: 0.5
418
+ sigma_min: 0.001
419
+ sigma_max: 80
420
+ noise_scheduler: exponential
421
+ sigma_sample_density_type: loglogistic
422
+ ckpt_path: /home/yiming/pretrained_models/MoDE/MoDE_Pretrained
423
+ start_from_pretrained: true
424
+ act_window_size: ${act_seq_len}
425
+ latent_dim: 1024
426
+ obs_enc_dim: ${obs_dim}
427
+ cond_dim: 512
428
+ resnet_type: '50'
429
+ optimizer:
430
+ _target_: torch.optim.AdamW
431
+ transformer_weight_decay: 0.05
432
+ obs_encoder_weight_decay: 0.05
433
+ learning_rate: 0.0001
434
+ betas:
435
+ - 0.9
436
+ - 0.95
437
+ lr_scheduler:
438
+ lr_scheduler:
439
+ init_lr: 0.0001
440
+ init_lr_scale: 0.1
441
+ final_lr_scale: 1.0e-06
442
+ total_steps: 45000
443
+ phase_ratio: (0.02, 0.08, 0.9)
444
+ lr: 0.0001
445
+ model:
446
+ _target_: mode.models.edm_diffusion.score_wrappers.GCDenoiser
447
+ _recursive_: false
448
+ sigma_data: ${model.sigma_data}
449
+ inner_model:
450
+ _target_: mode.models.networks.modedit.MoDeDiT
451
+ action_dim: ${datamodule.action_space}
452
+ goal_dim: ${model.cond_dim}
453
+ obs_dim: 2048
454
+ goal_conditioned: true
455
+ causal: true
456
+ use_custom_attn_mask: false
457
+ use_proprio: ${model.use_proprio}
458
+ state_dim: ${proprio_dims}
459
+ embed_dim: ${model.latent_dim}
460
+ n_layers: 10
461
+ goal_seq_len: 1
462
+ obs_seq_len: ${obs_seq_len}
463
+ action_seq_len: ${act_seq_len}
464
+ embed_pdrob: 0
465
+ goal_drop: 0.1
466
+ attn_pdrop: 0.3
467
+ mlp_pdrop: 0.1
468
+ n_heads: 8
469
+ device: ${device}
470
+ linear_output: true
471
+ cond_router: true
472
+ num_experts: 4
473
+ top_k: 2
474
+ router_normalize: true
475
+ use_goal_in_routing: false
476
+ use_argmax: false
477
+ use_shared_expert: false
478
+ use_noise_token_as_input: true
479
+ init_style: olmoe
480
+ language_goal:
481
+ _target_: mode.models.networks.clip_lang_encoder.LangClip
482
+ _recursive_: false
483
+ model_name: ${clip_lang_model_name}
484
+ root_data_dir: data/lebai
485
+ lang_folder: lang_clip_resnet50
486
+ vis_clip_model_name: ViT-B/16
487
+ clip_lang_model_name: ViT-B/32
488
+ log_dir: ./logs
489
+ slurm: false
490
+ seed: 421
491
+ device: cuda
492
+ batch_size: 64
493
+ devices: 4
494
+ act_dim: 7
495
+ proprio_dims: 7
496
+ obs_dim: 512
497
+ goal_dim: 512
498
+ obs_seq_len: 1
499
+ act_seq_len: 32
500
+ multistep: 32
501
+ p_last_state: 0
502
+ gen_img_res: 112
503
+ max_epochs: 200
504
+ rollout_lh_skip_epochs: 9
505
+ num_workers: 12
506
+ benchmark_name: lebai_mode
507
+ use_extracted_rel_actions: true
508
+ trainer:
509
+ devices: ${devices}
510
+ precision: bf16
511
+ max_epochs: ${max_epochs}
512
+ sync_batchnorm: true
513
+ accelerator: gpu
514
+ strategy: ddp
515
+ logger:
516
+ _target_: pytorch_lightning.loggers.WandbLogger
517
+ save_dir: .
518
+ name: logger
519
+ group: mode
520
+ log_model: false
521
+ project: ${benchmark_name}
522
+ entity: yimingwu0
523
+ id: ???
l10_ds3_only/model_cleaned.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e94672c75395ac5ac3a1cf7ffdf0ffcd8fdde763ce58523d629ea11c657c59c
3
+ size 3115403448
l10_ds4_only/config.yaml ADDED
@@ -0,0 +1,523 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ callbacks:
2
+ rollout_lh:
3
+ tasks:
4
+ _target_: calvin_env.envs.tasks.Tasks
5
+ tasks:
6
+ rotate_red_block_right:
7
+ - rotate_object
8
+ - block_red
9
+ - -60
10
+ rotate_red_block_left:
11
+ - rotate_object
12
+ - block_red
13
+ - 60
14
+ rotate_blue_block_right:
15
+ - rotate_object
16
+ - block_blue
17
+ - -60
18
+ rotate_blue_block_left:
19
+ - rotate_object
20
+ - block_blue
21
+ - 60
22
+ rotate_pink_block_right:
23
+ - rotate_object
24
+ - block_pink
25
+ - -60
26
+ rotate_pink_block_left:
27
+ - rotate_object
28
+ - block_pink
29
+ - 60
30
+ push_red_block_right:
31
+ - push_object
32
+ - block_red
33
+ - 0.1
34
+ - 0
35
+ push_red_block_left:
36
+ - push_object
37
+ - block_red
38
+ - -0.1
39
+ - 0
40
+ push_blue_block_right:
41
+ - push_object
42
+ - block_blue
43
+ - 0.1
44
+ - 0
45
+ push_blue_block_left:
46
+ - push_object
47
+ - block_blue
48
+ - -0.1
49
+ - 0
50
+ push_pink_block_right:
51
+ - push_object
52
+ - block_pink
53
+ - 0.1
54
+ - 0
55
+ push_pink_block_left:
56
+ - push_object
57
+ - block_pink
58
+ - -0.1
59
+ - 0
60
+ move_slider_left:
61
+ - move_door_rel
62
+ - base__slide
63
+ - 0.15
64
+ move_slider_right:
65
+ - move_door_rel
66
+ - base__slide
67
+ - -0.15
68
+ open_drawer:
69
+ - move_door_rel
70
+ - base__drawer
71
+ - 0.12
72
+ close_drawer:
73
+ - move_door_rel
74
+ - base__drawer
75
+ - -0.12
76
+ lift_red_block_table:
77
+ - lift_object
78
+ - block_red
79
+ - 0.05
80
+ - table
81
+ - base_link
82
+ lift_red_block_slider:
83
+ - lift_object
84
+ - block_red
85
+ - 0.03
86
+ - table
87
+ - plank_link
88
+ lift_red_block_drawer:
89
+ - lift_object
90
+ - block_red
91
+ - 0.05
92
+ - table
93
+ - drawer_link
94
+ lift_blue_block_table:
95
+ - lift_object
96
+ - block_blue
97
+ - 0.05
98
+ - table
99
+ - base_link
100
+ lift_blue_block_slider:
101
+ - lift_object
102
+ - block_blue
103
+ - 0.03
104
+ - table
105
+ - plank_link
106
+ lift_blue_block_drawer:
107
+ - lift_object
108
+ - block_blue
109
+ - 0.05
110
+ - table
111
+ - drawer_link
112
+ lift_pink_block_table:
113
+ - lift_object
114
+ - block_pink
115
+ - 0.05
116
+ - table
117
+ - base_link
118
+ lift_pink_block_slider:
119
+ - lift_object
120
+ - block_pink
121
+ - 0.03
122
+ - table
123
+ - plank_link
124
+ lift_pink_block_drawer:
125
+ - lift_object
126
+ - block_pink
127
+ - 0.05
128
+ - table
129
+ - drawer_link
130
+ place_in_slider:
131
+ - place_object
132
+ - table
133
+ - plank_link
134
+ place_in_drawer:
135
+ - place_object
136
+ - table
137
+ - drawer_link
138
+ stack_block:
139
+ - stack_objects
140
+ unstack_block:
141
+ - unstack_objects
142
+ turn_on_lightbulb:
143
+ - toggle_light
144
+ - lightbulb
145
+ - 0
146
+ - 1
147
+ turn_off_lightbulb:
148
+ - toggle_light
149
+ - lightbulb
150
+ - 1
151
+ - 0
152
+ turn_on_led:
153
+ - toggle_light
154
+ - led
155
+ - 0
156
+ - 1
157
+ turn_off_led:
158
+ - toggle_light
159
+ - led
160
+ - 1
161
+ - 0
162
+ push_into_drawer:
163
+ - push_object_into
164
+ - - block_red
165
+ - block_blue
166
+ - block_pink
167
+ - table
168
+ - base_link
169
+ - table
170
+ - drawer_link
171
+ val_annotations:
172
+ rotate_red_block_right:
173
+ - take the red block and rotate it to the right
174
+ rotate_red_block_left:
175
+ - take the red block and rotate it to the left
176
+ rotate_blue_block_right:
177
+ - take the blue block and rotate it to the right
178
+ rotate_blue_block_left:
179
+ - take the blue block and rotate it to the left
180
+ rotate_pink_block_right:
181
+ - take the pink block and rotate it to the right
182
+ rotate_pink_block_left:
183
+ - take the pink block and rotate it to the left
184
+ push_red_block_right:
185
+ - go push the red block right
186
+ push_red_block_left:
187
+ - go push the red block left
188
+ push_blue_block_right:
189
+ - go push the blue block right
190
+ push_blue_block_left:
191
+ - go push the blue block left
192
+ push_pink_block_right:
193
+ - go push the pink block right
194
+ push_pink_block_left:
195
+ - go push the pink block left
196
+ move_slider_left:
197
+ - push the sliding door to the left side
198
+ move_slider_right:
199
+ - push the sliding door to the right side
200
+ open_drawer:
201
+ - pull the handle to open the drawer
202
+ close_drawer:
203
+ - push the handle to close the drawer
204
+ lift_red_block_table:
205
+ - grasp and lift the red block
206
+ lift_blue_block_table:
207
+ - grasp and lift the blue block
208
+ lift_pink_block_table:
209
+ - grasp and lift the pink block
210
+ lift_red_block_slider:
211
+ - lift the red block from the sliding cabinet
212
+ lift_blue_block_slider:
213
+ - lift the blue block from the sliding cabinet
214
+ lift_pink_block_slider:
215
+ - lift the pink block from the sliding cabinet
216
+ lift_red_block_drawer:
217
+ - Take the red block from the drawer
218
+ lift_blue_block_drawer:
219
+ - Take the blue block from the drawer
220
+ lift_pink_block_drawer:
221
+ - Take the pink block from the drawer
222
+ place_in_slider:
223
+ - store the grasped block in the sliding cabinet
224
+ place_in_drawer:
225
+ - store the grasped block in the drawer
226
+ push_into_drawer:
227
+ - slide the block that it falls into the drawer
228
+ stack_block:
229
+ - stack the grasped block
230
+ unstack_block:
231
+ - remove the stacked block
232
+ turn_on_lightbulb:
233
+ - use the switch to turn on the light bulb
234
+ turn_off_lightbulb:
235
+ - use the switch to turn off the light bulb
236
+ turn_on_led:
237
+ - press the button to turn on the led light
238
+ turn_off_led:
239
+ - press the button to turn off the led light
240
+ _target_: mode.rollout.rollout_long_horizon.RolloutLongHorizon
241
+ _recursive_: false
242
+ env_cfg:
243
+ _target_: mode.wrappers.hulc_wrapper.HulcWrapper
244
+ skip_epochs: ${rollout_lh_skip_epochs}
245
+ rollout_freq: 5
246
+ num_videos: 0
247
+ num_sequences: 1000
248
+ replan_freq: 30
249
+ ep_len: 360
250
+ empty_cache: false
251
+ log_video_to_file: false
252
+ save_dir: ./videos
253
+ lang_folder: ${lang_folder}
254
+ debug: false
255
+ ema:
256
+ _target_: mode.callbacks.ema.EMA
257
+ decay: 0.999
258
+ start_step: 0
259
+ save_ema_weights_in_callback_state: true
260
+ evaluate_ema_weights_instead: true
261
+ power: 0.6666666666666666
262
+ inv_gamma: 1.0
263
+ min_value: 0.0
264
+ max_value: 0.9999
265
+ checkpoint:
266
+ _target_: pytorch_lightning.callbacks.ModelCheckpoint
267
+ verbose: true
268
+ dirpath: saved_models
269
+ filename: '{epoch:02d}'
270
+ every_n_epochs: ${callbacks.rollout_lh.rollout_freq}
271
+ datamodule:
272
+ transforms:
273
+ train:
274
+ rgb_static:
275
+ - _target_: torchvision.transforms.Resize
276
+ size: 224
277
+ antialias: true
278
+ - _target_: mode.utils.transforms.RandomShiftsAug
279
+ pad: 10
280
+ - _target_: mode.utils.transforms.ScaleImageTensor
281
+ - _target_: torchvision.transforms.Normalize
282
+ mean:
283
+ - 0.48145466
284
+ - 0.4578275
285
+ - 0.40821073
286
+ std:
287
+ - 0.26862954
288
+ - 0.26130258
289
+ - 0.27577711
290
+ rgb_gripper:
291
+ - _target_: torchvision.transforms.Resize
292
+ size: 224
293
+ antialias: true
294
+ - _target_: mode.utils.transforms.RandomShiftsAug
295
+ pad: 4
296
+ - _target_: mode.utils.transforms.ScaleImageTensor
297
+ - _target_: torchvision.transforms.Normalize
298
+ mean:
299
+ - 0.48145466
300
+ - 0.4578275
301
+ - 0.40821073
302
+ std:
303
+ - 0.26862954
304
+ - 0.26130258
305
+ - 0.27577711
306
+ robot_obs:
307
+ - _target_: mode.utils.transforms.NormalizeVector
308
+ scene_obs:
309
+ - _target_: mode.utils.transforms.NormalizeVector
310
+ val:
311
+ rgb_static:
312
+ - _target_: torchvision.transforms.Resize
313
+ size: 224
314
+ antialias: true
315
+ - _target_: mode.utils.transforms.ScaleImageTensor
316
+ - _target_: torchvision.transforms.Normalize
317
+ mean:
318
+ - 0.48145466
319
+ - 0.4578275
320
+ - 0.40821073
321
+ std:
322
+ - 0.26862954
323
+ - 0.26130258
324
+ - 0.27577711
325
+ rgb_gripper:
326
+ - _target_: torchvision.transforms.Resize
327
+ size: 224
328
+ antialias: true
329
+ - _target_: mode.utils.transforms.ScaleImageTensor
330
+ - _target_: torchvision.transforms.Normalize
331
+ mean:
332
+ - 0.48145466
333
+ - 0.4578275
334
+ - 0.40821073
335
+ std:
336
+ - 0.26862954
337
+ - 0.26130258
338
+ - 0.27577711
339
+ robot_obs:
340
+ - _target_: mode.utils.transforms.NormalizeVector
341
+ scene_obs:
342
+ - _target_: mode.utils.transforms.NormalizeVector
343
+ _target_: mode.datasets.hulc_data_module.HulcDataModule
344
+ _recursive_: false
345
+ root_data_dir: ${root_data_dir}
346
+ action_space: 7
347
+ action_max:
348
+ - 1.0
349
+ - 1.0
350
+ - 1.0
351
+ - 1.0
352
+ - 1.0
353
+ - 1.0
354
+ - 1.0
355
+ action_min:
356
+ - -1.0
357
+ - -1.0
358
+ - -1.0
359
+ - -1.0
360
+ - -1.0
361
+ - -1.0
362
+ - -1
363
+ shuffle_val: false
364
+ observation_space:
365
+ rgb_obs:
366
+ - rgb_static
367
+ - rgb_gripper
368
+ depth_obs: []
369
+ state_obs:
370
+ - robot_obs
371
+ actions:
372
+ - rel_actions
373
+ language:
374
+ - language
375
+ proprioception_dims:
376
+ n_state_obs: 8
377
+ keep_indices:
378
+ - - 0
379
+ - 7
380
+ - - 14
381
+ - 15
382
+ robot_orientation_idx:
383
+ - 3
384
+ - 6
385
+ normalize: true
386
+ normalize_robot_orientation: true
387
+ datasets:
388
+ lang_dataset:
389
+ _target_: mode.datasets.disk_dataset.ExtendedDiskDataset
390
+ key: lang
391
+ save_format: npz
392
+ batch_size: ${batch_size}
393
+ min_window_size: ${act_seq_len}
394
+ max_window_size: ${act_seq_len}
395
+ proprio_state: ${datamodule.proprioception_dims}
396
+ obs_space: ${datamodule.observation_space}
397
+ skip_frames: 1
398
+ pad: false
399
+ lang_folder: ${lang_folder}
400
+ aux_lang_loss_window: 8
401
+ num_workers: ${num_workers}
402
+ action_seq_len: ${act_seq_len}
403
+ obs_seq_len: ${obs_seq_len}
404
+ future_range: 1
405
+ use_extracted_rel_actions: ${use_extracted_rel_actions}
406
+ model:
407
+ _target_: mode.models.mode_agent.MoDEAgent
408
+ _recursive_: false
409
+ multistep: ${multistep}
410
+ use_lr_scheduler: true
411
+ entropy_gamma: 0.01
412
+ router_z_delta: 0.0
413
+ use_proprio: false
414
+ seed: ${seed}
415
+ sampler_type: ddim
416
+ num_sampling_steps: 10
417
+ sigma_data: 0.5
418
+ sigma_min: 0.001
419
+ sigma_max: 80
420
+ noise_scheduler: exponential
421
+ sigma_sample_density_type: loglogistic
422
+ ckpt_path: /home/yiming/pretrained_models/MoDE/MoDE_Pretrained
423
+ start_from_pretrained: true
424
+ act_window_size: ${act_seq_len}
425
+ latent_dim: 1024
426
+ obs_enc_dim: ${obs_dim}
427
+ cond_dim: 512
428
+ resnet_type: '50'
429
+ optimizer:
430
+ _target_: torch.optim.AdamW
431
+ transformer_weight_decay: 0.05
432
+ obs_encoder_weight_decay: 0.05
433
+ learning_rate: 0.0001
434
+ betas:
435
+ - 0.9
436
+ - 0.95
437
+ lr_scheduler:
438
+ lr_scheduler:
439
+ init_lr: 0.0001
440
+ init_lr_scale: 0.1
441
+ final_lr_scale: 1.0e-06
442
+ total_steps: 45000
443
+ phase_ratio: (0.02, 0.08, 0.9)
444
+ lr: 0.0001
445
+ model:
446
+ _target_: mode.models.edm_diffusion.score_wrappers.GCDenoiser
447
+ _recursive_: false
448
+ sigma_data: ${model.sigma_data}
449
+ inner_model:
450
+ _target_: mode.models.networks.modedit.MoDeDiT
451
+ action_dim: ${datamodule.action_space}
452
+ goal_dim: ${model.cond_dim}
453
+ obs_dim: 2048
454
+ goal_conditioned: true
455
+ causal: true
456
+ use_custom_attn_mask: false
457
+ use_proprio: ${model.use_proprio}
458
+ state_dim: ${proprio_dims}
459
+ embed_dim: ${model.latent_dim}
460
+ n_layers: 10
461
+ goal_seq_len: 1
462
+ obs_seq_len: ${obs_seq_len}
463
+ action_seq_len: ${act_seq_len}
464
+ embed_pdrob: 0
465
+ goal_drop: 0.1
466
+ attn_pdrop: 0.3
467
+ mlp_pdrop: 0.1
468
+ n_heads: 8
469
+ device: ${device}
470
+ linear_output: true
471
+ cond_router: true
472
+ num_experts: 4
473
+ top_k: 2
474
+ router_normalize: true
475
+ use_goal_in_routing: false
476
+ use_argmax: false
477
+ use_shared_expert: false
478
+ use_noise_token_as_input: true
479
+ init_style: olmoe
480
+ language_goal:
481
+ _target_: mode.models.networks.clip_lang_encoder.LangClip
482
+ _recursive_: false
483
+ model_name: ${clip_lang_model_name}
484
+ root_data_dir: data/lebai
485
+ lang_folder: lang_clip_resnet50
486
+ vis_clip_model_name: ViT-B/16
487
+ clip_lang_model_name: ViT-B/32
488
+ log_dir: ./logs
489
+ slurm: false
490
+ seed: 421
491
+ device: cuda
492
+ batch_size: 64
493
+ devices: 4
494
+ act_dim: 7
495
+ proprio_dims: 7
496
+ obs_dim: 512
497
+ goal_dim: 512
498
+ obs_seq_len: 1
499
+ act_seq_len: 32
500
+ multistep: 32
501
+ p_last_state: 0
502
+ gen_img_res: 112
503
+ max_epochs: 200
504
+ rollout_lh_skip_epochs: 9
505
+ num_workers: 12
506
+ benchmark_name: lebai_mode
507
+ use_extracted_rel_actions: true
508
+ trainer:
509
+ devices: ${devices}
510
+ precision: bf16
511
+ max_epochs: ${max_epochs}
512
+ sync_batchnorm: true
513
+ accelerator: gpu
514
+ strategy: ddp
515
+ logger:
516
+ _target_: pytorch_lightning.loggers.WandbLogger
517
+ save_dir: .
518
+ name: logger
519
+ group: mode
520
+ log_model: false
521
+ project: ${benchmark_name}
522
+ entity: yimingwu0
523
+ id: ???
l10_ds4_only/model_cleaned.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ced8bd34e8b00519126bbc65294c011373003cb19f70953346009e34fdc2c14
3
+ size 3115403448