| { |
| "action_dim": 7, |
| "action_model_type": "DiT-L", |
| "consolidate_type": "tome", |
| "dataset_name": "realpushmultit", |
| "episode_instructions_file": null, |
| "fusion_type": "gate", |
| "future_action_window_size": 15, |
| "group_size": 16, |
| "hf_token": ".hf_token", |
| "image_aug": false, |
| "image_key": "img_third", |
| "instruction": "push the T-shaped block to visit each T-shaped target region on the table without revisiting any", |
| "is_resume": true, |
| "lora": { |
| "alpha": 48.0, |
| "cog_cross_targets": [ |
| "q_proj", |
| "k_proj", |
| "v_proj" |
| ], |
| "dit_attn_targets": [ |
| "q", |
| "v" |
| ], |
| "dropout": 0.05, |
| "enabled": true, |
| "llama_alpha": 16.0, |
| "llama_r": 8, |
| "llama_targets": [ |
| "q_proj", |
| "v_proj" |
| ], |
| "lora_cog_gate": true, |
| "lora_llama": true, |
| "lora_vision": true, |
| "r": 24, |
| "vision_alpha": 16.0, |
| "vision_r": 8, |
| "vision_targets": [ |
| "qkv" |
| ] |
| }, |
| "mem_length": 16, |
| "per_token_size": 256, |
| "pretrained_checkpoint": "/workspace/diffusion_policy/runs/memoryvla_realpushmultit/memoryvla_realpushmultit_lora_bs64_v1/checkpoints/step-006000-epoch-03-loss=0.0703.pt", |
| "repeated_diffusion_steps": 4, |
| "resume_epoch": 3, |
| "resume_step": 6000, |
| "retrieval_layers": 2, |
| "run_id": "memoryvla_realpushmultit_lora_bs64_v1", |
| "run_id_note": null, |
| "run_root_dir": "runs/memoryvla_realpushmultit", |
| "save_interval": 1000, |
| "seed": 42, |
| "trackers": [ |
| "jsonl", |
| "wandb" |
| ], |
| "update_fused": false, |
| "use_ema": false, |
| "use_timestep_pe": true, |
| "val_ratio": 0.05, |
| "vla": { |
| "base_vlm": "prism-dinosiglip-224px+7b", |
| "data_mix": "oxe_magic_soup_plus_minus", |
| "enable_gradient_checkpointing": true, |
| "enable_mixed_precision_training": true, |
| "epochs": 100, |
| "expected_world_size": 4, |
| "freeze_llm_backbone": false, |
| "freeze_vision_backbone": false, |
| "global_batch_size": 256, |
| "learning_rate": 0.0002, |
| "lr_scheduler_type": "linear-warmup+cosine-decay", |
| "max_grad_norm": 1.0, |
| "max_steps": 10000, |
| "per_device_batch_size": 64, |
| "reduce_in_full_precision": true, |
| "shuffle_buffer_size": 250000, |
| "train_strategy": "fsdp-full-shard", |
| "type": "prism-dinosiglip-224px+oxe+diffusion", |
| "unfreeze_last_llm_layer": false, |
| "vla_id": "prism-dinosiglip-224px+oxe+diffusion", |
| "warmup_ratio": 0.05, |
| "weight_decay": 0.0 |
| }, |
| "wandb_entity": "williamcao-uc-san-diego", |
| "wandb_project": "memoryvla_realpushmultit_lora", |
| "zarr_path": "data/real_push_multit/RealPushMultiT_320.zarr" |
| } |