---
# Run configuration for run_id `memoryvla_realpushmultit_lora_bs64_v1`.
#
# NOTE(review): this document was restored from a single-line form. The
# nesting of `lora` and `vla` was reconstructed from the alphabetical key
# order -- verify against the schema of the code that loads this file.

action_dim: 7
action_model_type: DiT-L
consolidate_type: tome
dataset_name: realpushmultit
episode_instructions_file: null
fusion_type: gate
future_action_window_size: 15
group_size: 16
# NOTE(review): looks like a path to a token file rather than a literal
# token -- confirm, and keep the real secret out of version control.
hf_token: .hf_token
image_aug: false
image_key: img_third
# Folded scalar: loads as one line with single spaces, no trailing newline.
instruction: >-
  push the T-shaped block to visit each T-shaped target region on the table
  without revisiting any
is_resume: true

lora:
  alpha: 48.0
  cog_cross_targets:
    - q_proj
    - k_proj
    - v_proj
  dit_attn_targets:
    - q
    - v
  dropout: 0.05
  enabled: true
  llama_alpha: 16.0
  llama_r: 8
  llama_targets:
    - q_proj
    - v_proj
  lora_cog_gate: true
  lora_llama: true
  lora_vision: true
  r: 24
  vision_alpha: 16.0
  vision_r: 8
  vision_targets:
    - qkv

mem_length: 16
per_token_size: 256
# The checkpoint filename encodes step 006000 / epoch 03, which matches
# `resume_step` and `resume_epoch` below; update all three together.
pretrained_checkpoint: /workspace/diffusion_policy/runs/memoryvla_realpushmultit/memoryvla_realpushmultit_lora_bs64_v1/checkpoints/step-006000-epoch-03-loss=0.0703.pt
repeated_diffusion_steps: 4
resume_epoch: 3
resume_step: 6000
retrieval_layers: 2
run_id: memoryvla_realpushmultit_lora_bs64_v1
run_id_note: null
run_root_dir: runs/memoryvla_realpushmultit
save_interval: 1000
seed: 42

trackers:
  - jsonl
  - wandb

update_fused: false
use_ema: false
use_timestep_pe: true
val_ratio: 0.05

vla:
  base_vlm: prism-dinosiglip-224px+7b
  data_mix: oxe_magic_soup_plus_minus
  enable_gradient_checkpointing: true
  enable_mixed_precision_training: true
  epochs: 100
  # NOTE(review): expected_world_size (4) x per_device_batch_size (64)
  # equals global_batch_size (256) -- presumably these must stay in sync;
  # confirm whether the trainer enforces it.
  expected_world_size: 4
  freeze_llm_backbone: false
  freeze_vision_backbone: false
  global_batch_size: 256
  learning_rate: 0.0002
  lr_scheduler_type: linear-warmup+cosine-decay
  max_grad_norm: 1.0
  max_steps: 10000
  per_device_batch_size: 64
  reduce_in_full_precision: true
  shuffle_buffer_size: 250000
  train_strategy: fsdp-full-shard
  type: prism-dinosiglip-224px+oxe+diffusion
  unfreeze_last_llm_layer: false
  vla_id: prism-dinosiglip-224px+oxe+diffusion
  warmup_ratio: 0.05
  weight_decay: 0.0

wandb_entity: williamcao-uc-san-diego
wandb_project: memoryvla_realpushmultit_lora
zarr_path: data/real_push_multit/RealPushMultiT_320.zarr