| { |
| "type": "pi0_ecot", |
| "n_obs_steps": 1, |
| "normalization_mapping": { |
| "VISUAL": "IDENTITY", |
| "STATE": "IDENTITY", |
| "ACTION": "IDENTITY" |
| }, |
| "input_features": { |
| "observation.images.top": { |
| "type": "VISUAL", |
| "shape": [ |
| 3, |
| 224, |
| 224 |
| ] |
| }, |
| "observation.state": { |
| "type": "STATE", |
| "shape": [ |
| 7 |
| ] |
| } |
| }, |
| "output_features": { |
| "action": { |
| "type": "ACTION", |
| "shape": [ |
| 7 |
| ] |
| } |
| }, |
| "device": "cpu", |
| "use_amp": true, |
| "chunk_size": 4, |
| "n_action_steps": 4, |
| "max_state_dim": 32, |
| "max_action_dim": 32, |
| "resize_imgs_with_padding": [ |
| 224, |
| 224 |
| ], |
| "empty_cameras": 0, |
| "adapt_to_pi_aloha": false, |
| "use_delta_joint_actions_aloha": false, |
| "tokenizer_max_length": 72, |
| "proj_width": 1024, |
| "num_steps": 10, |
| "use_cache": true, |
| "attention_implementation": "eager", |
| "freeze_vision_encoder": true, |
| "train_expert_only": true, |
| "train_state_proj": true, |
| "paligemma_pretrained_path": null, |
| "optimizer_lr": 0.0003, |
| "optimizer_betas": [ |
| 0.9, |
| 0.999 |
| ], |
| "optimizer_eps": 1e-08, |
| "optimizer_weight_decay": 0.0, |
| "scheduler_warmup_steps": 500, |
| "scheduler_decay_steps": 30000, |
| "scheduler_decay_lr": 2.5e-05, |
| "tokenizer_pretrained": "google/paligemma-3b-pt-224", |
| "max_move_tokens": 8, |
| "num_z_tokens": 8, |
| "ecot_source": "future_action", |
| "ecot_embedding_mode": "online", |
| "qwen_offline_z_key": "observation.ecot.qwen_hidden", |
| "vjepa_offline_z_key": "observation.ecot.vjepa_hidden", |
| "ecot_vla_offline_z_key": "observation.ecot.openvla_hidden", |
| "offline_z_is_projected": false, |
| "offline_z_sidecar_path": null, |
| "offline_z_sidecar_index_key": "index", |
| "offline_z_sidecar_z_key": "z", |
| "z_projection_path": "runs/autoencoder/checkpoint.pt", |
| "gt_z_projection_path": null, |
| "vjepa_z_projection_path": "runs/vjepa_autoencoder/checkpoint.pt", |
| "ecot_vla_z_projection_path": "runs/ecot_vla_autoencoder/checkpoint.pt", |
| "gt_move_joiner": ". ", |
| "gt_move_prompt_prefix": "Move: ", |
| "qwen_base_model_id": "Qwen/Qwen3-VL-4B-Instruct", |
| "qwen_model_id": "StarVLA/Qwen3VL-OFT-Bridge-RT-1", |
| "qwen_checkpoint_file": "checkpoints/steps_5000_pytorch_model.pt", |
| "vjepa_model_id": "facebook/vjepa2-vitl-fpc64-256", |
| "vjepa_clip_key": "observation.images.image_0_future", |
| "vjepa_clip_frames": 16, |
| "ecot_vla_model_id": "Embodied-CoT/ecot-openvla-7b-bridge", |
| "ecot_vla_prompt_template": "Task: {instruction}\nReasoning:", |
| "ecot_vla_text_max_length": 256, |
| "online_ecot_llm_hidden_dim": 4096, |
| "future_action_z_projection_path": "runs/future_action_autoencoder_transformer/checkpoint.pt", |
| "future_action_horizon": 50, |
| "future_action_key": "future_action", |
| "future_action_pad_mask_key": "future_action_pad_mask", |
| "enable_cross_masking": true, |
| "cross_mask_prob_a_only": 0.05, |
| "cross_mask_prob_a_only_start": 0.0, |
| "cross_mask_prob_a_only_end": 0.05, |
| "cross_mask_prob_a_only_curriculum_steps": 15000, |
| "cross_mask_prob_z_only": 0.050000000000000044, |
| "cross_mask_prob_z_only_start": 0.95, |
| "cross_mask_prob_z_only_end": 0.05, |
| "cross_mask_prob_z_only_curriculum_steps": 15000, |
| "z_loss_weight": 1.0, |
| "z_noise_alpha": 2.0, |
| "train_full_denoise_every": 50, |
| "train_full_denoise_loss_weight": 0.1, |
| "train_full_denoise_grad_last_k": 1, |
| "train_full_denoise_on_z_only": false |
| } |