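# Hosting-page residue captured with this file (avatar caption, commit message,
# commit hash); kept as comments so the document parses as YAML.
# Wr3ck1Am's picture
# Add files using upload-large-folder tool
# ba3fb02 verified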
# Top-level model, dataset and task settings. Their exact semantics are defined
# by the training code that consumes this file, which is not visible here.
action_dim: 7
action_model_type: DiT-L
consolidate_type: tome
dataset_name: realpushmultit
episode_instructions_file: null
fusion_type: gate
future_action_window_size: 15
group_size: 16
# NOTE(review): looks like a path to a token file rather than a token value —
# confirm, and keep the secret itself out of version control.
hf_token: .hf_token
image_aug: false
image_key: img_third
# Folded block scalar: the two lines below are joined with a single space into
# one sentence, with no trailing newline. The continuation must be indented;
# at column 0 it is not a valid continuation of the value.
instruction: >-
  push the T-shaped block to visit each T-shaped target region on the table
  without revisiting any
# See resume_epoch, resume_step and pretrained_checkpoint further down for the
# state this run resumes from.
is_resume: true
# LoRA adapter settings. The child keys must be indented under `lora`; at
# column 0 `lora` parses as null and its settings leak into the top level.
# Membership is reconstructed from the sorted key order: `alpha` through
# `vision_targets` form one alphabetical run, and the top-level alphabetical
# order resumes with `mem_length` right after it.
# NOTE(review): r/alpha, llama_r/llama_alpha and vision_r/vision_alpha are
# presumably per-module LoRA rank and scaling pairs — confirm against the
# training code.
lora:
  alpha: 48.0
  cog_cross_targets:
  - q_proj
  - k_proj
  - v_proj
  dit_attn_targets:
  - q
  - v
  dropout: 0.05
  enabled: true
  llama_alpha: 16.0
  llama_r: 8
  llama_targets:
  - q_proj
  - v_proj
  lora_cog_gate: true
  lora_llama: true
  lora_vision: true
  r: 24
  vision_alpha: 16.0
  vision_r: 8
  vision_targets:
  - qkv
# Presumably memory/retrieval and diffusion hyperparameters, judging by the key
# names only — confirm against the consuming training code.
mem_length: 16
per_token_size: 256
# The file name encodes step 006000 / epoch 03, which matches resume_step and
# resume_epoch below.
# NOTE(review): absolute path — presumably only valid on the machine that
# produced this config; confirm before reuse.
pretrained_checkpoint: /workspace/diffusion_policy/runs/memoryvla_realpushmultit/memoryvla_realpushmultit_lora_bs64_v1/checkpoints/step-006000-epoch-03-loss=0.0703.pt
repeated_diffusion_steps: 4
resume_epoch: 3
resume_step: 6000
retrieval_layers: 2
# run_id and run_root_dir both appear as components of the
# pretrained_checkpoint path above.
run_id: memoryvla_realpushmultit_lora_bs64_v1
run_id_note: null
run_root_dir: runs/memoryvla_realpushmultit
save_interval: 1000
seed: 42
# Flush (non-indented) block sequence: valid YAML, items belong to `trackers`.
trackers:
- jsonl
- wandb
update_fused: false
use_ema: false
use_timestep_pe: true
val_ratio: 0.05
# VLA model/optimisation settings. The child keys must be indented under `vla`;
# at column 0 `vla` parses as null and its settings leak into the top level.
# Membership is reconstructed from the sorted key order: `base_vlm` through
# `weight_decay` form one alphabetical run, and the top-level alphabetical
# order resumes with `wandb_entity` right after it.
vla:
  base_vlm: prism-dinosiglip-224px+7b
  data_mix: oxe_magic_soup_plus_minus
  enable_gradient_checkpointing: true
  enable_mixed_precision_training: true
  # NOTE(review): both epochs and max_steps are set; which bound ends training
  # depends on the trainer — confirm.
  epochs: 100
  # global_batch_size (256) equals per_device_batch_size (64) multiplied by
  # expected_world_size (4); presumably the trainer expects these to stay
  # consistent — verify before changing any one of them.
  expected_world_size: 4
  freeze_llm_backbone: false
  freeze_vision_backbone: false
  global_batch_size: 256
  learning_rate: 0.0002
  lr_scheduler_type: linear-warmup+cosine-decay
  max_grad_norm: 1.0
  max_steps: 10000
  per_device_batch_size: 64
  reduce_in_full_precision: true
  shuffle_buffer_size: 250000
  train_strategy: fsdp-full-shard
  type: prism-dinosiglip-224px+oxe+diffusion
  unfreeze_last_llm_layer: false
  vla_id: prism-dinosiglip-224px+oxe+diffusion
  warmup_ratio: 0.05
  weight_decay: 0.0
# Weights & Biases destination; `wandb` is one of the entries listed under
# `trackers` in this file.
wandb_entity: williamcao-uc-san-diego
wandb_project: memoryvla_realpushmultit_lora
# NOTE(review): relative path — presumably resolved against the working
# directory of the training process; confirm.
zarr_path: data/real_push_multit/RealPushMultiT_320.zarr