# qwenlatent_vla / config.yaml
# Timsty's picture
# Upload folder using huggingface_hub
# e98fd25 verified
# Run-level settings.
# run_id is also the last path component of output_dir at the end of this file.
run_id: 0119_QwenLatent_libero_bs64_addnorm_chunk15
run_root_dir: ./runs
seed: 42
# Tracker names listed for this run; the wandb_* keys below name the
# entity and project (presumably used by the wandb tracker - confirm).
trackers:
- jsonl
- wandb
wandb_entity: timsty
wandb_project: vla_jepa
is_debug: false
# Model definition.
# NOTE(review): the nesting in this section was reconstructed from key order
# after the indentation had been lost; confirm it against the code that reads
# this file. Left flat, num_data_tokens would be a duplicate top-level key.
framework:
  name: QwenLatent
  # Settings for the backbone referenced by base_vlm.
  qwenvl:
    # Absolute, machine-specific checkpoint path.
    base_vlm: /data2/timsty/checkpoint/Qwen/Qwen3-VL-2B-Instruct
    attn_implementation: flash_attention_2
    vl_hidden_dim: 2048
    # NOTE(review): assumed to belong to qwenvl rather than to framework
    # itself; its value differs from action_model.num_data_tokens below.
    num_data_tokens: 32
  # Settings for the action model; ckpt_path is an absolute, machine-specific
  # path to a pytorch_model.pt file.
  action_model:
    ckpt_path: /data2/timsty/code/LearnLatent/runs/0119_ActionModel_droid_furniture_libero_rt1_bridge_addnorm/final_model/pytorch_model.pt
    action_size: 32
    state_size: 32
    hidden_size: 1024
    intermediate_size: 3072
    dataset_vocab_size: 256
    num_data_tokens: 8
    mask_ratio: 0.25
    state_drop_prob: 0.5
    min_action_len: 5
    num_encoder_layers: 28
    num_decoder_layers: 28
    num_attention_heads: 16
    num_key_value_heads: 8
    head_dim: 128
    max_position_embeddings: 2048
    max_action_chunk_size: 50
    rms_norm_eps: 1.0e-06
    attention_dropout: 0.0
    use_vae_reparameterization: false
# Dataset definition.
# NOTE(review): the nesting in this section was reconstructed from key order
# after the indentation had been lost; confirm it against the code that reads
# this file.
datasets:
  vla_data:
    dataset_py: lerobot_datasets
    # Absolute, machine-specific dataset root.
    data_root_dir: /data2/timsty/dataset/IPEC-COMMUNITY
    data_mix: libero_all
    action_type: delta_ee
    # Template containing {instruction}, {state_str} and {chunk_size}
    # placeholders (presumably filled in by the data loader - confirm).
    # The quoted scalar folds its line break into a single space.
    CoT_prompt: 'Task: {instruction}. Robot State: {state_str}. What are the next
      {chunk_size} actions to take?'
    default_image_resolution:
    - 3
    - 224
    - 224
    per_device_batch_size: 64
    load_all_data_for_training: true
    obs:
    - image_0
    image_size:
    - 224
    - 224
    video_backend: torchvision_av
    # NOTE(review): the next three keys are assumed to belong to vla_data;
    # from key order alone they could also sit directly under datasets.
    load_past: false
    load_future: false
    chunk_size: 15
# Training loop settings.
# NOTE(review): the nesting in this section was reconstructed from key order
# after the indentation had been lost; confirm it against the code that reads
# this file. Left flat, weight_decay would be a duplicate top-level key.
trainer:
  epochs: 100
  max_train_steps: 10000
  # NOTE(review): num_warmup_steps and warmup_ratio (further down) are both
  # set; which one takes effect is not visible from this file.
  num_warmup_steps: 500
  save_interval: 1000
  eval_interval: 50
  # One learning rate per named entry; all three are equal in this run.
  learning_rate:
    base: 5.0e-05
    qwen_vl_interface: 5.0e-05
    action_model: 5.0e-05
  lr_scheduler_type: cosine_with_min_lr
  scheduler_specific_kwargs:
    min_lr: 5.0e-07
  # Explicit empty string, not null.
  freeze_modules: ''
  loss_scale:
    align_loss: 1.0
    recon_loss: 0.1
  warmup_ratio: 0.1
  # Distinct from optimizer.weight_decay below; the two values differ.
  weight_decay: 0.0
  logging_frequency: 10
  gradient_clipping: 5.0
  gradient_accumulation_steps: 1
  optimizer:
    name: AdamW
    betas:
    - 0.9
    - 0.95
    eps: 1.0e-08
    weight_decay: 1.0e-08
  is_resume: false
  resume_epoch: null
  resume_step: null
  enable_gradient_checkpointing: true
  enable_mixed_precision_training: true
# Top-level key; its value equals run_root_dir joined with run_id.
output_dir: ./runs/0119_QwenLatent_libero_bs64_addnorm_chunk15