lingbot-vla-4b-posttrain-robotwin / lingbotvla_cli.yaml
Weiww99's picture
Upload folder using huggingface_hub
3e0c7c4 verified
# Dataset and dataloader settings.
# The child keys are nested under `data:`. Written flush-left they parse as
# unrelated top-level keys and `data` itself becomes null.
data:
  # Names of the camera streams (one top view, left and right wrist views).
  cameras:
    - camera_top
    - camera_wrist_left
    - camera_wrist_right
  chat_template: default
  data_name: multi
  data_root: null
  data_tag: default
  data_type: conversation
  dataloader_type: native
  datasets_type: vla
  drop_last: true
  image_keys: images
  # NOTE(review): each entry is a quoted string holding a Python-dict-style
  # literal, not a native YAML mapping. Kept byte-for-byte; presumably the
  # consumer parses the string itself -- confirm before converting.
  joints:
    - '{''arm.position'': 14}'
    - '{''effector.position'': 2}'
  max_seq_len: 64
  norm_type: bounds_99_woclip
  num_workers: 20
  pin_memory: true
  prefetch_factor: 4
  # Relative paths; presumably resolved against the launch directory --
  # TODO confirm.
  robot_config_root: ./configs/robot_configs
  source_name: null
  text_keys: messages
  train_path: ./assets/training_data/robotwin_all_tasks_with_aug.txt
  train_size: 8000000
# Model construction options.
# The child keys are nested under `model:`. Written flush-left they parse as
# unrelated top-level keys and `model` itself becomes null.
model:
  adanorm_time: true
  attn_implementation: flash_attention_2
  basic_modules: []
  decoders: {}
  depth_incremental_training: false
  encode_target: false
  encoders: {}
  final_norm_adanorm: false
  force_use_huggingface: false
  incremental_training: false
  input_encoder: encoder
  moe_implementation: null
  # NOTE(review): "liner" (here and in split_gate_liner) looks like a
  # misspelling of "linear", but it is presumably the exact key the consumer
  # expects -- do not rename without checking the loader.
  nosplit_gate_liner: false
  old_adanorm: true
  output_encoder: decoder
  post_training: true
  separate_time_proj: false
  split_gate_liner: false
  use_lm_head: false
  vlm_repo_id: null
  vocab_size: 0
# Training-loop, parallelism, optimizer, checkpointing and logging settings.
# The child keys are nested under `train:`. Written flush-left they parse as
# unrelated top-level keys and `train` itself becomes null.
train:
  # NOTE(review): the `joints` entries in the data section list widths of
  # 14 and 2, while action_dim is 14 -- confirm which dimensions are actions.
  action_dim: 14
  activation_gpu_limit: 0.0
  align_params: {}
  bsz_warmup_init_mbtoken: 200
  bsz_warmup_ratio: 0
  chunk_size: 50
  ckpt_manager: dcp
  context_parallel_size: 1
  data_parallel_mode: fsdp2
  data_parallel_replicate_size: 1
  data_parallel_shard_size: 8
  decayed_max_grad_norm: 1.0
  dyn_bsz: true
  dyn_bsz_buffer_size: 200
  dyn_bsz_margin: 0
  # use_ema is false below, so this rate is presumably unused -- confirm.
  ema_rate: 0.9999
  embodiment_name: null
  empty_cache_steps: 500
  enable_activation_offload: false
  enable_expert_vision: false
  enable_forward_prefetch: true
  enable_fp32: true
  enable_fsdp_offload: false
  enable_full_determinism: false
  enable_full_shard: false
  enable_gradient_checkpointing: true
  enable_manual_eager: false
  enable_mixed_precision: true
  enable_profiling: false
  enable_reentrant: false
  enable_resume: true
  expert_parallel_size: 1
  expert_vision_path: null
  expert_vision_type: null
  freeze_vision_encoder: false
  freeze_vit: false
  # 256 = micro_batch_size (32) x data_parallel_shard_size (8); presumably
  # this means no gradient accumulation -- TODO confirm against the trainer.
  global_batch_size: 256
  ignore_depth: false
  init_device: cuda
  interact_layer_end: null
  interact_layer_start: null
  load_checkpoint_path: null
  lr: 0.0001
  lr_decay_ratio: 1.0
  lr_decay_style: constant
  lr_min: 1.0e-07
  lr_start: 0.0
  lr_warmup_ratio: 0
  max_action_dim: 75
  max_grad_norm: 1.0
  max_state_dim: 75
  max_steps: 220000
  micro_batch_size: 32
  module_fsdp_enable: true
  # NOTE(review): two tokenizer length limits are set (72 here, 24 under
  # tokenizer_max_length); which one takes effect is not visible here.
  my_tokenizer_max_length: 72
  norm_qkv: false
  num_train_epochs: 29000
  optimizer: adamw
  pipeline_parallel_size: 1
  pre_train: false
  # profile_* values presumably apply only when enable_profiling is true
  # (it is false above) -- confirm.
  profile_end_step: 2
  profile_profile_memory: true
  profile_record_shapes: true
  profile_start_step: 1
  profile_trace_dir: ./trace
  profile_with_stack: true
  qwenvl_bos: true
  resume_dataloader_state: true
  rmpad: false
  rmpad_with_pos_ids: false
  save_epochs: 29000
  save_hf_weights: true
  save_steps: 10000
  seed: 42
  skip_max_norm: false
  stable_train_steps: 100000
  tensor_parallel_size: 1
  tokenizer_max_length: 24
  ulysses_parallel_size: 1
  use_compile: true
  use_doptim: false
  use_ema: false
  use_fast_action: false
  use_ki: false
  use_prompt: false
  use_state: false
  use_subtask: false
  use_wandb: false
  vit_lr: 1.0e-06
  vlm_causal: false
  # NOTE(review): the run/project names mention "libero" although train_path
  # in the data section points at robotwin data; looks like a leftover
  # default. Presumably inert while use_wandb is false -- confirm.
  wandb_name: pi0_libero
  wandb_project: pi0_libero
  weight_decay: 0