robbyant
/

lingbot-vla-4b-posttrain-robotwin

Model card Files Files and versions

lingbot-vla-4b-posttrain-robotwin / lingbotvla_cli.yaml

Weiww99's picture

Upload folder using huggingface_hub

3e0c7c4 verified about 1 month ago

history blame contribute delete

3.39 kB

	data:
	cameras:
	- camera_top
	- camera_wrist_left
	- camera_wrist_right
	chat_template: default
	data_name: multi
	data_root: null
	data_tag: default
	data_type: conversation
	dataloader_type: native
	datasets_type: vla
	drop_last: true
	image_keys: images
	joints:
	- '{''arm.position'': 14}'
	- '{''effector.position'': 2}'
	max_seq_len: 64
	norm_type: bounds_99_woclip
	num_workers: 20
	pin_memory: true
	prefetch_factor: 4
	robot_config_root: ./configs/robot_configs
	source_name: null
	text_keys: messages
	train_path: ./assets/training_data/robotwin_all_tasks_with_aug.txt
	train_size: 8000000
	model:
	adanorm_time: true
	attn_implementation: flash_attention_2
	basic_modules: []
	decoders: {}
	depth_incremental_training: false
	encode_target: false
	encoders: {}
	final_norm_adanorm: false
	force_use_huggingface: false
	incremental_training: false
	input_encoder: encoder
	moe_implementation: null
	nosplit_gate_liner: false
	old_adanorm: true
	output_encoder: decoder
	post_training: true
	separate_time_proj: false
	split_gate_liner: false
	use_lm_head: false
	vlm_repo_id: null
	vocab_size: 0
	train:
	action_dim: 14
	activation_gpu_limit: 0.0
	align_params: {}
	bsz_warmup_init_mbtoken: 200
	bsz_warmup_ratio: 0
	chunk_size: 50
	ckpt_manager: dcp
	context_parallel_size: 1
	data_parallel_mode: fsdp2
	data_parallel_replicate_size: 1
	data_parallel_shard_size: 8
	decayed_max_grad_norm: 1.0
	dyn_bsz: true
	dyn_bsz_buffer_size: 200
	dyn_bsz_margin: 0
	ema_rate: 0.9999
	embodiment_name: null
	empty_cache_steps: 500
	enable_activation_offload: false
	enable_expert_vision: false
	enable_forward_prefetch: true
	enable_fp32: true
	enable_fsdp_offload: false
	enable_full_determinism: false
	enable_full_shard: false
	enable_gradient_checkpointing: true
	enable_manual_eager: false
	enable_mixed_precision: true
	enable_profiling: false
	enable_reentrant: false
	enable_resume: true
	expert_parallel_size: 1
	expert_vision_path: null
	expert_vision_type: null
	freeze_vision_encoder: false
	freeze_vit: false
	global_batch_size: 256
	ignore_depth: false
	init_device: cuda
	interact_layer_end: null
	interact_layer_start: null
	load_checkpoint_path: null
	lr: 0.0001
	lr_decay_ratio: 1.0
	lr_decay_style: constant
	lr_min: 1.0e-07
	lr_start: 0.0
	lr_warmup_ratio: 0
	max_action_dim: 75
	max_grad_norm: 1.0
	max_state_dim: 75
	max_steps: 220000
	micro_batch_size: 32
	module_fsdp_enable: true
	my_tokenizer_max_length: 72
	norm_qkv: false
	num_train_epochs: 29000
	optimizer: adamw
	pipeline_parallel_size: 1
	pre_train: false
	profile_end_step: 2
	profile_profile_memory: true
	profile_record_shapes: true
	profile_start_step: 1
	profile_trace_dir: ./trace
	profile_with_stack: true
	qwenvl_bos: true
	resume_dataloader_state: true
	rmpad: false
	rmpad_with_pos_ids: false
	save_epochs: 29000
	save_hf_weights: true
	save_steps: 10000
	seed: 42
	skip_max_norm: false
	stable_train_steps: 100000
	tensor_parallel_size: 1
	tokenizer_max_length: 24
	ulysses_parallel_size: 1
	use_compile: true
	use_doptim: false
	use_ema: false
	use_fast_action: false
	use_ki: false
	use_prompt: false
	use_state: false
	use_subtask: false
	use_wandb: false
	vit_lr: 1.0e-06
	vlm_causal: false
	wandb_name: pi0_libero
	wandb_project: pi0_libero
	weight_decay: 0