IffYuan committed on
Commit
d1a238c
·
verified ·
1 Parent(s): 6e59dc5

Upload config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.yaml +71 -0
config.yaml ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ datasets:
2
+ vla_data:
3
+ CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
4
+ Locate their bounding boxes in [x1,y1,x2,y2] format.
5
+ data_mix: bridge_rt_1
6
+ data_root_dir: ./playground/Datasets/OXE_LEROBOT
7
+ dataset_py: lerobot_datasets
8
+ image_size:
9
+ - 224
10
+ - 224
11
+ per_device_batch_size: 8
12
+ video_backend: torchvision_av
13
+ framework:
14
+ action_model:
15
+ action_dim: 7
16
+ action_horizon: 16
17
+ action_model_type: DiT-B
18
+ add_pos_embed: true
19
+ diffusion_model_cfg:
20
+ cross_attention_dim: 4096
21
+ dropout: 0.2
22
+ final_dropout: true
23
+ interleave_self_attention: true
24
+ norm_type: ada_norm
25
+ num_layers: 16
26
+ output_dim: 1024
27
+ positional_embeddings: null
28
+ future_action_window_size: 15
29
+ hidden_size: 1024
30
+ max_seq_len: 1024
31
+ noise_beta_alpha: 1.5
32
+ noise_beta_beta: 1.0
33
+ noise_s: 0.999
34
+ num_inference_timesteps: 4
35
+ num_target_vision_tokens: 32
36
+ num_timestep_buckets: 1000
37
+ past_action_window_size: 0
38
+ state_dim: 7
39
+ name: QwenGR00T
40
+ qwenvl:
41
+ base_vlm: /mnt/18T/starVLAproject/Qwen3-VL-8B-Instruct
42
+ output_dir: /starvla/Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_2node_0203_1256
43
+ run_id: qwen3vl_bridge_rt1_QwenGR00T_2node_0203_1256
44
+ run_root_dir: /starvla/Checkpoints
45
+ seed: 42
46
+ trainer:
47
+ eval_interval: 500
48
+ freeze_modules: true
49
+ gradient_accumulation_steps: 1
50
+ gradient_clipping: 1.0
51
+ is_resume: false
52
+ learning_rate:
53
+ action_model: 0.0001
54
+ base: 1.0e-05
55
+ qwen_vl_interface: 1.0e-05
56
+ logging_frequency: 50
57
+ lr_scheduler_type: cosine_with_min_lr
58
+ max_train_steps: 100000
59
+ num_warmup_steps: 10000
60
+ optimizer:
61
+ betas:
62
+ - 0.9
63
+ - 0.95
64
+ eps: 1.0e-08
65
+ weight_decay: 1.0e-08
66
+ repeated_diffusion_steps: 4
67
+ save_interval: 10000
68
+ scheduler_specific_kwargs:
69
+ min_lr: 5.0e-07
70
+ wandb_entity: xiguapi
71
+ wandb_project: Qwen3VL_Bridge_RT1_QwenGR00T