jaehyunkang committed on
Commit
6fb13bc
·
verified ·
1 Parent(s): 7c49ffe

Upload experiment_cfg/conf.yaml

Browse files
Files changed (1) hide show
  1. experiment_cfg/conf.yaml +263 -0
experiment_cfg/conf.yaml ADDED
@@ -0,0 +1,263 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ load_config_path: null
2
+ model:
3
+ model_type: Gr00tN1d6
4
+ model_dtype: bfloat16
5
+ model_name: nvidia/Eagle-Block2A-2B-v2
6
+ backbone_model_type: eagle
7
+ model_revision: null
8
+ tune_top_llm_layers: 4
9
+ backbone_embedding_dim: 2048
10
+ tune_llm: false
11
+ tune_visual: false
12
+ select_layer: 16
13
+ reproject_vision: false
14
+ use_flash_attention: true
15
+ load_bf16: false
16
+ collator_overwrite_image_inputs: false
17
+ eagle_collator: true
18
+ backbone_trainable_params_fp32: true
19
+ image_crop_size: null
20
+ image_target_size: null
21
+ shortest_image_edge: 256
22
+ crop_fraction: 0.95
23
+ random_rotation_angle: null
24
+ color_jitter_params:
25
+ brightness: 0.2
26
+ contrast: 0.2
27
+ saturation: 0.2
28
+ hue: 0.1
29
+ use_albumentations_transforms: true
30
+ formalize_language: true
31
+ apply_sincos_state_encoding: false
32
+ use_relative_action: true
33
+ random_diffusion: false
34
+ max_state_dim: 29
35
+ max_action_dim: 29
36
+ action_horizon: 16
37
+ hidden_size: 1024
38
+ input_embedding_dim: 1536
39
+ add_pos_embed: true
40
+ attn_dropout: 0.2
41
+ use_vlln: true
42
+ max_seq_len: 1024
43
+ use_alternate_vl_dit: true
44
+ attend_text_every_n_blocks: 2
45
+ diffusion_model_cfg:
46
+ positional_embeddings: null
47
+ num_layers: 32
48
+ num_attention_heads: 32
49
+ attention_head_dim: 48
50
+ norm_type: ada_norm
51
+ dropout: 0.2
52
+ final_dropout: true
53
+ output_dim: 1024
54
+ interleave_self_attention: true
55
+ num_inference_timesteps: 4
56
+ noise_beta_alpha: 1.5
57
+ noise_beta_beta: 1.0
58
+ noise_s: 0.999
59
+ num_timestep_buckets: 1000
60
+ inference_rtc_overlap_steps: null
61
+ inference_rtc_frozen_steps: null
62
+ rtc_ramp_rate: 10.0
63
+ tune_projector: true
64
+ tune_diffusion_model: true
65
+ tune_vlln: true
66
+ state_dropout_prob: 0.0
67
+ state_additive_noise_scale: 0.0
68
+ max_num_embodiments: 32
69
+ data:
70
+ datasets:
71
+ - dataset_paths:
72
+ - /fsx/rlwrld/jaehyun/datasets/isaacsim_allex/V3_Cube_Stack-5cmLeft_lerobot
73
+ embodiment_tag: new_embodiment
74
+ mix_ratio: 1.0
75
+ dataset_type: physical_embodiment
76
+ val_dataset_path: null
77
+ modality_configs:
78
+ new_embodiment:
79
+ video:
80
+ delta_indices:
81
+ - 0
82
+ modality_keys:
83
+ - camera_ego_left
84
+ - camera_ego_right
85
+ sin_cos_embedding_keys: null
86
+ mean_std_embedding_keys: null
87
+ action_configs: null
88
+ state:
89
+ delta_indices:
90
+ - 0
91
+ modality_keys:
92
+ - right_arm_joints
93
+ - left_arm_joints
94
+ - right_hand_joints
95
+ - left_hand_joints
96
+ - neck_joints
97
+ - waist_joints
98
+ sin_cos_embedding_keys: null
99
+ mean_std_embedding_keys: null
100
+ action_configs: null
101
+ action:
102
+ delta_indices:
103
+ - 0
104
+ - 1
105
+ - 2
106
+ - 3
107
+ - 4
108
+ - 5
109
+ - 6
110
+ - 7
111
+ - 8
112
+ - 9
113
+ - 10
114
+ - 11
115
+ - 12
116
+ - 13
117
+ - 14
118
+ - 15
119
+ - 16
120
+ - 17
121
+ - 18
122
+ - 19
123
+ - 20
124
+ - 21
125
+ - 22
126
+ - 23
127
+ - 24
128
+ - 25
129
+ - 26
130
+ - 27
131
+ - 28
132
+ - 29
133
+ - 30
134
+ - 31
135
+ - 32
136
+ - 33
137
+ - 34
138
+ - 35
139
+ - 36
140
+ - 37
141
+ - 38
142
+ - 39
143
+ modality_keys:
144
+ - right_arm_joints
145
+ - left_arm_joints
146
+ - right_hand_joints
147
+ - left_hand_joints
148
+ - neck_joints
149
+ - waist_joints
150
+ sin_cos_embedding_keys: null
151
+ mean_std_embedding_keys: null
152
+ action_configs:
153
+ - rep: ABSOLUTE
154
+ type: NON_EEF
155
+ format: DEFAULT
156
+ state_key: null
157
+ - rep: ABSOLUTE
158
+ type: NON_EEF
159
+ format: DEFAULT
160
+ state_key: null
161
+ - rep: ABSOLUTE
162
+ type: NON_EEF
163
+ format: DEFAULT
164
+ state_key: null
165
+ - rep: ABSOLUTE
166
+ type: NON_EEF
167
+ format: DEFAULT
168
+ state_key: null
169
+ - rep: ABSOLUTE
170
+ type: NON_EEF
171
+ format: DEFAULT
172
+ state_key: null
173
+ - rep: ABSOLUTE
174
+ type: NON_EEF
175
+ format: DEFAULT
176
+ state_key: null
177
+ language:
178
+ delta_indices:
179
+ - 0
180
+ modality_keys:
181
+ - annotation.human.task_description
182
+ sin_cos_embedding_keys: null
183
+ mean_std_embedding_keys: null
184
+ action_configs: null
185
+ modality_config_paths: []
186
+ download_cache: false
187
+ shard_size: 1024
188
+ episode_sampling_rate: 0.1
189
+ num_shards_per_epoch: 100000
190
+ override_pretraining_statistics: false
191
+ mode: single_turn
192
+ random_chop: 0.0
193
+ mock_dataset_mode: false
194
+ shuffle: true
195
+ seed: 42
196
+ multiprocessing_context: fork
197
+ allow_padding: false
198
+ subsample_ratio: 1.0
199
+ image_crop_size:
200
+ - 244
201
+ - 244
202
+ image_target_size:
203
+ - 224
204
+ - 224
205
+ video_backend: torchcodec
206
+ training:
207
+ output_dir: /fsx/rlwrld/jaehyun/Isaac-GR00T/checkpoints/isaacsim_cube_stack_ck40_abs
208
+ experiment_name: null
209
+ max_steps: 30000
210
+ global_batch_size: 128
211
+ batch_size: null
212
+ gradient_accumulation_steps: 1
213
+ learning_rate: 0.0001
214
+ lr_scheduler_type: cosine
215
+ weight_decay: 1.0e-05
216
+ warmup_ratio: 0.05
217
+ warmup_steps: 0
218
+ max_grad_norm: 1.0
219
+ optim: adamw_torch
220
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
221
+ tf32: true
222
+ fp16: false
223
+ bf16: true
224
+ eval_bf16: true
225
+ logging_steps: 10
226
+ save_steps: 10000
227
+ save_total_limit: 5
228
+ save_vl_model: false
229
+ upload_checkpoints: false
230
+ upload_every: 1000
231
+ upload_last_n_checkpoints: 5
232
+ max_concurrent_uploads: 2
233
+ eval_strategy: 'no'
234
+ eval_steps: 500
235
+ eval_set_split_ratio: 0.1
236
+ eval_batch_size: 2
237
+ save_best_eval_metric_name: ''
238
+ save_best_eval_metric_greater_is_better: true
239
+ deepspeed_stage: 2
240
+ gradient_checkpointing: false
241
+ transformers_trust_remote_code: true
242
+ transformers_local_files_only: false
243
+ transformers_cache_dir: null
244
+ transformers_access_token: null
245
+ use_ddp: false
246
+ ddp_bucket_cap_mb: 100
247
+ num_gpus: 2
248
+ dataloader_num_workers: 8
249
+ dataloader_pin_memory: true
250
+ remove_unused_columns: false
251
+ use_wandb: true
252
+ wandb_project: finetune-gr00t-n1d6
253
+ enable_profiling: false
254
+ max_retries: 3
255
+ assert_loss_less_than: null
256
+ add_rl_callback: false
257
+ enable_open_loop_eval: false
258
+ open_loop_eval_traj_ids:
259
+ - 0
260
+ open_loop_eval_steps_per_traj: 100
261
+ open_loop_eval_plot_indices: null
262
+ max_steps: 30000
263
+ save_steps: 10000