umegan committed on
Commit
11e8bc9
·
verified ·
1 Parent(s): 1cd9e3d

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoint-1000/config.json +70 -0
  2. checkpoint-1000/embodiment_id.json +10 -0
  3. checkpoint-1000/experiment_cfg/conf.yaml +204 -0
  4. checkpoint-1000/experiment_cfg/config.yaml +238 -0
  5. checkpoint-1000/experiment_cfg/dataset_statistics.json +1046 -0
  6. checkpoint-1000/experiment_cfg/final_model_config.json +53 -0
  7. checkpoint-1000/experiment_cfg/final_processor_config.json +0 -0
  8. checkpoint-1000/model-00001-of-00002.safetensors +3 -0
  9. checkpoint-1000/model-00002-of-00002.safetensors +3 -0
  10. checkpoint-1000/model.safetensors.index.json +0 -0
  11. checkpoint-1000/optimizer.pt +3 -0
  12. checkpoint-1000/processor_config.json +454 -0
  13. checkpoint-1000/rng_state.pth +3 -0
  14. checkpoint-1000/scheduler.pt +3 -0
  15. checkpoint-1000/statistics.json +0 -0
  16. checkpoint-1000/trainer_state.json +634 -0
  17. checkpoint-1000/training_args.bin +3 -0
  18. checkpoint-1000/wandb_config.json +1 -0
  19. checkpoint-1500/config.json +70 -0
  20. checkpoint-1500/embodiment_id.json +10 -0
  21. checkpoint-1500/experiment_cfg/conf.yaml +204 -0
  22. checkpoint-1500/experiment_cfg/config.yaml +238 -0
  23. checkpoint-1500/experiment_cfg/dataset_statistics.json +1046 -0
  24. checkpoint-1500/experiment_cfg/final_model_config.json +53 -0
  25. checkpoint-1500/experiment_cfg/final_processor_config.json +0 -0
  26. checkpoint-1500/model-00001-of-00002.safetensors +3 -0
  27. checkpoint-1500/model-00002-of-00002.safetensors +3 -0
  28. checkpoint-1500/model.safetensors.index.json +0 -0
  29. checkpoint-1500/optimizer.pt +3 -0
  30. checkpoint-1500/processor_config.json +454 -0
  31. checkpoint-1500/rng_state.pth +3 -0
  32. checkpoint-1500/scheduler.pt +3 -0
  33. checkpoint-1500/statistics.json +0 -0
  34. checkpoint-1500/trainer_state.json +934 -0
  35. checkpoint-1500/training_args.bin +3 -0
  36. checkpoint-1500/wandb_config.json +1 -0
  37. checkpoint-2000/config.json +70 -0
  38. checkpoint-2000/embodiment_id.json +10 -0
  39. checkpoint-2000/experiment_cfg/conf.yaml +204 -0
  40. checkpoint-2000/experiment_cfg/config.yaml +238 -0
  41. checkpoint-2000/experiment_cfg/dataset_statistics.json +1046 -0
  42. checkpoint-2000/experiment_cfg/final_model_config.json +53 -0
  43. checkpoint-2000/experiment_cfg/final_processor_config.json +0 -0
  44. checkpoint-2000/model-00001-of-00002.safetensors +3 -0
  45. checkpoint-2000/model-00002-of-00002.safetensors +3 -0
  46. checkpoint-2000/model.safetensors.index.json +0 -0
  47. checkpoint-2000/optimizer.pt +3 -0
  48. checkpoint-2000/processor_config.json +454 -0
  49. checkpoint-2000/rng_state.pth +3 -0
  50. checkpoint-2000/scheduler.pt +3 -0
checkpoint-1000/config.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_horizon": 50,
3
+ "add_pos_embed": true,
4
+ "apply_sincos_state_encoding": true,
5
+ "architectures": [
6
+ "Gr00tN1d6"
7
+ ],
8
+ "attn_dropout": 0.2,
9
+ "attn_implementation": null,
10
+ "backbone_embedding_dim": 2048,
11
+ "backbone_model_type": "eagle",
12
+ "backbone_trainable_params_fp32": true,
13
+ "collator_overwrite_image_inputs": false,
14
+ "color_jitter_params": {
15
+ "brightness": 0.1,
16
+ "contrast": 0.1,
17
+ "hue": 0.1,
18
+ "saturation": 0.1
19
+ },
20
+ "crop_fraction": 0.95,
21
+ "diffusion_model_cfg": {
22
+ "attention_head_dim": 48,
23
+ "dropout": 0.2,
24
+ "final_dropout": true,
25
+ "interleave_self_attention": true,
26
+ "norm_type": "ada_norm",
27
+ "num_attention_heads": 32,
28
+ "num_layers": 32,
29
+ "output_dim": 1024,
30
+ "positional_embeddings": null
31
+ },
32
+ "eagle_collator": true,
33
+ "formalize_language": true,
34
+ "gemma_collator": false,
35
+ "hidden_size": 1024,
36
+ "image_crop_size": null,
37
+ "image_target_size": null,
38
+ "input_embedding_dim": 1536,
39
+ "load_bf16": true,
40
+ "max_action_dim": 128,
41
+ "max_num_embodiments": 32,
42
+ "max_seq_len": 1024,
43
+ "max_state_dim": 128,
44
+ "model_dtype": "bfloat16",
45
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
46
+ "model_type": "Gr00tN1d6",
47
+ "noise_beta_alpha": 1.5,
48
+ "noise_beta_beta": 1.0,
49
+ "noise_s": 0.999,
50
+ "num_inference_timesteps": 4,
51
+ "num_timestep_buckets": 1000,
52
+ "random_rotation_angle": null,
53
+ "reproject_vision": false,
54
+ "select_layer": 16,
55
+ "shortest_image_edge": 256,
56
+ "state_dropout_prob": 0.0,
57
+ "torch_dtype": "bfloat16",
58
+ "transformers_version": "4.51.3",
59
+ "tune_diffusion_model": true,
60
+ "tune_llm": false,
61
+ "tune_projector": true,
62
+ "tune_top_llm_layers": 4,
63
+ "tune_visual": false,
64
+ "tune_vlln": true,
65
+ "use_albumentations_transforms": true,
66
+ "use_alternate_vl_dit": true,
67
+ "use_flash_attention": true,
68
+ "use_relative_action": true,
69
+ "use_vlln": true
70
+ }
checkpoint-1000/embodiment_id.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "robocasa_panda_omron": 13,
3
+ "gr1": 20,
4
+ "behavior_r1_pro": 24,
5
+ "unitree_g1": 8,
6
+ "oxe_google": 0,
7
+ "oxe_widowx": 1,
8
+ "libero_panda": 2,
9
+ "new_embodiment": 10
10
+ }
checkpoint-1000/experiment_cfg/conf.yaml ADDED
@@ -0,0 +1,204 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ load_config_path: null
2
+ model:
3
+ model_type: Gr00tN1d6
4
+ model_dtype: bfloat16
5
+ model_name: nvidia/Eagle-Block2A-2B-v2
6
+ backbone_model_type: eagle
7
+ model_revision: null
8
+ tune_top_llm_layers: 4
9
+ backbone_embedding_dim: 2048
10
+ tune_llm: false
11
+ tune_visual: false
12
+ select_layer: 16
13
+ reproject_vision: false
14
+ use_flash_attention: true
15
+ load_bf16: false
16
+ collator_overwrite_image_inputs: false
17
+ eagle_collator: true
18
+ backbone_trainable_params_fp32: true
19
+ image_crop_size: null
20
+ image_target_size: null
21
+ shortest_image_edge: 256
22
+ crop_fraction: 0.95
23
+ random_rotation_angle: null
24
+ color_jitter_params: null
25
+ use_albumentations_transforms: true
26
+ formalize_language: true
27
+ apply_sincos_state_encoding: false
28
+ use_relative_action: true
29
+ max_state_dim: 29
30
+ max_action_dim: 29
31
+ action_horizon: 16
32
+ hidden_size: 1024
33
+ input_embedding_dim: 1536
34
+ add_pos_embed: true
35
+ attn_dropout: 0.2
36
+ use_vlln: true
37
+ max_seq_len: 1024
38
+ use_alternate_vl_dit: true
39
+ attend_text_every_n_blocks: 2
40
+ diffusion_model_cfg:
41
+ positional_embeddings: null
42
+ num_layers: 32
43
+ num_attention_heads: 32
44
+ attention_head_dim: 48
45
+ norm_type: ada_norm
46
+ dropout: 0.2
47
+ final_dropout: true
48
+ output_dim: 1024
49
+ interleave_self_attention: true
50
+ num_inference_timesteps: 4
51
+ noise_beta_alpha: 1.5
52
+ noise_beta_beta: 1.0
53
+ noise_s: 0.999
54
+ num_timestep_buckets: 1000
55
+ tune_projector: true
56
+ tune_diffusion_model: true
57
+ tune_vlln: true
58
+ state_dropout_prob: 0.0
59
+ state_additive_noise_scale: 0.0
60
+ max_num_embodiments: 32
61
+ data:
62
+ datasets:
63
+ - dataset_paths:
64
+ - /workspaces/isaaclab_arena/train_data
65
+ embodiment_tag: new_embodiment
66
+ mix_ratio: 1.0
67
+ dataset_type: physical_embodiment
68
+ val_dataset_path: null
69
+ modality_configs:
70
+ new_embodiment:
71
+ video:
72
+ delta_indices:
73
+ - 0
74
+ modality_keys:
75
+ - ego_view
76
+ sin_cos_embedding_keys: null
77
+ mean_std_embedding_keys: null
78
+ action_configs: null
79
+ state:
80
+ delta_indices:
81
+ - 0
82
+ modality_keys:
83
+ - single_arm
84
+ - gripper
85
+ sin_cos_embedding_keys: null
86
+ mean_std_embedding_keys: null
87
+ action_configs: null
88
+ action:
89
+ delta_indices:
90
+ - 0
91
+ - 1
92
+ - 2
93
+ - 3
94
+ - 4
95
+ - 5
96
+ - 6
97
+ - 7
98
+ - 8
99
+ - 9
100
+ - 10
101
+ - 11
102
+ - 12
103
+ - 13
104
+ - 14
105
+ - 15
106
+ modality_keys:
107
+ - single_arm
108
+ - gripper
109
+ sin_cos_embedding_keys: null
110
+ mean_std_embedding_keys: null
111
+ action_configs:
112
+ - rep: RELATIVE
113
+ type: NON_EEF
114
+ format: DEFAULT
115
+ state_key: single_arm
116
+ - rep: ABSOLUTE
117
+ type: NON_EEF
118
+ format: DEFAULT
119
+ state_key: null
120
+ language:
121
+ delta_indices:
122
+ - 0
123
+ modality_keys:
124
+ - annotation.human.task_description
125
+ sin_cos_embedding_keys: null
126
+ mean_std_embedding_keys: null
127
+ action_configs: null
128
+ download_cache: false
129
+ shard_size: 1024
130
+ episode_sampling_rate: 0.1
131
+ num_shards_per_epoch: 100000
132
+ override_pretraining_statistics: false
133
+ mode: single_turn
134
+ random_chop: 0.0
135
+ mock_dataset_mode: false
136
+ shuffle: true
137
+ seed: 42
138
+ multiprocessing_context: fork
139
+ allow_padding: false
140
+ subsample_ratio: 1.0
141
+ image_crop_size:
142
+ - 244
143
+ - 244
144
+ image_target_size:
145
+ - 224
146
+ - 224
147
+ video_backend: torchcodec
148
+ training:
149
+ output_dir: /home/ubuntu/.cache/gr00t_franka_finetune
150
+ experiment_name: null
151
+ max_steps: 2000
152
+ global_batch_size: 32
153
+ batch_size: null
154
+ gradient_accumulation_steps: 1
155
+ learning_rate: 0.0001
156
+ lr_scheduler_type: cosine
157
+ weight_decay: 1.0e-05
158
+ warmup_ratio: 0.05
159
+ warmup_steps: 0
160
+ max_grad_norm: 1.0
161
+ optim: adamw_torch
162
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
163
+ tf32: true
164
+ fp16: false
165
+ bf16: true
166
+ eval_bf16: true
167
+ logging_steps: 10
168
+ save_steps: 500
169
+ save_total_limit: 4
170
+ save_vl_model: false
171
+ upload_checkpoints: false
172
+ upload_every: 1000
173
+ upload_last_n_checkpoints: 5
174
+ max_concurrent_uploads: 2
175
+ eval_strategy: 'no'
176
+ eval_steps: 500
177
+ eval_set_split_ratio: 0.1
178
+ eval_batch_size: 2
179
+ save_best_eval_metric_name: ''
180
+ save_best_eval_metric_greater_is_better: true
181
+ deepspeed_stage: 2
182
+ gradient_checkpointing: false
183
+ transformers_trust_remote_code: true
184
+ transformers_local_files_only: false
185
+ transformers_cache_dir: null
186
+ transformers_access_token: null
187
+ use_ddp: false
188
+ ddp_bucket_cap_mb: 100
189
+ num_gpus: 1
190
+ dataloader_num_workers: 32
191
+ remove_unused_columns: false
192
+ use_wandb: false
193
+ wandb_project: finetune-gr00t-n1d6
194
+ enable_profiling: false
195
+ max_retries: 3
196
+ assert_loss_less_than: null
197
+ add_rl_callback: false
198
+ enable_open_loop_eval: false
199
+ open_loop_eval_traj_ids:
200
+ - 0
201
+ open_loop_eval_steps_per_traj: 100
202
+ open_loop_eval_plot_indices: null
203
+ max_steps: 2000
204
+ save_steps: 500
checkpoint-1000/experiment_cfg/config.yaml ADDED
@@ -0,0 +1,238 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:gr00t.configs.base_config.Config
2
+ data: !!python/object:gr00t.configs.data.data_config.DataConfig
3
+ allow_padding: false
4
+ datasets:
5
+ - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
6
+ dataset_paths:
7
+ - /workspaces/isaaclab_arena/train_data
8
+ dataset_type: physical_embodiment
9
+ embodiment_tag: new_embodiment
10
+ mix_ratio: 1.0
11
+ val_dataset_path: null
12
+ download_cache: false
13
+ episode_sampling_rate: 0.1
14
+ image_crop_size:
15
+ - 244
16
+ - 244
17
+ image_target_size:
18
+ - 224
19
+ - 224
20
+ mock_dataset_mode: false
21
+ modality_configs:
22
+ new_embodiment:
23
+ action: !!python/object:gr00t.data.types.ModalityConfig
24
+ action_configs:
25
+ - !!python/object:gr00t.data.types.ActionConfig
26
+ format: &id001 !!python/object/apply:gr00t.data.types.ActionFormat
27
+ - default
28
+ rep: !!python/object/apply:gr00t.data.types.ActionRepresentation
29
+ - relative
30
+ state_key: single_arm
31
+ type: &id002 !!python/object/apply:gr00t.data.types.ActionType
32
+ - non_eef
33
+ - !!python/object:gr00t.data.types.ActionConfig
34
+ format: *id001
35
+ rep: !!python/object/apply:gr00t.data.types.ActionRepresentation
36
+ - absolute
37
+ state_key: null
38
+ type: *id002
39
+ delta_indices:
40
+ - 0
41
+ - 1
42
+ - 2
43
+ - 3
44
+ - 4
45
+ - 5
46
+ - 6
47
+ - 7
48
+ - 8
49
+ - 9
50
+ - 10
51
+ - 11
52
+ - 12
53
+ - 13
54
+ - 14
55
+ - 15
56
+ mean_std_embedding_keys: null
57
+ modality_keys:
58
+ - single_arm
59
+ - gripper
60
+ sin_cos_embedding_keys: null
61
+ language: !!python/object:gr00t.data.types.ModalityConfig
62
+ action_configs: null
63
+ delta_indices:
64
+ - 0
65
+ mean_std_embedding_keys: null
66
+ modality_keys:
67
+ - annotation.human.task_description
68
+ sin_cos_embedding_keys: null
69
+ state: !!python/object:gr00t.data.types.ModalityConfig
70
+ action_configs: null
71
+ delta_indices:
72
+ - 0
73
+ mean_std_embedding_keys: null
74
+ modality_keys:
75
+ - single_arm
76
+ - gripper
77
+ sin_cos_embedding_keys: null
78
+ video: !!python/object:gr00t.data.types.ModalityConfig
79
+ action_configs: null
80
+ delta_indices:
81
+ - 0
82
+ mean_std_embedding_keys: null
83
+ modality_keys:
84
+ - ego_view
85
+ sin_cos_embedding_keys: null
86
+ mode: single_turn
87
+ multiprocessing_context: fork
88
+ num_shards_per_epoch: 100000
89
+ override_pretraining_statistics: false
90
+ random_chop: 0.0
91
+ seed: 42
92
+ shard_size: 1024
93
+ shuffle: true
94
+ subsample_ratio: 1.0
95
+ video_backend: torchcodec
96
+ load_config_path: null
97
+ model: !!python/object:gr00t.configs.model.gr00t_n1d6.Gr00tN1d6Config
98
+ _attn_implementation_autoset: false
99
+ _attn_implementation_internal: null
100
+ _commit_hash: null
101
+ _name_or_path: ''
102
+ add_cross_attention: false
103
+ architectures: null
104
+ backbone_model_type: eagle
105
+ backbone_trainable_params_fp32: true
106
+ bad_words_ids: null
107
+ begin_suppress_tokens: null
108
+ bos_token_id: null
109
+ chunk_size_feed_forward: 0
110
+ color_jitter_params: null
111
+ cross_attention_hidden_size: null
112
+ decoder_start_token_id: null
113
+ diffusion_model_cfg:
114
+ attention_head_dim: 48
115
+ dropout: 0.2
116
+ final_dropout: true
117
+ interleave_self_attention: true
118
+ norm_type: ada_norm
119
+ num_attention_heads: 32
120
+ num_layers: 32
121
+ output_dim: 1024
122
+ positional_embeddings: null
123
+ diversity_penalty: 0.0
124
+ do_sample: false
125
+ eagle_collator: true
126
+ early_stopping: false
127
+ encoder_no_repeat_ngram_size: 0
128
+ eos_token_id: null
129
+ exponential_decay_length_penalty: null
130
+ finetuning_task: null
131
+ forced_bos_token_id: null
132
+ forced_eos_token_id: null
133
+ id2label:
134
+ 0: LABEL_0
135
+ 1: LABEL_1
136
+ is_decoder: false
137
+ is_encoder_decoder: false
138
+ label2id:
139
+ LABEL_0: 0
140
+ LABEL_1: 1
141
+ length_penalty: 1.0
142
+ load_bf16: false
143
+ max_length: 20
144
+ min_length: 0
145
+ model_name: nvidia/Eagle-Block2A-2B-v2
146
+ no_repeat_ngram_size: 0
147
+ num_beam_groups: 1
148
+ num_beams: 1
149
+ num_return_sequences: 1
150
+ output_attentions: false
151
+ output_hidden_states: false
152
+ output_scores: false
153
+ pad_token_id: null
154
+ prefix: null
155
+ problem_type: null
156
+ pruned_heads: {}
157
+ random_rotation_angle: null
158
+ remove_invalid_values: false
159
+ repetition_penalty: 1.0
160
+ reproject_vision: false
161
+ return_dict: true
162
+ return_dict_in_generate: false
163
+ sep_token_id: null
164
+ state_dropout_prob: 0.0
165
+ suppress_tokens: null
166
+ task_specific_params: null
167
+ temperature: 1.0
168
+ tf_legacy_loss: false
169
+ tie_encoder_decoder: false
170
+ tie_word_embeddings: true
171
+ tokenizer_class: null
172
+ top_k: 50
173
+ top_p: 1.0
174
+ torch_dtype: null
175
+ torchscript: false
176
+ transformers_version: null
177
+ tune_diffusion_model: true
178
+ tune_llm: false
179
+ tune_projector: true
180
+ tune_visual: false
181
+ typical_p: 1.0
182
+ use_bfloat16: false
183
+ use_relative_action: true
184
+ training: !!python/object:gr00t.configs.training.training_config.TrainingConfig
185
+ add_rl_callback: false
186
+ assert_loss_less_than: null
187
+ batch_size: null
188
+ bf16: true
189
+ dataloader_num_workers: 32
190
+ ddp_bucket_cap_mb: 100
191
+ deepspeed_stage: 2
192
+ enable_open_loop_eval: false
193
+ enable_profiling: false
194
+ eval_batch_size: 2
195
+ eval_bf16: true
196
+ eval_set_split_ratio: 0.1
197
+ eval_steps: 500
198
+ eval_strategy: 'no'
199
+ experiment_name: null
200
+ fp16: false
201
+ global_batch_size: 32
202
+ gradient_accumulation_steps: 1
203
+ gradient_checkpointing: false
204
+ learning_rate: 0.0001
205
+ logging_steps: 10
206
+ lr_scheduler_type: cosine
207
+ max_concurrent_uploads: 2
208
+ max_grad_norm: 1.0
209
+ max_retries: 3
210
+ max_steps: 2000
211
+ num_gpus: 1
212
+ open_loop_eval_plot_indices: null
213
+ open_loop_eval_steps_per_traj: 100
214
+ open_loop_eval_traj_ids:
215
+ - 0
216
+ optim: adamw_torch
217
+ output_dir: /home/ubuntu/.cache/gr00t_franka_finetune
218
+ remove_unused_columns: false
219
+ save_best_eval_metric_greater_is_better: true
220
+ save_best_eval_metric_name: ''
221
+ save_steps: 500
222
+ save_total_limit: 4
223
+ save_vl_model: false
224
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
225
+ tf32: true
226
+ transformers_access_token: null
227
+ transformers_cache_dir: null
228
+ transformers_local_files_only: false
229
+ transformers_trust_remote_code: true
230
+ upload_checkpoints: false
231
+ upload_every: 1000
232
+ upload_last_n_checkpoints: 5
233
+ use_ddp: false
234
+ use_wandb: false
235
+ wandb_project: finetune-gr00t-n1d6
236
+ warmup_ratio: 0.05
237
+ warmup_steps: 0
238
+ weight_decay: 1.0e-05
checkpoint-1000/experiment_cfg/dataset_statistics.json ADDED
@@ -0,0 +1,1046 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "new_embodiment": {
3
+ "state": {
4
+ "single_arm": {
5
+ "min": [
6
+ -0.1016506552696228,
7
+ -0.1761876344680786,
8
+ -0.054869189858436584,
9
+ -1.4101576805114746,
10
+ -0.38218289613723755,
11
+ -0.022114872932434082,
12
+ -0.10868370532989502
13
+ ],
14
+ "max": [
15
+ 0.3447756767272949,
16
+ 1.2365270853042603,
17
+ 0.39242762327194214,
18
+ 0.2529296278953552,
19
+ 0.18470034003257751,
20
+ 2.118802309036255,
21
+ 0.8016068339347839
22
+ ],
23
+ "mean": [
24
+ 0.042614661157131195,
25
+ 0.4292725920677185,
26
+ 0.10685384273529053,
27
+ -0.8481684923171997,
28
+ -0.004952127579599619,
29
+ 1.2715188264846802,
30
+ 0.14739659428596497
31
+ ],
32
+ "std": [
33
+ 0.08599156141281128,
34
+ 0.38931092619895935,
35
+ 0.08684167265892029,
36
+ 0.41639015078544617,
37
+ 0.09905096888542175,
38
+ 0.639055073261261,
39
+ 0.20859868824481964
40
+ ],
41
+ "q01": [
42
+ -0.08698830261826515,
43
+ -0.16300016283988952,
44
+ -0.031826803982257845,
45
+ -1.3965834760665894,
46
+ -0.33692867517471314,
47
+ -0.005149464607238769,
48
+ -0.0991782522201538
49
+ ],
50
+ "q99": [
51
+ 0.3135400813817978,
52
+ 1.2095760893821716,
53
+ 0.3296026331186294,
54
+ 0.09940535783767694,
55
+ 0.177163989841938,
56
+ 2.111123719215393,
57
+ 0.7685691952705384
58
+ ]
59
+ },
60
+ "gripper": {
61
+ "min": [
62
+ -0.016243789345026016,
63
+ -0.017369966953992844
64
+ ],
65
+ "max": [
66
+ 0.0,
67
+ 0.0
68
+ ],
69
+ "mean": [
70
+ -0.0054468195885419846,
71
+ -0.005668346770107746
72
+ ],
73
+ "std": [
74
+ 0.007502974011003971,
75
+ 0.007808898109942675
76
+ ],
77
+ "q01": [
78
+ -0.01618218619376421,
79
+ -0.01736501693725586
80
+ ],
81
+ "q99": [
82
+ 0.0,
83
+ 0.0
84
+ ]
85
+ }
86
+ },
87
+ "action": {
88
+ "single_arm": {
89
+ "min": [
90
+ -0.029919808730483055,
91
+ -0.030760474503040314,
92
+ -0.03454569727182388,
93
+ -0.023138338699936867,
94
+ -0.0294453464448452,
95
+ -0.04707210883498192,
96
+ 0.0
97
+ ],
98
+ "max": [
99
+ 0.04578776657581329,
100
+ 0.03417271375656128,
101
+ 0.032364509999752045,
102
+ 0.012034625746309757,
103
+ 0.08025076240301132,
104
+ 0.04756892845034599,
105
+ 0.03999999910593033
106
+ ],
107
+ "mean": [
108
+ 0.013533495366573334,
109
+ 0.007476440165191889,
110
+ -0.01020827516913414,
111
+ -0.00018720414664130658,
112
+ 0.00028234944329597056,
113
+ -5.855086783412844e-05,
114
+ 0.026392336934804916
115
+ ],
116
+ "std": [
117
+ 0.012855037115514278,
118
+ 0.012551924213767052,
119
+ 0.017873870208859444,
120
+ 0.0029166981112211943,
121
+ 0.005159514490514994,
122
+ 0.004970518872141838,
123
+ 0.01895107515156269
124
+ ],
125
+ "q01": [
126
+ -0.005514774760231375,
127
+ -0.024535775482654572,
128
+ -0.030423654653131963,
129
+ -0.008391074724495412,
130
+ -0.01150766346603632,
131
+ -0.015753980539739133,
132
+ 0.0
133
+ ],
134
+ "q99": [
135
+ 0.03146043732762337,
136
+ 0.02946644090116024,
137
+ 0.028492353856563568,
138
+ 0.006190066309645771,
139
+ 0.01955891106277704,
140
+ 0.016726106889545896,
141
+ 0.03999999910593033
142
+ ]
143
+ },
144
+ "gripper": {
145
+ "min": [
146
+ 0.0
147
+ ],
148
+ "max": [
149
+ 0.03999999910593033
150
+ ],
151
+ "mean": [
152
+ 0.026392336934804916
153
+ ],
154
+ "std": [
155
+ 0.01895107515156269
156
+ ],
157
+ "q01": [
158
+ 0.0
159
+ ],
160
+ "q99": [
161
+ 0.03999999910593033
162
+ ]
163
+ }
164
+ },
165
+ "relative_action": {
166
+ "single_arm": {
167
+ "min": [
168
+ [
169
+ -0.32329919934272766,
170
+ -1.1854932308197021,
171
+ -0.39748504757881165,
172
+ -0.25286412239074707,
173
+ -0.18570305407047272,
174
+ -2.121999979019165,
175
+ -0.7839499115943909
176
+ ],
177
+ [
178
+ -0.32189974188804626,
179
+ -1.1826070547103882,
180
+ -0.39696475863456726,
181
+ -0.2544684112071991,
182
+ -0.18530802428722382,
183
+ -2.1222615242004395,
184
+ -0.7839499115943909
185
+ ],
186
+ [
187
+ -0.32321855425834656,
188
+ -1.1859318017959595,
189
+ -0.39636000990867615,
190
+ -0.2523682117462158,
191
+ -0.18859536945819855,
192
+ -2.1214780807495117,
193
+ -0.7839499115943909
194
+ ],
195
+ [
196
+ -0.3242166042327881,
197
+ -1.181753158569336,
198
+ -0.3955015242099762,
199
+ -0.2530977129936218,
200
+ -0.18825502693653107,
201
+ -2.1224093437194824,
202
+ -0.7839499115943909
203
+ ],
204
+ [
205
+ -0.3244396150112152,
206
+ -1.1838017702102661,
207
+ -0.3950645923614502,
208
+ -0.24863530695438385,
209
+ -0.18772920966148376,
210
+ -2.1221938133239746,
211
+ -0.7839499115943909
212
+ ],
213
+ [
214
+ -0.3249604403972626,
215
+ -1.1851550340652466,
216
+ -0.3945443034172058,
217
+ -0.2545105218887329,
218
+ -0.19080020487308502,
219
+ -2.12245512008667,
220
+ -0.7839499115943909
221
+ ],
222
+ [
223
+ -0.3240599036216736,
224
+ -1.2094337940216064,
225
+ -0.3939395546913147,
226
+ -0.2524451017379761,
227
+ -0.19165967404842377,
228
+ -2.1216351985931396,
229
+ -0.7839499115943909
230
+ ],
231
+ [
232
+ -0.3237849175930023,
233
+ -1.2061353921890259,
234
+ -0.39335793256759644,
235
+ -0.25646376609802246,
236
+ -0.19124479591846466,
237
+ -2.12142276763916,
238
+ -0.7839499115943909
239
+ ],
240
+ [
241
+ -0.32624951004981995,
242
+ -1.2092955112457275,
243
+ -0.3938826322555542,
244
+ -0.25647443532943726,
245
+ -0.19049783051013947,
246
+ -2.1221275329589844,
247
+ -0.7839499115943909
248
+ ],
249
+ [
250
+ -0.32307595014572144,
251
+ -1.205997109413147,
252
+ -0.39394718408584595,
253
+ -0.257379949092865,
254
+ -0.1888638287782669,
255
+ -2.1217713356018066,
256
+ -0.7839499115943909
257
+ ],
258
+ [
259
+ -0.3202081322669983,
260
+ -1.20602285861969,
261
+ -0.39648687839508057,
262
+ -0.2556869089603424,
263
+ -0.18957450985908508,
264
+ -2.1215648651123047,
265
+ -0.7801104187965393
266
+ ],
267
+ [
268
+ -0.32303914427757263,
269
+ -1.2070811986923218,
270
+ -0.39701157808303833,
271
+ -0.2523868978023529,
272
+ -0.1896384060382843,
273
+ -2.1222102642059326,
274
+ -0.7777257561683655
275
+ ],
276
+ [
277
+ -0.3236537277698517,
278
+ -1.20821213722229,
279
+ -0.3970761299133301,
280
+ -0.25582969188690186,
281
+ -0.18970085680484772,
282
+ -2.1212406158447266,
283
+ -0.774041473865509
284
+ ],
285
+ [
286
+ -0.32262563705444336,
287
+ -1.20747709274292,
288
+ -0.39746999740600586,
289
+ -0.2536396086215973,
290
+ -0.18984927237033844,
291
+ -2.1219756603240967,
292
+ -0.7704301476478577
293
+ ],
294
+ [
295
+ -0.32665905356407166,
296
+ -1.2074377536773682,
297
+ -0.3977932929992676,
298
+ -0.2506418526172638,
299
+ -0.1900315284729004,
300
+ -2.121697187423706,
301
+ -0.7680240273475647
302
+ ],
303
+ [
304
+ -0.3236996829509735,
305
+ -1.2079046964645386,
306
+ -0.3978058695793152,
307
+ -0.2523408532142639,
308
+ -0.19020666182041168,
309
+ -2.1220388412475586,
310
+ -0.765728771686554
311
+ ]
312
+ ],
313
+ "max": [
314
+ [
315
+ 0.12719863653182983,
316
+ 0.18446235358715057,
317
+ 0.06538978964090347,
318
+ 1.4123303890228271,
319
+ 0.36543214321136475,
320
+ 0.055936314165592194,
321
+ 0.1482430398464203
322
+ ],
323
+ [
324
+ 0.12787628173828125,
325
+ 0.18225406110286713,
326
+ 0.0630723312497139,
327
+ 1.4122768640518188,
328
+ 0.3634565770626068,
329
+ 0.05312386155128479,
330
+ 0.14398613572120667
331
+ ],
332
+ [
333
+ 0.12855961918830872,
334
+ 0.18054865300655365,
335
+ 0.060906484723091125,
336
+ 1.4116393327713013,
337
+ 0.3660118877887726,
338
+ 0.052048832178115845,
339
+ 0.14211878180503845
340
+ ],
341
+ [
342
+ 0.12901031970977783,
343
+ 0.17937372624874115,
344
+ 0.05962555110454559,
345
+ 1.412109613418579,
346
+ 0.3632301688194275,
347
+ 0.05115959048271179,
348
+ 0.14021214842796326
349
+ ],
350
+ [
351
+ 0.12952828407287598,
352
+ 0.1794057935476303,
353
+ 0.06009196117520332,
354
+ 1.4119149446487427,
355
+ 0.36106500029563904,
356
+ 0.05047079920768738,
357
+ 0.13852760195732117
358
+ ],
359
+ [
360
+ 0.12882810831069946,
361
+ 0.17998431622982025,
362
+ 0.06065024808049202,
363
+ 1.4128142595291138,
364
+ 0.3649647831916809,
365
+ 0.050107747316360474,
366
+ 0.13429853320121765
367
+ ],
368
+ [
369
+ 0.12831519544124603,
370
+ 0.17946301400661469,
371
+ 0.06099287047982216,
372
+ 1.4133707284927368,
373
+ 0.36815109848976135,
374
+ 0.04975596070289612,
375
+ 0.1339406669139862
376
+ ],
377
+ [
378
+ 0.12905743718147278,
379
+ 0.1786593645811081,
380
+ 0.06112520769238472,
381
+ 1.4141303300857544,
382
+ 0.3652087152004242,
383
+ 0.04841601476073265,
384
+ 0.1322639286518097
385
+ ],
386
+ [
387
+ 0.1297350823879242,
388
+ 0.1776067465543747,
389
+ 0.0573953241109848,
390
+ 1.4146143198013306,
391
+ 0.3671979606151581,
392
+ 0.04757409915328026,
393
+ 0.13022002577781677
394
+ ],
395
+ [
396
+ 0.13041843473911285,
397
+ 0.17776383459568024,
398
+ 0.05858777463436127,
399
+ 1.4145153760910034,
400
+ 0.36353617906570435,
401
+ 0.045672591775655746,
402
+ 0.12888506054878235
403
+ ],
404
+ [
405
+ 0.13086912035942078,
406
+ 0.17834235727787018,
407
+ 0.05983245372772217,
408
+ 1.4148727655410767,
409
+ 0.36363980174064636,
410
+ 0.04265117272734642,
411
+ 0.1267530620098114
412
+ ],
413
+ [
414
+ 0.13138708472251892,
415
+ 0.17829257249832153,
416
+ 0.06080028414726257,
417
+ 1.4132124185562134,
418
+ 0.36463645100593567,
419
+ 0.04230935871601105,
420
+ 0.12515506148338318
421
+ ],
422
+ [
423
+ 0.1306869238615036,
424
+ 0.17859286069869995,
425
+ 0.06156755983829498,
426
+ 1.4115465879440308,
427
+ 0.36609867215156555,
428
+ 0.041467443108558655,
429
+ 0.12416491657495499
430
+ ],
431
+ [
432
+ 0.12939347326755524,
433
+ 0.1791713833808899,
434
+ 0.06212584674358368,
435
+ 1.4120947122573853,
436
+ 0.36583268642425537,
437
+ 0.03956593573093414,
438
+ 0.12115160375833511
439
+ ],
440
+ [
441
+ 0.12968552112579346,
442
+ 0.17865008115768433,
443
+ 0.06246846914291382,
444
+ 1.4127825498580933,
445
+ 0.36217090487480164,
446
+ 0.04159165173768997,
447
+ 0.11784551292657852
448
+ ],
449
+ [
450
+ 0.12998661398887634,
451
+ 0.17784643173217773,
452
+ 0.06260080635547638,
453
+ 1.4135223627090454,
454
+ 0.361840158700943,
455
+ 0.040185101330280304,
456
+ 0.11627308279275894
457
+ ]
458
+ ],
459
+ "mean": [
460
+ [
461
+ -0.021064985543489456,
462
+ -0.39792153239250183,
463
+ -0.11181046068668365,
464
+ 0.8605598211288452,
465
+ -0.0025237626396119595,
466
+ -1.2637412548065186,
467
+ -0.10358496010303497
468
+ ],
469
+ [
470
+ -0.02104770392179489,
471
+ -0.3978676497936249,
472
+ -0.11182692646980286,
473
+ 0.8605672717094421,
474
+ -0.002523584757000208,
475
+ -1.2637417316436768,
476
+ -0.10367059707641602
477
+ ],
478
+ [
479
+ -0.021030250936746597,
480
+ -0.397811621427536,
481
+ -0.11184262484312057,
482
+ 0.8605707287788391,
483
+ -0.0025277354288846254,
484
+ -1.2637302875518799,
485
+ -0.10375623404979706
486
+ ],
487
+ [
488
+ -0.02101544663310051,
489
+ -0.39775529503822327,
490
+ -0.11185839772224426,
491
+ 0.8605775833129883,
492
+ -0.002535233274102211,
493
+ -1.2637287378311157,
494
+ -0.10384184867143631
495
+ ],
496
+ [
497
+ -0.021001672372221947,
498
+ -0.39770010113716125,
499
+ -0.11185967922210693,
500
+ 0.8605857491493225,
501
+ -0.0025436626747250557,
502
+ -1.2637271881103516,
503
+ -0.10392745584249496
504
+ ],
505
+ [
506
+ -0.02098824642598629,
507
+ -0.3976578712463379,
508
+ -0.11185971647500992,
509
+ 0.8605918884277344,
510
+ -0.0025569903664290905,
511
+ -1.2637248039245605,
512
+ -0.10401306301355362
513
+ ],
514
+ [
515
+ -0.020976334810256958,
516
+ -0.39763131737709045,
517
+ -0.11186240613460541,
518
+ 0.8606000542640686,
519
+ -0.0025741278659552336,
520
+ -1.26372230052948,
521
+ -0.10409871488809586
522
+ ],
523
+ [
524
+ -0.020982732996344566,
525
+ -0.3976297378540039,
526
+ -0.11186536401510239,
527
+ 0.8606085777282715,
528
+ -0.0025887791998684406,
529
+ -1.2637240886688232,
530
+ -0.1041843369603157
531
+ ],
532
+ [
533
+ -0.020988795906305313,
534
+ -0.397623211145401,
535
+ -0.11186520755290985,
536
+ 0.8606117963790894,
537
+ -0.0025999434292316437,
538
+ -1.2637230157852173,
539
+ -0.10424429178237915
540
+ ],
541
+ [
542
+ -0.020994234830141068,
543
+ -0.3976192772388458,
544
+ -0.11186467111110687,
545
+ 0.8606191873550415,
546
+ -0.002612028270959854,
547
+ -1.2637211084365845,
548
+ -0.10427426546812057
549
+ ],
550
+ [
551
+ -0.020999347791075706,
552
+ -0.3976156413555145,
553
+ -0.11186596006155014,
554
+ 0.8606262803077698,
555
+ -0.0026231720112264156,
556
+ -1.2637207508087158,
557
+ -0.10427425056695938
558
+ ],
559
+ [
560
+ -0.021002445369958878,
561
+ -0.3976096510887146,
562
+ -0.11186514049768448,
563
+ 0.860630214214325,
564
+ -0.002635682700201869,
565
+ -1.2637168169021606,
566
+ -0.10427428781986237
567
+ ],
568
+ [
569
+ -0.021011201664805412,
570
+ -0.39761000871658325,
571
+ -0.11186651140451431,
572
+ 0.860638439655304,
573
+ -0.002646006178110838,
574
+ -1.2637174129486084,
575
+ -0.10427427291870117
576
+ ],
577
+ [
578
+ -0.021014675498008728,
579
+ -0.39760351181030273,
580
+ -0.11186712980270386,
581
+ 0.8606441617012024,
582
+ -0.002654573880136013,
583
+ -1.2637194395065308,
584
+ -0.10427426546812057
585
+ ],
586
+ [
587
+ -0.021040834486484528,
588
+ -0.3976028859615326,
589
+ -0.11186829954385757,
590
+ 0.8606491088867188,
591
+ -0.002666682470589876,
592
+ -1.2637138366699219,
593
+ -0.10427425056695938
594
+ ],
595
+ [
596
+ -0.02106592431664467,
597
+ -0.39760419726371765,
598
+ -0.11186770349740982,
599
+ 0.8606574535369873,
600
+ -0.002680801786482334,
601
+ -1.2637156248092651,
602
+ -0.10427422821521759
603
+ ]
604
+ ],
605
+ "std": [
606
+ [
607
+ 0.07862132787704468,
608
+ 0.36472052335739136,
609
+ 0.07953183352947235,
610
+ 0.41708749532699585,
611
+ 0.08953142166137695,
612
+ 0.6474994421005249,
613
+ 0.2003270834684372
614
+ ],
615
+ [
616
+ 0.07865532487630844,
617
+ 0.36466875672340393,
618
+ 0.07954908907413483,
619
+ 0.4170789122581482,
620
+ 0.08954057842493057,
621
+ 0.6475056409835815,
622
+ 0.20027098059654236
623
+ ],
624
+ [
625
+ 0.07868577539920807,
626
+ 0.36461395025253296,
627
+ 0.07956718653440475,
628
+ 0.41706907749176025,
629
+ 0.08954384922981262,
630
+ 0.6475113034248352,
631
+ 0.20021489262580872
632
+ ],
633
+ [
634
+ 0.07872062176465988,
635
+ 0.3645585775375366,
636
+ 0.07958472520112991,
637
+ 0.41705429553985596,
638
+ 0.08954395353794098,
639
+ 0.6475160717964172,
640
+ 0.2001601606607437
641
+ ],
642
+ [
643
+ 0.07875548303127289,
644
+ 0.3645066022872925,
645
+ 0.07957513630390167,
646
+ 0.4170401096343994,
647
+ 0.08954435586929321,
648
+ 0.6475217342376709,
649
+ 0.2001052349805832
650
+ ],
651
+ [
652
+ 0.07878728210926056,
653
+ 0.36448603868484497,
654
+ 0.07956283539533615,
655
+ 0.4170234501361847,
656
+ 0.08953587710857391,
657
+ 0.6475263237953186,
658
+ 0.2000516802072525
659
+ ],
660
+ [
661
+ 0.07882208377122879,
662
+ 0.36450454592704773,
663
+ 0.07955189794301987,
664
+ 0.41700881719589233,
665
+ 0.08952254056930542,
666
+ 0.647530734539032,
667
+ 0.19999809563159943
668
+ ],
669
+ [
670
+ 0.07889280468225479,
671
+ 0.3645552396774292,
672
+ 0.07954024523496628,
673
+ 0.4169907867908478,
674
+ 0.08951205015182495,
675
+ 0.6475338339805603,
676
+ 0.19994452595710754
677
+ ],
678
+ [
679
+ 0.07896006852388382,
680
+ 0.3646087050437927,
681
+ 0.07952792197465897,
682
+ 0.4169798195362091,
683
+ 0.08950342237949371,
684
+ 0.6475362181663513,
685
+ 0.19982454180717468
686
+ ],
687
+ [
688
+ 0.07902492582798004,
689
+ 0.36466050148010254,
690
+ 0.07951349020004272,
691
+ 0.4169654846191406,
692
+ 0.08949856460094452,
693
+ 0.6475402116775513,
694
+ 0.19963733851909637
695
+ ],
696
+ [
697
+ 0.0790853276848793,
698
+ 0.36471861600875854,
699
+ 0.07950460910797119,
700
+ 0.4169500768184662,
701
+ 0.08949100971221924,
702
+ 0.6475431323051453,
703
+ 0.19935448467731476
704
+ ],
705
+ [
706
+ 0.0791463851928711,
707
+ 0.3647766411304474,
708
+ 0.07949627935886383,
709
+ 0.4169394075870514,
710
+ 0.08948377519845963,
711
+ 0.6475453972816467,
712
+ 0.19907325506210327
713
+ ],
714
+ [
715
+ 0.07920938730239868,
716
+ 0.36483389139175415,
717
+ 0.07948218286037445,
718
+ 0.4169244170188904,
719
+ 0.08947892487049103,
720
+ 0.6475448608398438,
721
+ 0.19879388809204102
722
+ ],
723
+ [
724
+ 0.0792689323425293,
725
+ 0.3648894131183624,
726
+ 0.07947037369012833,
727
+ 0.41691312193870544,
728
+ 0.08947526663541794,
729
+ 0.6475451588630676,
730
+ 0.19851621985435486
731
+ ],
732
+ [
733
+ 0.07932519167661667,
734
+ 0.3649515211582184,
735
+ 0.07945462316274643,
736
+ 0.4169033467769623,
737
+ 0.08946864306926727,
738
+ 0.6475487947463989,
739
+ 0.19824036955833435
740
+ ],
741
+ [
742
+ 0.07937267422676086,
743
+ 0.36501482129096985,
744
+ 0.07943546772003174,
745
+ 0.41688644886016846,
746
+ 0.08945988863706589,
747
+ 0.6475464701652527,
748
+ 0.19796623289585114
749
+ ]
750
+ ],
751
+ "q01": [
752
+ [
753
+ -0.2686644893884659,
754
+ -1.1166756582260131,
755
+ -0.3249503219127655,
756
+ -0.10763738259673118,
757
+ -0.17754718899726868,
758
+ -2.11095911026001,
759
+ -0.726121768951416
760
+ ],
761
+ [
762
+ -0.2715908128023148,
763
+ -1.1176964545249939,
764
+ -0.3246971207857132,
765
+ -0.10447386264801026,
766
+ -0.17755473166704178,
767
+ -2.111039023399353,
768
+ -0.726121768951416
769
+ ],
770
+ [
771
+ -0.2721079695224762,
772
+ -1.1183462095260621,
773
+ -0.32473934948444366,
774
+ -0.10659581780433655,
775
+ -0.17748151123523712,
776
+ -2.1109159421920776,
777
+ -0.726121768951416
778
+ ],
779
+ [
780
+ -0.2719108146429062,
781
+ -1.1183584260940551,
782
+ -0.3249865293502808,
783
+ -0.10559523880481719,
784
+ -0.17776453107595444,
785
+ -2.1114220952987672,
786
+ -0.726121768951416
787
+ ],
788
+ [
789
+ -0.27478108763694764,
790
+ -1.1184560322761536,
791
+ -0.32442001819610594,
792
+ -0.10662905514240265,
793
+ -0.17751205533742906,
794
+ -2.111326847076416,
795
+ -0.726121768951416
796
+ ],
797
+ [
798
+ -0.27461387276649474,
799
+ -1.1171478915214539,
800
+ -0.32468852162361145,
801
+ -0.10610488697886467,
802
+ -0.17753057986497878,
803
+ -2.1112320852279662,
804
+ -0.726121768951416
805
+ ],
806
+ [
807
+ -0.2748466944694519,
808
+ -1.1176495385169982,
809
+ -0.3247254079580307,
810
+ -0.10539359807968139,
811
+ -0.17761774510145187,
812
+ -2.111006693840027,
813
+ -0.726121768951416
814
+ ],
815
+ [
816
+ -0.2763983929157257,
817
+ -1.1234028029441834,
818
+ -0.32481603741645815,
819
+ -0.10651438012719154,
820
+ -0.17762102216482162,
821
+ -2.110989727973938,
822
+ -0.726121768951416
823
+ ],
824
+ [
825
+ -0.27612989604473115,
826
+ -1.1322602534294128,
827
+ -0.3249142354726791,
828
+ -0.104207394272089,
829
+ -0.17753226101398467,
830
+ -2.1104533433914185,
831
+ -0.726121768951416
832
+ ],
833
+ [
834
+ -0.2772212654352188,
835
+ -1.1327979397773742,
836
+ -0.3250032651424408,
837
+ -0.10369521856307984,
838
+ -0.1775078284740448,
839
+ -2.110794858932495,
840
+ -0.726121768951416
841
+ ],
842
+ [
843
+ -0.27782695055007933,
844
+ -1.1329670572280883,
845
+ -0.3251311558485031,
846
+ -0.10523794278502464,
847
+ -0.17756187170743942,
848
+ -2.111419234275818,
849
+ -0.7251607692241668
850
+ ],
851
+ [
852
+ -0.2772995239496231,
853
+ -1.1324901962280274,
854
+ -0.32540663063526154,
855
+ -0.10621625065803528,
856
+ -0.17752183318138123,
857
+ -2.1106600952148438,
858
+ -0.7238819229602814
859
+ ],
860
+ [
861
+ -0.2760401529073715,
862
+ -1.131754720211029,
863
+ -0.3250221389532089,
864
+ -0.10366981148719788,
865
+ -0.17745642334222794,
866
+ -2.110166282653809,
867
+ -0.7220853567123413
868
+ ],
869
+ [
870
+ -0.27648825109004976,
871
+ -1.1315274477005004,
872
+ -0.32488527715206145,
873
+ -0.10417581394314765,
874
+ -0.17765929341316222,
875
+ -2.111174240112305,
876
+ -0.721002539396286
877
+ ],
878
+ [
879
+ -0.2767831003665924,
880
+ -1.1337191128730775,
881
+ -0.32499175250530243,
882
+ -0.10650760352611542,
883
+ -0.1782200300693512,
884
+ -2.1105369424819944,
885
+ -0.7191157519817353
886
+ ],
887
+ [
888
+ -0.2783048951625824,
889
+ -1.1336584401130676,
890
+ -0.3245078271627426,
891
+ -0.10380961641669273,
892
+ -0.17757790327072143,
893
+ -2.1105402278900147,
894
+ -0.717497273683548
895
+ ]
896
+ ],
897
+ "q99": [
898
+ [
899
+ 0.10997488573193549,
900
+ 0.16461794972419735,
901
+ 0.03921745248138905,
902
+ 1.39764888048172,
903
+ 0.30130664169788357,
904
+ 0.01098630111664532,
905
+ 0.1122507885098457
906
+ ],
907
+ [
908
+ 0.11004416078329086,
909
+ 0.1643620255589485,
910
+ 0.03903082057833671,
911
+ 1.398072485923767,
912
+ 0.3018379479646683,
913
+ 0.010057139471173268,
914
+ 0.11005336791276932
915
+ ],
916
+ [
917
+ 0.11012477055191992,
918
+ 0.16386553168296814,
919
+ 0.038735973685979835,
920
+ 1.3967380928993225,
921
+ 0.30213871598243713,
922
+ 0.010799065530300123,
923
+ 0.10891361147165297
924
+ ],
925
+ [
926
+ 0.1099956126511097,
927
+ 0.16371061593294142,
928
+ 0.03824721999466418,
929
+ 1.3970967960357665,
930
+ 0.302277557849884,
931
+ 0.011137769222259486,
932
+ 0.10836461812257767
933
+ ],
934
+ [
935
+ 0.11023993626236915,
936
+ 0.1633686304092407,
937
+ 0.03792811810970305,
938
+ 1.3972763657569884,
939
+ 0.3007064414024353,
940
+ 0.010738395974039987,
941
+ 0.10781787663698195
942
+ ],
943
+ [
944
+ 0.11034056857228279,
945
+ 0.16381058037281035,
946
+ 0.03771789923310276,
947
+ 1.3969033169746399,
948
+ 0.3010092568397521,
949
+ 0.010312179420143333,
950
+ 0.1074419716000557
951
+ ],
952
+ [
953
+ 0.11034261405467986,
954
+ 0.1636140125989914,
955
+ 0.03730809785425661,
956
+ 1.3973512649536133,
957
+ 0.3012144303321838,
958
+ 0.009373838771134584,
959
+ 0.10661112785339355
960
+ ],
961
+ [
962
+ 0.11037104874849318,
963
+ 0.16361432492733002,
964
+ 0.03730310291051864,
965
+ 1.397199330329895,
966
+ 0.30146020889282227,
967
+ 0.009104850329458668,
968
+ 0.10594455733895301
969
+ ],
970
+ [
971
+ 0.11031954407691955,
972
+ 0.16329921871423722,
973
+ 0.037490070536732666,
974
+ 1.3971175789833068,
975
+ 0.30101816475391385,
976
+ 0.007780624665319918,
977
+ 0.10561806678771973
978
+ ],
979
+ [
980
+ 0.11039042010903358,
981
+ 0.16369332671165465,
982
+ 0.036998328715562794,
983
+ 1.3964923930168152,
984
+ 0.3020000964403152,
985
+ 0.007503410866484006,
986
+ 0.10535383358597755
987
+ ],
988
+ [
989
+ 0.11048222631216048,
990
+ 0.16336869567632675,
991
+ 0.03698733076453208,
992
+ 1.3960149836540223,
993
+ 0.30287389039993284,
994
+ 0.0068738124519586155,
995
+ 0.10515481844544411
996
+ ],
997
+ [
998
+ 0.11053489252924918,
999
+ 0.16354636400938033,
1000
+ 0.03707304038107395,
1001
+ 1.396628396511078,
1002
+ 0.3029059028625488,
1003
+ 0.006812876258045408,
1004
+ 0.1047084142267704
1005
+ ],
1006
+ [
1007
+ 0.11039242312312125,
1008
+ 0.16331785261631013,
1009
+ 0.03715803913772106,
1010
+ 1.3973055458068848,
1011
+ 0.30323826253414154,
1012
+ 0.006487304139882287,
1013
+ 0.10444164305925369
1014
+ ],
1015
+ [
1016
+ 0.11058814465999603,
1017
+ 0.16320075422525404,
1018
+ 0.0372002275288105,
1019
+ 1.3976932382583618,
1020
+ 0.30252904832363126,
1021
+ 0.005770333949476429,
1022
+ 0.10420910120010375
1023
+ ],
1024
+ [
1025
+ 0.11048216462135314,
1026
+ 0.1634601667523384,
1027
+ 0.0368946287035942,
1028
+ 1.396862666606903,
1029
+ 0.3012196272611618,
1030
+ 0.006188006103038769,
1031
+ 0.10407691970467567
1032
+ ],
1033
+ [
1034
+ 0.11032852262258529,
1035
+ 0.16324337780475617,
1036
+ 0.03683135174214838,
1037
+ 1.3966079354286194,
1038
+ 0.30130040407180775,
1039
+ 0.006021949928253876,
1040
+ 0.10380818247795105
1041
+ ]
1042
+ ]
1043
+ }
1044
+ }
1045
+ }
1046
+ }
checkpoint-1000/experiment_cfg/final_model_config.json ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "Gr00tN1d6",
3
+ "model_dtype": "bfloat16",
4
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
5
+ "backbone_model_type": "eagle",
6
+ "model_revision": null,
7
+ "tune_top_llm_layers": 4,
8
+ "backbone_embedding_dim": 2048,
9
+ "tune_llm": false,
10
+ "tune_visual": false,
11
+ "select_layer": 16,
12
+ "reproject_vision": false,
13
+ "use_flash_attention": true,
14
+ "load_bf16": true,
15
+ "collator_overwrite_image_inputs": false,
16
+ "eagle_collator": true,
17
+ "backbone_trainable_params_fp32": true,
18
+ "apply_sincos_state_encoding": true,
19
+ "use_relative_action": true,
20
+ "max_state_dim": 128,
21
+ "max_action_dim": 128,
22
+ "action_horizon": 50,
23
+ "hidden_size": 1024,
24
+ "input_embedding_dim": 1536,
25
+ "add_pos_embed": true,
26
+ "attn_dropout": 0.2,
27
+ "use_vlln": true,
28
+ "max_seq_len": 1024,
29
+ "use_alternate_vl_dit": true,
30
+ "attend_text_every_n_blocks": 2,
31
+ "diffusion_model_cfg": {
32
+ "attention_head_dim": 48,
33
+ "dropout": 0.2,
34
+ "final_dropout": true,
35
+ "interleave_self_attention": true,
36
+ "norm_type": "ada_norm",
37
+ "num_attention_heads": 32,
38
+ "num_layers": 32,
39
+ "output_dim": 1024,
40
+ "positional_embeddings": null
41
+ },
42
+ "num_inference_timesteps": 4,
43
+ "noise_beta_alpha": 1.5,
44
+ "noise_beta_beta": 1.0,
45
+ "noise_s": 0.999,
46
+ "num_timestep_buckets": 1000,
47
+ "tune_projector": true,
48
+ "tune_diffusion_model": true,
49
+ "tune_vlln": true,
50
+ "state_dropout_prob": 0.0,
51
+ "state_additive_noise_scale": 0.0,
52
+ "max_num_embodiments": 32
53
+ }
checkpoint-1000/experiment_cfg/final_processor_config.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-1000/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02646418bc33318b62e7ef691c8d7add35772395b99f13be296d813e5f93d05b
3
+ size 4990120184
checkpoint-1000/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fdc6262bc45affc2b050421cbf8a24ae571dce75dbfcf0b01c8c78131258e81
3
+ size 4823190320
checkpoint-1000/model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-1000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:185a90afae21031e12019294f25b654b08ad1096f83d240d2fff47861180b0c5
3
+ size 12960193762
checkpoint-1000/processor_config.json ADDED
@@ -0,0 +1,454 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "processor_class": "Gr00tN1d6Processor",
3
+ "processor_kwargs": {
4
+ "modality_configs": {
5
+ "behavior_r1_pro": {
6
+ "video": {
7
+ "delta_indices": [
8
+ 0
9
+ ],
10
+ "modality_keys": [
11
+ "observation.images.rgb.head_256_256",
12
+ "observation.images.rgb.left_wrist_256_256",
13
+ "observation.images.rgb.right_wrist_256_256"
14
+ ],
15
+ "sin_cos_embedding_keys": null,
16
+ "mean_std_embedding_keys": null,
17
+ "action_configs": null
18
+ },
19
+ "state": {
20
+ "delta_indices": [
21
+ 0
22
+ ],
23
+ "modality_keys": [
24
+ "robot_pos",
25
+ "robot_ori_cos",
26
+ "robot_ori_sin",
27
+ "robot_2d_ori",
28
+ "robot_2d_ori_cos",
29
+ "robot_2d_ori_sin",
30
+ "robot_lin_vel",
31
+ "robot_ang_vel",
32
+ "arm_left_qpos",
33
+ "arm_left_qpos_sin",
34
+ "arm_left_qpos_cos",
35
+ "eef_left_pos",
36
+ "eef_left_quat",
37
+ "gripper_left_qpos",
38
+ "arm_right_qpos",
39
+ "arm_right_qpos_sin",
40
+ "arm_right_qpos_cos",
41
+ "eef_right_pos",
42
+ "eef_right_quat",
43
+ "gripper_right_qpos",
44
+ "trunk_qpos"
45
+ ],
46
+ "sin_cos_embedding_keys": null,
47
+ "mean_std_embedding_keys": null,
48
+ "action_configs": null
49
+ },
50
+ "action": {
51
+ "delta_indices": [
52
+ 0,
53
+ 1,
54
+ 2,
55
+ 3,
56
+ 4,
57
+ 5,
58
+ 6,
59
+ 7,
60
+ 8,
61
+ 9,
62
+ 10,
63
+ 11,
64
+ 12,
65
+ 13,
66
+ 14,
67
+ 15,
68
+ 16,
69
+ 17,
70
+ 18,
71
+ 19,
72
+ 20,
73
+ 21,
74
+ 22,
75
+ 23,
76
+ 24,
77
+ 25,
78
+ 26,
79
+ 27,
80
+ 28,
81
+ 29,
82
+ 30,
83
+ 31
84
+ ],
85
+ "modality_keys": [
86
+ "base",
87
+ "torso",
88
+ "left_arm",
89
+ "left_gripper",
90
+ "right_arm",
91
+ "right_gripper"
92
+ ],
93
+ "sin_cos_embedding_keys": null,
94
+ "mean_std_embedding_keys": null,
95
+ "action_configs": [
96
+ {
97
+ "rep": "ABSOLUTE",
98
+ "type": "NON_EEF",
99
+ "format": "DEFAULT",
100
+ "state_key": null
101
+ },
102
+ {
103
+ "rep": "RELATIVE",
104
+ "type": "NON_EEF",
105
+ "format": "DEFAULT",
106
+ "state_key": "trunk_qpos"
107
+ },
108
+ {
109
+ "rep": "RELATIVE",
110
+ "type": "NON_EEF",
111
+ "format": "DEFAULT",
112
+ "state_key": "arm_left_qpos"
113
+ },
114
+ {
115
+ "rep": "ABSOLUTE",
116
+ "type": "NON_EEF",
117
+ "format": "DEFAULT",
118
+ "state_key": null
119
+ },
120
+ {
121
+ "rep": "RELATIVE",
122
+ "type": "NON_EEF",
123
+ "format": "DEFAULT",
124
+ "state_key": "arm_right_qpos"
125
+ },
126
+ {
127
+ "rep": "ABSOLUTE",
128
+ "type": "NON_EEF",
129
+ "format": "DEFAULT",
130
+ "state_key": null
131
+ }
132
+ ]
133
+ },
134
+ "language": {
135
+ "delta_indices": [
136
+ 0
137
+ ],
138
+ "modality_keys": [
139
+ "annotation.human.coarse_action"
140
+ ],
141
+ "sin_cos_embedding_keys": null,
142
+ "mean_std_embedding_keys": null,
143
+ "action_configs": null
144
+ }
145
+ },
146
+ "gr1": {
147
+ "video": {
148
+ "delta_indices": [
149
+ 0
150
+ ],
151
+ "modality_keys": [
152
+ "ego_view_bg_crop_pad_res256_freq20"
153
+ ],
154
+ "sin_cos_embedding_keys": null,
155
+ "mean_std_embedding_keys": null,
156
+ "action_configs": null
157
+ },
158
+ "state": {
159
+ "delta_indices": [
160
+ 0
161
+ ],
162
+ "modality_keys": [
163
+ "left_arm",
164
+ "right_arm",
165
+ "left_hand",
166
+ "right_hand",
167
+ "waist"
168
+ ],
169
+ "sin_cos_embedding_keys": [
170
+ "left_arm",
171
+ "right_arm",
172
+ "left_hand",
173
+ "right_hand",
174
+ "waist"
175
+ ],
176
+ "mean_std_embedding_keys": null,
177
+ "action_configs": null
178
+ },
179
+ "action": {
180
+ "delta_indices": [
181
+ 0,
182
+ 1,
183
+ 2,
184
+ 3,
185
+ 4,
186
+ 5,
187
+ 6,
188
+ 7,
189
+ 8,
190
+ 9,
191
+ 10,
192
+ 11,
193
+ 12,
194
+ 13,
195
+ 14,
196
+ 15
197
+ ],
198
+ "modality_keys": [
199
+ "left_arm",
200
+ "right_arm",
201
+ "left_hand",
202
+ "right_hand",
203
+ "waist"
204
+ ],
205
+ "sin_cos_embedding_keys": null,
206
+ "mean_std_embedding_keys": null,
207
+ "action_configs": [
208
+ {
209
+ "rep": "RELATIVE",
210
+ "type": "NON_EEF",
211
+ "format": "DEFAULT",
212
+ "state_key": null
213
+ },
214
+ {
215
+ "rep": "RELATIVE",
216
+ "type": "NON_EEF",
217
+ "format": "DEFAULT",
218
+ "state_key": null
219
+ },
220
+ {
221
+ "rep": "RELATIVE",
222
+ "type": "NON_EEF",
223
+ "format": "DEFAULT",
224
+ "state_key": null
225
+ },
226
+ {
227
+ "rep": "RELATIVE",
228
+ "type": "NON_EEF",
229
+ "format": "DEFAULT",
230
+ "state_key": null
231
+ },
232
+ {
233
+ "rep": "ABSOLUTE",
234
+ "type": "NON_EEF",
235
+ "format": "DEFAULT",
236
+ "state_key": null
237
+ }
238
+ ]
239
+ },
240
+ "language": {
241
+ "delta_indices": [
242
+ 0
243
+ ],
244
+ "modality_keys": [
245
+ "task"
246
+ ],
247
+ "sin_cos_embedding_keys": null,
248
+ "mean_std_embedding_keys": null,
249
+ "action_configs": null
250
+ }
251
+ },
252
+ "robocasa_panda_omron": {
253
+ "video": {
254
+ "delta_indices": [
255
+ 0
256
+ ],
257
+ "modality_keys": [
258
+ "res256_image_side_0",
259
+ "res256_image_side_1",
260
+ "res256_image_wrist_0"
261
+ ],
262
+ "sin_cos_embedding_keys": null,
263
+ "mean_std_embedding_keys": null,
264
+ "action_configs": null
265
+ },
266
+ "state": {
267
+ "delta_indices": [
268
+ 0
269
+ ],
270
+ "modality_keys": [
271
+ "end_effector_position_relative",
272
+ "end_effector_rotation_relative",
273
+ "gripper_qpos",
274
+ "base_position",
275
+ "base_rotation"
276
+ ],
277
+ "sin_cos_embedding_keys": null,
278
+ "mean_std_embedding_keys": null,
279
+ "action_configs": null
280
+ },
281
+ "action": {
282
+ "delta_indices": [
283
+ 0,
284
+ 1,
285
+ 2,
286
+ 3,
287
+ 4,
288
+ 5,
289
+ 6,
290
+ 7,
291
+ 8,
292
+ 9,
293
+ 10,
294
+ 11,
295
+ 12,
296
+ 13,
297
+ 14,
298
+ 15
299
+ ],
300
+ "modality_keys": [
301
+ "end_effector_position",
302
+ "end_effector_rotation",
303
+ "gripper_close",
304
+ "base_motion",
305
+ "control_mode"
306
+ ],
307
+ "sin_cos_embedding_keys": null,
308
+ "mean_std_embedding_keys": null,
309
+ "action_configs": [
310
+ {
311
+ "rep": "ABSOLUTE",
312
+ "type": "NON_EEF",
313
+ "format": "DEFAULT",
314
+ "state_key": null
315
+ },
316
+ {
317
+ "rep": "ABSOLUTE",
318
+ "type": "NON_EEF",
319
+ "format": "DEFAULT",
320
+ "state_key": null
321
+ },
322
+ {
323
+ "rep": "ABSOLUTE",
324
+ "type": "NON_EEF",
325
+ "format": "DEFAULT",
326
+ "state_key": null
327
+ },
328
+ {
329
+ "rep": "ABSOLUTE",
330
+ "type": "NON_EEF",
331
+ "format": "DEFAULT",
332
+ "state_key": null
333
+ },
334
+ {
335
+ "rep": "ABSOLUTE",
336
+ "type": "NON_EEF",
337
+ "format": "DEFAULT",
338
+ "state_key": null
339
+ }
340
+ ]
341
+ },
342
+ "language": {
343
+ "delta_indices": [
344
+ 0
345
+ ],
346
+ "modality_keys": [
347
+ "annotation.human.action.task_description"
348
+ ],
349
+ "sin_cos_embedding_keys": null,
350
+ "mean_std_embedding_keys": null,
351
+ "action_configs": null
352
+ }
353
+ },
354
+ "new_embodiment": {
355
+ "video": {
356
+ "delta_indices": [
357
+ 0
358
+ ],
359
+ "modality_keys": [
360
+ "ego_view"
361
+ ],
362
+ "sin_cos_embedding_keys": null,
363
+ "mean_std_embedding_keys": null,
364
+ "action_configs": null
365
+ },
366
+ "state": {
367
+ "delta_indices": [
368
+ 0
369
+ ],
370
+ "modality_keys": [
371
+ "single_arm",
372
+ "gripper"
373
+ ],
374
+ "sin_cos_embedding_keys": null,
375
+ "mean_std_embedding_keys": null,
376
+ "action_configs": null
377
+ },
378
+ "action": {
379
+ "delta_indices": [
380
+ 0,
381
+ 1,
382
+ 2,
383
+ 3,
384
+ 4,
385
+ 5,
386
+ 6,
387
+ 7,
388
+ 8,
389
+ 9,
390
+ 10,
391
+ 11,
392
+ 12,
393
+ 13,
394
+ 14,
395
+ 15
396
+ ],
397
+ "modality_keys": [
398
+ "single_arm",
399
+ "gripper"
400
+ ],
401
+ "sin_cos_embedding_keys": null,
402
+ "mean_std_embedding_keys": null,
403
+ "action_configs": [
404
+ {
405
+ "rep": "RELATIVE",
406
+ "type": "NON_EEF",
407
+ "format": "DEFAULT",
408
+ "state_key": "single_arm"
409
+ },
410
+ {
411
+ "rep": "ABSOLUTE",
412
+ "type": "NON_EEF",
413
+ "format": "DEFAULT",
414
+ "state_key": null
415
+ }
416
+ ]
417
+ },
418
+ "language": {
419
+ "delta_indices": [
420
+ 0
421
+ ],
422
+ "modality_keys": [
423
+ "annotation.human.task_description"
424
+ ],
425
+ "sin_cos_embedding_keys": null,
426
+ "mean_std_embedding_keys": null,
427
+ "action_configs": null
428
+ }
429
+ }
430
+ },
431
+ "image_crop_size": null,
432
+ "image_target_size": null,
433
+ "use_albumentations": true,
434
+ "random_rotation_angle": null,
435
+ "color_jitter_params": {
436
+ "brightness": 0.3,
437
+ "contrast": 0.4,
438
+ "saturation": 0.5,
439
+ "hue": 0.08
440
+ },
441
+ "shortest_image_edge": 256,
442
+ "crop_fraction": 0.95,
443
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
444
+ "model_type": "eagle",
445
+ "formalize_language": true,
446
+ "max_state_dim": 128,
447
+ "max_action_dim": 128,
448
+ "max_action_horizon": 50,
449
+ "use_percentiles": false,
450
+ "clip_outliers": true,
451
+ "apply_sincos_state_encoding": true,
452
+ "use_relative_action": true
453
+ }
454
+ }
checkpoint-1000/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac7313e126917431481c6bef049de740eaab7c1b848dbaeffb9fa5ab8608570f
3
+ size 14645
checkpoint-1000/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed132db8d1e2040087f464071ec9a05351dfb4fedee309abc46c9434dcbdd77c
3
+ size 1465
checkpoint-1000/statistics.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-1000/trainer_state.json ADDED
@@ -0,0 +1,634 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 0.5,
6
+ "eval_steps": 500,
7
+ "global_step": 1000,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "grad_norm": 1.7424949407577515,
14
+ "learning_rate": 9e-06,
15
+ "loss": 1.4997,
16
+ "step": 10
17
+ },
18
+ {
19
+ "grad_norm": 0.5852967500686646,
20
+ "learning_rate": 1.9e-05,
21
+ "loss": 1.3085,
22
+ "step": 20
23
+ },
24
+ {
25
+ "grad_norm": 0.9362701177597046,
26
+ "learning_rate": 2.9e-05,
27
+ "loss": 1.1792,
28
+ "step": 30
29
+ },
30
+ {
31
+ "grad_norm": 0.6769218444824219,
32
+ "learning_rate": 3.9000000000000006e-05,
33
+ "loss": 1.0609,
34
+ "step": 40
35
+ },
36
+ {
37
+ "grad_norm": 0.6926454305648804,
38
+ "learning_rate": 4.9e-05,
39
+ "loss": 1.0562,
40
+ "step": 50
41
+ },
42
+ {
43
+ "grad_norm": 0.4864855408668518,
44
+ "learning_rate": 5.9e-05,
45
+ "loss": 1.05,
46
+ "step": 60
47
+ },
48
+ {
49
+ "grad_norm": 0.390482097864151,
50
+ "learning_rate": 6.9e-05,
51
+ "loss": 1.0319,
52
+ "step": 70
53
+ },
54
+ {
55
+ "grad_norm": 0.9116744995117188,
56
+ "learning_rate": 7.900000000000001e-05,
57
+ "loss": 1.0302,
58
+ "step": 80
59
+ },
60
+ {
61
+ "grad_norm": 1.013092041015625,
62
+ "learning_rate": 8.900000000000001e-05,
63
+ "loss": 0.9882,
64
+ "step": 90
65
+ },
66
+ {
67
+ "grad_norm": 1.0793496370315552,
68
+ "learning_rate": 9.900000000000001e-05,
69
+ "loss": 0.9154,
70
+ "step": 100
71
+ },
72
+ {
73
+ "grad_norm": 1.4888230562210083,
74
+ "learning_rate": 9.999446382823013e-05,
75
+ "loss": 0.8416,
76
+ "step": 110
77
+ },
78
+ {
79
+ "grad_norm": 1.4292930364608765,
80
+ "learning_rate": 9.997532801828658e-05,
81
+ "loss": 0.6817,
82
+ "step": 120
83
+ },
84
+ {
85
+ "grad_norm": 1.4698712825775146,
86
+ "learning_rate": 9.99425294526634e-05,
87
+ "loss": 0.5077,
88
+ "step": 130
89
+ },
90
+ {
91
+ "grad_norm": 1.5290286540985107,
92
+ "learning_rate": 9.989607709816091e-05,
93
+ "loss": 0.3704,
94
+ "step": 140
95
+ },
96
+ {
97
+ "grad_norm": 1.4736027717590332,
98
+ "learning_rate": 9.983598365438902e-05,
99
+ "loss": 0.2458,
100
+ "step": 150
101
+ },
102
+ {
103
+ "grad_norm": 1.1587175130844116,
104
+ "learning_rate": 9.976226555029522e-05,
105
+ "loss": 0.1803,
106
+ "step": 160
107
+ },
108
+ {
109
+ "grad_norm": 0.9846270680427551,
110
+ "learning_rate": 9.967494293967312e-05,
111
+ "loss": 0.1529,
112
+ "step": 170
113
+ },
114
+ {
115
+ "grad_norm": 0.8785351514816284,
116
+ "learning_rate": 9.95740396956525e-05,
117
+ "loss": 0.1356,
118
+ "step": 180
119
+ },
120
+ {
121
+ "grad_norm": 0.8878108859062195,
122
+ "learning_rate": 9.945958340417283e-05,
123
+ "loss": 0.1103,
124
+ "step": 190
125
+ },
126
+ {
127
+ "grad_norm": 0.9868141412734985,
128
+ "learning_rate": 9.93316053564413e-05,
129
+ "loss": 0.1177,
130
+ "step": 200
131
+ },
132
+ {
133
+ "grad_norm": 1.1627991199493408,
134
+ "learning_rate": 9.919014054037836e-05,
135
+ "loss": 0.1098,
136
+ "step": 210
137
+ },
138
+ {
139
+ "grad_norm": 0.7567640542984009,
140
+ "learning_rate": 9.903522763105218e-05,
141
+ "loss": 0.1034,
142
+ "step": 220
143
+ },
144
+ {
145
+ "grad_norm": 0.9812158942222595,
146
+ "learning_rate": 9.886690898010535e-05,
147
+ "loss": 0.0935,
148
+ "step": 230
149
+ },
150
+ {
151
+ "grad_norm": 0.736114501953125,
152
+ "learning_rate": 9.868523060417646e-05,
153
+ "loss": 0.0918,
154
+ "step": 240
155
+ },
156
+ {
157
+ "grad_norm": 0.668365478515625,
158
+ "learning_rate": 9.849024217231935e-05,
159
+ "loss": 0.0828,
160
+ "step": 250
161
+ },
162
+ {
163
+ "grad_norm": 0.6348236799240112,
164
+ "learning_rate": 9.82819969924244e-05,
165
+ "loss": 0.0848,
166
+ "step": 260
167
+ },
168
+ {
169
+ "grad_norm": 0.8186867237091064,
170
+ "learning_rate": 9.806055199664446e-05,
171
+ "loss": 0.0976,
172
+ "step": 270
173
+ },
174
+ {
175
+ "grad_norm": 0.974027693271637,
176
+ "learning_rate": 9.782596772583026e-05,
177
+ "loss": 0.0761,
178
+ "step": 280
179
+ },
180
+ {
181
+ "grad_norm": 0.7111085057258606,
182
+ "learning_rate": 9.757830831297914e-05,
183
+ "loss": 0.0979,
184
+ "step": 290
185
+ },
186
+ {
187
+ "grad_norm": 0.9077074527740479,
188
+ "learning_rate": 9.731764146570173e-05,
189
+ "loss": 0.0787,
190
+ "step": 300
191
+ },
192
+ {
193
+ "grad_norm": 0.5821448564529419,
194
+ "learning_rate": 9.704403844771128e-05,
195
+ "loss": 0.0838,
196
+ "step": 310
197
+ },
198
+ {
199
+ "grad_norm": 0.5775296092033386,
200
+ "learning_rate": 9.675757405934103e-05,
201
+ "loss": 0.0623,
202
+ "step": 320
203
+ },
204
+ {
205
+ "grad_norm": 0.6049805879592896,
206
+ "learning_rate": 9.645832661709444e-05,
207
+ "loss": 0.0636,
208
+ "step": 330
209
+ },
210
+ {
211
+ "grad_norm": 0.45737943053245544,
212
+ "learning_rate": 9.614637793223425e-05,
213
+ "loss": 0.0626,
214
+ "step": 340
215
+ },
216
+ {
217
+ "grad_norm": 0.4611263871192932,
218
+ "learning_rate": 9.582181328841611e-05,
219
+ "loss": 0.0582,
220
+ "step": 350
221
+ },
222
+ {
223
+ "grad_norm": 0.6837406158447266,
224
+ "learning_rate": 9.548472141837286e-05,
225
+ "loss": 0.0638,
226
+ "step": 360
227
+ },
228
+ {
229
+ "grad_norm": 0.6089468002319336,
230
+ "learning_rate": 9.513519447965595e-05,
231
+ "loss": 0.0581,
232
+ "step": 370
233
+ },
234
+ {
235
+ "grad_norm": 0.585154116153717,
236
+ "learning_rate": 9.477332802944044e-05,
237
+ "loss": 0.0552,
238
+ "step": 380
239
+ },
240
+ {
241
+ "grad_norm": 0.5016727447509766,
242
+ "learning_rate": 9.439922099840054e-05,
243
+ "loss": 0.0581,
244
+ "step": 390
245
+ },
246
+ {
247
+ "grad_norm": 0.569975733757019,
248
+ "learning_rate": 9.401297566366318e-05,
249
+ "loss": 0.0594,
250
+ "step": 400
251
+ },
252
+ {
253
+ "grad_norm": 0.6577298641204834,
254
+ "learning_rate": 9.36146976208462e-05,
255
+ "loss": 0.0624,
256
+ "step": 410
257
+ },
258
+ {
259
+ "grad_norm": 0.7007710933685303,
260
+ "learning_rate": 9.320449575518972e-05,
261
+ "loss": 0.0583,
262
+ "step": 420
263
+ },
264
+ {
265
+ "grad_norm": 0.47701025009155273,
266
+ "learning_rate": 9.278248221178798e-05,
267
+ "loss": 0.0589,
268
+ "step": 430
269
+ },
270
+ {
271
+ "grad_norm": 0.5127101540565491,
272
+ "learning_rate": 9.234877236492997e-05,
273
+ "loss": 0.0571,
274
+ "step": 440
275
+ },
276
+ {
277
+ "grad_norm": 0.4970426559448242,
278
+ "learning_rate": 9.190348478655724e-05,
279
+ "loss": 0.0518,
280
+ "step": 450
281
+ },
282
+ {
283
+ "grad_norm": 0.42194655537605286,
284
+ "learning_rate": 9.144674121384757e-05,
285
+ "loss": 0.0572,
286
+ "step": 460
287
+ },
288
+ {
289
+ "grad_norm": 0.6780546307563782,
290
+ "learning_rate": 9.097866651593317e-05,
291
+ "loss": 0.0631,
292
+ "step": 470
293
+ },
294
+ {
295
+ "grad_norm": 0.3541775047779083,
296
+ "learning_rate": 9.049938865976275e-05,
297
+ "loss": 0.0548,
298
+ "step": 480
299
+ },
300
+ {
301
+ "grad_norm": 0.6049434542655945,
302
+ "learning_rate": 9.000903867511666e-05,
303
+ "loss": 0.0498,
304
+ "step": 490
305
+ },
306
+ {
307
+ "grad_norm": 0.45229852199554443,
308
+ "learning_rate": 8.950775061878453e-05,
309
+ "loss": 0.0496,
310
+ "step": 500
311
+ },
312
+ {
313
+ "grad_norm": 0.6024392247200012,
314
+ "learning_rate": 8.899566153791566e-05,
315
+ "loss": 0.0569,
316
+ "step": 510
317
+ },
318
+ {
319
+ "grad_norm": 0.4546999931335449,
320
+ "learning_rate": 8.84729114325516e-05,
321
+ "loss": 0.0509,
322
+ "step": 520
323
+ },
324
+ {
325
+ "grad_norm": 0.5965995788574219,
326
+ "learning_rate": 8.79396432173515e-05,
327
+ "loss": 0.0631,
328
+ "step": 530
329
+ },
330
+ {
331
+ "grad_norm": 0.5499140024185181,
332
+ "learning_rate": 8.739600268252078e-05,
333
+ "loss": 0.0493,
334
+ "step": 540
335
+ },
336
+ {
337
+ "grad_norm": 0.5246662497520447,
338
+ "learning_rate": 8.684213845395339e-05,
339
+ "loss": 0.0534,
340
+ "step": 550
341
+ },
342
+ {
343
+ "grad_norm": 0.47341179847717285,
344
+ "learning_rate": 8.627820195259918e-05,
345
+ "loss": 0.0462,
346
+ "step": 560
347
+ },
348
+ {
349
+ "grad_norm": 0.42044690251350403,
350
+ "learning_rate": 8.570434735306671e-05,
351
+ "loss": 0.0405,
352
+ "step": 570
353
+ },
354
+ {
355
+ "grad_norm": 0.5121616125106812,
356
+ "learning_rate": 8.512073154147362e-05,
357
+ "loss": 0.0478,
358
+ "step": 580
359
+ },
360
+ {
361
+ "grad_norm": 0.4845208525657654,
362
+ "learning_rate": 8.452751407255541e-05,
363
+ "loss": 0.0486,
364
+ "step": 590
365
+ },
366
+ {
367
+ "grad_norm": 0.3478183150291443,
368
+ "learning_rate": 8.392485712604483e-05,
369
+ "loss": 0.0568,
370
+ "step": 600
371
+ },
372
+ {
373
+ "grad_norm": 0.49295181035995483,
374
+ "learning_rate": 8.331292546233362e-05,
375
+ "loss": 0.0561,
376
+ "step": 610
377
+ },
378
+ {
379
+ "grad_norm": 0.522871732711792,
380
+ "learning_rate": 8.269188637742846e-05,
381
+ "loss": 0.0438,
382
+ "step": 620
383
+ },
384
+ {
385
+ "grad_norm": 0.45402273535728455,
386
+ "learning_rate": 8.206190965721419e-05,
387
+ "loss": 0.0354,
388
+ "step": 630
389
+ },
390
+ {
391
+ "grad_norm": 0.461839497089386,
392
+ "learning_rate": 8.14231675310358e-05,
393
+ "loss": 0.038,
394
+ "step": 640
395
+ },
396
+ {
397
+ "grad_norm": 0.47349685430526733,
398
+ "learning_rate": 8.077583462461283e-05,
399
+ "loss": 0.0414,
400
+ "step": 650
401
+ },
402
+ {
403
+ "grad_norm": 0.5613319873809814,
404
+ "learning_rate": 8.012008791229826e-05,
405
+ "loss": 0.045,
406
+ "step": 660
407
+ },
408
+ {
409
+ "grad_norm": 0.6868877410888672,
410
+ "learning_rate": 7.945610666869568e-05,
411
+ "loss": 0.0538,
412
+ "step": 670
413
+ },
414
+ {
415
+ "grad_norm": 0.5372869968414307,
416
+ "learning_rate": 7.878407241964729e-05,
417
+ "loss": 0.0458,
418
+ "step": 680
419
+ },
420
+ {
421
+ "grad_norm": 0.48658597469329834,
422
+ "learning_rate": 7.810416889260653e-05,
423
+ "loss": 0.0415,
424
+ "step": 690
425
+ },
426
+ {
427
+ "grad_norm": 0.5548452734947205,
428
+ "learning_rate": 7.741658196640892e-05,
429
+ "loss": 0.0401,
430
+ "step": 700
431
+ },
432
+ {
433
+ "grad_norm": 0.6520838141441345,
434
+ "learning_rate": 7.672149962045457e-05,
435
+ "loss": 0.0542,
436
+ "step": 710
437
+ },
438
+ {
439
+ "grad_norm": 0.5273123979568481,
440
+ "learning_rate": 7.60191118833165e-05,
441
+ "loss": 0.0461,
442
+ "step": 720
443
+ },
444
+ {
445
+ "grad_norm": 0.45993274450302124,
446
+ "learning_rate": 7.530961078078873e-05,
447
+ "loss": 0.0445,
448
+ "step": 730
449
+ },
450
+ {
451
+ "grad_norm": 0.3632051646709442,
452
+ "learning_rate": 7.45931902833884e-05,
453
+ "loss": 0.031,
454
+ "step": 740
455
+ },
456
+ {
457
+ "grad_norm": 0.3503791093826294,
458
+ "learning_rate": 7.387004625332608e-05,
459
+ "loss": 0.0362,
460
+ "step": 750
461
+ },
462
+ {
463
+ "grad_norm": 0.4252007305622101,
464
+ "learning_rate": 7.3140376390959e-05,
465
+ "loss": 0.0306,
466
+ "step": 760
467
+ },
468
+ {
469
+ "grad_norm": 0.5684967637062073,
470
+ "learning_rate": 7.240438018074189e-05,
471
+ "loss": 0.0343,
472
+ "step": 770
473
+ },
474
+ {
475
+ "grad_norm": 0.5697133541107178,
476
+ "learning_rate": 7.166225883668969e-05,
477
+ "loss": 0.0404,
478
+ "step": 780
479
+ },
480
+ {
481
+ "grad_norm": 0.6125141978263855,
482
+ "learning_rate": 7.091421524736784e-05,
483
+ "loss": 0.0393,
484
+ "step": 790
485
+ },
486
+ {
487
+ "grad_norm": 0.4313353896141052,
488
+ "learning_rate": 7.016045392042452e-05,
489
+ "loss": 0.041,
490
+ "step": 800
491
+ },
492
+ {
493
+ "grad_norm": 0.41094619035720825,
494
+ "learning_rate": 6.940118092668022e-05,
495
+ "loss": 0.0475,
496
+ "step": 810
497
+ },
498
+ {
499
+ "grad_norm": 0.3212681710720062,
500
+ "learning_rate": 6.863660384379017e-05,
501
+ "loss": 0.0388,
502
+ "step": 820
503
+ },
504
+ {
505
+ "grad_norm": 0.5655945539474487,
506
+ "learning_rate": 6.786693169949455e-05,
507
+ "loss": 0.04,
508
+ "step": 830
509
+ },
510
+ {
511
+ "grad_norm": 0.44820529222488403,
512
+ "learning_rate": 6.709237491447249e-05,
513
+ "loss": 0.0374,
514
+ "step": 840
515
+ },
516
+ {
517
+ "grad_norm": 0.43709850311279297,
518
+ "learning_rate": 6.631314524481513e-05,
519
+ "loss": 0.049,
520
+ "step": 850
521
+ },
522
+ {
523
+ "grad_norm": 0.5083968043327332,
524
+ "learning_rate": 6.552945572413358e-05,
525
+ "loss": 0.0436,
526
+ "step": 860
527
+ },
528
+ {
529
+ "grad_norm": 0.3737967610359192,
530
+ "learning_rate": 6.474152060531768e-05,
531
+ "loss": 0.0374,
532
+ "step": 870
533
+ },
534
+ {
535
+ "grad_norm": 0.4421429932117462,
536
+ "learning_rate": 6.394955530196147e-05,
537
+ "loss": 0.0293,
538
+ "step": 880
539
+ },
540
+ {
541
+ "grad_norm": 0.44184306263923645,
542
+ "learning_rate": 6.315377632947115e-05,
543
+ "loss": 0.0307,
544
+ "step": 890
545
+ },
546
+ {
547
+ "grad_norm": 0.45122212171554565,
548
+ "learning_rate": 6.235440124587198e-05,
549
+ "loss": 0.0417,
550
+ "step": 900
551
+ },
552
+ {
553
+ "grad_norm": 0.43313905596733093,
554
+ "learning_rate": 6.155164859233012e-05,
555
+ "loss": 0.0281,
556
+ "step": 910
557
+ },
558
+ {
559
+ "grad_norm": 0.31750547885894775,
560
+ "learning_rate": 6.074573783340562e-05,
561
+ "loss": 0.0328,
562
+ "step": 920
563
+ },
564
+ {
565
+ "grad_norm": 0.39470431208610535,
566
+ "learning_rate": 5.9936889297052986e-05,
567
+ "loss": 0.0286,
568
+ "step": 930
569
+ },
570
+ {
571
+ "grad_norm": 0.4038713872432709,
572
+ "learning_rate": 5.912532411438576e-05,
573
+ "loss": 0.0279,
574
+ "step": 940
575
+ },
576
+ {
577
+ "grad_norm": 0.5246008038520813,
578
+ "learning_rate": 5.831126415922148e-05,
579
+ "loss": 0.0389,
580
+ "step": 950
581
+ },
582
+ {
583
+ "grad_norm": 0.5796319842338562,
584
+ "learning_rate": 5.74949319874235e-05,
585
+ "loss": 0.0269,
586
+ "step": 960
587
+ },
588
+ {
589
+ "grad_norm": 0.442847341299057,
590
+ "learning_rate": 5.667655077605659e-05,
591
+ "loss": 0.0285,
592
+ "step": 970
593
+ },
594
+ {
595
+ "grad_norm": 0.5783978700637817,
596
+ "learning_rate": 5.585634426237246e-05,
597
+ "loss": 0.0347,
598
+ "step": 980
599
+ },
600
+ {
601
+ "grad_norm": 0.673740804195404,
602
+ "learning_rate": 5.5034536682642224e-05,
603
+ "loss": 0.037,
604
+ "step": 990
605
+ },
606
+ {
607
+ "grad_norm": 0.4028751850128174,
608
+ "learning_rate": 5.4211352710852495e-05,
609
+ "loss": 0.0359,
610
+ "step": 1000
611
+ }
612
+ ],
613
+ "logging_steps": 10,
614
+ "max_steps": 2000,
615
+ "num_input_tokens_seen": 0,
616
+ "num_train_epochs": 9223372036854775807,
617
+ "save_steps": 500,
618
+ "stateful_callbacks": {
619
+ "TrainerControl": {
620
+ "args": {
621
+ "should_epoch_stop": false,
622
+ "should_evaluate": false,
623
+ "should_log": false,
624
+ "should_save": true,
625
+ "should_training_stop": false
626
+ },
627
+ "attributes": {}
628
+ }
629
+ },
630
+ "total_flos": 0.0,
631
+ "train_batch_size": 32,
632
+ "trial_name": null,
633
+ "trial_params": null
634
+ }
checkpoint-1000/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8721c3d4c4fb62e1b3a5942bcac338cc99c78ef7dfcb870774c274d6e7efc55
3
+ size 5777
checkpoint-1000/wandb_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"project": "finetune-gr00t-n1d6", "run_id": "gr00t_franka_finetune"}
checkpoint-1500/config.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_horizon": 50,
3
+ "add_pos_embed": true,
4
+ "apply_sincos_state_encoding": true,
5
+ "architectures": [
6
+ "Gr00tN1d6"
7
+ ],
8
+ "attn_dropout": 0.2,
9
+ "attn_implementation": null,
10
+ "backbone_embedding_dim": 2048,
11
+ "backbone_model_type": "eagle",
12
+ "backbone_trainable_params_fp32": true,
13
+ "collator_overwrite_image_inputs": false,
14
+ "color_jitter_params": {
15
+ "brightness": 0.1,
16
+ "contrast": 0.1,
17
+ "hue": 0.1,
18
+ "saturation": 0.1
19
+ },
20
+ "crop_fraction": 0.95,
21
+ "diffusion_model_cfg": {
22
+ "attention_head_dim": 48,
23
+ "dropout": 0.2,
24
+ "final_dropout": true,
25
+ "interleave_self_attention": true,
26
+ "norm_type": "ada_norm",
27
+ "num_attention_heads": 32,
28
+ "num_layers": 32,
29
+ "output_dim": 1024,
30
+ "positional_embeddings": null
31
+ },
32
+ "eagle_collator": true,
33
+ "formalize_language": true,
34
+ "gemma_collator": false,
35
+ "hidden_size": 1024,
36
+ "image_crop_size": null,
37
+ "image_target_size": null,
38
+ "input_embedding_dim": 1536,
39
+ "load_bf16": true,
40
+ "max_action_dim": 128,
41
+ "max_num_embodiments": 32,
42
+ "max_seq_len": 1024,
43
+ "max_state_dim": 128,
44
+ "model_dtype": "bfloat16",
45
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
46
+ "model_type": "Gr00tN1d6",
47
+ "noise_beta_alpha": 1.5,
48
+ "noise_beta_beta": 1.0,
49
+ "noise_s": 0.999,
50
+ "num_inference_timesteps": 4,
51
+ "num_timestep_buckets": 1000,
52
+ "random_rotation_angle": null,
53
+ "reproject_vision": false,
54
+ "select_layer": 16,
55
+ "shortest_image_edge": 256,
56
+ "state_dropout_prob": 0.0,
57
+ "torch_dtype": "bfloat16",
58
+ "transformers_version": "4.51.3",
59
+ "tune_diffusion_model": true,
60
+ "tune_llm": false,
61
+ "tune_projector": true,
62
+ "tune_top_llm_layers": 4,
63
+ "tune_visual": false,
64
+ "tune_vlln": true,
65
+ "use_albumentations_transforms": true,
66
+ "use_alternate_vl_dit": true,
67
+ "use_flash_attention": true,
68
+ "use_relative_action": true,
69
+ "use_vlln": true
70
+ }
checkpoint-1500/embodiment_id.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "robocasa_panda_omron": 13,
3
+ "gr1": 20,
4
+ "behavior_r1_pro": 24,
5
+ "unitree_g1": 8,
6
+ "oxe_google": 0,
7
+ "oxe_widowx": 1,
8
+ "libero_panda": 2,
9
+ "new_embodiment": 10
10
+ }
checkpoint-1500/experiment_cfg/conf.yaml ADDED
@@ -0,0 +1,204 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ load_config_path: null
2
+ model:
3
+ model_type: Gr00tN1d6
4
+ model_dtype: bfloat16
5
+ model_name: nvidia/Eagle-Block2A-2B-v2
6
+ backbone_model_type: eagle
7
+ model_revision: null
8
+ tune_top_llm_layers: 4
9
+ backbone_embedding_dim: 2048
10
+ tune_llm: false
11
+ tune_visual: false
12
+ select_layer: 16
13
+ reproject_vision: false
14
+ use_flash_attention: true
15
+ load_bf16: false
16
+ collator_overwrite_image_inputs: false
17
+ eagle_collator: true
18
+ backbone_trainable_params_fp32: true
19
+ image_crop_size: null
20
+ image_target_size: null
21
+ shortest_image_edge: 256
22
+ crop_fraction: 0.95
23
+ random_rotation_angle: null
24
+ color_jitter_params: null
25
+ use_albumentations_transforms: true
26
+ formalize_language: true
27
+ apply_sincos_state_encoding: false
28
+ use_relative_action: true
29
+ max_state_dim: 29
30
+ max_action_dim: 29
31
+ action_horizon: 16
32
+ hidden_size: 1024
33
+ input_embedding_dim: 1536
34
+ add_pos_embed: true
35
+ attn_dropout: 0.2
36
+ use_vlln: true
37
+ max_seq_len: 1024
38
+ use_alternate_vl_dit: true
39
+ attend_text_every_n_blocks: 2
40
+ diffusion_model_cfg:
41
+ positional_embeddings: null
42
+ num_layers: 32
43
+ num_attention_heads: 32
44
+ attention_head_dim: 48
45
+ norm_type: ada_norm
46
+ dropout: 0.2
47
+ final_dropout: true
48
+ output_dim: 1024
49
+ interleave_self_attention: true
50
+ num_inference_timesteps: 4
51
+ noise_beta_alpha: 1.5
52
+ noise_beta_beta: 1.0
53
+ noise_s: 0.999
54
+ num_timestep_buckets: 1000
55
+ tune_projector: true
56
+ tune_diffusion_model: true
57
+ tune_vlln: true
58
+ state_dropout_prob: 0.0
59
+ state_additive_noise_scale: 0.0
60
+ max_num_embodiments: 32
61
+ data:
62
+ datasets:
63
+ - dataset_paths:
64
+ - /workspaces/isaaclab_arena/train_data
65
+ embodiment_tag: new_embodiment
66
+ mix_ratio: 1.0
67
+ dataset_type: physical_embodiment
68
+ val_dataset_path: null
69
+ modality_configs:
70
+ new_embodiment:
71
+ video:
72
+ delta_indices:
73
+ - 0
74
+ modality_keys:
75
+ - ego_view
76
+ sin_cos_embedding_keys: null
77
+ mean_std_embedding_keys: null
78
+ action_configs: null
79
+ state:
80
+ delta_indices:
81
+ - 0
82
+ modality_keys:
83
+ - single_arm
84
+ - gripper
85
+ sin_cos_embedding_keys: null
86
+ mean_std_embedding_keys: null
87
+ action_configs: null
88
+ action:
89
+ delta_indices:
90
+ - 0
91
+ - 1
92
+ - 2
93
+ - 3
94
+ - 4
95
+ - 5
96
+ - 6
97
+ - 7
98
+ - 8
99
+ - 9
100
+ - 10
101
+ - 11
102
+ - 12
103
+ - 13
104
+ - 14
105
+ - 15
106
+ modality_keys:
107
+ - single_arm
108
+ - gripper
109
+ sin_cos_embedding_keys: null
110
+ mean_std_embedding_keys: null
111
+ action_configs:
112
+ - rep: RELATIVE
113
+ type: NON_EEF
114
+ format: DEFAULT
115
+ state_key: single_arm
116
+ - rep: ABSOLUTE
117
+ type: NON_EEF
118
+ format: DEFAULT
119
+ state_key: null
120
+ language:
121
+ delta_indices:
122
+ - 0
123
+ modality_keys:
124
+ - annotation.human.task_description
125
+ sin_cos_embedding_keys: null
126
+ mean_std_embedding_keys: null
127
+ action_configs: null
128
+ download_cache: false
129
+ shard_size: 1024
130
+ episode_sampling_rate: 0.1
131
+ num_shards_per_epoch: 100000
132
+ override_pretraining_statistics: false
133
+ mode: single_turn
134
+ random_chop: 0.0
135
+ mock_dataset_mode: false
136
+ shuffle: true
137
+ seed: 42
138
+ multiprocessing_context: fork
139
+ allow_padding: false
140
+ subsample_ratio: 1.0
141
+ image_crop_size:
142
+ - 244
143
+ - 244
144
+ image_target_size:
145
+ - 224
146
+ - 224
147
+ video_backend: torchcodec
148
+ training:
149
+ output_dir: /home/ubuntu/.cache/gr00t_franka_finetune
150
+ experiment_name: null
151
+ max_steps: 2000
152
+ global_batch_size: 32
153
+ batch_size: null
154
+ gradient_accumulation_steps: 1
155
+ learning_rate: 0.0001
156
+ lr_scheduler_type: cosine
157
+ weight_decay: 1.0e-05
158
+ warmup_ratio: 0.05
159
+ warmup_steps: 0
160
+ max_grad_norm: 1.0
161
+ optim: adamw_torch
162
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
163
+ tf32: true
164
+ fp16: false
165
+ bf16: true
166
+ eval_bf16: true
167
+ logging_steps: 10
168
+ save_steps: 500
169
+ save_total_limit: 4
170
+ save_vl_model: false
171
+ upload_checkpoints: false
172
+ upload_every: 1000
173
+ upload_last_n_checkpoints: 5
174
+ max_concurrent_uploads: 2
175
+ eval_strategy: 'no'
176
+ eval_steps: 500
177
+ eval_set_split_ratio: 0.1
178
+ eval_batch_size: 2
179
+ save_best_eval_metric_name: ''
180
+ save_best_eval_metric_greater_is_better: true
181
+ deepspeed_stage: 2
182
+ gradient_checkpointing: false
183
+ transformers_trust_remote_code: true
184
+ transformers_local_files_only: false
185
+ transformers_cache_dir: null
186
+ transformers_access_token: null
187
+ use_ddp: false
188
+ ddp_bucket_cap_mb: 100
189
+ num_gpus: 1
190
+ dataloader_num_workers: 32
191
+ remove_unused_columns: false
192
+ use_wandb: false
193
+ wandb_project: finetune-gr00t-n1d6
194
+ enable_profiling: false
195
+ max_retries: 3
196
+ assert_loss_less_than: null
197
+ add_rl_callback: false
198
+ enable_open_loop_eval: false
199
+ open_loop_eval_traj_ids:
200
+ - 0
201
+ open_loop_eval_steps_per_traj: 100
202
+ open_loop_eval_plot_indices: null
203
+ max_steps: 2000
204
+ save_steps: 500
checkpoint-1500/experiment_cfg/config.yaml ADDED
@@ -0,0 +1,238 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:gr00t.configs.base_config.Config
2
+ data: !!python/object:gr00t.configs.data.data_config.DataConfig
3
+ allow_padding: false
4
+ datasets:
5
+ - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
6
+ dataset_paths:
7
+ - /workspaces/isaaclab_arena/train_data
8
+ dataset_type: physical_embodiment
9
+ embodiment_tag: new_embodiment
10
+ mix_ratio: 1.0
11
+ val_dataset_path: null
12
+ download_cache: false
13
+ episode_sampling_rate: 0.1
14
+ image_crop_size:
15
+ - 244
16
+ - 244
17
+ image_target_size:
18
+ - 224
19
+ - 224
20
+ mock_dataset_mode: false
21
+ modality_configs:
22
+ new_embodiment:
23
+ action: !!python/object:gr00t.data.types.ModalityConfig
24
+ action_configs:
25
+ - !!python/object:gr00t.data.types.ActionConfig
26
+ format: &id001 !!python/object/apply:gr00t.data.types.ActionFormat
27
+ - default
28
+ rep: !!python/object/apply:gr00t.data.types.ActionRepresentation
29
+ - relative
30
+ state_key: single_arm
31
+ type: &id002 !!python/object/apply:gr00t.data.types.ActionType
32
+ - non_eef
33
+ - !!python/object:gr00t.data.types.ActionConfig
34
+ format: *id001
35
+ rep: !!python/object/apply:gr00t.data.types.ActionRepresentation
36
+ - absolute
37
+ state_key: null
38
+ type: *id002
39
+ delta_indices:
40
+ - 0
41
+ - 1
42
+ - 2
43
+ - 3
44
+ - 4
45
+ - 5
46
+ - 6
47
+ - 7
48
+ - 8
49
+ - 9
50
+ - 10
51
+ - 11
52
+ - 12
53
+ - 13
54
+ - 14
55
+ - 15
56
+ mean_std_embedding_keys: null
57
+ modality_keys:
58
+ - single_arm
59
+ - gripper
60
+ sin_cos_embedding_keys: null
61
+ language: !!python/object:gr00t.data.types.ModalityConfig
62
+ action_configs: null
63
+ delta_indices:
64
+ - 0
65
+ mean_std_embedding_keys: null
66
+ modality_keys:
67
+ - annotation.human.task_description
68
+ sin_cos_embedding_keys: null
69
+ state: !!python/object:gr00t.data.types.ModalityConfig
70
+ action_configs: null
71
+ delta_indices:
72
+ - 0
73
+ mean_std_embedding_keys: null
74
+ modality_keys:
75
+ - single_arm
76
+ - gripper
77
+ sin_cos_embedding_keys: null
78
+ video: !!python/object:gr00t.data.types.ModalityConfig
79
+ action_configs: null
80
+ delta_indices:
81
+ - 0
82
+ mean_std_embedding_keys: null
83
+ modality_keys:
84
+ - ego_view
85
+ sin_cos_embedding_keys: null
86
+ mode: single_turn
87
+ multiprocessing_context: fork
88
+ num_shards_per_epoch: 100000
89
+ override_pretraining_statistics: false
90
+ random_chop: 0.0
91
+ seed: 42
92
+ shard_size: 1024
93
+ shuffle: true
94
+ subsample_ratio: 1.0
95
+ video_backend: torchcodec
96
+ load_config_path: null
97
+ model: !!python/object:gr00t.configs.model.gr00t_n1d6.Gr00tN1d6Config
98
+ _attn_implementation_autoset: false
99
+ _attn_implementation_internal: null
100
+ _commit_hash: null
101
+ _name_or_path: ''
102
+ add_cross_attention: false
103
+ architectures: null
104
+ backbone_model_type: eagle
105
+ backbone_trainable_params_fp32: true
106
+ bad_words_ids: null
107
+ begin_suppress_tokens: null
108
+ bos_token_id: null
109
+ chunk_size_feed_forward: 0
110
+ color_jitter_params: null
111
+ cross_attention_hidden_size: null
112
+ decoder_start_token_id: null
113
+ diffusion_model_cfg:
114
+ attention_head_dim: 48
115
+ dropout: 0.2
116
+ final_dropout: true
117
+ interleave_self_attention: true
118
+ norm_type: ada_norm
119
+ num_attention_heads: 32
120
+ num_layers: 32
121
+ output_dim: 1024
122
+ positional_embeddings: null
123
+ diversity_penalty: 0.0
124
+ do_sample: false
125
+ eagle_collator: true
126
+ early_stopping: false
127
+ encoder_no_repeat_ngram_size: 0
128
+ eos_token_id: null
129
+ exponential_decay_length_penalty: null
130
+ finetuning_task: null
131
+ forced_bos_token_id: null
132
+ forced_eos_token_id: null
133
+ id2label:
134
+ 0: LABEL_0
135
+ 1: LABEL_1
136
+ is_decoder: false
137
+ is_encoder_decoder: false
138
+ label2id:
139
+ LABEL_0: 0
140
+ LABEL_1: 1
141
+ length_penalty: 1.0
142
+ load_bf16: false
143
+ max_length: 20
144
+ min_length: 0
145
+ model_name: nvidia/Eagle-Block2A-2B-v2
146
+ no_repeat_ngram_size: 0
147
+ num_beam_groups: 1
148
+ num_beams: 1
149
+ num_return_sequences: 1
150
+ output_attentions: false
151
+ output_hidden_states: false
152
+ output_scores: false
153
+ pad_token_id: null
154
+ prefix: null
155
+ problem_type: null
156
+ pruned_heads: {}
157
+ random_rotation_angle: null
158
+ remove_invalid_values: false
159
+ repetition_penalty: 1.0
160
+ reproject_vision: false
161
+ return_dict: true
162
+ return_dict_in_generate: false
163
+ sep_token_id: null
164
+ state_dropout_prob: 0.0
165
+ suppress_tokens: null
166
+ task_specific_params: null
167
+ temperature: 1.0
168
+ tf_legacy_loss: false
169
+ tie_encoder_decoder: false
170
+ tie_word_embeddings: true
171
+ tokenizer_class: null
172
+ top_k: 50
173
+ top_p: 1.0
174
+ torch_dtype: null
175
+ torchscript: false
176
+ transformers_version: null
177
+ tune_diffusion_model: true
178
+ tune_llm: false
179
+ tune_projector: true
180
+ tune_visual: false
181
+ typical_p: 1.0
182
+ use_bfloat16: false
183
+ use_relative_action: true
184
+ training: !!python/object:gr00t.configs.training.training_config.TrainingConfig
185
+ add_rl_callback: false
186
+ assert_loss_less_than: null
187
+ batch_size: null
188
+ bf16: true
189
+ dataloader_num_workers: 32
190
+ ddp_bucket_cap_mb: 100
191
+ deepspeed_stage: 2
192
+ enable_open_loop_eval: false
193
+ enable_profiling: false
194
+ eval_batch_size: 2
195
+ eval_bf16: true
196
+ eval_set_split_ratio: 0.1
197
+ eval_steps: 500
198
+ eval_strategy: 'no'
199
+ experiment_name: null
200
+ fp16: false
201
+ global_batch_size: 32
202
+ gradient_accumulation_steps: 1
203
+ gradient_checkpointing: false
204
+ learning_rate: 0.0001
205
+ logging_steps: 10
206
+ lr_scheduler_type: cosine
207
+ max_concurrent_uploads: 2
208
+ max_grad_norm: 1.0
209
+ max_retries: 3
210
+ max_steps: 2000
211
+ num_gpus: 1
212
+ open_loop_eval_plot_indices: null
213
+ open_loop_eval_steps_per_traj: 100
214
+ open_loop_eval_traj_ids:
215
+ - 0
216
+ optim: adamw_torch
217
+ output_dir: /home/ubuntu/.cache/gr00t_franka_finetune
218
+ remove_unused_columns: false
219
+ save_best_eval_metric_greater_is_better: true
220
+ save_best_eval_metric_name: ''
221
+ save_steps: 500
222
+ save_total_limit: 4
223
+ save_vl_model: false
224
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
225
+ tf32: true
226
+ transformers_access_token: null
227
+ transformers_cache_dir: null
228
+ transformers_local_files_only: false
229
+ transformers_trust_remote_code: true
230
+ upload_checkpoints: false
231
+ upload_every: 1000
232
+ upload_last_n_checkpoints: 5
233
+ use_ddp: false
234
+ use_wandb: false
235
+ wandb_project: finetune-gr00t-n1d6
236
+ warmup_ratio: 0.05
237
+ warmup_steps: 0
238
+ weight_decay: 1.0e-05
checkpoint-1500/experiment_cfg/dataset_statistics.json ADDED
@@ -0,0 +1,1046 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "new_embodiment": {
3
+ "state": {
4
+ "single_arm": {
5
+ "min": [
6
+ -0.1016506552696228,
7
+ -0.1761876344680786,
8
+ -0.054869189858436584,
9
+ -1.4101576805114746,
10
+ -0.38218289613723755,
11
+ -0.022114872932434082,
12
+ -0.10868370532989502
13
+ ],
14
+ "max": [
15
+ 0.3447756767272949,
16
+ 1.2365270853042603,
17
+ 0.39242762327194214,
18
+ 0.2529296278953552,
19
+ 0.18470034003257751,
20
+ 2.118802309036255,
21
+ 0.8016068339347839
22
+ ],
23
+ "mean": [
24
+ 0.042614661157131195,
25
+ 0.4292725920677185,
26
+ 0.10685384273529053,
27
+ -0.8481684923171997,
28
+ -0.004952127579599619,
29
+ 1.2715188264846802,
30
+ 0.14739659428596497
31
+ ],
32
+ "std": [
33
+ 0.08599156141281128,
34
+ 0.38931092619895935,
35
+ 0.08684167265892029,
36
+ 0.41639015078544617,
37
+ 0.09905096888542175,
38
+ 0.639055073261261,
39
+ 0.20859868824481964
40
+ ],
41
+ "q01": [
42
+ -0.08698830261826515,
43
+ -0.16300016283988952,
44
+ -0.031826803982257845,
45
+ -1.3965834760665894,
46
+ -0.33692867517471314,
47
+ -0.005149464607238769,
48
+ -0.0991782522201538
49
+ ],
50
+ "q99": [
51
+ 0.3135400813817978,
52
+ 1.2095760893821716,
53
+ 0.3296026331186294,
54
+ 0.09940535783767694,
55
+ 0.177163989841938,
56
+ 2.111123719215393,
57
+ 0.7685691952705384
58
+ ]
59
+ },
60
+ "gripper": {
61
+ "min": [
62
+ -0.016243789345026016,
63
+ -0.017369966953992844
64
+ ],
65
+ "max": [
66
+ 0.0,
67
+ 0.0
68
+ ],
69
+ "mean": [
70
+ -0.0054468195885419846,
71
+ -0.005668346770107746
72
+ ],
73
+ "std": [
74
+ 0.007502974011003971,
75
+ 0.007808898109942675
76
+ ],
77
+ "q01": [
78
+ -0.01618218619376421,
79
+ -0.01736501693725586
80
+ ],
81
+ "q99": [
82
+ 0.0,
83
+ 0.0
84
+ ]
85
+ }
86
+ },
87
+ "action": {
88
+ "single_arm": {
89
+ "min": [
90
+ -0.029919808730483055,
91
+ -0.030760474503040314,
92
+ -0.03454569727182388,
93
+ -0.023138338699936867,
94
+ -0.0294453464448452,
95
+ -0.04707210883498192,
96
+ 0.0
97
+ ],
98
+ "max": [
99
+ 0.04578776657581329,
100
+ 0.03417271375656128,
101
+ 0.032364509999752045,
102
+ 0.012034625746309757,
103
+ 0.08025076240301132,
104
+ 0.04756892845034599,
105
+ 0.03999999910593033
106
+ ],
107
+ "mean": [
108
+ 0.013533495366573334,
109
+ 0.007476440165191889,
110
+ -0.01020827516913414,
111
+ -0.00018720414664130658,
112
+ 0.00028234944329597056,
113
+ -5.855086783412844e-05,
114
+ 0.026392336934804916
115
+ ],
116
+ "std": [
117
+ 0.012855037115514278,
118
+ 0.012551924213767052,
119
+ 0.017873870208859444,
120
+ 0.0029166981112211943,
121
+ 0.005159514490514994,
122
+ 0.004970518872141838,
123
+ 0.01895107515156269
124
+ ],
125
+ "q01": [
126
+ -0.005514774760231375,
127
+ -0.024535775482654572,
128
+ -0.030423654653131963,
129
+ -0.008391074724495412,
130
+ -0.01150766346603632,
131
+ -0.015753980539739133,
132
+ 0.0
133
+ ],
134
+ "q99": [
135
+ 0.03146043732762337,
136
+ 0.02946644090116024,
137
+ 0.028492353856563568,
138
+ 0.006190066309645771,
139
+ 0.01955891106277704,
140
+ 0.016726106889545896,
141
+ 0.03999999910593033
142
+ ]
143
+ },
144
+ "gripper": {
145
+ "min": [
146
+ 0.0
147
+ ],
148
+ "max": [
149
+ 0.03999999910593033
150
+ ],
151
+ "mean": [
152
+ 0.026392336934804916
153
+ ],
154
+ "std": [
155
+ 0.01895107515156269
156
+ ],
157
+ "q01": [
158
+ 0.0
159
+ ],
160
+ "q99": [
161
+ 0.03999999910593033
162
+ ]
163
+ }
164
+ },
165
+ "relative_action": {
166
+ "single_arm": {
167
+ "min": [
168
+ [
169
+ -0.32329919934272766,
170
+ -1.1854932308197021,
171
+ -0.39748504757881165,
172
+ -0.25286412239074707,
173
+ -0.18570305407047272,
174
+ -2.121999979019165,
175
+ -0.7839499115943909
176
+ ],
177
+ [
178
+ -0.32189974188804626,
179
+ -1.1826070547103882,
180
+ -0.39696475863456726,
181
+ -0.2544684112071991,
182
+ -0.18530802428722382,
183
+ -2.1222615242004395,
184
+ -0.7839499115943909
185
+ ],
186
+ [
187
+ -0.32321855425834656,
188
+ -1.1859318017959595,
189
+ -0.39636000990867615,
190
+ -0.2523682117462158,
191
+ -0.18859536945819855,
192
+ -2.1214780807495117,
193
+ -0.7839499115943909
194
+ ],
195
+ [
196
+ -0.3242166042327881,
197
+ -1.181753158569336,
198
+ -0.3955015242099762,
199
+ -0.2530977129936218,
200
+ -0.18825502693653107,
201
+ -2.1224093437194824,
202
+ -0.7839499115943909
203
+ ],
204
+ [
205
+ -0.3244396150112152,
206
+ -1.1838017702102661,
207
+ -0.3950645923614502,
208
+ -0.24863530695438385,
209
+ -0.18772920966148376,
210
+ -2.1221938133239746,
211
+ -0.7839499115943909
212
+ ],
213
+ [
214
+ -0.3249604403972626,
215
+ -1.1851550340652466,
216
+ -0.3945443034172058,
217
+ -0.2545105218887329,
218
+ -0.19080020487308502,
219
+ -2.12245512008667,
220
+ -0.7839499115943909
221
+ ],
222
+ [
223
+ -0.3240599036216736,
224
+ -1.2094337940216064,
225
+ -0.3939395546913147,
226
+ -0.2524451017379761,
227
+ -0.19165967404842377,
228
+ -2.1216351985931396,
229
+ -0.7839499115943909
230
+ ],
231
+ [
232
+ -0.3237849175930023,
233
+ -1.2061353921890259,
234
+ -0.39335793256759644,
235
+ -0.25646376609802246,
236
+ -0.19124479591846466,
237
+ -2.12142276763916,
238
+ -0.7839499115943909
239
+ ],
240
+ [
241
+ -0.32624951004981995,
242
+ -1.2092955112457275,
243
+ -0.3938826322555542,
244
+ -0.25647443532943726,
245
+ -0.19049783051013947,
246
+ -2.1221275329589844,
247
+ -0.7839499115943909
248
+ ],
249
+ [
250
+ -0.32307595014572144,
251
+ -1.205997109413147,
252
+ -0.39394718408584595,
253
+ -0.257379949092865,
254
+ -0.1888638287782669,
255
+ -2.1217713356018066,
256
+ -0.7839499115943909
257
+ ],
258
+ [
259
+ -0.3202081322669983,
260
+ -1.20602285861969,
261
+ -0.39648687839508057,
262
+ -0.2556869089603424,
263
+ -0.18957450985908508,
264
+ -2.1215648651123047,
265
+ -0.7801104187965393
266
+ ],
267
+ [
268
+ -0.32303914427757263,
269
+ -1.2070811986923218,
270
+ -0.39701157808303833,
271
+ -0.2523868978023529,
272
+ -0.1896384060382843,
273
+ -2.1222102642059326,
274
+ -0.7777257561683655
275
+ ],
276
+ [
277
+ -0.3236537277698517,
278
+ -1.20821213722229,
279
+ -0.3970761299133301,
280
+ -0.25582969188690186,
281
+ -0.18970085680484772,
282
+ -2.1212406158447266,
283
+ -0.774041473865509
284
+ ],
285
+ [
286
+ -0.32262563705444336,
287
+ -1.20747709274292,
288
+ -0.39746999740600586,
289
+ -0.2536396086215973,
290
+ -0.18984927237033844,
291
+ -2.1219756603240967,
292
+ -0.7704301476478577
293
+ ],
294
+ [
295
+ -0.32665905356407166,
296
+ -1.2074377536773682,
297
+ -0.3977932929992676,
298
+ -0.2506418526172638,
299
+ -0.1900315284729004,
300
+ -2.121697187423706,
301
+ -0.7680240273475647
302
+ ],
303
+ [
304
+ -0.3236996829509735,
305
+ -1.2079046964645386,
306
+ -0.3978058695793152,
307
+ -0.2523408532142639,
308
+ -0.19020666182041168,
309
+ -2.1220388412475586,
310
+ -0.765728771686554
311
+ ]
312
+ ],
313
+ "max": [
314
+ [
315
+ 0.12719863653182983,
316
+ 0.18446235358715057,
317
+ 0.06538978964090347,
318
+ 1.4123303890228271,
319
+ 0.36543214321136475,
320
+ 0.055936314165592194,
321
+ 0.1482430398464203
322
+ ],
323
+ [
324
+ 0.12787628173828125,
325
+ 0.18225406110286713,
326
+ 0.0630723312497139,
327
+ 1.4122768640518188,
328
+ 0.3634565770626068,
329
+ 0.05312386155128479,
330
+ 0.14398613572120667
331
+ ],
332
+ [
333
+ 0.12855961918830872,
334
+ 0.18054865300655365,
335
+ 0.060906484723091125,
336
+ 1.4116393327713013,
337
+ 0.3660118877887726,
338
+ 0.052048832178115845,
339
+ 0.14211878180503845
340
+ ],
341
+ [
342
+ 0.12901031970977783,
343
+ 0.17937372624874115,
344
+ 0.05962555110454559,
345
+ 1.412109613418579,
346
+ 0.3632301688194275,
347
+ 0.05115959048271179,
348
+ 0.14021214842796326
349
+ ],
350
+ [
351
+ 0.12952828407287598,
352
+ 0.1794057935476303,
353
+ 0.06009196117520332,
354
+ 1.4119149446487427,
355
+ 0.36106500029563904,
356
+ 0.05047079920768738,
357
+ 0.13852760195732117
358
+ ],
359
+ [
360
+ 0.12882810831069946,
361
+ 0.17998431622982025,
362
+ 0.06065024808049202,
363
+ 1.4128142595291138,
364
+ 0.3649647831916809,
365
+ 0.050107747316360474,
366
+ 0.13429853320121765
367
+ ],
368
+ [
369
+ 0.12831519544124603,
370
+ 0.17946301400661469,
371
+ 0.06099287047982216,
372
+ 1.4133707284927368,
373
+ 0.36815109848976135,
374
+ 0.04975596070289612,
375
+ 0.1339406669139862
376
+ ],
377
+ [
378
+ 0.12905743718147278,
379
+ 0.1786593645811081,
380
+ 0.06112520769238472,
381
+ 1.4141303300857544,
382
+ 0.3652087152004242,
383
+ 0.04841601476073265,
384
+ 0.1322639286518097
385
+ ],
386
+ [
387
+ 0.1297350823879242,
388
+ 0.1776067465543747,
389
+ 0.0573953241109848,
390
+ 1.4146143198013306,
391
+ 0.3671979606151581,
392
+ 0.04757409915328026,
393
+ 0.13022002577781677
394
+ ],
395
+ [
396
+ 0.13041843473911285,
397
+ 0.17776383459568024,
398
+ 0.05858777463436127,
399
+ 1.4145153760910034,
400
+ 0.36353617906570435,
401
+ 0.045672591775655746,
402
+ 0.12888506054878235
403
+ ],
404
+ [
405
+ 0.13086912035942078,
406
+ 0.17834235727787018,
407
+ 0.05983245372772217,
408
+ 1.4148727655410767,
409
+ 0.36363980174064636,
410
+ 0.04265117272734642,
411
+ 0.1267530620098114
412
+ ],
413
+ [
414
+ 0.13138708472251892,
415
+ 0.17829257249832153,
416
+ 0.06080028414726257,
417
+ 1.4132124185562134,
418
+ 0.36463645100593567,
419
+ 0.04230935871601105,
420
+ 0.12515506148338318
421
+ ],
422
+ [
423
+ 0.1306869238615036,
424
+ 0.17859286069869995,
425
+ 0.06156755983829498,
426
+ 1.4115465879440308,
427
+ 0.36609867215156555,
428
+ 0.041467443108558655,
429
+ 0.12416491657495499
430
+ ],
431
+ [
432
+ 0.12939347326755524,
433
+ 0.1791713833808899,
434
+ 0.06212584674358368,
435
+ 1.4120947122573853,
436
+ 0.36583268642425537,
437
+ 0.03956593573093414,
438
+ 0.12115160375833511
439
+ ],
440
+ [
441
+ 0.12968552112579346,
442
+ 0.17865008115768433,
443
+ 0.06246846914291382,
444
+ 1.4127825498580933,
445
+ 0.36217090487480164,
446
+ 0.04159165173768997,
447
+ 0.11784551292657852
448
+ ],
449
+ [
450
+ 0.12998661398887634,
451
+ 0.17784643173217773,
452
+ 0.06260080635547638,
453
+ 1.4135223627090454,
454
+ 0.361840158700943,
455
+ 0.040185101330280304,
456
+ 0.11627308279275894
457
+ ]
458
+ ],
459
+ "mean": [
460
+ [
461
+ -0.021064985543489456,
462
+ -0.39792153239250183,
463
+ -0.11181046068668365,
464
+ 0.8605598211288452,
465
+ -0.0025237626396119595,
466
+ -1.2637412548065186,
467
+ -0.10358496010303497
468
+ ],
469
+ [
470
+ -0.02104770392179489,
471
+ -0.3978676497936249,
472
+ -0.11182692646980286,
473
+ 0.8605672717094421,
474
+ -0.002523584757000208,
475
+ -1.2637417316436768,
476
+ -0.10367059707641602
477
+ ],
478
+ [
479
+ -0.021030250936746597,
480
+ -0.397811621427536,
481
+ -0.11184262484312057,
482
+ 0.8605707287788391,
483
+ -0.0025277354288846254,
484
+ -1.2637302875518799,
485
+ -0.10375623404979706
486
+ ],
487
+ [
488
+ -0.02101544663310051,
489
+ -0.39775529503822327,
490
+ -0.11185839772224426,
491
+ 0.8605775833129883,
492
+ -0.002535233274102211,
493
+ -1.2637287378311157,
494
+ -0.10384184867143631
495
+ ],
496
+ [
497
+ -0.021001672372221947,
498
+ -0.39770010113716125,
499
+ -0.11185967922210693,
500
+ 0.8605857491493225,
501
+ -0.0025436626747250557,
502
+ -1.2637271881103516,
503
+ -0.10392745584249496
504
+ ],
505
+ [
506
+ -0.02098824642598629,
507
+ -0.3976578712463379,
508
+ -0.11185971647500992,
509
+ 0.8605918884277344,
510
+ -0.0025569903664290905,
511
+ -1.2637248039245605,
512
+ -0.10401306301355362
513
+ ],
514
+ [
515
+ -0.020976334810256958,
516
+ -0.39763131737709045,
517
+ -0.11186240613460541,
518
+ 0.8606000542640686,
519
+ -0.0025741278659552336,
520
+ -1.26372230052948,
521
+ -0.10409871488809586
522
+ ],
523
+ [
524
+ -0.020982732996344566,
525
+ -0.3976297378540039,
526
+ -0.11186536401510239,
527
+ 0.8606085777282715,
528
+ -0.0025887791998684406,
529
+ -1.2637240886688232,
530
+ -0.1041843369603157
531
+ ],
532
+ [
533
+ -0.020988795906305313,
534
+ -0.397623211145401,
535
+ -0.11186520755290985,
536
+ 0.8606117963790894,
537
+ -0.0025999434292316437,
538
+ -1.2637230157852173,
539
+ -0.10424429178237915
540
+ ],
541
+ [
542
+ -0.020994234830141068,
543
+ -0.3976192772388458,
544
+ -0.11186467111110687,
545
+ 0.8606191873550415,
546
+ -0.002612028270959854,
547
+ -1.2637211084365845,
548
+ -0.10427426546812057
549
+ ],
550
+ [
551
+ -0.020999347791075706,
552
+ -0.3976156413555145,
553
+ -0.11186596006155014,
554
+ 0.8606262803077698,
555
+ -0.0026231720112264156,
556
+ -1.2637207508087158,
557
+ -0.10427425056695938
558
+ ],
559
+ [
560
+ -0.021002445369958878,
561
+ -0.3976096510887146,
562
+ -0.11186514049768448,
563
+ 0.860630214214325,
564
+ -0.002635682700201869,
565
+ -1.2637168169021606,
566
+ -0.10427428781986237
567
+ ],
568
+ [
569
+ -0.021011201664805412,
570
+ -0.39761000871658325,
571
+ -0.11186651140451431,
572
+ 0.860638439655304,
573
+ -0.002646006178110838,
574
+ -1.2637174129486084,
575
+ -0.10427427291870117
576
+ ],
577
+ [
578
+ -0.021014675498008728,
579
+ -0.39760351181030273,
580
+ -0.11186712980270386,
581
+ 0.8606441617012024,
582
+ -0.002654573880136013,
583
+ -1.2637194395065308,
584
+ -0.10427426546812057
585
+ ],
586
+ [
587
+ -0.021040834486484528,
588
+ -0.3976028859615326,
589
+ -0.11186829954385757,
590
+ 0.8606491088867188,
591
+ -0.002666682470589876,
592
+ -1.2637138366699219,
593
+ -0.10427425056695938
594
+ ],
595
+ [
596
+ -0.02106592431664467,
597
+ -0.39760419726371765,
598
+ -0.11186770349740982,
599
+ 0.8606574535369873,
600
+ -0.002680801786482334,
601
+ -1.2637156248092651,
602
+ -0.10427422821521759
603
+ ]
604
+ ],
605
+ "std": [
606
+ [
607
+ 0.07862132787704468,
608
+ 0.36472052335739136,
609
+ 0.07953183352947235,
610
+ 0.41708749532699585,
611
+ 0.08953142166137695,
612
+ 0.6474994421005249,
613
+ 0.2003270834684372
614
+ ],
615
+ [
616
+ 0.07865532487630844,
617
+ 0.36466875672340393,
618
+ 0.07954908907413483,
619
+ 0.4170789122581482,
620
+ 0.08954057842493057,
621
+ 0.6475056409835815,
622
+ 0.20027098059654236
623
+ ],
624
+ [
625
+ 0.07868577539920807,
626
+ 0.36461395025253296,
627
+ 0.07956718653440475,
628
+ 0.41706907749176025,
629
+ 0.08954384922981262,
630
+ 0.6475113034248352,
631
+ 0.20021489262580872
632
+ ],
633
+ [
634
+ 0.07872062176465988,
635
+ 0.3645585775375366,
636
+ 0.07958472520112991,
637
+ 0.41705429553985596,
638
+ 0.08954395353794098,
639
+ 0.6475160717964172,
640
+ 0.2001601606607437
641
+ ],
642
+ [
643
+ 0.07875548303127289,
644
+ 0.3645066022872925,
645
+ 0.07957513630390167,
646
+ 0.4170401096343994,
647
+ 0.08954435586929321,
648
+ 0.6475217342376709,
649
+ 0.2001052349805832
650
+ ],
651
+ [
652
+ 0.07878728210926056,
653
+ 0.36448603868484497,
654
+ 0.07956283539533615,
655
+ 0.4170234501361847,
656
+ 0.08953587710857391,
657
+ 0.6475263237953186,
658
+ 0.2000516802072525
659
+ ],
660
+ [
661
+ 0.07882208377122879,
662
+ 0.36450454592704773,
663
+ 0.07955189794301987,
664
+ 0.41700881719589233,
665
+ 0.08952254056930542,
666
+ 0.647530734539032,
667
+ 0.19999809563159943
668
+ ],
669
+ [
670
+ 0.07889280468225479,
671
+ 0.3645552396774292,
672
+ 0.07954024523496628,
673
+ 0.4169907867908478,
674
+ 0.08951205015182495,
675
+ 0.6475338339805603,
676
+ 0.19994452595710754
677
+ ],
678
+ [
679
+ 0.07896006852388382,
680
+ 0.3646087050437927,
681
+ 0.07952792197465897,
682
+ 0.4169798195362091,
683
+ 0.08950342237949371,
684
+ 0.6475362181663513,
685
+ 0.19982454180717468
686
+ ],
687
+ [
688
+ 0.07902492582798004,
689
+ 0.36466050148010254,
690
+ 0.07951349020004272,
691
+ 0.4169654846191406,
692
+ 0.08949856460094452,
693
+ 0.6475402116775513,
694
+ 0.19963733851909637
695
+ ],
696
+ [
697
+ 0.0790853276848793,
698
+ 0.36471861600875854,
699
+ 0.07950460910797119,
700
+ 0.4169500768184662,
701
+ 0.08949100971221924,
702
+ 0.6475431323051453,
703
+ 0.19935448467731476
704
+ ],
705
+ [
706
+ 0.0791463851928711,
707
+ 0.3647766411304474,
708
+ 0.07949627935886383,
709
+ 0.4169394075870514,
710
+ 0.08948377519845963,
711
+ 0.6475453972816467,
712
+ 0.19907325506210327
713
+ ],
714
+ [
715
+ 0.07920938730239868,
716
+ 0.36483389139175415,
717
+ 0.07948218286037445,
718
+ 0.4169244170188904,
719
+ 0.08947892487049103,
720
+ 0.6475448608398438,
721
+ 0.19879388809204102
722
+ ],
723
+ [
724
+ 0.0792689323425293,
725
+ 0.3648894131183624,
726
+ 0.07947037369012833,
727
+ 0.41691312193870544,
728
+ 0.08947526663541794,
729
+ 0.6475451588630676,
730
+ 0.19851621985435486
731
+ ],
732
+ [
733
+ 0.07932519167661667,
734
+ 0.3649515211582184,
735
+ 0.07945462316274643,
736
+ 0.4169033467769623,
737
+ 0.08946864306926727,
738
+ 0.6475487947463989,
739
+ 0.19824036955833435
740
+ ],
741
+ [
742
+ 0.07937267422676086,
743
+ 0.36501482129096985,
744
+ 0.07943546772003174,
745
+ 0.41688644886016846,
746
+ 0.08945988863706589,
747
+ 0.6475464701652527,
748
+ 0.19796623289585114
749
+ ]
750
+ ],
751
+ "q01": [
752
+ [
753
+ -0.2686644893884659,
754
+ -1.1166756582260131,
755
+ -0.3249503219127655,
756
+ -0.10763738259673118,
757
+ -0.17754718899726868,
758
+ -2.11095911026001,
759
+ -0.726121768951416
760
+ ],
761
+ [
762
+ -0.2715908128023148,
763
+ -1.1176964545249939,
764
+ -0.3246971207857132,
765
+ -0.10447386264801026,
766
+ -0.17755473166704178,
767
+ -2.111039023399353,
768
+ -0.726121768951416
769
+ ],
770
+ [
771
+ -0.2721079695224762,
772
+ -1.1183462095260621,
773
+ -0.32473934948444366,
774
+ -0.10659581780433655,
775
+ -0.17748151123523712,
776
+ -2.1109159421920776,
777
+ -0.726121768951416
778
+ ],
779
+ [
780
+ -0.2719108146429062,
781
+ -1.1183584260940551,
782
+ -0.3249865293502808,
783
+ -0.10559523880481719,
784
+ -0.17776453107595444,
785
+ -2.1114220952987672,
786
+ -0.726121768951416
787
+ ],
788
+ [
789
+ -0.27478108763694764,
790
+ -1.1184560322761536,
791
+ -0.32442001819610594,
792
+ -0.10662905514240265,
793
+ -0.17751205533742906,
794
+ -2.111326847076416,
795
+ -0.726121768951416
796
+ ],
797
+ [
798
+ -0.27461387276649474,
799
+ -1.1171478915214539,
800
+ -0.32468852162361145,
801
+ -0.10610488697886467,
802
+ -0.17753057986497878,
803
+ -2.1112320852279662,
804
+ -0.726121768951416
805
+ ],
806
+ [
807
+ -0.2748466944694519,
808
+ -1.1176495385169982,
809
+ -0.3247254079580307,
810
+ -0.10539359807968139,
811
+ -0.17761774510145187,
812
+ -2.111006693840027,
813
+ -0.726121768951416
814
+ ],
815
+ [
816
+ -0.2763983929157257,
817
+ -1.1234028029441834,
818
+ -0.32481603741645815,
819
+ -0.10651438012719154,
820
+ -0.17762102216482162,
821
+ -2.110989727973938,
822
+ -0.726121768951416
823
+ ],
824
+ [
825
+ -0.27612989604473115,
826
+ -1.1322602534294128,
827
+ -0.3249142354726791,
828
+ -0.104207394272089,
829
+ -0.17753226101398467,
830
+ -2.1104533433914185,
831
+ -0.726121768951416
832
+ ],
833
+ [
834
+ -0.2772212654352188,
835
+ -1.1327979397773742,
836
+ -0.3250032651424408,
837
+ -0.10369521856307984,
838
+ -0.1775078284740448,
839
+ -2.110794858932495,
840
+ -0.726121768951416
841
+ ],
842
+ [
843
+ -0.27782695055007933,
844
+ -1.1329670572280883,
845
+ -0.3251311558485031,
846
+ -0.10523794278502464,
847
+ -0.17756187170743942,
848
+ -2.111419234275818,
849
+ -0.7251607692241668
850
+ ],
851
+ [
852
+ -0.2772995239496231,
853
+ -1.1324901962280274,
854
+ -0.32540663063526154,
855
+ -0.10621625065803528,
856
+ -0.17752183318138123,
857
+ -2.1106600952148438,
858
+ -0.7238819229602814
859
+ ],
860
+ [
861
+ -0.2760401529073715,
862
+ -1.131754720211029,
863
+ -0.3250221389532089,
864
+ -0.10366981148719788,
865
+ -0.17745642334222794,
866
+ -2.110166282653809,
867
+ -0.7220853567123413
868
+ ],
869
+ [
870
+ -0.27648825109004976,
871
+ -1.1315274477005004,
872
+ -0.32488527715206145,
873
+ -0.10417581394314765,
874
+ -0.17765929341316222,
875
+ -2.111174240112305,
876
+ -0.721002539396286
877
+ ],
878
+ [
879
+ -0.2767831003665924,
880
+ -1.1337191128730775,
881
+ -0.32499175250530243,
882
+ -0.10650760352611542,
883
+ -0.1782200300693512,
884
+ -2.1105369424819944,
885
+ -0.7191157519817353
886
+ ],
887
+ [
888
+ -0.2783048951625824,
889
+ -1.1336584401130676,
890
+ -0.3245078271627426,
891
+ -0.10380961641669273,
892
+ -0.17757790327072143,
893
+ -2.1105402278900147,
894
+ -0.717497273683548
895
+ ]
896
+ ],
897
+ "q99": [
898
+ [
899
+ 0.10997488573193549,
900
+ 0.16461794972419735,
901
+ 0.03921745248138905,
902
+ 1.39764888048172,
903
+ 0.30130664169788357,
904
+ 0.01098630111664532,
905
+ 0.1122507885098457
906
+ ],
907
+ [
908
+ 0.11004416078329086,
909
+ 0.1643620255589485,
910
+ 0.03903082057833671,
911
+ 1.398072485923767,
912
+ 0.3018379479646683,
913
+ 0.010057139471173268,
914
+ 0.11005336791276932
915
+ ],
916
+ [
917
+ 0.11012477055191992,
918
+ 0.16386553168296814,
919
+ 0.038735973685979835,
920
+ 1.3967380928993225,
921
+ 0.30213871598243713,
922
+ 0.010799065530300123,
923
+ 0.10891361147165297
924
+ ],
925
+ [
926
+ 0.1099956126511097,
927
+ 0.16371061593294142,
928
+ 0.03824721999466418,
929
+ 1.3970967960357665,
930
+ 0.302277557849884,
931
+ 0.011137769222259486,
932
+ 0.10836461812257767
933
+ ],
934
+ [
935
+ 0.11023993626236915,
936
+ 0.1633686304092407,
937
+ 0.03792811810970305,
938
+ 1.3972763657569884,
939
+ 0.3007064414024353,
940
+ 0.010738395974039987,
941
+ 0.10781787663698195
942
+ ],
943
+ [
944
+ 0.11034056857228279,
945
+ 0.16381058037281035,
946
+ 0.03771789923310276,
947
+ 1.3969033169746399,
948
+ 0.3010092568397521,
949
+ 0.010312179420143333,
950
+ 0.1074419716000557
951
+ ],
952
+ [
953
+ 0.11034261405467986,
954
+ 0.1636140125989914,
955
+ 0.03730809785425661,
956
+ 1.3973512649536133,
957
+ 0.3012144303321838,
958
+ 0.009373838771134584,
959
+ 0.10661112785339355
960
+ ],
961
+ [
962
+ 0.11037104874849318,
963
+ 0.16361432492733002,
964
+ 0.03730310291051864,
965
+ 1.397199330329895,
966
+ 0.30146020889282227,
967
+ 0.009104850329458668,
968
+ 0.10594455733895301
969
+ ],
970
+ [
971
+ 0.11031954407691955,
972
+ 0.16329921871423722,
973
+ 0.037490070536732666,
974
+ 1.3971175789833068,
975
+ 0.30101816475391385,
976
+ 0.007780624665319918,
977
+ 0.10561806678771973
978
+ ],
979
+ [
980
+ 0.11039042010903358,
981
+ 0.16369332671165465,
982
+ 0.036998328715562794,
983
+ 1.3964923930168152,
984
+ 0.3020000964403152,
985
+ 0.007503410866484006,
986
+ 0.10535383358597755
987
+ ],
988
+ [
989
+ 0.11048222631216048,
990
+ 0.16336869567632675,
991
+ 0.03698733076453208,
992
+ 1.3960149836540223,
993
+ 0.30287389039993284,
994
+ 0.0068738124519586155,
995
+ 0.10515481844544411
996
+ ],
997
+ [
998
+ 0.11053489252924918,
999
+ 0.16354636400938033,
1000
+ 0.03707304038107395,
1001
+ 1.396628396511078,
1002
+ 0.3029059028625488,
1003
+ 0.006812876258045408,
1004
+ 0.1047084142267704
1005
+ ],
1006
+ [
1007
+ 0.11039242312312125,
1008
+ 0.16331785261631013,
1009
+ 0.03715803913772106,
1010
+ 1.3973055458068848,
1011
+ 0.30323826253414154,
1012
+ 0.006487304139882287,
1013
+ 0.10444164305925369
1014
+ ],
1015
+ [
1016
+ 0.11058814465999603,
1017
+ 0.16320075422525404,
1018
+ 0.0372002275288105,
1019
+ 1.3976932382583618,
1020
+ 0.30252904832363126,
1021
+ 0.005770333949476429,
1022
+ 0.10420910120010375
1023
+ ],
1024
+ [
1025
+ 0.11048216462135314,
1026
+ 0.1634601667523384,
1027
+ 0.0368946287035942,
1028
+ 1.396862666606903,
1029
+ 0.3012196272611618,
1030
+ 0.006188006103038769,
1031
+ 0.10407691970467567
1032
+ ],
1033
+ [
1034
+ 0.11032852262258529,
1035
+ 0.16324337780475617,
1036
+ 0.03683135174214838,
1037
+ 1.3966079354286194,
1038
+ 0.30130040407180775,
1039
+ 0.006021949928253876,
1040
+ 0.10380818247795105
1041
+ ]
1042
+ ]
1043
+ }
1044
+ }
1045
+ }
1046
+ }
checkpoint-1500/experiment_cfg/final_model_config.json ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "Gr00tN1d6",
3
+ "model_dtype": "bfloat16",
4
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
5
+ "backbone_model_type": "eagle",
6
+ "model_revision": null,
7
+ "tune_top_llm_layers": 4,
8
+ "backbone_embedding_dim": 2048,
9
+ "tune_llm": false,
10
+ "tune_visual": false,
11
+ "select_layer": 16,
12
+ "reproject_vision": false,
13
+ "use_flash_attention": true,
14
+ "load_bf16": true,
15
+ "collator_overwrite_image_inputs": false,
16
+ "eagle_collator": true,
17
+ "backbone_trainable_params_fp32": true,
18
+ "apply_sincos_state_encoding": true,
19
+ "use_relative_action": true,
20
+ "max_state_dim": 128,
21
+ "max_action_dim": 128,
22
+ "action_horizon": 50,
23
+ "hidden_size": 1024,
24
+ "input_embedding_dim": 1536,
25
+ "add_pos_embed": true,
26
+ "attn_dropout": 0.2,
27
+ "use_vlln": true,
28
+ "max_seq_len": 1024,
29
+ "use_alternate_vl_dit": true,
30
+ "attend_text_every_n_blocks": 2,
31
+ "diffusion_model_cfg": {
32
+ "attention_head_dim": 48,
33
+ "dropout": 0.2,
34
+ "final_dropout": true,
35
+ "interleave_self_attention": true,
36
+ "norm_type": "ada_norm",
37
+ "num_attention_heads": 32,
38
+ "num_layers": 32,
39
+ "output_dim": 1024,
40
+ "positional_embeddings": null
41
+ },
42
+ "num_inference_timesteps": 4,
43
+ "noise_beta_alpha": 1.5,
44
+ "noise_beta_beta": 1.0,
45
+ "noise_s": 0.999,
46
+ "num_timestep_buckets": 1000,
47
+ "tune_projector": true,
48
+ "tune_diffusion_model": true,
49
+ "tune_vlln": true,
50
+ "state_dropout_prob": 0.0,
51
+ "state_additive_noise_scale": 0.0,
52
+ "max_num_embodiments": 32
53
+ }
checkpoint-1500/experiment_cfg/final_processor_config.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-1500/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:797319ec80e8b31ac563fd77a28c3cf786914f82b8d3389dc4bbf5ec3b801b48
3
+ size 4990120184
checkpoint-1500/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae4f374051e14e67b4390972eafde4d422c273c8034a861bb70fc8725454c82d
3
+ size 4823190320
checkpoint-1500/model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-1500/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82d4f9690e038342ae130d3cc7dceaafd81d8db2d67fecf95aa41644a003876b
3
+ size 12960193762
checkpoint-1500/processor_config.json ADDED
@@ -0,0 +1,454 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "processor_class": "Gr00tN1d6Processor",
3
+ "processor_kwargs": {
4
+ "modality_configs": {
5
+ "behavior_r1_pro": {
6
+ "video": {
7
+ "delta_indices": [
8
+ 0
9
+ ],
10
+ "modality_keys": [
11
+ "observation.images.rgb.head_256_256",
12
+ "observation.images.rgb.left_wrist_256_256",
13
+ "observation.images.rgb.right_wrist_256_256"
14
+ ],
15
+ "sin_cos_embedding_keys": null,
16
+ "mean_std_embedding_keys": null,
17
+ "action_configs": null
18
+ },
19
+ "state": {
20
+ "delta_indices": [
21
+ 0
22
+ ],
23
+ "modality_keys": [
24
+ "robot_pos",
25
+ "robot_ori_cos",
26
+ "robot_ori_sin",
27
+ "robot_2d_ori",
28
+ "robot_2d_ori_cos",
29
+ "robot_2d_ori_sin",
30
+ "robot_lin_vel",
31
+ "robot_ang_vel",
32
+ "arm_left_qpos",
33
+ "arm_left_qpos_sin",
34
+ "arm_left_qpos_cos",
35
+ "eef_left_pos",
36
+ "eef_left_quat",
37
+ "gripper_left_qpos",
38
+ "arm_right_qpos",
39
+ "arm_right_qpos_sin",
40
+ "arm_right_qpos_cos",
41
+ "eef_right_pos",
42
+ "eef_right_quat",
43
+ "gripper_right_qpos",
44
+ "trunk_qpos"
45
+ ],
46
+ "sin_cos_embedding_keys": null,
47
+ "mean_std_embedding_keys": null,
48
+ "action_configs": null
49
+ },
50
+ "action": {
51
+ "delta_indices": [
52
+ 0,
53
+ 1,
54
+ 2,
55
+ 3,
56
+ 4,
57
+ 5,
58
+ 6,
59
+ 7,
60
+ 8,
61
+ 9,
62
+ 10,
63
+ 11,
64
+ 12,
65
+ 13,
66
+ 14,
67
+ 15,
68
+ 16,
69
+ 17,
70
+ 18,
71
+ 19,
72
+ 20,
73
+ 21,
74
+ 22,
75
+ 23,
76
+ 24,
77
+ 25,
78
+ 26,
79
+ 27,
80
+ 28,
81
+ 29,
82
+ 30,
83
+ 31
84
+ ],
85
+ "modality_keys": [
86
+ "base",
87
+ "torso",
88
+ "left_arm",
89
+ "left_gripper",
90
+ "right_arm",
91
+ "right_gripper"
92
+ ],
93
+ "sin_cos_embedding_keys": null,
94
+ "mean_std_embedding_keys": null,
95
+ "action_configs": [
96
+ {
97
+ "rep": "ABSOLUTE",
98
+ "type": "NON_EEF",
99
+ "format": "DEFAULT",
100
+ "state_key": null
101
+ },
102
+ {
103
+ "rep": "RELATIVE",
104
+ "type": "NON_EEF",
105
+ "format": "DEFAULT",
106
+ "state_key": "trunk_qpos"
107
+ },
108
+ {
109
+ "rep": "RELATIVE",
110
+ "type": "NON_EEF",
111
+ "format": "DEFAULT",
112
+ "state_key": "arm_left_qpos"
113
+ },
114
+ {
115
+ "rep": "ABSOLUTE",
116
+ "type": "NON_EEF",
117
+ "format": "DEFAULT",
118
+ "state_key": null
119
+ },
120
+ {
121
+ "rep": "RELATIVE",
122
+ "type": "NON_EEF",
123
+ "format": "DEFAULT",
124
+ "state_key": "arm_right_qpos"
125
+ },
126
+ {
127
+ "rep": "ABSOLUTE",
128
+ "type": "NON_EEF",
129
+ "format": "DEFAULT",
130
+ "state_key": null
131
+ }
132
+ ]
133
+ },
134
+ "language": {
135
+ "delta_indices": [
136
+ 0
137
+ ],
138
+ "modality_keys": [
139
+ "annotation.human.coarse_action"
140
+ ],
141
+ "sin_cos_embedding_keys": null,
142
+ "mean_std_embedding_keys": null,
143
+ "action_configs": null
144
+ }
145
+ },
146
+ "gr1": {
147
+ "video": {
148
+ "delta_indices": [
149
+ 0
150
+ ],
151
+ "modality_keys": [
152
+ "ego_view_bg_crop_pad_res256_freq20"
153
+ ],
154
+ "sin_cos_embedding_keys": null,
155
+ "mean_std_embedding_keys": null,
156
+ "action_configs": null
157
+ },
158
+ "state": {
159
+ "delta_indices": [
160
+ 0
161
+ ],
162
+ "modality_keys": [
163
+ "left_arm",
164
+ "right_arm",
165
+ "left_hand",
166
+ "right_hand",
167
+ "waist"
168
+ ],
169
+ "sin_cos_embedding_keys": [
170
+ "left_arm",
171
+ "right_arm",
172
+ "left_hand",
173
+ "right_hand",
174
+ "waist"
175
+ ],
176
+ "mean_std_embedding_keys": null,
177
+ "action_configs": null
178
+ },
179
+ "action": {
180
+ "delta_indices": [
181
+ 0,
182
+ 1,
183
+ 2,
184
+ 3,
185
+ 4,
186
+ 5,
187
+ 6,
188
+ 7,
189
+ 8,
190
+ 9,
191
+ 10,
192
+ 11,
193
+ 12,
194
+ 13,
195
+ 14,
196
+ 15
197
+ ],
198
+ "modality_keys": [
199
+ "left_arm",
200
+ "right_arm",
201
+ "left_hand",
202
+ "right_hand",
203
+ "waist"
204
+ ],
205
+ "sin_cos_embedding_keys": null,
206
+ "mean_std_embedding_keys": null,
207
+ "action_configs": [
208
+ {
209
+ "rep": "RELATIVE",
210
+ "type": "NON_EEF",
211
+ "format": "DEFAULT",
212
+ "state_key": null
213
+ },
214
+ {
215
+ "rep": "RELATIVE",
216
+ "type": "NON_EEF",
217
+ "format": "DEFAULT",
218
+ "state_key": null
219
+ },
220
+ {
221
+ "rep": "RELATIVE",
222
+ "type": "NON_EEF",
223
+ "format": "DEFAULT",
224
+ "state_key": null
225
+ },
226
+ {
227
+ "rep": "RELATIVE",
228
+ "type": "NON_EEF",
229
+ "format": "DEFAULT",
230
+ "state_key": null
231
+ },
232
+ {
233
+ "rep": "ABSOLUTE",
234
+ "type": "NON_EEF",
235
+ "format": "DEFAULT",
236
+ "state_key": null
237
+ }
238
+ ]
239
+ },
240
+ "language": {
241
+ "delta_indices": [
242
+ 0
243
+ ],
244
+ "modality_keys": [
245
+ "task"
246
+ ],
247
+ "sin_cos_embedding_keys": null,
248
+ "mean_std_embedding_keys": null,
249
+ "action_configs": null
250
+ }
251
+ },
252
+ "robocasa_panda_omron": {
253
+ "video": {
254
+ "delta_indices": [
255
+ 0
256
+ ],
257
+ "modality_keys": [
258
+ "res256_image_side_0",
259
+ "res256_image_side_1",
260
+ "res256_image_wrist_0"
261
+ ],
262
+ "sin_cos_embedding_keys": null,
263
+ "mean_std_embedding_keys": null,
264
+ "action_configs": null
265
+ },
266
+ "state": {
267
+ "delta_indices": [
268
+ 0
269
+ ],
270
+ "modality_keys": [
271
+ "end_effector_position_relative",
272
+ "end_effector_rotation_relative",
273
+ "gripper_qpos",
274
+ "base_position",
275
+ "base_rotation"
276
+ ],
277
+ "sin_cos_embedding_keys": null,
278
+ "mean_std_embedding_keys": null,
279
+ "action_configs": null
280
+ },
281
+ "action": {
282
+ "delta_indices": [
283
+ 0,
284
+ 1,
285
+ 2,
286
+ 3,
287
+ 4,
288
+ 5,
289
+ 6,
290
+ 7,
291
+ 8,
292
+ 9,
293
+ 10,
294
+ 11,
295
+ 12,
296
+ 13,
297
+ 14,
298
+ 15
299
+ ],
300
+ "modality_keys": [
301
+ "end_effector_position",
302
+ "end_effector_rotation",
303
+ "gripper_close",
304
+ "base_motion",
305
+ "control_mode"
306
+ ],
307
+ "sin_cos_embedding_keys": null,
308
+ "mean_std_embedding_keys": null,
309
+ "action_configs": [
310
+ {
311
+ "rep": "ABSOLUTE",
312
+ "type": "NON_EEF",
313
+ "format": "DEFAULT",
314
+ "state_key": null
315
+ },
316
+ {
317
+ "rep": "ABSOLUTE",
318
+ "type": "NON_EEF",
319
+ "format": "DEFAULT",
320
+ "state_key": null
321
+ },
322
+ {
323
+ "rep": "ABSOLUTE",
324
+ "type": "NON_EEF",
325
+ "format": "DEFAULT",
326
+ "state_key": null
327
+ },
328
+ {
329
+ "rep": "ABSOLUTE",
330
+ "type": "NON_EEF",
331
+ "format": "DEFAULT",
332
+ "state_key": null
333
+ },
334
+ {
335
+ "rep": "ABSOLUTE",
336
+ "type": "NON_EEF",
337
+ "format": "DEFAULT",
338
+ "state_key": null
339
+ }
340
+ ]
341
+ },
342
+ "language": {
343
+ "delta_indices": [
344
+ 0
345
+ ],
346
+ "modality_keys": [
347
+ "annotation.human.action.task_description"
348
+ ],
349
+ "sin_cos_embedding_keys": null,
350
+ "mean_std_embedding_keys": null,
351
+ "action_configs": null
352
+ }
353
+ },
354
+ "new_embodiment": {
355
+ "video": {
356
+ "delta_indices": [
357
+ 0
358
+ ],
359
+ "modality_keys": [
360
+ "ego_view"
361
+ ],
362
+ "sin_cos_embedding_keys": null,
363
+ "mean_std_embedding_keys": null,
364
+ "action_configs": null
365
+ },
366
+ "state": {
367
+ "delta_indices": [
368
+ 0
369
+ ],
370
+ "modality_keys": [
371
+ "single_arm",
372
+ "gripper"
373
+ ],
374
+ "sin_cos_embedding_keys": null,
375
+ "mean_std_embedding_keys": null,
376
+ "action_configs": null
377
+ },
378
+ "action": {
379
+ "delta_indices": [
380
+ 0,
381
+ 1,
382
+ 2,
383
+ 3,
384
+ 4,
385
+ 5,
386
+ 6,
387
+ 7,
388
+ 8,
389
+ 9,
390
+ 10,
391
+ 11,
392
+ 12,
393
+ 13,
394
+ 14,
395
+ 15
396
+ ],
397
+ "modality_keys": [
398
+ "single_arm",
399
+ "gripper"
400
+ ],
401
+ "sin_cos_embedding_keys": null,
402
+ "mean_std_embedding_keys": null,
403
+ "action_configs": [
404
+ {
405
+ "rep": "RELATIVE",
406
+ "type": "NON_EEF",
407
+ "format": "DEFAULT",
408
+ "state_key": "single_arm"
409
+ },
410
+ {
411
+ "rep": "ABSOLUTE",
412
+ "type": "NON_EEF",
413
+ "format": "DEFAULT",
414
+ "state_key": null
415
+ }
416
+ ]
417
+ },
418
+ "language": {
419
+ "delta_indices": [
420
+ 0
421
+ ],
422
+ "modality_keys": [
423
+ "annotation.human.task_description"
424
+ ],
425
+ "sin_cos_embedding_keys": null,
426
+ "mean_std_embedding_keys": null,
427
+ "action_configs": null
428
+ }
429
+ }
430
+ },
431
+ "image_crop_size": null,
432
+ "image_target_size": null,
433
+ "use_albumentations": true,
434
+ "random_rotation_angle": null,
435
+ "color_jitter_params": {
436
+ "brightness": 0.3,
437
+ "contrast": 0.4,
438
+ "saturation": 0.5,
439
+ "hue": 0.08
440
+ },
441
+ "shortest_image_edge": 256,
442
+ "crop_fraction": 0.95,
443
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
444
+ "model_type": "eagle",
445
+ "formalize_language": true,
446
+ "max_state_dim": 128,
447
+ "max_action_dim": 128,
448
+ "max_action_horizon": 50,
449
+ "use_percentiles": false,
450
+ "clip_outliers": true,
451
+ "apply_sincos_state_encoding": true,
452
+ "use_relative_action": true
453
+ }
454
+ }
checkpoint-1500/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de961030f70571a51def24d15c8812bbf105571c3610a2faeffb44cf60d1f842
3
+ size 14645
checkpoint-1500/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80e5cea2b8c16ba7f8e8cb5acd351607e70c71051544e5400a084679f5f66141
3
+ size 1465
checkpoint-1500/statistics.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-1500/trainer_state.json ADDED
@@ -0,0 +1,934 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 0.75,
6
+ "eval_steps": 500,
7
+ "global_step": 1500,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "grad_norm": 1.7424949407577515,
14
+ "learning_rate": 9e-06,
15
+ "loss": 1.4997,
16
+ "step": 10
17
+ },
18
+ {
19
+ "grad_norm": 0.5852967500686646,
20
+ "learning_rate": 1.9e-05,
21
+ "loss": 1.3085,
22
+ "step": 20
23
+ },
24
+ {
25
+ "grad_norm": 0.9362701177597046,
26
+ "learning_rate": 2.9e-05,
27
+ "loss": 1.1792,
28
+ "step": 30
29
+ },
30
+ {
31
+ "grad_norm": 0.6769218444824219,
32
+ "learning_rate": 3.9000000000000006e-05,
33
+ "loss": 1.0609,
34
+ "step": 40
35
+ },
36
+ {
37
+ "grad_norm": 0.6926454305648804,
38
+ "learning_rate": 4.9e-05,
39
+ "loss": 1.0562,
40
+ "step": 50
41
+ },
42
+ {
43
+ "grad_norm": 0.4864855408668518,
44
+ "learning_rate": 5.9e-05,
45
+ "loss": 1.05,
46
+ "step": 60
47
+ },
48
+ {
49
+ "grad_norm": 0.390482097864151,
50
+ "learning_rate": 6.9e-05,
51
+ "loss": 1.0319,
52
+ "step": 70
53
+ },
54
+ {
55
+ "grad_norm": 0.9116744995117188,
56
+ "learning_rate": 7.900000000000001e-05,
57
+ "loss": 1.0302,
58
+ "step": 80
59
+ },
60
+ {
61
+ "grad_norm": 1.013092041015625,
62
+ "learning_rate": 8.900000000000001e-05,
63
+ "loss": 0.9882,
64
+ "step": 90
65
+ },
66
+ {
67
+ "grad_norm": 1.0793496370315552,
68
+ "learning_rate": 9.900000000000001e-05,
69
+ "loss": 0.9154,
70
+ "step": 100
71
+ },
72
+ {
73
+ "grad_norm": 1.4888230562210083,
74
+ "learning_rate": 9.999446382823013e-05,
75
+ "loss": 0.8416,
76
+ "step": 110
77
+ },
78
+ {
79
+ "grad_norm": 1.4292930364608765,
80
+ "learning_rate": 9.997532801828658e-05,
81
+ "loss": 0.6817,
82
+ "step": 120
83
+ },
84
+ {
85
+ "grad_norm": 1.4698712825775146,
86
+ "learning_rate": 9.99425294526634e-05,
87
+ "loss": 0.5077,
88
+ "step": 130
89
+ },
90
+ {
91
+ "grad_norm": 1.5290286540985107,
92
+ "learning_rate": 9.989607709816091e-05,
93
+ "loss": 0.3704,
94
+ "step": 140
95
+ },
96
+ {
97
+ "grad_norm": 1.4736027717590332,
98
+ "learning_rate": 9.983598365438902e-05,
99
+ "loss": 0.2458,
100
+ "step": 150
101
+ },
102
+ {
103
+ "grad_norm": 1.1587175130844116,
104
+ "learning_rate": 9.976226555029522e-05,
105
+ "loss": 0.1803,
106
+ "step": 160
107
+ },
108
+ {
109
+ "grad_norm": 0.9846270680427551,
110
+ "learning_rate": 9.967494293967312e-05,
111
+ "loss": 0.1529,
112
+ "step": 170
113
+ },
114
+ {
115
+ "grad_norm": 0.8785351514816284,
116
+ "learning_rate": 9.95740396956525e-05,
117
+ "loss": 0.1356,
118
+ "step": 180
119
+ },
120
+ {
121
+ "grad_norm": 0.8878108859062195,
122
+ "learning_rate": 9.945958340417283e-05,
123
+ "loss": 0.1103,
124
+ "step": 190
125
+ },
126
+ {
127
+ "grad_norm": 0.9868141412734985,
128
+ "learning_rate": 9.93316053564413e-05,
129
+ "loss": 0.1177,
130
+ "step": 200
131
+ },
132
+ {
133
+ "grad_norm": 1.1627991199493408,
134
+ "learning_rate": 9.919014054037836e-05,
135
+ "loss": 0.1098,
136
+ "step": 210
137
+ },
138
+ {
139
+ "grad_norm": 0.7567640542984009,
140
+ "learning_rate": 9.903522763105218e-05,
141
+ "loss": 0.1034,
142
+ "step": 220
143
+ },
144
+ {
145
+ "grad_norm": 0.9812158942222595,
146
+ "learning_rate": 9.886690898010535e-05,
147
+ "loss": 0.0935,
148
+ "step": 230
149
+ },
150
+ {
151
+ "grad_norm": 0.736114501953125,
152
+ "learning_rate": 9.868523060417646e-05,
153
+ "loss": 0.0918,
154
+ "step": 240
155
+ },
156
+ {
157
+ "grad_norm": 0.668365478515625,
158
+ "learning_rate": 9.849024217231935e-05,
159
+ "loss": 0.0828,
160
+ "step": 250
161
+ },
162
+ {
163
+ "grad_norm": 0.6348236799240112,
164
+ "learning_rate": 9.82819969924244e-05,
165
+ "loss": 0.0848,
166
+ "step": 260
167
+ },
168
+ {
169
+ "grad_norm": 0.8186867237091064,
170
+ "learning_rate": 9.806055199664446e-05,
171
+ "loss": 0.0976,
172
+ "step": 270
173
+ },
174
+ {
175
+ "grad_norm": 0.974027693271637,
176
+ "learning_rate": 9.782596772583026e-05,
177
+ "loss": 0.0761,
178
+ "step": 280
179
+ },
180
+ {
181
+ "grad_norm": 0.7111085057258606,
182
+ "learning_rate": 9.757830831297914e-05,
183
+ "loss": 0.0979,
184
+ "step": 290
185
+ },
186
+ {
187
+ "grad_norm": 0.9077074527740479,
188
+ "learning_rate": 9.731764146570173e-05,
189
+ "loss": 0.0787,
190
+ "step": 300
191
+ },
192
+ {
193
+ "grad_norm": 0.5821448564529419,
194
+ "learning_rate": 9.704403844771128e-05,
195
+ "loss": 0.0838,
196
+ "step": 310
197
+ },
198
+ {
199
+ "grad_norm": 0.5775296092033386,
200
+ "learning_rate": 9.675757405934103e-05,
201
+ "loss": 0.0623,
202
+ "step": 320
203
+ },
204
+ {
205
+ "grad_norm": 0.6049805879592896,
206
+ "learning_rate": 9.645832661709444e-05,
207
+ "loss": 0.0636,
208
+ "step": 330
209
+ },
210
+ {
211
+ "grad_norm": 0.45737943053245544,
212
+ "learning_rate": 9.614637793223425e-05,
213
+ "loss": 0.0626,
214
+ "step": 340
215
+ },
216
+ {
217
+ "grad_norm": 0.4611263871192932,
218
+ "learning_rate": 9.582181328841611e-05,
219
+ "loss": 0.0582,
220
+ "step": 350
221
+ },
222
+ {
223
+ "grad_norm": 0.6837406158447266,
224
+ "learning_rate": 9.548472141837286e-05,
225
+ "loss": 0.0638,
226
+ "step": 360
227
+ },
228
+ {
229
+ "grad_norm": 0.6089468002319336,
230
+ "learning_rate": 9.513519447965595e-05,
231
+ "loss": 0.0581,
232
+ "step": 370
233
+ },
234
+ {
235
+ "grad_norm": 0.585154116153717,
236
+ "learning_rate": 9.477332802944044e-05,
237
+ "loss": 0.0552,
238
+ "step": 380
239
+ },
240
+ {
241
+ "grad_norm": 0.5016727447509766,
242
+ "learning_rate": 9.439922099840054e-05,
243
+ "loss": 0.0581,
244
+ "step": 390
245
+ },
246
+ {
247
+ "grad_norm": 0.569975733757019,
248
+ "learning_rate": 9.401297566366318e-05,
249
+ "loss": 0.0594,
250
+ "step": 400
251
+ },
252
+ {
253
+ "grad_norm": 0.6577298641204834,
254
+ "learning_rate": 9.36146976208462e-05,
255
+ "loss": 0.0624,
256
+ "step": 410
257
+ },
258
+ {
259
+ "grad_norm": 0.7007710933685303,
260
+ "learning_rate": 9.320449575518972e-05,
261
+ "loss": 0.0583,
262
+ "step": 420
263
+ },
264
+ {
265
+ "grad_norm": 0.47701025009155273,
266
+ "learning_rate": 9.278248221178798e-05,
267
+ "loss": 0.0589,
268
+ "step": 430
269
+ },
270
+ {
271
+ "grad_norm": 0.5127101540565491,
272
+ "learning_rate": 9.234877236492997e-05,
273
+ "loss": 0.0571,
274
+ "step": 440
275
+ },
276
+ {
277
+ "grad_norm": 0.4970426559448242,
278
+ "learning_rate": 9.190348478655724e-05,
279
+ "loss": 0.0518,
280
+ "step": 450
281
+ },
282
+ {
283
+ "grad_norm": 0.42194655537605286,
284
+ "learning_rate": 9.144674121384757e-05,
285
+ "loss": 0.0572,
286
+ "step": 460
287
+ },
288
+ {
289
+ "grad_norm": 0.6780546307563782,
290
+ "learning_rate": 9.097866651593317e-05,
291
+ "loss": 0.0631,
292
+ "step": 470
293
+ },
294
+ {
295
+ "grad_norm": 0.3541775047779083,
296
+ "learning_rate": 9.049938865976275e-05,
297
+ "loss": 0.0548,
298
+ "step": 480
299
+ },
300
+ {
301
+ "grad_norm": 0.6049434542655945,
302
+ "learning_rate": 9.000903867511666e-05,
303
+ "loss": 0.0498,
304
+ "step": 490
305
+ },
306
+ {
307
+ "grad_norm": 0.45229852199554443,
308
+ "learning_rate": 8.950775061878453e-05,
309
+ "loss": 0.0496,
310
+ "step": 500
311
+ },
312
+ {
313
+ "grad_norm": 0.6024392247200012,
314
+ "learning_rate": 8.899566153791566e-05,
315
+ "loss": 0.0569,
316
+ "step": 510
317
+ },
318
+ {
319
+ "grad_norm": 0.4546999931335449,
320
+ "learning_rate": 8.84729114325516e-05,
321
+ "loss": 0.0509,
322
+ "step": 520
323
+ },
324
+ {
325
+ "grad_norm": 0.5965995788574219,
326
+ "learning_rate": 8.79396432173515e-05,
327
+ "loss": 0.0631,
328
+ "step": 530
329
+ },
330
+ {
331
+ "grad_norm": 0.5499140024185181,
332
+ "learning_rate": 8.739600268252078e-05,
333
+ "loss": 0.0493,
334
+ "step": 540
335
+ },
336
+ {
337
+ "grad_norm": 0.5246662497520447,
338
+ "learning_rate": 8.684213845395339e-05,
339
+ "loss": 0.0534,
340
+ "step": 550
341
+ },
342
+ {
343
+ "grad_norm": 0.47341179847717285,
344
+ "learning_rate": 8.627820195259918e-05,
345
+ "loss": 0.0462,
346
+ "step": 560
347
+ },
348
+ {
349
+ "grad_norm": 0.42044690251350403,
350
+ "learning_rate": 8.570434735306671e-05,
351
+ "loss": 0.0405,
352
+ "step": 570
353
+ },
354
+ {
355
+ "grad_norm": 0.5121616125106812,
356
+ "learning_rate": 8.512073154147362e-05,
357
+ "loss": 0.0478,
358
+ "step": 580
359
+ },
360
+ {
361
+ "grad_norm": 0.4845208525657654,
362
+ "learning_rate": 8.452751407255541e-05,
363
+ "loss": 0.0486,
364
+ "step": 590
365
+ },
366
+ {
367
+ "grad_norm": 0.3478183150291443,
368
+ "learning_rate": 8.392485712604483e-05,
369
+ "loss": 0.0568,
370
+ "step": 600
371
+ },
372
+ {
373
+ "grad_norm": 0.49295181035995483,
374
+ "learning_rate": 8.331292546233362e-05,
375
+ "loss": 0.0561,
376
+ "step": 610
377
+ },
378
+ {
379
+ "grad_norm": 0.522871732711792,
380
+ "learning_rate": 8.269188637742846e-05,
381
+ "loss": 0.0438,
382
+ "step": 620
383
+ },
384
+ {
385
+ "grad_norm": 0.45402273535728455,
386
+ "learning_rate": 8.206190965721419e-05,
387
+ "loss": 0.0354,
388
+ "step": 630
389
+ },
390
+ {
391
+ "grad_norm": 0.461839497089386,
392
+ "learning_rate": 8.14231675310358e-05,
393
+ "loss": 0.038,
394
+ "step": 640
395
+ },
396
+ {
397
+ "grad_norm": 0.47349685430526733,
398
+ "learning_rate": 8.077583462461283e-05,
399
+ "loss": 0.0414,
400
+ "step": 650
401
+ },
402
+ {
403
+ "grad_norm": 0.5613319873809814,
404
+ "learning_rate": 8.012008791229826e-05,
405
+ "loss": 0.045,
406
+ "step": 660
407
+ },
408
+ {
409
+ "grad_norm": 0.6868877410888672,
410
+ "learning_rate": 7.945610666869568e-05,
411
+ "loss": 0.0538,
412
+ "step": 670
413
+ },
414
+ {
415
+ "grad_norm": 0.5372869968414307,
416
+ "learning_rate": 7.878407241964729e-05,
417
+ "loss": 0.0458,
418
+ "step": 680
419
+ },
420
+ {
421
+ "grad_norm": 0.48658597469329834,
422
+ "learning_rate": 7.810416889260653e-05,
423
+ "loss": 0.0415,
424
+ "step": 690
425
+ },
426
+ {
427
+ "grad_norm": 0.5548452734947205,
428
+ "learning_rate": 7.741658196640892e-05,
429
+ "loss": 0.0401,
430
+ "step": 700
431
+ },
432
+ {
433
+ "grad_norm": 0.6520838141441345,
434
+ "learning_rate": 7.672149962045457e-05,
435
+ "loss": 0.0542,
436
+ "step": 710
437
+ },
438
+ {
439
+ "grad_norm": 0.5273123979568481,
440
+ "learning_rate": 7.60191118833165e-05,
441
+ "loss": 0.0461,
442
+ "step": 720
443
+ },
444
+ {
445
+ "grad_norm": 0.45993274450302124,
446
+ "learning_rate": 7.530961078078873e-05,
447
+ "loss": 0.0445,
448
+ "step": 730
449
+ },
450
+ {
451
+ "grad_norm": 0.3632051646709442,
452
+ "learning_rate": 7.45931902833884e-05,
453
+ "loss": 0.031,
454
+ "step": 740
455
+ },
456
+ {
457
+ "grad_norm": 0.3503791093826294,
458
+ "learning_rate": 7.387004625332608e-05,
459
+ "loss": 0.0362,
460
+ "step": 750
461
+ },
462
+ {
463
+ "grad_norm": 0.4252007305622101,
464
+ "learning_rate": 7.3140376390959e-05,
465
+ "loss": 0.0306,
466
+ "step": 760
467
+ },
468
+ {
469
+ "grad_norm": 0.5684967637062073,
470
+ "learning_rate": 7.240438018074189e-05,
471
+ "loss": 0.0343,
472
+ "step": 770
473
+ },
474
+ {
475
+ "grad_norm": 0.5697133541107178,
476
+ "learning_rate": 7.166225883668969e-05,
477
+ "loss": 0.0404,
478
+ "step": 780
479
+ },
480
+ {
481
+ "grad_norm": 0.6125141978263855,
482
+ "learning_rate": 7.091421524736784e-05,
483
+ "loss": 0.0393,
484
+ "step": 790
485
+ },
486
+ {
487
+ "grad_norm": 0.4313353896141052,
488
+ "learning_rate": 7.016045392042452e-05,
489
+ "loss": 0.041,
490
+ "step": 800
491
+ },
492
+ {
493
+ "grad_norm": 0.41094619035720825,
494
+ "learning_rate": 6.940118092668022e-05,
495
+ "loss": 0.0475,
496
+ "step": 810
497
+ },
498
+ {
499
+ "grad_norm": 0.3212681710720062,
500
+ "learning_rate": 6.863660384379017e-05,
501
+ "loss": 0.0388,
502
+ "step": 820
503
+ },
504
+ {
505
+ "grad_norm": 0.5655945539474487,
506
+ "learning_rate": 6.786693169949455e-05,
507
+ "loss": 0.04,
508
+ "step": 830
509
+ },
510
+ {
511
+ "grad_norm": 0.44820529222488403,
512
+ "learning_rate": 6.709237491447249e-05,
513
+ "loss": 0.0374,
514
+ "step": 840
515
+ },
516
+ {
517
+ "grad_norm": 0.43709850311279297,
518
+ "learning_rate": 6.631314524481513e-05,
519
+ "loss": 0.049,
520
+ "step": 850
521
+ },
522
+ {
523
+ "grad_norm": 0.5083968043327332,
524
+ "learning_rate": 6.552945572413358e-05,
525
+ "loss": 0.0436,
526
+ "step": 860
527
+ },
528
+ {
529
+ "grad_norm": 0.3737967610359192,
530
+ "learning_rate": 6.474152060531768e-05,
531
+ "loss": 0.0374,
532
+ "step": 870
533
+ },
534
+ {
535
+ "grad_norm": 0.4421429932117462,
536
+ "learning_rate": 6.394955530196147e-05,
537
+ "loss": 0.0293,
538
+ "step": 880
539
+ },
540
+ {
541
+ "grad_norm": 0.44184306263923645,
542
+ "learning_rate": 6.315377632947115e-05,
543
+ "loss": 0.0307,
544
+ "step": 890
545
+ },
546
+ {
547
+ "grad_norm": 0.45122212171554565,
548
+ "learning_rate": 6.235440124587198e-05,
549
+ "loss": 0.0417,
550
+ "step": 900
551
+ },
552
+ {
553
+ "grad_norm": 0.43313905596733093,
554
+ "learning_rate": 6.155164859233012e-05,
555
+ "loss": 0.0281,
556
+ "step": 910
557
+ },
558
+ {
559
+ "grad_norm": 0.31750547885894775,
560
+ "learning_rate": 6.074573783340562e-05,
561
+ "loss": 0.0328,
562
+ "step": 920
563
+ },
564
+ {
565
+ "grad_norm": 0.39470431208610535,
566
+ "learning_rate": 5.9936889297052986e-05,
567
+ "loss": 0.0286,
568
+ "step": 930
569
+ },
570
+ {
571
+ "grad_norm": 0.4038713872432709,
572
+ "learning_rate": 5.912532411438576e-05,
573
+ "loss": 0.0279,
574
+ "step": 940
575
+ },
576
+ {
577
+ "grad_norm": 0.5246008038520813,
578
+ "learning_rate": 5.831126415922148e-05,
579
+ "loss": 0.0389,
580
+ "step": 950
581
+ },
582
+ {
583
+ "grad_norm": 0.5796319842338562,
584
+ "learning_rate": 5.74949319874235e-05,
585
+ "loss": 0.0269,
586
+ "step": 960
587
+ },
588
+ {
589
+ "grad_norm": 0.442847341299057,
590
+ "learning_rate": 5.667655077605659e-05,
591
+ "loss": 0.0285,
592
+ "step": 970
593
+ },
594
+ {
595
+ "grad_norm": 0.5783978700637817,
596
+ "learning_rate": 5.585634426237246e-05,
597
+ "loss": 0.0347,
598
+ "step": 980
599
+ },
600
+ {
601
+ "grad_norm": 0.673740804195404,
602
+ "learning_rate": 5.5034536682642224e-05,
603
+ "loss": 0.037,
604
+ "step": 990
605
+ },
606
+ {
607
+ "grad_norm": 0.4028751850128174,
608
+ "learning_rate": 5.4211352710852495e-05,
609
+ "loss": 0.0359,
610
+ "step": 1000
611
+ },
612
+ {
613
+ "grad_norm": 0.35525479912757874,
614
+ "learning_rate": 5.3387017397281704e-05,
615
+ "loss": 0.0336,
616
+ "step": 1010
617
+ },
618
+ {
619
+ "grad_norm": 0.4501492381095886,
620
+ "learning_rate": 5.2561756106973656e-05,
621
+ "loss": 0.0315,
622
+ "step": 1020
623
+ },
624
+ {
625
+ "grad_norm": 0.40087419748306274,
626
+ "learning_rate": 5.1735794458124956e-05,
627
+ "loss": 0.0336,
628
+ "step": 1030
629
+ },
630
+ {
631
+ "grad_norm": 0.45209842920303345,
632
+ "learning_rate": 5.0909358260403186e-05,
633
+ "loss": 0.0307,
634
+ "step": 1040
635
+ },
636
+ {
637
+ "grad_norm": 0.3294844925403595,
638
+ "learning_rate": 5.0082673453212914e-05,
639
+ "loss": 0.0278,
640
+ "step": 1050
641
+ },
642
+ {
643
+ "grad_norm": 0.37356334924697876,
644
+ "learning_rate": 4.925596604392603e-05,
645
+ "loss": 0.0344,
646
+ "step": 1060
647
+ },
648
+ {
649
+ "grad_norm": 0.5277794599533081,
650
+ "learning_rate": 4.8429462046093585e-05,
651
+ "loss": 0.0332,
652
+ "step": 1070
653
+ },
654
+ {
655
+ "grad_norm": 0.5260717868804932,
656
+ "learning_rate": 4.7603387417656026e-05,
657
+ "loss": 0.0328,
658
+ "step": 1080
659
+ },
660
+ {
661
+ "grad_norm": 0.3290504217147827,
662
+ "learning_rate": 4.677796799916845e-05,
663
+ "loss": 0.0246,
664
+ "step": 1090
665
+ },
666
+ {
667
+ "grad_norm": 0.2661372721195221,
668
+ "learning_rate": 4.5953429452058135e-05,
669
+ "loss": 0.032,
670
+ "step": 1100
671
+ },
672
+ {
673
+ "grad_norm": 0.30993494391441345,
674
+ "learning_rate": 4.5129997196930845e-05,
675
+ "loss": 0.0318,
676
+ "step": 1110
677
+ },
678
+ {
679
+ "grad_norm": 0.49708715081214905,
680
+ "learning_rate": 4.430789635194324e-05,
681
+ "loss": 0.0307,
682
+ "step": 1120
683
+ },
684
+ {
685
+ "grad_norm": 0.34312236309051514,
686
+ "learning_rate": 4.348735167125771e-05,
687
+ "loss": 0.0333,
688
+ "step": 1130
689
+ },
690
+ {
691
+ "grad_norm": 0.3901269733905792,
692
+ "learning_rate": 4.2668587483596864e-05,
693
+ "loss": 0.0328,
694
+ "step": 1140
695
+ },
696
+ {
697
+ "grad_norm": 0.3739551901817322,
698
+ "learning_rate": 4.1851827630914305e-05,
699
+ "loss": 0.0272,
700
+ "step": 1150
701
+ },
702
+ {
703
+ "grad_norm": 0.36706796288490295,
704
+ "learning_rate": 4.103729540719847e-05,
705
+ "loss": 0.0277,
706
+ "step": 1160
707
+ },
708
+ {
709
+ "grad_norm": 0.3322960138320923,
710
+ "learning_rate": 4.0225213497426276e-05,
711
+ "loss": 0.0236,
712
+ "step": 1170
713
+ },
714
+ {
715
+ "grad_norm": 0.26609674096107483,
716
+ "learning_rate": 3.9415803916683224e-05,
717
+ "loss": 0.0265,
718
+ "step": 1180
719
+ },
720
+ {
721
+ "grad_norm": 0.44145846366882324,
722
+ "learning_rate": 3.860928794946682e-05,
723
+ "loss": 0.0256,
724
+ "step": 1190
725
+ },
726
+ {
727
+ "grad_norm": 0.29344606399536133,
728
+ "learning_rate": 3.780588608918947e-05,
729
+ "loss": 0.0275,
730
+ "step": 1200
731
+ },
732
+ {
733
+ "grad_norm": 0.3439117968082428,
734
+ "learning_rate": 3.700581797789786e-05,
735
+ "loss": 0.0295,
736
+ "step": 1210
737
+ },
738
+ {
739
+ "grad_norm": 0.41021284461021423,
740
+ "learning_rate": 3.6209302346225006e-05,
741
+ "loss": 0.0234,
742
+ "step": 1220
743
+ },
744
+ {
745
+ "grad_norm": 0.2943209707736969,
746
+ "learning_rate": 3.541655695359142e-05,
747
+ "loss": 0.0276,
748
+ "step": 1230
749
+ },
750
+ {
751
+ "grad_norm": 0.36791661381721497,
752
+ "learning_rate": 3.462779852867197e-05,
753
+ "loss": 0.0233,
754
+ "step": 1240
755
+ },
756
+ {
757
+ "grad_norm": 0.4398164749145508,
758
+ "learning_rate": 3.384324271014429e-05,
759
+ "loss": 0.0298,
760
+ "step": 1250
761
+ },
762
+ {
763
+ "grad_norm": 0.48210081458091736,
764
+ "learning_rate": 3.3063103987735433e-05,
765
+ "loss": 0.0227,
766
+ "step": 1260
767
+ },
768
+ {
769
+ "grad_norm": 0.33244040608406067,
770
+ "learning_rate": 3.228759564358248e-05,
771
+ "loss": 0.0273,
772
+ "step": 1270
773
+ },
774
+ {
775
+ "grad_norm": 0.47357818484306335,
776
+ "learning_rate": 3.1516929693923315e-05,
777
+ "loss": 0.0243,
778
+ "step": 1280
779
+ },
780
+ {
781
+ "grad_norm": 0.36431384086608887,
782
+ "learning_rate": 3.075131683113352e-05,
783
+ "loss": 0.0271,
784
+ "step": 1290
785
+ },
786
+ {
787
+ "grad_norm": 0.34549668431282043,
788
+ "learning_rate": 2.999096636612518e-05,
789
+ "loss": 0.0262,
790
+ "step": 1300
791
+ },
792
+ {
793
+ "grad_norm": 0.2728613615036011,
794
+ "learning_rate": 2.9236086171123404e-05,
795
+ "loss": 0.0224,
796
+ "step": 1310
797
+ },
798
+ {
799
+ "grad_norm": 0.37844163179397583,
800
+ "learning_rate": 2.8486882622836026e-05,
801
+ "loss": 0.0252,
802
+ "step": 1320
803
+ },
804
+ {
805
+ "grad_norm": 0.2981228530406952,
806
+ "learning_rate": 2.774356054603243e-05,
807
+ "loss": 0.0205,
808
+ "step": 1330
809
+ },
810
+ {
811
+ "grad_norm": 0.37120452523231506,
812
+ "learning_rate": 2.7006323157546386e-05,
813
+ "loss": 0.0249,
814
+ "step": 1340
815
+ },
816
+ {
817
+ "grad_norm": 0.41909462213516235,
818
+ "learning_rate": 2.6275372010718635e-05,
819
+ "loss": 0.021,
820
+ "step": 1350
821
+ },
822
+ {
823
+ "grad_norm": 0.4190634489059448,
824
+ "learning_rate": 2.555090694029421e-05,
825
+ "loss": 0.0239,
826
+ "step": 1360
827
+ },
828
+ {
829
+ "grad_norm": 0.42239516973495483,
830
+ "learning_rate": 2.4833126007789653e-05,
831
+ "loss": 0.0208,
832
+ "step": 1370
833
+ },
834
+ {
835
+ "grad_norm": 0.2549847364425659,
836
+ "learning_rate": 2.4122225447344875e-05,
837
+ "loss": 0.022,
838
+ "step": 1380
839
+ },
840
+ {
841
+ "grad_norm": 0.25902891159057617,
842
+ "learning_rate": 2.341839961207482e-05,
843
+ "loss": 0.0193,
844
+ "step": 1390
845
+ },
846
+ {
847
+ "grad_norm": 0.6364672780036926,
848
+ "learning_rate": 2.2721840920935196e-05,
849
+ "loss": 0.0245,
850
+ "step": 1400
851
+ },
852
+ {
853
+ "grad_norm": 0.2977903485298157,
854
+ "learning_rate": 2.2032739806117058e-05,
855
+ "loss": 0.0184,
856
+ "step": 1410
857
+ },
858
+ {
859
+ "grad_norm": 0.39573556184768677,
860
+ "learning_rate": 2.1351284660984572e-05,
861
+ "loss": 0.0243,
862
+ "step": 1420
863
+ },
864
+ {
865
+ "grad_norm": 0.4302116930484772,
866
+ "learning_rate": 2.067766178857013e-05,
867
+ "loss": 0.0218,
868
+ "step": 1430
869
+ },
870
+ {
871
+ "grad_norm": 0.23667673766613007,
872
+ "learning_rate": 2.0012055350640986e-05,
873
+ "loss": 0.0207,
874
+ "step": 1440
875
+ },
876
+ {
877
+ "grad_norm": 0.2744090259075165,
878
+ "learning_rate": 1.9354647317351188e-05,
879
+ "loss": 0.0251,
880
+ "step": 1450
881
+ },
882
+ {
883
+ "grad_norm": 0.394101083278656,
884
+ "learning_rate": 1.8705617417492883e-05,
885
+ "loss": 0.0233,
886
+ "step": 1460
887
+ },
888
+ {
889
+ "grad_norm": 0.3944133222103119,
890
+ "learning_rate": 1.8065143089360172e-05,
891
+ "loss": 0.0215,
892
+ "step": 1470
893
+ },
894
+ {
895
+ "grad_norm": 0.34019017219543457,
896
+ "learning_rate": 1.743339943223926e-05,
897
+ "loss": 0.026,
898
+ "step": 1480
899
+ },
900
+ {
901
+ "grad_norm": 0.2179572582244873,
902
+ "learning_rate": 1.6810559158538092e-05,
903
+ "loss": 0.0178,
904
+ "step": 1490
905
+ },
906
+ {
907
+ "grad_norm": 0.42695897817611694,
908
+ "learning_rate": 1.6196792546568472e-05,
909
+ "loss": 0.0251,
910
+ "step": 1500
911
+ }
912
+ ],
913
+ "logging_steps": 10,
914
+ "max_steps": 2000,
915
+ "num_input_tokens_seen": 0,
916
+ "num_train_epochs": 9223372036854775807,
917
+ "save_steps": 500,
918
+ "stateful_callbacks": {
919
+ "TrainerControl": {
920
+ "args": {
921
+ "should_epoch_stop": false,
922
+ "should_evaluate": false,
923
+ "should_log": false,
924
+ "should_save": true,
925
+ "should_training_stop": false
926
+ },
927
+ "attributes": {}
928
+ }
929
+ },
930
+ "total_flos": 0.0,
931
+ "train_batch_size": 32,
932
+ "trial_name": null,
933
+ "trial_params": null
934
+ }
checkpoint-1500/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8721c3d4c4fb62e1b3a5942bcac338cc99c78ef7dfcb870774c274d6e7efc55
3
+ size 5777
checkpoint-1500/wandb_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"project": "finetune-gr00t-n1d6", "run_id": "gr00t_franka_finetune"}
checkpoint-2000/config.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_horizon": 50,
3
+ "add_pos_embed": true,
4
+ "apply_sincos_state_encoding": true,
5
+ "architectures": [
6
+ "Gr00tN1d6"
7
+ ],
8
+ "attn_dropout": 0.2,
9
+ "attn_implementation": null,
10
+ "backbone_embedding_dim": 2048,
11
+ "backbone_model_type": "eagle",
12
+ "backbone_trainable_params_fp32": true,
13
+ "collator_overwrite_image_inputs": false,
14
+ "color_jitter_params": {
15
+ "brightness": 0.1,
16
+ "contrast": 0.1,
17
+ "hue": 0.1,
18
+ "saturation": 0.1
19
+ },
20
+ "crop_fraction": 0.95,
21
+ "diffusion_model_cfg": {
22
+ "attention_head_dim": 48,
23
+ "dropout": 0.2,
24
+ "final_dropout": true,
25
+ "interleave_self_attention": true,
26
+ "norm_type": "ada_norm",
27
+ "num_attention_heads": 32,
28
+ "num_layers": 32,
29
+ "output_dim": 1024,
30
+ "positional_embeddings": null
31
+ },
32
+ "eagle_collator": true,
33
+ "formalize_language": true,
34
+ "gemma_collator": false,
35
+ "hidden_size": 1024,
36
+ "image_crop_size": null,
37
+ "image_target_size": null,
38
+ "input_embedding_dim": 1536,
39
+ "load_bf16": true,
40
+ "max_action_dim": 128,
41
+ "max_num_embodiments": 32,
42
+ "max_seq_len": 1024,
43
+ "max_state_dim": 128,
44
+ "model_dtype": "bfloat16",
45
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
46
+ "model_type": "Gr00tN1d6",
47
+ "noise_beta_alpha": 1.5,
48
+ "noise_beta_beta": 1.0,
49
+ "noise_s": 0.999,
50
+ "num_inference_timesteps": 4,
51
+ "num_timestep_buckets": 1000,
52
+ "random_rotation_angle": null,
53
+ "reproject_vision": false,
54
+ "select_layer": 16,
55
+ "shortest_image_edge": 256,
56
+ "state_dropout_prob": 0.0,
57
+ "torch_dtype": "bfloat16",
58
+ "transformers_version": "4.51.3",
59
+ "tune_diffusion_model": true,
60
+ "tune_llm": false,
61
+ "tune_projector": true,
62
+ "tune_top_llm_layers": 4,
63
+ "tune_visual": false,
64
+ "tune_vlln": true,
65
+ "use_albumentations_transforms": true,
66
+ "use_alternate_vl_dit": true,
67
+ "use_flash_attention": true,
68
+ "use_relative_action": true,
69
+ "use_vlln": true
70
+ }
checkpoint-2000/embodiment_id.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "robocasa_panda_omron": 13,
3
+ "gr1": 20,
4
+ "behavior_r1_pro": 24,
5
+ "unitree_g1": 8,
6
+ "oxe_google": 0,
7
+ "oxe_widowx": 1,
8
+ "libero_panda": 2,
9
+ "new_embodiment": 10
10
+ }
checkpoint-2000/experiment_cfg/conf.yaml ADDED
@@ -0,0 +1,204 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ load_config_path: null
2
+ model:
3
+ model_type: Gr00tN1d6
4
+ model_dtype: bfloat16
5
+ model_name: nvidia/Eagle-Block2A-2B-v2
6
+ backbone_model_type: eagle
7
+ model_revision: null
8
+ tune_top_llm_layers: 4
9
+ backbone_embedding_dim: 2048
10
+ tune_llm: false
11
+ tune_visual: false
12
+ select_layer: 16
13
+ reproject_vision: false
14
+ use_flash_attention: true
15
+ load_bf16: false
16
+ collator_overwrite_image_inputs: false
17
+ eagle_collator: true
18
+ backbone_trainable_params_fp32: true
19
+ image_crop_size: null
20
+ image_target_size: null
21
+ shortest_image_edge: 256
22
+ crop_fraction: 0.95
23
+ random_rotation_angle: null
24
+ color_jitter_params: null
25
+ use_albumentations_transforms: true
26
+ formalize_language: true
27
+ apply_sincos_state_encoding: false
28
+ use_relative_action: true
29
+ max_state_dim: 29
30
+ max_action_dim: 29
31
+ action_horizon: 16
32
+ hidden_size: 1024
33
+ input_embedding_dim: 1536
34
+ add_pos_embed: true
35
+ attn_dropout: 0.2
36
+ use_vlln: true
37
+ max_seq_len: 1024
38
+ use_alternate_vl_dit: true
39
+ attend_text_every_n_blocks: 2
40
+ diffusion_model_cfg:
41
+ positional_embeddings: null
42
+ num_layers: 32
43
+ num_attention_heads: 32
44
+ attention_head_dim: 48
45
+ norm_type: ada_norm
46
+ dropout: 0.2
47
+ final_dropout: true
48
+ output_dim: 1024
49
+ interleave_self_attention: true
50
+ num_inference_timesteps: 4
51
+ noise_beta_alpha: 1.5
52
+ noise_beta_beta: 1.0
53
+ noise_s: 0.999
54
+ num_timestep_buckets: 1000
55
+ tune_projector: true
56
+ tune_diffusion_model: true
57
+ tune_vlln: true
58
+ state_dropout_prob: 0.0
59
+ state_additive_noise_scale: 0.0
60
+ max_num_embodiments: 32
61
+ data:
62
+ datasets:
63
+ - dataset_paths:
64
+ - /workspaces/isaaclab_arena/train_data
65
+ embodiment_tag: new_embodiment
66
+ mix_ratio: 1.0
67
+ dataset_type: physical_embodiment
68
+ val_dataset_path: null
69
+ modality_configs:
70
+ new_embodiment:
71
+ video:
72
+ delta_indices:
73
+ - 0
74
+ modality_keys:
75
+ - ego_view
76
+ sin_cos_embedding_keys: null
77
+ mean_std_embedding_keys: null
78
+ action_configs: null
79
+ state:
80
+ delta_indices:
81
+ - 0
82
+ modality_keys:
83
+ - single_arm
84
+ - gripper
85
+ sin_cos_embedding_keys: null
86
+ mean_std_embedding_keys: null
87
+ action_configs: null
88
+ action:
89
+ delta_indices:
90
+ - 0
91
+ - 1
92
+ - 2
93
+ - 3
94
+ - 4
95
+ - 5
96
+ - 6
97
+ - 7
98
+ - 8
99
+ - 9
100
+ - 10
101
+ - 11
102
+ - 12
103
+ - 13
104
+ - 14
105
+ - 15
106
+ modality_keys:
107
+ - single_arm
108
+ - gripper
109
+ sin_cos_embedding_keys: null
110
+ mean_std_embedding_keys: null
111
+ action_configs:
112
+ - rep: RELATIVE
113
+ type: NON_EEF
114
+ format: DEFAULT
115
+ state_key: single_arm
116
+ - rep: ABSOLUTE
117
+ type: NON_EEF
118
+ format: DEFAULT
119
+ state_key: null
120
+ language:
121
+ delta_indices:
122
+ - 0
123
+ modality_keys:
124
+ - annotation.human.task_description
125
+ sin_cos_embedding_keys: null
126
+ mean_std_embedding_keys: null
127
+ action_configs: null
128
+ download_cache: false
129
+ shard_size: 1024
130
+ episode_sampling_rate: 0.1
131
+ num_shards_per_epoch: 100000
132
+ override_pretraining_statistics: false
133
+ mode: single_turn
134
+ random_chop: 0.0
135
+ mock_dataset_mode: false
136
+ shuffle: true
137
+ seed: 42
138
+ multiprocessing_context: fork
139
+ allow_padding: false
140
+ subsample_ratio: 1.0
141
+ image_crop_size:
142
+ - 244
143
+ - 244
144
+ image_target_size:
145
+ - 224
146
+ - 224
147
+ video_backend: torchcodec
148
+ training:
149
+ output_dir: /home/ubuntu/.cache/gr00t_franka_finetune
150
+ experiment_name: null
151
+ max_steps: 2000
152
+ global_batch_size: 32
153
+ batch_size: null
154
+ gradient_accumulation_steps: 1
155
+ learning_rate: 0.0001
156
+ lr_scheduler_type: cosine
157
+ weight_decay: 1.0e-05
158
+ warmup_ratio: 0.05
159
+ warmup_steps: 0
160
+ max_grad_norm: 1.0
161
+ optim: adamw_torch
162
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
163
+ tf32: true
164
+ fp16: false
165
+ bf16: true
166
+ eval_bf16: true
167
+ logging_steps: 10
168
+ save_steps: 500
169
+ save_total_limit: 4
170
+ save_vl_model: false
171
+ upload_checkpoints: false
172
+ upload_every: 1000
173
+ upload_last_n_checkpoints: 5
174
+ max_concurrent_uploads: 2
175
+ eval_strategy: 'no'
176
+ eval_steps: 500
177
+ eval_set_split_ratio: 0.1
178
+ eval_batch_size: 2
179
+ save_best_eval_metric_name: ''
180
+ save_best_eval_metric_greater_is_better: true
181
+ deepspeed_stage: 2
182
+ gradient_checkpointing: false
183
+ transformers_trust_remote_code: true
184
+ transformers_local_files_only: false
185
+ transformers_cache_dir: null
186
+ transformers_access_token: null
187
+ use_ddp: false
188
+ ddp_bucket_cap_mb: 100
189
+ num_gpus: 1
190
+ dataloader_num_workers: 32
191
+ remove_unused_columns: false
192
+ use_wandb: false
193
+ wandb_project: finetune-gr00t-n1d6
194
+ enable_profiling: false
195
+ max_retries: 3
196
+ assert_loss_less_than: null
197
+ add_rl_callback: false
198
+ enable_open_loop_eval: false
199
+ open_loop_eval_traj_ids:
200
+ - 0
201
+ open_loop_eval_steps_per_traj: 100
202
+ open_loop_eval_plot_indices: null
203
+ max_steps: 2000
204
+ save_steps: 500
checkpoint-2000/experiment_cfg/config.yaml ADDED
@@ -0,0 +1,238 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:gr00t.configs.base_config.Config
2
+ data: !!python/object:gr00t.configs.data.data_config.DataConfig
3
+ allow_padding: false
4
+ datasets:
5
+ - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
6
+ dataset_paths:
7
+ - /workspaces/isaaclab_arena/train_data
8
+ dataset_type: physical_embodiment
9
+ embodiment_tag: new_embodiment
10
+ mix_ratio: 1.0
11
+ val_dataset_path: null
12
+ download_cache: false
13
+ episode_sampling_rate: 0.1
14
+ image_crop_size:
15
+ - 244
16
+ - 244
17
+ image_target_size:
18
+ - 224
19
+ - 224
20
+ mock_dataset_mode: false
21
+ modality_configs:
22
+ new_embodiment:
23
+ action: !!python/object:gr00t.data.types.ModalityConfig
24
+ action_configs:
25
+ - !!python/object:gr00t.data.types.ActionConfig
26
+ format: &id001 !!python/object/apply:gr00t.data.types.ActionFormat
27
+ - default
28
+ rep: !!python/object/apply:gr00t.data.types.ActionRepresentation
29
+ - relative
30
+ state_key: single_arm
31
+ type: &id002 !!python/object/apply:gr00t.data.types.ActionType
32
+ - non_eef
33
+ - !!python/object:gr00t.data.types.ActionConfig
34
+ format: *id001
35
+ rep: !!python/object/apply:gr00t.data.types.ActionRepresentation
36
+ - absolute
37
+ state_key: null
38
+ type: *id002
39
+ delta_indices:
40
+ - 0
41
+ - 1
42
+ - 2
43
+ - 3
44
+ - 4
45
+ - 5
46
+ - 6
47
+ - 7
48
+ - 8
49
+ - 9
50
+ - 10
51
+ - 11
52
+ - 12
53
+ - 13
54
+ - 14
55
+ - 15
56
+ mean_std_embedding_keys: null
57
+ modality_keys:
58
+ - single_arm
59
+ - gripper
60
+ sin_cos_embedding_keys: null
61
+ language: !!python/object:gr00t.data.types.ModalityConfig
62
+ action_configs: null
63
+ delta_indices:
64
+ - 0
65
+ mean_std_embedding_keys: null
66
+ modality_keys:
67
+ - annotation.human.task_description
68
+ sin_cos_embedding_keys: null
69
+ state: !!python/object:gr00t.data.types.ModalityConfig
70
+ action_configs: null
71
+ delta_indices:
72
+ - 0
73
+ mean_std_embedding_keys: null
74
+ modality_keys:
75
+ - single_arm
76
+ - gripper
77
+ sin_cos_embedding_keys: null
78
+ video: !!python/object:gr00t.data.types.ModalityConfig
79
+ action_configs: null
80
+ delta_indices:
81
+ - 0
82
+ mean_std_embedding_keys: null
83
+ modality_keys:
84
+ - ego_view
85
+ sin_cos_embedding_keys: null
86
+ mode: single_turn
87
+ multiprocessing_context: fork
88
+ num_shards_per_epoch: 100000
89
+ override_pretraining_statistics: false
90
+ random_chop: 0.0
91
+ seed: 42
92
+ shard_size: 1024
93
+ shuffle: true
94
+ subsample_ratio: 1.0
95
+ video_backend: torchcodec
96
+ load_config_path: null
97
+ model: !!python/object:gr00t.configs.model.gr00t_n1d6.Gr00tN1d6Config
98
+ _attn_implementation_autoset: false
99
+ _attn_implementation_internal: null
100
+ _commit_hash: null
101
+ _name_or_path: ''
102
+ add_cross_attention: false
103
+ architectures: null
104
+ backbone_model_type: eagle
105
+ backbone_trainable_params_fp32: true
106
+ bad_words_ids: null
107
+ begin_suppress_tokens: null
108
+ bos_token_id: null
109
+ chunk_size_feed_forward: 0
110
+ color_jitter_params: null
111
+ cross_attention_hidden_size: null
112
+ decoder_start_token_id: null
113
+ diffusion_model_cfg:
114
+ attention_head_dim: 48
115
+ dropout: 0.2
116
+ final_dropout: true
117
+ interleave_self_attention: true
118
+ norm_type: ada_norm
119
+ num_attention_heads: 32
120
+ num_layers: 32
121
+ output_dim: 1024
122
+ positional_embeddings: null
123
+ diversity_penalty: 0.0
124
+ do_sample: false
125
+ eagle_collator: true
126
+ early_stopping: false
127
+ encoder_no_repeat_ngram_size: 0
128
+ eos_token_id: null
129
+ exponential_decay_length_penalty: null
130
+ finetuning_task: null
131
+ forced_bos_token_id: null
132
+ forced_eos_token_id: null
133
+ id2label:
134
+ 0: LABEL_0
135
+ 1: LABEL_1
136
+ is_decoder: false
137
+ is_encoder_decoder: false
138
+ label2id:
139
+ LABEL_0: 0
140
+ LABEL_1: 1
141
+ length_penalty: 1.0
142
+ load_bf16: false
143
+ max_length: 20
144
+ min_length: 0
145
+ model_name: nvidia/Eagle-Block2A-2B-v2
146
+ no_repeat_ngram_size: 0
147
+ num_beam_groups: 1
148
+ num_beams: 1
149
+ num_return_sequences: 1
150
+ output_attentions: false
151
+ output_hidden_states: false
152
+ output_scores: false
153
+ pad_token_id: null
154
+ prefix: null
155
+ problem_type: null
156
+ pruned_heads: {}
157
+ random_rotation_angle: null
158
+ remove_invalid_values: false
159
+ repetition_penalty: 1.0
160
+ reproject_vision: false
161
+ return_dict: true
162
+ return_dict_in_generate: false
163
+ sep_token_id: null
164
+ state_dropout_prob: 0.0
165
+ suppress_tokens: null
166
+ task_specific_params: null
167
+ temperature: 1.0
168
+ tf_legacy_loss: false
169
+ tie_encoder_decoder: false
170
+ tie_word_embeddings: true
171
+ tokenizer_class: null
172
+ top_k: 50
173
+ top_p: 1.0
174
+ torch_dtype: null
175
+ torchscript: false
176
+ transformers_version: null
177
+ tune_diffusion_model: true
178
+ tune_llm: false
179
+ tune_projector: true
180
+ tune_visual: false
181
+ typical_p: 1.0
182
+ use_bfloat16: false
183
+ use_relative_action: true
184
+ training: !!python/object:gr00t.configs.training.training_config.TrainingConfig
185
+ add_rl_callback: false
186
+ assert_loss_less_than: null
187
+ batch_size: null
188
+ bf16: true
189
+ dataloader_num_workers: 32
190
+ ddp_bucket_cap_mb: 100
191
+ deepspeed_stage: 2
192
+ enable_open_loop_eval: false
193
+ enable_profiling: false
194
+ eval_batch_size: 2
195
+ eval_bf16: true
196
+ eval_set_split_ratio: 0.1
197
+ eval_steps: 500
198
+ eval_strategy: 'no'
199
+ experiment_name: null
200
+ fp16: false
201
+ global_batch_size: 32
202
+ gradient_accumulation_steps: 1
203
+ gradient_checkpointing: false
204
+ learning_rate: 0.0001
205
+ logging_steps: 10
206
+ lr_scheduler_type: cosine
207
+ max_concurrent_uploads: 2
208
+ max_grad_norm: 1.0
209
+ max_retries: 3
210
+ max_steps: 2000
211
+ num_gpus: 1
212
+ open_loop_eval_plot_indices: null
213
+ open_loop_eval_steps_per_traj: 100
214
+ open_loop_eval_traj_ids:
215
+ - 0
216
+ optim: adamw_torch
217
+ output_dir: /home/ubuntu/.cache/gr00t_franka_finetune
218
+ remove_unused_columns: false
219
+ save_best_eval_metric_greater_is_better: true
220
+ save_best_eval_metric_name: ''
221
+ save_steps: 500
222
+ save_total_limit: 4
223
+ save_vl_model: false
224
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
225
+ tf32: true
226
+ transformers_access_token: null
227
+ transformers_cache_dir: null
228
+ transformers_local_files_only: false
229
+ transformers_trust_remote_code: true
230
+ upload_checkpoints: false
231
+ upload_every: 1000
232
+ upload_last_n_checkpoints: 5
233
+ use_ddp: false
234
+ use_wandb: false
235
+ wandb_project: finetune-gr00t-n1d6
236
+ warmup_ratio: 0.05
237
+ warmup_steps: 0
238
+ weight_decay: 1.0e-05
checkpoint-2000/experiment_cfg/dataset_statistics.json ADDED
@@ -0,0 +1,1046 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "new_embodiment": {
3
+ "state": {
4
+ "single_arm": {
5
+ "min": [
6
+ -0.1016506552696228,
7
+ -0.1761876344680786,
8
+ -0.054869189858436584,
9
+ -1.4101576805114746,
10
+ -0.38218289613723755,
11
+ -0.022114872932434082,
12
+ -0.10868370532989502
13
+ ],
14
+ "max": [
15
+ 0.3447756767272949,
16
+ 1.2365270853042603,
17
+ 0.39242762327194214,
18
+ 0.2529296278953552,
19
+ 0.18470034003257751,
20
+ 2.118802309036255,
21
+ 0.8016068339347839
22
+ ],
23
+ "mean": [
24
+ 0.042614661157131195,
25
+ 0.4292725920677185,
26
+ 0.10685384273529053,
27
+ -0.8481684923171997,
28
+ -0.004952127579599619,
29
+ 1.2715188264846802,
30
+ 0.14739659428596497
31
+ ],
32
+ "std": [
33
+ 0.08599156141281128,
34
+ 0.38931092619895935,
35
+ 0.08684167265892029,
36
+ 0.41639015078544617,
37
+ 0.09905096888542175,
38
+ 0.639055073261261,
39
+ 0.20859868824481964
40
+ ],
41
+ "q01": [
42
+ -0.08698830261826515,
43
+ -0.16300016283988952,
44
+ -0.031826803982257845,
45
+ -1.3965834760665894,
46
+ -0.33692867517471314,
47
+ -0.005149464607238769,
48
+ -0.0991782522201538
49
+ ],
50
+ "q99": [
51
+ 0.3135400813817978,
52
+ 1.2095760893821716,
53
+ 0.3296026331186294,
54
+ 0.09940535783767694,
55
+ 0.177163989841938,
56
+ 2.111123719215393,
57
+ 0.7685691952705384
58
+ ]
59
+ },
60
+ "gripper": {
61
+ "min": [
62
+ -0.016243789345026016,
63
+ -0.017369966953992844
64
+ ],
65
+ "max": [
66
+ 0.0,
67
+ 0.0
68
+ ],
69
+ "mean": [
70
+ -0.0054468195885419846,
71
+ -0.005668346770107746
72
+ ],
73
+ "std": [
74
+ 0.007502974011003971,
75
+ 0.007808898109942675
76
+ ],
77
+ "q01": [
78
+ -0.01618218619376421,
79
+ -0.01736501693725586
80
+ ],
81
+ "q99": [
82
+ 0.0,
83
+ 0.0
84
+ ]
85
+ }
86
+ },
87
+ "action": {
88
+ "single_arm": {
89
+ "min": [
90
+ -0.029919808730483055,
91
+ -0.030760474503040314,
92
+ -0.03454569727182388,
93
+ -0.023138338699936867,
94
+ -0.0294453464448452,
95
+ -0.04707210883498192,
96
+ 0.0
97
+ ],
98
+ "max": [
99
+ 0.04578776657581329,
100
+ 0.03417271375656128,
101
+ 0.032364509999752045,
102
+ 0.012034625746309757,
103
+ 0.08025076240301132,
104
+ 0.04756892845034599,
105
+ 0.03999999910593033
106
+ ],
107
+ "mean": [
108
+ 0.013533495366573334,
109
+ 0.007476440165191889,
110
+ -0.01020827516913414,
111
+ -0.00018720414664130658,
112
+ 0.00028234944329597056,
113
+ -5.855086783412844e-05,
114
+ 0.026392336934804916
115
+ ],
116
+ "std": [
117
+ 0.012855037115514278,
118
+ 0.012551924213767052,
119
+ 0.017873870208859444,
120
+ 0.0029166981112211943,
121
+ 0.005159514490514994,
122
+ 0.004970518872141838,
123
+ 0.01895107515156269
124
+ ],
125
+ "q01": [
126
+ -0.005514774760231375,
127
+ -0.024535775482654572,
128
+ -0.030423654653131963,
129
+ -0.008391074724495412,
130
+ -0.01150766346603632,
131
+ -0.015753980539739133,
132
+ 0.0
133
+ ],
134
+ "q99": [
135
+ 0.03146043732762337,
136
+ 0.02946644090116024,
137
+ 0.028492353856563568,
138
+ 0.006190066309645771,
139
+ 0.01955891106277704,
140
+ 0.016726106889545896,
141
+ 0.03999999910593033
142
+ ]
143
+ },
144
+ "gripper": {
145
+ "min": [
146
+ 0.0
147
+ ],
148
+ "max": [
149
+ 0.03999999910593033
150
+ ],
151
+ "mean": [
152
+ 0.026392336934804916
153
+ ],
154
+ "std": [
155
+ 0.01895107515156269
156
+ ],
157
+ "q01": [
158
+ 0.0
159
+ ],
160
+ "q99": [
161
+ 0.03999999910593033
162
+ ]
163
+ }
164
+ },
165
+ "relative_action": {
166
+ "single_arm": {
167
+ "min": [
168
+ [
169
+ -0.32329919934272766,
170
+ -1.1854932308197021,
171
+ -0.39748504757881165,
172
+ -0.25286412239074707,
173
+ -0.18570305407047272,
174
+ -2.121999979019165,
175
+ -0.7839499115943909
176
+ ],
177
+ [
178
+ -0.32189974188804626,
179
+ -1.1826070547103882,
180
+ -0.39696475863456726,
181
+ -0.2544684112071991,
182
+ -0.18530802428722382,
183
+ -2.1222615242004395,
184
+ -0.7839499115943909
185
+ ],
186
+ [
187
+ -0.32321855425834656,
188
+ -1.1859318017959595,
189
+ -0.39636000990867615,
190
+ -0.2523682117462158,
191
+ -0.18859536945819855,
192
+ -2.1214780807495117,
193
+ -0.7839499115943909
194
+ ],
195
+ [
196
+ -0.3242166042327881,
197
+ -1.181753158569336,
198
+ -0.3955015242099762,
199
+ -0.2530977129936218,
200
+ -0.18825502693653107,
201
+ -2.1224093437194824,
202
+ -0.7839499115943909
203
+ ],
204
+ [
205
+ -0.3244396150112152,
206
+ -1.1838017702102661,
207
+ -0.3950645923614502,
208
+ -0.24863530695438385,
209
+ -0.18772920966148376,
210
+ -2.1221938133239746,
211
+ -0.7839499115943909
212
+ ],
213
+ [
214
+ -0.3249604403972626,
215
+ -1.1851550340652466,
216
+ -0.3945443034172058,
217
+ -0.2545105218887329,
218
+ -0.19080020487308502,
219
+ -2.12245512008667,
220
+ -0.7839499115943909
221
+ ],
222
+ [
223
+ -0.3240599036216736,
224
+ -1.2094337940216064,
225
+ -0.3939395546913147,
226
+ -0.2524451017379761,
227
+ -0.19165967404842377,
228
+ -2.1216351985931396,
229
+ -0.7839499115943909
230
+ ],
231
+ [
232
+ -0.3237849175930023,
233
+ -1.2061353921890259,
234
+ -0.39335793256759644,
235
+ -0.25646376609802246,
236
+ -0.19124479591846466,
237
+ -2.12142276763916,
238
+ -0.7839499115943909
239
+ ],
240
+ [
241
+ -0.32624951004981995,
242
+ -1.2092955112457275,
243
+ -0.3938826322555542,
244
+ -0.25647443532943726,
245
+ -0.19049783051013947,
246
+ -2.1221275329589844,
247
+ -0.7839499115943909
248
+ ],
249
+ [
250
+ -0.32307595014572144,
251
+ -1.205997109413147,
252
+ -0.39394718408584595,
253
+ -0.257379949092865,
254
+ -0.1888638287782669,
255
+ -2.1217713356018066,
256
+ -0.7839499115943909
257
+ ],
258
+ [
259
+ -0.3202081322669983,
260
+ -1.20602285861969,
261
+ -0.39648687839508057,
262
+ -0.2556869089603424,
263
+ -0.18957450985908508,
264
+ -2.1215648651123047,
265
+ -0.7801104187965393
266
+ ],
267
+ [
268
+ -0.32303914427757263,
269
+ -1.2070811986923218,
270
+ -0.39701157808303833,
271
+ -0.2523868978023529,
272
+ -0.1896384060382843,
273
+ -2.1222102642059326,
274
+ -0.7777257561683655
275
+ ],
276
+ [
277
+ -0.3236537277698517,
278
+ -1.20821213722229,
279
+ -0.3970761299133301,
280
+ -0.25582969188690186,
281
+ -0.18970085680484772,
282
+ -2.1212406158447266,
283
+ -0.774041473865509
284
+ ],
285
+ [
286
+ -0.32262563705444336,
287
+ -1.20747709274292,
288
+ -0.39746999740600586,
289
+ -0.2536396086215973,
290
+ -0.18984927237033844,
291
+ -2.1219756603240967,
292
+ -0.7704301476478577
293
+ ],
294
+ [
295
+ -0.32665905356407166,
296
+ -1.2074377536773682,
297
+ -0.3977932929992676,
298
+ -0.2506418526172638,
299
+ -0.1900315284729004,
300
+ -2.121697187423706,
301
+ -0.7680240273475647
302
+ ],
303
+ [
304
+ -0.3236996829509735,
305
+ -1.2079046964645386,
306
+ -0.3978058695793152,
307
+ -0.2523408532142639,
308
+ -0.19020666182041168,
309
+ -2.1220388412475586,
310
+ -0.765728771686554
311
+ ]
312
+ ],
313
+ "max": [
314
+ [
315
+ 0.12719863653182983,
316
+ 0.18446235358715057,
317
+ 0.06538978964090347,
318
+ 1.4123303890228271,
319
+ 0.36543214321136475,
320
+ 0.055936314165592194,
321
+ 0.1482430398464203
322
+ ],
323
+ [
324
+ 0.12787628173828125,
325
+ 0.18225406110286713,
326
+ 0.0630723312497139,
327
+ 1.4122768640518188,
328
+ 0.3634565770626068,
329
+ 0.05312386155128479,
330
+ 0.14398613572120667
331
+ ],
332
+ [
333
+ 0.12855961918830872,
334
+ 0.18054865300655365,
335
+ 0.060906484723091125,
336
+ 1.4116393327713013,
337
+ 0.3660118877887726,
338
+ 0.052048832178115845,
339
+ 0.14211878180503845
340
+ ],
341
+ [
342
+ 0.12901031970977783,
343
+ 0.17937372624874115,
344
+ 0.05962555110454559,
345
+ 1.412109613418579,
346
+ 0.3632301688194275,
347
+ 0.05115959048271179,
348
+ 0.14021214842796326
349
+ ],
350
+ [
351
+ 0.12952828407287598,
352
+ 0.1794057935476303,
353
+ 0.06009196117520332,
354
+ 1.4119149446487427,
355
+ 0.36106500029563904,
356
+ 0.05047079920768738,
357
+ 0.13852760195732117
358
+ ],
359
+ [
360
+ 0.12882810831069946,
361
+ 0.17998431622982025,
362
+ 0.06065024808049202,
363
+ 1.4128142595291138,
364
+ 0.3649647831916809,
365
+ 0.050107747316360474,
366
+ 0.13429853320121765
367
+ ],
368
+ [
369
+ 0.12831519544124603,
370
+ 0.17946301400661469,
371
+ 0.06099287047982216,
372
+ 1.4133707284927368,
373
+ 0.36815109848976135,
374
+ 0.04975596070289612,
375
+ 0.1339406669139862
376
+ ],
377
+ [
378
+ 0.12905743718147278,
379
+ 0.1786593645811081,
380
+ 0.06112520769238472,
381
+ 1.4141303300857544,
382
+ 0.3652087152004242,
383
+ 0.04841601476073265,
384
+ 0.1322639286518097
385
+ ],
386
+ [
387
+ 0.1297350823879242,
388
+ 0.1776067465543747,
389
+ 0.0573953241109848,
390
+ 1.4146143198013306,
391
+ 0.3671979606151581,
392
+ 0.04757409915328026,
393
+ 0.13022002577781677
394
+ ],
395
+ [
396
+ 0.13041843473911285,
397
+ 0.17776383459568024,
398
+ 0.05858777463436127,
399
+ 1.4145153760910034,
400
+ 0.36353617906570435,
401
+ 0.045672591775655746,
402
+ 0.12888506054878235
403
+ ],
404
+ [
405
+ 0.13086912035942078,
406
+ 0.17834235727787018,
407
+ 0.05983245372772217,
408
+ 1.4148727655410767,
409
+ 0.36363980174064636,
410
+ 0.04265117272734642,
411
+ 0.1267530620098114
412
+ ],
413
+ [
414
+ 0.13138708472251892,
415
+ 0.17829257249832153,
416
+ 0.06080028414726257,
417
+ 1.4132124185562134,
418
+ 0.36463645100593567,
419
+ 0.04230935871601105,
420
+ 0.12515506148338318
421
+ ],
422
+ [
423
+ 0.1306869238615036,
424
+ 0.17859286069869995,
425
+ 0.06156755983829498,
426
+ 1.4115465879440308,
427
+ 0.36609867215156555,
428
+ 0.041467443108558655,
429
+ 0.12416491657495499
430
+ ],
431
+ [
432
+ 0.12939347326755524,
433
+ 0.1791713833808899,
434
+ 0.06212584674358368,
435
+ 1.4120947122573853,
436
+ 0.36583268642425537,
437
+ 0.03956593573093414,
438
+ 0.12115160375833511
439
+ ],
440
+ [
441
+ 0.12968552112579346,
442
+ 0.17865008115768433,
443
+ 0.06246846914291382,
444
+ 1.4127825498580933,
445
+ 0.36217090487480164,
446
+ 0.04159165173768997,
447
+ 0.11784551292657852
448
+ ],
449
+ [
450
+ 0.12998661398887634,
451
+ 0.17784643173217773,
452
+ 0.06260080635547638,
453
+ 1.4135223627090454,
454
+ 0.361840158700943,
455
+ 0.040185101330280304,
456
+ 0.11627308279275894
457
+ ]
458
+ ],
459
+ "mean": [
460
+ [
461
+ -0.021064985543489456,
462
+ -0.39792153239250183,
463
+ -0.11181046068668365,
464
+ 0.8605598211288452,
465
+ -0.0025237626396119595,
466
+ -1.2637412548065186,
467
+ -0.10358496010303497
468
+ ],
469
+ [
470
+ -0.02104770392179489,
471
+ -0.3978676497936249,
472
+ -0.11182692646980286,
473
+ 0.8605672717094421,
474
+ -0.002523584757000208,
475
+ -1.2637417316436768,
476
+ -0.10367059707641602
477
+ ],
478
+ [
479
+ -0.021030250936746597,
480
+ -0.397811621427536,
481
+ -0.11184262484312057,
482
+ 0.8605707287788391,
483
+ -0.0025277354288846254,
484
+ -1.2637302875518799,
485
+ -0.10375623404979706
486
+ ],
487
+ [
488
+ -0.02101544663310051,
489
+ -0.39775529503822327,
490
+ -0.11185839772224426,
491
+ 0.8605775833129883,
492
+ -0.002535233274102211,
493
+ -1.2637287378311157,
494
+ -0.10384184867143631
495
+ ],
496
+ [
497
+ -0.021001672372221947,
498
+ -0.39770010113716125,
499
+ -0.11185967922210693,
500
+ 0.8605857491493225,
501
+ -0.0025436626747250557,
502
+ -1.2637271881103516,
503
+ -0.10392745584249496
504
+ ],
505
+ [
506
+ -0.02098824642598629,
507
+ -0.3976578712463379,
508
+ -0.11185971647500992,
509
+ 0.8605918884277344,
510
+ -0.0025569903664290905,
511
+ -1.2637248039245605,
512
+ -0.10401306301355362
513
+ ],
514
+ [
515
+ -0.020976334810256958,
516
+ -0.39763131737709045,
517
+ -0.11186240613460541,
518
+ 0.8606000542640686,
519
+ -0.0025741278659552336,
520
+ -1.26372230052948,
521
+ -0.10409871488809586
522
+ ],
523
+ [
524
+ -0.020982732996344566,
525
+ -0.3976297378540039,
526
+ -0.11186536401510239,
527
+ 0.8606085777282715,
528
+ -0.0025887791998684406,
529
+ -1.2637240886688232,
530
+ -0.1041843369603157
531
+ ],
532
+ [
533
+ -0.020988795906305313,
534
+ -0.397623211145401,
535
+ -0.11186520755290985,
536
+ 0.8606117963790894,
537
+ -0.0025999434292316437,
538
+ -1.2637230157852173,
539
+ -0.10424429178237915
540
+ ],
541
+ [
542
+ -0.020994234830141068,
543
+ -0.3976192772388458,
544
+ -0.11186467111110687,
545
+ 0.8606191873550415,
546
+ -0.002612028270959854,
547
+ -1.2637211084365845,
548
+ -0.10427426546812057
549
+ ],
550
+ [
551
+ -0.020999347791075706,
552
+ -0.3976156413555145,
553
+ -0.11186596006155014,
554
+ 0.8606262803077698,
555
+ -0.0026231720112264156,
556
+ -1.2637207508087158,
557
+ -0.10427425056695938
558
+ ],
559
+ [
560
+ -0.021002445369958878,
561
+ -0.3976096510887146,
562
+ -0.11186514049768448,
563
+ 0.860630214214325,
564
+ -0.002635682700201869,
565
+ -1.2637168169021606,
566
+ -0.10427428781986237
567
+ ],
568
+ [
569
+ -0.021011201664805412,
570
+ -0.39761000871658325,
571
+ -0.11186651140451431,
572
+ 0.860638439655304,
573
+ -0.002646006178110838,
574
+ -1.2637174129486084,
575
+ -0.10427427291870117
576
+ ],
577
+ [
578
+ -0.021014675498008728,
579
+ -0.39760351181030273,
580
+ -0.11186712980270386,
581
+ 0.8606441617012024,
582
+ -0.002654573880136013,
583
+ -1.2637194395065308,
584
+ -0.10427426546812057
585
+ ],
586
+ [
587
+ -0.021040834486484528,
588
+ -0.3976028859615326,
589
+ -0.11186829954385757,
590
+ 0.8606491088867188,
591
+ -0.002666682470589876,
592
+ -1.2637138366699219,
593
+ -0.10427425056695938
594
+ ],
595
+ [
596
+ -0.02106592431664467,
597
+ -0.39760419726371765,
598
+ -0.11186770349740982,
599
+ 0.8606574535369873,
600
+ -0.002680801786482334,
601
+ -1.2637156248092651,
602
+ -0.10427422821521759
603
+ ]
604
+ ],
605
+ "std": [
606
+ [
607
+ 0.07862132787704468,
608
+ 0.36472052335739136,
609
+ 0.07953183352947235,
610
+ 0.41708749532699585,
611
+ 0.08953142166137695,
612
+ 0.6474994421005249,
613
+ 0.2003270834684372
614
+ ],
615
+ [
616
+ 0.07865532487630844,
617
+ 0.36466875672340393,
618
+ 0.07954908907413483,
619
+ 0.4170789122581482,
620
+ 0.08954057842493057,
621
+ 0.6475056409835815,
622
+ 0.20027098059654236
623
+ ],
624
+ [
625
+ 0.07868577539920807,
626
+ 0.36461395025253296,
627
+ 0.07956718653440475,
628
+ 0.41706907749176025,
629
+ 0.08954384922981262,
630
+ 0.6475113034248352,
631
+ 0.20021489262580872
632
+ ],
633
+ [
634
+ 0.07872062176465988,
635
+ 0.3645585775375366,
636
+ 0.07958472520112991,
637
+ 0.41705429553985596,
638
+ 0.08954395353794098,
639
+ 0.6475160717964172,
640
+ 0.2001601606607437
641
+ ],
642
+ [
643
+ 0.07875548303127289,
644
+ 0.3645066022872925,
645
+ 0.07957513630390167,
646
+ 0.4170401096343994,
647
+ 0.08954435586929321,
648
+ 0.6475217342376709,
649
+ 0.2001052349805832
650
+ ],
651
+ [
652
+ 0.07878728210926056,
653
+ 0.36448603868484497,
654
+ 0.07956283539533615,
655
+ 0.4170234501361847,
656
+ 0.08953587710857391,
657
+ 0.6475263237953186,
658
+ 0.2000516802072525
659
+ ],
660
+ [
661
+ 0.07882208377122879,
662
+ 0.36450454592704773,
663
+ 0.07955189794301987,
664
+ 0.41700881719589233,
665
+ 0.08952254056930542,
666
+ 0.647530734539032,
667
+ 0.19999809563159943
668
+ ],
669
+ [
670
+ 0.07889280468225479,
671
+ 0.3645552396774292,
672
+ 0.07954024523496628,
673
+ 0.4169907867908478,
674
+ 0.08951205015182495,
675
+ 0.6475338339805603,
676
+ 0.19994452595710754
677
+ ],
678
+ [
679
+ 0.07896006852388382,
680
+ 0.3646087050437927,
681
+ 0.07952792197465897,
682
+ 0.4169798195362091,
683
+ 0.08950342237949371,
684
+ 0.6475362181663513,
685
+ 0.19982454180717468
686
+ ],
687
+ [
688
+ 0.07902492582798004,
689
+ 0.36466050148010254,
690
+ 0.07951349020004272,
691
+ 0.4169654846191406,
692
+ 0.08949856460094452,
693
+ 0.6475402116775513,
694
+ 0.19963733851909637
695
+ ],
696
+ [
697
+ 0.0790853276848793,
698
+ 0.36471861600875854,
699
+ 0.07950460910797119,
700
+ 0.4169500768184662,
701
+ 0.08949100971221924,
702
+ 0.6475431323051453,
703
+ 0.19935448467731476
704
+ ],
705
+ [
706
+ 0.0791463851928711,
707
+ 0.3647766411304474,
708
+ 0.07949627935886383,
709
+ 0.4169394075870514,
710
+ 0.08948377519845963,
711
+ 0.6475453972816467,
712
+ 0.19907325506210327
713
+ ],
714
+ [
715
+ 0.07920938730239868,
716
+ 0.36483389139175415,
717
+ 0.07948218286037445,
718
+ 0.4169244170188904,
719
+ 0.08947892487049103,
720
+ 0.6475448608398438,
721
+ 0.19879388809204102
722
+ ],
723
+ [
724
+ 0.0792689323425293,
725
+ 0.3648894131183624,
726
+ 0.07947037369012833,
727
+ 0.41691312193870544,
728
+ 0.08947526663541794,
729
+ 0.6475451588630676,
730
+ 0.19851621985435486
731
+ ],
732
+ [
733
+ 0.07932519167661667,
734
+ 0.3649515211582184,
735
+ 0.07945462316274643,
736
+ 0.4169033467769623,
737
+ 0.08946864306926727,
738
+ 0.6475487947463989,
739
+ 0.19824036955833435
740
+ ],
741
+ [
742
+ 0.07937267422676086,
743
+ 0.36501482129096985,
744
+ 0.07943546772003174,
745
+ 0.41688644886016846,
746
+ 0.08945988863706589,
747
+ 0.6475464701652527,
748
+ 0.19796623289585114
749
+ ]
750
+ ],
751
+ "q01": [
752
+ [
753
+ -0.2686644893884659,
754
+ -1.1166756582260131,
755
+ -0.3249503219127655,
756
+ -0.10763738259673118,
757
+ -0.17754718899726868,
758
+ -2.11095911026001,
759
+ -0.726121768951416
760
+ ],
761
+ [
762
+ -0.2715908128023148,
763
+ -1.1176964545249939,
764
+ -0.3246971207857132,
765
+ -0.10447386264801026,
766
+ -0.17755473166704178,
767
+ -2.111039023399353,
768
+ -0.726121768951416
769
+ ],
770
+ [
771
+ -0.2721079695224762,
772
+ -1.1183462095260621,
773
+ -0.32473934948444366,
774
+ -0.10659581780433655,
775
+ -0.17748151123523712,
776
+ -2.1109159421920776,
777
+ -0.726121768951416
778
+ ],
779
+ [
780
+ -0.2719108146429062,
781
+ -1.1183584260940551,
782
+ -0.3249865293502808,
783
+ -0.10559523880481719,
784
+ -0.17776453107595444,
785
+ -2.1114220952987672,
786
+ -0.726121768951416
787
+ ],
788
+ [
789
+ -0.27478108763694764,
790
+ -1.1184560322761536,
791
+ -0.32442001819610594,
792
+ -0.10662905514240265,
793
+ -0.17751205533742906,
794
+ -2.111326847076416,
795
+ -0.726121768951416
796
+ ],
797
+ [
798
+ -0.27461387276649474,
799
+ -1.1171478915214539,
800
+ -0.32468852162361145,
801
+ -0.10610488697886467,
802
+ -0.17753057986497878,
803
+ -2.1112320852279662,
804
+ -0.726121768951416
805
+ ],
806
+ [
807
+ -0.2748466944694519,
808
+ -1.1176495385169982,
809
+ -0.3247254079580307,
810
+ -0.10539359807968139,
811
+ -0.17761774510145187,
812
+ -2.111006693840027,
813
+ -0.726121768951416
814
+ ],
815
+ [
816
+ -0.2763983929157257,
817
+ -1.1234028029441834,
818
+ -0.32481603741645815,
819
+ -0.10651438012719154,
820
+ -0.17762102216482162,
821
+ -2.110989727973938,
822
+ -0.726121768951416
823
+ ],
824
+ [
825
+ -0.27612989604473115,
826
+ -1.1322602534294128,
827
+ -0.3249142354726791,
828
+ -0.104207394272089,
829
+ -0.17753226101398467,
830
+ -2.1104533433914185,
831
+ -0.726121768951416
832
+ ],
833
+ [
834
+ -0.2772212654352188,
835
+ -1.1327979397773742,
836
+ -0.3250032651424408,
837
+ -0.10369521856307984,
838
+ -0.1775078284740448,
839
+ -2.110794858932495,
840
+ -0.726121768951416
841
+ ],
842
+ [
843
+ -0.27782695055007933,
844
+ -1.1329670572280883,
845
+ -0.3251311558485031,
846
+ -0.10523794278502464,
847
+ -0.17756187170743942,
848
+ -2.111419234275818,
849
+ -0.7251607692241668
850
+ ],
851
+ [
852
+ -0.2772995239496231,
853
+ -1.1324901962280274,
854
+ -0.32540663063526154,
855
+ -0.10621625065803528,
856
+ -0.17752183318138123,
857
+ -2.1106600952148438,
858
+ -0.7238819229602814
859
+ ],
860
+ [
861
+ -0.2760401529073715,
862
+ -1.131754720211029,
863
+ -0.3250221389532089,
864
+ -0.10366981148719788,
865
+ -0.17745642334222794,
866
+ -2.110166282653809,
867
+ -0.7220853567123413
868
+ ],
869
+ [
870
+ -0.27648825109004976,
871
+ -1.1315274477005004,
872
+ -0.32488527715206145,
873
+ -0.10417581394314765,
874
+ -0.17765929341316222,
875
+ -2.111174240112305,
876
+ -0.721002539396286
877
+ ],
878
+ [
879
+ -0.2767831003665924,
880
+ -1.1337191128730775,
881
+ -0.32499175250530243,
882
+ -0.10650760352611542,
883
+ -0.1782200300693512,
884
+ -2.1105369424819944,
885
+ -0.7191157519817353
886
+ ],
887
+ [
888
+ -0.2783048951625824,
889
+ -1.1336584401130676,
890
+ -0.3245078271627426,
891
+ -0.10380961641669273,
892
+ -0.17757790327072143,
893
+ -2.1105402278900147,
894
+ -0.717497273683548
895
+ ]
896
+ ],
897
+ "q99": [
898
+ [
899
+ 0.10997488573193549,
900
+ 0.16461794972419735,
901
+ 0.03921745248138905,
902
+ 1.39764888048172,
903
+ 0.30130664169788357,
904
+ 0.01098630111664532,
905
+ 0.1122507885098457
906
+ ],
907
+ [
908
+ 0.11004416078329086,
909
+ 0.1643620255589485,
910
+ 0.03903082057833671,
911
+ 1.398072485923767,
912
+ 0.3018379479646683,
913
+ 0.010057139471173268,
914
+ 0.11005336791276932
915
+ ],
916
+ [
917
+ 0.11012477055191992,
918
+ 0.16386553168296814,
919
+ 0.038735973685979835,
920
+ 1.3967380928993225,
921
+ 0.30213871598243713,
922
+ 0.010799065530300123,
923
+ 0.10891361147165297
924
+ ],
925
+ [
926
+ 0.1099956126511097,
927
+ 0.16371061593294142,
928
+ 0.03824721999466418,
929
+ 1.3970967960357665,
930
+ 0.302277557849884,
931
+ 0.011137769222259486,
932
+ 0.10836461812257767
933
+ ],
934
+ [
935
+ 0.11023993626236915,
936
+ 0.1633686304092407,
937
+ 0.03792811810970305,
938
+ 1.3972763657569884,
939
+ 0.3007064414024353,
940
+ 0.010738395974039987,
941
+ 0.10781787663698195
942
+ ],
943
+ [
944
+ 0.11034056857228279,
945
+ 0.16381058037281035,
946
+ 0.03771789923310276,
947
+ 1.3969033169746399,
948
+ 0.3010092568397521,
949
+ 0.010312179420143333,
950
+ 0.1074419716000557
951
+ ],
952
+ [
953
+ 0.11034261405467986,
954
+ 0.1636140125989914,
955
+ 0.03730809785425661,
956
+ 1.3973512649536133,
957
+ 0.3012144303321838,
958
+ 0.009373838771134584,
959
+ 0.10661112785339355
960
+ ],
961
+ [
962
+ 0.11037104874849318,
963
+ 0.16361432492733002,
964
+ 0.03730310291051864,
965
+ 1.397199330329895,
966
+ 0.30146020889282227,
967
+ 0.009104850329458668,
968
+ 0.10594455733895301
969
+ ],
970
+ [
971
+ 0.11031954407691955,
972
+ 0.16329921871423722,
973
+ 0.037490070536732666,
974
+ 1.3971175789833068,
975
+ 0.30101816475391385,
976
+ 0.007780624665319918,
977
+ 0.10561806678771973
978
+ ],
979
+ [
980
+ 0.11039042010903358,
981
+ 0.16369332671165465,
982
+ 0.036998328715562794,
983
+ 1.3964923930168152,
984
+ 0.3020000964403152,
985
+ 0.007503410866484006,
986
+ 0.10535383358597755
987
+ ],
988
+ [
989
+ 0.11048222631216048,
990
+ 0.16336869567632675,
991
+ 0.03698733076453208,
992
+ 1.3960149836540223,
993
+ 0.30287389039993284,
994
+ 0.0068738124519586155,
995
+ 0.10515481844544411
996
+ ],
997
+ [
998
+ 0.11053489252924918,
999
+ 0.16354636400938033,
1000
+ 0.03707304038107395,
1001
+ 1.396628396511078,
1002
+ 0.3029059028625488,
1003
+ 0.006812876258045408,
1004
+ 0.1047084142267704
1005
+ ],
1006
+ [
1007
+ 0.11039242312312125,
1008
+ 0.16331785261631013,
1009
+ 0.03715803913772106,
1010
+ 1.3973055458068848,
1011
+ 0.30323826253414154,
1012
+ 0.006487304139882287,
1013
+ 0.10444164305925369
1014
+ ],
1015
+ [
1016
+ 0.11058814465999603,
1017
+ 0.16320075422525404,
1018
+ 0.0372002275288105,
1019
+ 1.3976932382583618,
1020
+ 0.30252904832363126,
1021
+ 0.005770333949476429,
1022
+ 0.10420910120010375
1023
+ ],
1024
+ [
1025
+ 0.11048216462135314,
1026
+ 0.1634601667523384,
1027
+ 0.0368946287035942,
1028
+ 1.396862666606903,
1029
+ 0.3012196272611618,
1030
+ 0.006188006103038769,
1031
+ 0.10407691970467567
1032
+ ],
1033
+ [
1034
+ 0.11032852262258529,
1035
+ 0.16324337780475617,
1036
+ 0.03683135174214838,
1037
+ 1.3966079354286194,
1038
+ 0.30130040407180775,
1039
+ 0.006021949928253876,
1040
+ 0.10380818247795105
1041
+ ]
1042
+ ]
1043
+ }
1044
+ }
1045
+ }
1046
+ }
checkpoint-2000/experiment_cfg/final_model_config.json ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "Gr00tN1d6",
3
+ "model_dtype": "bfloat16",
4
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
5
+ "backbone_model_type": "eagle",
6
+ "model_revision": null,
7
+ "tune_top_llm_layers": 4,
8
+ "backbone_embedding_dim": 2048,
9
+ "tune_llm": false,
10
+ "tune_visual": false,
11
+ "select_layer": 16,
12
+ "reproject_vision": false,
13
+ "use_flash_attention": true,
14
+ "load_bf16": true,
15
+ "collator_overwrite_image_inputs": false,
16
+ "eagle_collator": true,
17
+ "backbone_trainable_params_fp32": true,
18
+ "apply_sincos_state_encoding": true,
19
+ "use_relative_action": true,
20
+ "max_state_dim": 128,
21
+ "max_action_dim": 128,
22
+ "action_horizon": 50,
23
+ "hidden_size": 1024,
24
+ "input_embedding_dim": 1536,
25
+ "add_pos_embed": true,
26
+ "attn_dropout": 0.2,
27
+ "use_vlln": true,
28
+ "max_seq_len": 1024,
29
+ "use_alternate_vl_dit": true,
30
+ "attend_text_every_n_blocks": 2,
31
+ "diffusion_model_cfg": {
32
+ "attention_head_dim": 48,
33
+ "dropout": 0.2,
34
+ "final_dropout": true,
35
+ "interleave_self_attention": true,
36
+ "norm_type": "ada_norm",
37
+ "num_attention_heads": 32,
38
+ "num_layers": 32,
39
+ "output_dim": 1024,
40
+ "positional_embeddings": null
41
+ },
42
+ "num_inference_timesteps": 4,
43
+ "noise_beta_alpha": 1.5,
44
+ "noise_beta_beta": 1.0,
45
+ "noise_s": 0.999,
46
+ "num_timestep_buckets": 1000,
47
+ "tune_projector": true,
48
+ "tune_diffusion_model": true,
49
+ "tune_vlln": true,
50
+ "state_dropout_prob": 0.0,
51
+ "state_additive_noise_scale": 0.0,
52
+ "max_num_embodiments": 32
53
+ }
checkpoint-2000/experiment_cfg/final_processor_config.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-2000/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de0d19ccd220d816042eee892ceb96bfc5c43a02e4e274c481cd726d2b36f0ef
3
+ size 4990120184
checkpoint-2000/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cb3593b91f21ea438acbb11fe50ac2daebf81740d2a227ed7ac6eb738d70686
3
+ size 4823190320
checkpoint-2000/model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-2000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4ca7c8409935f6d1ab0d2e0bb9f4e2c7d14771e38be0fa58d214c2975b66439
3
+ size 12960193762
checkpoint-2000/processor_config.json ADDED
@@ -0,0 +1,454 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "processor_class": "Gr00tN1d6Processor",
3
+ "processor_kwargs": {
4
+ "modality_configs": {
5
+ "behavior_r1_pro": {
6
+ "video": {
7
+ "delta_indices": [
8
+ 0
9
+ ],
10
+ "modality_keys": [
11
+ "observation.images.rgb.head_256_256",
12
+ "observation.images.rgb.left_wrist_256_256",
13
+ "observation.images.rgb.right_wrist_256_256"
14
+ ],
15
+ "sin_cos_embedding_keys": null,
16
+ "mean_std_embedding_keys": null,
17
+ "action_configs": null
18
+ },
19
+ "state": {
20
+ "delta_indices": [
21
+ 0
22
+ ],
23
+ "modality_keys": [
24
+ "robot_pos",
25
+ "robot_ori_cos",
26
+ "robot_ori_sin",
27
+ "robot_2d_ori",
28
+ "robot_2d_ori_cos",
29
+ "robot_2d_ori_sin",
30
+ "robot_lin_vel",
31
+ "robot_ang_vel",
32
+ "arm_left_qpos",
33
+ "arm_left_qpos_sin",
34
+ "arm_left_qpos_cos",
35
+ "eef_left_pos",
36
+ "eef_left_quat",
37
+ "gripper_left_qpos",
38
+ "arm_right_qpos",
39
+ "arm_right_qpos_sin",
40
+ "arm_right_qpos_cos",
41
+ "eef_right_pos",
42
+ "eef_right_quat",
43
+ "gripper_right_qpos",
44
+ "trunk_qpos"
45
+ ],
46
+ "sin_cos_embedding_keys": null,
47
+ "mean_std_embedding_keys": null,
48
+ "action_configs": null
49
+ },
50
+ "action": {
51
+ "delta_indices": [
52
+ 0,
53
+ 1,
54
+ 2,
55
+ 3,
56
+ 4,
57
+ 5,
58
+ 6,
59
+ 7,
60
+ 8,
61
+ 9,
62
+ 10,
63
+ 11,
64
+ 12,
65
+ 13,
66
+ 14,
67
+ 15,
68
+ 16,
69
+ 17,
70
+ 18,
71
+ 19,
72
+ 20,
73
+ 21,
74
+ 22,
75
+ 23,
76
+ 24,
77
+ 25,
78
+ 26,
79
+ 27,
80
+ 28,
81
+ 29,
82
+ 30,
83
+ 31
84
+ ],
85
+ "modality_keys": [
86
+ "base",
87
+ "torso",
88
+ "left_arm",
89
+ "left_gripper",
90
+ "right_arm",
91
+ "right_gripper"
92
+ ],
93
+ "sin_cos_embedding_keys": null,
94
+ "mean_std_embedding_keys": null,
95
+ "action_configs": [
96
+ {
97
+ "rep": "ABSOLUTE",
98
+ "type": "NON_EEF",
99
+ "format": "DEFAULT",
100
+ "state_key": null
101
+ },
102
+ {
103
+ "rep": "RELATIVE",
104
+ "type": "NON_EEF",
105
+ "format": "DEFAULT",
106
+ "state_key": "trunk_qpos"
107
+ },
108
+ {
109
+ "rep": "RELATIVE",
110
+ "type": "NON_EEF",
111
+ "format": "DEFAULT",
112
+ "state_key": "arm_left_qpos"
113
+ },
114
+ {
115
+ "rep": "ABSOLUTE",
116
+ "type": "NON_EEF",
117
+ "format": "DEFAULT",
118
+ "state_key": null
119
+ },
120
+ {
121
+ "rep": "RELATIVE",
122
+ "type": "NON_EEF",
123
+ "format": "DEFAULT",
124
+ "state_key": "arm_right_qpos"
125
+ },
126
+ {
127
+ "rep": "ABSOLUTE",
128
+ "type": "NON_EEF",
129
+ "format": "DEFAULT",
130
+ "state_key": null
131
+ }
132
+ ]
133
+ },
134
+ "language": {
135
+ "delta_indices": [
136
+ 0
137
+ ],
138
+ "modality_keys": [
139
+ "annotation.human.coarse_action"
140
+ ],
141
+ "sin_cos_embedding_keys": null,
142
+ "mean_std_embedding_keys": null,
143
+ "action_configs": null
144
+ }
145
+ },
146
+ "gr1": {
147
+ "video": {
148
+ "delta_indices": [
149
+ 0
150
+ ],
151
+ "modality_keys": [
152
+ "ego_view_bg_crop_pad_res256_freq20"
153
+ ],
154
+ "sin_cos_embedding_keys": null,
155
+ "mean_std_embedding_keys": null,
156
+ "action_configs": null
157
+ },
158
+ "state": {
159
+ "delta_indices": [
160
+ 0
161
+ ],
162
+ "modality_keys": [
163
+ "left_arm",
164
+ "right_arm",
165
+ "left_hand",
166
+ "right_hand",
167
+ "waist"
168
+ ],
169
+ "sin_cos_embedding_keys": [
170
+ "left_arm",
171
+ "right_arm",
172
+ "left_hand",
173
+ "right_hand",
174
+ "waist"
175
+ ],
176
+ "mean_std_embedding_keys": null,
177
+ "action_configs": null
178
+ },
179
+ "action": {
180
+ "delta_indices": [
181
+ 0,
182
+ 1,
183
+ 2,
184
+ 3,
185
+ 4,
186
+ 5,
187
+ 6,
188
+ 7,
189
+ 8,
190
+ 9,
191
+ 10,
192
+ 11,
193
+ 12,
194
+ 13,
195
+ 14,
196
+ 15
197
+ ],
198
+ "modality_keys": [
199
+ "left_arm",
200
+ "right_arm",
201
+ "left_hand",
202
+ "right_hand",
203
+ "waist"
204
+ ],
205
+ "sin_cos_embedding_keys": null,
206
+ "mean_std_embedding_keys": null,
207
+ "action_configs": [
208
+ {
209
+ "rep": "RELATIVE",
210
+ "type": "NON_EEF",
211
+ "format": "DEFAULT",
212
+ "state_key": null
213
+ },
214
+ {
215
+ "rep": "RELATIVE",
216
+ "type": "NON_EEF",
217
+ "format": "DEFAULT",
218
+ "state_key": null
219
+ },
220
+ {
221
+ "rep": "RELATIVE",
222
+ "type": "NON_EEF",
223
+ "format": "DEFAULT",
224
+ "state_key": null
225
+ },
226
+ {
227
+ "rep": "RELATIVE",
228
+ "type": "NON_EEF",
229
+ "format": "DEFAULT",
230
+ "state_key": null
231
+ },
232
+ {
233
+ "rep": "ABSOLUTE",
234
+ "type": "NON_EEF",
235
+ "format": "DEFAULT",
236
+ "state_key": null
237
+ }
238
+ ]
239
+ },
240
+ "language": {
241
+ "delta_indices": [
242
+ 0
243
+ ],
244
+ "modality_keys": [
245
+ "task"
246
+ ],
247
+ "sin_cos_embedding_keys": null,
248
+ "mean_std_embedding_keys": null,
249
+ "action_configs": null
250
+ }
251
+ },
252
+ "robocasa_panda_omron": {
253
+ "video": {
254
+ "delta_indices": [
255
+ 0
256
+ ],
257
+ "modality_keys": [
258
+ "res256_image_side_0",
259
+ "res256_image_side_1",
260
+ "res256_image_wrist_0"
261
+ ],
262
+ "sin_cos_embedding_keys": null,
263
+ "mean_std_embedding_keys": null,
264
+ "action_configs": null
265
+ },
266
+ "state": {
267
+ "delta_indices": [
268
+ 0
269
+ ],
270
+ "modality_keys": [
271
+ "end_effector_position_relative",
272
+ "end_effector_rotation_relative",
273
+ "gripper_qpos",
274
+ "base_position",
275
+ "base_rotation"
276
+ ],
277
+ "sin_cos_embedding_keys": null,
278
+ "mean_std_embedding_keys": null,
279
+ "action_configs": null
280
+ },
281
+ "action": {
282
+ "delta_indices": [
283
+ 0,
284
+ 1,
285
+ 2,
286
+ 3,
287
+ 4,
288
+ 5,
289
+ 6,
290
+ 7,
291
+ 8,
292
+ 9,
293
+ 10,
294
+ 11,
295
+ 12,
296
+ 13,
297
+ 14,
298
+ 15
299
+ ],
300
+ "modality_keys": [
301
+ "end_effector_position",
302
+ "end_effector_rotation",
303
+ "gripper_close",
304
+ "base_motion",
305
+ "control_mode"
306
+ ],
307
+ "sin_cos_embedding_keys": null,
308
+ "mean_std_embedding_keys": null,
309
+ "action_configs": [
310
+ {
311
+ "rep": "ABSOLUTE",
312
+ "type": "NON_EEF",
313
+ "format": "DEFAULT",
314
+ "state_key": null
315
+ },
316
+ {
317
+ "rep": "ABSOLUTE",
318
+ "type": "NON_EEF",
319
+ "format": "DEFAULT",
320
+ "state_key": null
321
+ },
322
+ {
323
+ "rep": "ABSOLUTE",
324
+ "type": "NON_EEF",
325
+ "format": "DEFAULT",
326
+ "state_key": null
327
+ },
328
+ {
329
+ "rep": "ABSOLUTE",
330
+ "type": "NON_EEF",
331
+ "format": "DEFAULT",
332
+ "state_key": null
333
+ },
334
+ {
335
+ "rep": "ABSOLUTE",
336
+ "type": "NON_EEF",
337
+ "format": "DEFAULT",
338
+ "state_key": null
339
+ }
340
+ ]
341
+ },
342
+ "language": {
343
+ "delta_indices": [
344
+ 0
345
+ ],
346
+ "modality_keys": [
347
+ "annotation.human.action.task_description"
348
+ ],
349
+ "sin_cos_embedding_keys": null,
350
+ "mean_std_embedding_keys": null,
351
+ "action_configs": null
352
+ }
353
+ },
354
+ "new_embodiment": {
355
+ "video": {
356
+ "delta_indices": [
357
+ 0
358
+ ],
359
+ "modality_keys": [
360
+ "ego_view"
361
+ ],
362
+ "sin_cos_embedding_keys": null,
363
+ "mean_std_embedding_keys": null,
364
+ "action_configs": null
365
+ },
366
+ "state": {
367
+ "delta_indices": [
368
+ 0
369
+ ],
370
+ "modality_keys": [
371
+ "single_arm",
372
+ "gripper"
373
+ ],
374
+ "sin_cos_embedding_keys": null,
375
+ "mean_std_embedding_keys": null,
376
+ "action_configs": null
377
+ },
378
+ "action": {
379
+ "delta_indices": [
380
+ 0,
381
+ 1,
382
+ 2,
383
+ 3,
384
+ 4,
385
+ 5,
386
+ 6,
387
+ 7,
388
+ 8,
389
+ 9,
390
+ 10,
391
+ 11,
392
+ 12,
393
+ 13,
394
+ 14,
395
+ 15
396
+ ],
397
+ "modality_keys": [
398
+ "single_arm",
399
+ "gripper"
400
+ ],
401
+ "sin_cos_embedding_keys": null,
402
+ "mean_std_embedding_keys": null,
403
+ "action_configs": [
404
+ {
405
+ "rep": "RELATIVE",
406
+ "type": "NON_EEF",
407
+ "format": "DEFAULT",
408
+ "state_key": "single_arm"
409
+ },
410
+ {
411
+ "rep": "ABSOLUTE",
412
+ "type": "NON_EEF",
413
+ "format": "DEFAULT",
414
+ "state_key": null
415
+ }
416
+ ]
417
+ },
418
+ "language": {
419
+ "delta_indices": [
420
+ 0
421
+ ],
422
+ "modality_keys": [
423
+ "annotation.human.task_description"
424
+ ],
425
+ "sin_cos_embedding_keys": null,
426
+ "mean_std_embedding_keys": null,
427
+ "action_configs": null
428
+ }
429
+ }
430
+ },
431
+ "image_crop_size": null,
432
+ "image_target_size": null,
433
+ "use_albumentations": true,
434
+ "random_rotation_angle": null,
435
+ "color_jitter_params": {
436
+ "brightness": 0.3,
437
+ "contrast": 0.4,
438
+ "saturation": 0.5,
439
+ "hue": 0.08
440
+ },
441
+ "shortest_image_edge": 256,
442
+ "crop_fraction": 0.95,
443
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
444
+ "model_type": "eagle",
445
+ "formalize_language": true,
446
+ "max_state_dim": 128,
447
+ "max_action_dim": 128,
448
+ "max_action_horizon": 50,
449
+ "use_percentiles": false,
450
+ "clip_outliers": true,
451
+ "apply_sincos_state_encoding": true,
452
+ "use_relative_action": true
453
+ }
454
+ }
checkpoint-2000/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:903f9feec6355f31fbe50eb924e3a0aa889d94e00801bcc2d3dc34d878468ec7
3
+ size 14645
checkpoint-2000/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbd70720477de19dc6b2749427bae8a74f79040c6554cb5dc9c48e7b75cda08a
3
+ size 1465