LucaFrat commited on
Commit
8ada3e0
·
verified ·
1 Parent(s): c86bbcb

Upload folder using huggingface_hub

Browse files
checkpoint-4000/config.json ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_horizon": 40,
3
+ "add_pos_embed": true,
4
+ "apply_sincos_state_encoding": false,
5
+ "architectures": [
6
+ "Gr00tN1d7"
7
+ ],
8
+ "attn_dropout": 0.2,
9
+ "attn_implementation": null,
10
+ "backbone_embedding_dim": 2048,
11
+ "backbone_trainable_params_fp32": true,
12
+ "color_jitter_params": {
13
+ "brightness": 0.3,
14
+ "contrast": 0.4,
15
+ "hue": 0.08,
16
+ "saturation": 0.5
17
+ },
18
+ "crop_fraction": 0.95,
19
+ "diffusion_model_cfg": {
20
+ "attention_head_dim": 48,
21
+ "dropout": 0.2,
22
+ "final_dropout": true,
23
+ "interleave_self_attention": true,
24
+ "norm_type": "ada_norm",
25
+ "num_attention_heads": 32,
26
+ "num_layers": 32,
27
+ "output_dim": 1024,
28
+ "positional_embeddings": null
29
+ },
30
+ "dtype": "float32",
31
+ "exclude_state": false,
32
+ "formalize_language": true,
33
+ "hidden_size": 1024,
34
+ "image_crop_size": [
35
+ 230,
36
+ 230
37
+ ],
38
+ "image_target_size": [
39
+ 256,
40
+ 256
41
+ ],
42
+ "letter_box_transform": false,
43
+ "load_bf16": false,
44
+ "max_action_dim": 132,
45
+ "max_num_embodiments": 32,
46
+ "max_seq_len": 1024,
47
+ "max_state_dim": 132,
48
+ "model_dtype": "bfloat16",
49
+ "model_name": "nvidia/Cosmos-Reason2-2B",
50
+ "model_type": "Gr00tN1d7",
51
+ "noise_beta_alpha": 1.5,
52
+ "noise_beta_beta": 1.0,
53
+ "noise_s": 0.999,
54
+ "num_inference_timesteps": 4,
55
+ "num_timestep_buckets": 1000,
56
+ "random_history_crop": true,
57
+ "random_rotation_angle": 0,
58
+ "reproject_vision": false,
59
+ "rtc_ramp_rate": 6.0,
60
+ "select_layer": 16,
61
+ "shortest_image_edge": 256,
62
+ "state_dropout_prob": 0.2,
63
+ "state_gaussian_noise_std": 0.0,
64
+ "transformers_version": "4.57.3",
65
+ "tune_diffusion_model": true,
66
+ "tune_linear": true,
67
+ "tune_llm": false,
68
+ "tune_projector": true,
69
+ "tune_top_llm_layers": 0,
70
+ "tune_visual": false,
71
+ "tune_vlln": true,
72
+ "use_albumentations": true,
73
+ "use_alternate_vl_dit": true,
74
+ "use_flash_attention": true,
75
+ "use_future_tokens": false,
76
+ "use_mean_std": false,
77
+ "use_percentiles": true,
78
+ "use_vl_self_attention": true,
79
+ "use_vlln": true,
80
+ "vl_self_attention_cfg": {
81
+ "attention_head_dim": 64,
82
+ "dropout": 0.2,
83
+ "final_dropout": true,
84
+ "num_attention_heads": 32,
85
+ "num_layers": 4,
86
+ "positional_embeddings": null
87
+ }
88
+ }
checkpoint-4000/embodiment_id.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "robocasa_panda_omron": 13,
3
+ "oxe_droid": 17,
4
+ "oxe_fractal": 18,
5
+ "oxe_language_table": 19,
6
+ "oxe_bridge": 20,
7
+ "unknown": 22,
8
+ "gr1_unified": 20,
9
+ "agibot": 26,
10
+ "sim_behavior_r1_pro": 23,
11
+ "xdof": 24,
12
+ "xdof_oss_data": 25,
13
+ "unitree_g1_full_body_with_waist_height_nav_cmd": 25,
14
+ "real_r1_pro_sharpa": 27,
15
+ "real_r1_pro_sharpa_add_view": 27,
16
+ "real_r1_pro_sharpa_relative_arm_joint": 26,
17
+ "real_r1_pro_sharpa_delta_eef": 26,
18
+ "real_r1_pro_sharpa_absolute_eef": 26,
19
+ "real_r1_pro_sharpa_meanstd": 26,
20
+ "real_r1_pro_sharpa_relative_eef": 26,
21
+ "real_r1_pro_sharpa_relative_eef_add_view": 26,
22
+ "real_r1_pro_sharpa_relative_eef_relative_hand": 26,
23
+ "real_r1_pro_sharpa_relative_eef_human": 26,
24
+ "real_r1_pro_sharpa_relative_eef_human_add_view": 26,
25
+ "real_r1_pro_sharpa_relative_eef_human_relative_hand": 26,
26
+ "real_r1_pro_sharpa_relative_eef_egodex": 26,
27
+ "real_r1_pro_sharpa_relative_eef_egodex_relative_hand": 26,
28
+ "real_r1_pro_sharpa_relative_eef_egodex_wrist_only": 26,
29
+ "real_r1_pro_sharpa_relative_eef_maxinsights": 26,
30
+ "real_r1_pro_sharpa_relative_eef_maxinsights_relative_hand": 26,
31
+ "real_r1_pro_sharpa_relative_eef_mecka": 26,
32
+ "real_r1_pro_sharpa_relative_eef_mecka_relative_hand": 26,
33
+ "real_g1_relative_eef_absolute_joints": 25,
34
+ "real_g1_relative_eef_absolute_joints_wrist_cam": 25,
35
+ "real_g1_relative_eef_relative_joints": 25,
36
+ "real_r1_pro_sharpa_relative_eef_relative_hand_relative_joint": 26,
37
+ "real_r1_pro_sharpa_relative_joint": 29,
38
+ "oxe_droid_relative_eef_relative_joint": 24,
39
+ "oxe_droid_relative_eef_relative_joint_swapped": 24,
40
+ "oxe_droid_relative_eef_relative_joint_upweight_z": 24,
41
+ "oxe_droid_relative_eef_relative_joint_upweight_z_swapped": 24,
42
+ "oxe_droid_relative_eef_relative_joint_3view": 24,
43
+ "oxe_droid_relative_eef_relative_joint_3view_swapped": 24,
44
+ "oxe_droid_relative_eef": 24,
45
+ "oxe_droid_joint_position_relative": 24,
46
+ "xdof_relative_eef_relative_joint": 27,
47
+ "xdof_relative_eef_relative_joint_subtask": 27,
48
+ "xdof_relative_eef": 27,
49
+ "xdof_relative_joint": 28,
50
+ "simpler_env_google": 0,
51
+ "simpler_env_widowx": 1,
52
+ "libero_sim": 2,
53
+ "droid_sim": 3,
54
+ "unitree_g1_sonic": 11,
55
+ "new_embodiment": 10,
56
+ "robocasa_gr1_tabletop": 10
57
+ }
checkpoint-4000/experiment_cfg/conf.yaml ADDED
@@ -0,0 +1,251 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ load_config_path: null
2
+ model:
3
+ model_type: Gr00tN1d7
4
+ model_dtype: bfloat16
5
+ model_name: nvidia/Cosmos-Reason2-2B
6
+ backbone_model_type: qwen
7
+ model_revision: null
8
+ tune_top_llm_layers: 0
9
+ backbone_embedding_dim: 2048
10
+ tune_llm: false
11
+ tune_visual: false
12
+ select_layer: 12
13
+ reproject_vision: false
14
+ use_flash_attention: true
15
+ load_bf16: false
16
+ backbone_trainable_params_fp32: true
17
+ image_crop_size:
18
+ - 230
19
+ - 230
20
+ image_target_size:
21
+ - 256
22
+ - 256
23
+ shortest_image_edge: null
24
+ crop_fraction: null
25
+ random_rotation_angle: null
26
+ color_jitter_params:
27
+ brightness: 0.3
28
+ contrast: 0.4
29
+ saturation: 0.5
30
+ hue: 0.08
31
+ use_albumentations_transforms: true
32
+ extra_augmentation_config: null
33
+ formalize_language: true
34
+ apply_sincos_state_encoding: false
35
+ use_percentiles: true
36
+ use_relative_action: true
37
+ max_state_dim: 132
38
+ max_action_dim: 132
39
+ action_horizon: 40
40
+ hidden_size: 1024
41
+ input_embedding_dim: 1536
42
+ state_history_length: 1
43
+ add_pos_embed: true
44
+ attn_dropout: 0.2
45
+ use_vlln: true
46
+ max_seq_len: 1024
47
+ use_alternate_vl_dit: true
48
+ attend_text_every_n_blocks: 2
49
+ diffusion_model_cfg:
50
+ positional_embeddings: null
51
+ num_layers: 16
52
+ num_attention_heads: 32
53
+ attention_head_dim: 48
54
+ norm_type: ada_norm
55
+ dropout: 0.2
56
+ final_dropout: true
57
+ output_dim: 1024
58
+ interleave_self_attention: true
59
+ num_inference_timesteps: 4
60
+ noise_beta_alpha: 1.5
61
+ noise_beta_beta: 1.0
62
+ noise_s: 0.999
63
+ num_timestep_buckets: 1000
64
+ tune_projector: true
65
+ tune_diffusion_model: true
66
+ tune_vlln: true
67
+ state_dropout_prob: 0.2
68
+ exclude_state: false
69
+ use_mean_std: false
70
+ max_num_embodiments: 32
71
+ data:
72
+ datasets:
73
+ - dataset_paths:
74
+ - /home/ubuntu/groot-files/dataset
75
+ embodiment_tag: unitree_g1_sonic
76
+ mix_ratio: 1.0
77
+ dataset_type: physical_embodiment
78
+ val_dataset_path: null
79
+ modality_configs:
80
+ unitree_g1_sonic:
81
+ video:
82
+ delta_indices:
83
+ - 0
84
+ modality_keys:
85
+ - ego_view
86
+ sin_cos_embedding_keys: null
87
+ mean_std_embedding_keys: null
88
+ action_configs: null
89
+ state:
90
+ delta_indices:
91
+ - 0
92
+ modality_keys:
93
+ - left_leg
94
+ - right_leg
95
+ - waist
96
+ - left_arm
97
+ - right_arm
98
+ - left_hand
99
+ - right_hand
100
+ - projected_gravity
101
+ sin_cos_embedding_keys: null
102
+ mean_std_embedding_keys: null
103
+ action_configs: null
104
+ action:
105
+ delta_indices:
106
+ - 0
107
+ - 1
108
+ - 2
109
+ - 3
110
+ - 4
111
+ - 5
112
+ - 6
113
+ - 7
114
+ - 8
115
+ - 9
116
+ - 10
117
+ - 11
118
+ - 12
119
+ - 13
120
+ - 14
121
+ - 15
122
+ - 16
123
+ - 17
124
+ - 18
125
+ - 19
126
+ - 20
127
+ - 21
128
+ - 22
129
+ - 23
130
+ - 24
131
+ - 25
132
+ - 26
133
+ - 27
134
+ - 28
135
+ - 29
136
+ - 30
137
+ - 31
138
+ - 32
139
+ - 33
140
+ - 34
141
+ - 35
142
+ - 36
143
+ - 37
144
+ - 38
145
+ - 39
146
+ modality_keys:
147
+ - motion_token
148
+ - left_hand_joints
149
+ - right_hand_joints
150
+ sin_cos_embedding_keys: null
151
+ mean_std_embedding_keys: null
152
+ action_configs:
153
+ - rep: ABSOLUTE
154
+ type: NON_EEF
155
+ format: DEFAULT
156
+ state_key: null
157
+ - rep: ABSOLUTE
158
+ type: NON_EEF
159
+ format: DEFAULT
160
+ state_key: null
161
+ - rep: ABSOLUTE
162
+ type: NON_EEF
163
+ format: DEFAULT
164
+ state_key: null
165
+ language:
166
+ delta_indices:
167
+ - 0
168
+ modality_keys:
169
+ - annotation.human.task_description
170
+ sin_cos_embedding_keys: null
171
+ mean_std_embedding_keys: null
172
+ action_configs: null
173
+ download_cache: false
174
+ shard_size: 1024
175
+ episode_sampling_rate: 0.1
176
+ num_shards_per_epoch: 100000
177
+ override_pretraining_statistics: true
178
+ mode: single_turn
179
+ random_chop: 0.0
180
+ mock_dataset_mode: false
181
+ shuffle: true
182
+ seed: 42
183
+ multiprocessing_context: fork
184
+ allow_padding: false
185
+ subsample_ratio: 1.0
186
+ image_crop_size:
187
+ - 244
188
+ - 244
189
+ image_target_size:
190
+ - 224
191
+ - 224
192
+ video_backend: torchcodec
193
+ training:
194
+ output_dir: /home/ubuntu/groot-files/checkpoints/g1_finetune-20260526-211344-gpu2
195
+ experiment_name: null
196
+ max_steps: 20000
197
+ global_batch_size: 128
198
+ batch_size: null
199
+ gradient_accumulation_steps: 1
200
+ learning_rate: 0.0001
201
+ lr_scheduler_type: cosine
202
+ weight_decay: 1.0e-05
203
+ warmup_ratio: 0.05
204
+ warmup_steps: 0
205
+ max_grad_norm: 1.0
206
+ optim: adamw_torch
207
+ start_from_checkpoint: nvidia/GR00T-N1.7-3B
208
+ skip_weight_loading: false
209
+ tf32: true
210
+ fp16: false
211
+ bf16: true
212
+ eval_bf16: true
213
+ logging_steps: 10
214
+ save_steps: 4000
215
+ save_total_limit: 10
216
+ save_vl_model: false
217
+ save_only_model: false
218
+ upload_checkpoints: false
219
+ upload_every: 1000
220
+ upload_last_n_checkpoints: 5
221
+ max_concurrent_uploads: 2
222
+ eval_strategy: 'no'
223
+ eval_steps: 500
224
+ eval_set_split_ratio: 0.1
225
+ eval_batch_size: 2
226
+ save_best_eval_metric_name: ''
227
+ save_best_eval_metric_greater_is_better: true
228
+ deepspeed_stage: 2
229
+ gradient_checkpointing: false
230
+ transformers_trust_remote_code: true
231
+ transformers_local_files_only: false
232
+ transformers_cache_dir: null
233
+ transformers_access_token: null
234
+ use_ddp: false
235
+ ddp_bucket_cap_mb: 100
236
+ num_gpus: 1
237
+ dataloader_num_workers: 6
238
+ remove_unused_columns: false
239
+ use_wandb: true
240
+ wandb_project: groot-finetune
241
+ enable_profiling: false
242
+ max_retries: 3
243
+ assert_loss_less_than: null
244
+ add_rl_callback: false
245
+ enable_open_loop_eval: false
246
+ open_loop_eval_traj_ids:
247
+ - 0
248
+ open_loop_eval_steps_per_traj: 100
249
+ open_loop_eval_plot_indices: null
250
+ max_steps: 20000
251
+ save_steps: 4000
checkpoint-4000/experiment_cfg/config.yaml ADDED
@@ -0,0 +1,277 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:gr00t.configs.base_config.Config
2
+ data: !!python/object:gr00t.configs.data.data_config.DataConfig
3
+ allow_padding: false
4
+ datasets:
5
+ - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
6
+ dataset_paths:
7
+ - /home/ubuntu/groot-files/dataset
8
+ dataset_type: physical_embodiment
9
+ embodiment_tag: unitree_g1_sonic
10
+ mix_ratio: 1.0
11
+ val_dataset_path: null
12
+ download_cache: false
13
+ episode_sampling_rate: 0.1
14
+ image_crop_size:
15
+ - 244
16
+ - 244
17
+ image_target_size:
18
+ - 224
19
+ - 224
20
+ mock_dataset_mode: false
21
+ modality_configs:
22
+ unitree_g1_sonic:
23
+ action: !!python/object:gr00t.data.types.ModalityConfig
24
+ action_configs:
25
+ - !!python/object:gr00t.data.types.ActionConfig
26
+ format: &id001 !!python/object/apply:gr00t.data.types.ActionFormat
27
+ - default
28
+ rep: &id002 !!python/object/apply:gr00t.data.types.ActionRepresentation
29
+ - absolute
30
+ state_key: null
31
+ type: &id003 !!python/object/apply:gr00t.data.types.ActionType
32
+ - non_eef
33
+ - !!python/object:gr00t.data.types.ActionConfig
34
+ format: *id001
35
+ rep: *id002
36
+ state_key: null
37
+ type: *id003
38
+ - !!python/object:gr00t.data.types.ActionConfig
39
+ format: *id001
40
+ rep: *id002
41
+ state_key: null
42
+ type: *id003
43
+ delta_indices:
44
+ - 0
45
+ - 1
46
+ - 2
47
+ - 3
48
+ - 4
49
+ - 5
50
+ - 6
51
+ - 7
52
+ - 8
53
+ - 9
54
+ - 10
55
+ - 11
56
+ - 12
57
+ - 13
58
+ - 14
59
+ - 15
60
+ - 16
61
+ - 17
62
+ - 18
63
+ - 19
64
+ - 20
65
+ - 21
66
+ - 22
67
+ - 23
68
+ - 24
69
+ - 25
70
+ - 26
71
+ - 27
72
+ - 28
73
+ - 29
74
+ - 30
75
+ - 31
76
+ - 32
77
+ - 33
78
+ - 34
79
+ - 35
80
+ - 36
81
+ - 37
82
+ - 38
83
+ - 39
84
+ mean_std_embedding_keys: null
85
+ modality_keys:
86
+ - motion_token
87
+ - left_hand_joints
88
+ - right_hand_joints
89
+ sin_cos_embedding_keys: null
90
+ language: !!python/object:gr00t.data.types.ModalityConfig
91
+ action_configs: null
92
+ delta_indices:
93
+ - 0
94
+ mean_std_embedding_keys: null
95
+ modality_keys:
96
+ - annotation.human.task_description
97
+ sin_cos_embedding_keys: null
98
+ state: !!python/object:gr00t.data.types.ModalityConfig
99
+ action_configs: null
100
+ delta_indices:
101
+ - 0
102
+ mean_std_embedding_keys: null
103
+ modality_keys:
104
+ - left_leg
105
+ - right_leg
106
+ - waist
107
+ - left_arm
108
+ - right_arm
109
+ - left_hand
110
+ - right_hand
111
+ - projected_gravity
112
+ sin_cos_embedding_keys: null
113
+ video: !!python/object:gr00t.data.types.ModalityConfig
114
+ action_configs: null
115
+ delta_indices:
116
+ - 0
117
+ mean_std_embedding_keys: null
118
+ modality_keys:
119
+ - ego_view
120
+ sin_cos_embedding_keys: null
121
+ mode: single_turn
122
+ multiprocessing_context: fork
123
+ num_shards_per_epoch: 100000
124
+ override_pretraining_statistics: true
125
+ random_chop: 0.0
126
+ seed: 42
127
+ shard_size: 1024
128
+ shuffle: true
129
+ subsample_ratio: 1.0
130
+ video_backend: torchcodec
131
+ load_config_path: null
132
+ model: !!python/object:gr00t.configs.model.gr00t_n1d7.Gr00tN1d7Config
133
+ _attn_implementation_internal: null
134
+ _commit_hash: null
135
+ _name_or_path: ''
136
+ _output_attentions: false
137
+ add_cross_attention: false
138
+ architectures: null
139
+ backbone_trainable_params_fp32: true
140
+ bad_words_ids: null
141
+ begin_suppress_tokens: null
142
+ bos_token_id: null
143
+ chunk_size_feed_forward: 0
144
+ color_jitter_params:
145
+ brightness: 0.3
146
+ contrast: 0.4
147
+ hue: 0.08
148
+ saturation: 0.5
149
+ cross_attention_hidden_size: null
150
+ decoder_start_token_id: null
151
+ diffusion_model_cfg:
152
+ attention_head_dim: 48
153
+ dropout: 0.2
154
+ final_dropout: true
155
+ interleave_self_attention: true
156
+ norm_type: ada_norm
157
+ num_attention_heads: 32
158
+ num_layers: 16
159
+ output_dim: 1024
160
+ positional_embeddings: null
161
+ diversity_penalty: 0.0
162
+ do_sample: false
163
+ dtype: null
164
+ early_stopping: false
165
+ encoder_no_repeat_ngram_size: 0
166
+ eos_token_id: null
167
+ exponential_decay_length_penalty: null
168
+ extra_augmentation_config: null
169
+ finetuning_task: null
170
+ forced_bos_token_id: null
171
+ forced_eos_token_id: null
172
+ id2label:
173
+ 0: LABEL_0
174
+ 1: LABEL_1
175
+ is_decoder: false
176
+ is_encoder_decoder: false
177
+ label2id:
178
+ LABEL_0: 0
179
+ LABEL_1: 1
180
+ length_penalty: 1.0
181
+ load_bf16: false
182
+ max_length: 20
183
+ min_length: 0
184
+ model_name: nvidia/Cosmos-Reason2-2B
185
+ no_repeat_ngram_size: 0
186
+ num_beam_groups: 1
187
+ num_beams: 1
188
+ num_return_sequences: 1
189
+ output_hidden_states: false
190
+ output_scores: false
191
+ pad_token_id: null
192
+ prefix: null
193
+ problem_type: null
194
+ pruned_heads: {}
195
+ random_rotation_angle: null
196
+ remove_invalid_values: false
197
+ repetition_penalty: 1.0
198
+ reproject_vision: false
199
+ return_dict: true
200
+ return_dict_in_generate: false
201
+ sep_token_id: null
202
+ state_dropout_prob: 0.2
203
+ suppress_tokens: null
204
+ task_specific_params: null
205
+ temperature: 1.0
206
+ tf_legacy_loss: false
207
+ tie_encoder_decoder: false
208
+ tie_word_embeddings: true
209
+ tokenizer_class: null
210
+ top_k: 50
211
+ top_p: 1.0
212
+ torchscript: false
213
+ transformers_version: null
214
+ tune_diffusion_model: true
215
+ tune_llm: false
216
+ tune_projector: true
217
+ tune_visual: false
218
+ typical_p: 1.0
219
+ use_bfloat16: false
220
+ use_relative_action: true
221
+ training: !!python/object:gr00t.configs.training.training_config.TrainingConfig
222
+ add_rl_callback: false
223
+ assert_loss_less_than: null
224
+ batch_size: null
225
+ bf16: true
226
+ dataloader_num_workers: 6
227
+ ddp_bucket_cap_mb: 100
228
+ deepspeed_stage: 2
229
+ enable_open_loop_eval: false
230
+ enable_profiling: false
231
+ eval_batch_size: 2
232
+ eval_bf16: true
233
+ eval_set_split_ratio: 0.1
234
+ eval_steps: 500
235
+ eval_strategy: 'no'
236
+ experiment_name: null
237
+ fp16: false
238
+ global_batch_size: 128
239
+ gradient_accumulation_steps: 1
240
+ gradient_checkpointing: false
241
+ learning_rate: 0.0001
242
+ logging_steps: 10
243
+ lr_scheduler_type: cosine
244
+ max_concurrent_uploads: 2
245
+ max_grad_norm: 1.0
246
+ max_retries: 3
247
+ max_steps: 20000
248
+ num_gpus: 1
249
+ open_loop_eval_plot_indices: null
250
+ open_loop_eval_steps_per_traj: 100
251
+ open_loop_eval_traj_ids:
252
+ - 0
253
+ optim: adamw_torch
254
+ output_dir: /home/ubuntu/groot-files/checkpoints/g1_finetune-20260526-211344-gpu2
255
+ remove_unused_columns: false
256
+ save_best_eval_metric_greater_is_better: true
257
+ save_best_eval_metric_name: ''
258
+ save_only_model: false
259
+ save_steps: 4000
260
+ save_total_limit: 10
261
+ save_vl_model: false
262
+ skip_weight_loading: false
263
+ start_from_checkpoint: nvidia/GR00T-N1.7-3B
264
+ tf32: true
265
+ transformers_access_token: null
266
+ transformers_cache_dir: null
267
+ transformers_local_files_only: false
268
+ transformers_trust_remote_code: true
269
+ upload_checkpoints: false
270
+ upload_every: 1000
271
+ upload_last_n_checkpoints: 5
272
+ use_ddp: false
273
+ use_wandb: true
274
+ wandb_project: groot-finetune
275
+ warmup_ratio: 0.05
276
+ warmup_steps: 0
277
+ weight_decay: 1.0e-05
checkpoint-4000/experiment_cfg/dataset_statistics.json ADDED
@@ -0,0 +1,907 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "unitree_g1_sonic": {
3
+ "state": {
4
+ "left_leg": {
5
+ "min": [
6
+ -0.4857776165008545,
7
+ -0.24391146004199982,
8
+ -0.8776780366897583,
9
+ 0.03597185015678406,
10
+ -0.4930363595485687,
11
+ -0.20340518653392792
12
+ ],
13
+ "max": [
14
+ 0.3237466514110565,
15
+ 0.31727835536003113,
16
+ 0.7570706605911255,
17
+ 0.8986315131187439,
18
+ 0.1892659068107605,
19
+ 0.15561887621879578
20
+ ],
21
+ "mean": [
22
+ 0.038367897272109985,
23
+ 0.017137423157691956,
24
+ 0.10202965885400772,
25
+ 0.21319514513015747,
26
+ -0.20034761726856232,
27
+ -0.009860903024673462
28
+ ],
29
+ "std": [
30
+ 0.12473291903734207,
31
+ 0.0657326877117157,
32
+ 0.16789446771144867,
33
+ 0.0855027362704277,
34
+ 0.05454540252685547,
35
+ 0.043583426624536514
36
+ ],
37
+ "q01": [
38
+ -0.3429580569267273,
39
+ -0.14271177425980566,
40
+ -0.41709126979112626,
41
+ 0.12328944355249405,
42
+ -0.2934864178299904,
43
+ -0.11147186532616615
44
+ ],
45
+ "q99": [
46
+ 0.18860293924808502,
47
+ 0.17139848843216907,
48
+ 0.4404219493269922,
49
+ 0.5360466212034226,
50
+ -0.019520661234855623,
51
+ 0.09359118081629283
52
+ ]
53
+ },
54
+ "right_leg": {
55
+ "min": [
56
+ -0.5335952043533325,
57
+ -0.350761741399765,
58
+ -1.3307929039001465,
59
+ 0.07445771992206573,
60
+ -0.6092288494110107,
61
+ -0.1984633058309555
62
+ ],
63
+ "max": [
64
+ 0.25397607684135437,
65
+ 0.15654273331165314,
66
+ 0.24837948381900787,
67
+ 0.9999935626983643,
68
+ 0.1089707612991333,
69
+ 0.17701147496700287
70
+ ],
71
+ "mean": [
72
+ 0.05046115070581436,
73
+ -0.023679343983530998,
74
+ -0.213065966963768,
75
+ 0.20844903588294983,
76
+ -0.19808240234851837,
77
+ -0.0055496226996183395
78
+ ],
79
+ "std": [
80
+ 0.07887373864650726,
81
+ 0.06217808276414871,
82
+ 0.18437089025974274,
83
+ 0.10042016953229904,
84
+ 0.06798264384269714,
85
+ 0.04407079145312309
86
+ ],
87
+ "q01": [
88
+ -0.193911362439394,
89
+ -0.1981988400220871,
90
+ -0.90549436211586,
91
+ 0.127213454246521,
92
+ -0.4343456655740738,
93
+ -0.11320190876722336
94
+ ],
95
+ "q99": [
96
+ 0.1967100210487844,
97
+ 0.11513377726078033,
98
+ 0.15384408906102207,
99
+ 0.7395615458488474,
100
+ -0.05514147877693175,
101
+ 0.08568341806530994
102
+ ]
103
+ },
104
+ "waist": {
105
+ "min": [
106
+ -0.3889274299144745,
107
+ -0.3032904267311096,
108
+ -0.04627600684762001
109
+ ],
110
+ "max": [
111
+ 0.4404728412628174,
112
+ 0.11908156424760818,
113
+ 0.05046159774065018
114
+ ],
115
+ "mean": [
116
+ 0.1003476083278656,
117
+ -0.03575156629085541,
118
+ -0.0004057084152009338
119
+ ],
120
+ "std": [
121
+ 0.11155267059803009,
122
+ 0.044356729835271835,
123
+ 0.007639772724360228
124
+ ],
125
+ "q01": [
126
+ -0.09896008186042309,
127
+ -0.16525592356920243,
128
+ -0.019172759167850016
129
+ ],
130
+ "q99": [
131
+ 0.3729535743594171,
132
+ 0.04077914115041498,
133
+ 0.024438940081745388
134
+ ]
135
+ },
136
+ "left_arm": {
137
+ "min": [
138
+ -0.2003283053636551,
139
+ 0.09816279262304306,
140
+ -0.5412195920944214,
141
+ 0.7723593711853027,
142
+ -0.7412483096122742,
143
+ -0.09287774562835693,
144
+ -0.31815722584724426
145
+ ],
146
+ "max": [
147
+ 0.4134317934513092,
148
+ 0.38915175199508667,
149
+ 0.3470511734485626,
150
+ 1.363792896270752,
151
+ 0.38266828656196594,
152
+ 0.5152138471603394,
153
+ 0.42312705516815186
154
+ ],
155
+ "mean": [
156
+ 0.17467822134494781,
157
+ 0.20962199568748474,
158
+ 0.03295444697141647,
159
+ 1.0894439220428467,
160
+ -0.11893314123153687,
161
+ 0.20652393996715546,
162
+ 0.01763514056801796
163
+ ],
164
+ "std": [
165
+ 0.08956529945135117,
166
+ 0.03943527489900589,
167
+ 0.09209521114826202,
168
+ 0.07066802680492401,
169
+ 0.19965490698814392,
170
+ 0.11541580408811569,
171
+ 0.10361754149198532
172
+ ],
173
+ "q01": [
174
+ -0.06361526139080524,
175
+ 0.1356973797082901,
176
+ -0.1961050637066364,
177
+ 0.9089213967323303,
178
+ -0.5769511580467224,
179
+ -0.03977684192359447,
180
+ -0.22587568387389184
181
+ ],
182
+ "q99": [
183
+ 0.3310546398162843,
184
+ 0.31673349142074597,
185
+ 0.2289490304887296,
186
+ 1.2593449354171753,
187
+ 0.2899013936519628,
188
+ 0.46442466974258423,
189
+ 0.2727669641375545
190
+ ]
191
+ },
192
+ "right_arm": {
193
+ "min": [
194
+ -0.9788835048675537,
195
+ -0.7953690886497498,
196
+ -0.49778875708580017,
197
+ -0.7156979441642761,
198
+ -0.9786917567253113,
199
+ -0.1273084282875061,
200
+ -0.9962846040725708
201
+ ],
202
+ "max": [
203
+ 0.3628104329109192,
204
+ 0.08640626072883606,
205
+ 0.8718883395195007,
206
+ 1.3758729696273804,
207
+ 1.0651459693908691,
208
+ 0.6638182401657104,
209
+ 0.9581388235092163
210
+ ],
211
+ "mean": [
212
+ -0.14295516908168793,
213
+ -0.20207007229328156,
214
+ 0.164081871509552,
215
+ 0.32978397607803345,
216
+ 0.15659268200397491,
217
+ 0.21257737278938293,
218
+ 0.0897224023938179
219
+ ],
220
+ "std": [
221
+ 0.2832476496696472,
222
+ 0.07377105951309204,
223
+ 0.18590903282165527,
224
+ 0.6193384528160095,
225
+ 0.20538125932216644,
226
+ 0.12802571058273315,
227
+ 0.21542473137378693
228
+ ],
229
+ "q01": [
230
+ -0.7704071193933487,
231
+ -0.376973994076252,
232
+ -0.19678157344460487,
233
+ -0.5173931628465652,
234
+ -0.39670541584491725,
235
+ -0.03838966768234967,
236
+ -0.3572006195783615
237
+ ],
238
+ "q99": [
239
+ 0.24905617535114288,
240
+ 0.0024351945263335014,
241
+ 0.586448073387146,
242
+ 1.304707604646683,
243
+ 0.5929710775613787,
244
+ 0.5161845684051514,
245
+ 0.6641693621873858
246
+ ]
247
+ },
248
+ "left_hand": {
249
+ "min": [
250
+ 0.0,
251
+ 0.0,
252
+ 0.0,
253
+ 0.0,
254
+ 0.0,
255
+ 0.0,
256
+ 0.0
257
+ ],
258
+ "max": [
259
+ 0.0,
260
+ 0.0,
261
+ 0.0,
262
+ 0.0,
263
+ 0.0,
264
+ 0.0,
265
+ 0.0
266
+ ],
267
+ "mean": [
268
+ 0.0,
269
+ 0.0,
270
+ 0.0,
271
+ 0.0,
272
+ 0.0,
273
+ 0.0,
274
+ 0.0
275
+ ],
276
+ "std": [
277
+ 0.0,
278
+ 0.0,
279
+ 0.0,
280
+ 0.0,
281
+ 0.0,
282
+ 0.0,
283
+ 0.0
284
+ ],
285
+ "q01": [
286
+ 0.0,
287
+ 0.0,
288
+ 0.0,
289
+ 0.0,
290
+ 0.0,
291
+ 0.0,
292
+ 0.0
293
+ ],
294
+ "q99": [
295
+ 0.0,
296
+ 0.0,
297
+ 0.0,
298
+ 0.0,
299
+ 0.0,
300
+ 0.0,
301
+ 0.0
302
+ ]
303
+ },
304
+ "right_hand": {
305
+ "min": [
306
+ 0.0,
307
+ 0.0,
308
+ 0.0,
309
+ 0.0,
310
+ 0.0,
311
+ 0.0,
312
+ 0.0
313
+ ],
314
+ "max": [
315
+ 0.0,
316
+ 0.0,
317
+ 0.0,
318
+ 0.0,
319
+ 0.0,
320
+ 0.0,
321
+ 0.0
322
+ ],
323
+ "mean": [
324
+ 0.0,
325
+ 0.0,
326
+ 0.0,
327
+ 0.0,
328
+ 0.0,
329
+ 0.0,
330
+ 0.0
331
+ ],
332
+ "std": [
333
+ 0.0,
334
+ 0.0,
335
+ 0.0,
336
+ 0.0,
337
+ 0.0,
338
+ 0.0,
339
+ 0.0
340
+ ],
341
+ "q01": [
342
+ 0.0,
343
+ 0.0,
344
+ 0.0,
345
+ 0.0,
346
+ 0.0,
347
+ 0.0,
348
+ 0.0
349
+ ],
350
+ "q99": [
351
+ 0.0,
352
+ 0.0,
353
+ 0.0,
354
+ 0.0,
355
+ 0.0,
356
+ 0.0,
357
+ 0.0
358
+ ]
359
+ },
360
+ "projected_gravity": {
361
+ "min": [
362
+ -0.12354099005460739,
363
+ -0.13017292320728302,
364
+ -1.0
365
+ ],
366
+ "max": [
367
+ 0.22223307192325592,
368
+ 0.10705921798944473,
369
+ -0.9749471545219421
370
+ ],
371
+ "mean": [
372
+ -0.01818661577999592,
373
+ 0.0029902660753577948,
374
+ -0.9988934993743896
375
+ ],
376
+ "std": [
377
+ 0.03578517585992813,
378
+ 0.032206468284130096,
379
+ 0.0014198371209307285
380
+ ],
381
+ "q01": [
382
+ -0.09425989575684071,
383
+ -0.08990333564579486,
384
+ -0.9999815225601196
385
+ ],
386
+ "q99": [
387
+ 0.06742736026644708,
388
+ 0.06235775817185641,
389
+ -0.9940253734588623
390
+ ]
391
+ }
392
+ },
393
+ "action": {
394
+ "motion_token": {
395
+ "min": [
396
+ -0.3125,
397
+ -0.5,
398
+ -0.5,
399
+ -0.4375,
400
+ -0.625,
401
+ -0.375,
402
+ -0.25,
403
+ -0.0625,
404
+ -0.4375,
405
+ -0.6875,
406
+ -0.375,
407
+ -0.375,
408
+ -0.3125,
409
+ -0.375,
410
+ -0.6875,
411
+ -0.25,
412
+ -0.375,
413
+ -0.25,
414
+ -0.375,
415
+ -0.5,
416
+ -0.5,
417
+ -0.5,
418
+ -0.625,
419
+ -0.5,
420
+ -0.375,
421
+ -0.5625,
422
+ -0.125,
423
+ -0.5,
424
+ -0.3125,
425
+ -0.3125,
426
+ -0.125,
427
+ -0.375,
428
+ 0.0625,
429
+ -0.1875,
430
+ -0.1875,
431
+ -0.5625,
432
+ -0.6875,
433
+ -0.6875,
434
+ -0.125,
435
+ -0.125,
436
+ -0.4375,
437
+ -0.5625,
438
+ -0.3125,
439
+ -0.375,
440
+ -0.5,
441
+ -0.4375,
442
+ -0.125,
443
+ -0.3125,
444
+ -0.5,
445
+ -0.25,
446
+ -0.375,
447
+ -0.625,
448
+ -0.0625,
449
+ -0.4375,
450
+ -0.0625,
451
+ -0.4375,
452
+ -0.5,
453
+ 0.0,
454
+ -0.25,
455
+ -0.5,
456
+ -0.375,
457
+ -0.1875,
458
+ 0.0,
459
+ -0.5
460
+ ],
461
+ "max": [
462
+ 0.125,
463
+ 0.25,
464
+ 0.25,
465
+ 0.125,
466
+ 0.1875,
467
+ 0.1875,
468
+ 0.5,
469
+ 0.4375,
470
+ 0.25,
471
+ 0.125,
472
+ 0.1875,
473
+ 0.0625,
474
+ 0.125,
475
+ 0.3125,
476
+ -0.0625,
477
+ 0.1875,
478
+ 0.25,
479
+ 0.25,
480
+ 0.125,
481
+ 0.0625,
482
+ 0.3125,
483
+ 0.125,
484
+ 0.25,
485
+ 0.25,
486
+ 0.3125,
487
+ 0.125,
488
+ 0.375,
489
+ 0.1875,
490
+ 0.375,
491
+ 0.375,
492
+ 0.375,
493
+ 0.25,
494
+ 0.4375,
495
+ 0.5,
496
+ 0.5,
497
+ 0.5625,
498
+ 0.25,
499
+ -0.0625,
500
+ 0.3125,
501
+ 0.4375,
502
+ 0.125,
503
+ 0.4375,
504
+ 0.4375,
505
+ 0.375,
506
+ -0.0625,
507
+ 0.1875,
508
+ 0.5625,
509
+ 0.1875,
510
+ 0.3125,
511
+ 0.1875,
512
+ 0.25,
513
+ 0.1875,
514
+ 0.375,
515
+ 0.3125,
516
+ 0.5625,
517
+ 0.1875,
518
+ 0.4375,
519
+ 0.5625,
520
+ 0.1875,
521
+ 0.375,
522
+ 0.3125,
523
+ 0.4375,
524
+ 0.5625,
525
+ 0.0
526
+ ],
527
+ "mean": [
528
+ -0.05732722207903862,
529
+ -0.12596048414707184,
530
+ -0.015900524333119392,
531
+ -0.16434414684772491,
532
+ -0.18957528471946716,
533
+ -0.08797170221805573,
534
+ 0.2548595666885376,
535
+ 0.19856274127960205,
536
+ -0.025066815316677094,
537
+ -0.21372610330581665,
538
+ -0.10314688086509705,
539
+ -0.21981850266456604,
540
+ -0.12050355225801468,
541
+ -0.08165144175291061,
542
+ -0.38714757561683655,
543
+ -8.805885590845719e-05,
544
+ -0.049404650926589966,
545
+ -0.055493421852588654,
546
+ -0.09600593894720078,
547
+ -0.2977478802204132,
548
+ -0.029102997854351997,
549
+ -0.2329292893409729,
550
+ -0.19594638049602509,
551
+ -0.23360289633274078,
552
+ -0.095408596098423,
553
+ -0.17069709300994873,
554
+ 0.1292250156402588,
555
+ -0.2315811812877655,
556
+ 0.07302621006965637,
557
+ 0.06577451527118683,
558
+ 0.1414906084537506,
559
+ -0.11845822632312775,
560
+ 0.2995853126049042,
561
+ 0.17635828256607056,
562
+ 0.14573286473751068,
563
+ 0.0782189592719078,
564
+ -0.1727832704782486,
565
+ -0.3186105489730835,
566
+ 0.11981905251741409,
567
+ 0.13200204074382782,
568
+ -0.08226785063743591,
569
+ -0.09514441341161728,
570
+ 0.060834143310785294,
571
+ -0.006165935657918453,
572
+ -0.3161884844303131,
573
+ -0.02333650551736355,
574
+ 0.21719853579998016,
575
+ -0.10866008698940277,
576
+ -0.01649424061179161,
577
+ -0.007006580010056496,
578
+ -0.06802137941122055,
579
+ -0.14377468824386597,
580
+ 0.21333755552768707,
581
+ 0.015348567627370358,
582
+ 0.22719819843769073,
583
+ -0.1495230346918106,
584
+ 0.030986731871962547,
585
+ 0.296153724193573,
586
+ -0.023153124377131462,
587
+ -0.1389232873916626,
588
+ 0.035359714180231094,
589
+ 0.10143018513917923,
590
+ 0.30849015712738037,
591
+ -0.22524820268154144
592
+ ],
593
+ "std": [
594
+ 0.06542618572711945,
595
+ 0.09994574636220932,
596
+ 0.07207678258419037,
597
+ 0.08702709525823593,
598
+ 0.17209544777870178,
599
+ 0.0581701286137104,
600
+ 0.09559116512537003,
601
+ 0.07802454382181168,
602
+ 0.13620688021183014,
603
+ 0.1569388061761856,
604
+ 0.0967717096209526,
605
+ 0.0680033266544342,
606
+ 0.05837923660874367,
607
+ 0.11557621508836746,
608
+ 0.11890240013599396,
609
+ 0.08077684044837952,
610
+ 0.06398067623376846,
611
+ 0.06826013326644897,
612
+ 0.09755037724971771,
613
+ 0.10724268853664398,
614
+ 0.1992810219526291,
615
+ 0.12710419297218323,
616
+ 0.21719561517238617,
617
+ 0.14369657635688782,
618
+ 0.08655858784914017,
619
+ 0.11142221838235855,
620
+ 0.057688891887664795,
621
+ 0.18031662702560425,
622
+ 0.0692613422870636,
623
+ 0.16206243634223938,
624
+ 0.11068906635046005,
625
+ 0.06650221347808838,
626
+ 0.06952458620071411,
627
+ 0.10304083675146103,
628
+ 0.12724509835243225,
629
+ 0.3227654695510864,
630
+ 0.14636477828025818,
631
+ 0.08603093028068542,
632
+ 0.08780314773321152,
633
+ 0.06147885322570801,
634
+ 0.07425742596387863,
635
+ 0.27255958318710327,
636
+ 0.13721545040607452,
637
+ 0.10124049335718155,
638
+ 0.06286311149597168,
639
+ 0.0642034038901329,
640
+ 0.08693595230579376,
641
+ 0.06350599974393845,
642
+ 0.11969305574893951,
643
+ 0.06820058822631836,
644
+ 0.09139743447303772,
645
+ 0.1545047014951706,
646
+ 0.06951460987329483,
647
+ 0.08810964971780777,
648
+ 0.0868336483836174,
649
+ 0.0749349296092987,
650
+ 0.09778603166341782,
651
+ 0.11456362158060074,
652
+ 0.06560879200696945,
653
+ 0.2043108344078064,
654
+ 0.07238639891147614,
655
+ 0.0965481698513031,
656
+ 0.11412639170885086,
657
+ 0.11945699900388718
658
+ ],
659
+ "q01": [
660
+ -0.1875,
661
+ -0.375,
662
+ -0.1875,
663
+ -0.375,
664
+ -0.5625,
665
+ -0.1875,
666
+ 0.0625,
667
+ 0.0,
668
+ -0.3125,
669
+ -0.625,
670
+ -0.3125,
671
+ -0.3125,
672
+ -0.25,
673
+ -0.3125,
674
+ -0.625,
675
+ -0.1875,
676
+ -0.25,
677
+ -0.1875,
678
+ -0.3125,
679
+ -0.5,
680
+ -0.375,
681
+ -0.4375,
682
+ -0.5625,
683
+ -0.4375,
684
+ -0.3125,
685
+ -0.5,
686
+ -0.0625,
687
+ -0.5,
688
+ -0.0625,
689
+ -0.1875,
690
+ -0.0625,
691
+ -0.25,
692
+ 0.125,
693
+ -0.0625,
694
+ -0.0625,
695
+ -0.5,
696
+ -0.5625,
697
+ -0.5625,
698
+ -0.0625,
699
+ 0.0,
700
+ -0.25,
701
+ -0.5625,
702
+ -0.1875,
703
+ -0.25,
704
+ -0.4375,
705
+ -0.1875,
706
+ 0.0625,
707
+ -0.25,
708
+ -0.375,
709
+ -0.1875,
710
+ -0.3125,
711
+ -0.5,
712
+ 0.0625,
713
+ -0.1875,
714
+ 0.0625,
715
+ -0.375,
716
+ -0.375,
717
+ 0.0625,
718
+ -0.1875,
719
+ -0.4375,
720
+ -0.1875,
721
+ -0.0625,
722
+ 0.125,
723
+ -0.4375
724
+ ],
725
+ "q99": [
726
+ 0.0625,
727
+ 0.0625,
728
+ 0.1875,
729
+ 0.0,
730
+ 0.125,
731
+ 0.0625,
732
+ 0.375,
733
+ 0.375,
734
+ 0.1875,
735
+ 0.0625,
736
+ 0.0625,
737
+ -0.0625,
738
+ 0.0625,
739
+ 0.1875,
740
+ -0.125,
741
+ 0.125,
742
+ 0.125,
743
+ 0.125,
744
+ 0.0625,
745
+ -0.0625,
746
+ 0.25,
747
+ 0.0,
748
+ 0.1875,
749
+ 0.125,
750
+ 0.0625,
751
+ 0.0,
752
+ 0.25,
753
+ 0.125,
754
+ 0.25,
755
+ 0.3125,
756
+ 0.3125,
757
+ 0.0625,
758
+ 0.375,
759
+ 0.375,
760
+ 0.4375,
761
+ 0.5,
762
+ 0.125,
763
+ -0.125,
764
+ 0.3125,
765
+ 0.25,
766
+ 0.0625,
767
+ 0.3125,
768
+ 0.3125,
769
+ 0.25,
770
+ -0.125,
771
+ 0.125,
772
+ 0.4375,
773
+ 0.0,
774
+ 0.1875,
775
+ 0.125,
776
+ 0.125,
777
+ 0.125,
778
+ 0.375,
779
+ 0.1875,
780
+ 0.5,
781
+ 0.0625,
782
+ 0.25,
783
+ 0.5,
784
+ 0.125,
785
+ 0.1875,
786
+ 0.25,
787
+ 0.3125,
788
+ 0.5,
789
+ 0.0
790
+ ]
791
+ },
792
+ "left_hand_joints": {
793
+ "min": [
794
+ 0.0,
795
+ 0.0,
796
+ 0.0,
797
+ 0.0,
798
+ 0.0,
799
+ 0.0,
800
+ 0.0
801
+ ],
802
+ "max": [
803
+ 0.0,
804
+ 0.0,
805
+ 0.0,
806
+ 0.0,
807
+ 0.0,
808
+ 0.0,
809
+ 0.0
810
+ ],
811
+ "mean": [
812
+ 0.0,
813
+ 0.0,
814
+ 0.0,
815
+ 0.0,
816
+ 0.0,
817
+ 0.0,
818
+ 0.0
819
+ ],
820
+ "std": [
821
+ 0.0,
822
+ 0.0,
823
+ 0.0,
824
+ 0.0,
825
+ 0.0,
826
+ 0.0,
827
+ 0.0
828
+ ],
829
+ "q01": [
830
+ 0.0,
831
+ 0.0,
832
+ 0.0,
833
+ 0.0,
834
+ 0.0,
835
+ 0.0,
836
+ 0.0
837
+ ],
838
+ "q99": [
839
+ 0.0,
840
+ 0.0,
841
+ 0.0,
842
+ 0.0,
843
+ 0.0,
844
+ 0.0,
845
+ 0.0
846
+ ]
847
+ },
848
+ "right_hand_joints": {
849
+ "min": [
850
+ 0.0,
851
+ 0.0,
852
+ 0.0,
853
+ 0.0,
854
+ 0.0,
855
+ 0.0,
856
+ 0.0
857
+ ],
858
+ "max": [
859
+ 0.0,
860
+ 0.0,
861
+ 0.0,
862
+ 0.0,
863
+ 0.0,
864
+ 0.0,
865
+ 0.0
866
+ ],
867
+ "mean": [
868
+ 0.0,
869
+ 0.0,
870
+ 0.0,
871
+ 0.0,
872
+ 0.0,
873
+ 0.0,
874
+ 0.0
875
+ ],
876
+ "std": [
877
+ 0.0,
878
+ 0.0,
879
+ 0.0,
880
+ 0.0,
881
+ 0.0,
882
+ 0.0,
883
+ 0.0
884
+ ],
885
+ "q01": [
886
+ 0.0,
887
+ 0.0,
888
+ 0.0,
889
+ 0.0,
890
+ 0.0,
891
+ 0.0,
892
+ 0.0
893
+ ],
894
+ "q99": [
895
+ 0.0,
896
+ 0.0,
897
+ 0.0,
898
+ 0.0,
899
+ 0.0,
900
+ 0.0,
901
+ 0.0
902
+ ]
903
+ }
904
+ },
905
+ "relative_action": {}
906
+ }
907
+ }
checkpoint-4000/experiment_cfg/final_model_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "Gr00tN1d7",
3
+ "model_dtype": "bfloat16",
4
+ "model_name": "nvidia/Cosmos-Reason2-2B",
5
+ "backbone_model_type": "qwen",
6
+ "model_revision": null,
7
+ "tune_top_llm_layers": 0,
8
+ "backbone_embedding_dim": 2048,
9
+ "tune_llm": false,
10
+ "tune_visual": false,
11
+ "select_layer": 16,
12
+ "reproject_vision": false,
13
+ "use_flash_attention": true,
14
+ "load_bf16": false,
15
+ "backbone_trainable_params_fp32": true,
16
+ "extra_augmentation_config": null,
17
+ "apply_sincos_state_encoding": false,
18
+ "use_percentiles": true,
19
+ "use_relative_action": false,
20
+ "max_state_dim": 132,
21
+ "max_action_dim": 132,
22
+ "action_horizon": 40,
23
+ "hidden_size": 1024,
24
+ "input_embedding_dim": 1536,
25
+ "state_history_length": 1,
26
+ "add_pos_embed": true,
27
+ "attn_dropout": 0.2,
28
+ "use_vlln": true,
29
+ "max_seq_len": 1024,
30
+ "use_alternate_vl_dit": true,
31
+ "attend_text_every_n_blocks": 2,
32
+ "diffusion_model_cfg": {
33
+ "attention_head_dim": 48,
34
+ "dropout": 0.2,
35
+ "final_dropout": true,
36
+ "interleave_self_attention": true,
37
+ "norm_type": "ada_norm",
38
+ "num_attention_heads": 32,
39
+ "num_layers": 32,
40
+ "output_dim": 1024,
41
+ "positional_embeddings": null
42
+ },
43
+ "num_inference_timesteps": 4,
44
+ "noise_beta_alpha": 1.5,
45
+ "noise_beta_beta": 1.0,
46
+ "noise_s": 0.999,
47
+ "num_timestep_buckets": 1000,
48
+ "tune_projector": true,
49
+ "tune_diffusion_model": true,
50
+ "tune_vlln": true,
51
+ "state_dropout_prob": 0.2,
52
+ "exclude_state": false,
53
+ "use_mean_std": false,
54
+ "max_num_embodiments": 32
55
+ }
checkpoint-4000/experiment_cfg/final_processor_config.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-4000/model-00001-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbcaea5ee88f1e0f1465043920a2647c67e7de17d24adfd1c477742a6168edec
3
+ size 4986649584
checkpoint-4000/model-00002-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f20b05362a61144d0d23ff607b3410b769e653f9cd02b6f78f6c3a4375aaf057
3
+ size 4970792616
checkpoint-4000/model-00003-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:765a0ce59c06edc53d8371d666a0f6767b1e523c80324533ef5cab833de7dedb
3
+ size 2618758696
checkpoint-4000/model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-4000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2797d0d0087270c1480c0bc77561587ce776cccff82ce641eb8bbbd35bb6e97
3
+ size 12964594710
checkpoint-4000/processor_config.json ADDED
@@ -0,0 +1,1159 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "processor_class": "Gr00tN1d7Processor",
3
+ "processor_kwargs": {
4
+ "modality_configs": {
5
+ "real_g1_relative_eef_relative_joints": {
6
+ "video": {
7
+ "delta_indices": [
8
+ -20,
9
+ 0
10
+ ],
11
+ "modality_keys": [
12
+ "ego_view"
13
+ ],
14
+ "sin_cos_embedding_keys": null,
15
+ "mean_std_embedding_keys": null,
16
+ "action_configs": null
17
+ },
18
+ "state": {
19
+ "delta_indices": [
20
+ 0
21
+ ],
22
+ "modality_keys": [
23
+ "left_wrist_eef_9d",
24
+ "right_wrist_eef_9d",
25
+ "left_hand",
26
+ "right_hand",
27
+ "left_arm",
28
+ "right_arm",
29
+ "waist"
30
+ ],
31
+ "sin_cos_embedding_keys": null,
32
+ "mean_std_embedding_keys": null,
33
+ "action_configs": null
34
+ },
35
+ "action": {
36
+ "delta_indices": [
37
+ 0,
38
+ 1,
39
+ 2,
40
+ 3,
41
+ 4,
42
+ 5,
43
+ 6,
44
+ 7,
45
+ 8,
46
+ 9,
47
+ 10,
48
+ 11,
49
+ 12,
50
+ 13,
51
+ 14,
52
+ 15,
53
+ 16,
54
+ 17,
55
+ 18,
56
+ 19,
57
+ 20,
58
+ 21,
59
+ 22,
60
+ 23,
61
+ 24,
62
+ 25,
63
+ 26,
64
+ 27,
65
+ 28,
66
+ 29,
67
+ 30,
68
+ 31,
69
+ 32,
70
+ 33,
71
+ 34,
72
+ 35,
73
+ 36,
74
+ 37,
75
+ 38,
76
+ 39
77
+ ],
78
+ "modality_keys": [
79
+ "left_wrist_eef_9d",
80
+ "right_wrist_eef_9d",
81
+ "left_hand",
82
+ "right_hand",
83
+ "left_arm",
84
+ "right_arm",
85
+ "waist",
86
+ "base_height_command",
87
+ "navigate_command"
88
+ ],
89
+ "sin_cos_embedding_keys": null,
90
+ "mean_std_embedding_keys": null,
91
+ "action_configs": [
92
+ {
93
+ "rep": "RELATIVE",
94
+ "type": "EEF",
95
+ "format": "XYZ_ROT6D",
96
+ "state_key": "left_wrist_eef_9d"
97
+ },
98
+ {
99
+ "rep": "RELATIVE",
100
+ "type": "EEF",
101
+ "format": "XYZ_ROT6D",
102
+ "state_key": "right_wrist_eef_9d"
103
+ },
104
+ {
105
+ "rep": "ABSOLUTE",
106
+ "type": "NON_EEF",
107
+ "format": "DEFAULT",
108
+ "state_key": "left_hand"
109
+ },
110
+ {
111
+ "rep": "ABSOLUTE",
112
+ "type": "NON_EEF",
113
+ "format": "DEFAULT",
114
+ "state_key": "right_hand"
115
+ },
116
+ {
117
+ "rep": "RELATIVE",
118
+ "type": "NON_EEF",
119
+ "format": "DEFAULT",
120
+ "state_key": "left_arm"
121
+ },
122
+ {
123
+ "rep": "RELATIVE",
124
+ "type": "NON_EEF",
125
+ "format": "DEFAULT",
126
+ "state_key": "right_arm"
127
+ },
128
+ {
129
+ "rep": "ABSOLUTE",
130
+ "type": "NON_EEF",
131
+ "format": "DEFAULT",
132
+ "state_key": "waist"
133
+ },
134
+ {
135
+ "rep": "ABSOLUTE",
136
+ "type": "NON_EEF",
137
+ "format": "DEFAULT",
138
+ "state_key": "base_height_command"
139
+ },
140
+ {
141
+ "rep": "ABSOLUTE",
142
+ "type": "NON_EEF",
143
+ "format": "DEFAULT",
144
+ "state_key": "navigate_command"
145
+ }
146
+ ]
147
+ },
148
+ "language": {
149
+ "delta_indices": [
150
+ 0
151
+ ],
152
+ "modality_keys": [
153
+ "annotation.human.task_description"
154
+ ],
155
+ "sin_cos_embedding_keys": null,
156
+ "mean_std_embedding_keys": null,
157
+ "action_configs": null
158
+ }
159
+ },
160
+ "real_r1_pro_sharpa_relative_eef_mecka": {
161
+ "video": {
162
+ "delta_indices": [
163
+ -30,
164
+ 0
165
+ ],
166
+ "modality_keys": [
167
+ "ego_view_cropratio_res320x240_freq30"
168
+ ],
169
+ "sin_cos_embedding_keys": null,
170
+ "mean_std_embedding_keys": null,
171
+ "action_configs": null
172
+ },
173
+ "state": {
174
+ "delta_indices": [
175
+ 0
176
+ ],
177
+ "modality_keys": [
178
+ "left_wrist_eef",
179
+ "right_wrist_eef",
180
+ "left_hand_joints",
181
+ "right_hand_joints"
182
+ ],
183
+ "sin_cos_embedding_keys": null,
184
+ "mean_std_embedding_keys": null,
185
+ "action_configs": null
186
+ },
187
+ "action": {
188
+ "delta_indices": [
189
+ 0,
190
+ 1,
191
+ 2,
192
+ 3,
193
+ 4,
194
+ 5,
195
+ 6,
196
+ 7,
197
+ 8,
198
+ 9,
199
+ 10,
200
+ 11,
201
+ 12,
202
+ 13,
203
+ 14,
204
+ 15,
205
+ 16,
206
+ 17,
207
+ 18,
208
+ 19,
209
+ 20,
210
+ 21,
211
+ 22,
212
+ 23,
213
+ 24,
214
+ 25,
215
+ 26,
216
+ 27,
217
+ 28,
218
+ 29,
219
+ 30,
220
+ 31,
221
+ 32,
222
+ 33,
223
+ 34,
224
+ 35,
225
+ 36,
226
+ 37,
227
+ 38,
228
+ 39
229
+ ],
230
+ "modality_keys": [
231
+ "left_wrist_eef",
232
+ "right_wrist_eef",
233
+ "left_hand_joints",
234
+ "right_hand_joints"
235
+ ],
236
+ "sin_cos_embedding_keys": null,
237
+ "mean_std_embedding_keys": null,
238
+ "action_configs": [
239
+ {
240
+ "rep": "RELATIVE",
241
+ "type": "EEF",
242
+ "format": "XYZ_ROT6D",
243
+ "state_key": "left_wrist_eef"
244
+ },
245
+ {
246
+ "rep": "RELATIVE",
247
+ "type": "EEF",
248
+ "format": "XYZ_ROT6D",
249
+ "state_key": "right_wrist_eef"
250
+ },
251
+ {
252
+ "rep": "ABSOLUTE",
253
+ "type": "NON_EEF",
254
+ "format": "DEFAULT",
255
+ "state_key": "left_hand_joints"
256
+ },
257
+ {
258
+ "rep": "ABSOLUTE",
259
+ "type": "NON_EEF",
260
+ "format": "DEFAULT",
261
+ "state_key": "right_hand_joints"
262
+ }
263
+ ]
264
+ },
265
+ "language": {
266
+ "delta_indices": [
267
+ 0
268
+ ],
269
+ "modality_keys": [
270
+ "annotation.human.coarse_action"
271
+ ],
272
+ "sin_cos_embedding_keys": null,
273
+ "mean_std_embedding_keys": null,
274
+ "action_configs": null
275
+ }
276
+ },
277
+ "real_r1_pro_sharpa_relative_eef_human": {
278
+ "video": {
279
+ "delta_indices": [
280
+ -20,
281
+ 0
282
+ ],
283
+ "modality_keys": [
284
+ "ego_view_res320x240_freq20",
285
+ "left_wrist_view_res320x240_freq20",
286
+ "right_wrist_view_res320x240_freq20"
287
+ ],
288
+ "sin_cos_embedding_keys": null,
289
+ "mean_std_embedding_keys": null,
290
+ "action_configs": null
291
+ },
292
+ "state": {
293
+ "delta_indices": [
294
+ 0
295
+ ],
296
+ "modality_keys": [
297
+ "left_wrist_eef",
298
+ "right_wrist_eef",
299
+ "left_hand_joints",
300
+ "right_hand_joints"
301
+ ],
302
+ "sin_cos_embedding_keys": null,
303
+ "mean_std_embedding_keys": null,
304
+ "action_configs": null
305
+ },
306
+ "action": {
307
+ "delta_indices": [
308
+ 0,
309
+ 1,
310
+ 2,
311
+ 3,
312
+ 4,
313
+ 5,
314
+ 6,
315
+ 7,
316
+ 8,
317
+ 9,
318
+ 10,
319
+ 11,
320
+ 12,
321
+ 13,
322
+ 14,
323
+ 15,
324
+ 16,
325
+ 17,
326
+ 18,
327
+ 19,
328
+ 20,
329
+ 21,
330
+ 22,
331
+ 23,
332
+ 24,
333
+ 25,
334
+ 26,
335
+ 27,
336
+ 28,
337
+ 29,
338
+ 30,
339
+ 31,
340
+ 32,
341
+ 33,
342
+ 34,
343
+ 35,
344
+ 36,
345
+ 37,
346
+ 38,
347
+ 39
348
+ ],
349
+ "modality_keys": [
350
+ "left_wrist_eef",
351
+ "right_wrist_eef",
352
+ "left_hand_joints",
353
+ "right_hand_joints"
354
+ ],
355
+ "sin_cos_embedding_keys": null,
356
+ "mean_std_embedding_keys": null,
357
+ "action_configs": [
358
+ {
359
+ "rep": "RELATIVE",
360
+ "type": "EEF",
361
+ "format": "XYZ_ROT6D",
362
+ "state_key": "left_wrist_eef"
363
+ },
364
+ {
365
+ "rep": "RELATIVE",
366
+ "type": "EEF",
367
+ "format": "XYZ_ROT6D",
368
+ "state_key": "right_wrist_eef"
369
+ },
370
+ {
371
+ "rep": "ABSOLUTE",
372
+ "type": "NON_EEF",
373
+ "format": "DEFAULT",
374
+ "state_key": "left_hand_joints"
375
+ },
376
+ {
377
+ "rep": "ABSOLUTE",
378
+ "type": "NON_EEF",
379
+ "format": "DEFAULT",
380
+ "state_key": "right_hand_joints"
381
+ }
382
+ ]
383
+ },
384
+ "language": {
385
+ "delta_indices": [
386
+ 0
387
+ ],
388
+ "modality_keys": [
389
+ "annotation.human.coarse_action"
390
+ ],
391
+ "sin_cos_embedding_keys": null,
392
+ "mean_std_embedding_keys": null,
393
+ "action_configs": null
394
+ }
395
+ },
396
+ "real_r1_pro_sharpa_relative_eef": {
397
+ "video": {
398
+ "delta_indices": [
399
+ -20,
400
+ 0
401
+ ],
402
+ "modality_keys": [
403
+ "ego_view_res320x240_freq20",
404
+ "left_wrist_view_res320x240_freq20",
405
+ "right_wrist_view_res320x240_freq20"
406
+ ],
407
+ "sin_cos_embedding_keys": null,
408
+ "mean_std_embedding_keys": null,
409
+ "action_configs": null
410
+ },
411
+ "state": {
412
+ "delta_indices": [
413
+ 0
414
+ ],
415
+ "modality_keys": [
416
+ "left_wrist_eef",
417
+ "right_wrist_eef",
418
+ "left_hand_joints",
419
+ "right_hand_joints"
420
+ ],
421
+ "sin_cos_embedding_keys": null,
422
+ "mean_std_embedding_keys": null,
423
+ "action_configs": null
424
+ },
425
+ "action": {
426
+ "delta_indices": [
427
+ 0,
428
+ 1,
429
+ 2,
430
+ 3,
431
+ 4,
432
+ 5,
433
+ 6,
434
+ 7,
435
+ 8,
436
+ 9,
437
+ 10,
438
+ 11,
439
+ 12,
440
+ 13,
441
+ 14,
442
+ 15,
443
+ 16,
444
+ 17,
445
+ 18,
446
+ 19,
447
+ 20,
448
+ 21,
449
+ 22,
450
+ 23,
451
+ 24,
452
+ 25,
453
+ 26,
454
+ 27,
455
+ 28,
456
+ 29,
457
+ 30,
458
+ 31,
459
+ 32,
460
+ 33,
461
+ 34,
462
+ 35,
463
+ 36,
464
+ 37,
465
+ 38,
466
+ 39
467
+ ],
468
+ "modality_keys": [
469
+ "left_wrist_eef",
470
+ "right_wrist_eef",
471
+ "left_hand_joints",
472
+ "right_hand_joints"
473
+ ],
474
+ "sin_cos_embedding_keys": null,
475
+ "mean_std_embedding_keys": null,
476
+ "action_configs": [
477
+ {
478
+ "rep": "RELATIVE",
479
+ "type": "EEF",
480
+ "format": "XYZ_ROT6D",
481
+ "state_key": "left_wrist_eef"
482
+ },
483
+ {
484
+ "rep": "RELATIVE",
485
+ "type": "EEF",
486
+ "format": "XYZ_ROT6D",
487
+ "state_key": "right_wrist_eef"
488
+ },
489
+ {
490
+ "rep": "ABSOLUTE",
491
+ "type": "NON_EEF",
492
+ "format": "DEFAULT",
493
+ "state_key": "left_hand_joints"
494
+ },
495
+ {
496
+ "rep": "ABSOLUTE",
497
+ "type": "NON_EEF",
498
+ "format": "DEFAULT",
499
+ "state_key": "right_hand_joints"
500
+ }
501
+ ]
502
+ },
503
+ "language": {
504
+ "delta_indices": [
505
+ 0
506
+ ],
507
+ "modality_keys": [
508
+ "annotation.human.coarse_action"
509
+ ],
510
+ "sin_cos_embedding_keys": null,
511
+ "mean_std_embedding_keys": null,
512
+ "action_configs": null
513
+ }
514
+ },
515
+ "xdof_relative_eef_relative_joint": {
516
+ "video": {
517
+ "delta_indices": [
518
+ -30,
519
+ 0
520
+ ],
521
+ "modality_keys": [
522
+ "top_camera-images-rgb_320_240",
523
+ "left_camera-images-rgb_320_240",
524
+ "right_camera-images-rgb_320_240"
525
+ ],
526
+ "sin_cos_embedding_keys": null,
527
+ "mean_std_embedding_keys": null,
528
+ "action_configs": null
529
+ },
530
+ "state": {
531
+ "delta_indices": [
532
+ 0
533
+ ],
534
+ "modality_keys": [
535
+ "left_wrist_eef",
536
+ "right_wrist_eef",
537
+ "left_gripper_pos",
538
+ "right_gripper_pos",
539
+ "left_joint_pos",
540
+ "right_joint_pos"
541
+ ],
542
+ "sin_cos_embedding_keys": null,
543
+ "mean_std_embedding_keys": null,
544
+ "action_configs": null
545
+ },
546
+ "action": {
547
+ "delta_indices": [
548
+ 0,
549
+ 1,
550
+ 2,
551
+ 3,
552
+ 4,
553
+ 5,
554
+ 6,
555
+ 7,
556
+ 8,
557
+ 9,
558
+ 10,
559
+ 11,
560
+ 12,
561
+ 13,
562
+ 14,
563
+ 15,
564
+ 16,
565
+ 17,
566
+ 18,
567
+ 19,
568
+ 20,
569
+ 21,
570
+ 22,
571
+ 23,
572
+ 24,
573
+ 25,
574
+ 26,
575
+ 27,
576
+ 28,
577
+ 29,
578
+ 30,
579
+ 31,
580
+ 32,
581
+ 33,
582
+ 34,
583
+ 35,
584
+ 36,
585
+ 37,
586
+ 38,
587
+ 39
588
+ ],
589
+ "modality_keys": [
590
+ "left_wrist_eef",
591
+ "right_wrist_eef",
592
+ "left_gripper_pos",
593
+ "right_gripper_pos",
594
+ "left_joint_pos",
595
+ "right_joint_pos"
596
+ ],
597
+ "sin_cos_embedding_keys": null,
598
+ "mean_std_embedding_keys": null,
599
+ "action_configs": [
600
+ {
601
+ "rep": "RELATIVE",
602
+ "type": "EEF",
603
+ "format": "XYZ_ROT6D",
604
+ "state_key": "left_wrist_eef"
605
+ },
606
+ {
607
+ "rep": "RELATIVE",
608
+ "type": "EEF",
609
+ "format": "XYZ_ROT6D",
610
+ "state_key": "right_wrist_eef"
611
+ },
612
+ {
613
+ "rep": "ABSOLUTE",
614
+ "type": "NON_EEF",
615
+ "format": "DEFAULT",
616
+ "state_key": "left_gripper_pos"
617
+ },
618
+ {
619
+ "rep": "ABSOLUTE",
620
+ "type": "NON_EEF",
621
+ "format": "DEFAULT",
622
+ "state_key": "right_gripper_pos"
623
+ },
624
+ {
625
+ "rep": "RELATIVE",
626
+ "type": "NON_EEF",
627
+ "format": "DEFAULT",
628
+ "state_key": "left_joint_pos"
629
+ },
630
+ {
631
+ "rep": "RELATIVE",
632
+ "type": "NON_EEF",
633
+ "format": "DEFAULT",
634
+ "state_key": "right_joint_pos"
635
+ }
636
+ ]
637
+ },
638
+ "language": {
639
+ "delta_indices": [
640
+ 0
641
+ ],
642
+ "modality_keys": [
643
+ "annotation.task"
644
+ ],
645
+ "sin_cos_embedding_keys": null,
646
+ "mean_std_embedding_keys": null,
647
+ "action_configs": null
648
+ }
649
+ },
650
+ "real_r1_pro_sharpa_relative_eef_maxinsights": {
651
+ "video": {
652
+ "delta_indices": [
653
+ -30,
654
+ 0
655
+ ],
656
+ "modality_keys": [
657
+ "ego_view_cropratio_res320x240_freq30"
658
+ ],
659
+ "sin_cos_embedding_keys": null,
660
+ "mean_std_embedding_keys": null,
661
+ "action_configs": null
662
+ },
663
+ "state": {
664
+ "delta_indices": [
665
+ 0
666
+ ],
667
+ "modality_keys": [
668
+ "left_wrist_eef",
669
+ "right_wrist_eef",
670
+ "left_hand_joints",
671
+ "right_hand_joints"
672
+ ],
673
+ "sin_cos_embedding_keys": null,
674
+ "mean_std_embedding_keys": null,
675
+ "action_configs": null
676
+ },
677
+ "action": {
678
+ "delta_indices": [
679
+ 0,
680
+ 1,
681
+ 2,
682
+ 3,
683
+ 4,
684
+ 5,
685
+ 6,
686
+ 7,
687
+ 8,
688
+ 9,
689
+ 10,
690
+ 11,
691
+ 12,
692
+ 13,
693
+ 14,
694
+ 15,
695
+ 16,
696
+ 17,
697
+ 18,
698
+ 19,
699
+ 20,
700
+ 21,
701
+ 22,
702
+ 23,
703
+ 24,
704
+ 25,
705
+ 26,
706
+ 27,
707
+ 28,
708
+ 29,
709
+ 30,
710
+ 31,
711
+ 32,
712
+ 33,
713
+ 34,
714
+ 35,
715
+ 36,
716
+ 37,
717
+ 38,
718
+ 39
719
+ ],
720
+ "modality_keys": [
721
+ "left_wrist_eef",
722
+ "right_wrist_eef",
723
+ "left_hand_joints",
724
+ "right_hand_joints"
725
+ ],
726
+ "sin_cos_embedding_keys": null,
727
+ "mean_std_embedding_keys": null,
728
+ "action_configs": [
729
+ {
730
+ "rep": "RELATIVE",
731
+ "type": "EEF",
732
+ "format": "XYZ_ROT6D",
733
+ "state_key": "left_wrist_eef"
734
+ },
735
+ {
736
+ "rep": "RELATIVE",
737
+ "type": "EEF",
738
+ "format": "XYZ_ROT6D",
739
+ "state_key": "right_wrist_eef"
740
+ },
741
+ {
742
+ "rep": "ABSOLUTE",
743
+ "type": "NON_EEF",
744
+ "format": "DEFAULT",
745
+ "state_key": "left_hand_joints"
746
+ },
747
+ {
748
+ "rep": "ABSOLUTE",
749
+ "type": "NON_EEF",
750
+ "format": "DEFAULT",
751
+ "state_key": "right_hand_joints"
752
+ }
753
+ ]
754
+ },
755
+ "language": {
756
+ "delta_indices": [
757
+ 0
758
+ ],
759
+ "modality_keys": [
760
+ "annotation.human.coarse_action"
761
+ ],
762
+ "sin_cos_embedding_keys": null,
763
+ "mean_std_embedding_keys": null,
764
+ "action_configs": null
765
+ }
766
+ },
767
+ "xdof_relative_eef_relative_joint_subtask": {
768
+ "video": {
769
+ "delta_indices": [
770
+ -30,
771
+ 0
772
+ ],
773
+ "modality_keys": [
774
+ "top_camera-images-rgb_320_240",
775
+ "left_camera-images-rgb_320_240",
776
+ "right_camera-images-rgb_320_240"
777
+ ],
778
+ "sin_cos_embedding_keys": null,
779
+ "mean_std_embedding_keys": null,
780
+ "action_configs": null
781
+ },
782
+ "state": {
783
+ "delta_indices": [
784
+ 0
785
+ ],
786
+ "modality_keys": [
787
+ "left_wrist_eef",
788
+ "right_wrist_eef",
789
+ "left_gripper_pos",
790
+ "right_gripper_pos",
791
+ "left_joint_pos",
792
+ "right_joint_pos"
793
+ ],
794
+ "sin_cos_embedding_keys": null,
795
+ "mean_std_embedding_keys": null,
796
+ "action_configs": null
797
+ },
798
+ "action": {
799
+ "delta_indices": [
800
+ 0,
801
+ 1,
802
+ 2,
803
+ 3,
804
+ 4,
805
+ 5,
806
+ 6,
807
+ 7,
808
+ 8,
809
+ 9,
810
+ 10,
811
+ 11,
812
+ 12,
813
+ 13,
814
+ 14,
815
+ 15,
816
+ 16,
817
+ 17,
818
+ 18,
819
+ 19,
820
+ 20,
821
+ 21,
822
+ 22,
823
+ 23,
824
+ 24,
825
+ 25,
826
+ 26,
827
+ 27,
828
+ 28,
829
+ 29,
830
+ 30,
831
+ 31,
832
+ 32,
833
+ 33,
834
+ 34,
835
+ 35,
836
+ 36,
837
+ 37,
838
+ 38,
839
+ 39
840
+ ],
841
+ "modality_keys": [
842
+ "left_wrist_eef",
843
+ "right_wrist_eef",
844
+ "left_gripper_pos",
845
+ "right_gripper_pos",
846
+ "left_joint_pos",
847
+ "right_joint_pos"
848
+ ],
849
+ "sin_cos_embedding_keys": null,
850
+ "mean_std_embedding_keys": null,
851
+ "action_configs": [
852
+ {
853
+ "rep": "RELATIVE",
854
+ "type": "EEF",
855
+ "format": "XYZ_ROT6D",
856
+ "state_key": "left_wrist_eef"
857
+ },
858
+ {
859
+ "rep": "RELATIVE",
860
+ "type": "EEF",
861
+ "format": "XYZ_ROT6D",
862
+ "state_key": "right_wrist_eef"
863
+ },
864
+ {
865
+ "rep": "ABSOLUTE",
866
+ "type": "NON_EEF",
867
+ "format": "DEFAULT",
868
+ "state_key": "left_gripper_pos"
869
+ },
870
+ {
871
+ "rep": "ABSOLUTE",
872
+ "type": "NON_EEF",
873
+ "format": "DEFAULT",
874
+ "state_key": "right_gripper_pos"
875
+ },
876
+ {
877
+ "rep": "RELATIVE",
878
+ "type": "NON_EEF",
879
+ "format": "DEFAULT",
880
+ "state_key": "left_joint_pos"
881
+ },
882
+ {
883
+ "rep": "RELATIVE",
884
+ "type": "NON_EEF",
885
+ "format": "DEFAULT",
886
+ "state_key": "right_joint_pos"
887
+ }
888
+ ]
889
+ },
890
+ "language": {
891
+ "delta_indices": [
892
+ 0
893
+ ],
894
+ "modality_keys": [
895
+ "annotation.sub_task"
896
+ ],
897
+ "sin_cos_embedding_keys": null,
898
+ "mean_std_embedding_keys": null,
899
+ "action_configs": null
900
+ }
901
+ },
902
+ "oxe_droid_relative_eef_relative_joint": {
903
+ "video": {
904
+ "delta_indices": [
905
+ -15,
906
+ 0
907
+ ],
908
+ "modality_keys": [
909
+ "exterior_image_1_left",
910
+ "wrist_image_left"
911
+ ],
912
+ "sin_cos_embedding_keys": null,
913
+ "mean_std_embedding_keys": null,
914
+ "action_configs": null
915
+ },
916
+ "state": {
917
+ "delta_indices": [
918
+ 0
919
+ ],
920
+ "modality_keys": [
921
+ "eef_9d",
922
+ "gripper_position",
923
+ "joint_position"
924
+ ],
925
+ "sin_cos_embedding_keys": null,
926
+ "mean_std_embedding_keys": null,
927
+ "action_configs": null
928
+ },
929
+ "action": {
930
+ "delta_indices": [
931
+ 0,
932
+ 1,
933
+ 2,
934
+ 3,
935
+ 4,
936
+ 5,
937
+ 6,
938
+ 7,
939
+ 8,
940
+ 9,
941
+ 10,
942
+ 11,
943
+ 12,
944
+ 13,
945
+ 14,
946
+ 15,
947
+ 16,
948
+ 17,
949
+ 18,
950
+ 19,
951
+ 20,
952
+ 21,
953
+ 22,
954
+ 23,
955
+ 24,
956
+ 25,
957
+ 26,
958
+ 27,
959
+ 28,
960
+ 29,
961
+ 30,
962
+ 31,
963
+ 32,
964
+ 33,
965
+ 34,
966
+ 35,
967
+ 36,
968
+ 37,
969
+ 38,
970
+ 39
971
+ ],
972
+ "modality_keys": [
973
+ "eef_9d",
974
+ "gripper_position",
975
+ "joint_position"
976
+ ],
977
+ "sin_cos_embedding_keys": null,
978
+ "mean_std_embedding_keys": null,
979
+ "action_configs": [
980
+ {
981
+ "rep": "RELATIVE",
982
+ "type": "EEF",
983
+ "format": "XYZ_ROT6D",
984
+ "state_key": "eef_9d"
985
+ },
986
+ {
987
+ "rep": "ABSOLUTE",
988
+ "type": "NON_EEF",
989
+ "format": "DEFAULT",
990
+ "state_key": "gripper_position"
991
+ },
992
+ {
993
+ "rep": "RELATIVE",
994
+ "type": "NON_EEF",
995
+ "format": "DEFAULT",
996
+ "state_key": "joint_position"
997
+ }
998
+ ]
999
+ },
1000
+ "language": {
1001
+ "delta_indices": [
1002
+ 0
1003
+ ],
1004
+ "modality_keys": [
1005
+ "annotation.language.language_instruction"
1006
+ ],
1007
+ "sin_cos_embedding_keys": null,
1008
+ "mean_std_embedding_keys": null,
1009
+ "action_configs": null
1010
+ }
1011
+ },
1012
+ "unitree_g1_sonic": {
1013
+ "video": {
1014
+ "delta_indices": [
1015
+ 0
1016
+ ],
1017
+ "modality_keys": [
1018
+ "ego_view"
1019
+ ],
1020
+ "sin_cos_embedding_keys": null,
1021
+ "mean_std_embedding_keys": null,
1022
+ "action_configs": null
1023
+ },
1024
+ "state": {
1025
+ "delta_indices": [
1026
+ 0
1027
+ ],
1028
+ "modality_keys": [
1029
+ "left_leg",
1030
+ "right_leg",
1031
+ "waist",
1032
+ "left_arm",
1033
+ "right_arm",
1034
+ "left_hand",
1035
+ "right_hand",
1036
+ "projected_gravity"
1037
+ ],
1038
+ "sin_cos_embedding_keys": null,
1039
+ "mean_std_embedding_keys": null,
1040
+ "action_configs": null
1041
+ },
1042
+ "action": {
1043
+ "delta_indices": [
1044
+ 0,
1045
+ 1,
1046
+ 2,
1047
+ 3,
1048
+ 4,
1049
+ 5,
1050
+ 6,
1051
+ 7,
1052
+ 8,
1053
+ 9,
1054
+ 10,
1055
+ 11,
1056
+ 12,
1057
+ 13,
1058
+ 14,
1059
+ 15,
1060
+ 16,
1061
+ 17,
1062
+ 18,
1063
+ 19,
1064
+ 20,
1065
+ 21,
1066
+ 22,
1067
+ 23,
1068
+ 24,
1069
+ 25,
1070
+ 26,
1071
+ 27,
1072
+ 28,
1073
+ 29,
1074
+ 30,
1075
+ 31,
1076
+ 32,
1077
+ 33,
1078
+ 34,
1079
+ 35,
1080
+ 36,
1081
+ 37,
1082
+ 38,
1083
+ 39
1084
+ ],
1085
+ "modality_keys": [
1086
+ "motion_token",
1087
+ "left_hand_joints",
1088
+ "right_hand_joints"
1089
+ ],
1090
+ "sin_cos_embedding_keys": null,
1091
+ "mean_std_embedding_keys": null,
1092
+ "action_configs": [
1093
+ {
1094
+ "rep": "ABSOLUTE",
1095
+ "type": "NON_EEF",
1096
+ "format": "DEFAULT",
1097
+ "state_key": null
1098
+ },
1099
+ {
1100
+ "rep": "ABSOLUTE",
1101
+ "type": "NON_EEF",
1102
+ "format": "DEFAULT",
1103
+ "state_key": null
1104
+ },
1105
+ {
1106
+ "rep": "ABSOLUTE",
1107
+ "type": "NON_EEF",
1108
+ "format": "DEFAULT",
1109
+ "state_key": null
1110
+ }
1111
+ ]
1112
+ },
1113
+ "language": {
1114
+ "delta_indices": [
1115
+ 0
1116
+ ],
1117
+ "modality_keys": [
1118
+ "annotation.human.task_description"
1119
+ ],
1120
+ "sin_cos_embedding_keys": null,
1121
+ "mean_std_embedding_keys": null,
1122
+ "action_configs": null
1123
+ }
1124
+ }
1125
+ },
1126
+ "image_crop_size": [
1127
+ 230,
1128
+ 230
1129
+ ],
1130
+ "image_target_size": [
1131
+ 256,
1132
+ 256
1133
+ ],
1134
+ "use_albumentations": true,
1135
+ "random_rotation_angle": 0,
1136
+ "color_jitter_params": {
1137
+ "brightness": 0.3,
1138
+ "contrast": 0.4,
1139
+ "saturation": 0.5,
1140
+ "hue": 0.08
1141
+ },
1142
+ "shortest_image_edge": 256,
1143
+ "crop_fraction": 0.95,
1144
+ "letter_box_transform": false,
1145
+ "model_name": "nvidia/Cosmos-Reason2-2B",
1146
+ "model_type": "qwen",
1147
+ "formalize_language": true,
1148
+ "max_state_dim": 132,
1149
+ "max_action_dim": 132,
1150
+ "max_action_horizon": 40,
1151
+ "use_percentiles": true,
1152
+ "use_mean_std": false,
1153
+ "clip_outliers": true,
1154
+ "apply_sincos_state_encoding": false,
1155
+ "use_relative_action": true,
1156
+ "exclude_state": false,
1157
+ "state_dropout_prob": 0.2
1158
+ }
1159
+ }
checkpoint-4000/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdb99b66cb25083056887a1f47ebbaf1c58f0d43e6ee7d27ba8f75e18c5eada1
3
+ size 14645
checkpoint-4000/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e735feb89f2e1201272c210a226e7690cb2b92d37a1c1eb9a843518a2be8b38f
3
+ size 1465
checkpoint-4000/statistics.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-4000/trainer_state.json ADDED
@@ -0,0 +1,2434 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 0.2,
6
+ "eval_steps": 500,
7
+ "global_step": 4000,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "grad_norm": 0.15373489260673523,
14
+ "learning_rate": 9e-07,
15
+ "loss": 1.2116,
16
+ "step": 10
17
+ },
18
+ {
19
+ "grad_norm": 0.12143079191446304,
20
+ "learning_rate": 1.9e-06,
21
+ "loss": 1.2054,
22
+ "step": 20
23
+ },
24
+ {
25
+ "grad_norm": 0.11240886896848679,
26
+ "learning_rate": 2.9e-06,
27
+ "loss": 1.2027,
28
+ "step": 30
29
+ },
30
+ {
31
+ "grad_norm": 0.21381829679012299,
32
+ "learning_rate": 3.9e-06,
33
+ "loss": 1.1886,
34
+ "step": 40
35
+ },
36
+ {
37
+ "grad_norm": 0.2458868771791458,
38
+ "learning_rate": 4.9000000000000005e-06,
39
+ "loss": 1.1589,
40
+ "step": 50
41
+ },
42
+ {
43
+ "grad_norm": 0.2544420659542084,
44
+ "learning_rate": 5.9e-06,
45
+ "loss": 1.1296,
46
+ "step": 60
47
+ },
48
+ {
49
+ "grad_norm": 0.23853255808353424,
50
+ "learning_rate": 6.900000000000001e-06,
51
+ "loss": 1.1103,
52
+ "step": 70
53
+ },
54
+ {
55
+ "grad_norm": 0.31489869952201843,
56
+ "learning_rate": 7.9e-06,
57
+ "loss": 1.0948,
58
+ "step": 80
59
+ },
60
+ {
61
+ "grad_norm": 0.2596352696418762,
62
+ "learning_rate": 8.9e-06,
63
+ "loss": 1.0914,
64
+ "step": 90
65
+ },
66
+ {
67
+ "grad_norm": 0.2258705496788025,
68
+ "learning_rate": 9.900000000000002e-06,
69
+ "loss": 1.0912,
70
+ "step": 100
71
+ },
72
+ {
73
+ "grad_norm": 0.5682782530784607,
74
+ "learning_rate": 1.09e-05,
75
+ "loss": 1.0893,
76
+ "step": 110
77
+ },
78
+ {
79
+ "grad_norm": 0.3197626769542694,
80
+ "learning_rate": 1.19e-05,
81
+ "loss": 1.081,
82
+ "step": 120
83
+ },
84
+ {
85
+ "grad_norm": 0.18166182935237885,
86
+ "learning_rate": 1.29e-05,
87
+ "loss": 1.073,
88
+ "step": 130
89
+ },
90
+ {
91
+ "grad_norm": 0.4554118812084198,
92
+ "learning_rate": 1.3900000000000002e-05,
93
+ "loss": 1.0634,
94
+ "step": 140
95
+ },
96
+ {
97
+ "grad_norm": 0.42795446515083313,
98
+ "learning_rate": 1.49e-05,
99
+ "loss": 1.047,
100
+ "step": 150
101
+ },
102
+ {
103
+ "grad_norm": 0.5283658504486084,
104
+ "learning_rate": 1.59e-05,
105
+ "loss": 1.013,
106
+ "step": 160
107
+ },
108
+ {
109
+ "grad_norm": 0.3358186185359955,
110
+ "learning_rate": 1.69e-05,
111
+ "loss": 0.9804,
112
+ "step": 170
113
+ },
114
+ {
115
+ "grad_norm": 0.5145778656005859,
116
+ "learning_rate": 1.79e-05,
117
+ "loss": 0.936,
118
+ "step": 180
119
+ },
120
+ {
121
+ "grad_norm": 0.5755268335342407,
122
+ "learning_rate": 1.8900000000000002e-05,
123
+ "loss": 0.8896,
124
+ "step": 190
125
+ },
126
+ {
127
+ "grad_norm": 0.6188399791717529,
128
+ "learning_rate": 1.9900000000000003e-05,
129
+ "loss": 0.8577,
130
+ "step": 200
131
+ },
132
+ {
133
+ "grad_norm": 0.9716882109642029,
134
+ "learning_rate": 2.09e-05,
135
+ "loss": 0.8271,
136
+ "step": 210
137
+ },
138
+ {
139
+ "grad_norm": 0.918986976146698,
140
+ "learning_rate": 2.19e-05,
141
+ "loss": 0.7906,
142
+ "step": 220
143
+ },
144
+ {
145
+ "grad_norm": 0.8000361919403076,
146
+ "learning_rate": 2.29e-05,
147
+ "loss": 0.751,
148
+ "step": 230
149
+ },
150
+ {
151
+ "grad_norm": 1.0514482259750366,
152
+ "learning_rate": 2.39e-05,
153
+ "loss": 0.7155,
154
+ "step": 240
155
+ },
156
+ {
157
+ "grad_norm": 0.7911136746406555,
158
+ "learning_rate": 2.4900000000000002e-05,
159
+ "loss": 0.6906,
160
+ "step": 250
161
+ },
162
+ {
163
+ "grad_norm": 0.92540043592453,
164
+ "learning_rate": 2.5900000000000003e-05,
165
+ "loss": 0.6638,
166
+ "step": 260
167
+ },
168
+ {
169
+ "grad_norm": 1.0331710577011108,
170
+ "learning_rate": 2.6900000000000003e-05,
171
+ "loss": 0.6444,
172
+ "step": 270
173
+ },
174
+ {
175
+ "grad_norm": 1.2573391199111938,
176
+ "learning_rate": 2.7900000000000004e-05,
177
+ "loss": 0.618,
178
+ "step": 280
179
+ },
180
+ {
181
+ "grad_norm": 1.2672662734985352,
182
+ "learning_rate": 2.8899999999999998e-05,
183
+ "loss": 0.6095,
184
+ "step": 290
185
+ },
186
+ {
187
+ "grad_norm": 1.0279985666275024,
188
+ "learning_rate": 2.9900000000000002e-05,
189
+ "loss": 0.5921,
190
+ "step": 300
191
+ },
192
+ {
193
+ "grad_norm": 0.9896909594535828,
194
+ "learning_rate": 3.09e-05,
195
+ "loss": 0.5765,
196
+ "step": 310
197
+ },
198
+ {
199
+ "grad_norm": 1.0756268501281738,
200
+ "learning_rate": 3.19e-05,
201
+ "loss": 0.5679,
202
+ "step": 320
203
+ },
204
+ {
205
+ "grad_norm": 1.3084145784378052,
206
+ "learning_rate": 3.29e-05,
207
+ "loss": 0.5569,
208
+ "step": 330
209
+ },
210
+ {
211
+ "grad_norm": 1.2895151376724243,
212
+ "learning_rate": 3.3900000000000004e-05,
213
+ "loss": 0.5475,
214
+ "step": 340
215
+ },
216
+ {
217
+ "grad_norm": 1.1118186712265015,
218
+ "learning_rate": 3.49e-05,
219
+ "loss": 0.5367,
220
+ "step": 350
221
+ },
222
+ {
223
+ "grad_norm": 0.9377628564834595,
224
+ "learning_rate": 3.59e-05,
225
+ "loss": 0.5192,
226
+ "step": 360
227
+ },
228
+ {
229
+ "grad_norm": 1.1136053800582886,
230
+ "learning_rate": 3.69e-05,
231
+ "loss": 0.5096,
232
+ "step": 370
233
+ },
234
+ {
235
+ "grad_norm": 0.8958713412284851,
236
+ "learning_rate": 3.79e-05,
237
+ "loss": 0.4938,
238
+ "step": 380
239
+ },
240
+ {
241
+ "grad_norm": 1.4132113456726074,
242
+ "learning_rate": 3.8900000000000004e-05,
243
+ "loss": 0.4777,
244
+ "step": 390
245
+ },
246
+ {
247
+ "grad_norm": 1.250508189201355,
248
+ "learning_rate": 3.99e-05,
249
+ "loss": 0.4575,
250
+ "step": 400
251
+ },
252
+ {
253
+ "grad_norm": 1.2522258758544922,
254
+ "learning_rate": 4.09e-05,
255
+ "loss": 0.4386,
256
+ "step": 410
257
+ },
258
+ {
259
+ "grad_norm": 1.4475443363189697,
260
+ "learning_rate": 4.19e-05,
261
+ "loss": 0.4295,
262
+ "step": 420
263
+ },
264
+ {
265
+ "grad_norm": 0.925055742263794,
266
+ "learning_rate": 4.29e-05,
267
+ "loss": 0.4157,
268
+ "step": 430
269
+ },
270
+ {
271
+ "grad_norm": 1.2969681024551392,
272
+ "learning_rate": 4.39e-05,
273
+ "loss": 0.4052,
274
+ "step": 440
275
+ },
276
+ {
277
+ "grad_norm": 1.3583041429519653,
278
+ "learning_rate": 4.49e-05,
279
+ "loss": 0.3953,
280
+ "step": 450
281
+ },
282
+ {
283
+ "grad_norm": 1.028383493423462,
284
+ "learning_rate": 4.5900000000000004e-05,
285
+ "loss": 0.375,
286
+ "step": 460
287
+ },
288
+ {
289
+ "grad_norm": 1.255179762840271,
290
+ "learning_rate": 4.69e-05,
291
+ "loss": 0.3699,
292
+ "step": 470
293
+ },
294
+ {
295
+ "grad_norm": 1.326106309890747,
296
+ "learning_rate": 4.79e-05,
297
+ "loss": 0.3579,
298
+ "step": 480
299
+ },
300
+ {
301
+ "grad_norm": 1.2961987257003784,
302
+ "learning_rate": 4.89e-05,
303
+ "loss": 0.3478,
304
+ "step": 490
305
+ },
306
+ {
307
+ "grad_norm": 1.2104370594024658,
308
+ "learning_rate": 4.99e-05,
309
+ "loss": 0.339,
310
+ "step": 500
311
+ },
312
+ {
313
+ "grad_norm": 1.4508124589920044,
314
+ "learning_rate": 5.0900000000000004e-05,
315
+ "loss": 0.3219,
316
+ "step": 510
317
+ },
318
+ {
319
+ "grad_norm": 1.4312357902526855,
320
+ "learning_rate": 5.19e-05,
321
+ "loss": 0.3042,
322
+ "step": 520
323
+ },
324
+ {
325
+ "grad_norm": 1.7213497161865234,
326
+ "learning_rate": 5.2900000000000005e-05,
327
+ "loss": 0.2887,
328
+ "step": 530
329
+ },
330
+ {
331
+ "grad_norm": 1.7162240743637085,
332
+ "learning_rate": 5.390000000000001e-05,
333
+ "loss": 0.2856,
334
+ "step": 540
335
+ },
336
+ {
337
+ "grad_norm": 1.1437758207321167,
338
+ "learning_rate": 5.4900000000000006e-05,
339
+ "loss": 0.2642,
340
+ "step": 550
341
+ },
342
+ {
343
+ "grad_norm": 1.4461580514907837,
344
+ "learning_rate": 5.590000000000001e-05,
345
+ "loss": 0.2508,
346
+ "step": 560
347
+ },
348
+ {
349
+ "grad_norm": 1.4058153629302979,
350
+ "learning_rate": 5.69e-05,
351
+ "loss": 0.2437,
352
+ "step": 570
353
+ },
354
+ {
355
+ "grad_norm": 1.3282971382141113,
356
+ "learning_rate": 5.79e-05,
357
+ "loss": 0.2275,
358
+ "step": 580
359
+ },
360
+ {
361
+ "grad_norm": 1.6089696884155273,
362
+ "learning_rate": 5.89e-05,
363
+ "loss": 0.2166,
364
+ "step": 590
365
+ },
366
+ {
367
+ "grad_norm": 1.5542049407958984,
368
+ "learning_rate": 5.99e-05,
369
+ "loss": 0.2008,
370
+ "step": 600
371
+ },
372
+ {
373
+ "grad_norm": 1.372789740562439,
374
+ "learning_rate": 6.09e-05,
375
+ "loss": 0.1888,
376
+ "step": 610
377
+ },
378
+ {
379
+ "grad_norm": 1.3900244235992432,
380
+ "learning_rate": 6.19e-05,
381
+ "loss": 0.1825,
382
+ "step": 620
383
+ },
384
+ {
385
+ "grad_norm": 1.1616129875183105,
386
+ "learning_rate": 6.29e-05,
387
+ "loss": 0.1673,
388
+ "step": 630
389
+ },
390
+ {
391
+ "grad_norm": 1.3904050588607788,
392
+ "learning_rate": 6.390000000000001e-05,
393
+ "loss": 0.1631,
394
+ "step": 640
395
+ },
396
+ {
397
+ "grad_norm": 1.6666728258132935,
398
+ "learning_rate": 6.49e-05,
399
+ "loss": 0.1508,
400
+ "step": 650
401
+ },
402
+ {
403
+ "grad_norm": 1.458060383796692,
404
+ "learning_rate": 6.59e-05,
405
+ "loss": 0.134,
406
+ "step": 660
407
+ },
408
+ {
409
+ "grad_norm": 1.2632263898849487,
410
+ "learning_rate": 6.690000000000001e-05,
411
+ "loss": 0.1435,
412
+ "step": 670
413
+ },
414
+ {
415
+ "grad_norm": 1.3523911237716675,
416
+ "learning_rate": 6.790000000000001e-05,
417
+ "loss": 0.1383,
418
+ "step": 680
419
+ },
420
+ {
421
+ "grad_norm": 1.3925788402557373,
422
+ "learning_rate": 6.89e-05,
423
+ "loss": 0.1317,
424
+ "step": 690
425
+ },
426
+ {
427
+ "grad_norm": 1.6858913898468018,
428
+ "learning_rate": 6.99e-05,
429
+ "loss": 0.1309,
430
+ "step": 700
431
+ },
432
+ {
433
+ "grad_norm": 1.2360647916793823,
434
+ "learning_rate": 7.09e-05,
435
+ "loss": 0.1267,
436
+ "step": 710
437
+ },
438
+ {
439
+ "grad_norm": 1.1521002054214478,
440
+ "learning_rate": 7.19e-05,
441
+ "loss": 0.1259,
442
+ "step": 720
443
+ },
444
+ {
445
+ "grad_norm": 1.232092022895813,
446
+ "learning_rate": 7.29e-05,
447
+ "loss": 0.1333,
448
+ "step": 730
449
+ },
450
+ {
451
+ "grad_norm": 1.4635534286499023,
452
+ "learning_rate": 7.390000000000001e-05,
453
+ "loss": 0.129,
454
+ "step": 740
455
+ },
456
+ {
457
+ "grad_norm": 1.108782172203064,
458
+ "learning_rate": 7.49e-05,
459
+ "loss": 0.1285,
460
+ "step": 750
461
+ },
462
+ {
463
+ "grad_norm": 1.3770654201507568,
464
+ "learning_rate": 7.59e-05,
465
+ "loss": 0.1247,
466
+ "step": 760
467
+ },
468
+ {
469
+ "grad_norm": 1.1716821193695068,
470
+ "learning_rate": 7.69e-05,
471
+ "loss": 0.1297,
472
+ "step": 770
473
+ },
474
+ {
475
+ "grad_norm": 1.185289740562439,
476
+ "learning_rate": 7.790000000000001e-05,
477
+ "loss": 0.1246,
478
+ "step": 780
479
+ },
480
+ {
481
+ "grad_norm": 1.3426638841629028,
482
+ "learning_rate": 7.890000000000001e-05,
483
+ "loss": 0.1209,
484
+ "step": 790
485
+ },
486
+ {
487
+ "grad_norm": 1.0914347171783447,
488
+ "learning_rate": 7.99e-05,
489
+ "loss": 0.1226,
490
+ "step": 800
491
+ },
492
+ {
493
+ "grad_norm": 1.47992742061615,
494
+ "learning_rate": 8.090000000000001e-05,
495
+ "loss": 0.1116,
496
+ "step": 810
497
+ },
498
+ {
499
+ "grad_norm": 1.189318299293518,
500
+ "learning_rate": 8.19e-05,
501
+ "loss": 0.1155,
502
+ "step": 820
503
+ },
504
+ {
505
+ "grad_norm": 1.218897819519043,
506
+ "learning_rate": 8.29e-05,
507
+ "loss": 0.1106,
508
+ "step": 830
509
+ },
510
+ {
511
+ "grad_norm": 1.1049423217773438,
512
+ "learning_rate": 8.39e-05,
513
+ "loss": 0.1143,
514
+ "step": 840
515
+ },
516
+ {
517
+ "grad_norm": 1.3933051824569702,
518
+ "learning_rate": 8.49e-05,
519
+ "loss": 0.1241,
520
+ "step": 850
521
+ },
522
+ {
523
+ "grad_norm": 1.0603047609329224,
524
+ "learning_rate": 8.59e-05,
525
+ "loss": 0.1111,
526
+ "step": 860
527
+ },
528
+ {
529
+ "grad_norm": 1.1517871618270874,
530
+ "learning_rate": 8.69e-05,
531
+ "loss": 0.1114,
532
+ "step": 870
533
+ },
534
+ {
535
+ "grad_norm": 1.2335821390151978,
536
+ "learning_rate": 8.790000000000001e-05,
537
+ "loss": 0.1135,
538
+ "step": 880
539
+ },
540
+ {
541
+ "grad_norm": 1.471954107284546,
542
+ "learning_rate": 8.89e-05,
543
+ "loss": 0.1149,
544
+ "step": 890
545
+ },
546
+ {
547
+ "grad_norm": 1.1479299068450928,
548
+ "learning_rate": 8.99e-05,
549
+ "loss": 0.1144,
550
+ "step": 900
551
+ },
552
+ {
553
+ "grad_norm": 1.1517722606658936,
554
+ "learning_rate": 9.090000000000001e-05,
555
+ "loss": 0.1097,
556
+ "step": 910
557
+ },
558
+ {
559
+ "grad_norm": 1.2328661680221558,
560
+ "learning_rate": 9.190000000000001e-05,
561
+ "loss": 0.11,
562
+ "step": 920
563
+ },
564
+ {
565
+ "grad_norm": 1.227306842803955,
566
+ "learning_rate": 9.290000000000001e-05,
567
+ "loss": 0.1144,
568
+ "step": 930
569
+ },
570
+ {
571
+ "grad_norm": 1.1643450260162354,
572
+ "learning_rate": 9.39e-05,
573
+ "loss": 0.1074,
574
+ "step": 940
575
+ },
576
+ {
577
+ "grad_norm": 1.1138417720794678,
578
+ "learning_rate": 9.49e-05,
579
+ "loss": 0.113,
580
+ "step": 950
581
+ },
582
+ {
583
+ "grad_norm": 1.0035343170166016,
584
+ "learning_rate": 9.59e-05,
585
+ "loss": 0.1102,
586
+ "step": 960
587
+ },
588
+ {
589
+ "grad_norm": 1.089536190032959,
590
+ "learning_rate": 9.69e-05,
591
+ "loss": 0.1089,
592
+ "step": 970
593
+ },
594
+ {
595
+ "grad_norm": 1.1418471336364746,
596
+ "learning_rate": 9.790000000000001e-05,
597
+ "loss": 0.1075,
598
+ "step": 980
599
+ },
600
+ {
601
+ "grad_norm": 1.0369817018508911,
602
+ "learning_rate": 9.89e-05,
603
+ "loss": 0.1094,
604
+ "step": 990
605
+ },
606
+ {
607
+ "grad_norm": 1.081180214881897,
608
+ "learning_rate": 9.99e-05,
609
+ "loss": 0.1069,
610
+ "step": 1000
611
+ },
612
+ {
613
+ "grad_norm": 1.1965157985687256,
614
+ "learning_rate": 9.999994463727085e-05,
615
+ "loss": 0.1078,
616
+ "step": 1010
617
+ },
618
+ {
619
+ "grad_norm": 1.0836145877838135,
620
+ "learning_rate": 9.999975326009292e-05,
621
+ "loss": 0.1034,
622
+ "step": 1020
623
+ },
624
+ {
625
+ "grad_norm": 1.0701448917388916,
626
+ "learning_rate": 9.999942518549879e-05,
627
+ "loss": 0.1063,
628
+ "step": 1030
629
+ },
630
+ {
631
+ "grad_norm": 1.0245521068572998,
632
+ "learning_rate": 9.999896041438544e-05,
633
+ "loss": 0.1003,
634
+ "step": 1040
635
+ },
636
+ {
637
+ "grad_norm": 0.9008662104606628,
638
+ "learning_rate": 9.999835894802353e-05,
639
+ "loss": 0.1007,
640
+ "step": 1050
641
+ },
642
+ {
643
+ "grad_norm": 1.405444860458374,
644
+ "learning_rate": 9.999762078805743e-05,
645
+ "loss": 0.0983,
646
+ "step": 1060
647
+ },
648
+ {
649
+ "grad_norm": 0.9956735968589783,
650
+ "learning_rate": 9.999674593650526e-05,
651
+ "loss": 0.1015,
652
+ "step": 1070
653
+ },
654
+ {
655
+ "grad_norm": 0.9828646779060364,
656
+ "learning_rate": 9.99957343957588e-05,
657
+ "loss": 0.099,
658
+ "step": 1080
659
+ },
660
+ {
661
+ "grad_norm": 1.3071095943450928,
662
+ "learning_rate": 9.99945861685836e-05,
663
+ "loss": 0.0949,
664
+ "step": 1090
665
+ },
666
+ {
667
+ "grad_norm": 0.9832029342651367,
668
+ "learning_rate": 9.999330125811884e-05,
669
+ "loss": 0.102,
670
+ "step": 1100
671
+ },
672
+ {
673
+ "grad_norm": 1.0148258209228516,
674
+ "learning_rate": 9.999187966787744e-05,
675
+ "loss": 0.103,
676
+ "step": 1110
677
+ },
678
+ {
679
+ "grad_norm": 1.0134457349777222,
680
+ "learning_rate": 9.999032140174595e-05,
681
+ "loss": 0.0949,
682
+ "step": 1120
683
+ },
684
+ {
685
+ "grad_norm": 0.9154807329177856,
686
+ "learning_rate": 9.998862646398464e-05,
687
+ "loss": 0.0989,
688
+ "step": 1130
689
+ },
690
+ {
691
+ "grad_norm": 1.0683287382125854,
692
+ "learning_rate": 9.998679485922739e-05,
693
+ "loss": 0.0937,
694
+ "step": 1140
695
+ },
696
+ {
697
+ "grad_norm": 0.9443909525871277,
698
+ "learning_rate": 9.998482659248174e-05,
699
+ "loss": 0.0964,
700
+ "step": 1150
701
+ },
702
+ {
703
+ "grad_norm": 0.8048564195632935,
704
+ "learning_rate": 9.998272166912883e-05,
705
+ "loss": 0.0978,
706
+ "step": 1160
707
+ },
708
+ {
709
+ "grad_norm": 1.0226809978485107,
710
+ "learning_rate": 9.998048009492347e-05,
711
+ "loss": 0.0979,
712
+ "step": 1170
713
+ },
714
+ {
715
+ "grad_norm": 1.0117919445037842,
716
+ "learning_rate": 9.997810187599403e-05,
717
+ "loss": 0.0993,
718
+ "step": 1180
719
+ },
720
+ {
721
+ "grad_norm": 0.8559236526489258,
722
+ "learning_rate": 9.997558701884249e-05,
723
+ "loss": 0.095,
724
+ "step": 1190
725
+ },
726
+ {
727
+ "grad_norm": 1.009264349937439,
728
+ "learning_rate": 9.997293553034433e-05,
729
+ "loss": 0.0947,
730
+ "step": 1200
731
+ },
732
+ {
733
+ "grad_norm": 1.0090675354003906,
734
+ "learning_rate": 9.997014741774866e-05,
735
+ "loss": 0.0991,
736
+ "step": 1210
737
+ },
738
+ {
739
+ "grad_norm": 0.9128223657608032,
740
+ "learning_rate": 9.996722268867803e-05,
741
+ "loss": 0.0973,
742
+ "step": 1220
743
+ },
744
+ {
745
+ "grad_norm": 0.8223145008087158,
746
+ "learning_rate": 9.996416135112858e-05,
747
+ "loss": 0.0943,
748
+ "step": 1230
749
+ },
750
+ {
751
+ "grad_norm": 0.6892135143280029,
752
+ "learning_rate": 9.996096341346988e-05,
753
+ "loss": 0.0914,
754
+ "step": 1240
755
+ },
756
+ {
757
+ "grad_norm": 0.8441371321678162,
758
+ "learning_rate": 9.995762888444495e-05,
759
+ "loss": 0.095,
760
+ "step": 1250
761
+ },
762
+ {
763
+ "grad_norm": 0.8410964608192444,
764
+ "learning_rate": 9.995415777317027e-05,
765
+ "loss": 0.0905,
766
+ "step": 1260
767
+ },
768
+ {
769
+ "grad_norm": 0.9202972650527954,
770
+ "learning_rate": 9.995055008913574e-05,
771
+ "loss": 0.09,
772
+ "step": 1270
773
+ },
774
+ {
775
+ "grad_norm": 0.969850480556488,
776
+ "learning_rate": 9.994680584220463e-05,
777
+ "loss": 0.0977,
778
+ "step": 1280
779
+ },
780
+ {
781
+ "grad_norm": 0.9843644499778748,
782
+ "learning_rate": 9.994292504261355e-05,
783
+ "loss": 0.0903,
784
+ "step": 1290
785
+ },
786
+ {
787
+ "grad_norm": 0.8046810030937195,
788
+ "learning_rate": 9.993890770097247e-05,
789
+ "loss": 0.0885,
790
+ "step": 1300
791
+ },
792
+ {
793
+ "grad_norm": 1.0213329792022705,
794
+ "learning_rate": 9.993475382826467e-05,
795
+ "loss": 0.0906,
796
+ "step": 1310
797
+ },
798
+ {
799
+ "grad_norm": 0.9399948120117188,
800
+ "learning_rate": 9.993046343584664e-05,
801
+ "loss": 0.0885,
802
+ "step": 1320
803
+ },
804
+ {
805
+ "grad_norm": 0.8615891337394714,
806
+ "learning_rate": 9.992603653544816e-05,
807
+ "loss": 0.0898,
808
+ "step": 1330
809
+ },
810
+ {
811
+ "grad_norm": 0.7804251909255981,
812
+ "learning_rate": 9.992147313917222e-05,
813
+ "loss": 0.0879,
814
+ "step": 1340
815
+ },
816
+ {
817
+ "grad_norm": 0.7505974173545837,
818
+ "learning_rate": 9.991677325949497e-05,
819
+ "loss": 0.0877,
820
+ "step": 1350
821
+ },
822
+ {
823
+ "grad_norm": 0.8564302921295166,
824
+ "learning_rate": 9.991193690926568e-05,
825
+ "loss": 0.0853,
826
+ "step": 1360
827
+ },
828
+ {
829
+ "grad_norm": 0.921603798866272,
830
+ "learning_rate": 9.990696410170678e-05,
831
+ "loss": 0.0868,
832
+ "step": 1370
833
+ },
834
+ {
835
+ "grad_norm": 0.905284583568573,
836
+ "learning_rate": 9.990185485041371e-05,
837
+ "loss": 0.0812,
838
+ "step": 1380
839
+ },
840
+ {
841
+ "grad_norm": 0.8342713713645935,
842
+ "learning_rate": 9.989660916935498e-05,
843
+ "loss": 0.0845,
844
+ "step": 1390
845
+ },
846
+ {
847
+ "grad_norm": 0.8646072149276733,
848
+ "learning_rate": 9.989122707287208e-05,
849
+ "loss": 0.0863,
850
+ "step": 1400
851
+ },
852
+ {
853
+ "grad_norm": 1.0666006803512573,
854
+ "learning_rate": 9.988570857567945e-05,
855
+ "loss": 0.0887,
856
+ "step": 1410
857
+ },
858
+ {
859
+ "grad_norm": 0.8190611004829407,
860
+ "learning_rate": 9.988005369286446e-05,
861
+ "loss": 0.0845,
862
+ "step": 1420
863
+ },
864
+ {
865
+ "grad_norm": 0.8214516639709473,
866
+ "learning_rate": 9.987426243988734e-05,
867
+ "loss": 0.0883,
868
+ "step": 1430
869
+ },
870
+ {
871
+ "grad_norm": 0.7905929684638977,
872
+ "learning_rate": 9.986833483258114e-05,
873
+ "loss": 0.0861,
874
+ "step": 1440
875
+ },
876
+ {
877
+ "grad_norm": 0.8426095247268677,
878
+ "learning_rate": 9.986227088715173e-05,
879
+ "loss": 0.0823,
880
+ "step": 1450
881
+ },
882
+ {
883
+ "grad_norm": 0.9610787630081177,
884
+ "learning_rate": 9.98560706201777e-05,
885
+ "loss": 0.0835,
886
+ "step": 1460
887
+ },
888
+ {
889
+ "grad_norm": 0.8222280740737915,
890
+ "learning_rate": 9.984973404861036e-05,
891
+ "loss": 0.0878,
892
+ "step": 1470
893
+ },
894
+ {
895
+ "grad_norm": 0.840451717376709,
896
+ "learning_rate": 9.984326118977361e-05,
897
+ "loss": 0.0812,
898
+ "step": 1480
899
+ },
900
+ {
901
+ "grad_norm": 0.7655553817749023,
902
+ "learning_rate": 9.983665206136406e-05,
903
+ "loss": 0.0784,
904
+ "step": 1490
905
+ },
906
+ {
907
+ "grad_norm": 0.9331004023551941,
908
+ "learning_rate": 9.982990668145075e-05,
909
+ "loss": 0.0779,
910
+ "step": 1500
911
+ },
912
+ {
913
+ "grad_norm": 0.7345725297927856,
914
+ "learning_rate": 9.982302506847534e-05,
915
+ "loss": 0.0792,
916
+ "step": 1510
917
+ },
918
+ {
919
+ "grad_norm": 0.8967569470405579,
920
+ "learning_rate": 9.981600724125189e-05,
921
+ "loss": 0.0782,
922
+ "step": 1520
923
+ },
924
+ {
925
+ "grad_norm": 0.7933437824249268,
926
+ "learning_rate": 9.980885321896685e-05,
927
+ "loss": 0.0773,
928
+ "step": 1530
929
+ },
930
+ {
931
+ "grad_norm": 0.6864101886749268,
932
+ "learning_rate": 9.980156302117905e-05,
933
+ "loss": 0.0773,
934
+ "step": 1540
935
+ },
936
+ {
937
+ "grad_norm": 0.689123272895813,
938
+ "learning_rate": 9.979413666781963e-05,
939
+ "loss": 0.0824,
940
+ "step": 1550
941
+ },
942
+ {
943
+ "grad_norm": 0.8207864165306091,
944
+ "learning_rate": 9.978657417919193e-05,
945
+ "loss": 0.0803,
946
+ "step": 1560
947
+ },
948
+ {
949
+ "grad_norm": 0.7813171744346619,
950
+ "learning_rate": 9.977887557597153e-05,
951
+ "loss": 0.0817,
952
+ "step": 1570
953
+ },
954
+ {
955
+ "grad_norm": 0.695106565952301,
956
+ "learning_rate": 9.97710408792061e-05,
957
+ "loss": 0.0783,
958
+ "step": 1580
959
+ },
960
+ {
961
+ "grad_norm": 0.9048652052879333,
962
+ "learning_rate": 9.976307011031542e-05,
963
+ "loss": 0.0788,
964
+ "step": 1590
965
+ },
966
+ {
967
+ "grad_norm": 0.8499309420585632,
968
+ "learning_rate": 9.975496329109126e-05,
969
+ "loss": 0.081,
970
+ "step": 1600
971
+ },
972
+ {
973
+ "grad_norm": 0.8718334436416626,
974
+ "learning_rate": 9.974672044369732e-05,
975
+ "loss": 0.0777,
976
+ "step": 1610
977
+ },
978
+ {
979
+ "grad_norm": 0.6900801658630371,
980
+ "learning_rate": 9.97383415906693e-05,
981
+ "loss": 0.077,
982
+ "step": 1620
983
+ },
984
+ {
985
+ "grad_norm": 0.8092792630195618,
986
+ "learning_rate": 9.97298267549146e-05,
987
+ "loss": 0.0788,
988
+ "step": 1630
989
+ },
990
+ {
991
+ "grad_norm": 0.8192611932754517,
992
+ "learning_rate": 9.972117595971249e-05,
993
+ "loss": 0.0799,
994
+ "step": 1640
995
+ },
996
+ {
997
+ "grad_norm": 0.8722266554832458,
998
+ "learning_rate": 9.971238922871391e-05,
999
+ "loss": 0.0819,
1000
+ "step": 1650
1001
+ },
1002
+ {
1003
+ "grad_norm": 0.914159893989563,
1004
+ "learning_rate": 9.970346658594142e-05,
1005
+ "loss": 0.0838,
1006
+ "step": 1660
1007
+ },
1008
+ {
1009
+ "grad_norm": 0.8131964206695557,
1010
+ "learning_rate": 9.969440805578923e-05,
1011
+ "loss": 0.0797,
1012
+ "step": 1670
1013
+ },
1014
+ {
1015
+ "grad_norm": 0.7147591710090637,
1016
+ "learning_rate": 9.968521366302298e-05,
1017
+ "loss": 0.0799,
1018
+ "step": 1680
1019
+ },
1020
+ {
1021
+ "grad_norm": 0.8249319791793823,
1022
+ "learning_rate": 9.967588343277981e-05,
1023
+ "loss": 0.0783,
1024
+ "step": 1690
1025
+ },
1026
+ {
1027
+ "grad_norm": 0.7327215075492859,
1028
+ "learning_rate": 9.966641739056818e-05,
1029
+ "loss": 0.0787,
1030
+ "step": 1700
1031
+ },
1032
+ {
1033
+ "grad_norm": 0.7018980979919434,
1034
+ "learning_rate": 9.965681556226793e-05,
1035
+ "loss": 0.0705,
1036
+ "step": 1710
1037
+ },
1038
+ {
1039
+ "grad_norm": 0.8972001671791077,
1040
+ "learning_rate": 9.964707797413006e-05,
1041
+ "loss": 0.0796,
1042
+ "step": 1720
1043
+ },
1044
+ {
1045
+ "grad_norm": 0.8128800392150879,
1046
+ "learning_rate": 9.963720465277679e-05,
1047
+ "loss": 0.0818,
1048
+ "step": 1730
1049
+ },
1050
+ {
1051
+ "grad_norm": 0.9391877055168152,
1052
+ "learning_rate": 9.96271956252014e-05,
1053
+ "loss": 0.0758,
1054
+ "step": 1740
1055
+ },
1056
+ {
1057
+ "grad_norm": 0.8188132047653198,
1058
+ "learning_rate": 9.961705091876816e-05,
1059
+ "loss": 0.0756,
1060
+ "step": 1750
1061
+ },
1062
+ {
1063
+ "grad_norm": 0.8037185668945312,
1064
+ "learning_rate": 9.960677056121235e-05,
1065
+ "loss": 0.0783,
1066
+ "step": 1760
1067
+ },
1068
+ {
1069
+ "grad_norm": 0.6627317070960999,
1070
+ "learning_rate": 9.959635458064005e-05,
1071
+ "loss": 0.0773,
1072
+ "step": 1770
1073
+ },
1074
+ {
1075
+ "grad_norm": 0.6626058220863342,
1076
+ "learning_rate": 9.958580300552815e-05,
1077
+ "loss": 0.0775,
1078
+ "step": 1780
1079
+ },
1080
+ {
1081
+ "grad_norm": 0.7204414010047913,
1082
+ "learning_rate": 9.957511586472426e-05,
1083
+ "loss": 0.0762,
1084
+ "step": 1790
1085
+ },
1086
+ {
1087
+ "grad_norm": 0.6517882347106934,
1088
+ "learning_rate": 9.956429318744662e-05,
1089
+ "loss": 0.0776,
1090
+ "step": 1800
1091
+ },
1092
+ {
1093
+ "grad_norm": 0.7082467675209045,
1094
+ "learning_rate": 9.955333500328404e-05,
1095
+ "loss": 0.0737,
1096
+ "step": 1810
1097
+ },
1098
+ {
1099
+ "grad_norm": 0.7636476159095764,
1100
+ "learning_rate": 9.95422413421957e-05,
1101
+ "loss": 0.0733,
1102
+ "step": 1820
1103
+ },
1104
+ {
1105
+ "grad_norm": 0.72133868932724,
1106
+ "learning_rate": 9.953101223451133e-05,
1107
+ "loss": 0.0749,
1108
+ "step": 1830
1109
+ },
1110
+ {
1111
+ "grad_norm": 0.7455642223358154,
1112
+ "learning_rate": 9.951964771093085e-05,
1113
+ "loss": 0.074,
1114
+ "step": 1840
1115
+ },
1116
+ {
1117
+ "grad_norm": 0.6844678521156311,
1118
+ "learning_rate": 9.950814780252442e-05,
1119
+ "loss": 0.0773,
1120
+ "step": 1850
1121
+ },
1122
+ {
1123
+ "grad_norm": 0.49062681198120117,
1124
+ "learning_rate": 9.949651254073236e-05,
1125
+ "loss": 0.0732,
1126
+ "step": 1860
1127
+ },
1128
+ {
1129
+ "grad_norm": 0.789148211479187,
1130
+ "learning_rate": 9.948474195736504e-05,
1131
+ "loss": 0.0718,
1132
+ "step": 1870
1133
+ },
1134
+ {
1135
+ "grad_norm": 0.6764615178108215,
1136
+ "learning_rate": 9.947283608460277e-05,
1137
+ "loss": 0.0742,
1138
+ "step": 1880
1139
+ },
1140
+ {
1141
+ "grad_norm": 0.6999238133430481,
1142
+ "learning_rate": 9.946079495499577e-05,
1143
+ "loss": 0.0747,
1144
+ "step": 1890
1145
+ },
1146
+ {
1147
+ "grad_norm": 0.7517783045768738,
1148
+ "learning_rate": 9.944861860146401e-05,
1149
+ "loss": 0.0753,
1150
+ "step": 1900
1151
+ },
1152
+ {
1153
+ "grad_norm": 0.7183238863945007,
1154
+ "learning_rate": 9.943630705729719e-05,
1155
+ "loss": 0.0697,
1156
+ "step": 1910
1157
+ },
1158
+ {
1159
+ "grad_norm": 0.5847482681274414,
1160
+ "learning_rate": 9.942386035615459e-05,
1161
+ "loss": 0.072,
1162
+ "step": 1920
1163
+ },
1164
+ {
1165
+ "grad_norm": 0.5976929068565369,
1166
+ "learning_rate": 9.941127853206503e-05,
1167
+ "loss": 0.0694,
1168
+ "step": 1930
1169
+ },
1170
+ {
1171
+ "grad_norm": 0.5992315411567688,
1172
+ "learning_rate": 9.939856161942673e-05,
1173
+ "loss": 0.0729,
1174
+ "step": 1940
1175
+ },
1176
+ {
1177
+ "grad_norm": 0.6920360922813416,
1178
+ "learning_rate": 9.938570965300724e-05,
1179
+ "loss": 0.0693,
1180
+ "step": 1950
1181
+ },
1182
+ {
1183
+ "grad_norm": 0.7227588891983032,
1184
+ "learning_rate": 9.937272266794335e-05,
1185
+ "loss": 0.0779,
1186
+ "step": 1960
1187
+ },
1188
+ {
1189
+ "grad_norm": 0.6451845169067383,
1190
+ "learning_rate": 9.935960069974096e-05,
1191
+ "loss": 0.0705,
1192
+ "step": 1970
1193
+ },
1194
+ {
1195
+ "grad_norm": 0.7243984341621399,
1196
+ "learning_rate": 9.934634378427506e-05,
1197
+ "loss": 0.0708,
1198
+ "step": 1980
1199
+ },
1200
+ {
1201
+ "grad_norm": 0.6210780143737793,
1202
+ "learning_rate": 9.933295195778954e-05,
1203
+ "loss": 0.0772,
1204
+ "step": 1990
1205
+ },
1206
+ {
1207
+ "grad_norm": 0.5807631611824036,
1208
+ "learning_rate": 9.931942525689715e-05,
1209
+ "loss": 0.0745,
1210
+ "step": 2000
1211
+ },
1212
+ {
1213
+ "grad_norm": 0.6609013676643372,
1214
+ "learning_rate": 9.930576371857936e-05,
1215
+ "loss": 0.0723,
1216
+ "step": 2010
1217
+ },
1218
+ {
1219
+ "grad_norm": 0.7919302582740784,
1220
+ "learning_rate": 9.929196738018629e-05,
1221
+ "loss": 0.0702,
1222
+ "step": 2020
1223
+ },
1224
+ {
1225
+ "grad_norm": 0.6295292973518372,
1226
+ "learning_rate": 9.927803627943662e-05,
1227
+ "loss": 0.0674,
1228
+ "step": 2030
1229
+ },
1230
+ {
1231
+ "grad_norm": 0.756155788898468,
1232
+ "learning_rate": 9.926397045441744e-05,
1233
+ "loss": 0.0687,
1234
+ "step": 2040
1235
+ },
1236
+ {
1237
+ "grad_norm": 0.7688308954238892,
1238
+ "learning_rate": 9.924976994358417e-05,
1239
+ "loss": 0.0718,
1240
+ "step": 2050
1241
+ },
1242
+ {
1243
+ "grad_norm": 0.8509033918380737,
1244
+ "learning_rate": 9.923543478576048e-05,
1245
+ "loss": 0.0727,
1246
+ "step": 2060
1247
+ },
1248
+ {
1249
+ "grad_norm": 0.7590917944908142,
1250
+ "learning_rate": 9.922096502013813e-05,
1251
+ "loss": 0.074,
1252
+ "step": 2070
1253
+ },
1254
+ {
1255
+ "grad_norm": 0.8109246492385864,
1256
+ "learning_rate": 9.92063606862769e-05,
1257
+ "loss": 0.0721,
1258
+ "step": 2080
1259
+ },
1260
+ {
1261
+ "grad_norm": 0.6400628685951233,
1262
+ "learning_rate": 9.919162182410453e-05,
1263
+ "loss": 0.0707,
1264
+ "step": 2090
1265
+ },
1266
+ {
1267
+ "grad_norm": 0.5556660890579224,
1268
+ "learning_rate": 9.917674847391645e-05,
1269
+ "loss": 0.0663,
1270
+ "step": 2100
1271
+ },
1272
+ {
1273
+ "grad_norm": 0.7919337749481201,
1274
+ "learning_rate": 9.916174067637584e-05,
1275
+ "loss": 0.0675,
1276
+ "step": 2110
1277
+ },
1278
+ {
1279
+ "grad_norm": 0.6571515798568726,
1280
+ "learning_rate": 9.914659847251348e-05,
1281
+ "loss": 0.0683,
1282
+ "step": 2120
1283
+ },
1284
+ {
1285
+ "grad_norm": 0.5666832327842712,
1286
+ "learning_rate": 9.913132190372753e-05,
1287
+ "loss": 0.0706,
1288
+ "step": 2130
1289
+ },
1290
+ {
1291
+ "grad_norm": 0.6068550944328308,
1292
+ "learning_rate": 9.911591101178359e-05,
1293
+ "loss": 0.067,
1294
+ "step": 2140
1295
+ },
1296
+ {
1297
+ "grad_norm": 0.5472414493560791,
1298
+ "learning_rate": 9.910036583881443e-05,
1299
+ "loss": 0.0686,
1300
+ "step": 2150
1301
+ },
1302
+ {
1303
+ "grad_norm": 0.6243656277656555,
1304
+ "learning_rate": 9.908468642731995e-05,
1305
+ "loss": 0.0663,
1306
+ "step": 2160
1307
+ },
1308
+ {
1309
+ "grad_norm": 0.685313880443573,
1310
+ "learning_rate": 9.906887282016707e-05,
1311
+ "loss": 0.0704,
1312
+ "step": 2170
1313
+ },
1314
+ {
1315
+ "grad_norm": 0.6772751212120056,
1316
+ "learning_rate": 9.90529250605896e-05,
1317
+ "loss": 0.0651,
1318
+ "step": 2180
1319
+ },
1320
+ {
1321
+ "grad_norm": 0.6815426349639893,
1322
+ "learning_rate": 9.903684319218809e-05,
1323
+ "loss": 0.0728,
1324
+ "step": 2190
1325
+ },
1326
+ {
1327
+ "grad_norm": 0.822087287902832,
1328
+ "learning_rate": 9.902062725892976e-05,
1329
+ "loss": 0.0723,
1330
+ "step": 2200
1331
+ },
1332
+ {
1333
+ "grad_norm": 0.6740921139717102,
1334
+ "learning_rate": 9.900427730514834e-05,
1335
+ "loss": 0.0722,
1336
+ "step": 2210
1337
+ },
1338
+ {
1339
+ "grad_norm": 0.730047345161438,
1340
+ "learning_rate": 9.8987793375544e-05,
1341
+ "loss": 0.0717,
1342
+ "step": 2220
1343
+ },
1344
+ {
1345
+ "grad_norm": 0.8769873976707458,
1346
+ "learning_rate": 9.897117551518318e-05,
1347
+ "loss": 0.0672,
1348
+ "step": 2230
1349
+ },
1350
+ {
1351
+ "grad_norm": 0.5988404750823975,
1352
+ "learning_rate": 9.895442376949844e-05,
1353
+ "loss": 0.0691,
1354
+ "step": 2240
1355
+ },
1356
+ {
1357
+ "grad_norm": 0.7594494223594666,
1358
+ "learning_rate": 9.893753818428845e-05,
1359
+ "loss": 0.0703,
1360
+ "step": 2250
1361
+ },
1362
+ {
1363
+ "grad_norm": 0.7655356526374817,
1364
+ "learning_rate": 9.892051880571773e-05,
1365
+ "loss": 0.0643,
1366
+ "step": 2260
1367
+ },
1368
+ {
1369
+ "grad_norm": 0.6700913906097412,
1370
+ "learning_rate": 9.890336568031663e-05,
1371
+ "loss": 0.066,
1372
+ "step": 2270
1373
+ },
1374
+ {
1375
+ "grad_norm": 0.6776233315467834,
1376
+ "learning_rate": 9.888607885498113e-05,
1377
+ "loss": 0.0713,
1378
+ "step": 2280
1379
+ },
1380
+ {
1381
+ "grad_norm": 0.6251364350318909,
1382
+ "learning_rate": 9.886865837697275e-05,
1383
+ "loss": 0.0675,
1384
+ "step": 2290
1385
+ },
1386
+ {
1387
+ "grad_norm": 0.6322036981582642,
1388
+ "learning_rate": 9.88511042939184e-05,
1389
+ "loss": 0.07,
1390
+ "step": 2300
1391
+ },
1392
+ {
1393
+ "grad_norm": 0.6706236600875854,
1394
+ "learning_rate": 9.883341665381028e-05,
1395
+ "loss": 0.0707,
1396
+ "step": 2310
1397
+ },
1398
+ {
1399
+ "grad_norm": 0.7654581069946289,
1400
+ "learning_rate": 9.881559550500575e-05,
1401
+ "loss": 0.0684,
1402
+ "step": 2320
1403
+ },
1404
+ {
1405
+ "grad_norm": 0.6615346074104309,
1406
+ "learning_rate": 9.879764089622712e-05,
1407
+ "loss": 0.0664,
1408
+ "step": 2330
1409
+ },
1410
+ {
1411
+ "grad_norm": 0.6900296807289124,
1412
+ "learning_rate": 9.87795528765616e-05,
1413
+ "loss": 0.0703,
1414
+ "step": 2340
1415
+ },
1416
+ {
1417
+ "grad_norm": 0.6962850689888,
1418
+ "learning_rate": 9.876133149546118e-05,
1419
+ "loss": 0.0712,
1420
+ "step": 2350
1421
+ },
1422
+ {
1423
+ "grad_norm": 0.5966289639472961,
1424
+ "learning_rate": 9.874297680274238e-05,
1425
+ "loss": 0.0705,
1426
+ "step": 2360
1427
+ },
1428
+ {
1429
+ "grad_norm": 0.5869346261024475,
1430
+ "learning_rate": 9.872448884858624e-05,
1431
+ "loss": 0.0673,
1432
+ "step": 2370
1433
+ },
1434
+ {
1435
+ "grad_norm": 0.6729479432106018,
1436
+ "learning_rate": 9.870586768353815e-05,
1437
+ "loss": 0.0698,
1438
+ "step": 2380
1439
+ },
1440
+ {
1441
+ "grad_norm": 0.4968750476837158,
1442
+ "learning_rate": 9.868711335850764e-05,
1443
+ "loss": 0.071,
1444
+ "step": 2390
1445
+ },
1446
+ {
1447
+ "grad_norm": 0.5750929713249207,
1448
+ "learning_rate": 9.866822592476833e-05,
1449
+ "loss": 0.066,
1450
+ "step": 2400
1451
+ },
1452
+ {
1453
+ "grad_norm": 0.6520802974700928,
1454
+ "learning_rate": 9.86492054339577e-05,
1455
+ "loss": 0.0704,
1456
+ "step": 2410
1457
+ },
1458
+ {
1459
+ "grad_norm": 0.6432913541793823,
1460
+ "learning_rate": 9.863005193807711e-05,
1461
+ "loss": 0.0669,
1462
+ "step": 2420
1463
+ },
1464
+ {
1465
+ "grad_norm": 0.7633799314498901,
1466
+ "learning_rate": 9.861076548949143e-05,
1467
+ "loss": 0.0641,
1468
+ "step": 2430
1469
+ },
1470
+ {
1471
+ "grad_norm": 0.727251410484314,
1472
+ "learning_rate": 9.859134614092912e-05,
1473
+ "loss": 0.0666,
1474
+ "step": 2440
1475
+ },
1476
+ {
1477
+ "grad_norm": 0.6507017016410828,
1478
+ "learning_rate": 9.857179394548191e-05,
1479
+ "loss": 0.0631,
1480
+ "step": 2450
1481
+ },
1482
+ {
1483
+ "grad_norm": 0.802526593208313,
1484
+ "learning_rate": 9.855210895660477e-05,
1485
+ "loss": 0.0695,
1486
+ "step": 2460
1487
+ },
1488
+ {
1489
+ "grad_norm": 0.4968661069869995,
1490
+ "learning_rate": 9.853229122811568e-05,
1491
+ "loss": 0.0668,
1492
+ "step": 2470
1493
+ },
1494
+ {
1495
+ "grad_norm": 0.5049183964729309,
1496
+ "learning_rate": 9.851234081419559e-05,
1497
+ "loss": 0.0679,
1498
+ "step": 2480
1499
+ },
1500
+ {
1501
+ "grad_norm": 0.5562856793403625,
1502
+ "learning_rate": 9.849225776938814e-05,
1503
+ "loss": 0.067,
1504
+ "step": 2490
1505
+ },
1506
+ {
1507
+ "grad_norm": 0.578382134437561,
1508
+ "learning_rate": 9.847204214859964e-05,
1509
+ "loss": 0.0641,
1510
+ "step": 2500
1511
+ },
1512
+ {
1513
+ "grad_norm": 0.6934925317764282,
1514
+ "learning_rate": 9.845169400709879e-05,
1515
+ "loss": 0.0677,
1516
+ "step": 2510
1517
+ },
1518
+ {
1519
+ "grad_norm": 0.729125440120697,
1520
+ "learning_rate": 9.843121340051664e-05,
1521
+ "loss": 0.0637,
1522
+ "step": 2520
1523
+ },
1524
+ {
1525
+ "grad_norm": 0.6229711174964905,
1526
+ "learning_rate": 9.841060038484641e-05,
1527
+ "loss": 0.064,
1528
+ "step": 2530
1529
+ },
1530
+ {
1531
+ "grad_norm": 0.6090768575668335,
1532
+ "learning_rate": 9.838985501644328e-05,
1533
+ "loss": 0.0623,
1534
+ "step": 2540
1535
+ },
1536
+ {
1537
+ "grad_norm": 0.8319109082221985,
1538
+ "learning_rate": 9.83689773520243e-05,
1539
+ "loss": 0.0669,
1540
+ "step": 2550
1541
+ },
1542
+ {
1543
+ "grad_norm": 0.6815285086631775,
1544
+ "learning_rate": 9.834796744866819e-05,
1545
+ "loss": 0.0661,
1546
+ "step": 2560
1547
+ },
1548
+ {
1549
+ "grad_norm": 0.49073100090026855,
1550
+ "learning_rate": 9.832682536381525e-05,
1551
+ "loss": 0.0686,
1552
+ "step": 2570
1553
+ },
1554
+ {
1555
+ "grad_norm": 0.5500509142875671,
1556
+ "learning_rate": 9.830555115526711e-05,
1557
+ "loss": 0.0663,
1558
+ "step": 2580
1559
+ },
1560
+ {
1561
+ "grad_norm": 0.5543439388275146,
1562
+ "learning_rate": 9.828414488118667e-05,
1563
+ "loss": 0.0586,
1564
+ "step": 2590
1565
+ },
1566
+ {
1567
+ "grad_norm": 0.5412293672561646,
1568
+ "learning_rate": 9.826260660009785e-05,
1569
+ "loss": 0.065,
1570
+ "step": 2600
1571
+ },
1572
+ {
1573
+ "grad_norm": 0.46607404947280884,
1574
+ "learning_rate": 9.824093637088547e-05,
1575
+ "loss": 0.0643,
1576
+ "step": 2610
1577
+ },
1578
+ {
1579
+ "grad_norm": 0.5089811682701111,
1580
+ "learning_rate": 9.821913425279514e-05,
1581
+ "loss": 0.0627,
1582
+ "step": 2620
1583
+ },
1584
+ {
1585
+ "grad_norm": 0.6004795432090759,
1586
+ "learning_rate": 9.8197200305433e-05,
1587
+ "loss": 0.0648,
1588
+ "step": 2630
1589
+ },
1590
+ {
1591
+ "grad_norm": 0.5946650505065918,
1592
+ "learning_rate": 9.817513458876564e-05,
1593
+ "loss": 0.0634,
1594
+ "step": 2640
1595
+ },
1596
+ {
1597
+ "grad_norm": 0.7084515690803528,
1598
+ "learning_rate": 9.815293716311987e-05,
1599
+ "loss": 0.0653,
1600
+ "step": 2650
1601
+ },
1602
+ {
1603
+ "grad_norm": 0.6806345582008362,
1604
+ "learning_rate": 9.813060808918262e-05,
1605
+ "loss": 0.0639,
1606
+ "step": 2660
1607
+ },
1608
+ {
1609
+ "grad_norm": 0.6408096551895142,
1610
+ "learning_rate": 9.810814742800069e-05,
1611
+ "loss": 0.0641,
1612
+ "step": 2670
1613
+ },
1614
+ {
1615
+ "grad_norm": 0.5025924444198608,
1616
+ "learning_rate": 9.808555524098074e-05,
1617
+ "loss": 0.063,
1618
+ "step": 2680
1619
+ },
1620
+ {
1621
+ "grad_norm": 0.7290829420089722,
1622
+ "learning_rate": 9.806283158988887e-05,
1623
+ "loss": 0.0647,
1624
+ "step": 2690
1625
+ },
1626
+ {
1627
+ "grad_norm": 0.5606433153152466,
1628
+ "learning_rate": 9.803997653685072e-05,
1629
+ "loss": 0.062,
1630
+ "step": 2700
1631
+ },
1632
+ {
1633
+ "grad_norm": 0.5064647793769836,
1634
+ "learning_rate": 9.801699014435112e-05,
1635
+ "loss": 0.0643,
1636
+ "step": 2710
1637
+ },
1638
+ {
1639
+ "grad_norm": 0.5947048664093018,
1640
+ "learning_rate": 9.799387247523398e-05,
1641
+ "loss": 0.06,
1642
+ "step": 2720
1643
+ },
1644
+ {
1645
+ "grad_norm": 0.6373162269592285,
1646
+ "learning_rate": 9.797062359270215e-05,
1647
+ "loss": 0.0596,
1648
+ "step": 2730
1649
+ },
1650
+ {
1651
+ "grad_norm": 0.683765709400177,
1652
+ "learning_rate": 9.794724356031715e-05,
1653
+ "loss": 0.0641,
1654
+ "step": 2740
1655
+ },
1656
+ {
1657
+ "grad_norm": 0.6411890983581543,
1658
+ "learning_rate": 9.792373244199913e-05,
1659
+ "loss": 0.0687,
1660
+ "step": 2750
1661
+ },
1662
+ {
1663
+ "grad_norm": 0.4775662422180176,
1664
+ "learning_rate": 9.790009030202658e-05,
1665
+ "loss": 0.0622,
1666
+ "step": 2760
1667
+ },
1668
+ {
1669
+ "grad_norm": 0.651835560798645,
1670
+ "learning_rate": 9.78763172050362e-05,
1671
+ "loss": 0.0621,
1672
+ "step": 2770
1673
+ },
1674
+ {
1675
+ "grad_norm": 0.6854885220527649,
1676
+ "learning_rate": 9.785241321602274e-05,
1677
+ "loss": 0.0667,
1678
+ "step": 2780
1679
+ },
1680
+ {
1681
+ "grad_norm": 0.6907970309257507,
1682
+ "learning_rate": 9.782837840033879e-05,
1683
+ "loss": 0.0669,
1684
+ "step": 2790
1685
+ },
1686
+ {
1687
+ "grad_norm": 0.5823140740394592,
1688
+ "learning_rate": 9.780421282369461e-05,
1689
+ "loss": 0.0678,
1690
+ "step": 2800
1691
+ },
1692
+ {
1693
+ "grad_norm": 0.6364890933036804,
1694
+ "learning_rate": 9.777991655215797e-05,
1695
+ "loss": 0.0663,
1696
+ "step": 2810
1697
+ },
1698
+ {
1699
+ "grad_norm": 0.5718041658401489,
1700
+ "learning_rate": 9.775548965215394e-05,
1701
+ "loss": 0.0626,
1702
+ "step": 2820
1703
+ },
1704
+ {
1705
+ "grad_norm": 0.4957229793071747,
1706
+ "learning_rate": 9.773093219046474e-05,
1707
+ "loss": 0.0634,
1708
+ "step": 2830
1709
+ },
1710
+ {
1711
+ "grad_norm": 0.6113382577896118,
1712
+ "learning_rate": 9.770624423422954e-05,
1713
+ "loss": 0.0665,
1714
+ "step": 2840
1715
+ },
1716
+ {
1717
+ "grad_norm": 0.6246403455734253,
1718
+ "learning_rate": 9.768142585094426e-05,
1719
+ "loss": 0.0626,
1720
+ "step": 2850
1721
+ },
1722
+ {
1723
+ "grad_norm": 0.6030095219612122,
1724
+ "learning_rate": 9.765647710846142e-05,
1725
+ "loss": 0.0662,
1726
+ "step": 2860
1727
+ },
1728
+ {
1729
+ "grad_norm": 0.5451913475990295,
1730
+ "learning_rate": 9.763139807498991e-05,
1731
+ "loss": 0.0692,
1732
+ "step": 2870
1733
+ },
1734
+ {
1735
+ "grad_norm": 0.5483195185661316,
1736
+ "learning_rate": 9.760618881909487e-05,
1737
+ "loss": 0.0599,
1738
+ "step": 2880
1739
+ },
1740
+ {
1741
+ "grad_norm": 0.47611215710639954,
1742
+ "learning_rate": 9.758084940969744e-05,
1743
+ "loss": 0.0635,
1744
+ "step": 2890
1745
+ },
1746
+ {
1747
+ "grad_norm": 0.5544406175613403,
1748
+ "learning_rate": 9.755537991607459e-05,
1749
+ "loss": 0.0592,
1750
+ "step": 2900
1751
+ },
1752
+ {
1753
+ "grad_norm": 0.6410639882087708,
1754
+ "learning_rate": 9.752978040785895e-05,
1755
+ "loss": 0.0613,
1756
+ "step": 2910
1757
+ },
1758
+ {
1759
+ "grad_norm": 0.6519464254379272,
1760
+ "learning_rate": 9.750405095503859e-05,
1761
+ "loss": 0.0584,
1762
+ "step": 2920
1763
+ },
1764
+ {
1765
+ "grad_norm": 0.6715825200080872,
1766
+ "learning_rate": 9.747819162795686e-05,
1767
+ "loss": 0.064,
1768
+ "step": 2930
1769
+ },
1770
+ {
1771
+ "grad_norm": 0.5294116139411926,
1772
+ "learning_rate": 9.745220249731217e-05,
1773
+ "loss": 0.0617,
1774
+ "step": 2940
1775
+ },
1776
+ {
1777
+ "grad_norm": 0.5013177394866943,
1778
+ "learning_rate": 9.742608363415781e-05,
1779
+ "loss": 0.0579,
1780
+ "step": 2950
1781
+ },
1782
+ {
1783
+ "grad_norm": 0.7086690664291382,
1784
+ "learning_rate": 9.739983510990176e-05,
1785
+ "loss": 0.0627,
1786
+ "step": 2960
1787
+ },
1788
+ {
1789
+ "grad_norm": 0.6349759697914124,
1790
+ "learning_rate": 9.737345699630647e-05,
1791
+ "loss": 0.0676,
1792
+ "step": 2970
1793
+ },
1794
+ {
1795
+ "grad_norm": 0.6648471355438232,
1796
+ "learning_rate": 9.734694936548869e-05,
1797
+ "loss": 0.0642,
1798
+ "step": 2980
1799
+ },
1800
+ {
1801
+ "grad_norm": 0.4997161328792572,
1802
+ "learning_rate": 9.732031228991932e-05,
1803
+ "loss": 0.0603,
1804
+ "step": 2990
1805
+ },
1806
+ {
1807
+ "grad_norm": 0.4930708408355713,
1808
+ "learning_rate": 9.729354584242302e-05,
1809
+ "loss": 0.0596,
1810
+ "step": 3000
1811
+ },
1812
+ {
1813
+ "grad_norm": 0.6939645409584045,
1814
+ "learning_rate": 9.726665009617832e-05,
1815
+ "loss": 0.0627,
1816
+ "step": 3010
1817
+ },
1818
+ {
1819
+ "grad_norm": 0.6745036244392395,
1820
+ "learning_rate": 9.723962512471714e-05,
1821
+ "loss": 0.0622,
1822
+ "step": 3020
1823
+ },
1824
+ {
1825
+ "grad_norm": 0.6208877563476562,
1826
+ "learning_rate": 9.72124710019247e-05,
1827
+ "loss": 0.0599,
1828
+ "step": 3030
1829
+ },
1830
+ {
1831
+ "grad_norm": 0.615725576877594,
1832
+ "learning_rate": 9.718518780203934e-05,
1833
+ "loss": 0.0611,
1834
+ "step": 3040
1835
+ },
1836
+ {
1837
+ "grad_norm": 0.5784436464309692,
1838
+ "learning_rate": 9.715777559965228e-05,
1839
+ "loss": 0.0598,
1840
+ "step": 3050
1841
+ },
1842
+ {
1843
+ "grad_norm": 0.6067401766777039,
1844
+ "learning_rate": 9.713023446970746e-05,
1845
+ "loss": 0.0647,
1846
+ "step": 3060
1847
+ },
1848
+ {
1849
+ "grad_norm": 0.5806649327278137,
1850
+ "learning_rate": 9.710256448750126e-05,
1851
+ "loss": 0.0625,
1852
+ "step": 3070
1853
+ },
1854
+ {
1855
+ "grad_norm": 0.6504300236701965,
1856
+ "learning_rate": 9.707476572868235e-05,
1857
+ "loss": 0.058,
1858
+ "step": 3080
1859
+ },
1860
+ {
1861
+ "grad_norm": 0.500622570514679,
1862
+ "learning_rate": 9.704683826925149e-05,
1863
+ "loss": 0.0577,
1864
+ "step": 3090
1865
+ },
1866
+ {
1867
+ "grad_norm": 0.6325183510780334,
1868
+ "learning_rate": 9.701878218556129e-05,
1869
+ "loss": 0.0603,
1870
+ "step": 3100
1871
+ },
1872
+ {
1873
+ "grad_norm": 0.555566132068634,
1874
+ "learning_rate": 9.699059755431598e-05,
1875
+ "loss": 0.0616,
1876
+ "step": 3110
1877
+ },
1878
+ {
1879
+ "grad_norm": 0.4982530474662781,
1880
+ "learning_rate": 9.696228445257132e-05,
1881
+ "loss": 0.0594,
1882
+ "step": 3120
1883
+ },
1884
+ {
1885
+ "grad_norm": 0.5743557214736938,
1886
+ "learning_rate": 9.693384295773419e-05,
1887
+ "loss": 0.056,
1888
+ "step": 3130
1889
+ },
1890
+ {
1891
+ "grad_norm": 0.4599805772304535,
1892
+ "learning_rate": 9.690527314756259e-05,
1893
+ "loss": 0.0551,
1894
+ "step": 3140
1895
+ },
1896
+ {
1897
+ "grad_norm": 0.6725175976753235,
1898
+ "learning_rate": 9.687657510016527e-05,
1899
+ "loss": 0.0586,
1900
+ "step": 3150
1901
+ },
1902
+ {
1903
+ "grad_norm": 0.5373369455337524,
1904
+ "learning_rate": 9.684774889400161e-05,
1905
+ "loss": 0.0576,
1906
+ "step": 3160
1907
+ },
1908
+ {
1909
+ "grad_norm": 0.6253339648246765,
1910
+ "learning_rate": 9.681879460788135e-05,
1911
+ "loss": 0.0586,
1912
+ "step": 3170
1913
+ },
1914
+ {
1915
+ "grad_norm": 0.6447578072547913,
1916
+ "learning_rate": 9.67897123209644e-05,
1917
+ "loss": 0.0639,
1918
+ "step": 3180
1919
+ },
1920
+ {
1921
+ "grad_norm": 0.44229140877723694,
1922
+ "learning_rate": 9.676050211276062e-05,
1923
+ "loss": 0.0606,
1924
+ "step": 3190
1925
+ },
1926
+ {
1927
+ "grad_norm": 0.6652916669845581,
1928
+ "learning_rate": 9.673116406312962e-05,
1929
+ "loss": 0.0629,
1930
+ "step": 3200
1931
+ },
1932
+ {
1933
+ "grad_norm": 0.7552599906921387,
1934
+ "learning_rate": 9.67016982522805e-05,
1935
+ "loss": 0.0666,
1936
+ "step": 3210
1937
+ },
1938
+ {
1939
+ "grad_norm": 0.6908206939697266,
1940
+ "learning_rate": 9.667210476077164e-05,
1941
+ "loss": 0.0606,
1942
+ "step": 3220
1943
+ },
1944
+ {
1945
+ "grad_norm": 0.5687106251716614,
1946
+ "learning_rate": 9.664238366951055e-05,
1947
+ "loss": 0.0599,
1948
+ "step": 3230
1949
+ },
1950
+ {
1951
+ "grad_norm": 0.563493549823761,
1952
+ "learning_rate": 9.661253505975355e-05,
1953
+ "loss": 0.0569,
1954
+ "step": 3240
1955
+ },
1956
+ {
1957
+ "grad_norm": 0.6353240609169006,
1958
+ "learning_rate": 9.658255901310557e-05,
1959
+ "loss": 0.0593,
1960
+ "step": 3250
1961
+ },
1962
+ {
1963
+ "grad_norm": 0.5277099609375,
1964
+ "learning_rate": 9.655245561152e-05,
1965
+ "loss": 0.0608,
1966
+ "step": 3260
1967
+ },
1968
+ {
1969
+ "grad_norm": 0.5423051118850708,
1970
+ "learning_rate": 9.65222249372984e-05,
1971
+ "loss": 0.0549,
1972
+ "step": 3270
1973
+ },
1974
+ {
1975
+ "grad_norm": 0.474439412355423,
1976
+ "learning_rate": 9.649186707309026e-05,
1977
+ "loss": 0.0592,
1978
+ "step": 3280
1979
+ },
1980
+ {
1981
+ "grad_norm": 0.5447307825088501,
1982
+ "learning_rate": 9.646138210189283e-05,
1983
+ "loss": 0.0573,
1984
+ "step": 3290
1985
+ },
1986
+ {
1987
+ "grad_norm": 0.46958911418914795,
1988
+ "learning_rate": 9.643077010705087e-05,
1989
+ "loss": 0.0648,
1990
+ "step": 3300
1991
+ },
1992
+ {
1993
+ "grad_norm": 0.6247355341911316,
1994
+ "learning_rate": 9.640003117225637e-05,
1995
+ "loss": 0.0649,
1996
+ "step": 3310
1997
+ },
1998
+ {
1999
+ "grad_norm": 0.622942328453064,
2000
+ "learning_rate": 9.636916538154846e-05,
2001
+ "loss": 0.0669,
2002
+ "step": 3320
2003
+ },
2004
+ {
2005
+ "grad_norm": 0.46045130491256714,
2006
+ "learning_rate": 9.633817281931296e-05,
2007
+ "loss": 0.0622,
2008
+ "step": 3330
2009
+ },
2010
+ {
2011
+ "grad_norm": 0.5312515497207642,
2012
+ "learning_rate": 9.630705357028242e-05,
2013
+ "loss": 0.0597,
2014
+ "step": 3340
2015
+ },
2016
+ {
2017
+ "grad_norm": 0.4561923146247864,
2018
+ "learning_rate": 9.627580771953563e-05,
2019
+ "loss": 0.0564,
2020
+ "step": 3350
2021
+ },
2022
+ {
2023
+ "grad_norm": 0.4700702428817749,
2024
+ "learning_rate": 9.624443535249759e-05,
2025
+ "loss": 0.0633,
2026
+ "step": 3360
2027
+ },
2028
+ {
2029
+ "grad_norm": 0.5625237226486206,
2030
+ "learning_rate": 9.621293655493913e-05,
2031
+ "loss": 0.0578,
2032
+ "step": 3370
2033
+ },
2034
+ {
2035
+ "grad_norm": 0.5612451434135437,
2036
+ "learning_rate": 9.618131141297675e-05,
2037
+ "loss": 0.0649,
2038
+ "step": 3380
2039
+ },
2040
+ {
2041
+ "grad_norm": 0.5531405210494995,
2042
+ "learning_rate": 9.614956001307242e-05,
2043
+ "loss": 0.0636,
2044
+ "step": 3390
2045
+ },
2046
+ {
2047
+ "grad_norm": 0.5203084945678711,
2048
+ "learning_rate": 9.611768244203321e-05,
2049
+ "loss": 0.0597,
2050
+ "step": 3400
2051
+ },
2052
+ {
2053
+ "grad_norm": 0.48514410853385925,
2054
+ "learning_rate": 9.60856787870112e-05,
2055
+ "loss": 0.0618,
2056
+ "step": 3410
2057
+ },
2058
+ {
2059
+ "grad_norm": 0.42436739802360535,
2060
+ "learning_rate": 9.605354913550318e-05,
2061
+ "loss": 0.0594,
2062
+ "step": 3420
2063
+ },
2064
+ {
2065
+ "grad_norm": 0.4707908630371094,
2066
+ "learning_rate": 9.602129357535037e-05,
2067
+ "loss": 0.0581,
2068
+ "step": 3430
2069
+ },
2070
+ {
2071
+ "grad_norm": 0.6007688045501709,
2072
+ "learning_rate": 9.598891219473825e-05,
2073
+ "loss": 0.0583,
2074
+ "step": 3440
2075
+ },
2076
+ {
2077
+ "grad_norm": 0.58519446849823,
2078
+ "learning_rate": 9.595640508219625e-05,
2079
+ "loss": 0.0582,
2080
+ "step": 3450
2081
+ },
2082
+ {
2083
+ "grad_norm": 0.6219605207443237,
2084
+ "learning_rate": 9.592377232659761e-05,
2085
+ "loss": 0.0607,
2086
+ "step": 3460
2087
+ },
2088
+ {
2089
+ "grad_norm": 0.5018323659896851,
2090
+ "learning_rate": 9.589101401715904e-05,
2091
+ "loss": 0.0551,
2092
+ "step": 3470
2093
+ },
2094
+ {
2095
+ "grad_norm": 0.5631371140480042,
2096
+ "learning_rate": 9.585813024344045e-05,
2097
+ "loss": 0.0579,
2098
+ "step": 3480
2099
+ },
2100
+ {
2101
+ "grad_norm": 0.7580733299255371,
2102
+ "learning_rate": 9.58251210953449e-05,
2103
+ "loss": 0.0571,
2104
+ "step": 3490
2105
+ },
2106
+ {
2107
+ "grad_norm": 0.6364933252334595,
2108
+ "learning_rate": 9.579198666311809e-05,
2109
+ "loss": 0.0545,
2110
+ "step": 3500
2111
+ },
2112
+ {
2113
+ "grad_norm": 0.6756724715232849,
2114
+ "learning_rate": 9.575872703734832e-05,
2115
+ "loss": 0.0589,
2116
+ "step": 3510
2117
+ },
2118
+ {
2119
+ "grad_norm": 0.4428686499595642,
2120
+ "learning_rate": 9.572534230896611e-05,
2121
+ "loss": 0.0565,
2122
+ "step": 3520
2123
+ },
2124
+ {
2125
+ "grad_norm": 0.5265988707542419,
2126
+ "learning_rate": 9.569183256924403e-05,
2127
+ "loss": 0.0531,
2128
+ "step": 3530
2129
+ },
2130
+ {
2131
+ "grad_norm": 0.6523367762565613,
2132
+ "learning_rate": 9.565819790979646e-05,
2133
+ "loss": 0.058,
2134
+ "step": 3540
2135
+ },
2136
+ {
2137
+ "grad_norm": 0.5738118886947632,
2138
+ "learning_rate": 9.562443842257925e-05,
2139
+ "loss": 0.0607,
2140
+ "step": 3550
2141
+ },
2142
+ {
2143
+ "grad_norm": 0.5877414345741272,
2144
+ "learning_rate": 9.559055419988956e-05,
2145
+ "loss": 0.0599,
2146
+ "step": 3560
2147
+ },
2148
+ {
2149
+ "grad_norm": 0.6353724598884583,
2150
+ "learning_rate": 9.555654533436557e-05,
2151
+ "loss": 0.0581,
2152
+ "step": 3570
2153
+ },
2154
+ {
2155
+ "grad_norm": 0.42666953802108765,
2156
+ "learning_rate": 9.552241191898621e-05,
2157
+ "loss": 0.0556,
2158
+ "step": 3580
2159
+ },
2160
+ {
2161
+ "grad_norm": 0.5157475471496582,
2162
+ "learning_rate": 9.548815404707092e-05,
2163
+ "loss": 0.0604,
2164
+ "step": 3590
2165
+ },
2166
+ {
2167
+ "grad_norm": 0.7215608954429626,
2168
+ "learning_rate": 9.545377181227942e-05,
2169
+ "loss": 0.0601,
2170
+ "step": 3600
2171
+ },
2172
+ {
2173
+ "grad_norm": 0.5162255764007568,
2174
+ "learning_rate": 9.541926530861145e-05,
2175
+ "loss": 0.055,
2176
+ "step": 3610
2177
+ },
2178
+ {
2179
+ "grad_norm": 0.4929755628108978,
2180
+ "learning_rate": 9.538463463040645e-05,
2181
+ "loss": 0.0624,
2182
+ "step": 3620
2183
+ },
2184
+ {
2185
+ "grad_norm": 0.4630160331726074,
2186
+ "learning_rate": 9.534987987234337e-05,
2187
+ "loss": 0.0531,
2188
+ "step": 3630
2189
+ },
2190
+ {
2191
+ "grad_norm": 0.6550790071487427,
2192
+ "learning_rate": 9.53150011294404e-05,
2193
+ "loss": 0.06,
2194
+ "step": 3640
2195
+ },
2196
+ {
2197
+ "grad_norm": 0.6224126815795898,
2198
+ "learning_rate": 9.527999849705471e-05,
2199
+ "loss": 0.058,
2200
+ "step": 3650
2201
+ },
2202
+ {
2203
+ "grad_norm": 0.5941552519798279,
2204
+ "learning_rate": 9.524487207088213e-05,
2205
+ "loss": 0.0605,
2206
+ "step": 3660
2207
+ },
2208
+ {
2209
+ "grad_norm": 0.5191814303398132,
2210
+ "learning_rate": 9.520962194695698e-05,
2211
+ "loss": 0.0554,
2212
+ "step": 3670
2213
+ },
2214
+ {
2215
+ "grad_norm": 0.5197587013244629,
2216
+ "learning_rate": 9.517424822165175e-05,
2217
+ "loss": 0.0604,
2218
+ "step": 3680
2219
+ },
2220
+ {
2221
+ "grad_norm": 0.6364939212799072,
2222
+ "learning_rate": 9.513875099167685e-05,
2223
+ "loss": 0.0607,
2224
+ "step": 3690
2225
+ },
2226
+ {
2227
+ "grad_norm": 0.6344776153564453,
2228
+ "learning_rate": 9.510313035408035e-05,
2229
+ "loss": 0.0591,
2230
+ "step": 3700
2231
+ },
2232
+ {
2233
+ "grad_norm": 0.5283899903297424,
2234
+ "learning_rate": 9.506738640624775e-05,
2235
+ "loss": 0.0548,
2236
+ "step": 3710
2237
+ },
2238
+ {
2239
+ "grad_norm": 0.5169802308082581,
2240
+ "learning_rate": 9.50315192459016e-05,
2241
+ "loss": 0.0568,
2242
+ "step": 3720
2243
+ },
2244
+ {
2245
+ "grad_norm": 0.5627011656761169,
2246
+ "learning_rate": 9.499552897110136e-05,
2247
+ "loss": 0.0575,
2248
+ "step": 3730
2249
+ },
2250
+ {
2251
+ "grad_norm": 0.5730915665626526,
2252
+ "learning_rate": 9.495941568024304e-05,
2253
+ "loss": 0.0544,
2254
+ "step": 3740
2255
+ },
2256
+ {
2257
+ "grad_norm": 0.5705208778381348,
2258
+ "learning_rate": 9.492317947205904e-05,
2259
+ "loss": 0.0554,
2260
+ "step": 3750
2261
+ },
2262
+ {
2263
+ "grad_norm": 0.48615023493766785,
2264
+ "learning_rate": 9.488682044561775e-05,
2265
+ "loss": 0.054,
2266
+ "step": 3760
2267
+ },
2268
+ {
2269
+ "grad_norm": 0.5147746205329895,
2270
+ "learning_rate": 9.485033870032335e-05,
2271
+ "loss": 0.0559,
2272
+ "step": 3770
2273
+ },
2274
+ {
2275
+ "grad_norm": 0.5804494023323059,
2276
+ "learning_rate": 9.481373433591556e-05,
2277
+ "loss": 0.0593,
2278
+ "step": 3780
2279
+ },
2280
+ {
2281
+ "grad_norm": 0.5439186096191406,
2282
+ "learning_rate": 9.47770074524693e-05,
2283
+ "loss": 0.0551,
2284
+ "step": 3790
2285
+ },
2286
+ {
2287
+ "grad_norm": 0.529241681098938,
2288
+ "learning_rate": 9.474015815039446e-05,
2289
+ "loss": 0.0579,
2290
+ "step": 3800
2291
+ },
2292
+ {
2293
+ "grad_norm": 0.42327943444252014,
2294
+ "learning_rate": 9.470318653043565e-05,
2295
+ "loss": 0.0551,
2296
+ "step": 3810
2297
+ },
2298
+ {
2299
+ "grad_norm": 0.4692992568016052,
2300
+ "learning_rate": 9.466609269367185e-05,
2301
+ "loss": 0.0577,
2302
+ "step": 3820
2303
+ },
2304
+ {
2305
+ "grad_norm": 0.6473419070243835,
2306
+ "learning_rate": 9.46288767415162e-05,
2307
+ "loss": 0.0609,
2308
+ "step": 3830
2309
+ },
2310
+ {
2311
+ "grad_norm": 0.624902069568634,
2312
+ "learning_rate": 9.459153877571567e-05,
2313
+ "loss": 0.0592,
2314
+ "step": 3840
2315
+ },
2316
+ {
2317
+ "grad_norm": 0.6024203896522522,
2318
+ "learning_rate": 9.455407889835087e-05,
2319
+ "loss": 0.0575,
2320
+ "step": 3850
2321
+ },
2322
+ {
2323
+ "grad_norm": 0.4566102623939514,
2324
+ "learning_rate": 9.451649721183564e-05,
2325
+ "loss": 0.0536,
2326
+ "step": 3860
2327
+ },
2328
+ {
2329
+ "grad_norm": 0.5603846907615662,
2330
+ "learning_rate": 9.447879381891692e-05,
2331
+ "loss": 0.0541,
2332
+ "step": 3870
2333
+ },
2334
+ {
2335
+ "grad_norm": 0.4703678488731384,
2336
+ "learning_rate": 9.444096882267428e-05,
2337
+ "loss": 0.0544,
2338
+ "step": 3880
2339
+ },
2340
+ {
2341
+ "grad_norm": 0.5888656377792358,
2342
+ "learning_rate": 9.440302232651988e-05,
2343
+ "loss": 0.0562,
2344
+ "step": 3890
2345
+ },
2346
+ {
2347
+ "grad_norm": 0.541254460811615,
2348
+ "learning_rate": 9.436495443419795e-05,
2349
+ "loss": 0.0531,
2350
+ "step": 3900
2351
+ },
2352
+ {
2353
+ "grad_norm": 0.48808667063713074,
2354
+ "learning_rate": 9.432676524978466e-05,
2355
+ "loss": 0.0515,
2356
+ "step": 3910
2357
+ },
2358
+ {
2359
+ "grad_norm": 0.6694585084915161,
2360
+ "learning_rate": 9.42884548776878e-05,
2361
+ "loss": 0.0552,
2362
+ "step": 3920
2363
+ },
2364
+ {
2365
+ "grad_norm": 0.683584451675415,
2366
+ "learning_rate": 9.425002342264646e-05,
2367
+ "loss": 0.0565,
2368
+ "step": 3930
2369
+ },
2370
+ {
2371
+ "grad_norm": 0.5609367489814758,
2372
+ "learning_rate": 9.421147098973077e-05,
2373
+ "loss": 0.0547,
2374
+ "step": 3940
2375
+ },
2376
+ {
2377
+ "grad_norm": 0.6370012164115906,
2378
+ "learning_rate": 9.41727976843416e-05,
2379
+ "loss": 0.0616,
2380
+ "step": 3950
2381
+ },
2382
+ {
2383
+ "grad_norm": 0.5923592448234558,
2384
+ "learning_rate": 9.413400361221029e-05,
2385
+ "loss": 0.0583,
2386
+ "step": 3960
2387
+ },
2388
+ {
2389
+ "grad_norm": 0.6023064255714417,
2390
+ "learning_rate": 9.409508887939835e-05,
2391
+ "loss": 0.0588,
2392
+ "step": 3970
2393
+ },
2394
+ {
2395
+ "grad_norm": 0.6249566078186035,
2396
+ "learning_rate": 9.40560535922972e-05,
2397
+ "loss": 0.0587,
2398
+ "step": 3980
2399
+ },
2400
+ {
2401
+ "grad_norm": 0.4997934103012085,
2402
+ "learning_rate": 9.40168978576278e-05,
2403
+ "loss": 0.0654,
2404
+ "step": 3990
2405
+ },
2406
+ {
2407
+ "grad_norm": 0.5568627119064331,
2408
+ "learning_rate": 9.397762178244043e-05,
2409
+ "loss": 0.055,
2410
+ "step": 4000
2411
+ }
2412
+ ],
2413
+ "logging_steps": 10,
2414
+ "max_steps": 20000,
2415
+ "num_input_tokens_seen": 0,
2416
+ "num_train_epochs": 9223372036854775807,
2417
+ "save_steps": 4000,
2418
+ "stateful_callbacks": {
2419
+ "TrainerControl": {
2420
+ "args": {
2421
+ "should_epoch_stop": false,
2422
+ "should_evaluate": false,
2423
+ "should_log": false,
2424
+ "should_save": true,
2425
+ "should_training_stop": false
2426
+ },
2427
+ "attributes": {}
2428
+ }
2429
+ },
2430
+ "total_flos": 0.0,
2431
+ "train_batch_size": 128,
2432
+ "trial_name": null,
2433
+ "trial_params": null
2434
+ }
checkpoint-4000/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:348441e79ef2f019ff5f9e7b571fdbd2d1a1ba8a05c1268363c11d816d370703
3
+ size 5905
checkpoint-4000/wandb_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"project": "groot-finetune", "run_id": "g1_finetune-20260526-211344-gpu2"}