somusan commited on
Commit
61b42d3
·
verified ·
1 Parent(s): d818948

Upload folder using huggingface_hub

Browse files
checkpoint-5000/config.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_horizon": 50,
3
+ "add_pos_embed": true,
4
+ "apply_sincos_state_encoding": true,
5
+ "architectures": [
6
+ "Gr00tN1d6"
7
+ ],
8
+ "attn_dropout": 0.2,
9
+ "attn_implementation": null,
10
+ "backbone_embedding_dim": 2048,
11
+ "backbone_model_type": "eagle",
12
+ "backbone_trainable_params_fp32": true,
13
+ "collator_overwrite_image_inputs": false,
14
+ "color_jitter_params": {
15
+ "brightness": 0.1,
16
+ "contrast": 0.1,
17
+ "hue": 0.1,
18
+ "saturation": 0.1
19
+ },
20
+ "crop_fraction": 0.95,
21
+ "diffusion_model_cfg": {
22
+ "attention_head_dim": 48,
23
+ "dropout": 0.2,
24
+ "final_dropout": true,
25
+ "interleave_self_attention": true,
26
+ "norm_type": "ada_norm",
27
+ "num_attention_heads": 32,
28
+ "num_layers": 32,
29
+ "output_dim": 1024,
30
+ "positional_embeddings": null
31
+ },
32
+ "eagle_collator": true,
33
+ "formalize_language": true,
34
+ "gemma_collator": false,
35
+ "hidden_size": 1024,
36
+ "image_crop_size": null,
37
+ "image_target_size": null,
38
+ "input_embedding_dim": 1536,
39
+ "load_bf16": true,
40
+ "max_action_dim": 128,
41
+ "max_num_embodiments": 32,
42
+ "max_seq_len": 1024,
43
+ "max_state_dim": 128,
44
+ "model_dtype": "bfloat16",
45
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
46
+ "model_type": "Gr00tN1d6",
47
+ "noise_beta_alpha": 1.5,
48
+ "noise_beta_beta": 1.0,
49
+ "noise_s": 0.999,
50
+ "num_inference_timesteps": 4,
51
+ "num_timestep_buckets": 1000,
52
+ "random_rotation_angle": null,
53
+ "reproject_vision": false,
54
+ "select_layer": 16,
55
+ "shortest_image_edge": 256,
56
+ "state_dropout_prob": 0.15,
57
+ "torch_dtype": "bfloat16",
58
+ "transformers_version": "4.51.3",
59
+ "tune_diffusion_model": true,
60
+ "tune_llm": false,
61
+ "tune_projector": true,
62
+ "tune_top_llm_layers": 4,
63
+ "tune_visual": false,
64
+ "tune_vlln": true,
65
+ "use_albumentations_transforms": true,
66
+ "use_alternate_vl_dit": true,
67
+ "use_flash_attention": true,
68
+ "use_relative_action": true,
69
+ "use_vlln": true
70
+ }
checkpoint-5000/embodiment_id.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "robocasa_panda_omron": 13,
3
+ "gr1": 20,
4
+ "behavior_r1_pro": 24,
5
+ "unitree_g1": 8,
6
+ "oxe_google": 0,
7
+ "oxe_widowx": 1,
8
+ "libero_panda": 2,
9
+ "oxe_droid": 16,
10
+ "new_embodiment": 10
11
+ }
checkpoint-5000/experiment_cfg/conf.yaml ADDED
@@ -0,0 +1,209 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ load_config_path: null
2
+ model:
3
+ model_type: Gr00tN1d6
4
+ model_dtype: bfloat16
5
+ model_name: nvidia/Eagle-Block2A-2B-v2
6
+ backbone_model_type: eagle
7
+ model_revision: null
8
+ tune_top_llm_layers: 4
9
+ backbone_embedding_dim: 2048
10
+ tune_llm: false
11
+ tune_visual: false
12
+ select_layer: 16
13
+ reproject_vision: false
14
+ use_flash_attention: true
15
+ load_bf16: false
16
+ collator_overwrite_image_inputs: false
17
+ eagle_collator: true
18
+ backbone_trainable_params_fp32: true
19
+ image_crop_size: null
20
+ image_target_size: null
21
+ shortest_image_edge: 256
22
+ crop_fraction: 0.95
23
+ random_rotation_angle: null
24
+ color_jitter_params:
25
+ brightness: 0.3
26
+ contrast: 0.4
27
+ saturation: 0.5
28
+ hue: 0.08
29
+ use_albumentations_transforms: true
30
+ formalize_language: true
31
+ apply_sincos_state_encoding: false
32
+ use_relative_action: true
33
+ max_state_dim: 29
34
+ max_action_dim: 29
35
+ action_horizon: 16
36
+ hidden_size: 1024
37
+ input_embedding_dim: 1536
38
+ add_pos_embed: true
39
+ attn_dropout: 0.2
40
+ use_vlln: true
41
+ max_seq_len: 1024
42
+ use_alternate_vl_dit: true
43
+ attend_text_every_n_blocks: 2
44
+ diffusion_model_cfg:
45
+ positional_embeddings: null
46
+ num_layers: 32
47
+ num_attention_heads: 32
48
+ attention_head_dim: 48
49
+ norm_type: ada_norm
50
+ dropout: 0.2
51
+ final_dropout: true
52
+ output_dim: 1024
53
+ interleave_self_attention: true
54
+ num_inference_timesteps: 4
55
+ noise_beta_alpha: 1.5
56
+ noise_beta_beta: 1.0
57
+ noise_s: 0.999
58
+ num_timestep_buckets: 1000
59
+ tune_projector: true
60
+ tune_diffusion_model: true
61
+ tune_vlln: true
62
+ state_dropout_prob: 0.15
63
+ state_additive_noise_scale: 0.0
64
+ max_num_embodiments: 32
65
+ data:
66
+ datasets:
67
+ - dataset_paths:
68
+ - /workspace/teleoperation_dataset_gr00t_v2_p3_4_merged_lerobot_v2
69
+ embodiment_tag: new_embodiment
70
+ mix_ratio: 1.0
71
+ dataset_type: physical_embodiment
72
+ val_dataset_path: null
73
+ modality_configs:
74
+ new_embodiment:
75
+ video:
76
+ delta_indices:
77
+ - 0
78
+ modality_keys:
79
+ - front
80
+ - wrist
81
+ sin_cos_embedding_keys: null
82
+ mean_std_embedding_keys: null
83
+ action_configs: null
84
+ state:
85
+ delta_indices:
86
+ - 0
87
+ modality_keys:
88
+ - single_arm
89
+ - gripper
90
+ sin_cos_embedding_keys: null
91
+ mean_std_embedding_keys: null
92
+ action_configs: null
93
+ action:
94
+ delta_indices:
95
+ - 0
96
+ - 1
97
+ - 2
98
+ - 3
99
+ - 4
100
+ - 5
101
+ - 6
102
+ - 7
103
+ - 8
104
+ - 9
105
+ - 10
106
+ - 11
107
+ - 12
108
+ - 13
109
+ - 14
110
+ - 15
111
+ modality_keys:
112
+ - single_arm
113
+ - gripper
114
+ sin_cos_embedding_keys: null
115
+ mean_std_embedding_keys: null
116
+ action_configs:
117
+ - rep: RELATIVE
118
+ type: NON_EEF
119
+ format: DEFAULT
120
+ state_key: null
121
+ - rep: ABSOLUTE
122
+ type: NON_EEF
123
+ format: DEFAULT
124
+ state_key: null
125
+ language:
126
+ delta_indices:
127
+ - 0
128
+ modality_keys:
129
+ - annotation.human.task_description
130
+ sin_cos_embedding_keys: null
131
+ mean_std_embedding_keys: null
132
+ action_configs: null
133
+ download_cache: false
134
+ shard_size: 1024
135
+ episode_sampling_rate: 0.1
136
+ num_shards_per_epoch: 100000
137
+ override_pretraining_statistics: false
138
+ mode: single_turn
139
+ random_chop: 0.0
140
+ mock_dataset_mode: false
141
+ shuffle: true
142
+ seed: 42
143
+ multiprocessing_context: fork
144
+ allow_padding: false
145
+ subsample_ratio: 1.0
146
+ image_crop_size:
147
+ - 244
148
+ - 244
149
+ image_target_size:
150
+ - 224
151
+ - 224
152
+ video_backend: torchcodec
153
+ training:
154
+ output_dir: /workspace/Isaac-GR00T/outputs/omy_1
155
+ experiment_name: null
156
+ max_steps: 5000
157
+ global_batch_size: 32
158
+ batch_size: null
159
+ gradient_accumulation_steps: 1
160
+ learning_rate: 5.0e-05
161
+ lr_scheduler_type: cosine
162
+ weight_decay: 0.0001
163
+ warmup_ratio: 0.05
164
+ warmup_steps: 0
165
+ max_grad_norm: 1.0
166
+ optim: adamw_torch
167
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
168
+ tf32: true
169
+ fp16: false
170
+ bf16: true
171
+ eval_bf16: true
172
+ logging_steps: 10
173
+ save_steps: 5000
174
+ save_total_limit: 1
175
+ save_vl_model: false
176
+ upload_checkpoints: false
177
+ upload_every: 1000
178
+ upload_last_n_checkpoints: 5
179
+ max_concurrent_uploads: 2
180
+ eval_strategy: 'no'
181
+ eval_steps: 500
182
+ eval_set_split_ratio: 0.1
183
+ eval_batch_size: 2
184
+ save_best_eval_metric_name: ''
185
+ save_best_eval_metric_greater_is_better: true
186
+ deepspeed_stage: 2
187
+ gradient_checkpointing: false
188
+ transformers_trust_remote_code: true
189
+ transformers_local_files_only: false
190
+ transformers_cache_dir: null
191
+ transformers_access_token: null
192
+ use_ddp: false
193
+ ddp_bucket_cap_mb: 100
194
+ num_gpus: 1
195
+ dataloader_num_workers: 4
196
+ remove_unused_columns: false
197
+ use_wandb: false
198
+ wandb_project: finetune-gr00t-n1d6
199
+ enable_profiling: false
200
+ max_retries: 3
201
+ assert_loss_less_than: null
202
+ add_rl_callback: false
203
+ enable_open_loop_eval: false
204
+ open_loop_eval_traj_ids:
205
+ - 0
206
+ open_loop_eval_steps_per_traj: 100
207
+ open_loop_eval_plot_indices: null
208
+ max_steps: 5000
209
+ save_steps: 5000
checkpoint-5000/experiment_cfg/config.yaml ADDED
@@ -0,0 +1,243 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:gr00t.configs.base_config.Config
2
+ data: !!python/object:gr00t.configs.data.data_config.DataConfig
3
+ allow_padding: false
4
+ datasets:
5
+ - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
6
+ dataset_paths:
7
+ - /workspace/teleoperation_dataset_gr00t_v2_p3_4_merged_lerobot_v2
8
+ dataset_type: physical_embodiment
9
+ embodiment_tag: new_embodiment
10
+ mix_ratio: 1.0
11
+ val_dataset_path: null
12
+ download_cache: false
13
+ episode_sampling_rate: 0.1
14
+ image_crop_size:
15
+ - 244
16
+ - 244
17
+ image_target_size:
18
+ - 224
19
+ - 224
20
+ mock_dataset_mode: false
21
+ modality_configs:
22
+ new_embodiment:
23
+ action: !!python/object:gr00t.data.types.ModalityConfig
24
+ action_configs:
25
+ - !!python/object:gr00t.data.types.ActionConfig
26
+ format: &id001 !!python/object/apply:gr00t.data.types.ActionFormat
27
+ - default
28
+ rep: !!python/object/apply:gr00t.data.types.ActionRepresentation
29
+ - relative
30
+ state_key: null
31
+ type: &id002 !!python/object/apply:gr00t.data.types.ActionType
32
+ - non_eef
33
+ - !!python/object:gr00t.data.types.ActionConfig
34
+ format: *id001
35
+ rep: !!python/object/apply:gr00t.data.types.ActionRepresentation
36
+ - absolute
37
+ state_key: null
38
+ type: *id002
39
+ delta_indices:
40
+ - 0
41
+ - 1
42
+ - 2
43
+ - 3
44
+ - 4
45
+ - 5
46
+ - 6
47
+ - 7
48
+ - 8
49
+ - 9
50
+ - 10
51
+ - 11
52
+ - 12
53
+ - 13
54
+ - 14
55
+ - 15
56
+ mean_std_embedding_keys: null
57
+ modality_keys:
58
+ - single_arm
59
+ - gripper
60
+ sin_cos_embedding_keys: null
61
+ language: !!python/object:gr00t.data.types.ModalityConfig
62
+ action_configs: null
63
+ delta_indices:
64
+ - 0
65
+ mean_std_embedding_keys: null
66
+ modality_keys:
67
+ - annotation.human.task_description
68
+ sin_cos_embedding_keys: null
69
+ state: !!python/object:gr00t.data.types.ModalityConfig
70
+ action_configs: null
71
+ delta_indices:
72
+ - 0
73
+ mean_std_embedding_keys: null
74
+ modality_keys:
75
+ - single_arm
76
+ - gripper
77
+ sin_cos_embedding_keys: null
78
+ video: !!python/object:gr00t.data.types.ModalityConfig
79
+ action_configs: null
80
+ delta_indices:
81
+ - 0
82
+ mean_std_embedding_keys: null
83
+ modality_keys:
84
+ - front
85
+ - wrist
86
+ sin_cos_embedding_keys: null
87
+ mode: single_turn
88
+ multiprocessing_context: fork
89
+ num_shards_per_epoch: 100000
90
+ override_pretraining_statistics: false
91
+ random_chop: 0.0
92
+ seed: 42
93
+ shard_size: 1024
94
+ shuffle: true
95
+ subsample_ratio: 1.0
96
+ video_backend: torchcodec
97
+ load_config_path: null
98
+ model: !!python/object:gr00t.configs.model.gr00t_n1d6.Gr00tN1d6Config
99
+ _attn_implementation_autoset: false
100
+ _attn_implementation_internal: null
101
+ _commit_hash: null
102
+ _name_or_path: ''
103
+ add_cross_attention: false
104
+ architectures: null
105
+ backbone_model_type: eagle
106
+ backbone_trainable_params_fp32: true
107
+ bad_words_ids: null
108
+ begin_suppress_tokens: null
109
+ bos_token_id: null
110
+ chunk_size_feed_forward: 0
111
+ color_jitter_params:
112
+ brightness: 0.3
113
+ contrast: 0.4
114
+ hue: 0.08
115
+ saturation: 0.5
116
+ cross_attention_hidden_size: null
117
+ decoder_start_token_id: null
118
+ diffusion_model_cfg:
119
+ attention_head_dim: 48
120
+ dropout: 0.2
121
+ final_dropout: true
122
+ interleave_self_attention: true
123
+ norm_type: ada_norm
124
+ num_attention_heads: 32
125
+ num_layers: 32
126
+ output_dim: 1024
127
+ positional_embeddings: null
128
+ diversity_penalty: 0.0
129
+ do_sample: false
130
+ eagle_collator: true
131
+ early_stopping: false
132
+ encoder_no_repeat_ngram_size: 0
133
+ eos_token_id: null
134
+ exponential_decay_length_penalty: null
135
+ finetuning_task: null
136
+ forced_bos_token_id: null
137
+ forced_eos_token_id: null
138
+ id2label:
139
+ 0: LABEL_0
140
+ 1: LABEL_1
141
+ is_decoder: false
142
+ is_encoder_decoder: false
143
+ label2id:
144
+ LABEL_0: 0
145
+ LABEL_1: 1
146
+ length_penalty: 1.0
147
+ load_bf16: false
148
+ max_length: 20
149
+ min_length: 0
150
+ model_name: nvidia/Eagle-Block2A-2B-v2
151
+ no_repeat_ngram_size: 0
152
+ num_beam_groups: 1
153
+ num_beams: 1
154
+ num_return_sequences: 1
155
+ output_attentions: false
156
+ output_hidden_states: false
157
+ output_scores: false
158
+ pad_token_id: null
159
+ prefix: null
160
+ problem_type: null
161
+ pruned_heads: {}
162
+ random_rotation_angle: null
163
+ remove_invalid_values: false
164
+ repetition_penalty: 1.0
165
+ reproject_vision: false
166
+ return_dict: true
167
+ return_dict_in_generate: false
168
+ sep_token_id: null
169
+ state_dropout_prob: 0.15
170
+ suppress_tokens: null
171
+ task_specific_params: null
172
+ temperature: 1.0
173
+ tf_legacy_loss: false
174
+ tie_encoder_decoder: false
175
+ tie_word_embeddings: true
176
+ tokenizer_class: null
177
+ top_k: 50
178
+ top_p: 1.0
179
+ torch_dtype: null
180
+ torchscript: false
181
+ transformers_version: null
182
+ tune_diffusion_model: true
183
+ tune_llm: false
184
+ tune_projector: true
185
+ tune_visual: false
186
+ typical_p: 1.0
187
+ use_bfloat16: false
188
+ use_relative_action: true
189
+ training: !!python/object:gr00t.configs.training.training_config.TrainingConfig
190
+ add_rl_callback: false
191
+ assert_loss_less_than: null
192
+ batch_size: null
193
+ bf16: true
194
+ dataloader_num_workers: 4
195
+ ddp_bucket_cap_mb: 100
196
+ deepspeed_stage: 2
197
+ enable_open_loop_eval: false
198
+ enable_profiling: false
199
+ eval_batch_size: 2
200
+ eval_bf16: true
201
+ eval_set_split_ratio: 0.1
202
+ eval_steps: 500
203
+ eval_strategy: 'no'
204
+ experiment_name: null
205
+ fp16: false
206
+ global_batch_size: 32
207
+ gradient_accumulation_steps: 1
208
+ gradient_checkpointing: false
209
+ learning_rate: 5.0e-05
210
+ logging_steps: 10
211
+ lr_scheduler_type: cosine
212
+ max_concurrent_uploads: 2
213
+ max_grad_norm: 1.0
214
+ max_retries: 3
215
+ max_steps: 5000
216
+ num_gpus: 1
217
+ open_loop_eval_plot_indices: null
218
+ open_loop_eval_steps_per_traj: 100
219
+ open_loop_eval_traj_ids:
220
+ - 0
221
+ optim: adamw_torch
222
+ output_dir: /workspace/Isaac-GR00T/outputs/omy_1
223
+ remove_unused_columns: false
224
+ save_best_eval_metric_greater_is_better: true
225
+ save_best_eval_metric_name: ''
226
+ save_steps: 5000
227
+ save_total_limit: 1
228
+ save_vl_model: false
229
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
230
+ tf32: true
231
+ transformers_access_token: null
232
+ transformers_cache_dir: null
233
+ transformers_local_files_only: false
234
+ transformers_trust_remote_code: true
235
+ upload_checkpoints: false
236
+ upload_every: 1000
237
+ upload_last_n_checkpoints: 5
238
+ use_ddp: false
239
+ use_wandb: false
240
+ wandb_project: finetune-gr00t-n1d6
241
+ warmup_ratio: 0.05
242
+ warmup_steps: 0
243
+ weight_decay: 0.0001
checkpoint-5000/experiment_cfg/dataset_statistics.json ADDED
@@ -0,0 +1,932 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "new_embodiment": {
3
+ "state": {
4
+ "single_arm": {
5
+ "min": [
6
+ -0.3484296202659607,
7
+ -0.2940049469470978,
8
+ -1.4568357467651367,
9
+ -0.918129026889801,
10
+ 1.5524020195007324,
11
+ -0.8714576959609985
12
+ ],
13
+ "max": [
14
+ 0.871225893497467,
15
+ 1.4812145233154297,
16
+ 2.2445228099823,
17
+ 1.6041626930236816,
18
+ 1.580612301826477,
19
+ 0.34752944111824036
20
+ ],
21
+ "mean": [
22
+ 0.0660708295904004,
23
+ 0.2896196729390686,
24
+ 1.273881831918799,
25
+ 0.07309057529716799,
26
+ 1.5695173609910642,
27
+ -0.0675732313873097
28
+ ],
29
+ "std": [
30
+ 0.24684875710013002,
31
+ 0.2624021895353532,
32
+ 0.6396142403168285,
33
+ 0.5623540573067425,
34
+ 0.0019495733088944448,
35
+ 0.24706634675426653
36
+ ],
37
+ "q01": [
38
+ -0.14120122547514716,
39
+ -0.15137712556556798,
40
+ 0.25940447983184756,
41
+ -0.7327557047228977,
42
+ 1.5623217466486523,
43
+ -0.6984691145028645
44
+ ],
45
+ "q99": [
46
+ 0.6986005893203253,
47
+ 0.6137331449754688,
48
+ 1.989423889739015,
49
+ 0.902999176898917,
50
+ 1.5715922809600218,
51
+ 0.13965727915057108
52
+ ]
53
+ },
54
+ "gripper": {
55
+ "min": [
56
+ 0.0
57
+ ],
58
+ "max": [
59
+ 1.0
60
+ ],
61
+ "mean": [
62
+ 0.2753448165213926
63
+ ],
64
+ "std": [
65
+ 0.44668786429986657
66
+ ],
67
+ "q01": [
68
+ -1.000000013351432e-10
69
+ ],
70
+ "q99": [
71
+ 0.9999925267031382
72
+ ]
73
+ }
74
+ },
75
+ "action": {
76
+ "single_arm": {
77
+ "min": [
78
+ -0.35249605774879456,
79
+ -0.340976357460022,
80
+ -1.4720337390899658,
81
+ -0.9139819741249084,
82
+ 1.5523695945739746,
83
+ -0.8805081248283386
84
+ ],
85
+ "max": [
86
+ 0.8796143531799316,
87
+ 1.4417712688446045,
88
+ 2.2255284786224365,
89
+ 1.6055001020431519,
90
+ 1.571340799331665,
91
+ 0.351653516292572
92
+ ],
93
+ "mean": [
94
+ 0.07284960426261836,
95
+ 0.2567877877935287,
96
+ 1.2472866734129062,
97
+ 0.0652026161086495,
98
+ 1.56964799977149,
99
+ -0.07374245072646021
100
+ ],
101
+ "std": [
102
+ 0.25668078105389325,
103
+ 0.25697145420740913,
104
+ 0.6486887061942791,
105
+ 0.566977630034768,
106
+ 0.002414096561250562,
107
+ 0.2566087339519503
108
+ ],
109
+ "q01": [
110
+ -0.1498670041869513,
111
+ -0.17465162009659907,
112
+ 0.2170314396344432,
113
+ -0.7378591563813238,
114
+ 1.5674572562165083,
115
+ -0.7113432860253213
116
+ ],
117
+ "q99": [
118
+ 0.7104775490699361,
119
+ 0.5871068334930613,
120
+ 1.9767465605823349,
121
+ 0.9021054332053293,
122
+ 1.5705683645924846,
123
+ 0.14903640795681997
124
+ ]
125
+ },
126
+ "gripper": {
127
+ "min": [
128
+ 0.0
129
+ ],
130
+ "max": [
131
+ 1.0
132
+ ],
133
+ "mean": [
134
+ 0.2733744355732537
135
+ ],
136
+ "std": [
137
+ 0.4456914315372699
138
+ ],
139
+ "q01": [
140
+ -1.000000013351432e-10
141
+ ],
142
+ "q99": [
143
+ 0.9999924756906762
144
+ ]
145
+ }
146
+ },
147
+ "relative_action": {
148
+ "single_arm": {
149
+ "min": [
150
+ [
151
+ -0.15696251392364502,
152
+ -0.34446781873703003,
153
+ -0.6737130880355835,
154
+ -0.3178783655166626,
155
+ -0.01156306266784668,
156
+ -0.16844062507152557
157
+ ],
158
+ [
159
+ -0.1919003129005432,
160
+ -0.4053707718849182,
161
+ -0.7816908955574036,
162
+ -0.38410383462905884,
163
+ -0.011548161506652832,
164
+ -0.2033797651529312
165
+ ],
166
+ [
167
+ -0.22658002376556396,
168
+ -0.46504658460617065,
169
+ -0.8752028942108154,
170
+ -0.4481411576271057,
171
+ -0.011525154113769531,
172
+ -0.2386666089296341
173
+ ],
174
+ [
175
+ -0.25767937302589417,
176
+ -0.5173105597496033,
177
+ -0.960516095161438,
178
+ -0.5121691226959229,
179
+ -0.011506915092468262,
180
+ -0.2736057639122009
181
+ ],
182
+ [
183
+ -0.2887968122959137,
184
+ -0.5641186833381653,
185
+ -1.0343924760818481,
186
+ -0.5759719610214233,
187
+ -0.011516809463500977,
188
+ -0.30846402049064636
189
+ ],
190
+ [
191
+ -0.3199325501918793,
192
+ -0.6068925261497498,
193
+ -1.1042704582214355,
194
+ -0.6281388401985168,
195
+ -0.011510848999023438,
196
+ -0.34338027238845825
197
+ ],
198
+ [
199
+ -0.3509705364704132,
200
+ -0.6361642479896545,
201
+ -1.1701284646987915,
202
+ -0.6791977882385254,
203
+ -0.011488914489746094,
204
+ -0.37825170159339905
205
+ ],
206
+ [
207
+ -0.38060125708580017,
208
+ -0.6464956998825073,
209
+ -1.2320352792739868,
210
+ -0.7301526665687561,
211
+ -0.01146841049194336,
212
+ -0.4131423830986023
213
+ ],
214
+ [
215
+ -0.40787461400032043,
216
+ -0.6518352031707764,
217
+ -1.2899482250213623,
218
+ -0.7853091359138489,
219
+ -0.011491179466247559,
220
+ -0.448012113571167
221
+ ],
222
+ [
223
+ -0.4350906312465668,
224
+ -0.6538127660751343,
225
+ -1.3439218997955322,
226
+ -0.8374760150909424,
227
+ -0.011620759963989258,
228
+ -0.48276638984680176
229
+ ],
230
+ [
231
+ -0.4614231288433075,
232
+ -0.6572719812393188,
233
+ -1.3943485021591187,
234
+ -0.8772416114807129,
235
+ -0.011820793151855469,
236
+ -0.5160169005393982
237
+ ],
238
+ [
239
+ -0.485305517911911,
240
+ -0.6611306667327881,
241
+ -1.4443868398666382,
242
+ -0.9266657829284668,
243
+ -0.012117266654968262,
244
+ -0.547016978263855
245
+ ],
246
+ [
247
+ -0.5076735019683838,
248
+ -0.663108229637146,
249
+ -1.4905352592468262,
250
+ -0.9745397567749023,
251
+ -0.01165163516998291,
252
+ -0.5803918838500977
253
+ ],
254
+ [
255
+ -0.5290192365646362,
256
+ -0.6650083065032959,
257
+ -1.533168911933899,
258
+ -1.0207548141479492,
259
+ -0.011184930801391602,
260
+ -0.6152510046958923
261
+ ],
262
+ [
263
+ -0.5489386320114136,
264
+ -0.6667595505714417,
265
+ -1.5753229856491089,
266
+ -1.051430106163025,
267
+ -0.0109940767288208,
268
+ -0.6500052809715271
269
+ ],
270
+ [
271
+ -0.5668587684631348,
272
+ -0.667188823223114,
273
+ -1.6137160062789917,
274
+ -1.0931904315948486,
275
+ -0.010291337966918945,
276
+ -0.6832557916641235
277
+ ]
278
+ ],
279
+ "max": [
280
+ [
281
+ 0.16824336349964142,
282
+ 0.24052470922470093,
283
+ 0.5061454772949219,
284
+ 0.39507728815078735,
285
+ 0.006520986557006836,
286
+ 0.15706884860992432
287
+ ],
288
+ [
289
+ 0.20314648747444153,
290
+ 0.3025338053703308,
291
+ 0.6245244741439819,
292
+ 0.4650633931159973,
293
+ 0.006515979766845703,
294
+ 0.19194811582565308
295
+ ],
296
+ [
297
+ 0.2384708970785141,
298
+ 0.36002570390701294,
299
+ 0.7428172826766968,
300
+ 0.5275017023086548,
301
+ 0.006508588790893555,
302
+ 0.22680965065956116
303
+ ],
304
+ [
305
+ 0.2733740210533142,
306
+ 0.4157518148422241,
307
+ 0.8477752208709717,
308
+ 0.5841488242149353,
309
+ 0.00649869441986084,
310
+ 0.25784188508987427
311
+ ],
312
+ [
313
+ 0.30832749605178833,
314
+ 0.470317006111145,
315
+ 0.9313650131225586,
316
+ 0.6372599005699158,
317
+ 0.0064623355865478516,
318
+ 0.2888680100440979
319
+ ],
320
+ [
321
+ 0.343273401260376,
322
+ 0.5153665542602539,
323
+ 1.0067442655563354,
324
+ 0.6891289949417114,
325
+ 0.006403207778930664,
326
+ 0.31988149881362915
327
+ ],
328
+ [
329
+ 0.37823686003685,
330
+ 0.5592126250267029,
331
+ 1.065140724182129,
332
+ 0.7395720481872559,
333
+ 0.006318211555480957,
334
+ 0.3508707284927368
335
+ ],
336
+ [
337
+ 0.4132160246372223,
338
+ 0.5731149315834045,
339
+ 1.0996272563934326,
340
+ 0.788618266582489,
341
+ 0.006203055381774902,
342
+ 0.380546510219574
343
+ ],
344
+ [
345
+ 0.4482080936431885,
346
+ 0.5804688334465027,
347
+ 1.1714509725570679,
348
+ 0.8365987539291382,
349
+ 0.006093502044677734,
350
+ 0.40765124559402466
351
+ ],
352
+ [
353
+ 0.4830245077610016,
354
+ 0.5881319642066956,
355
+ 1.2263423204421997,
356
+ 0.8837657570838928,
357
+ 0.006119847297668457,
358
+ 0.4347139000892639
359
+ ],
360
+ [
361
+ 0.5162209272384644,
362
+ 0.5954858660697937,
363
+ 1.2864584922790527,
364
+ 0.9293184876441956,
365
+ 0.006140708923339844,
366
+ 0.4610365033149719
367
+ ],
368
+ [
369
+ 0.5473360419273376,
370
+ 0.5992559194564819,
371
+ 1.3450905084609985,
372
+ 0.9761509299278259,
373
+ 0.0061490535736083984,
374
+ 0.4848148226737976
375
+ ],
376
+ [
377
+ 0.5806077122688293,
378
+ 0.6047143936157227,
379
+ 1.3999574184417725,
380
+ 1.0215784311294556,
381
+ 0.006112813949584961,
382
+ 0.5069919228553772
383
+ ],
384
+ [
385
+ 0.6154510378837585,
386
+ 0.6339849233627319,
387
+ 1.451041579246521,
388
+ 1.0653609037399292,
389
+ 0.006089210510253906,
390
+ 0.5281317234039307
391
+ ],
392
+ [
393
+ 0.6502674221992493,
394
+ 0.6601248383522034,
395
+ 1.4983268976211548,
396
+ 1.1104395389556885,
397
+ 0.006052851676940918,
398
+ 0.5478552579879761
399
+ ],
400
+ [
401
+ 0.6834638714790344,
402
+ 0.6824098229408264,
403
+ 1.5142232179641724,
404
+ 1.1536270380020142,
405
+ 0.006022810935974121,
406
+ 0.565622091293335
407
+ ]
408
+ ],
409
+ "mean": [
410
+ [
411
+ 0.002399730496108532,
412
+ -0.03371857479214668,
413
+ -0.026506593450903893,
414
+ -0.007294314913451672,
415
+ -3.3637643355177715e-05,
416
+ -0.002175837755203247
417
+ ],
418
+ [
419
+ 0.0029731958638876677,
420
+ -0.03329775482416153,
421
+ -0.026526525616645813,
422
+ -0.007697952911257744,
423
+ -3.4519027394708246e-05,
424
+ -0.0027493059169501066
425
+ ],
426
+ [
427
+ 0.003604522440582514,
428
+ -0.032867252826690674,
429
+ -0.02654336765408516,
430
+ -0.008099138736724854,
431
+ -3.462656241026707e-05,
432
+ -0.0033809158485382795
433
+ ],
434
+ [
435
+ 0.004330680705606937,
436
+ -0.03244740143418312,
437
+ -0.026560107246041298,
438
+ -0.008501662872731686,
439
+ -3.4149335988331586e-05,
440
+ -0.004107005428522825
441
+ ],
442
+ [
443
+ 0.005132367368787527,
444
+ -0.032020263373851776,
445
+ -0.026579467579722404,
446
+ -0.00890059769153595,
447
+ -3.363030918990262e-05,
448
+ -0.004908420145511627
449
+ ],
450
+ [
451
+ 0.006013290956616402,
452
+ -0.03158460557460785,
453
+ -0.026602549478411674,
454
+ -0.00930008850991726,
455
+ -3.3384036214556545e-05,
456
+ -0.005788702052086592
457
+ ],
458
+ [
459
+ 0.0069674355909228325,
460
+ -0.031136885285377502,
461
+ -0.026633556932210922,
462
+ -0.009698453359305859,
463
+ -3.306723738205619e-05,
464
+ -0.006742133293300867
465
+ ],
466
+ [
467
+ 0.007998677901923656,
468
+ -0.030675340443849564,
469
+ -0.026676973327994347,
470
+ -0.010097721591591835,
471
+ -3.293266854598187e-05,
472
+ -0.007772281300276518
473
+ ],
474
+ [
475
+ 0.009103219956159592,
476
+ -0.030197689309716225,
477
+ -0.026734555140137672,
478
+ -0.010497260838747025,
479
+ -3.274149639764801e-05,
480
+ -0.008875810541212559
481
+ ],
482
+ [
483
+ 0.01028699241578579,
484
+ -0.029703862965106964,
485
+ -0.026812396943569183,
486
+ -0.010893884114921093,
487
+ -3.268092768848874e-05,
488
+ -0.010058477520942688
489
+ ],
490
+ [
491
+ 0.011553517542779446,
492
+ -0.029192553833127022,
493
+ -0.026906808838248253,
494
+ -0.011289995163679123,
495
+ -3.269802255090326e-05,
496
+ -0.01132387388497591
497
+ ],
498
+ [
499
+ 0.012908070348203182,
500
+ -0.028664078563451767,
501
+ -0.02701812982559204,
502
+ -0.011685356497764587,
503
+ -3.28218775393907e-05,
504
+ -0.012677285820245743
505
+ ],
506
+ [
507
+ 0.014355717226862907,
508
+ -0.028118710964918137,
509
+ -0.027147676795721054,
510
+ -0.012079907581210136,
511
+ -3.296746945125051e-05,
512
+ -0.014123816974461079
513
+ ],
514
+ [
515
+ 0.015898622572422028,
516
+ -0.027556538581848145,
517
+ -0.02729668840765953,
518
+ -0.012473052367568016,
519
+ -3.313259003334679e-05,
520
+ -0.015665428712964058
521
+ ],
522
+ [
523
+ 0.01753367856144905,
524
+ -0.026974856853485107,
525
+ -0.027466658502817154,
526
+ -0.012863936834037304,
527
+ -3.3350897865602747e-05,
528
+ -0.01729944720864296
529
+ ],
530
+ [
531
+ 0.019253134727478027,
532
+ -0.026369046419858932,
533
+ -0.02766418643295765,
534
+ -0.013252663426101208,
535
+ -3.3440224797232077e-05,
536
+ -0.019018059596419334
537
+ ]
538
+ ],
539
+ "std": [
540
+ [
541
+ 0.04323775693774223,
542
+ 0.045802634209394455,
543
+ 0.10585169494152069,
544
+ 0.08371099829673767,
545
+ 0.000734939647372812,
546
+ 0.04311731085181236
547
+ ],
548
+ [
549
+ 0.052831608802080154,
550
+ 0.0550084225833416,
551
+ 0.12866128981113434,
552
+ 0.10224901884794235,
553
+ 0.0007391870021820068,
554
+ 0.052699752151966095
555
+ ],
556
+ [
557
+ 0.06230269744992256,
558
+ 0.06383407860994339,
559
+ 0.15080901980400085,
560
+ 0.12041323632001877,
561
+ 0.0007443022332154214,
562
+ 0.0621633417904377
563
+ ],
564
+ [
565
+ 0.07166402041912079,
566
+ 0.07222028821706772,
567
+ 0.17223787307739258,
568
+ 0.13817144930362701,
569
+ 0.0007505182875320315,
570
+ 0.07151757925748825
571
+ ],
572
+ [
573
+ 0.08089207857847214,
574
+ 0.08016153424978256,
575
+ 0.19294390082359314,
576
+ 0.1555166095495224,
577
+ 0.000756296853069216,
578
+ 0.08074097335338593
579
+ ],
580
+ [
581
+ 0.0899948924779892,
582
+ 0.08766801655292511,
583
+ 0.2129502147436142,
584
+ 0.17245666682720184,
585
+ 0.0007633369532413781,
586
+ 0.0898369774222374
587
+ ],
588
+ [
589
+ 0.09896065294742584,
590
+ 0.09475349634885788,
591
+ 0.2322818636894226,
592
+ 0.1889989674091339,
593
+ 0.0007708776392973959,
594
+ 0.09880099445581436
595
+ ],
596
+ [
597
+ 0.10780492424964905,
598
+ 0.10143771767616272,
599
+ 0.25096794962882996,
600
+ 0.20515595376491547,
601
+ 0.0007795444107614458,
602
+ 0.10764006525278091
603
+ ],
604
+ [
605
+ 0.11651723086833954,
606
+ 0.10774324834346771,
607
+ 0.26903823018074036,
608
+ 0.22093604505062103,
609
+ 0.0007895926828496158,
610
+ 0.11634589731693268
611
+ ],
612
+ [
613
+ 0.12510086596012115,
614
+ 0.11369043588638306,
615
+ 0.28652051091194153,
616
+ 0.23635028302669525,
617
+ 0.0008002828690223396,
618
+ 0.124925397336483
619
+ ],
620
+ [
621
+ 0.1335495114326477,
622
+ 0.11929997056722641,
623
+ 0.3034432828426361,
624
+ 0.2514086365699768,
625
+ 0.0008107878966256976,
626
+ 0.1333676427602768
627
+ ],
628
+ [
629
+ 0.1418585479259491,
630
+ 0.124591164290905,
631
+ 0.31983453035354614,
632
+ 0.2661244869232178,
633
+ 0.0008217667927965522,
634
+ 0.14167335629463196
635
+ ],
636
+ [
637
+ 0.1500254124403,
638
+ 0.1295834332704544,
639
+ 0.3357211947441101,
640
+ 0.28050777316093445,
641
+ 0.0008334207232110202,
642
+ 0.14983689785003662
643
+ ],
644
+ [
645
+ 0.15803955495357513,
646
+ 0.1342964768409729,
647
+ 0.351129412651062,
648
+ 0.294569730758667,
649
+ 0.0008444534032605588,
650
+ 0.15784819424152374
651
+ ],
652
+ [
653
+ 0.16589556634426117,
654
+ 0.138750359416008,
655
+ 0.3660843074321747,
656
+ 0.3083218038082123,
657
+ 0.0008554744417779148,
658
+ 0.1657029092311859
659
+ ],
660
+ [
661
+ 0.17359334230422974,
662
+ 0.14296913146972656,
663
+ 0.38061195611953735,
664
+ 0.3217768371105194,
665
+ 0.000866534246597439,
666
+ 0.1733987182378769
667
+ ]
668
+ ],
669
+ "q01": [
670
+ [
671
+ -0.12213177978992462,
672
+ -0.14521412551403046,
673
+ -0.36651915311813354,
674
+ -0.22651121020317078,
675
+ -0.002628536429256201,
676
+ -0.13755188882350922
677
+ ],
678
+ [
679
+ -0.14906743168830872,
680
+ -0.1672179400920868,
681
+ -0.43642017245292664,
682
+ -0.2747143805027008,
683
+ -0.002645096741616726,
684
+ -0.1674933135509491
685
+ ],
686
+ [
687
+ -0.17482531070709229,
688
+ -0.18630193173885345,
689
+ -0.519730806350708,
690
+ -0.32141369581222534,
691
+ -0.0026340961921960115,
692
+ -0.19536428153514862
693
+ ],
694
+ [
695
+ -0.19858603179454803,
696
+ -0.2066028118133545,
697
+ -0.585573136806488,
698
+ -0.36707189679145813,
699
+ -0.002717776456847787,
700
+ -0.2237655073404312
701
+ ],
702
+ [
703
+ -0.22130325436592102,
704
+ -0.22337931394577026,
705
+ -0.6607177257537842,
706
+ -0.40824657678604126,
707
+ -0.0029330539982765913,
708
+ -0.25334563851356506
709
+ ],
710
+ [
711
+ -0.24440711736679077,
712
+ -0.238887757062912,
713
+ -0.7216896414756775,
714
+ -0.4496803879737854,
715
+ -0.0030421495903283358,
716
+ -0.28178611397743225
717
+ ],
718
+ [
719
+ -0.26698970794677734,
720
+ -0.25492310523986816,
721
+ -0.7907676100730896,
722
+ -0.4887317419052124,
723
+ -0.003101882990449667,
724
+ -0.3099566102027893
725
+ ],
726
+ [
727
+ -0.286782830953598,
728
+ -0.27151039242744446,
729
+ -0.8517748713493347,
730
+ -0.5257248282432556,
731
+ -0.003171453485265374,
732
+ -0.3390139937400818
733
+ ],
734
+ [
735
+ -0.30621322989463806,
736
+ -0.2862298786640167,
737
+ -0.9015073776245117,
738
+ -0.5636691451072693,
739
+ -0.0032641314901411533,
740
+ -0.36655768752098083
741
+ ],
742
+ [
743
+ -0.3255496025085449,
744
+ -0.29756152629852295,
745
+ -0.9560237526893616,
746
+ -0.5999890565872192,
747
+ -0.0032778121531009674,
748
+ -0.3943326771259308
749
+ ],
750
+ [
751
+ -0.34466391801834106,
752
+ -0.30887919664382935,
753
+ -1.0073438882827759,
754
+ -0.632552444934845,
755
+ -0.0033038281835615635,
756
+ -0.4224179685115814
757
+ ],
758
+ [
759
+ -0.35855481028556824,
760
+ -0.3250240683555603,
761
+ -1.0543361902236938,
762
+ -0.6657060980796814,
763
+ -0.0033189060632139444,
764
+ -0.448632150888443
765
+ ],
766
+ [
767
+ -0.3737456798553467,
768
+ -0.3364461362361908,
769
+ -1.0995036363601685,
770
+ -0.6994519829750061,
771
+ -0.0033822304103523493,
772
+ -0.47539883852005005
773
+ ],
774
+ [
775
+ -0.3870712220668793,
776
+ -0.3443698287010193,
777
+ -1.1389037370681763,
778
+ -0.7261598706245422,
779
+ -0.003482704982161522,
780
+ -0.5010547041893005
781
+ ],
782
+ [
783
+ -0.3985598683357239,
784
+ -0.35595327615737915,
785
+ -1.1819812059402466,
786
+ -0.7497241497039795,
787
+ -0.0035526324063539505,
788
+ -0.5260051488876343
789
+ ],
790
+ [
791
+ -0.4100184440612793,
792
+ -0.36467358469963074,
793
+ -1.230539083480835,
794
+ -0.7697025537490845,
795
+ -0.003628845326602459,
796
+ -0.5501382946968079
797
+ ]
798
+ ],
799
+ "q99": [
800
+ [
801
+ 0.13778626918792725,
802
+ 0.11720699071884155,
803
+ 0.2617994546890259,
804
+ 0.23129749298095703,
805
+ 0.0021540913730859756,
806
+ 0.12180761247873306
807
+ ],
808
+ [
809
+ 0.16777439415454865,
810
+ 0.1505272388458252,
811
+ 0.3302338719367981,
812
+ 0.2836305797100067,
813
+ 0.002166236750781536,
814
+ 0.14862465858459473
815
+ ],
816
+ [
817
+ 0.19595178961753845,
818
+ 0.18208669126033783,
819
+ 0.3971126675605774,
820
+ 0.336750864982605,
821
+ 0.0021774321794509888,
822
+ 0.1744869202375412
823
+ ],
824
+ [
825
+ 0.22429130971431732,
826
+ 0.21202439069747925,
827
+ 0.45463618636131287,
828
+ 0.38751187920570374,
829
+ 0.002235555090010166,
830
+ 0.19793902337551117
831
+ ],
832
+ [
833
+ 0.2538144588470459,
834
+ 0.23781366646289825,
835
+ 0.5186766982078552,
836
+ 0.43724244832992554,
837
+ 0.0022584283724427223,
838
+ 0.22057458758354187
839
+ ],
840
+ [
841
+ 0.28190404176712036,
842
+ 0.2608570158481598,
843
+ 0.5791972875595093,
844
+ 0.48876842856407166,
845
+ 0.002288524992763996,
846
+ 0.24382244050502777
847
+ ],
848
+ [
849
+ 0.3102819323539734,
850
+ 0.2809824049472809,
851
+ 0.6328328251838684,
852
+ 0.5347740054130554,
853
+ 0.002312292344868183,
854
+ 0.2663334310054779
855
+ ],
856
+ [
857
+ 0.3394824266433716,
858
+ 0.29752638936042786,
859
+ 0.6895572543144226,
860
+ 0.5827977061271667,
861
+ 0.002330307848751545,
862
+ 0.2859741449356079
863
+ ],
864
+ [
865
+ 0.3669600784778595,
866
+ 0.31471166014671326,
867
+ 0.7397019267082214,
868
+ 0.6297330260276794,
869
+ 0.002337755635380745,
870
+ 0.30544596910476685
871
+ ],
872
+ [
873
+ 0.3945035934448242,
874
+ 0.33071205019950867,
875
+ 0.7886773347854614,
876
+ 0.6768563985824585,
877
+ 0.0023598140105605125,
878
+ 0.32461366057395935
879
+ ],
880
+ [
881
+ 0.4227299392223358,
882
+ 0.3485700190067291,
883
+ 0.8316053152084351,
884
+ 0.723706841468811,
885
+ 0.002375778742134571,
886
+ 0.3432371914386749
887
+ ],
888
+ [
889
+ 0.44936659932136536,
890
+ 0.35997745394706726,
891
+ 0.8786941170692444,
892
+ 0.7676846981048584,
893
+ 0.0023923860862851143,
894
+ 0.3572857081890106
895
+ ],
896
+ [
897
+ 0.47607606649398804,
898
+ 0.3778820335865021,
899
+ 0.9260716438293457,
900
+ 0.8119612336158752,
901
+ 0.0024137627333402634,
902
+ 0.37240657210350037
903
+ ],
904
+ [
905
+ 0.501969575881958,
906
+ 0.39211174845695496,
907
+ 0.9603159427642822,
908
+ 0.8552690148353577,
909
+ 0.0024626096710562706,
910
+ 0.38595545291900635
911
+ ],
912
+ [
913
+ 0.5269771218299866,
914
+ 0.4024680256843567,
915
+ 1.0048072338104248,
916
+ 0.899775505065918,
917
+ 0.00252683088183403,
918
+ 0.3976656496524811
919
+ ],
920
+ [
921
+ 0.550702691078186,
922
+ 0.4190630316734314,
923
+ 1.0371341705322266,
924
+ 0.9431969523429871,
925
+ 0.0025539007037878036,
926
+ 0.4088396430015564
927
+ ]
928
+ ]
929
+ }
930
+ }
931
+ }
932
+ }
checkpoint-5000/experiment_cfg/final_model_config.json ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "Gr00tN1d6",
3
+ "model_dtype": "bfloat16",
4
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
5
+ "backbone_model_type": "eagle",
6
+ "model_revision": null,
7
+ "tune_top_llm_layers": 4,
8
+ "backbone_embedding_dim": 2048,
9
+ "tune_llm": false,
10
+ "tune_visual": false,
11
+ "select_layer": 16,
12
+ "reproject_vision": false,
13
+ "use_flash_attention": true,
14
+ "load_bf16": true,
15
+ "collator_overwrite_image_inputs": false,
16
+ "eagle_collator": true,
17
+ "backbone_trainable_params_fp32": true,
18
+ "apply_sincos_state_encoding": true,
19
+ "use_relative_action": true,
20
+ "max_state_dim": 128,
21
+ "max_action_dim": 128,
22
+ "action_horizon": 50,
23
+ "hidden_size": 1024,
24
+ "input_embedding_dim": 1536,
25
+ "add_pos_embed": true,
26
+ "attn_dropout": 0.2,
27
+ "use_vlln": true,
28
+ "max_seq_len": 1024,
29
+ "use_alternate_vl_dit": true,
30
+ "attend_text_every_n_blocks": 2,
31
+ "diffusion_model_cfg": {
32
+ "attention_head_dim": 48,
33
+ "dropout": 0.2,
34
+ "final_dropout": true,
35
+ "interleave_self_attention": true,
36
+ "norm_type": "ada_norm",
37
+ "num_attention_heads": 32,
38
+ "num_layers": 32,
39
+ "output_dim": 1024,
40
+ "positional_embeddings": null
41
+ },
42
+ "num_inference_timesteps": 4,
43
+ "noise_beta_alpha": 1.5,
44
+ "noise_beta_beta": 1.0,
45
+ "noise_s": 0.999,
46
+ "num_timestep_buckets": 1000,
47
+ "tune_projector": true,
48
+ "tune_diffusion_model": true,
49
+ "tune_vlln": true,
50
+ "state_dropout_prob": 0.15,
51
+ "state_additive_noise_scale": 0.0,
52
+ "max_num_embodiments": 32
53
+ }
checkpoint-5000/experiment_cfg/final_processor_config.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-5000/model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9000dbca703190deb360e6d99cbe4cd41fc341cc5c70a2beacc8b160249fbc24
3
+ size 4990126416
checkpoint-5000/model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:304adbff51430cfce2f8796d3ffb6a8b80d0a4dc62df1620386e701e77bdbc3f
3
+ size 4823190320
checkpoint-5000/model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-5000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c37e0506353d8cf16a0b5968dba885377589ed52a73af35321bf9ed4a8aeeec7
3
+ size 12960206949
checkpoint-5000/processor_config.json ADDED
@@ -0,0 +1,455 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "processor_class": "Gr00tN1d6Processor",
3
+ "processor_kwargs": {
4
+ "modality_configs": {
5
+ "behavior_r1_pro": {
6
+ "video": {
7
+ "delta_indices": [
8
+ 0
9
+ ],
10
+ "modality_keys": [
11
+ "observation.images.rgb.head_256_256",
12
+ "observation.images.rgb.left_wrist_256_256",
13
+ "observation.images.rgb.right_wrist_256_256"
14
+ ],
15
+ "sin_cos_embedding_keys": null,
16
+ "mean_std_embedding_keys": null,
17
+ "action_configs": null
18
+ },
19
+ "state": {
20
+ "delta_indices": [
21
+ 0
22
+ ],
23
+ "modality_keys": [
24
+ "robot_pos",
25
+ "robot_ori_cos",
26
+ "robot_ori_sin",
27
+ "robot_2d_ori",
28
+ "robot_2d_ori_cos",
29
+ "robot_2d_ori_sin",
30
+ "robot_lin_vel",
31
+ "robot_ang_vel",
32
+ "arm_left_qpos",
33
+ "arm_left_qpos_sin",
34
+ "arm_left_qpos_cos",
35
+ "eef_left_pos",
36
+ "eef_left_quat",
37
+ "gripper_left_qpos",
38
+ "arm_right_qpos",
39
+ "arm_right_qpos_sin",
40
+ "arm_right_qpos_cos",
41
+ "eef_right_pos",
42
+ "eef_right_quat",
43
+ "gripper_right_qpos",
44
+ "trunk_qpos"
45
+ ],
46
+ "sin_cos_embedding_keys": null,
47
+ "mean_std_embedding_keys": null,
48
+ "action_configs": null
49
+ },
50
+ "action": {
51
+ "delta_indices": [
52
+ 0,
53
+ 1,
54
+ 2,
55
+ 3,
56
+ 4,
57
+ 5,
58
+ 6,
59
+ 7,
60
+ 8,
61
+ 9,
62
+ 10,
63
+ 11,
64
+ 12,
65
+ 13,
66
+ 14,
67
+ 15,
68
+ 16,
69
+ 17,
70
+ 18,
71
+ 19,
72
+ 20,
73
+ 21,
74
+ 22,
75
+ 23,
76
+ 24,
77
+ 25,
78
+ 26,
79
+ 27,
80
+ 28,
81
+ 29,
82
+ 30,
83
+ 31
84
+ ],
85
+ "modality_keys": [
86
+ "base",
87
+ "torso",
88
+ "left_arm",
89
+ "left_gripper",
90
+ "right_arm",
91
+ "right_gripper"
92
+ ],
93
+ "sin_cos_embedding_keys": null,
94
+ "mean_std_embedding_keys": null,
95
+ "action_configs": [
96
+ {
97
+ "rep": "ABSOLUTE",
98
+ "type": "NON_EEF",
99
+ "format": "DEFAULT",
100
+ "state_key": null
101
+ },
102
+ {
103
+ "rep": "RELATIVE",
104
+ "type": "NON_EEF",
105
+ "format": "DEFAULT",
106
+ "state_key": "trunk_qpos"
107
+ },
108
+ {
109
+ "rep": "RELATIVE",
110
+ "type": "NON_EEF",
111
+ "format": "DEFAULT",
112
+ "state_key": "arm_left_qpos"
113
+ },
114
+ {
115
+ "rep": "ABSOLUTE",
116
+ "type": "NON_EEF",
117
+ "format": "DEFAULT",
118
+ "state_key": null
119
+ },
120
+ {
121
+ "rep": "RELATIVE",
122
+ "type": "NON_EEF",
123
+ "format": "DEFAULT",
124
+ "state_key": "arm_right_qpos"
125
+ },
126
+ {
127
+ "rep": "ABSOLUTE",
128
+ "type": "NON_EEF",
129
+ "format": "DEFAULT",
130
+ "state_key": null
131
+ }
132
+ ]
133
+ },
134
+ "language": {
135
+ "delta_indices": [
136
+ 0
137
+ ],
138
+ "modality_keys": [
139
+ "annotation.human.coarse_action"
140
+ ],
141
+ "sin_cos_embedding_keys": null,
142
+ "mean_std_embedding_keys": null,
143
+ "action_configs": null
144
+ }
145
+ },
146
+ "gr1": {
147
+ "video": {
148
+ "delta_indices": [
149
+ 0
150
+ ],
151
+ "modality_keys": [
152
+ "ego_view_bg_crop_pad_res256_freq20"
153
+ ],
154
+ "sin_cos_embedding_keys": null,
155
+ "mean_std_embedding_keys": null,
156
+ "action_configs": null
157
+ },
158
+ "state": {
159
+ "delta_indices": [
160
+ 0
161
+ ],
162
+ "modality_keys": [
163
+ "left_arm",
164
+ "right_arm",
165
+ "left_hand",
166
+ "right_hand",
167
+ "waist"
168
+ ],
169
+ "sin_cos_embedding_keys": [
170
+ "left_arm",
171
+ "right_arm",
172
+ "left_hand",
173
+ "right_hand",
174
+ "waist"
175
+ ],
176
+ "mean_std_embedding_keys": null,
177
+ "action_configs": null
178
+ },
179
+ "action": {
180
+ "delta_indices": [
181
+ 0,
182
+ 1,
183
+ 2,
184
+ 3,
185
+ 4,
186
+ 5,
187
+ 6,
188
+ 7,
189
+ 8,
190
+ 9,
191
+ 10,
192
+ 11,
193
+ 12,
194
+ 13,
195
+ 14,
196
+ 15
197
+ ],
198
+ "modality_keys": [
199
+ "left_arm",
200
+ "right_arm",
201
+ "left_hand",
202
+ "right_hand",
203
+ "waist"
204
+ ],
205
+ "sin_cos_embedding_keys": null,
206
+ "mean_std_embedding_keys": null,
207
+ "action_configs": [
208
+ {
209
+ "rep": "RELATIVE",
210
+ "type": "NON_EEF",
211
+ "format": "DEFAULT",
212
+ "state_key": null
213
+ },
214
+ {
215
+ "rep": "RELATIVE",
216
+ "type": "NON_EEF",
217
+ "format": "DEFAULT",
218
+ "state_key": null
219
+ },
220
+ {
221
+ "rep": "RELATIVE",
222
+ "type": "NON_EEF",
223
+ "format": "DEFAULT",
224
+ "state_key": null
225
+ },
226
+ {
227
+ "rep": "RELATIVE",
228
+ "type": "NON_EEF",
229
+ "format": "DEFAULT",
230
+ "state_key": null
231
+ },
232
+ {
233
+ "rep": "ABSOLUTE",
234
+ "type": "NON_EEF",
235
+ "format": "DEFAULT",
236
+ "state_key": null
237
+ }
238
+ ]
239
+ },
240
+ "language": {
241
+ "delta_indices": [
242
+ 0
243
+ ],
244
+ "modality_keys": [
245
+ "task"
246
+ ],
247
+ "sin_cos_embedding_keys": null,
248
+ "mean_std_embedding_keys": null,
249
+ "action_configs": null
250
+ }
251
+ },
252
+ "robocasa_panda_omron": {
253
+ "video": {
254
+ "delta_indices": [
255
+ 0
256
+ ],
257
+ "modality_keys": [
258
+ "res256_image_side_0",
259
+ "res256_image_side_1",
260
+ "res256_image_wrist_0"
261
+ ],
262
+ "sin_cos_embedding_keys": null,
263
+ "mean_std_embedding_keys": null,
264
+ "action_configs": null
265
+ },
266
+ "state": {
267
+ "delta_indices": [
268
+ 0
269
+ ],
270
+ "modality_keys": [
271
+ "end_effector_position_relative",
272
+ "end_effector_rotation_relative",
273
+ "gripper_qpos",
274
+ "base_position",
275
+ "base_rotation"
276
+ ],
277
+ "sin_cos_embedding_keys": null,
278
+ "mean_std_embedding_keys": null,
279
+ "action_configs": null
280
+ },
281
+ "action": {
282
+ "delta_indices": [
283
+ 0,
284
+ 1,
285
+ 2,
286
+ 3,
287
+ 4,
288
+ 5,
289
+ 6,
290
+ 7,
291
+ 8,
292
+ 9,
293
+ 10,
294
+ 11,
295
+ 12,
296
+ 13,
297
+ 14,
298
+ 15
299
+ ],
300
+ "modality_keys": [
301
+ "end_effector_position",
302
+ "end_effector_rotation",
303
+ "gripper_close",
304
+ "base_motion",
305
+ "control_mode"
306
+ ],
307
+ "sin_cos_embedding_keys": null,
308
+ "mean_std_embedding_keys": null,
309
+ "action_configs": [
310
+ {
311
+ "rep": "ABSOLUTE",
312
+ "type": "NON_EEF",
313
+ "format": "DEFAULT",
314
+ "state_key": null
315
+ },
316
+ {
317
+ "rep": "ABSOLUTE",
318
+ "type": "NON_EEF",
319
+ "format": "DEFAULT",
320
+ "state_key": null
321
+ },
322
+ {
323
+ "rep": "ABSOLUTE",
324
+ "type": "NON_EEF",
325
+ "format": "DEFAULT",
326
+ "state_key": null
327
+ },
328
+ {
329
+ "rep": "ABSOLUTE",
330
+ "type": "NON_EEF",
331
+ "format": "DEFAULT",
332
+ "state_key": null
333
+ },
334
+ {
335
+ "rep": "ABSOLUTE",
336
+ "type": "NON_EEF",
337
+ "format": "DEFAULT",
338
+ "state_key": null
339
+ }
340
+ ]
341
+ },
342
+ "language": {
343
+ "delta_indices": [
344
+ 0
345
+ ],
346
+ "modality_keys": [
347
+ "annotation.human.action.task_description"
348
+ ],
349
+ "sin_cos_embedding_keys": null,
350
+ "mean_std_embedding_keys": null,
351
+ "action_configs": null
352
+ }
353
+ },
354
+ "new_embodiment": {
355
+ "video": {
356
+ "delta_indices": [
357
+ 0
358
+ ],
359
+ "modality_keys": [
360
+ "front",
361
+ "wrist"
362
+ ],
363
+ "sin_cos_embedding_keys": null,
364
+ "mean_std_embedding_keys": null,
365
+ "action_configs": null
366
+ },
367
+ "state": {
368
+ "delta_indices": [
369
+ 0
370
+ ],
371
+ "modality_keys": [
372
+ "single_arm",
373
+ "gripper"
374
+ ],
375
+ "sin_cos_embedding_keys": null,
376
+ "mean_std_embedding_keys": null,
377
+ "action_configs": null
378
+ },
379
+ "action": {
380
+ "delta_indices": [
381
+ 0,
382
+ 1,
383
+ 2,
384
+ 3,
385
+ 4,
386
+ 5,
387
+ 6,
388
+ 7,
389
+ 8,
390
+ 9,
391
+ 10,
392
+ 11,
393
+ 12,
394
+ 13,
395
+ 14,
396
+ 15
397
+ ],
398
+ "modality_keys": [
399
+ "single_arm",
400
+ "gripper"
401
+ ],
402
+ "sin_cos_embedding_keys": null,
403
+ "mean_std_embedding_keys": null,
404
+ "action_configs": [
405
+ {
406
+ "rep": "RELATIVE",
407
+ "type": "NON_EEF",
408
+ "format": "DEFAULT",
409
+ "state_key": null
410
+ },
411
+ {
412
+ "rep": "ABSOLUTE",
413
+ "type": "NON_EEF",
414
+ "format": "DEFAULT",
415
+ "state_key": null
416
+ }
417
+ ]
418
+ },
419
+ "language": {
420
+ "delta_indices": [
421
+ 0
422
+ ],
423
+ "modality_keys": [
424
+ "annotation.human.task_description"
425
+ ],
426
+ "sin_cos_embedding_keys": null,
427
+ "mean_std_embedding_keys": null,
428
+ "action_configs": null
429
+ }
430
+ }
431
+ },
432
+ "image_crop_size": null,
433
+ "image_target_size": null,
434
+ "use_albumentations": true,
435
+ "random_rotation_angle": null,
436
+ "color_jitter_params": {
437
+ "brightness": 0.3,
438
+ "contrast": 0.4,
439
+ "saturation": 0.5,
440
+ "hue": 0.08
441
+ },
442
+ "shortest_image_edge": 256,
443
+ "crop_fraction": 0.95,
444
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
445
+ "model_type": "eagle",
446
+ "formalize_language": true,
447
+ "max_state_dim": 128,
448
+ "max_action_dim": 128,
449
+ "max_action_horizon": 50,
450
+ "use_percentiles": false,
451
+ "clip_outliers": true,
452
+ "apply_sincos_state_encoding": true,
453
+ "use_relative_action": true
454
+ }
455
+ }
checkpoint-5000/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c94b1fc1a851d1e8ac06cebe2a00bd7f820540453eb0a479c22e86a95301f4de
3
+ size 14645
checkpoint-5000/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70be65633883a6aafe329b1781b0415dfcaca277e07b9018fec3efef9dd36027
3
+ size 1465
checkpoint-5000/statistics.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-5000/trainer_state.json ADDED
@@ -0,0 +1,3034 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 1.0,
6
+ "eval_steps": 500,
7
+ "global_step": 5000,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "grad_norm": 2.7266480922698975,
14
+ "learning_rate": 1.8e-06,
15
+ "loss": 1.238,
16
+ "step": 10
17
+ },
18
+ {
19
+ "grad_norm": 1.3996137380599976,
20
+ "learning_rate": 3.8e-06,
21
+ "loss": 1.2263,
22
+ "step": 20
23
+ },
24
+ {
25
+ "grad_norm": 0.6298696398735046,
26
+ "learning_rate": 5.8e-06,
27
+ "loss": 1.1558,
28
+ "step": 30
29
+ },
30
+ {
31
+ "grad_norm": 0.4681908190250397,
32
+ "learning_rate": 7.8e-06,
33
+ "loss": 1.1569,
34
+ "step": 40
35
+ },
36
+ {
37
+ "grad_norm": 0.9008304476737976,
38
+ "learning_rate": 9.800000000000001e-06,
39
+ "loss": 1.1582,
40
+ "step": 50
41
+ },
42
+ {
43
+ "grad_norm": 0.8695996999740601,
44
+ "learning_rate": 1.18e-05,
45
+ "loss": 1.1469,
46
+ "step": 60
47
+ },
48
+ {
49
+ "grad_norm": 0.754650890827179,
50
+ "learning_rate": 1.3800000000000002e-05,
51
+ "loss": 1.0852,
52
+ "step": 70
53
+ },
54
+ {
55
+ "grad_norm": 0.7990859746932983,
56
+ "learning_rate": 1.58e-05,
57
+ "loss": 1.0661,
58
+ "step": 80
59
+ },
60
+ {
61
+ "grad_norm": 0.6180333495140076,
62
+ "learning_rate": 1.78e-05,
63
+ "loss": 1.0627,
64
+ "step": 90
65
+ },
66
+ {
67
+ "grad_norm": 0.46167218685150146,
68
+ "learning_rate": 1.9800000000000004e-05,
69
+ "loss": 1.053,
70
+ "step": 100
71
+ },
72
+ {
73
+ "grad_norm": 0.5125234723091125,
74
+ "learning_rate": 2.18e-05,
75
+ "loss": 1.0584,
76
+ "step": 110
77
+ },
78
+ {
79
+ "grad_norm": 0.615847647190094,
80
+ "learning_rate": 2.38e-05,
81
+ "loss": 1.0547,
82
+ "step": 120
83
+ },
84
+ {
85
+ "grad_norm": 0.7808847427368164,
86
+ "learning_rate": 2.58e-05,
87
+ "loss": 1.0613,
88
+ "step": 130
89
+ },
90
+ {
91
+ "grad_norm": 0.6452605128288269,
92
+ "learning_rate": 2.7800000000000005e-05,
93
+ "loss": 1.0389,
94
+ "step": 140
95
+ },
96
+ {
97
+ "grad_norm": 0.7127711176872253,
98
+ "learning_rate": 2.98e-05,
99
+ "loss": 1.0285,
100
+ "step": 150
101
+ },
102
+ {
103
+ "grad_norm": 1.9395393133163452,
104
+ "learning_rate": 3.18e-05,
105
+ "loss": 0.9987,
106
+ "step": 160
107
+ },
108
+ {
109
+ "grad_norm": 2.0809590816497803,
110
+ "learning_rate": 3.38e-05,
111
+ "loss": 0.9503,
112
+ "step": 170
113
+ },
114
+ {
115
+ "grad_norm": 1.116188406944275,
116
+ "learning_rate": 3.58e-05,
117
+ "loss": 0.8721,
118
+ "step": 180
119
+ },
120
+ {
121
+ "grad_norm": 1.0570509433746338,
122
+ "learning_rate": 3.7800000000000004e-05,
123
+ "loss": 0.8447,
124
+ "step": 190
125
+ },
126
+ {
127
+ "grad_norm": 2.021897077560425,
128
+ "learning_rate": 3.9800000000000005e-05,
129
+ "loss": 0.7972,
130
+ "step": 200
131
+ },
132
+ {
133
+ "grad_norm": 1.9479414224624634,
134
+ "learning_rate": 4.18e-05,
135
+ "loss": 0.7084,
136
+ "step": 210
137
+ },
138
+ {
139
+ "grad_norm": 2.420440912246704,
140
+ "learning_rate": 4.38e-05,
141
+ "loss": 0.638,
142
+ "step": 220
143
+ },
144
+ {
145
+ "grad_norm": 1.9939135313034058,
146
+ "learning_rate": 4.58e-05,
147
+ "loss": 0.5441,
148
+ "step": 230
149
+ },
150
+ {
151
+ "grad_norm": 1.766343116760254,
152
+ "learning_rate": 4.78e-05,
153
+ "loss": 0.4735,
154
+ "step": 240
155
+ },
156
+ {
157
+ "grad_norm": 2.4787240028381348,
158
+ "learning_rate": 4.9800000000000004e-05,
159
+ "loss": 0.3976,
160
+ "step": 250
161
+ },
162
+ {
163
+ "grad_norm": 1.8052730560302734,
164
+ "learning_rate": 4.9999557099392795e-05,
165
+ "loss": 0.2773,
166
+ "step": 260
167
+ },
168
+ {
169
+ "grad_norm": 1.487770915031433,
170
+ "learning_rate": 4.9998026105095405e-05,
171
+ "loss": 0.2167,
172
+ "step": 270
173
+ },
174
+ {
175
+ "grad_norm": 1.126673936843872,
176
+ "learning_rate": 4.9995401616153804e-05,
177
+ "loss": 0.1938,
178
+ "step": 280
179
+ },
180
+ {
181
+ "grad_norm": 1.2377407550811768,
182
+ "learning_rate": 4.9991683747371645e-05,
183
+ "loss": 0.1878,
184
+ "step": 290
185
+ },
186
+ {
187
+ "grad_norm": 2.0436601638793945,
188
+ "learning_rate": 4.9986872661380534e-05,
189
+ "loss": 0.1571,
190
+ "step": 300
191
+ },
192
+ {
193
+ "grad_norm": 1.2251367568969727,
194
+ "learning_rate": 4.998096856863298e-05,
195
+ "loss": 0.1595,
196
+ "step": 310
197
+ },
198
+ {
199
+ "grad_norm": 1.2823742628097534,
200
+ "learning_rate": 4.997397172739312e-05,
201
+ "loss": 0.1464,
202
+ "step": 320
203
+ },
204
+ {
205
+ "grad_norm": 1.0287004709243774,
206
+ "learning_rate": 4.996588244372545e-05,
207
+ "loss": 0.1295,
208
+ "step": 330
209
+ },
210
+ {
211
+ "grad_norm": 1.0611475706100464,
212
+ "learning_rate": 4.995670107148146e-05,
213
+ "loss": 0.1309,
214
+ "step": 340
215
+ },
216
+ {
217
+ "grad_norm": 1.0434561967849731,
218
+ "learning_rate": 4.9946428012284095e-05,
219
+ "loss": 0.1344,
220
+ "step": 350
221
+ },
222
+ {
223
+ "grad_norm": 1.203682780265808,
224
+ "learning_rate": 4.993506371551025e-05,
225
+ "loss": 0.1339,
226
+ "step": 360
227
+ },
228
+ {
229
+ "grad_norm": 0.7937515377998352,
230
+ "learning_rate": 4.992260867827109e-05,
231
+ "loss": 0.1247,
232
+ "step": 370
233
+ },
234
+ {
235
+ "grad_norm": 0.9882832169532776,
236
+ "learning_rate": 4.9909063445390285e-05,
237
+ "loss": 0.1221,
238
+ "step": 380
239
+ },
240
+ {
241
+ "grad_norm": 1.3059258460998535,
242
+ "learning_rate": 4.9894428609380206e-05,
243
+ "loss": 0.1215,
244
+ "step": 390
245
+ },
246
+ {
247
+ "grad_norm": 1.3231853246688843,
248
+ "learning_rate": 4.987870481041599e-05,
249
+ "loss": 0.1257,
250
+ "step": 400
251
+ },
252
+ {
253
+ "grad_norm": 0.7158247828483582,
254
+ "learning_rate": 4.986189273630752e-05,
255
+ "loss": 0.1243,
256
+ "step": 410
257
+ },
258
+ {
259
+ "grad_norm": 1.0682462453842163,
260
+ "learning_rate": 4.9843993122469424e-05,
261
+ "loss": 0.1131,
262
+ "step": 420
263
+ },
264
+ {
265
+ "grad_norm": 0.914338231086731,
266
+ "learning_rate": 4.9825006751888767e-05,
267
+ "loss": 0.1135,
268
+ "step": 430
269
+ },
270
+ {
271
+ "grad_norm": 0.8019906878471375,
272
+ "learning_rate": 4.9804934455090915e-05,
273
+ "loss": 0.1135,
274
+ "step": 440
275
+ },
276
+ {
277
+ "grad_norm": 0.878158450126648,
278
+ "learning_rate": 4.978377711010315e-05,
279
+ "loss": 0.1176,
280
+ "step": 450
281
+ },
282
+ {
283
+ "grad_norm": 1.1396379470825195,
284
+ "learning_rate": 4.976153564241628e-05,
285
+ "loss": 0.1077,
286
+ "step": 460
287
+ },
288
+ {
289
+ "grad_norm": 1.298904538154602,
290
+ "learning_rate": 4.973821102494417e-05,
291
+ "loss": 0.1208,
292
+ "step": 470
293
+ },
294
+ {
295
+ "grad_norm": 0.8515462279319763,
296
+ "learning_rate": 4.971380427798113e-05,
297
+ "loss": 0.1024,
298
+ "step": 480
299
+ },
300
+ {
301
+ "grad_norm": 0.8240450620651245,
302
+ "learning_rate": 4.9688316469157354e-05,
303
+ "loss": 0.1018,
304
+ "step": 490
305
+ },
306
+ {
307
+ "grad_norm": 0.6559143662452698,
308
+ "learning_rate": 4.9661748713392165e-05,
309
+ "loss": 0.0972,
310
+ "step": 500
311
+ },
312
+ {
313
+ "grad_norm": 0.9851711392402649,
314
+ "learning_rate": 4.963410217284526e-05,
315
+ "loss": 0.113,
316
+ "step": 510
317
+ },
318
+ {
319
+ "grad_norm": 0.8339484333992004,
320
+ "learning_rate": 4.960537805686589e-05,
321
+ "loss": 0.0973,
322
+ "step": 520
323
+ },
324
+ {
325
+ "grad_norm": 0.8457871675491333,
326
+ "learning_rate": 4.957557762193994e-05,
327
+ "loss": 0.101,
328
+ "step": 530
329
+ },
330
+ {
331
+ "grad_norm": 0.9261676669120789,
332
+ "learning_rate": 4.954470217163498e-05,
333
+ "loss": 0.0894,
334
+ "step": 540
335
+ },
336
+ {
337
+ "grad_norm": 0.8262922763824463,
338
+ "learning_rate": 4.9512753056543226e-05,
339
+ "loss": 0.0825,
340
+ "step": 550
341
+ },
342
+ {
343
+ "grad_norm": 0.6502310633659363,
344
+ "learning_rate": 4.947973167422247e-05,
345
+ "loss": 0.0876,
346
+ "step": 560
347
+ },
348
+ {
349
+ "grad_norm": 0.7397481203079224,
350
+ "learning_rate": 4.9445639469134944e-05,
351
+ "loss": 0.0768,
352
+ "step": 570
353
+ },
354
+ {
355
+ "grad_norm": 0.7882953882217407,
356
+ "learning_rate": 4.941047793258416e-05,
357
+ "loss": 0.0969,
358
+ "step": 580
359
+ },
360
+ {
361
+ "grad_norm": 0.79180508852005,
362
+ "learning_rate": 4.937424860264961e-05,
363
+ "loss": 0.108,
364
+ "step": 590
365
+ },
366
+ {
367
+ "grad_norm": 0.7894780039787292,
368
+ "learning_rate": 4.933695306411957e-05,
369
+ "loss": 0.097,
370
+ "step": 600
371
+ },
372
+ {
373
+ "grad_norm": 0.8765780925750732,
374
+ "learning_rate": 4.929859294842172e-05,
375
+ "loss": 0.1013,
376
+ "step": 610
377
+ },
378
+ {
379
+ "grad_norm": 0.9128709435462952,
380
+ "learning_rate": 4.9259169933551765e-05,
381
+ "loss": 0.0854,
382
+ "step": 620
383
+ },
384
+ {
385
+ "grad_norm": 0.6108020544052124,
386
+ "learning_rate": 4.921868574400011e-05,
387
+ "loss": 0.0809,
388
+ "step": 630
389
+ },
390
+ {
391
+ "grad_norm": 0.7296820878982544,
392
+ "learning_rate": 4.9177142150676355e-05,
393
+ "loss": 0.0858,
394
+ "step": 640
395
+ },
396
+ {
397
+ "grad_norm": 0.8388088345527649,
398
+ "learning_rate": 4.913454097083185e-05,
399
+ "loss": 0.0974,
400
+ "step": 650
401
+ },
402
+ {
403
+ "grad_norm": 0.920002818107605,
404
+ "learning_rate": 4.9090884067980205e-05,
405
+ "loss": 0.0857,
406
+ "step": 660
407
+ },
408
+ {
409
+ "grad_norm": 0.9557753205299377,
410
+ "learning_rate": 4.9046173351815796e-05,
411
+ "loss": 0.1021,
412
+ "step": 670
413
+ },
414
+ {
415
+ "grad_norm": 1.0099128484725952,
416
+ "learning_rate": 4.900041077813017e-05,
417
+ "loss": 0.0937,
418
+ "step": 680
419
+ },
420
+ {
421
+ "grad_norm": 0.7957805395126343,
422
+ "learning_rate": 4.895359834872656e-05,
423
+ "loss": 0.0919,
424
+ "step": 690
425
+ },
426
+ {
427
+ "grad_norm": 0.5897656083106995,
428
+ "learning_rate": 4.8905738111332275e-05,
429
+ "loss": 0.0868,
430
+ "step": 700
431
+ },
432
+ {
433
+ "grad_norm": 0.82470703125,
434
+ "learning_rate": 4.8856832159509156e-05,
435
+ "loss": 0.0897,
436
+ "step": 710
437
+ },
438
+ {
439
+ "grad_norm": 0.5583815574645996,
440
+ "learning_rate": 4.880688263256197e-05,
441
+ "loss": 0.0831,
442
+ "step": 720
443
+ },
444
+ {
445
+ "grad_norm": 0.5602760910987854,
446
+ "learning_rate": 4.8755891715444814e-05,
447
+ "loss": 0.0864,
448
+ "step": 730
449
+ },
450
+ {
451
+ "grad_norm": 0.6645472645759583,
452
+ "learning_rate": 4.870386163866561e-05,
453
+ "loss": 0.0785,
454
+ "step": 740
455
+ },
456
+ {
457
+ "grad_norm": 0.4997585117816925,
458
+ "learning_rate": 4.8650794678188485e-05,
459
+ "loss": 0.0736,
460
+ "step": 750
461
+ },
462
+ {
463
+ "grad_norm": 0.6175997853279114,
464
+ "learning_rate": 4.859669315533417e-05,
465
+ "loss": 0.0802,
466
+ "step": 760
467
+ },
468
+ {
469
+ "grad_norm": 0.6164193749427795,
470
+ "learning_rate": 4.8541559436678563e-05,
471
+ "loss": 0.0741,
472
+ "step": 770
473
+ },
474
+ {
475
+ "grad_norm": 0.692690908908844,
476
+ "learning_rate": 4.8485395933949114e-05,
477
+ "loss": 0.0803,
478
+ "step": 780
479
+ },
480
+ {
481
+ "grad_norm": 0.7447015047073364,
482
+ "learning_rate": 4.842820510391938e-05,
483
+ "loss": 0.0747,
484
+ "step": 790
485
+ },
486
+ {
487
+ "grad_norm": 0.9005197882652283,
488
+ "learning_rate": 4.836998944830155e-05,
489
+ "loss": 0.0859,
490
+ "step": 800
491
+ },
492
+ {
493
+ "grad_norm": 0.6014283895492554,
494
+ "learning_rate": 4.8310751513636975e-05,
495
+ "loss": 0.0847,
496
+ "step": 810
497
+ },
498
+ {
499
+ "grad_norm": 0.5599387884140015,
500
+ "learning_rate": 4.825049389118484e-05,
501
+ "loss": 0.0709,
502
+ "step": 820
503
+ },
504
+ {
505
+ "grad_norm": 0.6468709111213684,
506
+ "learning_rate": 4.818921921680874e-05,
507
+ "loss": 0.0887,
508
+ "step": 830
509
+ },
510
+ {
511
+ "grad_norm": 0.6334129571914673,
512
+ "learning_rate": 4.812693017086145e-05,
513
+ "loss": 0.0689,
514
+ "step": 840
515
+ },
516
+ {
517
+ "grad_norm": 0.6896155476570129,
518
+ "learning_rate": 4.806362947806763e-05,
519
+ "loss": 0.0839,
520
+ "step": 850
521
+ },
522
+ {
523
+ "grad_norm": 0.8341414928436279,
524
+ "learning_rate": 4.799931990740463e-05,
525
+ "loss": 0.0785,
526
+ "step": 860
527
+ },
528
+ {
529
+ "grad_norm": 0.5337378978729248,
530
+ "learning_rate": 4.7934004271981415e-05,
531
+ "loss": 0.0769,
532
+ "step": 870
533
+ },
534
+ {
535
+ "grad_norm": 0.7976155877113342,
536
+ "learning_rate": 4.786768542891548e-05,
537
+ "loss": 0.0738,
538
+ "step": 880
539
+ },
540
+ {
541
+ "grad_norm": 0.3165757358074188,
542
+ "learning_rate": 4.7800366279207854e-05,
543
+ "loss": 0.0713,
544
+ "step": 890
545
+ },
546
+ {
547
+ "grad_norm": 0.7630752325057983,
548
+ "learning_rate": 4.773204976761623e-05,
549
+ "loss": 0.0719,
550
+ "step": 900
551
+ },
552
+ {
553
+ "grad_norm": 0.6145244836807251,
554
+ "learning_rate": 4.7662738882526146e-05,
555
+ "loss": 0.0644,
556
+ "step": 910
557
+ },
558
+ {
559
+ "grad_norm": 0.6122027635574341,
560
+ "learning_rate": 4.759243665582024e-05,
561
+ "loss": 0.0728,
562
+ "step": 920
563
+ },
564
+ {
565
+ "grad_norm": 0.4458109736442566,
566
+ "learning_rate": 4.752114616274567e-05,
567
+ "loss": 0.0678,
568
+ "step": 930
569
+ },
570
+ {
571
+ "grad_norm": 0.6862826347351074,
572
+ "learning_rate": 4.744887052177954e-05,
573
+ "loss": 0.0694,
574
+ "step": 940
575
+ },
576
+ {
577
+ "grad_norm": 0.5472699403762817,
578
+ "learning_rate": 4.7375612894492536e-05,
579
+ "loss": 0.0739,
580
+ "step": 950
581
+ },
582
+ {
583
+ "grad_norm": 0.6469587087631226,
584
+ "learning_rate": 4.7301376485410596e-05,
585
+ "loss": 0.0612,
586
+ "step": 960
587
+ },
588
+ {
589
+ "grad_norm": 0.5633054971694946,
590
+ "learning_rate": 4.722616454187474e-05,
591
+ "loss": 0.0752,
592
+ "step": 970
593
+ },
594
+ {
595
+ "grad_norm": 0.611199140548706,
596
+ "learning_rate": 4.714998035389904e-05,
597
+ "loss": 0.0682,
598
+ "step": 980
599
+ },
600
+ {
601
+ "grad_norm": 0.6113159656524658,
602
+ "learning_rate": 4.7072827254026666e-05,
603
+ "loss": 0.0734,
604
+ "step": 990
605
+ },
606
+ {
607
+ "grad_norm": 0.5616899728775024,
608
+ "learning_rate": 4.6994708617184155e-05,
609
+ "loss": 0.0647,
610
+ "step": 1000
611
+ },
612
+ {
613
+ "grad_norm": 0.5405145883560181,
614
+ "learning_rate": 4.691562786053376e-05,
615
+ "loss": 0.0652,
616
+ "step": 1010
617
+ },
618
+ {
619
+ "grad_norm": 0.5287688374519348,
620
+ "learning_rate": 4.6835588443323956e-05,
621
+ "loss": 0.071,
622
+ "step": 1020
623
+ },
624
+ {
625
+ "grad_norm": 0.6897308230400085,
626
+ "learning_rate": 4.675459386673815e-05,
627
+ "loss": 0.0711,
628
+ "step": 1030
629
+ },
630
+ {
631
+ "grad_norm": 0.43904393911361694,
632
+ "learning_rate": 4.6672647673741485e-05,
633
+ "loss": 0.0762,
634
+ "step": 1040
635
+ },
636
+ {
637
+ "grad_norm": 0.502697765827179,
638
+ "learning_rate": 4.658975344892594e-05,
639
+ "loss": 0.0892,
640
+ "step": 1050
641
+ },
642
+ {
643
+ "grad_norm": 0.718237042427063,
644
+ "learning_rate": 4.650591481835344e-05,
645
+ "loss": 0.0862,
646
+ "step": 1060
647
+ },
648
+ {
649
+ "grad_norm": 0.570436954498291,
650
+ "learning_rate": 4.642113544939728e-05,
651
+ "loss": 0.07,
652
+ "step": 1070
653
+ },
654
+ {
655
+ "grad_norm": 0.4335796535015106,
656
+ "learning_rate": 4.63354190505817e-05,
657
+ "loss": 0.0811,
658
+ "step": 1080
659
+ },
660
+ {
661
+ "grad_norm": 0.6726382374763489,
662
+ "learning_rate": 4.6248769371419684e-05,
663
+ "loss": 0.0675,
664
+ "step": 1090
665
+ },
666
+ {
667
+ "grad_norm": 0.5062233805656433,
668
+ "learning_rate": 4.6161190202248897e-05,
669
+ "loss": 0.064,
670
+ "step": 1100
671
+ },
672
+ {
673
+ "grad_norm": 0.3789091408252716,
674
+ "learning_rate": 4.607268537406591e-05,
675
+ "loss": 0.0706,
676
+ "step": 1110
677
+ },
678
+ {
679
+ "grad_norm": 0.5326701402664185,
680
+ "learning_rate": 4.598325875835862e-05,
681
+ "loss": 0.071,
682
+ "step": 1120
683
+ },
684
+ {
685
+ "grad_norm": 0.5220073461532593,
686
+ "learning_rate": 4.589291426693692e-05,
687
+ "loss": 0.0727,
688
+ "step": 1130
689
+ },
690
+ {
691
+ "grad_norm": 0.5300417542457581,
692
+ "learning_rate": 4.580165585176152e-05,
693
+ "loss": 0.0678,
694
+ "step": 1140
695
+ },
696
+ {
697
+ "grad_norm": 0.524254560470581,
698
+ "learning_rate": 4.570948750477114e-05,
699
+ "loss": 0.0652,
700
+ "step": 1150
701
+ },
702
+ {
703
+ "grad_norm": 0.5178232192993164,
704
+ "learning_rate": 4.561641325770788e-05,
705
+ "loss": 0.0636,
706
+ "step": 1160
707
+ },
708
+ {
709
+ "grad_norm": 0.35104331374168396,
710
+ "learning_rate": 4.5522437181940804e-05,
711
+ "loss": 0.0624,
712
+ "step": 1170
713
+ },
714
+ {
715
+ "grad_norm": 0.5118323564529419,
716
+ "learning_rate": 4.542756338828791e-05,
717
+ "loss": 0.0622,
718
+ "step": 1180
719
+ },
720
+ {
721
+ "grad_norm": 0.4421655535697937,
722
+ "learning_rate": 4.533179602683629e-05,
723
+ "loss": 0.0629,
724
+ "step": 1190
725
+ },
726
+ {
727
+ "grad_norm": 0.7161966562271118,
728
+ "learning_rate": 4.523513928676056e-05,
729
+ "loss": 0.0599,
730
+ "step": 1200
731
+ },
732
+ {
733
+ "grad_norm": 0.4908861219882965,
734
+ "learning_rate": 4.5137597396139676e-05,
735
+ "loss": 0.0653,
736
+ "step": 1210
737
+ },
738
+ {
739
+ "grad_norm": 1.035172939300537,
740
+ "learning_rate": 4.503917462177192e-05,
741
+ "loss": 0.0592,
742
+ "step": 1220
743
+ },
744
+ {
745
+ "grad_norm": 0.6242174506187439,
746
+ "learning_rate": 4.4939875268988273e-05,
747
+ "loss": 0.0679,
748
+ "step": 1230
749
+ },
750
+ {
751
+ "grad_norm": 0.34626179933547974,
752
+ "learning_rate": 4.483970368146413e-05,
753
+ "loss": 0.0608,
754
+ "step": 1240
755
+ },
756
+ {
757
+ "grad_norm": 0.41088080406188965,
758
+ "learning_rate": 4.473866424102923e-05,
759
+ "loss": 0.0715,
760
+ "step": 1250
761
+ },
762
+ {
763
+ "grad_norm": 0.4913835823535919,
764
+ "learning_rate": 4.463676136747602e-05,
765
+ "loss": 0.0519,
766
+ "step": 1260
767
+ },
768
+ {
769
+ "grad_norm": 0.39666661620140076,
770
+ "learning_rate": 4.453399951836632e-05,
771
+ "loss": 0.0559,
772
+ "step": 1270
773
+ },
774
+ {
775
+ "grad_norm": 0.5405796766281128,
776
+ "learning_rate": 4.44303831888363e-05,
777
+ "loss": 0.0645,
778
+ "step": 1280
779
+ },
780
+ {
781
+ "grad_norm": 0.6450210809707642,
782
+ "learning_rate": 4.432591691139989e-05,
783
+ "loss": 0.0692,
784
+ "step": 1290
785
+ },
786
+ {
787
+ "grad_norm": 0.6847130656242371,
788
+ "learning_rate": 4.422060525575048e-05,
789
+ "loss": 0.0665,
790
+ "step": 1300
791
+ },
792
+ {
793
+ "grad_norm": 0.5179506540298462,
794
+ "learning_rate": 4.411445282856106e-05,
795
+ "loss": 0.0612,
796
+ "step": 1310
797
+ },
798
+ {
799
+ "grad_norm": 0.76016765832901,
800
+ "learning_rate": 4.400746427328268e-05,
801
+ "loss": 0.0618,
802
+ "step": 1320
803
+ },
804
+ {
805
+ "grad_norm": 0.522050678730011,
806
+ "learning_rate": 4.389964426994134e-05,
807
+ "loss": 0.0632,
808
+ "step": 1330
809
+ },
810
+ {
811
+ "grad_norm": 0.5314463973045349,
812
+ "learning_rate": 4.3790997534933276e-05,
813
+ "loss": 0.0628,
814
+ "step": 1340
815
+ },
816
+ {
817
+ "grad_norm": 0.4170549213886261,
818
+ "learning_rate": 4.368152882081865e-05,
819
+ "loss": 0.0595,
820
+ "step": 1350
821
+ },
822
+ {
823
+ "grad_norm": 0.5747459530830383,
824
+ "learning_rate": 4.357124291611363e-05,
825
+ "loss": 0.0549,
826
+ "step": 1360
827
+ },
828
+ {
829
+ "grad_norm": 0.5837365388870239,
830
+ "learning_rate": 4.346014464508098e-05,
831
+ "loss": 0.0519,
832
+ "step": 1370
833
+ },
834
+ {
835
+ "grad_norm": 0.35218408703804016,
836
+ "learning_rate": 4.3348238867518985e-05,
837
+ "loss": 0.06,
838
+ "step": 1380
839
+ },
840
+ {
841
+ "grad_norm": 0.40569043159484863,
842
+ "learning_rate": 4.323553047854887e-05,
843
+ "loss": 0.0484,
844
+ "step": 1390
845
+ },
846
+ {
847
+ "grad_norm": 0.5539340972900391,
848
+ "learning_rate": 4.3122024408400693e-05,
849
+ "loss": 0.0496,
850
+ "step": 1400
851
+ },
852
+ {
853
+ "grad_norm": 0.33733201026916504,
854
+ "learning_rate": 4.3007725622197674e-05,
855
+ "loss": 0.0508,
856
+ "step": 1410
857
+ },
858
+ {
859
+ "grad_norm": 0.5494152903556824,
860
+ "learning_rate": 4.2892639119739e-05,
861
+ "loss": 0.0621,
862
+ "step": 1420
863
+ },
864
+ {
865
+ "grad_norm": 0.39040982723236084,
866
+ "learning_rate": 4.277676993528112e-05,
867
+ "loss": 0.0528,
868
+ "step": 1430
869
+ },
870
+ {
871
+ "grad_norm": 0.5634658932685852,
872
+ "learning_rate": 4.2660123137317523e-05,
873
+ "loss": 0.0586,
874
+ "step": 1440
875
+ },
876
+ {
877
+ "grad_norm": 0.5504993796348572,
878
+ "learning_rate": 4.254270382835703e-05,
879
+ "loss": 0.0617,
880
+ "step": 1450
881
+ },
882
+ {
883
+ "grad_norm": 0.3419093191623688,
884
+ "learning_rate": 4.2424517144700603e-05,
885
+ "loss": 0.0573,
886
+ "step": 1460
887
+ },
888
+ {
889
+ "grad_norm": 0.3770234286785126,
890
+ "learning_rate": 4.230556825621667e-05,
891
+ "loss": 0.0552,
892
+ "step": 1470
893
+ },
894
+ {
895
+ "grad_norm": 0.5088812708854675,
896
+ "learning_rate": 4.2185862366114936e-05,
897
+ "loss": 0.061,
898
+ "step": 1480
899
+ },
900
+ {
901
+ "grad_norm": 0.5062453746795654,
902
+ "learning_rate": 4.2065404710718834e-05,
903
+ "loss": 0.0528,
904
+ "step": 1490
905
+ },
906
+ {
907
+ "grad_norm": 0.7702981233596802,
908
+ "learning_rate": 4.194420055923644e-05,
909
+ "loss": 0.0637,
910
+ "step": 1500
911
+ },
912
+ {
913
+ "grad_norm": 0.6036869287490845,
914
+ "learning_rate": 4.182225521352999e-05,
915
+ "loss": 0.0702,
916
+ "step": 1510
917
+ },
918
+ {
919
+ "grad_norm": 0.5008228421211243,
920
+ "learning_rate": 4.169957400788395e-05,
921
+ "loss": 0.0624,
922
+ "step": 1520
923
+ },
924
+ {
925
+ "grad_norm": 0.41124141216278076,
926
+ "learning_rate": 4.157616230877169e-05,
927
+ "loss": 0.0563,
928
+ "step": 1530
929
+ },
930
+ {
931
+ "grad_norm": 0.7010630369186401,
932
+ "learning_rate": 4.145202551462072e-05,
933
+ "loss": 0.062,
934
+ "step": 1540
935
+ },
936
+ {
937
+ "grad_norm": 0.4738198220729828,
938
+ "learning_rate": 4.132716905557658e-05,
939
+ "loss": 0.0636,
940
+ "step": 1550
941
+ },
942
+ {
943
+ "grad_norm": 0.5558097958564758,
944
+ "learning_rate": 4.1201598393265244e-05,
945
+ "loss": 0.0627,
946
+ "step": 1560
947
+ },
948
+ {
949
+ "grad_norm": 0.4446842074394226,
950
+ "learning_rate": 4.1075319020554286e-05,
951
+ "loss": 0.0577,
952
+ "step": 1570
953
+ },
954
+ {
955
+ "grad_norm": 0.476675808429718,
956
+ "learning_rate": 4.094833646131256e-05,
957
+ "loss": 0.0544,
958
+ "step": 1580
959
+ },
960
+ {
961
+ "grad_norm": 0.4960286617279053,
962
+ "learning_rate": 4.082065627016858e-05,
963
+ "loss": 0.0644,
964
+ "step": 1590
965
+ },
966
+ {
967
+ "grad_norm": 0.46870744228363037,
968
+ "learning_rate": 4.0692284032267516e-05,
969
+ "loss": 0.054,
970
+ "step": 1600
971
+ },
972
+ {
973
+ "grad_norm": 0.7339263558387756,
974
+ "learning_rate": 4.056322536302693e-05,
975
+ "loss": 0.0552,
976
+ "step": 1610
977
+ },
978
+ {
979
+ "grad_norm": 0.3929803669452667,
980
+ "learning_rate": 4.043348590789111e-05,
981
+ "loss": 0.0554,
982
+ "step": 1620
983
+ },
984
+ {
985
+ "grad_norm": 0.4788963198661804,
986
+ "learning_rate": 4.030307134208411e-05,
987
+ "loss": 0.052,
988
+ "step": 1630
989
+ },
990
+ {
991
+ "grad_norm": 0.4371449649333954,
992
+ "learning_rate": 4.017198737036154e-05,
993
+ "loss": 0.0531,
994
+ "step": 1640
995
+ },
996
+ {
997
+ "grad_norm": 0.4106438159942627,
998
+ "learning_rate": 4.004023972676097e-05,
999
+ "loss": 0.0569,
1000
+ "step": 1650
1001
+ },
1002
+ {
1003
+ "grad_norm": 0.3421051800251007,
1004
+ "learning_rate": 3.9907834174351125e-05,
1005
+ "loss": 0.0509,
1006
+ "step": 1660
1007
+ },
1008
+ {
1009
+ "grad_norm": 0.45882418751716614,
1010
+ "learning_rate": 3.9774776504979805e-05,
1011
+ "loss": 0.058,
1012
+ "step": 1670
1013
+ },
1014
+ {
1015
+ "grad_norm": 0.5227372646331787,
1016
+ "learning_rate": 3.964107253902052e-05,
1017
+ "loss": 0.0552,
1018
+ "step": 1680
1019
+ },
1020
+ {
1021
+ "grad_norm": 0.567558228969574,
1022
+ "learning_rate": 3.950672812511788e-05,
1023
+ "loss": 0.0617,
1024
+ "step": 1690
1025
+ },
1026
+ {
1027
+ "grad_norm": 0.6489816904067993,
1028
+ "learning_rate": 3.937174913993177e-05,
1029
+ "loss": 0.0563,
1030
+ "step": 1700
1031
+ },
1032
+ {
1033
+ "grad_norm": 0.4380536377429962,
1034
+ "learning_rate": 3.9236141487880265e-05,
1035
+ "loss": 0.0508,
1036
+ "step": 1710
1037
+ },
1038
+ {
1039
+ "grad_norm": 0.5422831177711487,
1040
+ "learning_rate": 3.909991110088138e-05,
1041
+ "loss": 0.0541,
1042
+ "step": 1720
1043
+ },
1044
+ {
1045
+ "grad_norm": 0.7260904908180237,
1046
+ "learning_rate": 3.896306393809357e-05,
1047
+ "loss": 0.0563,
1048
+ "step": 1730
1049
+ },
1050
+ {
1051
+ "grad_norm": 0.4155614972114563,
1052
+ "learning_rate": 3.882560598565504e-05,
1053
+ "loss": 0.0552,
1054
+ "step": 1740
1055
+ },
1056
+ {
1057
+ "grad_norm": 0.35693034529685974,
1058
+ "learning_rate": 3.8687543256421955e-05,
1059
+ "loss": 0.0521,
1060
+ "step": 1750
1061
+ },
1062
+ {
1063
+ "grad_norm": 0.591141402721405,
1064
+ "learning_rate": 3.8548881789705345e-05,
1065
+ "loss": 0.0571,
1066
+ "step": 1760
1067
+ },
1068
+ {
1069
+ "grad_norm": 0.5429609417915344,
1070
+ "learning_rate": 3.840962765100696e-05,
1071
+ "loss": 0.0575,
1072
+ "step": 1770
1073
+ },
1074
+ {
1075
+ "grad_norm": 0.4284355938434601,
1076
+ "learning_rate": 3.826978693175395e-05,
1077
+ "loss": 0.0547,
1078
+ "step": 1780
1079
+ },
1080
+ {
1081
+ "grad_norm": 0.720148503780365,
1082
+ "learning_rate": 3.81293657490324e-05,
1083
+ "loss": 0.0575,
1084
+ "step": 1790
1085
+ },
1086
+ {
1087
+ "grad_norm": 0.49093666672706604,
1088
+ "learning_rate": 3.798837024531974e-05,
1089
+ "loss": 0.0513,
1090
+ "step": 1800
1091
+ },
1092
+ {
1093
+ "grad_norm": 0.5715184211730957,
1094
+ "learning_rate": 3.7846806588216055e-05,
1095
+ "loss": 0.0571,
1096
+ "step": 1810
1097
+ },
1098
+ {
1099
+ "grad_norm": 0.45693865418434143,
1100
+ "learning_rate": 3.770468097017432e-05,
1101
+ "loss": 0.0481,
1102
+ "step": 1820
1103
+ },
1104
+ {
1105
+ "grad_norm": 0.49179983139038086,
1106
+ "learning_rate": 3.7561999608229505e-05,
1107
+ "loss": 0.0528,
1108
+ "step": 1830
1109
+ },
1110
+ {
1111
+ "grad_norm": 0.4709620177745819,
1112
+ "learning_rate": 3.741876874372659e-05,
1113
+ "loss": 0.0501,
1114
+ "step": 1840
1115
+ },
1116
+ {
1117
+ "grad_norm": 0.4550098776817322,
1118
+ "learning_rate": 3.727499464204758e-05,
1119
+ "loss": 0.0493,
1120
+ "step": 1850
1121
+ },
1122
+ {
1123
+ "grad_norm": 0.4054962396621704,
1124
+ "learning_rate": 3.7130683592337465e-05,
1125
+ "loss": 0.0476,
1126
+ "step": 1860
1127
+ },
1128
+ {
1129
+ "grad_norm": 0.541397750377655,
1130
+ "learning_rate": 3.698584190722906e-05,
1131
+ "loss": 0.0534,
1132
+ "step": 1870
1133
+ },
1134
+ {
1135
+ "grad_norm": 0.36921900510787964,
1136
+ "learning_rate": 3.6840475922566886e-05,
1137
+ "loss": 0.0478,
1138
+ "step": 1880
1139
+ },
1140
+ {
1141
+ "grad_norm": 0.5922922492027283,
1142
+ "learning_rate": 3.6694591997130026e-05,
1143
+ "loss": 0.0501,
1144
+ "step": 1890
1145
+ },
1146
+ {
1147
+ "grad_norm": 0.43542882800102234,
1148
+ "learning_rate": 3.654819651235401e-05,
1149
+ "loss": 0.0541,
1150
+ "step": 1900
1151
+ },
1152
+ {
1153
+ "grad_norm": 0.48189231753349304,
1154
+ "learning_rate": 3.640129587205156e-05,
1155
+ "loss": 0.0521,
1156
+ "step": 1910
1157
+ },
1158
+ {
1159
+ "grad_norm": 0.4395929276943207,
1160
+ "learning_rate": 3.625389650213259e-05,
1161
+ "loss": 0.0429,
1162
+ "step": 1920
1163
+ },
1164
+ {
1165
+ "grad_norm": 0.5689699649810791,
1166
+ "learning_rate": 3.610600485032305e-05,
1167
+ "loss": 0.0586,
1168
+ "step": 1930
1169
+ },
1170
+ {
1171
+ "grad_norm": 0.5108771920204163,
1172
+ "learning_rate": 3.5957627385882884e-05,
1173
+ "loss": 0.0523,
1174
+ "step": 1940
1175
+ },
1176
+ {
1177
+ "grad_norm": 0.5463844537734985,
1178
+ "learning_rate": 3.580877059932308e-05,
1179
+ "loss": 0.0449,
1180
+ "step": 1950
1181
+ },
1182
+ {
1183
+ "grad_norm": 0.3828030526638031,
1184
+ "learning_rate": 3.5659441002121694e-05,
1185
+ "loss": 0.0509,
1186
+ "step": 1960
1187
+ },
1188
+ {
1189
+ "grad_norm": 0.3314559757709503,
1190
+ "learning_rate": 3.550964512643908e-05,
1191
+ "loss": 0.0435,
1192
+ "step": 1970
1193
+ },
1194
+ {
1195
+ "grad_norm": 0.8163153529167175,
1196
+ "learning_rate": 3.535938952483211e-05,
1197
+ "loss": 0.0558,
1198
+ "step": 1980
1199
+ },
1200
+ {
1201
+ "grad_norm": 0.7200665473937988,
1202
+ "learning_rate": 3.520868076996755e-05,
1203
+ "loss": 0.0432,
1204
+ "step": 1990
1205
+ },
1206
+ {
1207
+ "grad_norm": 0.47182565927505493,
1208
+ "learning_rate": 3.5057525454334564e-05,
1209
+ "loss": 0.0455,
1210
+ "step": 2000
1211
+ },
1212
+ {
1213
+ "grad_norm": 0.5063982009887695,
1214
+ "learning_rate": 3.490593018995636e-05,
1215
+ "loss": 0.0446,
1216
+ "step": 2010
1217
+ },
1218
+ {
1219
+ "grad_norm": 0.44255322217941284,
1220
+ "learning_rate": 3.475390160810087e-05,
1221
+ "loss": 0.0434,
1222
+ "step": 2020
1223
+ },
1224
+ {
1225
+ "grad_norm": 0.4013705849647522,
1226
+ "learning_rate": 3.460144635899079e-05,
1227
+ "loss": 0.0501,
1228
+ "step": 2030
1229
+ },
1230
+ {
1231
+ "grad_norm": 0.5221493244171143,
1232
+ "learning_rate": 3.444857111151259e-05,
1233
+ "loss": 0.0547,
1234
+ "step": 2040
1235
+ },
1236
+ {
1237
+ "grad_norm": 0.4845060110092163,
1238
+ "learning_rate": 3.429528255292485e-05,
1239
+ "loss": 0.0497,
1240
+ "step": 2050
1241
+ },
1242
+ {
1243
+ "grad_norm": 0.4617994725704193,
1244
+ "learning_rate": 3.41415873885657e-05,
1245
+ "loss": 0.0489,
1246
+ "step": 2060
1247
+ },
1248
+ {
1249
+ "grad_norm": 0.4810671806335449,
1250
+ "learning_rate": 3.3987492341559535e-05,
1251
+ "loss": 0.0478,
1252
+ "step": 2070
1253
+ },
1254
+ {
1255
+ "grad_norm": 0.5026255249977112,
1256
+ "learning_rate": 3.383300415252292e-05,
1257
+ "loss": 0.0446,
1258
+ "step": 2080
1259
+ },
1260
+ {
1261
+ "grad_norm": 0.477425754070282,
1262
+ "learning_rate": 3.367812957926971e-05,
1263
+ "loss": 0.0517,
1264
+ "step": 2090
1265
+ },
1266
+ {
1267
+ "grad_norm": 0.3495548367500305,
1268
+ "learning_rate": 3.352287539651545e-05,
1269
+ "loss": 0.0456,
1270
+ "step": 2100
1271
+ },
1272
+ {
1273
+ "grad_norm": 0.45665979385375977,
1274
+ "learning_rate": 3.3367248395581076e-05,
1275
+ "loss": 0.046,
1276
+ "step": 2110
1277
+ },
1278
+ {
1279
+ "grad_norm": 0.41686445474624634,
1280
+ "learning_rate": 3.321125538409574e-05,
1281
+ "loss": 0.0486,
1282
+ "step": 2120
1283
+ },
1284
+ {
1285
+ "grad_norm": 0.3617282211780548,
1286
+ "learning_rate": 3.3054903185699135e-05,
1287
+ "loss": 0.0476,
1288
+ "step": 2130
1289
+ },
1290
+ {
1291
+ "grad_norm": 0.47553274035453796,
1292
+ "learning_rate": 3.2898198639742915e-05,
1293
+ "loss": 0.0432,
1294
+ "step": 2140
1295
+ },
1296
+ {
1297
+ "grad_norm": 0.3067774176597595,
1298
+ "learning_rate": 3.2741148600991576e-05,
1299
+ "loss": 0.0522,
1300
+ "step": 2150
1301
+ },
1302
+ {
1303
+ "grad_norm": 0.5735144019126892,
1304
+ "learning_rate": 3.258375993932259e-05,
1305
+ "loss": 0.0476,
1306
+ "step": 2160
1307
+ },
1308
+ {
1309
+ "grad_norm": 0.2728676497936249,
1310
+ "learning_rate": 3.2426039539425876e-05,
1311
+ "loss": 0.0414,
1312
+ "step": 2170
1313
+ },
1314
+ {
1315
+ "grad_norm": 0.6051283478736877,
1316
+ "learning_rate": 3.226799430050268e-05,
1317
+ "loss": 0.0499,
1318
+ "step": 2180
1319
+ },
1320
+ {
1321
+ "grad_norm": 0.5630646347999573,
1322
+ "learning_rate": 3.210963113596374e-05,
1323
+ "loss": 0.0418,
1324
+ "step": 2190
1325
+ },
1326
+ {
1327
+ "grad_norm": 0.4311167001724243,
1328
+ "learning_rate": 3.1950956973126906e-05,
1329
+ "loss": 0.0499,
1330
+ "step": 2200
1331
+ },
1332
+ {
1333
+ "grad_norm": 0.4380161166191101,
1334
+ "learning_rate": 3.1791978752914085e-05,
1335
+ "loss": 0.0401,
1336
+ "step": 2210
1337
+ },
1338
+ {
1339
+ "grad_norm": 0.43494531512260437,
1340
+ "learning_rate": 3.163270342954766e-05,
1341
+ "loss": 0.0469,
1342
+ "step": 2220
1343
+ },
1344
+ {
1345
+ "grad_norm": 0.5626083612442017,
1346
+ "learning_rate": 3.1473137970246246e-05,
1347
+ "loss": 0.049,
1348
+ "step": 2230
1349
+ },
1350
+ {
1351
+ "grad_norm": 0.4352441132068634,
1352
+ "learning_rate": 3.1313289354919945e-05,
1353
+ "loss": 0.0459,
1354
+ "step": 2240
1355
+ },
1356
+ {
1357
+ "grad_norm": 0.48047247529029846,
1358
+ "learning_rate": 3.1153164575865046e-05,
1359
+ "loss": 0.0459,
1360
+ "step": 2250
1361
+ },
1362
+ {
1363
+ "grad_norm": 0.6736582517623901,
1364
+ "learning_rate": 3.099277063745811e-05,
1365
+ "loss": 0.0539,
1366
+ "step": 2260
1367
+ },
1368
+ {
1369
+ "grad_norm": 0.40036192536354065,
1370
+ "learning_rate": 3.0832114555849614e-05,
1371
+ "loss": 0.0438,
1372
+ "step": 2270
1373
+ },
1374
+ {
1375
+ "grad_norm": 0.42229387164115906,
1376
+ "learning_rate": 3.0671203358657e-05,
1377
+ "loss": 0.0413,
1378
+ "step": 2280
1379
+ },
1380
+ {
1381
+ "grad_norm": 0.3298429250717163,
1382
+ "learning_rate": 3.051004408465733e-05,
1383
+ "loss": 0.04,
1384
+ "step": 2290
1385
+ },
1386
+ {
1387
+ "grad_norm": 0.43710318207740784,
1388
+ "learning_rate": 3.034864378347933e-05,
1389
+ "loss": 0.0454,
1390
+ "step": 2300
1391
+ },
1392
+ {
1393
+ "grad_norm": 0.4662761390209198,
1394
+ "learning_rate": 3.018700951529504e-05,
1395
+ "loss": 0.0521,
1396
+ "step": 2310
1397
+ },
1398
+ {
1399
+ "grad_norm": 0.5804249048233032,
1400
+ "learning_rate": 3.0025148350510974e-05,
1401
+ "loss": 0.0475,
1402
+ "step": 2320
1403
+ },
1404
+ {
1405
+ "grad_norm": 0.4282180070877075,
1406
+ "learning_rate": 2.986306736945883e-05,
1407
+ "loss": 0.0466,
1408
+ "step": 2330
1409
+ },
1410
+ {
1411
+ "grad_norm": 0.45659002661705017,
1412
+ "learning_rate": 2.970077366208579e-05,
1413
+ "loss": 0.0387,
1414
+ "step": 2340
1415
+ },
1416
+ {
1417
+ "grad_norm": 0.5479471683502197,
1418
+ "learning_rate": 2.953827432764438e-05,
1419
+ "loss": 0.0461,
1420
+ "step": 2350
1421
+ },
1422
+ {
1423
+ "grad_norm": 0.31041985750198364,
1424
+ "learning_rate": 2.9375576474381905e-05,
1425
+ "loss": 0.042,
1426
+ "step": 2360
1427
+ },
1428
+ {
1429
+ "grad_norm": 0.42949941754341125,
1430
+ "learning_rate": 2.921268721922954e-05,
1431
+ "loss": 0.0435,
1432
+ "step": 2370
1433
+ },
1434
+ {
1435
+ "grad_norm": 0.4704861044883728,
1436
+ "learning_rate": 2.904961368749099e-05,
1437
+ "loss": 0.0447,
1438
+ "step": 2380
1439
+ },
1440
+ {
1441
+ "grad_norm": 0.4041045606136322,
1442
+ "learning_rate": 2.8886363012530826e-05,
1443
+ "loss": 0.0429,
1444
+ "step": 2390
1445
+ },
1446
+ {
1447
+ "grad_norm": 0.3385079503059387,
1448
+ "learning_rate": 2.8722942335462415e-05,
1449
+ "loss": 0.0454,
1450
+ "step": 2400
1451
+ },
1452
+ {
1453
+ "grad_norm": 0.5993208289146423,
1454
+ "learning_rate": 2.8559358804835597e-05,
1455
+ "loss": 0.0426,
1456
+ "step": 2410
1457
+ },
1458
+ {
1459
+ "grad_norm": 0.36963415145874023,
1460
+ "learning_rate": 2.839561957632393e-05,
1461
+ "loss": 0.0515,
1462
+ "step": 2420
1463
+ },
1464
+ {
1465
+ "grad_norm": 0.5569792985916138,
1466
+ "learning_rate": 2.823173181241171e-05,
1467
+ "loss": 0.0484,
1468
+ "step": 2430
1469
+ },
1470
+ {
1471
+ "grad_norm": 0.4478709101676941,
1472
+ "learning_rate": 2.806770268208066e-05,
1473
+ "loss": 0.0442,
1474
+ "step": 2440
1475
+ },
1476
+ {
1477
+ "grad_norm": 0.39773526787757874,
1478
+ "learning_rate": 2.7903539360496323e-05,
1479
+ "loss": 0.0362,
1480
+ "step": 2450
1481
+ },
1482
+ {
1483
+ "grad_norm": 0.4185701906681061,
1484
+ "learning_rate": 2.773924902869418e-05,
1485
+ "loss": 0.046,
1486
+ "step": 2460
1487
+ },
1488
+ {
1489
+ "grad_norm": 0.43949025869369507,
1490
+ "learning_rate": 2.757483887326559e-05,
1491
+ "loss": 0.0433,
1492
+ "step": 2470
1493
+ },
1494
+ {
1495
+ "grad_norm": 0.4299829602241516,
1496
+ "learning_rate": 2.741031608604337e-05,
1497
+ "loss": 0.0394,
1498
+ "step": 2480
1499
+ },
1500
+ {
1501
+ "grad_norm": 0.27871155738830566,
1502
+ "learning_rate": 2.7245687863787195e-05,
1503
+ "loss": 0.0367,
1504
+ "step": 2490
1505
+ },
1506
+ {
1507
+ "grad_norm": 0.4810972511768341,
1508
+ "learning_rate": 2.7080961407868848e-05,
1509
+ "loss": 0.0428,
1510
+ "step": 2500
1511
+ },
1512
+ {
1513
+ "grad_norm": 0.3548348546028137,
1514
+ "learning_rate": 2.6916143923957138e-05,
1515
+ "loss": 0.0435,
1516
+ "step": 2510
1517
+ },
1518
+ {
1519
+ "grad_norm": 0.3431377410888672,
1520
+ "learning_rate": 2.675124262170275e-05,
1521
+ "loss": 0.0336,
1522
+ "step": 2520
1523
+ },
1524
+ {
1525
+ "grad_norm": 0.4408491551876068,
1526
+ "learning_rate": 2.6586264714422836e-05,
1527
+ "loss": 0.0404,
1528
+ "step": 2530
1529
+ },
1530
+ {
1531
+ "grad_norm": 1.0779521465301514,
1532
+ "learning_rate": 2.6421217418785544e-05,
1533
+ "loss": 0.0424,
1534
+ "step": 2540
1535
+ },
1536
+ {
1537
+ "grad_norm": 0.40511152148246765,
1538
+ "learning_rate": 2.6256107954494242e-05,
1539
+ "loss": 0.0476,
1540
+ "step": 2550
1541
+ },
1542
+ {
1543
+ "grad_norm": 0.36247146129608154,
1544
+ "learning_rate": 2.6090943543971784e-05,
1545
+ "loss": 0.0436,
1546
+ "step": 2560
1547
+ },
1548
+ {
1549
+ "grad_norm": 0.3747636079788208,
1550
+ "learning_rate": 2.592573141204455e-05,
1551
+ "loss": 0.0404,
1552
+ "step": 2570
1553
+ },
1554
+ {
1555
+ "grad_norm": 0.5357540249824524,
1556
+ "learning_rate": 2.5760478785626397e-05,
1557
+ "loss": 0.0444,
1558
+ "step": 2580
1559
+ },
1560
+ {
1561
+ "grad_norm": 0.3767753839492798,
1562
+ "learning_rate": 2.5595192893402553e-05,
1563
+ "loss": 0.0397,
1564
+ "step": 2590
1565
+ },
1566
+ {
1567
+ "grad_norm": 0.3285132944583893,
1568
+ "learning_rate": 2.5429880965513386e-05,
1569
+ "loss": 0.0381,
1570
+ "step": 2600
1571
+ },
1572
+ {
1573
+ "grad_norm": 0.4897662401199341,
1574
+ "learning_rate": 2.526455023323817e-05,
1575
+ "loss": 0.039,
1576
+ "step": 2610
1577
+ },
1578
+ {
1579
+ "grad_norm": 0.4508710205554962,
1580
+ "learning_rate": 2.5099207928678732e-05,
1581
+ "loss": 0.0395,
1582
+ "step": 2620
1583
+ },
1584
+ {
1585
+ "grad_norm": 0.3298162519931793,
1586
+ "learning_rate": 2.4933861284443112e-05,
1587
+ "loss": 0.0413,
1588
+ "step": 2630
1589
+ },
1590
+ {
1591
+ "grad_norm": 0.42930713295936584,
1592
+ "learning_rate": 2.4768517533329157e-05,
1593
+ "loss": 0.0461,
1594
+ "step": 2640
1595
+ },
1596
+ {
1597
+ "grad_norm": 0.43155762553215027,
1598
+ "learning_rate": 2.460318390800819e-05,
1599
+ "loss": 0.0453,
1600
+ "step": 2650
1601
+ },
1602
+ {
1603
+ "grad_norm": 0.3605857789516449,
1604
+ "learning_rate": 2.44378676407086e-05,
1605
+ "loss": 0.0445,
1606
+ "step": 2660
1607
+ },
1608
+ {
1609
+ "grad_norm": 0.2702181041240692,
1610
+ "learning_rate": 2.4272575962899462e-05,
1611
+ "loss": 0.0421,
1612
+ "step": 2670
1613
+ },
1614
+ {
1615
+ "grad_norm": 0.3844555616378784,
1616
+ "learning_rate": 2.410731610497424e-05,
1617
+ "loss": 0.0418,
1618
+ "step": 2680
1619
+ },
1620
+ {
1621
+ "grad_norm": 0.4364534914493561,
1622
+ "learning_rate": 2.3942095295934476e-05,
1623
+ "loss": 0.0379,
1624
+ "step": 2690
1625
+ },
1626
+ {
1627
+ "grad_norm": 0.33137261867523193,
1628
+ "learning_rate": 2.3776920763073602e-05,
1629
+ "loss": 0.0422,
1630
+ "step": 2700
1631
+ },
1632
+ {
1633
+ "grad_norm": 0.2672342360019684,
1634
+ "learning_rate": 2.361179973166078e-05,
1635
+ "loss": 0.0424,
1636
+ "step": 2710
1637
+ },
1638
+ {
1639
+ "grad_norm": 0.34315600991249084,
1640
+ "learning_rate": 2.3446739424624827e-05,
1641
+ "loss": 0.0411,
1642
+ "step": 2720
1643
+ },
1644
+ {
1645
+ "grad_norm": 0.4923914670944214,
1646
+ "learning_rate": 2.328174706223832e-05,
1647
+ "loss": 0.0439,
1648
+ "step": 2730
1649
+ },
1650
+ {
1651
+ "grad_norm": 0.26800429821014404,
1652
+ "learning_rate": 2.3116829861801686e-05,
1653
+ "loss": 0.0391,
1654
+ "step": 2740
1655
+ },
1656
+ {
1657
+ "grad_norm": 0.29833143949508667,
1658
+ "learning_rate": 2.2951995037327515e-05,
1659
+ "loss": 0.0397,
1660
+ "step": 2750
1661
+ },
1662
+ {
1663
+ "grad_norm": 0.3327856957912445,
1664
+ "learning_rate": 2.2787249799225024e-05,
1665
+ "loss": 0.0381,
1666
+ "step": 2760
1667
+ },
1668
+ {
1669
+ "grad_norm": 0.46502891182899475,
1670
+ "learning_rate": 2.2622601353984635e-05,
1671
+ "loss": 0.0411,
1672
+ "step": 2770
1673
+ },
1674
+ {
1675
+ "grad_norm": 0.40785571932792664,
1676
+ "learning_rate": 2.2458056903862726e-05,
1677
+ "loss": 0.0379,
1678
+ "step": 2780
1679
+ },
1680
+ {
1681
+ "grad_norm": 0.3968541622161865,
1682
+ "learning_rate": 2.229362364656659e-05,
1683
+ "loss": 0.0429,
1684
+ "step": 2790
1685
+ },
1686
+ {
1687
+ "grad_norm": 0.40930506587028503,
1688
+ "learning_rate": 2.21293087749396e-05,
1689
+ "loss": 0.0374,
1690
+ "step": 2800
1691
+ },
1692
+ {
1693
+ "grad_norm": 0.4295065701007843,
1694
+ "learning_rate": 2.1965119476646547e-05,
1695
+ "loss": 0.0366,
1696
+ "step": 2810
1697
+ },
1698
+ {
1699
+ "grad_norm": 0.4438641667366028,
1700
+ "learning_rate": 2.1801062933859235e-05,
1701
+ "loss": 0.0378,
1702
+ "step": 2820
1703
+ },
1704
+ {
1705
+ "grad_norm": 0.3975362181663513,
1706
+ "learning_rate": 2.1637146322942315e-05,
1707
+ "loss": 0.036,
1708
+ "step": 2830
1709
+ },
1710
+ {
1711
+ "grad_norm": 0.44547799229621887,
1712
+ "learning_rate": 2.1473376814139362e-05,
1713
+ "loss": 0.0395,
1714
+ "step": 2840
1715
+ },
1716
+ {
1717
+ "grad_norm": 0.4006638526916504,
1718
+ "learning_rate": 2.1309761571259237e-05,
1719
+ "loss": 0.0367,
1720
+ "step": 2850
1721
+ },
1722
+ {
1723
+ "grad_norm": 0.27414795756340027,
1724
+ "learning_rate": 2.1146307751362694e-05,
1725
+ "loss": 0.0312,
1726
+ "step": 2860
1727
+ },
1728
+ {
1729
+ "grad_norm": 0.4664889872074127,
1730
+ "learning_rate": 2.098302250444934e-05,
1731
+ "loss": 0.0413,
1732
+ "step": 2870
1733
+ },
1734
+ {
1735
+ "grad_norm": 0.19164593517780304,
1736
+ "learning_rate": 2.0819912973144843e-05,
1737
+ "loss": 0.0345,
1738
+ "step": 2880
1739
+ },
1740
+ {
1741
+ "grad_norm": 0.33589157462120056,
1742
+ "learning_rate": 2.065698629238851e-05,
1743
+ "loss": 0.0355,
1744
+ "step": 2890
1745
+ },
1746
+ {
1747
+ "grad_norm": 0.33917805552482605,
1748
+ "learning_rate": 2.0494249589121157e-05,
1749
+ "loss": 0.0393,
1750
+ "step": 2900
1751
+ },
1752
+ {
1753
+ "grad_norm": 0.32117098569869995,
1754
+ "learning_rate": 2.033170998197339e-05,
1755
+ "loss": 0.0448,
1756
+ "step": 2910
1757
+ },
1758
+ {
1759
+ "grad_norm": 0.6140998005867004,
1760
+ "learning_rate": 2.0169374580954165e-05,
1761
+ "loss": 0.0378,
1762
+ "step": 2920
1763
+ },
1764
+ {
1765
+ "grad_norm": 0.5331240296363831,
1766
+ "learning_rate": 2.000725048713983e-05,
1767
+ "loss": 0.0365,
1768
+ "step": 2930
1769
+ },
1770
+ {
1771
+ "grad_norm": 0.3481861352920532,
1772
+ "learning_rate": 1.9845344792363447e-05,
1773
+ "loss": 0.0356,
1774
+ "step": 2940
1775
+ },
1776
+ {
1777
+ "grad_norm": 0.5170403718948364,
1778
+ "learning_rate": 1.9683664578904614e-05,
1779
+ "loss": 0.0403,
1780
+ "step": 2950
1781
+ },
1782
+ {
1783
+ "grad_norm": 0.31584399938583374,
1784
+ "learning_rate": 1.9522216919179644e-05,
1785
+ "loss": 0.0404,
1786
+ "step": 2960
1787
+ },
1788
+ {
1789
+ "grad_norm": 0.3115321099758148,
1790
+ "learning_rate": 1.9361008875432185e-05,
1791
+ "loss": 0.0358,
1792
+ "step": 2970
1793
+ },
1794
+ {
1795
+ "grad_norm": 0.338223397731781,
1796
+ "learning_rate": 1.9200047499424308e-05,
1797
+ "loss": 0.0331,
1798
+ "step": 2980
1799
+ },
1800
+ {
1801
+ "grad_norm": 0.48482340574264526,
1802
+ "learning_rate": 1.9039339832128057e-05,
1803
+ "loss": 0.0347,
1804
+ "step": 2990
1805
+ },
1806
+ {
1807
+ "grad_norm": 0.4181440770626068,
1808
+ "learning_rate": 1.8878892903417404e-05,
1809
+ "loss": 0.0389,
1810
+ "step": 3000
1811
+ },
1812
+ {
1813
+ "grad_norm": 0.42534828186035156,
1814
+ "learning_rate": 1.871871373176078e-05,
1815
+ "loss": 0.0392,
1816
+ "step": 3010
1817
+ },
1818
+ {
1819
+ "grad_norm": 0.5645197629928589,
1820
+ "learning_rate": 1.8558809323914083e-05,
1821
+ "loss": 0.0461,
1822
+ "step": 3020
1823
+ },
1824
+ {
1825
+ "grad_norm": 0.36499112844467163,
1826
+ "learning_rate": 1.8399186674614126e-05,
1827
+ "loss": 0.0343,
1828
+ "step": 3030
1829
+ },
1830
+ {
1831
+ "grad_norm": 0.2742806673049927,
1832
+ "learning_rate": 1.823985276627269e-05,
1833
+ "loss": 0.0283,
1834
+ "step": 3040
1835
+ },
1836
+ {
1837
+ "grad_norm": 0.39008432626724243,
1838
+ "learning_rate": 1.80808145686711e-05,
1839
+ "loss": 0.0374,
1840
+ "step": 3050
1841
+ },
1842
+ {
1843
+ "grad_norm": 0.36456918716430664,
1844
+ "learning_rate": 1.7922079038655326e-05,
1845
+ "loss": 0.037,
1846
+ "step": 3060
1847
+ },
1848
+ {
1849
+ "grad_norm": 0.2564813792705536,
1850
+ "learning_rate": 1.7763653119831684e-05,
1851
+ "loss": 0.0374,
1852
+ "step": 3070
1853
+ },
1854
+ {
1855
+ "grad_norm": 0.4312773048877716,
1856
+ "learning_rate": 1.7605543742263087e-05,
1857
+ "loss": 0.0353,
1858
+ "step": 3080
1859
+ },
1860
+ {
1861
+ "grad_norm": 0.30969807505607605,
1862
+ "learning_rate": 1.744775782216593e-05,
1863
+ "loss": 0.0339,
1864
+ "step": 3090
1865
+ },
1866
+ {
1867
+ "grad_norm": 0.3753385543823242,
1868
+ "learning_rate": 1.7290302261607503e-05,
1869
+ "loss": 0.0323,
1870
+ "step": 3100
1871
+ },
1872
+ {
1873
+ "grad_norm": 0.3404577672481537,
1874
+ "learning_rate": 1.7133183948204108e-05,
1875
+ "loss": 0.0346,
1876
+ "step": 3110
1877
+ },
1878
+ {
1879
+ "grad_norm": 0.33649688959121704,
1880
+ "learning_rate": 1.6976409754819767e-05,
1881
+ "loss": 0.0332,
1882
+ "step": 3120
1883
+ },
1884
+ {
1885
+ "grad_norm": 0.7442240715026855,
1886
+ "learning_rate": 1.6819986539265582e-05,
1887
+ "loss": 0.0392,
1888
+ "step": 3130
1889
+ },
1890
+ {
1891
+ "grad_norm": 0.3342534899711609,
1892
+ "learning_rate": 1.6663921143999733e-05,
1893
+ "loss": 0.0368,
1894
+ "step": 3140
1895
+ },
1896
+ {
1897
+ "grad_norm": 0.32587477564811707,
1898
+ "learning_rate": 1.650822039582819e-05,
1899
+ "loss": 0.0318,
1900
+ "step": 3150
1901
+ },
1902
+ {
1903
+ "grad_norm": 0.5487452149391174,
1904
+ "learning_rate": 1.63528911056061e-05,
1905
+ "loss": 0.0376,
1906
+ "step": 3160
1907
+ },
1908
+ {
1909
+ "grad_norm": 0.5345733165740967,
1910
+ "learning_rate": 1.619794006793979e-05,
1911
+ "loss": 0.0386,
1912
+ "step": 3170
1913
+ },
1914
+ {
1915
+ "grad_norm": 0.3318815231323242,
1916
+ "learning_rate": 1.604337406088963e-05,
1917
+ "loss": 0.0308,
1918
+ "step": 3180
1919
+ },
1920
+ {
1921
+ "grad_norm": 0.41096043586730957,
1922
+ "learning_rate": 1.588919984567349e-05,
1923
+ "loss": 0.036,
1924
+ "step": 3190
1925
+ },
1926
+ {
1927
+ "grad_norm": 0.49638691544532776,
1928
+ "learning_rate": 1.5735424166371e-05,
1929
+ "loss": 0.0404,
1930
+ "step": 3200
1931
+ },
1932
+ {
1933
+ "grad_norm": 0.38568755984306335,
1934
+ "learning_rate": 1.558205374962854e-05,
1935
+ "loss": 0.033,
1936
+ "step": 3210
1937
+ },
1938
+ {
1939
+ "grad_norm": 0.34658241271972656,
1940
+ "learning_rate": 1.5429095304364976e-05,
1941
+ "loss": 0.0327,
1942
+ "step": 3220
1943
+ },
1944
+ {
1945
+ "grad_norm": 0.33020010590553284,
1946
+ "learning_rate": 1.527655552147824e-05,
1947
+ "loss": 0.0373,
1948
+ "step": 3230
1949
+ },
1950
+ {
1951
+ "grad_norm": 0.5657230615615845,
1952
+ "learning_rate": 1.5124441073552585e-05,
1953
+ "loss": 0.0354,
1954
+ "step": 3240
1955
+ },
1956
+ {
1957
+ "grad_norm": 0.3239688277244568,
1958
+ "learning_rate": 1.4972758614566746e-05,
1959
+ "loss": 0.0295,
1960
+ "step": 3250
1961
+ },
1962
+ {
1963
+ "grad_norm": 0.387555330991745,
1964
+ "learning_rate": 1.4821514779602864e-05,
1965
+ "loss": 0.0436,
1966
+ "step": 3260
1967
+ },
1968
+ {
1969
+ "grad_norm": 0.3232133388519287,
1970
+ "learning_rate": 1.467071618455624e-05,
1971
+ "loss": 0.0322,
1972
+ "step": 3270
1973
+ },
1974
+ {
1975
+ "grad_norm": 0.2886604964733124,
1976
+ "learning_rate": 1.452036942584595e-05,
1977
+ "loss": 0.0304,
1978
+ "step": 3280
1979
+ },
1980
+ {
1981
+ "grad_norm": 0.2882493734359741,
1982
+ "learning_rate": 1.4370481080126248e-05,
1983
+ "loss": 0.0314,
1984
+ "step": 3290
1985
+ },
1986
+ {
1987
+ "grad_norm": 0.4715385138988495,
1988
+ "learning_rate": 1.4221057703998985e-05,
1989
+ "loss": 0.0334,
1990
+ "step": 3300
1991
+ },
1992
+ {
1993
+ "grad_norm": 0.3316683769226074,
1994
+ "learning_rate": 1.4072105833726684e-05,
1995
+ "loss": 0.0351,
1996
+ "step": 3310
1997
+ },
1998
+ {
1999
+ "grad_norm": 0.3624657988548279,
2000
+ "learning_rate": 1.3923631984946672e-05,
2001
+ "loss": 0.035,
2002
+ "step": 3320
2003
+ },
2004
+ {
2005
+ "grad_norm": 0.36212462186813354,
2006
+ "learning_rate": 1.3775642652386103e-05,
2007
+ "loss": 0.0301,
2008
+ "step": 3330
2009
+ },
2010
+ {
2011
+ "grad_norm": 0.36848610639572144,
2012
+ "learning_rate": 1.3628144309577784e-05,
2013
+ "loss": 0.0324,
2014
+ "step": 3340
2015
+ },
2016
+ {
2017
+ "grad_norm": 0.4272776246070862,
2018
+ "learning_rate": 1.3481143408577079e-05,
2019
+ "loss": 0.0373,
2020
+ "step": 3350
2021
+ },
2022
+ {
2023
+ "grad_norm": 0.37170878052711487,
2024
+ "learning_rate": 1.3334646379679583e-05,
2025
+ "loss": 0.033,
2026
+ "step": 3360
2027
+ },
2028
+ {
2029
+ "grad_norm": 0.48944494128227234,
2030
+ "learning_rate": 1.3188659631139966e-05,
2031
+ "loss": 0.0414,
2032
+ "step": 3370
2033
+ },
2034
+ {
2035
+ "grad_norm": 0.3089650869369507,
2036
+ "learning_rate": 1.3043189548891516e-05,
2037
+ "loss": 0.0338,
2038
+ "step": 3380
2039
+ },
2040
+ {
2041
+ "grad_norm": 0.3926386535167694,
2042
+ "learning_rate": 1.2898242496266884e-05,
2043
+ "loss": 0.0351,
2044
+ "step": 3390
2045
+ },
2046
+ {
2047
+ "grad_norm": 0.40642455220222473,
2048
+ "learning_rate": 1.2753824813719733e-05,
2049
+ "loss": 0.0412,
2050
+ "step": 3400
2051
+ },
2052
+ {
2053
+ "grad_norm": 0.35056406259536743,
2054
+ "learning_rate": 1.2609942818547327e-05,
2055
+ "loss": 0.035,
2056
+ "step": 3410
2057
+ },
2058
+ {
2059
+ "grad_norm": 0.2923920750617981,
2060
+ "learning_rate": 1.2466602804614266e-05,
2061
+ "loss": 0.035,
2062
+ "step": 3420
2063
+ },
2064
+ {
2065
+ "grad_norm": 0.9390926957130432,
2066
+ "learning_rate": 1.2323811042077096e-05,
2067
+ "loss": 0.0298,
2068
+ "step": 3430
2069
+ },
2070
+ {
2071
+ "grad_norm": 0.5153149366378784,
2072
+ "learning_rate": 1.2181573777110106e-05,
2073
+ "loss": 0.0376,
2074
+ "step": 3440
2075
+ },
2076
+ {
2077
+ "grad_norm": 0.2597624659538269,
2078
+ "learning_rate": 1.2039897231632055e-05,
2079
+ "loss": 0.0333,
2080
+ "step": 3450
2081
+ },
2082
+ {
2083
+ "grad_norm": 0.36722615361213684,
2084
+ "learning_rate": 1.1898787603033995e-05,
2085
+ "loss": 0.038,
2086
+ "step": 3460
2087
+ },
2088
+ {
2089
+ "grad_norm": 0.23120303452014923,
2090
+ "learning_rate": 1.1758251063908227e-05,
2091
+ "loss": 0.0305,
2092
+ "step": 3470
2093
+ },
2094
+ {
2095
+ "grad_norm": 0.4411832094192505,
2096
+ "learning_rate": 1.1618293761778235e-05,
2097
+ "loss": 0.0305,
2098
+ "step": 3480
2099
+ },
2100
+ {
2101
+ "grad_norm": 0.36204567551612854,
2102
+ "learning_rate": 1.1478921818829827e-05,
2103
+ "loss": 0.0325,
2104
+ "step": 3490
2105
+ },
2106
+ {
2107
+ "grad_norm": 0.38650524616241455,
2108
+ "learning_rate": 1.1340141331643276e-05,
2109
+ "loss": 0.037,
2110
+ "step": 3500
2111
+ },
2112
+ {
2113
+ "grad_norm": 0.29249370098114014,
2114
+ "learning_rate": 1.1201958370926682e-05,
2115
+ "loss": 0.0304,
2116
+ "step": 3510
2117
+ },
2118
+ {
2119
+ "grad_norm": 0.3050512969493866,
2120
+ "learning_rate": 1.1064378981250409e-05,
2121
+ "loss": 0.0322,
2122
+ "step": 3520
2123
+ },
2124
+ {
2125
+ "grad_norm": 0.36122196912765503,
2126
+ "learning_rate": 1.0927409180782638e-05,
2127
+ "loss": 0.0325,
2128
+ "step": 3530
2129
+ },
2130
+ {
2131
+ "grad_norm": 0.3820047974586487,
2132
+ "learning_rate": 1.0791054961026182e-05,
2133
+ "loss": 0.0361,
2134
+ "step": 3540
2135
+ },
2136
+ {
2137
+ "grad_norm": 0.3520725965499878,
2138
+ "learning_rate": 1.0655322286556318e-05,
2139
+ "loss": 0.0333,
2140
+ "step": 3550
2141
+ },
2142
+ {
2143
+ "grad_norm": 0.3393506705760956,
2144
+ "learning_rate": 1.0520217094759962e-05,
2145
+ "loss": 0.0352,
2146
+ "step": 3560
2147
+ },
2148
+ {
2149
+ "grad_norm": 0.3986015021800995,
2150
+ "learning_rate": 1.0385745295575866e-05,
2151
+ "loss": 0.0331,
2152
+ "step": 3570
2153
+ },
2154
+ {
2155
+ "grad_norm": 0.3583716154098511,
2156
+ "learning_rate": 1.0251912771236159e-05,
2157
+ "loss": 0.0319,
2158
+ "step": 3580
2159
+ },
2160
+ {
2161
+ "grad_norm": 0.27882295846939087,
2162
+ "learning_rate": 1.0118725376009025e-05,
2163
+ "loss": 0.0341,
2164
+ "step": 3590
2165
+ },
2166
+ {
2167
+ "grad_norm": 0.32304292917251587,
2168
+ "learning_rate": 9.986188935942579e-06,
2169
+ "loss": 0.0291,
2170
+ "step": 3600
2171
+ },
2172
+ {
2173
+ "grad_norm": 0.5138395428657532,
2174
+ "learning_rate": 9.854309248610085e-06,
2175
+ "loss": 0.0313,
2176
+ "step": 3610
2177
+ },
2178
+ {
2179
+ "grad_norm": 0.31992360949516296,
2180
+ "learning_rate": 9.723092082856294e-06,
2181
+ "loss": 0.0305,
2182
+ "step": 3620
2183
+ },
2184
+ {
2185
+ "grad_norm": 0.2782381772994995,
2186
+ "learning_rate": 9.592543178545107e-06,
2187
+ "loss": 0.029,
2188
+ "step": 3630
2189
+ },
2190
+ {
2191
+ "grad_norm": 0.27642911672592163,
2192
+ "learning_rate": 9.462668246308529e-06,
2193
+ "loss": 0.0329,
2194
+ "step": 3640
2195
+ },
2196
+ {
2197
+ "grad_norm": 0.33659425377845764,
2198
+ "learning_rate": 9.333472967296833e-06,
2199
+ "loss": 0.0328,
2200
+ "step": 3650
2201
+ },
2202
+ {
2203
+ "grad_norm": 0.40272244811058044,
2204
+ "learning_rate": 9.204962992930063e-06,
2205
+ "loss": 0.0284,
2206
+ "step": 3660
2207
+ },
2208
+ {
2209
+ "grad_norm": 0.4781797528266907,
2210
+ "learning_rate": 9.077143944650802e-06,
2211
+ "loss": 0.0323,
2212
+ "step": 3670
2213
+ },
2214
+ {
2215
+ "grad_norm": 0.34181609749794006,
2216
+ "learning_rate": 8.950021413678306e-06,
2217
+ "loss": 0.0305,
2218
+ "step": 3680
2219
+ },
2220
+ {
2221
+ "grad_norm": 0.3515138328075409,
2222
+ "learning_rate": 8.8236009607639e-06,
2223
+ "loss": 0.0311,
2224
+ "step": 3690
2225
+ },
2226
+ {
2227
+ "grad_norm": 0.42265385389328003,
2228
+ "learning_rate": 8.697888115947725e-06,
2229
+ "loss": 0.0294,
2230
+ "step": 3700
2231
+ },
2232
+ {
2233
+ "grad_norm": 0.24089132249355316,
2234
+ "learning_rate": 8.572888378316884e-06,
2235
+ "loss": 0.0346,
2236
+ "step": 3710
2237
+ },
2238
+ {
2239
+ "grad_norm": 0.3806060254573822,
2240
+ "learning_rate": 8.448607215764823e-06,
2241
+ "loss": 0.0274,
2242
+ "step": 3720
2243
+ },
2244
+ {
2245
+ "grad_norm": 0.40154969692230225,
2246
+ "learning_rate": 8.325050064752238e-06,
2247
+ "loss": 0.0321,
2248
+ "step": 3730
2249
+ },
2250
+ {
2251
+ "grad_norm": 0.6564791798591614,
2252
+ "learning_rate": 8.202222330069167e-06,
2253
+ "loss": 0.0324,
2254
+ "step": 3740
2255
+ },
2256
+ {
2257
+ "grad_norm": 0.4108399748802185,
2258
+ "learning_rate": 8.080129384598625e-06,
2259
+ "loss": 0.0301,
2260
+ "step": 3750
2261
+ },
2262
+ {
2263
+ "grad_norm": 0.19246874749660492,
2264
+ "learning_rate": 7.958776569081586e-06,
2265
+ "loss": 0.0288,
2266
+ "step": 3760
2267
+ },
2268
+ {
2269
+ "grad_norm": 0.4110735058784485,
2270
+ "learning_rate": 7.838169191883316e-06,
2271
+ "loss": 0.0382,
2272
+ "step": 3770
2273
+ },
2274
+ {
2275
+ "grad_norm": 0.25348952412605286,
2276
+ "learning_rate": 7.718312528761223e-06,
2277
+ "loss": 0.0311,
2278
+ "step": 3780
2279
+ },
2280
+ {
2281
+ "grad_norm": 0.3308151662349701,
2282
+ "learning_rate": 7.59921182263402e-06,
2283
+ "loss": 0.0274,
2284
+ "step": 3790
2285
+ },
2286
+ {
2287
+ "grad_norm": 0.28520438075065613,
2288
+ "learning_rate": 7.480872283352428e-06,
2289
+ "loss": 0.0309,
2290
+ "step": 3800
2291
+ },
2292
+ {
2293
+ "grad_norm": 0.337143212556839,
2294
+ "learning_rate": 7.363299087471276e-06,
2295
+ "loss": 0.0259,
2296
+ "step": 3810
2297
+ },
2298
+ {
2299
+ "grad_norm": 0.22851786017417908,
2300
+ "learning_rate": 7.246497378023018e-06,
2301
+ "loss": 0.0323,
2302
+ "step": 3820
2303
+ },
2304
+ {
2305
+ "grad_norm": 0.5074667930603027,
2306
+ "learning_rate": 7.130472264292823e-06,
2307
+ "loss": 0.0292,
2308
+ "step": 3830
2309
+ },
2310
+ {
2311
+ "grad_norm": 0.2871147096157074,
2312
+ "learning_rate": 7.015228821595024e-06,
2313
+ "loss": 0.0296,
2314
+ "step": 3840
2315
+ },
2316
+ {
2317
+ "grad_norm": 0.30016905069351196,
2318
+ "learning_rate": 6.9007720910511554e-06,
2319
+ "loss": 0.0231,
2320
+ "step": 3850
2321
+ },
2322
+ {
2323
+ "grad_norm": 0.28288936614990234,
2324
+ "learning_rate": 6.7871070793693815e-06,
2325
+ "loss": 0.033,
2326
+ "step": 3860
2327
+ },
2328
+ {
2329
+ "grad_norm": 0.44114962220191956,
2330
+ "learning_rate": 6.6742387586255505e-06,
2331
+ "loss": 0.0343,
2332
+ "step": 3870
2333
+ },
2334
+ {
2335
+ "grad_norm": 0.22615277767181396,
2336
+ "learning_rate": 6.562172066045655e-06,
2337
+ "loss": 0.0267,
2338
+ "step": 3880
2339
+ },
2340
+ {
2341
+ "grad_norm": 0.24401821196079254,
2342
+ "learning_rate": 6.450911903789863e-06,
2343
+ "loss": 0.0322,
2344
+ "step": 3890
2345
+ },
2346
+ {
2347
+ "grad_norm": 0.4524429738521576,
2348
+ "learning_rate": 6.340463138738123e-06,
2349
+ "loss": 0.0292,
2350
+ "step": 3900
2351
+ },
2352
+ {
2353
+ "grad_norm": 0.3167012929916382,
2354
+ "learning_rate": 6.230830602277199e-06,
2355
+ "loss": 0.0325,
2356
+ "step": 3910
2357
+ },
2358
+ {
2359
+ "grad_norm": 0.2682662010192871,
2360
+ "learning_rate": 6.1220190900894175e-06,
2361
+ "loss": 0.0273,
2362
+ "step": 3920
2363
+ },
2364
+ {
2365
+ "grad_norm": 0.29721036553382874,
2366
+ "learning_rate": 6.014033361942806e-06,
2367
+ "loss": 0.0266,
2368
+ "step": 3930
2369
+ },
2370
+ {
2371
+ "grad_norm": 0.42319223284721375,
2372
+ "learning_rate": 5.906878141482944e-06,
2373
+ "loss": 0.0322,
2374
+ "step": 3940
2375
+ },
2376
+ {
2377
+ "grad_norm": 0.38211673498153687,
2378
+ "learning_rate": 5.800558116026319e-06,
2379
+ "loss": 0.0312,
2380
+ "step": 3950
2381
+ },
2382
+ {
2383
+ "grad_norm": 0.27969926595687866,
2384
+ "learning_rate": 5.695077936355259e-06,
2385
+ "loss": 0.0263,
2386
+ "step": 3960
2387
+ },
2388
+ {
2389
+ "grad_norm": 0.22936464846134186,
2390
+ "learning_rate": 5.590442216514543e-06,
2391
+ "loss": 0.0309,
2392
+ "step": 3970
2393
+ },
2394
+ {
2395
+ "grad_norm": 0.3358422517776489,
2396
+ "learning_rate": 5.48665553360952e-06,
2397
+ "loss": 0.0243,
2398
+ "step": 3980
2399
+ },
2400
+ {
2401
+ "grad_norm": 0.2455916702747345,
2402
+ "learning_rate": 5.383722427605931e-06,
2403
+ "loss": 0.0293,
2404
+ "step": 3990
2405
+ },
2406
+ {
2407
+ "grad_norm": 0.24449455738067627,
2408
+ "learning_rate": 5.281647401131279e-06,
2409
+ "loss": 0.0283,
2410
+ "step": 4000
2411
+ },
2412
+ {
2413
+ "grad_norm": 0.40746790170669556,
2414
+ "learning_rate": 5.1804349192779044e-06,
2415
+ "loss": 0.0324,
2416
+ "step": 4010
2417
+ },
2418
+ {
2419
+ "grad_norm": 0.3240891695022583,
2420
+ "learning_rate": 5.0800894094076565e-06,
2421
+ "loss": 0.024,
2422
+ "step": 4020
2423
+ },
2424
+ {
2425
+ "grad_norm": 0.25076866149902344,
2426
+ "learning_rate": 4.980615260958193e-06,
2427
+ "loss": 0.0328,
2428
+ "step": 4030
2429
+ },
2430
+ {
2431
+ "grad_norm": 0.1966366469860077,
2432
+ "learning_rate": 4.882016825251037e-06,
2433
+ "loss": 0.0303,
2434
+ "step": 4040
2435
+ },
2436
+ {
2437
+ "grad_norm": 0.2640022337436676,
2438
+ "learning_rate": 4.784298415301172e-06,
2439
+ "loss": 0.0254,
2440
+ "step": 4050
2441
+ },
2442
+ {
2443
+ "grad_norm": 0.33577871322631836,
2444
+ "learning_rate": 4.687464305628405e-06,
2445
+ "loss": 0.0296,
2446
+ "step": 4060
2447
+ },
2448
+ {
2449
+ "grad_norm": 0.40677428245544434,
2450
+ "learning_rate": 4.591518732070402e-06,
2451
+ "loss": 0.0278,
2452
+ "step": 4070
2453
+ },
2454
+ {
2455
+ "grad_norm": 0.46990591287612915,
2456
+ "learning_rate": 4.4964658915973676e-06,
2457
+ "loss": 0.0279,
2458
+ "step": 4080
2459
+ },
2460
+ {
2461
+ "grad_norm": 0.22323285043239594,
2462
+ "learning_rate": 4.40230994212848e-06,
2463
+ "loss": 0.0293,
2464
+ "step": 4090
2465
+ },
2466
+ {
2467
+ "grad_norm": 0.2634666860103607,
2468
+ "learning_rate": 4.309055002349987e-06,
2469
+ "loss": 0.0303,
2470
+ "step": 4100
2471
+ },
2472
+ {
2473
+ "grad_norm": 0.45921197533607483,
2474
+ "learning_rate": 4.21670515153505e-06,
2475
+ "loss": 0.0297,
2476
+ "step": 4110
2477
+ },
2478
+ {
2479
+ "grad_norm": 0.640613853931427,
2480
+ "learning_rate": 4.12526442936533e-06,
2481
+ "loss": 0.0241,
2482
+ "step": 4120
2483
+ },
2484
+ {
2485
+ "grad_norm": 0.3607765734195709,
2486
+ "learning_rate": 4.03473683575423e-06,
2487
+ "loss": 0.0263,
2488
+ "step": 4130
2489
+ },
2490
+ {
2491
+ "grad_norm": 0.3656626045703888,
2492
+ "learning_rate": 3.945126330671969e-06,
2493
+ "loss": 0.028,
2494
+ "step": 4140
2495
+ },
2496
+ {
2497
+ "grad_norm": 0.8340692520141602,
2498
+ "learning_rate": 3.856436833972341e-06,
2499
+ "loss": 0.0298,
2500
+ "step": 4150
2501
+ },
2502
+ {
2503
+ "grad_norm": 0.5998902320861816,
2504
+ "learning_rate": 3.7686722252212344e-06,
2505
+ "loss": 0.0285,
2506
+ "step": 4160
2507
+ },
2508
+ {
2509
+ "grad_norm": 0.36758774518966675,
2510
+ "learning_rate": 3.681836343526965e-06,
2511
+ "loss": 0.0329,
2512
+ "step": 4170
2513
+ },
2514
+ {
2515
+ "grad_norm": 0.31286585330963135,
2516
+ "learning_rate": 3.5959329873723e-06,
2517
+ "loss": 0.0296,
2518
+ "step": 4180
2519
+ },
2520
+ {
2521
+ "grad_norm": 0.38393154740333557,
2522
+ "learning_rate": 3.510965914448333e-06,
2523
+ "loss": 0.0329,
2524
+ "step": 4190
2525
+ },
2526
+ {
2527
+ "grad_norm": 0.396363228559494,
2528
+ "learning_rate": 3.4269388414900792e-06,
2529
+ "loss": 0.0317,
2530
+ "step": 4200
2531
+ },
2532
+ {
2533
+ "grad_norm": 0.222749263048172,
2534
+ "learning_rate": 3.3438554441139247e-06,
2535
+ "loss": 0.0223,
2536
+ "step": 4210
2537
+ },
2538
+ {
2539
+ "grad_norm": 0.24695293605327606,
2540
+ "learning_rate": 3.2617193566568283e-06,
2541
+ "loss": 0.0241,
2542
+ "step": 4220
2543
+ },
2544
+ {
2545
+ "grad_norm": 0.4028778374195099,
2546
+ "learning_rate": 3.1805341720173326e-06,
2547
+ "loss": 0.0226,
2548
+ "step": 4230
2549
+ },
2550
+ {
2551
+ "grad_norm": 0.2558240592479706,
2552
+ "learning_rate": 3.100303441498423e-06,
2553
+ "loss": 0.0315,
2554
+ "step": 4240
2555
+ },
2556
+ {
2557
+ "grad_norm": 0.5111129283905029,
2558
+ "learning_rate": 3.021030674652156e-06,
2559
+ "loss": 0.0291,
2560
+ "step": 4250
2561
+ },
2562
+ {
2563
+ "grad_norm": 0.28568732738494873,
2564
+ "learning_rate": 2.942719339126171e-06,
2565
+ "loss": 0.0288,
2566
+ "step": 4260
2567
+ },
2568
+ {
2569
+ "grad_norm": 0.9272612929344177,
2570
+ "learning_rate": 2.8653728605119695e-06,
2571
+ "loss": 0.0265,
2572
+ "step": 4270
2573
+ },
2574
+ {
2575
+ "grad_norm": 0.2502414584159851,
2576
+ "learning_rate": 2.788994622195096e-06,
2577
+ "loss": 0.0257,
2578
+ "step": 4280
2579
+ },
2580
+ {
2581
+ "grad_norm": 0.3649044930934906,
2582
+ "learning_rate": 2.7135879652071318e-06,
2583
+ "loss": 0.0257,
2584
+ "step": 4290
2585
+ },
2586
+ {
2587
+ "grad_norm": 0.26225656270980835,
2588
+ "learning_rate": 2.6391561880795253e-06,
2589
+ "loss": 0.0256,
2590
+ "step": 4300
2591
+ },
2592
+ {
2593
+ "grad_norm": 0.38593482971191406,
2594
+ "learning_rate": 2.5657025466993472e-06,
2595
+ "loss": 0.0238,
2596
+ "step": 4310
2597
+ },
2598
+ {
2599
+ "grad_norm": 0.24045054614543915,
2600
+ "learning_rate": 2.493230254166817e-06,
2601
+ "loss": 0.0275,
2602
+ "step": 4320
2603
+ },
2604
+ {
2605
+ "grad_norm": 0.33231034874916077,
2606
+ "learning_rate": 2.4217424806547984e-06,
2607
+ "loss": 0.0251,
2608
+ "step": 4330
2609
+ },
2610
+ {
2611
+ "grad_norm": 0.31093278527259827,
2612
+ "learning_rate": 2.3512423532700805e-06,
2613
+ "loss": 0.0244,
2614
+ "step": 4340
2615
+ },
2616
+ {
2617
+ "grad_norm": 0.3532539904117584,
2618
+ "learning_rate": 2.2817329559166293e-06,
2619
+ "loss": 0.0252,
2620
+ "step": 4350
2621
+ },
2622
+ {
2623
+ "grad_norm": 0.5126403570175171,
2624
+ "learning_rate": 2.213217329160672e-06,
2625
+ "loss": 0.0263,
2626
+ "step": 4360
2627
+ },
2628
+ {
2629
+ "grad_norm": 0.3334461450576782,
2630
+ "learning_rate": 2.1456984700976733e-06,
2631
+ "loss": 0.0315,
2632
+ "step": 4370
2633
+ },
2634
+ {
2635
+ "grad_norm": 0.3070288598537445,
2636
+ "learning_rate": 2.079179332221265e-06,
2637
+ "loss": 0.0283,
2638
+ "step": 4380
2639
+ },
2640
+ {
2641
+ "grad_norm": 0.4461181163787842,
2642
+ "learning_rate": 2.0136628252940217e-06,
2643
+ "loss": 0.0274,
2644
+ "step": 4390
2645
+ },
2646
+ {
2647
+ "grad_norm": 0.6602442264556885,
2648
+ "learning_rate": 1.9491518152202096e-06,
2649
+ "loss": 0.0317,
2650
+ "step": 4400
2651
+ },
2652
+ {
2653
+ "grad_norm": 0.2886788547039032,
2654
+ "learning_rate": 1.8856491239203938e-06,
2655
+ "loss": 0.0253,
2656
+ "step": 4410
2657
+ },
2658
+ {
2659
+ "grad_norm": 0.3347417116165161,
2660
+ "learning_rate": 1.8231575292080027e-06,
2661
+ "loss": 0.0316,
2662
+ "step": 4420
2663
+ },
2664
+ {
2665
+ "grad_norm": 0.3918112814426422,
2666
+ "learning_rate": 1.7616797646678479e-06,
2667
+ "loss": 0.0289,
2668
+ "step": 4430
2669
+ },
2670
+ {
2671
+ "grad_norm": 0.41051027178764343,
2672
+ "learning_rate": 1.7012185195365016e-06,
2673
+ "loss": 0.0304,
2674
+ "step": 4440
2675
+ },
2676
+ {
2677
+ "grad_norm": 0.2741791903972626,
2678
+ "learning_rate": 1.6417764385846996e-06,
2679
+ "loss": 0.0241,
2680
+ "step": 4450
2681
+ },
2682
+ {
2683
+ "grad_norm": 0.337773859500885,
2684
+ "learning_rate": 1.5833561220016253e-06,
2685
+ "loss": 0.0276,
2686
+ "step": 4460
2687
+ },
2688
+ {
2689
+ "grad_norm": 0.394645631313324,
2690
+ "learning_rate": 1.5259601252811755e-06,
2691
+ "loss": 0.0229,
2692
+ "step": 4470
2693
+ },
2694
+ {
2695
+ "grad_norm": 0.26460105180740356,
2696
+ "learning_rate": 1.4695909591101924e-06,
2697
+ "loss": 0.0275,
2698
+ "step": 4480
2699
+ },
2700
+ {
2701
+ "grad_norm": 0.30859678983688354,
2702
+ "learning_rate": 1.4142510892586113e-06,
2703
+ "loss": 0.0255,
2704
+ "step": 4490
2705
+ },
2706
+ {
2707
+ "grad_norm": 0.3854379951953888,
2708
+ "learning_rate": 1.3599429364716144e-06,
2709
+ "loss": 0.0276,
2710
+ "step": 4500
2711
+ },
2712
+ {
2713
+ "grad_norm": 0.2807616591453552,
2714
+ "learning_rate": 1.3066688763637453e-06,
2715
+ "loss": 0.028,
2716
+ "step": 4510
2717
+ },
2718
+ {
2719
+ "grad_norm": 0.364891916513443,
2720
+ "learning_rate": 1.2544312393149683e-06,
2721
+ "loss": 0.0258,
2722
+ "step": 4520
2723
+ },
2724
+ {
2725
+ "grad_norm": 0.8333351016044617,
2726
+ "learning_rate": 1.2032323103687654e-06,
2727
+ "loss": 0.0302,
2728
+ "step": 4530
2729
+ },
2730
+ {
2731
+ "grad_norm": 0.31938087940216064,
2732
+ "learning_rate": 1.1530743291321367e-06,
2733
+ "loss": 0.0255,
2734
+ "step": 4540
2735
+ },
2736
+ {
2737
+ "grad_norm": 0.2908027172088623,
2738
+ "learning_rate": 1.1039594896776834e-06,
2739
+ "loss": 0.0227,
2740
+ "step": 4550
2741
+ },
2742
+ {
2743
+ "grad_norm": 0.2906731963157654,
2744
+ "learning_rate": 1.0558899404475824e-06,
2745
+ "loss": 0.0254,
2746
+ "step": 4560
2747
+ },
2748
+ {
2749
+ "grad_norm": 0.4353867471218109,
2750
+ "learning_rate": 1.008867784159645e-06,
2751
+ "loss": 0.0267,
2752
+ "step": 4570
2753
+ },
2754
+ {
2755
+ "grad_norm": 0.30952566862106323,
2756
+ "learning_rate": 9.628950777153256e-07,
2757
+ "loss": 0.0262,
2758
+ "step": 4580
2759
+ },
2760
+ {
2761
+ "grad_norm": 0.7123703956604004,
2762
+ "learning_rate": 9.179738321097225e-07,
2763
+ "loss": 0.0262,
2764
+ "step": 4590
2765
+ },
2766
+ {
2767
+ "grad_norm": 0.4011175334453583,
2768
+ "learning_rate": 8.741060123436535e-07,
2769
+ "loss": 0.0232,
2770
+ "step": 4600
2771
+ },
2772
+ {
2773
+ "grad_norm": 0.305926114320755,
2774
+ "learning_rate": 8.312935373376573e-07,
2775
+ "loss": 0.0259,
2776
+ "step": 4610
2777
+ },
2778
+ {
2779
+ "grad_norm": 0.33336731791496277,
2780
+ "learning_rate": 7.895382798480927e-07,
2781
+ "loss": 0.0283,
2782
+ "step": 4620
2783
+ },
2784
+ {
2785
+ "grad_norm": 0.3118588328361511,
2786
+ "learning_rate": 7.488420663851859e-07,
2787
+ "loss": 0.0224,
2788
+ "step": 4630
2789
+ },
2790
+ {
2791
+ "grad_norm": 0.21298760175704956,
2792
+ "learning_rate": 7.092066771331507e-07,
2793
+ "loss": 0.0282,
2794
+ "step": 4640
2795
+ },
2796
+ {
2797
+ "grad_norm": 0.4557483196258545,
2798
+ "learning_rate": 6.706338458723205e-07,
2799
+ "loss": 0.0277,
2800
+ "step": 4650
2801
+ },
2802
+ {
2803
+ "grad_norm": 0.33916375041007996,
2804
+ "learning_rate": 6.331252599032833e-07,
2805
+ "loss": 0.0322,
2806
+ "step": 4660
2807
+ },
2808
+ {
2809
+ "grad_norm": 0.36580178141593933,
2810
+ "learning_rate": 5.96682559973108e-07,
2811
+ "loss": 0.0234,
2812
+ "step": 4670
2813
+ },
2814
+ {
2815
+ "grad_norm": 0.23574711382389069,
2816
+ "learning_rate": 5.613073402035429e-07,
2817
+ "loss": 0.0229,
2818
+ "step": 4680
2819
+ },
2820
+ {
2821
+ "grad_norm": 0.34600311517715454,
2822
+ "learning_rate": 5.270011480213056e-07,
2823
+ "loss": 0.0332,
2824
+ "step": 4690
2825
+ },
2826
+ {
2827
+ "grad_norm": 0.28487834334373474,
2828
+ "learning_rate": 4.937654840903722e-07,
2829
+ "loss": 0.0355,
2830
+ "step": 4700
2831
+ },
2832
+ {
2833
+ "grad_norm": 0.36917445063591003,
2834
+ "learning_rate": 4.6160180224635305e-07,
2835
+ "loss": 0.0245,
2836
+ "step": 4710
2837
+ },
2838
+ {
2839
+ "grad_norm": 0.2571835517883301,
2840
+ "learning_rate": 4.3051150943289596e-07,
2841
+ "loss": 0.0265,
2842
+ "step": 4720
2843
+ },
2844
+ {
2845
+ "grad_norm": 0.3375624716281891,
2846
+ "learning_rate": 4.004959656401186e-07,
2847
+ "loss": 0.0274,
2848
+ "step": 4730
2849
+ },
2850
+ {
2851
+ "grad_norm": 0.35926106572151184,
2852
+ "learning_rate": 3.715564838451452e-07,
2853
+ "loss": 0.0266,
2854
+ "step": 4740
2855
+ },
2856
+ {
2857
+ "grad_norm": 0.4017363488674164,
2858
+ "learning_rate": 3.436943299546608e-07,
2859
+ "loss": 0.0278,
2860
+ "step": 4750
2861
+ },
2862
+ {
2863
+ "grad_norm": 0.2312772423028946,
2864
+ "learning_rate": 3.169107227495388e-07,
2865
+ "loss": 0.0256,
2866
+ "step": 4760
2867
+ },
2868
+ {
2869
+ "grad_norm": 0.2088507115840912,
2870
+ "learning_rate": 2.912068338315255e-07,
2871
+ "loss": 0.0277,
2872
+ "step": 4770
2873
+ },
2874
+ {
2875
+ "grad_norm": 0.168931245803833,
2876
+ "learning_rate": 2.6658378757198623e-07,
2877
+ "loss": 0.0234,
2878
+ "step": 4780
2879
+ },
2880
+ {
2881
+ "grad_norm": 0.43259093165397644,
2882
+ "learning_rate": 2.430426610627395e-07,
2883
+ "loss": 0.0248,
2884
+ "step": 4790
2885
+ },
2886
+ {
2887
+ "grad_norm": 0.45266538858413696,
2888
+ "learning_rate": 2.205844840689142e-07,
2889
+ "loss": 0.0298,
2890
+ "step": 4800
2891
+ },
2892
+ {
2893
+ "grad_norm": 0.41012969613075256,
2894
+ "learning_rate": 1.9921023898393233e-07,
2895
+ "loss": 0.0258,
2896
+ "step": 4810
2897
+ },
2898
+ {
2899
+ "grad_norm": 0.4440428614616394,
2900
+ "learning_rate": 1.7892086078651616e-07,
2901
+ "loss": 0.021,
2902
+ "step": 4820
2903
+ },
2904
+ {
2905
+ "grad_norm": 0.3820282518863678,
2906
+ "learning_rate": 1.5971723699979013e-07,
2907
+ "loss": 0.0274,
2908
+ "step": 4830
2909
+ },
2910
+ {
2911
+ "grad_norm": 0.166753888130188,
2912
+ "learning_rate": 1.4160020765247862e-07,
2913
+ "loss": 0.0338,
2914
+ "step": 4840
2915
+ },
2916
+ {
2917
+ "grad_norm": 0.2630172669887543,
2918
+ "learning_rate": 1.2457056524212696e-07,
2919
+ "loss": 0.0303,
2920
+ "step": 4850
2921
+ },
2922
+ {
2923
+ "grad_norm": 0.28150999546051025,
2924
+ "learning_rate": 1.0862905470047091e-07,
2925
+ "loss": 0.0248,
2926
+ "step": 4860
2927
+ },
2928
+ {
2929
+ "grad_norm": 0.19534726440906525,
2930
+ "learning_rate": 9.377637336082101e-08,
2931
+ "loss": 0.0218,
2932
+ "step": 4870
2933
+ },
2934
+ {
2935
+ "grad_norm": 0.21588121354579926,
2936
+ "learning_rate": 8.001317092757864e-08,
2937
+ "loss": 0.0292,
2938
+ "step": 4880
2939
+ },
2940
+ {
2941
+ "grad_norm": 0.3922027349472046,
2942
+ "learning_rate": 6.73400494477977e-08,
2943
+ "loss": 0.0273,
2944
+ "step": 4890
2945
+ },
2946
+ {
2947
+ "grad_norm": 0.3174291253089905,
2948
+ "learning_rate": 5.5757563284875026e-08,
2949
+ "loss": 0.0276,
2950
+ "step": 4900
2951
+ },
2952
+ {
2953
+ "grad_norm": 0.24576455354690552,
2954
+ "learning_rate": 4.526621909426987e-08,
2955
+ "loss": 0.0259,
2956
+ "step": 4910
2957
+ },
2958
+ {
2959
+ "grad_norm": 0.22395384311676025,
2960
+ "learning_rate": 3.586647580136881e-08,
2961
+ "loss": 0.023,
2962
+ "step": 4920
2963
+ },
2964
+ {
2965
+ "grad_norm": 0.8619683980941772,
2966
+ "learning_rate": 2.755874458139629e-08,
2967
+ "loss": 0.0288,
2968
+ "step": 4930
2969
+ },
2970
+ {
2971
+ "grad_norm": 0.31981348991394043,
2972
+ "learning_rate": 2.034338884142617e-08,
2973
+ "loss": 0.0246,
2974
+ "step": 4940
2975
+ },
2976
+ {
2977
+ "grad_norm": 0.27290672063827515,
2978
+ "learning_rate": 1.422072420449172e-08,
2979
+ "loss": 0.0277,
2980
+ "step": 4950
2981
+ },
2982
+ {
2983
+ "grad_norm": 0.2460501492023468,
2984
+ "learning_rate": 9.191018495779968e-09,
2985
+ "loss": 0.0247,
2986
+ "step": 4960
2987
+ },
2988
+ {
2989
+ "grad_norm": 0.27399739623069763,
2990
+ "learning_rate": 5.254491730916078e-09,
2991
+ "loss": 0.0333,
2992
+ "step": 4970
2993
+ },
2994
+ {
2995
+ "grad_norm": 0.3019241988658905,
2996
+ "learning_rate": 2.411316106326611e-09,
2997
+ "loss": 0.0295,
2998
+ "step": 4980
2999
+ },
3000
+ {
3001
+ "grad_norm": 0.2698662281036377,
3002
+ "learning_rate": 6.616159917316456e-10,
3003
+ "loss": 0.0259,
3004
+ "step": 4990
3005
+ },
3006
+ {
3007
+ "grad_norm": 0.282757043838501,
3008
+ "learning_rate": 5.4679246769273606e-12,
3009
+ "loss": 0.0249,
3010
+ "step": 5000
3011
+ }
3012
+ ],
3013
+ "logging_steps": 10,
3014
+ "max_steps": 5000,
3015
+ "num_input_tokens_seen": 0,
3016
+ "num_train_epochs": 9223372036854775807,
3017
+ "save_steps": 5000,
3018
+ "stateful_callbacks": {
3019
+ "TrainerControl": {
3020
+ "args": {
3021
+ "should_epoch_stop": false,
3022
+ "should_evaluate": false,
3023
+ "should_log": false,
3024
+ "should_save": true,
3025
+ "should_training_stop": true
3026
+ },
3027
+ "attributes": {}
3028
+ }
3029
+ },
3030
+ "total_flos": 0.0,
3031
+ "train_batch_size": 32,
3032
+ "trial_name": null,
3033
+ "trial_params": null
3034
+ }
checkpoint-5000/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:273910977029e314f0cf45f0c23e1eddadbc4e624fca833ddf2b3468e7f50876
3
+ size 5713
checkpoint-5000/wandb_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"project": "finetune-gr00t-n1d6", "run_id": "omy_1"}
config.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_horizon": 50,
3
+ "add_pos_embed": true,
4
+ "apply_sincos_state_encoding": true,
5
+ "architectures": [
6
+ "Gr00tN1d6"
7
+ ],
8
+ "attn_dropout": 0.2,
9
+ "attn_implementation": null,
10
+ "backbone_embedding_dim": 2048,
11
+ "backbone_model_type": "eagle",
12
+ "backbone_trainable_params_fp32": true,
13
+ "collator_overwrite_image_inputs": false,
14
+ "color_jitter_params": {
15
+ "brightness": 0.1,
16
+ "contrast": 0.1,
17
+ "hue": 0.1,
18
+ "saturation": 0.1
19
+ },
20
+ "crop_fraction": 0.95,
21
+ "diffusion_model_cfg": {
22
+ "attention_head_dim": 48,
23
+ "dropout": 0.2,
24
+ "final_dropout": true,
25
+ "interleave_self_attention": true,
26
+ "norm_type": "ada_norm",
27
+ "num_attention_heads": 32,
28
+ "num_layers": 32,
29
+ "output_dim": 1024,
30
+ "positional_embeddings": null
31
+ },
32
+ "eagle_collator": true,
33
+ "formalize_language": true,
34
+ "gemma_collator": false,
35
+ "hidden_size": 1024,
36
+ "image_crop_size": null,
37
+ "image_target_size": null,
38
+ "input_embedding_dim": 1536,
39
+ "load_bf16": true,
40
+ "max_action_dim": 128,
41
+ "max_num_embodiments": 32,
42
+ "max_seq_len": 1024,
43
+ "max_state_dim": 128,
44
+ "model_dtype": "bfloat16",
45
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
46
+ "model_type": "Gr00tN1d6",
47
+ "noise_beta_alpha": 1.5,
48
+ "noise_beta_beta": 1.0,
49
+ "noise_s": 0.999,
50
+ "num_inference_timesteps": 4,
51
+ "num_timestep_buckets": 1000,
52
+ "random_rotation_angle": null,
53
+ "reproject_vision": false,
54
+ "select_layer": 16,
55
+ "shortest_image_edge": 256,
56
+ "state_dropout_prob": 0.15,
57
+ "torch_dtype": "bfloat16",
58
+ "transformers_version": "4.51.3",
59
+ "tune_diffusion_model": true,
60
+ "tune_llm": false,
61
+ "tune_projector": true,
62
+ "tune_top_llm_layers": 4,
63
+ "tune_visual": false,
64
+ "tune_vlln": true,
65
+ "use_albumentations_transforms": true,
66
+ "use_alternate_vl_dit": true,
67
+ "use_flash_attention": true,
68
+ "use_relative_action": true,
69
+ "use_vlln": true
70
+ }
experiment_cfg/conf.yaml ADDED
@@ -0,0 +1,209 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ load_config_path: null
2
+ model:
3
+ model_type: Gr00tN1d6
4
+ model_dtype: bfloat16
5
+ model_name: nvidia/Eagle-Block2A-2B-v2
6
+ backbone_model_type: eagle
7
+ model_revision: null
8
+ tune_top_llm_layers: 4
9
+ backbone_embedding_dim: 2048
10
+ tune_llm: false
11
+ tune_visual: false
12
+ select_layer: 16
13
+ reproject_vision: false
14
+ use_flash_attention: true
15
+ load_bf16: false
16
+ collator_overwrite_image_inputs: false
17
+ eagle_collator: true
18
+ backbone_trainable_params_fp32: true
19
+ image_crop_size: null
20
+ image_target_size: null
21
+ shortest_image_edge: 256
22
+ crop_fraction: 0.95
23
+ random_rotation_angle: null
24
+ color_jitter_params:
25
+ brightness: 0.3
26
+ contrast: 0.4
27
+ saturation: 0.5
28
+ hue: 0.08
29
+ use_albumentations_transforms: true
30
+ formalize_language: true
31
+ apply_sincos_state_encoding: false
32
+ use_relative_action: true
33
+ max_state_dim: 29
34
+ max_action_dim: 29
35
+ action_horizon: 16
36
+ hidden_size: 1024
37
+ input_embedding_dim: 1536
38
+ add_pos_embed: true
39
+ attn_dropout: 0.2
40
+ use_vlln: true
41
+ max_seq_len: 1024
42
+ use_alternate_vl_dit: true
43
+ attend_text_every_n_blocks: 2
44
+ diffusion_model_cfg:
45
+ positional_embeddings: null
46
+ num_layers: 32
47
+ num_attention_heads: 32
48
+ attention_head_dim: 48
49
+ norm_type: ada_norm
50
+ dropout: 0.2
51
+ final_dropout: true
52
+ output_dim: 1024
53
+ interleave_self_attention: true
54
+ num_inference_timesteps: 4
55
+ noise_beta_alpha: 1.5
56
+ noise_beta_beta: 1.0
57
+ noise_s: 0.999
58
+ num_timestep_buckets: 1000
59
+ tune_projector: true
60
+ tune_diffusion_model: true
61
+ tune_vlln: true
62
+ state_dropout_prob: 0.15
63
+ state_additive_noise_scale: 0.0
64
+ max_num_embodiments: 32
65
+ data:
66
+ datasets:
67
+ - dataset_paths:
68
+ - /workspace/teleoperation_dataset_gr00t_v2_p3_4_merged_lerobot_v2
69
+ embodiment_tag: new_embodiment
70
+ mix_ratio: 1.0
71
+ dataset_type: physical_embodiment
72
+ val_dataset_path: null
73
+ modality_configs:
74
+ new_embodiment:
75
+ video:
76
+ delta_indices:
77
+ - 0
78
+ modality_keys:
79
+ - front
80
+ - wrist
81
+ sin_cos_embedding_keys: null
82
+ mean_std_embedding_keys: null
83
+ action_configs: null
84
+ state:
85
+ delta_indices:
86
+ - 0
87
+ modality_keys:
88
+ - single_arm
89
+ - gripper
90
+ sin_cos_embedding_keys: null
91
+ mean_std_embedding_keys: null
92
+ action_configs: null
93
+ action:
94
+ delta_indices:
95
+ - 0
96
+ - 1
97
+ - 2
98
+ - 3
99
+ - 4
100
+ - 5
101
+ - 6
102
+ - 7
103
+ - 8
104
+ - 9
105
+ - 10
106
+ - 11
107
+ - 12
108
+ - 13
109
+ - 14
110
+ - 15
111
+ modality_keys:
112
+ - single_arm
113
+ - gripper
114
+ sin_cos_embedding_keys: null
115
+ mean_std_embedding_keys: null
116
+ action_configs:
117
+ - rep: RELATIVE
118
+ type: NON_EEF
119
+ format: DEFAULT
120
+ state_key: null
121
+ - rep: ABSOLUTE
122
+ type: NON_EEF
123
+ format: DEFAULT
124
+ state_key: null
125
+ language:
126
+ delta_indices:
127
+ - 0
128
+ modality_keys:
129
+ - annotation.human.task_description
130
+ sin_cos_embedding_keys: null
131
+ mean_std_embedding_keys: null
132
+ action_configs: null
133
+ download_cache: false
134
+ shard_size: 1024
135
+ episode_sampling_rate: 0.1
136
+ num_shards_per_epoch: 100000
137
+ override_pretraining_statistics: false
138
+ mode: single_turn
139
+ random_chop: 0.0
140
+ mock_dataset_mode: false
141
+ shuffle: true
142
+ seed: 42
143
+ multiprocessing_context: fork
144
+ allow_padding: false
145
+ subsample_ratio: 1.0
146
+ image_crop_size:
147
+ - 244
148
+ - 244
149
+ image_target_size:
150
+ - 224
151
+ - 224
152
+ video_backend: torchcodec
153
+ training:
154
+ output_dir: /workspace/Isaac-GR00T/outputs/omy_1
155
+ experiment_name: null
156
+ max_steps: 5000
157
+ global_batch_size: 32
158
+ batch_size: null
159
+ gradient_accumulation_steps: 1
160
+ learning_rate: 5.0e-05
161
+ lr_scheduler_type: cosine
162
+ weight_decay: 0.0001
163
+ warmup_ratio: 0.05
164
+ warmup_steps: 0
165
+ max_grad_norm: 1.0
166
+ optim: adamw_torch
167
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
168
+ tf32: true
169
+ fp16: false
170
+ bf16: true
171
+ eval_bf16: true
172
+ logging_steps: 10
173
+ save_steps: 5000
174
+ save_total_limit: 1
175
+ save_vl_model: false
176
+ upload_checkpoints: false
177
+ upload_every: 1000
178
+ upload_last_n_checkpoints: 5
179
+ max_concurrent_uploads: 2
180
+ eval_strategy: 'no'
181
+ eval_steps: 500
182
+ eval_set_split_ratio: 0.1
183
+ eval_batch_size: 2
184
+ save_best_eval_metric_name: ''
185
+ save_best_eval_metric_greater_is_better: true
186
+ deepspeed_stage: 2
187
+ gradient_checkpointing: false
188
+ transformers_trust_remote_code: true
189
+ transformers_local_files_only: false
190
+ transformers_cache_dir: null
191
+ transformers_access_token: null
192
+ use_ddp: false
193
+ ddp_bucket_cap_mb: 100
194
+ num_gpus: 1
195
+ dataloader_num_workers: 4
196
+ remove_unused_columns: false
197
+ use_wandb: false
198
+ wandb_project: finetune-gr00t-n1d6
199
+ enable_profiling: false
200
+ max_retries: 3
201
+ assert_loss_less_than: null
202
+ add_rl_callback: false
203
+ enable_open_loop_eval: false
204
+ open_loop_eval_traj_ids:
205
+ - 0
206
+ open_loop_eval_steps_per_traj: 100
207
+ open_loop_eval_plot_indices: null
208
+ max_steps: 5000
209
+ save_steps: 5000
experiment_cfg/config.yaml ADDED
@@ -0,0 +1,243 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:gr00t.configs.base_config.Config
2
+ data: !!python/object:gr00t.configs.data.data_config.DataConfig
3
+ allow_padding: false
4
+ datasets:
5
+ - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
6
+ dataset_paths:
7
+ - /workspace/teleoperation_dataset_gr00t_v2_p3_4_merged_lerobot_v2
8
+ dataset_type: physical_embodiment
9
+ embodiment_tag: new_embodiment
10
+ mix_ratio: 1.0
11
+ val_dataset_path: null
12
+ download_cache: false
13
+ episode_sampling_rate: 0.1
14
+ image_crop_size:
15
+ - 244
16
+ - 244
17
+ image_target_size:
18
+ - 224
19
+ - 224
20
+ mock_dataset_mode: false
21
+ modality_configs:
22
+ new_embodiment:
23
+ action: !!python/object:gr00t.data.types.ModalityConfig
24
+ action_configs:
25
+ - !!python/object:gr00t.data.types.ActionConfig
26
+ format: &id001 !!python/object/apply:gr00t.data.types.ActionFormat
27
+ - default
28
+ rep: !!python/object/apply:gr00t.data.types.ActionRepresentation
29
+ - relative
30
+ state_key: null
31
+ type: &id002 !!python/object/apply:gr00t.data.types.ActionType
32
+ - non_eef
33
+ - !!python/object:gr00t.data.types.ActionConfig
34
+ format: *id001
35
+ rep: !!python/object/apply:gr00t.data.types.ActionRepresentation
36
+ - absolute
37
+ state_key: null
38
+ type: *id002
39
+ delta_indices:
40
+ - 0
41
+ - 1
42
+ - 2
43
+ - 3
44
+ - 4
45
+ - 5
46
+ - 6
47
+ - 7
48
+ - 8
49
+ - 9
50
+ - 10
51
+ - 11
52
+ - 12
53
+ - 13
54
+ - 14
55
+ - 15
56
+ mean_std_embedding_keys: null
57
+ modality_keys:
58
+ - single_arm
59
+ - gripper
60
+ sin_cos_embedding_keys: null
61
+ language: !!python/object:gr00t.data.types.ModalityConfig
62
+ action_configs: null
63
+ delta_indices:
64
+ - 0
65
+ mean_std_embedding_keys: null
66
+ modality_keys:
67
+ - annotation.human.task_description
68
+ sin_cos_embedding_keys: null
69
+ state: !!python/object:gr00t.data.types.ModalityConfig
70
+ action_configs: null
71
+ delta_indices:
72
+ - 0
73
+ mean_std_embedding_keys: null
74
+ modality_keys:
75
+ - single_arm
76
+ - gripper
77
+ sin_cos_embedding_keys: null
78
+ video: !!python/object:gr00t.data.types.ModalityConfig
79
+ action_configs: null
80
+ delta_indices:
81
+ - 0
82
+ mean_std_embedding_keys: null
83
+ modality_keys:
84
+ - front
85
+ - wrist
86
+ sin_cos_embedding_keys: null
87
+ mode: single_turn
88
+ multiprocessing_context: fork
89
+ num_shards_per_epoch: 100000
90
+ override_pretraining_statistics: false
91
+ random_chop: 0.0
92
+ seed: 42
93
+ shard_size: 1024
94
+ shuffle: true
95
+ subsample_ratio: 1.0
96
+ video_backend: torchcodec
97
+ load_config_path: null
98
+ model: !!python/object:gr00t.configs.model.gr00t_n1d6.Gr00tN1d6Config
99
+ _attn_implementation_autoset: false
100
+ _attn_implementation_internal: null
101
+ _commit_hash: null
102
+ _name_or_path: ''
103
+ add_cross_attention: false
104
+ architectures: null
105
+ backbone_model_type: eagle
106
+ backbone_trainable_params_fp32: true
107
+ bad_words_ids: null
108
+ begin_suppress_tokens: null
109
+ bos_token_id: null
110
+ chunk_size_feed_forward: 0
111
+ color_jitter_params:
112
+ brightness: 0.3
113
+ contrast: 0.4
114
+ hue: 0.08
115
+ saturation: 0.5
116
+ cross_attention_hidden_size: null
117
+ decoder_start_token_id: null
118
+ diffusion_model_cfg:
119
+ attention_head_dim: 48
120
+ dropout: 0.2
121
+ final_dropout: true
122
+ interleave_self_attention: true
123
+ norm_type: ada_norm
124
+ num_attention_heads: 32
125
+ num_layers: 32
126
+ output_dim: 1024
127
+ positional_embeddings: null
128
+ diversity_penalty: 0.0
129
+ do_sample: false
130
+ eagle_collator: true
131
+ early_stopping: false
132
+ encoder_no_repeat_ngram_size: 0
133
+ eos_token_id: null
134
+ exponential_decay_length_penalty: null
135
+ finetuning_task: null
136
+ forced_bos_token_id: null
137
+ forced_eos_token_id: null
138
+ id2label:
139
+ 0: LABEL_0
140
+ 1: LABEL_1
141
+ is_decoder: false
142
+ is_encoder_decoder: false
143
+ label2id:
144
+ LABEL_0: 0
145
+ LABEL_1: 1
146
+ length_penalty: 1.0
147
+ load_bf16: false
148
+ max_length: 20
149
+ min_length: 0
150
+ model_name: nvidia/Eagle-Block2A-2B-v2
151
+ no_repeat_ngram_size: 0
152
+ num_beam_groups: 1
153
+ num_beams: 1
154
+ num_return_sequences: 1
155
+ output_attentions: false
156
+ output_hidden_states: false
157
+ output_scores: false
158
+ pad_token_id: null
159
+ prefix: null
160
+ problem_type: null
161
+ pruned_heads: {}
162
+ random_rotation_angle: null
163
+ remove_invalid_values: false
164
+ repetition_penalty: 1.0
165
+ reproject_vision: false
166
+ return_dict: true
167
+ return_dict_in_generate: false
168
+ sep_token_id: null
169
+ state_dropout_prob: 0.15
170
+ suppress_tokens: null
171
+ task_specific_params: null
172
+ temperature: 1.0
173
+ tf_legacy_loss: false
174
+ tie_encoder_decoder: false
175
+ tie_word_embeddings: true
176
+ tokenizer_class: null
177
+ top_k: 50
178
+ top_p: 1.0
179
+ torch_dtype: null
180
+ torchscript: false
181
+ transformers_version: null
182
+ tune_diffusion_model: true
183
+ tune_llm: false
184
+ tune_projector: true
185
+ tune_visual: false
186
+ typical_p: 1.0
187
+ use_bfloat16: false
188
+ use_relative_action: true
189
+ training: !!python/object:gr00t.configs.training.training_config.TrainingConfig
190
+ add_rl_callback: false
191
+ assert_loss_less_than: null
192
+ batch_size: null
193
+ bf16: true
194
+ dataloader_num_workers: 4
195
+ ddp_bucket_cap_mb: 100
196
+ deepspeed_stage: 2
197
+ enable_open_loop_eval: false
198
+ enable_profiling: false
199
+ eval_batch_size: 2
200
+ eval_bf16: true
201
+ eval_set_split_ratio: 0.1
202
+ eval_steps: 500
203
+ eval_strategy: 'no'
204
+ experiment_name: null
205
+ fp16: false
206
+ global_batch_size: 32
207
+ gradient_accumulation_steps: 1
208
+ gradient_checkpointing: false
209
+ learning_rate: 5.0e-05
210
+ logging_steps: 10
211
+ lr_scheduler_type: cosine
212
+ max_concurrent_uploads: 2
213
+ max_grad_norm: 1.0
214
+ max_retries: 3
215
+ max_steps: 5000
216
+ num_gpus: 1
217
+ open_loop_eval_plot_indices: null
218
+ open_loop_eval_steps_per_traj: 100
219
+ open_loop_eval_traj_ids:
220
+ - 0
221
+ optim: adamw_torch
222
+ output_dir: /workspace/Isaac-GR00T/outputs/omy_1
223
+ remove_unused_columns: false
224
+ save_best_eval_metric_greater_is_better: true
225
+ save_best_eval_metric_name: ''
226
+ save_steps: 5000
227
+ save_total_limit: 1
228
+ save_vl_model: false
229
+ start_from_checkpoint: nvidia/GR00T-N1.6-3B
230
+ tf32: true
231
+ transformers_access_token: null
232
+ transformers_cache_dir: null
233
+ transformers_local_files_only: false
234
+ transformers_trust_remote_code: true
235
+ upload_checkpoints: false
236
+ upload_every: 1000
237
+ upload_last_n_checkpoints: 5
238
+ use_ddp: false
239
+ use_wandb: false
240
+ wandb_project: finetune-gr00t-n1d6
241
+ warmup_ratio: 0.05
242
+ warmup_steps: 0
243
+ weight_decay: 0.0001
experiment_cfg/dataset_statistics.json ADDED
@@ -0,0 +1,932 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "new_embodiment": {
3
+ "state": {
4
+ "single_arm": {
5
+ "min": [
6
+ -0.3484296202659607,
7
+ -0.2940049469470978,
8
+ -1.4568357467651367,
9
+ -0.918129026889801,
10
+ 1.5524020195007324,
11
+ -0.8714576959609985
12
+ ],
13
+ "max": [
14
+ 0.871225893497467,
15
+ 1.4812145233154297,
16
+ 2.2445228099823,
17
+ 1.6041626930236816,
18
+ 1.580612301826477,
19
+ 0.34752944111824036
20
+ ],
21
+ "mean": [
22
+ 0.0660708295904004,
23
+ 0.2896196729390686,
24
+ 1.273881831918799,
25
+ 0.07309057529716799,
26
+ 1.5695173609910642,
27
+ -0.0675732313873097
28
+ ],
29
+ "std": [
30
+ 0.24684875710013002,
31
+ 0.2624021895353532,
32
+ 0.6396142403168285,
33
+ 0.5623540573067425,
34
+ 0.0019495733088944448,
35
+ 0.24706634675426653
36
+ ],
37
+ "q01": [
38
+ -0.14120122547514716,
39
+ -0.15137712556556798,
40
+ 0.25940447983184756,
41
+ -0.7327557047228977,
42
+ 1.5623217466486523,
43
+ -0.6984691145028645
44
+ ],
45
+ "q99": [
46
+ 0.6986005893203253,
47
+ 0.6137331449754688,
48
+ 1.989423889739015,
49
+ 0.902999176898917,
50
+ 1.5715922809600218,
51
+ 0.13965727915057108
52
+ ]
53
+ },
54
+ "gripper": {
55
+ "min": [
56
+ 0.0
57
+ ],
58
+ "max": [
59
+ 1.0
60
+ ],
61
+ "mean": [
62
+ 0.2753448165213926
63
+ ],
64
+ "std": [
65
+ 0.44668786429986657
66
+ ],
67
+ "q01": [
68
+ -1.000000013351432e-10
69
+ ],
70
+ "q99": [
71
+ 0.9999925267031382
72
+ ]
73
+ }
74
+ },
75
+ "action": {
76
+ "single_arm": {
77
+ "min": [
78
+ -0.35249605774879456,
79
+ -0.340976357460022,
80
+ -1.4720337390899658,
81
+ -0.9139819741249084,
82
+ 1.5523695945739746,
83
+ -0.8805081248283386
84
+ ],
85
+ "max": [
86
+ 0.8796143531799316,
87
+ 1.4417712688446045,
88
+ 2.2255284786224365,
89
+ 1.6055001020431519,
90
+ 1.571340799331665,
91
+ 0.351653516292572
92
+ ],
93
+ "mean": [
94
+ 0.07284960426261836,
95
+ 0.2567877877935287,
96
+ 1.2472866734129062,
97
+ 0.0652026161086495,
98
+ 1.56964799977149,
99
+ -0.07374245072646021
100
+ ],
101
+ "std": [
102
+ 0.25668078105389325,
103
+ 0.25697145420740913,
104
+ 0.6486887061942791,
105
+ 0.566977630034768,
106
+ 0.002414096561250562,
107
+ 0.2566087339519503
108
+ ],
109
+ "q01": [
110
+ -0.1498670041869513,
111
+ -0.17465162009659907,
112
+ 0.2170314396344432,
113
+ -0.7378591563813238,
114
+ 1.5674572562165083,
115
+ -0.7113432860253213
116
+ ],
117
+ "q99": [
118
+ 0.7104775490699361,
119
+ 0.5871068334930613,
120
+ 1.9767465605823349,
121
+ 0.9021054332053293,
122
+ 1.5705683645924846,
123
+ 0.14903640795681997
124
+ ]
125
+ },
126
+ "gripper": {
127
+ "min": [
128
+ 0.0
129
+ ],
130
+ "max": [
131
+ 1.0
132
+ ],
133
+ "mean": [
134
+ 0.2733744355732537
135
+ ],
136
+ "std": [
137
+ 0.4456914315372699
138
+ ],
139
+ "q01": [
140
+ -1.000000013351432e-10
141
+ ],
142
+ "q99": [
143
+ 0.9999924756906762
144
+ ]
145
+ }
146
+ },
147
+ "relative_action": {
148
+ "single_arm": {
149
+ "min": [
150
+ [
151
+ -0.15696251392364502,
152
+ -0.34446781873703003,
153
+ -0.6737130880355835,
154
+ -0.3178783655166626,
155
+ -0.01156306266784668,
156
+ -0.16844062507152557
157
+ ],
158
+ [
159
+ -0.1919003129005432,
160
+ -0.4053707718849182,
161
+ -0.7816908955574036,
162
+ -0.38410383462905884,
163
+ -0.011548161506652832,
164
+ -0.2033797651529312
165
+ ],
166
+ [
167
+ -0.22658002376556396,
168
+ -0.46504658460617065,
169
+ -0.8752028942108154,
170
+ -0.4481411576271057,
171
+ -0.011525154113769531,
172
+ -0.2386666089296341
173
+ ],
174
+ [
175
+ -0.25767937302589417,
176
+ -0.5173105597496033,
177
+ -0.960516095161438,
178
+ -0.5121691226959229,
179
+ -0.011506915092468262,
180
+ -0.2736057639122009
181
+ ],
182
+ [
183
+ -0.2887968122959137,
184
+ -0.5641186833381653,
185
+ -1.0343924760818481,
186
+ -0.5759719610214233,
187
+ -0.011516809463500977,
188
+ -0.30846402049064636
189
+ ],
190
+ [
191
+ -0.3199325501918793,
192
+ -0.6068925261497498,
193
+ -1.1042704582214355,
194
+ -0.6281388401985168,
195
+ -0.011510848999023438,
196
+ -0.34338027238845825
197
+ ],
198
+ [
199
+ -0.3509705364704132,
200
+ -0.6361642479896545,
201
+ -1.1701284646987915,
202
+ -0.6791977882385254,
203
+ -0.011488914489746094,
204
+ -0.37825170159339905
205
+ ],
206
+ [
207
+ -0.38060125708580017,
208
+ -0.6464956998825073,
209
+ -1.2320352792739868,
210
+ -0.7301526665687561,
211
+ -0.01146841049194336,
212
+ -0.4131423830986023
213
+ ],
214
+ [
215
+ -0.40787461400032043,
216
+ -0.6518352031707764,
217
+ -1.2899482250213623,
218
+ -0.7853091359138489,
219
+ -0.011491179466247559,
220
+ -0.448012113571167
221
+ ],
222
+ [
223
+ -0.4350906312465668,
224
+ -0.6538127660751343,
225
+ -1.3439218997955322,
226
+ -0.8374760150909424,
227
+ -0.011620759963989258,
228
+ -0.48276638984680176
229
+ ],
230
+ [
231
+ -0.4614231288433075,
232
+ -0.6572719812393188,
233
+ -1.3943485021591187,
234
+ -0.8772416114807129,
235
+ -0.011820793151855469,
236
+ -0.5160169005393982
237
+ ],
238
+ [
239
+ -0.485305517911911,
240
+ -0.6611306667327881,
241
+ -1.4443868398666382,
242
+ -0.9266657829284668,
243
+ -0.012117266654968262,
244
+ -0.547016978263855
245
+ ],
246
+ [
247
+ -0.5076735019683838,
248
+ -0.663108229637146,
249
+ -1.4905352592468262,
250
+ -0.9745397567749023,
251
+ -0.01165163516998291,
252
+ -0.5803918838500977
253
+ ],
254
+ [
255
+ -0.5290192365646362,
256
+ -0.6650083065032959,
257
+ -1.533168911933899,
258
+ -1.0207548141479492,
259
+ -0.011184930801391602,
260
+ -0.6152510046958923
261
+ ],
262
+ [
263
+ -0.5489386320114136,
264
+ -0.6667595505714417,
265
+ -1.5753229856491089,
266
+ -1.051430106163025,
267
+ -0.0109940767288208,
268
+ -0.6500052809715271
269
+ ],
270
+ [
271
+ -0.5668587684631348,
272
+ -0.667188823223114,
273
+ -1.6137160062789917,
274
+ -1.0931904315948486,
275
+ -0.010291337966918945,
276
+ -0.6832557916641235
277
+ ]
278
+ ],
279
+ "max": [
280
+ [
281
+ 0.16824336349964142,
282
+ 0.24052470922470093,
283
+ 0.5061454772949219,
284
+ 0.39507728815078735,
285
+ 0.006520986557006836,
286
+ 0.15706884860992432
287
+ ],
288
+ [
289
+ 0.20314648747444153,
290
+ 0.3025338053703308,
291
+ 0.6245244741439819,
292
+ 0.4650633931159973,
293
+ 0.006515979766845703,
294
+ 0.19194811582565308
295
+ ],
296
+ [
297
+ 0.2384708970785141,
298
+ 0.36002570390701294,
299
+ 0.7428172826766968,
300
+ 0.5275017023086548,
301
+ 0.006508588790893555,
302
+ 0.22680965065956116
303
+ ],
304
+ [
305
+ 0.2733740210533142,
306
+ 0.4157518148422241,
307
+ 0.8477752208709717,
308
+ 0.5841488242149353,
309
+ 0.00649869441986084,
310
+ 0.25784188508987427
311
+ ],
312
+ [
313
+ 0.30832749605178833,
314
+ 0.470317006111145,
315
+ 0.9313650131225586,
316
+ 0.6372599005699158,
317
+ 0.0064623355865478516,
318
+ 0.2888680100440979
319
+ ],
320
+ [
321
+ 0.343273401260376,
322
+ 0.5153665542602539,
323
+ 1.0067442655563354,
324
+ 0.6891289949417114,
325
+ 0.006403207778930664,
326
+ 0.31988149881362915
327
+ ],
328
+ [
329
+ 0.37823686003685,
330
+ 0.5592126250267029,
331
+ 1.065140724182129,
332
+ 0.7395720481872559,
333
+ 0.006318211555480957,
334
+ 0.3508707284927368
335
+ ],
336
+ [
337
+ 0.4132160246372223,
338
+ 0.5731149315834045,
339
+ 1.0996272563934326,
340
+ 0.788618266582489,
341
+ 0.006203055381774902,
342
+ 0.380546510219574
343
+ ],
344
+ [
345
+ 0.4482080936431885,
346
+ 0.5804688334465027,
347
+ 1.1714509725570679,
348
+ 0.8365987539291382,
349
+ 0.006093502044677734,
350
+ 0.40765124559402466
351
+ ],
352
+ [
353
+ 0.4830245077610016,
354
+ 0.5881319642066956,
355
+ 1.2263423204421997,
356
+ 0.8837657570838928,
357
+ 0.006119847297668457,
358
+ 0.4347139000892639
359
+ ],
360
+ [
361
+ 0.5162209272384644,
362
+ 0.5954858660697937,
363
+ 1.2864584922790527,
364
+ 0.9293184876441956,
365
+ 0.006140708923339844,
366
+ 0.4610365033149719
367
+ ],
368
+ [
369
+ 0.5473360419273376,
370
+ 0.5992559194564819,
371
+ 1.3450905084609985,
372
+ 0.9761509299278259,
373
+ 0.0061490535736083984,
374
+ 0.4848148226737976
375
+ ],
376
+ [
377
+ 0.5806077122688293,
378
+ 0.6047143936157227,
379
+ 1.3999574184417725,
380
+ 1.0215784311294556,
381
+ 0.006112813949584961,
382
+ 0.5069919228553772
383
+ ],
384
+ [
385
+ 0.6154510378837585,
386
+ 0.6339849233627319,
387
+ 1.451041579246521,
388
+ 1.0653609037399292,
389
+ 0.006089210510253906,
390
+ 0.5281317234039307
391
+ ],
392
+ [
393
+ 0.6502674221992493,
394
+ 0.6601248383522034,
395
+ 1.4983268976211548,
396
+ 1.1104395389556885,
397
+ 0.006052851676940918,
398
+ 0.5478552579879761
399
+ ],
400
+ [
401
+ 0.6834638714790344,
402
+ 0.6824098229408264,
403
+ 1.5142232179641724,
404
+ 1.1536270380020142,
405
+ 0.006022810935974121,
406
+ 0.565622091293335
407
+ ]
408
+ ],
409
+ "mean": [
410
+ [
411
+ 0.002399730496108532,
412
+ -0.03371857479214668,
413
+ -0.026506593450903893,
414
+ -0.007294314913451672,
415
+ -3.3637643355177715e-05,
416
+ -0.002175837755203247
417
+ ],
418
+ [
419
+ 0.0029731958638876677,
420
+ -0.03329775482416153,
421
+ -0.026526525616645813,
422
+ -0.007697952911257744,
423
+ -3.4519027394708246e-05,
424
+ -0.0027493059169501066
425
+ ],
426
+ [
427
+ 0.003604522440582514,
428
+ -0.032867252826690674,
429
+ -0.02654336765408516,
430
+ -0.008099138736724854,
431
+ -3.462656241026707e-05,
432
+ -0.0033809158485382795
433
+ ],
434
+ [
435
+ 0.004330680705606937,
436
+ -0.03244740143418312,
437
+ -0.026560107246041298,
438
+ -0.008501662872731686,
439
+ -3.4149335988331586e-05,
440
+ -0.004107005428522825
441
+ ],
442
+ [
443
+ 0.005132367368787527,
444
+ -0.032020263373851776,
445
+ -0.026579467579722404,
446
+ -0.00890059769153595,
447
+ -3.363030918990262e-05,
448
+ -0.004908420145511627
449
+ ],
450
+ [
451
+ 0.006013290956616402,
452
+ -0.03158460557460785,
453
+ -0.026602549478411674,
454
+ -0.00930008850991726,
455
+ -3.3384036214556545e-05,
456
+ -0.005788702052086592
457
+ ],
458
+ [
459
+ 0.0069674355909228325,
460
+ -0.031136885285377502,
461
+ -0.026633556932210922,
462
+ -0.009698453359305859,
463
+ -3.306723738205619e-05,
464
+ -0.006742133293300867
465
+ ],
466
+ [
467
+ 0.007998677901923656,
468
+ -0.030675340443849564,
469
+ -0.026676973327994347,
470
+ -0.010097721591591835,
471
+ -3.293266854598187e-05,
472
+ -0.007772281300276518
473
+ ],
474
+ [
475
+ 0.009103219956159592,
476
+ -0.030197689309716225,
477
+ -0.026734555140137672,
478
+ -0.010497260838747025,
479
+ -3.274149639764801e-05,
480
+ -0.008875810541212559
481
+ ],
482
+ [
483
+ 0.01028699241578579,
484
+ -0.029703862965106964,
485
+ -0.026812396943569183,
486
+ -0.010893884114921093,
487
+ -3.268092768848874e-05,
488
+ -0.010058477520942688
489
+ ],
490
+ [
491
+ 0.011553517542779446,
492
+ -0.029192553833127022,
493
+ -0.026906808838248253,
494
+ -0.011289995163679123,
495
+ -3.269802255090326e-05,
496
+ -0.01132387388497591
497
+ ],
498
+ [
499
+ 0.012908070348203182,
500
+ -0.028664078563451767,
501
+ -0.02701812982559204,
502
+ -0.011685356497764587,
503
+ -3.28218775393907e-05,
504
+ -0.012677285820245743
505
+ ],
506
+ [
507
+ 0.014355717226862907,
508
+ -0.028118710964918137,
509
+ -0.027147676795721054,
510
+ -0.012079907581210136,
511
+ -3.296746945125051e-05,
512
+ -0.014123816974461079
513
+ ],
514
+ [
515
+ 0.015898622572422028,
516
+ -0.027556538581848145,
517
+ -0.02729668840765953,
518
+ -0.012473052367568016,
519
+ -3.313259003334679e-05,
520
+ -0.015665428712964058
521
+ ],
522
+ [
523
+ 0.01753367856144905,
524
+ -0.026974856853485107,
525
+ -0.027466658502817154,
526
+ -0.012863936834037304,
527
+ -3.3350897865602747e-05,
528
+ -0.01729944720864296
529
+ ],
530
+ [
531
+ 0.019253134727478027,
532
+ -0.026369046419858932,
533
+ -0.02766418643295765,
534
+ -0.013252663426101208,
535
+ -3.3440224797232077e-05,
536
+ -0.019018059596419334
537
+ ]
538
+ ],
539
+ "std": [
540
+ [
541
+ 0.04323775693774223,
542
+ 0.045802634209394455,
543
+ 0.10585169494152069,
544
+ 0.08371099829673767,
545
+ 0.000734939647372812,
546
+ 0.04311731085181236
547
+ ],
548
+ [
549
+ 0.052831608802080154,
550
+ 0.0550084225833416,
551
+ 0.12866128981113434,
552
+ 0.10224901884794235,
553
+ 0.0007391870021820068,
554
+ 0.052699752151966095
555
+ ],
556
+ [
557
+ 0.06230269744992256,
558
+ 0.06383407860994339,
559
+ 0.15080901980400085,
560
+ 0.12041323632001877,
561
+ 0.0007443022332154214,
562
+ 0.0621633417904377
563
+ ],
564
+ [
565
+ 0.07166402041912079,
566
+ 0.07222028821706772,
567
+ 0.17223787307739258,
568
+ 0.13817144930362701,
569
+ 0.0007505182875320315,
570
+ 0.07151757925748825
571
+ ],
572
+ [
573
+ 0.08089207857847214,
574
+ 0.08016153424978256,
575
+ 0.19294390082359314,
576
+ 0.1555166095495224,
577
+ 0.000756296853069216,
578
+ 0.08074097335338593
579
+ ],
580
+ [
581
+ 0.0899948924779892,
582
+ 0.08766801655292511,
583
+ 0.2129502147436142,
584
+ 0.17245666682720184,
585
+ 0.0007633369532413781,
586
+ 0.0898369774222374
587
+ ],
588
+ [
589
+ 0.09896065294742584,
590
+ 0.09475349634885788,
591
+ 0.2322818636894226,
592
+ 0.1889989674091339,
593
+ 0.0007708776392973959,
594
+ 0.09880099445581436
595
+ ],
596
+ [
597
+ 0.10780492424964905,
598
+ 0.10143771767616272,
599
+ 0.25096794962882996,
600
+ 0.20515595376491547,
601
+ 0.0007795444107614458,
602
+ 0.10764006525278091
603
+ ],
604
+ [
605
+ 0.11651723086833954,
606
+ 0.10774324834346771,
607
+ 0.26903823018074036,
608
+ 0.22093604505062103,
609
+ 0.0007895926828496158,
610
+ 0.11634589731693268
611
+ ],
612
+ [
613
+ 0.12510086596012115,
614
+ 0.11369043588638306,
615
+ 0.28652051091194153,
616
+ 0.23635028302669525,
617
+ 0.0008002828690223396,
618
+ 0.124925397336483
619
+ ],
620
+ [
621
+ 0.1335495114326477,
622
+ 0.11929997056722641,
623
+ 0.3034432828426361,
624
+ 0.2514086365699768,
625
+ 0.0008107878966256976,
626
+ 0.1333676427602768
627
+ ],
628
+ [
629
+ 0.1418585479259491,
630
+ 0.124591164290905,
631
+ 0.31983453035354614,
632
+ 0.2661244869232178,
633
+ 0.0008217667927965522,
634
+ 0.14167335629463196
635
+ ],
636
+ [
637
+ 0.1500254124403,
638
+ 0.1295834332704544,
639
+ 0.3357211947441101,
640
+ 0.28050777316093445,
641
+ 0.0008334207232110202,
642
+ 0.14983689785003662
643
+ ],
644
+ [
645
+ 0.15803955495357513,
646
+ 0.1342964768409729,
647
+ 0.351129412651062,
648
+ 0.294569730758667,
649
+ 0.0008444534032605588,
650
+ 0.15784819424152374
651
+ ],
652
+ [
653
+ 0.16589556634426117,
654
+ 0.138750359416008,
655
+ 0.3660843074321747,
656
+ 0.3083218038082123,
657
+ 0.0008554744417779148,
658
+ 0.1657029092311859
659
+ ],
660
+ [
661
+ 0.17359334230422974,
662
+ 0.14296913146972656,
663
+ 0.38061195611953735,
664
+ 0.3217768371105194,
665
+ 0.000866534246597439,
666
+ 0.1733987182378769
667
+ ]
668
+ ],
669
+ "q01": [
670
+ [
671
+ -0.12213177978992462,
672
+ -0.14521412551403046,
673
+ -0.36651915311813354,
674
+ -0.22651121020317078,
675
+ -0.002628536429256201,
676
+ -0.13755188882350922
677
+ ],
678
+ [
679
+ -0.14906743168830872,
680
+ -0.1672179400920868,
681
+ -0.43642017245292664,
682
+ -0.2747143805027008,
683
+ -0.002645096741616726,
684
+ -0.1674933135509491
685
+ ],
686
+ [
687
+ -0.17482531070709229,
688
+ -0.18630193173885345,
689
+ -0.519730806350708,
690
+ -0.32141369581222534,
691
+ -0.0026340961921960115,
692
+ -0.19536428153514862
693
+ ],
694
+ [
695
+ -0.19858603179454803,
696
+ -0.2066028118133545,
697
+ -0.585573136806488,
698
+ -0.36707189679145813,
699
+ -0.002717776456847787,
700
+ -0.2237655073404312
701
+ ],
702
+ [
703
+ -0.22130325436592102,
704
+ -0.22337931394577026,
705
+ -0.6607177257537842,
706
+ -0.40824657678604126,
707
+ -0.0029330539982765913,
708
+ -0.25334563851356506
709
+ ],
710
+ [
711
+ -0.24440711736679077,
712
+ -0.238887757062912,
713
+ -0.7216896414756775,
714
+ -0.4496803879737854,
715
+ -0.0030421495903283358,
716
+ -0.28178611397743225
717
+ ],
718
+ [
719
+ -0.26698970794677734,
720
+ -0.25492310523986816,
721
+ -0.7907676100730896,
722
+ -0.4887317419052124,
723
+ -0.003101882990449667,
724
+ -0.3099566102027893
725
+ ],
726
+ [
727
+ -0.286782830953598,
728
+ -0.27151039242744446,
729
+ -0.8517748713493347,
730
+ -0.5257248282432556,
731
+ -0.003171453485265374,
732
+ -0.3390139937400818
733
+ ],
734
+ [
735
+ -0.30621322989463806,
736
+ -0.2862298786640167,
737
+ -0.9015073776245117,
738
+ -0.5636691451072693,
739
+ -0.0032641314901411533,
740
+ -0.36655768752098083
741
+ ],
742
+ [
743
+ -0.3255496025085449,
744
+ -0.29756152629852295,
745
+ -0.9560237526893616,
746
+ -0.5999890565872192,
747
+ -0.0032778121531009674,
748
+ -0.3943326771259308
749
+ ],
750
+ [
751
+ -0.34466391801834106,
752
+ -0.30887919664382935,
753
+ -1.0073438882827759,
754
+ -0.632552444934845,
755
+ -0.0033038281835615635,
756
+ -0.4224179685115814
757
+ ],
758
+ [
759
+ -0.35855481028556824,
760
+ -0.3250240683555603,
761
+ -1.0543361902236938,
762
+ -0.6657060980796814,
763
+ -0.0033189060632139444,
764
+ -0.448632150888443
765
+ ],
766
+ [
767
+ -0.3737456798553467,
768
+ -0.3364461362361908,
769
+ -1.0995036363601685,
770
+ -0.6994519829750061,
771
+ -0.0033822304103523493,
772
+ -0.47539883852005005
773
+ ],
774
+ [
775
+ -0.3870712220668793,
776
+ -0.3443698287010193,
777
+ -1.1389037370681763,
778
+ -0.7261598706245422,
779
+ -0.003482704982161522,
780
+ -0.5010547041893005
781
+ ],
782
+ [
783
+ -0.3985598683357239,
784
+ -0.35595327615737915,
785
+ -1.1819812059402466,
786
+ -0.7497241497039795,
787
+ -0.0035526324063539505,
788
+ -0.5260051488876343
789
+ ],
790
+ [
791
+ -0.4100184440612793,
792
+ -0.36467358469963074,
793
+ -1.230539083480835,
794
+ -0.7697025537490845,
795
+ -0.003628845326602459,
796
+ -0.5501382946968079
797
+ ]
798
+ ],
799
+ "q99": [
800
+ [
801
+ 0.13778626918792725,
802
+ 0.11720699071884155,
803
+ 0.2617994546890259,
804
+ 0.23129749298095703,
805
+ 0.0021540913730859756,
806
+ 0.12180761247873306
807
+ ],
808
+ [
809
+ 0.16777439415454865,
810
+ 0.1505272388458252,
811
+ 0.3302338719367981,
812
+ 0.2836305797100067,
813
+ 0.002166236750781536,
814
+ 0.14862465858459473
815
+ ],
816
+ [
817
+ 0.19595178961753845,
818
+ 0.18208669126033783,
819
+ 0.3971126675605774,
820
+ 0.336750864982605,
821
+ 0.0021774321794509888,
822
+ 0.1744869202375412
823
+ ],
824
+ [
825
+ 0.22429130971431732,
826
+ 0.21202439069747925,
827
+ 0.45463618636131287,
828
+ 0.38751187920570374,
829
+ 0.002235555090010166,
830
+ 0.19793902337551117
831
+ ],
832
+ [
833
+ 0.2538144588470459,
834
+ 0.23781366646289825,
835
+ 0.5186766982078552,
836
+ 0.43724244832992554,
837
+ 0.0022584283724427223,
838
+ 0.22057458758354187
839
+ ],
840
+ [
841
+ 0.28190404176712036,
842
+ 0.2608570158481598,
843
+ 0.5791972875595093,
844
+ 0.48876842856407166,
845
+ 0.002288524992763996,
846
+ 0.24382244050502777
847
+ ],
848
+ [
849
+ 0.3102819323539734,
850
+ 0.2809824049472809,
851
+ 0.6328328251838684,
852
+ 0.5347740054130554,
853
+ 0.002312292344868183,
854
+ 0.2663334310054779
855
+ ],
856
+ [
857
+ 0.3394824266433716,
858
+ 0.29752638936042786,
859
+ 0.6895572543144226,
860
+ 0.5827977061271667,
861
+ 0.002330307848751545,
862
+ 0.2859741449356079
863
+ ],
864
+ [
865
+ 0.3669600784778595,
866
+ 0.31471166014671326,
867
+ 0.7397019267082214,
868
+ 0.6297330260276794,
869
+ 0.002337755635380745,
870
+ 0.30544596910476685
871
+ ],
872
+ [
873
+ 0.3945035934448242,
874
+ 0.33071205019950867,
875
+ 0.7886773347854614,
876
+ 0.6768563985824585,
877
+ 0.0023598140105605125,
878
+ 0.32461366057395935
879
+ ],
880
+ [
881
+ 0.4227299392223358,
882
+ 0.3485700190067291,
883
+ 0.8316053152084351,
884
+ 0.723706841468811,
885
+ 0.002375778742134571,
886
+ 0.3432371914386749
887
+ ],
888
+ [
889
+ 0.44936659932136536,
890
+ 0.35997745394706726,
891
+ 0.8786941170692444,
892
+ 0.7676846981048584,
893
+ 0.0023923860862851143,
894
+ 0.3572857081890106
895
+ ],
896
+ [
897
+ 0.47607606649398804,
898
+ 0.3778820335865021,
899
+ 0.9260716438293457,
900
+ 0.8119612336158752,
901
+ 0.0024137627333402634,
902
+ 0.37240657210350037
903
+ ],
904
+ [
905
+ 0.501969575881958,
906
+ 0.39211174845695496,
907
+ 0.9603159427642822,
908
+ 0.8552690148353577,
909
+ 0.0024626096710562706,
910
+ 0.38595545291900635
911
+ ],
912
+ [
913
+ 0.5269771218299866,
914
+ 0.4024680256843567,
915
+ 1.0048072338104248,
916
+ 0.899775505065918,
917
+ 0.00252683088183403,
918
+ 0.3976656496524811
919
+ ],
920
+ [
921
+ 0.550702691078186,
922
+ 0.4190630316734314,
923
+ 1.0371341705322266,
924
+ 0.9431969523429871,
925
+ 0.0025539007037878036,
926
+ 0.4088396430015564
927
+ ]
928
+ ]
929
+ }
930
+ }
931
+ }
932
+ }
experiment_cfg/final_model_config.json ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "Gr00tN1d6",
3
+ "model_dtype": "bfloat16",
4
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
5
+ "backbone_model_type": "eagle",
6
+ "model_revision": null,
7
+ "tune_top_llm_layers": 4,
8
+ "backbone_embedding_dim": 2048,
9
+ "tune_llm": false,
10
+ "tune_visual": false,
11
+ "select_layer": 16,
12
+ "reproject_vision": false,
13
+ "use_flash_attention": true,
14
+ "load_bf16": true,
15
+ "collator_overwrite_image_inputs": false,
16
+ "eagle_collator": true,
17
+ "backbone_trainable_params_fp32": true,
18
+ "apply_sincos_state_encoding": true,
19
+ "use_relative_action": true,
20
+ "max_state_dim": 128,
21
+ "max_action_dim": 128,
22
+ "action_horizon": 50,
23
+ "hidden_size": 1024,
24
+ "input_embedding_dim": 1536,
25
+ "add_pos_embed": true,
26
+ "attn_dropout": 0.2,
27
+ "use_vlln": true,
28
+ "max_seq_len": 1024,
29
+ "use_alternate_vl_dit": true,
30
+ "attend_text_every_n_blocks": 2,
31
+ "diffusion_model_cfg": {
32
+ "attention_head_dim": 48,
33
+ "dropout": 0.2,
34
+ "final_dropout": true,
35
+ "interleave_self_attention": true,
36
+ "norm_type": "ada_norm",
37
+ "num_attention_heads": 32,
38
+ "num_layers": 32,
39
+ "output_dim": 1024,
40
+ "positional_embeddings": null
41
+ },
42
+ "num_inference_timesteps": 4,
43
+ "noise_beta_alpha": 1.5,
44
+ "noise_beta_beta": 1.0,
45
+ "noise_s": 0.999,
46
+ "num_timestep_buckets": 1000,
47
+ "tune_projector": true,
48
+ "tune_diffusion_model": true,
49
+ "tune_vlln": true,
50
+ "state_dropout_prob": 0.15,
51
+ "state_additive_noise_scale": 0.0,
52
+ "max_num_embodiments": 32
53
+ }
experiment_cfg/final_processor_config.json ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9000dbca703190deb360e6d99cbe4cd41fc341cc5c70a2beacc8b160249fbc24
3
+ size 4990126416
model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:304adbff51430cfce2f8796d3ffb6a8b80d0a4dc62df1620386e701e77bdbc3f
3
+ size 4823190320
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
processor/embodiment_id.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "robocasa_panda_omron": 13,
3
+ "gr1": 20,
4
+ "behavior_r1_pro": 24,
5
+ "unitree_g1": 8,
6
+ "oxe_google": 0,
7
+ "oxe_widowx": 1,
8
+ "libero_panda": 2,
9
+ "oxe_droid": 16,
10
+ "new_embodiment": 10
11
+ }
processor/processor_config.json ADDED
@@ -0,0 +1,455 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "processor_class": "Gr00tN1d6Processor",
3
+ "processor_kwargs": {
4
+ "modality_configs": {
5
+ "behavior_r1_pro": {
6
+ "video": {
7
+ "delta_indices": [
8
+ 0
9
+ ],
10
+ "modality_keys": [
11
+ "observation.images.rgb.head_256_256",
12
+ "observation.images.rgb.left_wrist_256_256",
13
+ "observation.images.rgb.right_wrist_256_256"
14
+ ],
15
+ "sin_cos_embedding_keys": null,
16
+ "mean_std_embedding_keys": null,
17
+ "action_configs": null
18
+ },
19
+ "state": {
20
+ "delta_indices": [
21
+ 0
22
+ ],
23
+ "modality_keys": [
24
+ "robot_pos",
25
+ "robot_ori_cos",
26
+ "robot_ori_sin",
27
+ "robot_2d_ori",
28
+ "robot_2d_ori_cos",
29
+ "robot_2d_ori_sin",
30
+ "robot_lin_vel",
31
+ "robot_ang_vel",
32
+ "arm_left_qpos",
33
+ "arm_left_qpos_sin",
34
+ "arm_left_qpos_cos",
35
+ "eef_left_pos",
36
+ "eef_left_quat",
37
+ "gripper_left_qpos",
38
+ "arm_right_qpos",
39
+ "arm_right_qpos_sin",
40
+ "arm_right_qpos_cos",
41
+ "eef_right_pos",
42
+ "eef_right_quat",
43
+ "gripper_right_qpos",
44
+ "trunk_qpos"
45
+ ],
46
+ "sin_cos_embedding_keys": null,
47
+ "mean_std_embedding_keys": null,
48
+ "action_configs": null
49
+ },
50
+ "action": {
51
+ "delta_indices": [
52
+ 0,
53
+ 1,
54
+ 2,
55
+ 3,
56
+ 4,
57
+ 5,
58
+ 6,
59
+ 7,
60
+ 8,
61
+ 9,
62
+ 10,
63
+ 11,
64
+ 12,
65
+ 13,
66
+ 14,
67
+ 15,
68
+ 16,
69
+ 17,
70
+ 18,
71
+ 19,
72
+ 20,
73
+ 21,
74
+ 22,
75
+ 23,
76
+ 24,
77
+ 25,
78
+ 26,
79
+ 27,
80
+ 28,
81
+ 29,
82
+ 30,
83
+ 31
84
+ ],
85
+ "modality_keys": [
86
+ "base",
87
+ "torso",
88
+ "left_arm",
89
+ "left_gripper",
90
+ "right_arm",
91
+ "right_gripper"
92
+ ],
93
+ "sin_cos_embedding_keys": null,
94
+ "mean_std_embedding_keys": null,
95
+ "action_configs": [
96
+ {
97
+ "rep": "ABSOLUTE",
98
+ "type": "NON_EEF",
99
+ "format": "DEFAULT",
100
+ "state_key": null
101
+ },
102
+ {
103
+ "rep": "RELATIVE",
104
+ "type": "NON_EEF",
105
+ "format": "DEFAULT",
106
+ "state_key": "trunk_qpos"
107
+ },
108
+ {
109
+ "rep": "RELATIVE",
110
+ "type": "NON_EEF",
111
+ "format": "DEFAULT",
112
+ "state_key": "arm_left_qpos"
113
+ },
114
+ {
115
+ "rep": "ABSOLUTE",
116
+ "type": "NON_EEF",
117
+ "format": "DEFAULT",
118
+ "state_key": null
119
+ },
120
+ {
121
+ "rep": "RELATIVE",
122
+ "type": "NON_EEF",
123
+ "format": "DEFAULT",
124
+ "state_key": "arm_right_qpos"
125
+ },
126
+ {
127
+ "rep": "ABSOLUTE",
128
+ "type": "NON_EEF",
129
+ "format": "DEFAULT",
130
+ "state_key": null
131
+ }
132
+ ]
133
+ },
134
+ "language": {
135
+ "delta_indices": [
136
+ 0
137
+ ],
138
+ "modality_keys": [
139
+ "annotation.human.coarse_action"
140
+ ],
141
+ "sin_cos_embedding_keys": null,
142
+ "mean_std_embedding_keys": null,
143
+ "action_configs": null
144
+ }
145
+ },
146
+ "gr1": {
147
+ "video": {
148
+ "delta_indices": [
149
+ 0
150
+ ],
151
+ "modality_keys": [
152
+ "ego_view_bg_crop_pad_res256_freq20"
153
+ ],
154
+ "sin_cos_embedding_keys": null,
155
+ "mean_std_embedding_keys": null,
156
+ "action_configs": null
157
+ },
158
+ "state": {
159
+ "delta_indices": [
160
+ 0
161
+ ],
162
+ "modality_keys": [
163
+ "left_arm",
164
+ "right_arm",
165
+ "left_hand",
166
+ "right_hand",
167
+ "waist"
168
+ ],
169
+ "sin_cos_embedding_keys": [
170
+ "left_arm",
171
+ "right_arm",
172
+ "left_hand",
173
+ "right_hand",
174
+ "waist"
175
+ ],
176
+ "mean_std_embedding_keys": null,
177
+ "action_configs": null
178
+ },
179
+ "action": {
180
+ "delta_indices": [
181
+ 0,
182
+ 1,
183
+ 2,
184
+ 3,
185
+ 4,
186
+ 5,
187
+ 6,
188
+ 7,
189
+ 8,
190
+ 9,
191
+ 10,
192
+ 11,
193
+ 12,
194
+ 13,
195
+ 14,
196
+ 15
197
+ ],
198
+ "modality_keys": [
199
+ "left_arm",
200
+ "right_arm",
201
+ "left_hand",
202
+ "right_hand",
203
+ "waist"
204
+ ],
205
+ "sin_cos_embedding_keys": null,
206
+ "mean_std_embedding_keys": null,
207
+ "action_configs": [
208
+ {
209
+ "rep": "RELATIVE",
210
+ "type": "NON_EEF",
211
+ "format": "DEFAULT",
212
+ "state_key": null
213
+ },
214
+ {
215
+ "rep": "RELATIVE",
216
+ "type": "NON_EEF",
217
+ "format": "DEFAULT",
218
+ "state_key": null
219
+ },
220
+ {
221
+ "rep": "RELATIVE",
222
+ "type": "NON_EEF",
223
+ "format": "DEFAULT",
224
+ "state_key": null
225
+ },
226
+ {
227
+ "rep": "RELATIVE",
228
+ "type": "NON_EEF",
229
+ "format": "DEFAULT",
230
+ "state_key": null
231
+ },
232
+ {
233
+ "rep": "ABSOLUTE",
234
+ "type": "NON_EEF",
235
+ "format": "DEFAULT",
236
+ "state_key": null
237
+ }
238
+ ]
239
+ },
240
+ "language": {
241
+ "delta_indices": [
242
+ 0
243
+ ],
244
+ "modality_keys": [
245
+ "task"
246
+ ],
247
+ "sin_cos_embedding_keys": null,
248
+ "mean_std_embedding_keys": null,
249
+ "action_configs": null
250
+ }
251
+ },
252
+ "robocasa_panda_omron": {
253
+ "video": {
254
+ "delta_indices": [
255
+ 0
256
+ ],
257
+ "modality_keys": [
258
+ "res256_image_side_0",
259
+ "res256_image_side_1",
260
+ "res256_image_wrist_0"
261
+ ],
262
+ "sin_cos_embedding_keys": null,
263
+ "mean_std_embedding_keys": null,
264
+ "action_configs": null
265
+ },
266
+ "state": {
267
+ "delta_indices": [
268
+ 0
269
+ ],
270
+ "modality_keys": [
271
+ "end_effector_position_relative",
272
+ "end_effector_rotation_relative",
273
+ "gripper_qpos",
274
+ "base_position",
275
+ "base_rotation"
276
+ ],
277
+ "sin_cos_embedding_keys": null,
278
+ "mean_std_embedding_keys": null,
279
+ "action_configs": null
280
+ },
281
+ "action": {
282
+ "delta_indices": [
283
+ 0,
284
+ 1,
285
+ 2,
286
+ 3,
287
+ 4,
288
+ 5,
289
+ 6,
290
+ 7,
291
+ 8,
292
+ 9,
293
+ 10,
294
+ 11,
295
+ 12,
296
+ 13,
297
+ 14,
298
+ 15
299
+ ],
300
+ "modality_keys": [
301
+ "end_effector_position",
302
+ "end_effector_rotation",
303
+ "gripper_close",
304
+ "base_motion",
305
+ "control_mode"
306
+ ],
307
+ "sin_cos_embedding_keys": null,
308
+ "mean_std_embedding_keys": null,
309
+ "action_configs": [
310
+ {
311
+ "rep": "ABSOLUTE",
312
+ "type": "NON_EEF",
313
+ "format": "DEFAULT",
314
+ "state_key": null
315
+ },
316
+ {
317
+ "rep": "ABSOLUTE",
318
+ "type": "NON_EEF",
319
+ "format": "DEFAULT",
320
+ "state_key": null
321
+ },
322
+ {
323
+ "rep": "ABSOLUTE",
324
+ "type": "NON_EEF",
325
+ "format": "DEFAULT",
326
+ "state_key": null
327
+ },
328
+ {
329
+ "rep": "ABSOLUTE",
330
+ "type": "NON_EEF",
331
+ "format": "DEFAULT",
332
+ "state_key": null
333
+ },
334
+ {
335
+ "rep": "ABSOLUTE",
336
+ "type": "NON_EEF",
337
+ "format": "DEFAULT",
338
+ "state_key": null
339
+ }
340
+ ]
341
+ },
342
+ "language": {
343
+ "delta_indices": [
344
+ 0
345
+ ],
346
+ "modality_keys": [
347
+ "annotation.human.action.task_description"
348
+ ],
349
+ "sin_cos_embedding_keys": null,
350
+ "mean_std_embedding_keys": null,
351
+ "action_configs": null
352
+ }
353
+ },
354
+ "new_embodiment": {
355
+ "video": {
356
+ "delta_indices": [
357
+ 0
358
+ ],
359
+ "modality_keys": [
360
+ "front",
361
+ "wrist"
362
+ ],
363
+ "sin_cos_embedding_keys": null,
364
+ "mean_std_embedding_keys": null,
365
+ "action_configs": null
366
+ },
367
+ "state": {
368
+ "delta_indices": [
369
+ 0
370
+ ],
371
+ "modality_keys": [
372
+ "single_arm",
373
+ "gripper"
374
+ ],
375
+ "sin_cos_embedding_keys": null,
376
+ "mean_std_embedding_keys": null,
377
+ "action_configs": null
378
+ },
379
+ "action": {
380
+ "delta_indices": [
381
+ 0,
382
+ 1,
383
+ 2,
384
+ 3,
385
+ 4,
386
+ 5,
387
+ 6,
388
+ 7,
389
+ 8,
390
+ 9,
391
+ 10,
392
+ 11,
393
+ 12,
394
+ 13,
395
+ 14,
396
+ 15
397
+ ],
398
+ "modality_keys": [
399
+ "single_arm",
400
+ "gripper"
401
+ ],
402
+ "sin_cos_embedding_keys": null,
403
+ "mean_std_embedding_keys": null,
404
+ "action_configs": [
405
+ {
406
+ "rep": "RELATIVE",
407
+ "type": "NON_EEF",
408
+ "format": "DEFAULT",
409
+ "state_key": null
410
+ },
411
+ {
412
+ "rep": "ABSOLUTE",
413
+ "type": "NON_EEF",
414
+ "format": "DEFAULT",
415
+ "state_key": null
416
+ }
417
+ ]
418
+ },
419
+ "language": {
420
+ "delta_indices": [
421
+ 0
422
+ ],
423
+ "modality_keys": [
424
+ "annotation.human.task_description"
425
+ ],
426
+ "sin_cos_embedding_keys": null,
427
+ "mean_std_embedding_keys": null,
428
+ "action_configs": null
429
+ }
430
+ }
431
+ },
432
+ "image_crop_size": null,
433
+ "image_target_size": null,
434
+ "use_albumentations": true,
435
+ "random_rotation_angle": null,
436
+ "color_jitter_params": {
437
+ "brightness": 0.3,
438
+ "contrast": 0.4,
439
+ "saturation": 0.5,
440
+ "hue": 0.08
441
+ },
442
+ "shortest_image_edge": 256,
443
+ "crop_fraction": 0.95,
444
+ "model_name": "nvidia/Eagle-Block2A-2B-v2",
445
+ "model_type": "eagle",
446
+ "formalize_language": true,
447
+ "max_state_dim": 128,
448
+ "max_action_dim": 128,
449
+ "max_action_horizon": 50,
450
+ "use_percentiles": false,
451
+ "clip_outliers": true,
452
+ "apply_sincos_state_encoding": true,
453
+ "use_relative_action": true
454
+ }
455
+ }
processor/statistics.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:273910977029e314f0cf45f0c23e1eddadbc4e624fca833ddf2b3468e7f50876
3
+ size 5713
wandb_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"project": "finetune-gr00t-n1d6", "run_id": "omy_1"}