bot commited on
Commit
132e80f
·
1 Parent(s): 25b38a9

Import Path, gitignore checkpoints

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoints/
checkpoints/step_000500/pretrained_model/config.json DELETED
@@ -1,95 +0,0 @@
1
- {
2
- "type": "pi05",
3
- "n_obs_steps": 1,
4
- "input_features": {
5
- "observation.images.base_0_rgb": {
6
- "type": "VISUAL",
7
- "shape": [
8
- 3,
9
- 224,
10
- 224
11
- ]
12
- },
13
- "observation.images.left_wrist_0_rgb": {
14
- "type": "VISUAL",
15
- "shape": [
16
- 3,
17
- 224,
18
- 224
19
- ]
20
- },
21
- "observation.images.right_wrist_0_rgb": {
22
- "type": "VISUAL",
23
- "shape": [
24
- 3,
25
- 224,
26
- 224
27
- ]
28
- },
29
- "observation.state": {
30
- "type": "STATE",
31
- "shape": [
32
- 32
33
- ]
34
- }
35
- },
36
- "output_features": {
37
- "action": {
38
- "type": "ACTION",
39
- "shape": [
40
- 6
41
- ]
42
- }
43
- },
44
- "device": "cuda",
45
- "use_amp": false,
46
- "use_peft": false,
47
- "push_to_hub": true,
48
- "repo_id": "StrongRoboticsLab/pi05-so100-diverse",
49
- "private": null,
50
- "tags": null,
51
- "license": null,
52
- "pretrained_path": "lerobot/pi05_base",
53
- "paligemma_variant": "gemma_2b",
54
- "action_expert_variant": "gemma_300m",
55
- "dtype": "bfloat16",
56
- "chunk_size": 50,
57
- "n_action_steps": 50,
58
- "max_state_dim": 32,
59
- "max_action_dim": 32,
60
- "num_inference_steps": 10,
61
- "time_sampling_beta_alpha": 1.5,
62
- "time_sampling_beta_beta": 1.0,
63
- "time_sampling_scale": 0.999,
64
- "time_sampling_offset": 0.001,
65
- "min_period": 0.004,
66
- "max_period": 4.0,
67
- "rtc_config": null,
68
- "image_resolution": [
69
- 224,
70
- 224
71
- ],
72
- "empty_cameras": 0,
73
- "tokenizer_max_length": 200,
74
- "normalization_mapping": {
75
- "VISUAL": "IDENTITY",
76
- "STATE": "MEAN_STD",
77
- "ACTION": "MEAN_STD"
78
- },
79
- "gradient_checkpointing": false,
80
- "compile_model": false,
81
- "compile_mode": "max-autotune",
82
- "freeze_vision_encoder": false,
83
- "train_expert_only": true,
84
- "optimizer_lr": 2.5e-05,
85
- "optimizer_betas": [
86
- 0.9,
87
- 0.95
88
- ],
89
- "optimizer_eps": 1e-08,
90
- "optimizer_weight_decay": 0.01,
91
- "optimizer_grad_clip_norm": 1.0,
92
- "scheduler_warmup_steps": 1000,
93
- "scheduler_decay_steps": 340000,
94
- "scheduler_decay_lr": 2.5e-06
95
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoints/step_000500/pretrained_model/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:622f382ec13790812f787a51b9bf6374e358ba36caa30e88968d7706fe3c6e70
3
- size 9354050752
 
 
 
 
checkpoints/step_000500/pretrained_model/policy_postprocessor.json DELETED
@@ -1,32 +0,0 @@
1
- {
2
- "name": "policy_postprocessor",
3
- "steps": [
4
- {
5
- "registry_name": "unnormalizer_processor",
6
- "config": {
7
- "eps": 1e-08,
8
- "features": {
9
- "action": {
10
- "type": "ACTION",
11
- "shape": [
12
- 6
13
- ]
14
- }
15
- },
16
- "norm_map": {
17
- "VISUAL": "IDENTITY",
18
- "STATE": "MEAN_STD",
19
- "ACTION": "MEAN_STD"
20
- }
21
- },
22
- "state_file": "policy_postprocessor_step_0_unnormalizer_processor.safetensors"
23
- },
24
- {
25
- "registry_name": "device_processor",
26
- "config": {
27
- "device": "cpu",
28
- "float_dtype": null
29
- }
30
- }
31
- ]
32
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoints/step_000500/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6a631ee0d784519e7052f654e71248331b32f26ba470b8d15f29553e15d8a0f
3
- size 768
 
 
 
 
checkpoints/step_000500/pretrained_model/policy_preprocessor.json DELETED
@@ -1,90 +0,0 @@
1
- {
2
- "name": "policy_preprocessor",
3
- "steps": [
4
- {
5
- "registry_name": "rename_observations_processor",
6
- "config": {
7
- "rename_map": {
8
- "observation.images.image": "observation.images.base_0_rgb",
9
- "observation.images.image2": "observation.images.left_wrist_0_rgb"
10
- }
11
- }
12
- },
13
- {
14
- "registry_name": "to_batch_processor",
15
- "config": {}
16
- },
17
- {
18
- "registry_name": "normalizer_processor",
19
- "config": {
20
- "eps": 1e-08,
21
- "features": {
22
- "observation.images.base_0_rgb": {
23
- "type": "VISUAL",
24
- "shape": [
25
- 3,
26
- 224,
27
- 224
28
- ]
29
- },
30
- "observation.images.left_wrist_0_rgb": {
31
- "type": "VISUAL",
32
- "shape": [
33
- 3,
34
- 224,
35
- 224
36
- ]
37
- },
38
- "observation.images.right_wrist_0_rgb": {
39
- "type": "VISUAL",
40
- "shape": [
41
- 3,
42
- 224,
43
- 224
44
- ]
45
- },
46
- "observation.state": {
47
- "type": "STATE",
48
- "shape": [
49
- 32
50
- ]
51
- },
52
- "action": {
53
- "type": "ACTION",
54
- "shape": [
55
- 6
56
- ]
57
- }
58
- },
59
- "norm_map": {
60
- "VISUAL": "IDENTITY",
61
- "STATE": "MEAN_STD",
62
- "ACTION": "MEAN_STD"
63
- }
64
- },
65
- "state_file": "policy_preprocessor_step_2_normalizer_processor.safetensors"
66
- },
67
- {
68
- "registry_name": "pi05_prepare_state_tokenizer_processor_step",
69
- "config": {}
70
- },
71
- {
72
- "registry_name": "tokenizer_processor",
73
- "config": {
74
- "max_length": 200,
75
- "task_key": "task",
76
- "padding_side": "right",
77
- "padding": "max_length",
78
- "truncation": true,
79
- "tokenizer_name": "google/paligemma-3b-pt-224"
80
- }
81
- },
82
- {
83
- "registry_name": "device_processor",
84
- "config": {
85
- "device": "cuda",
86
- "float_dtype": null
87
- }
88
- }
89
- ]
90
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoints/step_000500/pretrained_model/policy_preprocessor_step_2_normalizer_processor.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6a631ee0d784519e7052f654e71248331b32f26ba470b8d15f29553e15d8a0f
3
- size 768
 
 
 
 
checkpoints/step_000500/pretrained_model/train_config.json DELETED
@@ -1,236 +0,0 @@
1
- {
2
- "dataset": {
3
- "repo_id": "so100:/ephemeral/community_dataset_v3:/workspace/pi05-so100-diverse/filtered_index.json:/workspace/pi05-so100-diverse/norm_stats.json",
4
- "root": null,
5
- "episodes": null,
6
- "image_transforms": {
7
- "enable": false,
8
- "max_num_transforms": 3,
9
- "random_order": false,
10
- "tfs": {
11
- "brightness": {
12
- "weight": 1.0,
13
- "type": "ColorJitter",
14
- "kwargs": {
15
- "brightness": [
16
- 0.8,
17
- 1.2
18
- ]
19
- }
20
- },
21
- "contrast": {
22
- "weight": 1.0,
23
- "type": "ColorJitter",
24
- "kwargs": {
25
- "contrast": [
26
- 0.8,
27
- 1.2
28
- ]
29
- }
30
- },
31
- "saturation": {
32
- "weight": 1.0,
33
- "type": "ColorJitter",
34
- "kwargs": {
35
- "saturation": [
36
- 0.5,
37
- 1.5
38
- ]
39
- }
40
- },
41
- "hue": {
42
- "weight": 1.0,
43
- "type": "ColorJitter",
44
- "kwargs": {
45
- "hue": [
46
- -0.05,
47
- 0.05
48
- ]
49
- }
50
- },
51
- "sharpness": {
52
- "weight": 1.0,
53
- "type": "SharpnessJitter",
54
- "kwargs": {
55
- "sharpness": [
56
- 0.5,
57
- 1.5
58
- ]
59
- }
60
- },
61
- "affine": {
62
- "weight": 1.0,
63
- "type": "RandomAffine",
64
- "kwargs": {
65
- "degrees": [
66
- -5.0,
67
- 5.0
68
- ],
69
- "translate": [
70
- 0.05,
71
- 0.05
72
- ]
73
- }
74
- }
75
- }
76
- },
77
- "revision": null,
78
- "use_imagenet_stats": true,
79
- "video_backend": "torchcodec",
80
- "streaming": false
81
- },
82
- "env": null,
83
- "policy": {
84
- "type": "pi05",
85
- "n_obs_steps": 1,
86
- "input_features": {
87
- "observation.images.base_0_rgb": {
88
- "type": "VISUAL",
89
- "shape": [
90
- 3,
91
- 224,
92
- 224
93
- ]
94
- },
95
- "observation.images.left_wrist_0_rgb": {
96
- "type": "VISUAL",
97
- "shape": [
98
- 3,
99
- 224,
100
- 224
101
- ]
102
- },
103
- "observation.images.right_wrist_0_rgb": {
104
- "type": "VISUAL",
105
- "shape": [
106
- 3,
107
- 224,
108
- 224
109
- ]
110
- },
111
- "observation.state": {
112
- "type": "STATE",
113
- "shape": [
114
- 32
115
- ]
116
- }
117
- },
118
- "output_features": {
119
- "action": {
120
- "type": "ACTION",
121
- "shape": [
122
- 6
123
- ]
124
- }
125
- },
126
- "device": "cuda",
127
- "use_amp": false,
128
- "use_peft": false,
129
- "push_to_hub": true,
130
- "repo_id": "StrongRoboticsLab/pi05-so100-diverse",
131
- "private": null,
132
- "tags": null,
133
- "license": null,
134
- "pretrained_path": "lerobot/pi05_base",
135
- "paligemma_variant": "gemma_2b",
136
- "action_expert_variant": "gemma_300m",
137
- "dtype": "bfloat16",
138
- "chunk_size": 50,
139
- "n_action_steps": 50,
140
- "max_state_dim": 32,
141
- "max_action_dim": 32,
142
- "num_inference_steps": 10,
143
- "time_sampling_beta_alpha": 1.5,
144
- "time_sampling_beta_beta": 1.0,
145
- "time_sampling_scale": 0.999,
146
- "time_sampling_offset": 0.001,
147
- "min_period": 0.004,
148
- "max_period": 4.0,
149
- "rtc_config": null,
150
- "image_resolution": [
151
- 224,
152
- 224
153
- ],
154
- "empty_cameras": 0,
155
- "tokenizer_max_length": 200,
156
- "normalization_mapping": {
157
- "VISUAL": "IDENTITY",
158
- "STATE": "MEAN_STD",
159
- "ACTION": "MEAN_STD"
160
- },
161
- "gradient_checkpointing": false,
162
- "compile_model": false,
163
- "compile_mode": "max-autotune",
164
- "freeze_vision_encoder": false,
165
- "train_expert_only": true,
166
- "optimizer_lr": 2.5e-05,
167
- "optimizer_betas": [
168
- 0.9,
169
- 0.95
170
- ],
171
- "optimizer_eps": 1e-08,
172
- "optimizer_weight_decay": 0.01,
173
- "optimizer_grad_clip_norm": 1.0,
174
- "scheduler_warmup_steps": 1000,
175
- "scheduler_decay_steps": 340000,
176
- "scheduler_decay_lr": 2.5e-06
177
- },
178
- "output_dir": "/ephemeral/production_run",
179
- "job_name": "pi05",
180
- "resume": false,
181
- "seed": 1000,
182
- "cudnn_deterministic": false,
183
- "num_workers": 4,
184
- "batch_size": 16,
185
- "steps": 340000,
186
- "eval_freq": 20000,
187
- "log_freq": 50,
188
- "tolerance_s": 0.0001,
189
- "save_checkpoint": true,
190
- "save_freq": 500,
191
- "use_policy_training_preset": true,
192
- "optimizer": {
193
- "type": "adamw",
194
- "lr": 2.5e-05,
195
- "weight_decay": 0.01,
196
- "grad_clip_norm": 1.0,
197
- "betas": [
198
- 0.9,
199
- 0.95
200
- ],
201
- "eps": 1e-08
202
- },
203
- "scheduler": {
204
- "type": "cosine_decay_with_warmup",
205
- "num_warmup_steps": 1000,
206
- "num_decay_steps": 340000,
207
- "peak_lr": 2.5e-05,
208
- "decay_lr": 2.5e-06
209
- },
210
- "eval": {
211
- "n_episodes": 50,
212
- "batch_size": 50,
213
- "use_async_envs": false
214
- },
215
- "wandb": {
216
- "enable": true,
217
- "disable_artifact": false,
218
- "project": "pi05-so100-diverse",
219
- "entity": null,
220
- "notes": null,
221
- "run_id": "7zuftzeh",
222
- "mode": null,
223
- "add_tags": true
224
- },
225
- "peft": null,
226
- "use_rabc": false,
227
- "rabc_progress_path": null,
228
- "rabc_kappa": 0.01,
229
- "rabc_epsilon": 1e-06,
230
- "rabc_head_mode": "sparse",
231
- "rename_map": {
232
- "observation.images.image": "observation.images.base_0_rgb",
233
- "observation.images.image2": "observation.images.left_wrist_0_rgb"
234
- },
235
- "checkpoint_path": null
236
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoints/step_000500/training_state/optimizer_param_groups.json DELETED
@@ -1,833 +0,0 @@
1
- [
2
- {
3
- "lr": 1.2512487512487514e-05,
4
- "betas": [
5
- 0.9,
6
- 0.95
7
- ],
8
- "eps": 1e-08,
9
- "weight_decay": 0.01,
10
- "amsgrad": false,
11
- "foreach": null,
12
- "maximize": false,
13
- "capturable": false,
14
- "differentiable": false,
15
- "fused": null,
16
- "initial_lr": 2.5e-05,
17
- "params": [
18
- 0,
19
- 1,
20
- 2,
21
- 3,
22
- 4,
23
- 5,
24
- 6,
25
- 7,
26
- 8,
27
- 9,
28
- 10,
29
- 11,
30
- 12,
31
- 13,
32
- 14,
33
- 15,
34
- 16,
35
- 17,
36
- 18,
37
- 19,
38
- 20,
39
- 21,
40
- 22,
41
- 23,
42
- 24,
43
- 25,
44
- 26,
45
- 27,
46
- 28,
47
- 29,
48
- 30,
49
- 31,
50
- 32,
51
- 33,
52
- 34,
53
- 35,
54
- 36,
55
- 37,
56
- 38,
57
- 39,
58
- 40,
59
- 41,
60
- 42,
61
- 43,
62
- 44,
63
- 45,
64
- 46,
65
- 47,
66
- 48,
67
- 49,
68
- 50,
69
- 51,
70
- 52,
71
- 53,
72
- 54,
73
- 55,
74
- 56,
75
- 57,
76
- 58,
77
- 59,
78
- 60,
79
- 61,
80
- 62,
81
- 63,
82
- 64,
83
- 65,
84
- 66,
85
- 67,
86
- 68,
87
- 69,
88
- 70,
89
- 71,
90
- 72,
91
- 73,
92
- 74,
93
- 75,
94
- 76,
95
- 77,
96
- 78,
97
- 79,
98
- 80,
99
- 81,
100
- 82,
101
- 83,
102
- 84,
103
- 85,
104
- 86,
105
- 87,
106
- 88,
107
- 89,
108
- 90,
109
- 91,
110
- 92,
111
- 93,
112
- 94,
113
- 95,
114
- 96,
115
- 97,
116
- 98,
117
- 99,
118
- 100,
119
- 101,
120
- 102,
121
- 103,
122
- 104,
123
- 105,
124
- 106,
125
- 107,
126
- 108,
127
- 109,
128
- 110,
129
- 111,
130
- 112,
131
- 113,
132
- 114,
133
- 115,
134
- 116,
135
- 117,
136
- 118,
137
- 119,
138
- 120,
139
- 121,
140
- 122,
141
- 123,
142
- 124,
143
- 125,
144
- 126,
145
- 127,
146
- 128,
147
- 129,
148
- 130,
149
- 131,
150
- 132,
151
- 133,
152
- 134,
153
- 135,
154
- 136,
155
- 137,
156
- 138,
157
- 139,
158
- 140,
159
- 141,
160
- 142,
161
- 143,
162
- 144,
163
- 145,
164
- 146,
165
- 147,
166
- 148,
167
- 149,
168
- 150,
169
- 151,
170
- 152,
171
- 153,
172
- 154,
173
- 155,
174
- 156,
175
- 157,
176
- 158,
177
- 159,
178
- 160,
179
- 161,
180
- 162,
181
- 163,
182
- 164,
183
- 165,
184
- 166,
185
- 167,
186
- 168,
187
- 169,
188
- 170,
189
- 171,
190
- 172,
191
- 173,
192
- 174,
193
- 175,
194
- 176,
195
- 177,
196
- 178,
197
- 179,
198
- 180,
199
- 181,
200
- 182,
201
- 183,
202
- 184,
203
- 185,
204
- 186,
205
- 187,
206
- 188,
207
- 189,
208
- 190,
209
- 191,
210
- 192,
211
- 193,
212
- 194,
213
- 195,
214
- 196,
215
- 197,
216
- 198,
217
- 199,
218
- 200,
219
- 201,
220
- 202,
221
- 203,
222
- 204,
223
- 205,
224
- 206,
225
- 207,
226
- 208,
227
- 209,
228
- 210,
229
- 211,
230
- 212,
231
- 213,
232
- 214,
233
- 215,
234
- 216,
235
- 217,
236
- 218,
237
- 219,
238
- 220,
239
- 221,
240
- 222,
241
- 223,
242
- 224,
243
- 225,
244
- 226,
245
- 227,
246
- 228,
247
- 229,
248
- 230,
249
- 231,
250
- 232,
251
- 233,
252
- 234,
253
- 235,
254
- 236,
255
- 237,
256
- 238,
257
- 239,
258
- 240,
259
- 241,
260
- 242,
261
- 243,
262
- 244,
263
- 245,
264
- 246,
265
- 247,
266
- 248,
267
- 249,
268
- 250,
269
- 251,
270
- 252,
271
- 253,
272
- 254,
273
- 255,
274
- 256,
275
- 257,
276
- 258,
277
- 259,
278
- 260,
279
- 261,
280
- 262,
281
- 263,
282
- 264,
283
- 265,
284
- 266,
285
- 267,
286
- 268,
287
- 269,
288
- 270,
289
- 271,
290
- 272,
291
- 273,
292
- 274,
293
- 275,
294
- 276,
295
- 277,
296
- 278,
297
- 279,
298
- 280,
299
- 281,
300
- 282,
301
- 283,
302
- 284,
303
- 285,
304
- 286,
305
- 287,
306
- 288,
307
- 289,
308
- 290,
309
- 291,
310
- 292,
311
- 293,
312
- 294,
313
- 295,
314
- 296,
315
- 297,
316
- 298,
317
- 299,
318
- 300,
319
- 301,
320
- 302,
321
- 303,
322
- 304,
323
- 305,
324
- 306,
325
- 307,
326
- 308,
327
- 309,
328
- 310,
329
- 311,
330
- 312,
331
- 313,
332
- 314,
333
- 315,
334
- 316,
335
- 317,
336
- 318,
337
- 319,
338
- 320,
339
- 321,
340
- 322,
341
- 323,
342
- 324,
343
- 325,
344
- 326,
345
- 327,
346
- 328,
347
- 329,
348
- 330,
349
- 331,
350
- 332,
351
- 333,
352
- 334,
353
- 335,
354
- 336,
355
- 337,
356
- 338,
357
- 339,
358
- 340,
359
- 341,
360
- 342,
361
- 343,
362
- 344,
363
- 345,
364
- 346,
365
- 347,
366
- 348,
367
- 349,
368
- 350,
369
- 351,
370
- 352,
371
- 353,
372
- 354,
373
- 355,
374
- 356,
375
- 357,
376
- 358,
377
- 359,
378
- 360,
379
- 361,
380
- 362,
381
- 363,
382
- 364,
383
- 365,
384
- 366,
385
- 367,
386
- 368,
387
- 369,
388
- 370,
389
- 371,
390
- 372,
391
- 373,
392
- 374,
393
- 375,
394
- 376,
395
- 377,
396
- 378,
397
- 379,
398
- 380,
399
- 381,
400
- 382,
401
- 383,
402
- 384,
403
- 385,
404
- 386,
405
- 387,
406
- 388,
407
- 389,
408
- 390,
409
- 391,
410
- 392,
411
- 393,
412
- 394,
413
- 395,
414
- 396,
415
- 397,
416
- 398,
417
- 399,
418
- 400,
419
- 401,
420
- 402,
421
- 403,
422
- 404,
423
- 405,
424
- 406,
425
- 407,
426
- 408,
427
- 409,
428
- 410,
429
- 411,
430
- 412,
431
- 413,
432
- 414,
433
- 415,
434
- 416,
435
- 417,
436
- 418,
437
- 419,
438
- 420,
439
- 421,
440
- 422,
441
- 423,
442
- 424,
443
- 425,
444
- 426,
445
- 427,
446
- 428,
447
- 429,
448
- 430,
449
- 431,
450
- 432,
451
- 433,
452
- 434,
453
- 435,
454
- 436,
455
- 437,
456
- 438,
457
- 439,
458
- 440,
459
- 441,
460
- 442,
461
- 443,
462
- 444,
463
- 445,
464
- 446,
465
- 447,
466
- 448,
467
- 449,
468
- 450,
469
- 451,
470
- 452,
471
- 453,
472
- 454,
473
- 455,
474
- 456,
475
- 457,
476
- 458,
477
- 459,
478
- 460,
479
- 461,
480
- 462,
481
- 463,
482
- 464,
483
- 465,
484
- 466,
485
- 467,
486
- 468,
487
- 469,
488
- 470,
489
- 471,
490
- 472,
491
- 473,
492
- 474,
493
- 475,
494
- 476,
495
- 477,
496
- 478,
497
- 479,
498
- 480,
499
- 481,
500
- 482,
501
- 483,
502
- 484,
503
- 485,
504
- 486,
505
- 487,
506
- 488,
507
- 489,
508
- 490,
509
- 491,
510
- 492,
511
- 493,
512
- 494,
513
- 495,
514
- 496,
515
- 497,
516
- 498,
517
- 499,
518
- 500,
519
- 501,
520
- 502,
521
- 503,
522
- 504,
523
- 505,
524
- 506,
525
- 507,
526
- 508,
527
- 509,
528
- 510,
529
- 511,
530
- 512,
531
- 513,
532
- 514,
533
- 515,
534
- 516,
535
- 517,
536
- 518,
537
- 519,
538
- 520,
539
- 521,
540
- 522,
541
- 523,
542
- 524,
543
- 525,
544
- 526,
545
- 527,
546
- 528,
547
- 529,
548
- 530,
549
- 531,
550
- 532,
551
- 533,
552
- 534,
553
- 535,
554
- 536,
555
- 537,
556
- 538,
557
- 539,
558
- 540,
559
- 541,
560
- 542,
561
- 543,
562
- 544,
563
- 545,
564
- 546,
565
- 547,
566
- 548,
567
- 549,
568
- 550,
569
- 551,
570
- 552,
571
- 553,
572
- 554,
573
- 555,
574
- 556,
575
- 557,
576
- 558,
577
- 559,
578
- 560,
579
- 561,
580
- 562,
581
- 563,
582
- 564,
583
- 565,
584
- 566,
585
- 567,
586
- 568,
587
- 569,
588
- 570,
589
- 571,
590
- 572,
591
- 573,
592
- 574,
593
- 575,
594
- 576,
595
- 577,
596
- 578,
597
- 579,
598
- 580,
599
- 581,
600
- 582,
601
- 583,
602
- 584,
603
- 585,
604
- 586,
605
- 587,
606
- 588,
607
- 589,
608
- 590,
609
- 591,
610
- 592,
611
- 593,
612
- 594,
613
- 595,
614
- 596,
615
- 597,
616
- 598,
617
- 599,
618
- 600,
619
- 601,
620
- 602,
621
- 603,
622
- 604,
623
- 605,
624
- 606,
625
- 607,
626
- 608,
627
- 609,
628
- 610,
629
- 611,
630
- 612,
631
- 613,
632
- 614,
633
- 615,
634
- 616,
635
- 617,
636
- 618,
637
- 619,
638
- 620,
639
- 621,
640
- 622,
641
- 623,
642
- 624,
643
- 625,
644
- 626,
645
- 627,
646
- 628,
647
- 629,
648
- 630,
649
- 631,
650
- 632,
651
- 633,
652
- 634,
653
- 635,
654
- 636,
655
- 637,
656
- 638,
657
- 639,
658
- 640,
659
- 641,
660
- 642,
661
- 643,
662
- 644,
663
- 645,
664
- 646,
665
- 647,
666
- 648,
667
- 649,
668
- 650,
669
- 651,
670
- 652,
671
- 653,
672
- 654,
673
- 655,
674
- 656,
675
- 657,
676
- 658,
677
- 659,
678
- 660,
679
- 661,
680
- 662,
681
- 663,
682
- 664,
683
- 665,
684
- 666,
685
- 667,
686
- 668,
687
- 669,
688
- 670,
689
- 671,
690
- 672,
691
- 673,
692
- 674,
693
- 675,
694
- 676,
695
- 677,
696
- 678,
697
- 679,
698
- 680,
699
- 681,
700
- 682,
701
- 683,
702
- 684,
703
- 685,
704
- 686,
705
- 687,
706
- 688,
707
- 689,
708
- 690,
709
- 691,
710
- 692,
711
- 693,
712
- 694,
713
- 695,
714
- 696,
715
- 697,
716
- 698,
717
- 699,
718
- 700,
719
- 701,
720
- 702,
721
- 703,
722
- 704,
723
- 705,
724
- 706,
725
- 707,
726
- 708,
727
- 709,
728
- 710,
729
- 711,
730
- 712,
731
- 713,
732
- 714,
733
- 715,
734
- 716,
735
- 717,
736
- 718,
737
- 719,
738
- 720,
739
- 721,
740
- 722,
741
- 723,
742
- 724,
743
- 725,
744
- 726,
745
- 727,
746
- 728,
747
- 729,
748
- 730,
749
- 731,
750
- 732,
751
- 733,
752
- 734,
753
- 735,
754
- 736,
755
- 737,
756
- 738,
757
- 739,
758
- 740,
759
- 741,
760
- 742,
761
- 743,
762
- 744,
763
- 745,
764
- 746,
765
- 747,
766
- 748,
767
- 749,
768
- 750,
769
- 751,
770
- 752,
771
- 753,
772
- 754,
773
- 755,
774
- 756,
775
- 757,
776
- 758,
777
- 759,
778
- 760,
779
- 761,
780
- 762,
781
- 763,
782
- 764,
783
- 765,
784
- 766,
785
- 767,
786
- 768,
787
- 769,
788
- 770,
789
- 771,
790
- 772,
791
- 773,
792
- 774,
793
- 775,
794
- 776,
795
- 777,
796
- 778,
797
- 779,
798
- 780,
799
- 781,
800
- 782,
801
- 783,
802
- 784,
803
- 785,
804
- 786,
805
- 787,
806
- 788,
807
- 789,
808
- 790,
809
- 791,
810
- 792,
811
- 793,
812
- 794,
813
- 795,
814
- 796,
815
- 797,
816
- 798,
817
- 799,
818
- 800,
819
- 801,
820
- 802,
821
- 803,
822
- 804,
823
- 805,
824
- 806,
825
- 807,
826
- 808,
827
- 809,
828
- 810,
829
- 811,
830
- 812
831
- ]
832
- }
833
- ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoints/step_000500/training_state/optimizer_state.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e81464e3c3e8ceee241bf8bccebf2ecbf85bedf677293f72de2f1c6d829ac60
3
- size 2195136504
 
 
 
 
checkpoints/step_000500/training_state/rng_state.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c0759d2282f69bd10bd591e2fd9a63632e2c572b1b6943bf5225a4e27f1ba9f
3
- size 15708
 
 
 
 
checkpoints/step_000500/training_state/scheduler_state.json DELETED
@@ -1,15 +0,0 @@
1
- {
2
- "base_lrs": [
3
- 2.5e-05
4
- ],
5
- "last_epoch": 500,
6
- "verbose": false,
7
- "_step_count": 501,
8
- "_get_lr_called_within_step": false,
9
- "_last_lr": [
10
- 1.2512487512487514e-05
11
- ],
12
- "lr_lambdas": [
13
- null
14
- ]
15
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoints/step_000500/training_state/training_step.json DELETED
@@ -1,3 +0,0 @@
1
- {
2
- "step": 500
3
- }