bot committed on
Commit
6d47053
·
1 Parent(s): 683125d

Add job_name fix

Browse files
checkpoints/step_000500/pretrained_model/config.json ADDED
@@ -0,0 +1,95 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "type": "pi05",
3
+ "n_obs_steps": 1,
4
+ "input_features": {
5
+ "observation.images.base_0_rgb": {
6
+ "type": "VISUAL",
7
+ "shape": [
8
+ 3,
9
+ 224,
10
+ 224
11
+ ]
12
+ },
13
+ "observation.images.left_wrist_0_rgb": {
14
+ "type": "VISUAL",
15
+ "shape": [
16
+ 3,
17
+ 224,
18
+ 224
19
+ ]
20
+ },
21
+ "observation.images.right_wrist_0_rgb": {
22
+ "type": "VISUAL",
23
+ "shape": [
24
+ 3,
25
+ 224,
26
+ 224
27
+ ]
28
+ },
29
+ "observation.state": {
30
+ "type": "STATE",
31
+ "shape": [
32
+ 32
33
+ ]
34
+ }
35
+ },
36
+ "output_features": {
37
+ "action": {
38
+ "type": "ACTION",
39
+ "shape": [
40
+ 6
41
+ ]
42
+ }
43
+ },
44
+ "device": "cuda",
45
+ "use_amp": false,
46
+ "use_peft": false,
47
+ "push_to_hub": true,
48
+ "repo_id": "StrongRoboticsLab/pi05-so100-diverse",
49
+ "private": null,
50
+ "tags": null,
51
+ "license": null,
52
+ "pretrained_path": "lerobot/pi05_base",
53
+ "paligemma_variant": "gemma_2b",
54
+ "action_expert_variant": "gemma_300m",
55
+ "dtype": "bfloat16",
56
+ "chunk_size": 50,
57
+ "n_action_steps": 50,
58
+ "max_state_dim": 32,
59
+ "max_action_dim": 32,
60
+ "num_inference_steps": 10,
61
+ "time_sampling_beta_alpha": 1.5,
62
+ "time_sampling_beta_beta": 1.0,
63
+ "time_sampling_scale": 0.999,
64
+ "time_sampling_offset": 0.001,
65
+ "min_period": 0.004,
66
+ "max_period": 4.0,
67
+ "rtc_config": null,
68
+ "image_resolution": [
69
+ 224,
70
+ 224
71
+ ],
72
+ "empty_cameras": 0,
73
+ "tokenizer_max_length": 200,
74
+ "normalization_mapping": {
75
+ "VISUAL": "IDENTITY",
76
+ "STATE": "MEAN_STD",
77
+ "ACTION": "MEAN_STD"
78
+ },
79
+ "gradient_checkpointing": false,
80
+ "compile_model": false,
81
+ "compile_mode": "max-autotune",
82
+ "freeze_vision_encoder": false,
83
+ "train_expert_only": true,
84
+ "optimizer_lr": 2.5e-05,
85
+ "optimizer_betas": [
86
+ 0.9,
87
+ 0.95
88
+ ],
89
+ "optimizer_eps": 1e-08,
90
+ "optimizer_weight_decay": 0.01,
91
+ "optimizer_grad_clip_norm": 1.0,
92
+ "scheduler_warmup_steps": 1000,
93
+ "scheduler_decay_steps": 340000,
94
+ "scheduler_decay_lr": 2.5e-06
95
+ }
checkpoints/step_000500/pretrained_model/policy_postprocessor.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "policy_postprocessor",
3
+ "steps": [
4
+ {
5
+ "registry_name": "unnormalizer_processor",
6
+ "config": {
7
+ "eps": 1e-08,
8
+ "features": {
9
+ "action": {
10
+ "type": "ACTION",
11
+ "shape": [
12
+ 6
13
+ ]
14
+ }
15
+ },
16
+ "norm_map": {
17
+ "VISUAL": "IDENTITY",
18
+ "STATE": "MEAN_STD",
19
+ "ACTION": "MEAN_STD"
20
+ }
21
+ },
22
+ "state_file": "policy_postprocessor_step_0_unnormalizer_processor.safetensors"
23
+ },
24
+ {
25
+ "registry_name": "device_processor",
26
+ "config": {
27
+ "device": "cpu",
28
+ "float_dtype": null
29
+ }
30
+ }
31
+ ]
32
+ }
checkpoints/step_000500/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a631ee0d784519e7052f654e71248331b32f26ba470b8d15f29553e15d8a0f
3
+ size 768
checkpoints/step_000500/pretrained_model/policy_preprocessor.json ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "policy_preprocessor",
3
+ "steps": [
4
+ {
5
+ "registry_name": "rename_observations_processor",
6
+ "config": {
7
+ "rename_map": {
8
+ "observation.images.image": "observation.images.base_0_rgb",
9
+ "observation.images.image2": "observation.images.left_wrist_0_rgb"
10
+ }
11
+ }
12
+ },
13
+ {
14
+ "registry_name": "to_batch_processor",
15
+ "config": {}
16
+ },
17
+ {
18
+ "registry_name": "normalizer_processor",
19
+ "config": {
20
+ "eps": 1e-08,
21
+ "features": {
22
+ "observation.images.base_0_rgb": {
23
+ "type": "VISUAL",
24
+ "shape": [
25
+ 3,
26
+ 224,
27
+ 224
28
+ ]
29
+ },
30
+ "observation.images.left_wrist_0_rgb": {
31
+ "type": "VISUAL",
32
+ "shape": [
33
+ 3,
34
+ 224,
35
+ 224
36
+ ]
37
+ },
38
+ "observation.images.right_wrist_0_rgb": {
39
+ "type": "VISUAL",
40
+ "shape": [
41
+ 3,
42
+ 224,
43
+ 224
44
+ ]
45
+ },
46
+ "observation.state": {
47
+ "type": "STATE",
48
+ "shape": [
49
+ 32
50
+ ]
51
+ },
52
+ "action": {
53
+ "type": "ACTION",
54
+ "shape": [
55
+ 6
56
+ ]
57
+ }
58
+ },
59
+ "norm_map": {
60
+ "VISUAL": "IDENTITY",
61
+ "STATE": "MEAN_STD",
62
+ "ACTION": "MEAN_STD"
63
+ }
64
+ },
65
+ "state_file": "policy_preprocessor_step_2_normalizer_processor.safetensors"
66
+ },
67
+ {
68
+ "registry_name": "pi05_prepare_state_tokenizer_processor_step",
69
+ "config": {}
70
+ },
71
+ {
72
+ "registry_name": "tokenizer_processor",
73
+ "config": {
74
+ "max_length": 200,
75
+ "task_key": "task",
76
+ "padding_side": "right",
77
+ "padding": "max_length",
78
+ "truncation": true,
79
+ "tokenizer_name": "google/paligemma-3b-pt-224"
80
+ }
81
+ },
82
+ {
83
+ "registry_name": "device_processor",
84
+ "config": {
85
+ "device": "cuda",
86
+ "float_dtype": null
87
+ }
88
+ }
89
+ ]
90
+ }
checkpoints/step_000500/pretrained_model/policy_preprocessor_step_2_normalizer_processor.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a631ee0d784519e7052f654e71248331b32f26ba470b8d15f29553e15d8a0f
3
+ size 768
checkpoints/step_000500/pretrained_model/train_config.json ADDED
@@ -0,0 +1,236 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": {
3
+ "repo_id": "so100:/ephemeral/community_dataset_v3:/workspace/pi05-so100-diverse/filtered_index.json:/workspace/pi05-so100-diverse/norm_stats.json",
4
+ "root": null,
5
+ "episodes": null,
6
+ "image_transforms": {
7
+ "enable": false,
8
+ "max_num_transforms": 3,
9
+ "random_order": false,
10
+ "tfs": {
11
+ "brightness": {
12
+ "weight": 1.0,
13
+ "type": "ColorJitter",
14
+ "kwargs": {
15
+ "brightness": [
16
+ 0.8,
17
+ 1.2
18
+ ]
19
+ }
20
+ },
21
+ "contrast": {
22
+ "weight": 1.0,
23
+ "type": "ColorJitter",
24
+ "kwargs": {
25
+ "contrast": [
26
+ 0.8,
27
+ 1.2
28
+ ]
29
+ }
30
+ },
31
+ "saturation": {
32
+ "weight": 1.0,
33
+ "type": "ColorJitter",
34
+ "kwargs": {
35
+ "saturation": [
36
+ 0.5,
37
+ 1.5
38
+ ]
39
+ }
40
+ },
41
+ "hue": {
42
+ "weight": 1.0,
43
+ "type": "ColorJitter",
44
+ "kwargs": {
45
+ "hue": [
46
+ -0.05,
47
+ 0.05
48
+ ]
49
+ }
50
+ },
51
+ "sharpness": {
52
+ "weight": 1.0,
53
+ "type": "SharpnessJitter",
54
+ "kwargs": {
55
+ "sharpness": [
56
+ 0.5,
57
+ 1.5
58
+ ]
59
+ }
60
+ },
61
+ "affine": {
62
+ "weight": 1.0,
63
+ "type": "RandomAffine",
64
+ "kwargs": {
65
+ "degrees": [
66
+ -5.0,
67
+ 5.0
68
+ ],
69
+ "translate": [
70
+ 0.05,
71
+ 0.05
72
+ ]
73
+ }
74
+ }
75
+ }
76
+ },
77
+ "revision": null,
78
+ "use_imagenet_stats": true,
79
+ "video_backend": "torchcodec",
80
+ "streaming": false
81
+ },
82
+ "env": null,
83
+ "policy": {
84
+ "type": "pi05",
85
+ "n_obs_steps": 1,
86
+ "input_features": {
87
+ "observation.images.base_0_rgb": {
88
+ "type": "VISUAL",
89
+ "shape": [
90
+ 3,
91
+ 224,
92
+ 224
93
+ ]
94
+ },
95
+ "observation.images.left_wrist_0_rgb": {
96
+ "type": "VISUAL",
97
+ "shape": [
98
+ 3,
99
+ 224,
100
+ 224
101
+ ]
102
+ },
103
+ "observation.images.right_wrist_0_rgb": {
104
+ "type": "VISUAL",
105
+ "shape": [
106
+ 3,
107
+ 224,
108
+ 224
109
+ ]
110
+ },
111
+ "observation.state": {
112
+ "type": "STATE",
113
+ "shape": [
114
+ 32
115
+ ]
116
+ }
117
+ },
118
+ "output_features": {
119
+ "action": {
120
+ "type": "ACTION",
121
+ "shape": [
122
+ 6
123
+ ]
124
+ }
125
+ },
126
+ "device": "cuda",
127
+ "use_amp": false,
128
+ "use_peft": false,
129
+ "push_to_hub": true,
130
+ "repo_id": "StrongRoboticsLab/pi05-so100-diverse",
131
+ "private": null,
132
+ "tags": null,
133
+ "license": null,
134
+ "pretrained_path": "lerobot/pi05_base",
135
+ "paligemma_variant": "gemma_2b",
136
+ "action_expert_variant": "gemma_300m",
137
+ "dtype": "bfloat16",
138
+ "chunk_size": 50,
139
+ "n_action_steps": 50,
140
+ "max_state_dim": 32,
141
+ "max_action_dim": 32,
142
+ "num_inference_steps": 10,
143
+ "time_sampling_beta_alpha": 1.5,
144
+ "time_sampling_beta_beta": 1.0,
145
+ "time_sampling_scale": 0.999,
146
+ "time_sampling_offset": 0.001,
147
+ "min_period": 0.004,
148
+ "max_period": 4.0,
149
+ "rtc_config": null,
150
+ "image_resolution": [
151
+ 224,
152
+ 224
153
+ ],
154
+ "empty_cameras": 0,
155
+ "tokenizer_max_length": 200,
156
+ "normalization_mapping": {
157
+ "VISUAL": "IDENTITY",
158
+ "STATE": "MEAN_STD",
159
+ "ACTION": "MEAN_STD"
160
+ },
161
+ "gradient_checkpointing": false,
162
+ "compile_model": false,
163
+ "compile_mode": "max-autotune",
164
+ "freeze_vision_encoder": false,
165
+ "train_expert_only": true,
166
+ "optimizer_lr": 2.5e-05,
167
+ "optimizer_betas": [
168
+ 0.9,
169
+ 0.95
170
+ ],
171
+ "optimizer_eps": 1e-08,
172
+ "optimizer_weight_decay": 0.01,
173
+ "optimizer_grad_clip_norm": 1.0,
174
+ "scheduler_warmup_steps": 1000,
175
+ "scheduler_decay_steps": 340000,
176
+ "scheduler_decay_lr": 2.5e-06
177
+ },
178
+ "output_dir": "/ephemeral/production_run",
179
+ "job_name": "pi05",
180
+ "resume": false,
181
+ "seed": 1000,
182
+ "cudnn_deterministic": false,
183
+ "num_workers": 4,
184
+ "batch_size": 16,
185
+ "steps": 340000,
186
+ "eval_freq": 20000,
187
+ "log_freq": 50,
188
+ "tolerance_s": 0.0001,
189
+ "save_checkpoint": true,
190
+ "save_freq": 500,
191
+ "use_policy_training_preset": true,
192
+ "optimizer": {
193
+ "type": "adamw",
194
+ "lr": 2.5e-05,
195
+ "weight_decay": 0.01,
196
+ "grad_clip_norm": 1.0,
197
+ "betas": [
198
+ 0.9,
199
+ 0.95
200
+ ],
201
+ "eps": 1e-08
202
+ },
203
+ "scheduler": {
204
+ "type": "cosine_decay_with_warmup",
205
+ "num_warmup_steps": 1000,
206
+ "num_decay_steps": 340000,
207
+ "peak_lr": 2.5e-05,
208
+ "decay_lr": 2.5e-06
209
+ },
210
+ "eval": {
211
+ "n_episodes": 50,
212
+ "batch_size": 50,
213
+ "use_async_envs": false
214
+ },
215
+ "wandb": {
216
+ "enable": true,
217
+ "disable_artifact": false,
218
+ "project": "pi05-so100-diverse",
219
+ "entity": null,
220
+ "notes": null,
221
+ "run_id": "7zuftzeh",
222
+ "mode": null,
223
+ "add_tags": true
224
+ },
225
+ "peft": null,
226
+ "use_rabc": false,
227
+ "rabc_progress_path": null,
228
+ "rabc_kappa": 0.01,
229
+ "rabc_epsilon": 1e-06,
230
+ "rabc_head_mode": "sparse",
231
+ "rename_map": {
232
+ "observation.images.image": "observation.images.base_0_rgb",
233
+ "observation.images.image2": "observation.images.left_wrist_0_rgb"
234
+ },
235
+ "checkpoint_path": null
236
+ }
checkpoints/step_000500/training_state/optimizer_param_groups.json ADDED
@@ -0,0 +1,833 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "lr": 1.2512487512487514e-05,
4
+ "betas": [
5
+ 0.9,
6
+ 0.95
7
+ ],
8
+ "eps": 1e-08,
9
+ "weight_decay": 0.01,
10
+ "amsgrad": false,
11
+ "foreach": null,
12
+ "maximize": false,
13
+ "capturable": false,
14
+ "differentiable": false,
15
+ "fused": null,
16
+ "initial_lr": 2.5e-05,
17
+ "params": [
18
+ 0,
19
+ 1,
20
+ 2,
21
+ 3,
22
+ 4,
23
+ 5,
24
+ 6,
25
+ 7,
26
+ 8,
27
+ 9,
28
+ 10,
29
+ 11,
30
+ 12,
31
+ 13,
32
+ 14,
33
+ 15,
34
+ 16,
35
+ 17,
36
+ 18,
37
+ 19,
38
+ 20,
39
+ 21,
40
+ 22,
41
+ 23,
42
+ 24,
43
+ 25,
44
+ 26,
45
+ 27,
46
+ 28,
47
+ 29,
48
+ 30,
49
+ 31,
50
+ 32,
51
+ 33,
52
+ 34,
53
+ 35,
54
+ 36,
55
+ 37,
56
+ 38,
57
+ 39,
58
+ 40,
59
+ 41,
60
+ 42,
61
+ 43,
62
+ 44,
63
+ 45,
64
+ 46,
65
+ 47,
66
+ 48,
67
+ 49,
68
+ 50,
69
+ 51,
70
+ 52,
71
+ 53,
72
+ 54,
73
+ 55,
74
+ 56,
75
+ 57,
76
+ 58,
77
+ 59,
78
+ 60,
79
+ 61,
80
+ 62,
81
+ 63,
82
+ 64,
83
+ 65,
84
+ 66,
85
+ 67,
86
+ 68,
87
+ 69,
88
+ 70,
89
+ 71,
90
+ 72,
91
+ 73,
92
+ 74,
93
+ 75,
94
+ 76,
95
+ 77,
96
+ 78,
97
+ 79,
98
+ 80,
99
+ 81,
100
+ 82,
101
+ 83,
102
+ 84,
103
+ 85,
104
+ 86,
105
+ 87,
106
+ 88,
107
+ 89,
108
+ 90,
109
+ 91,
110
+ 92,
111
+ 93,
112
+ 94,
113
+ 95,
114
+ 96,
115
+ 97,
116
+ 98,
117
+ 99,
118
+ 100,
119
+ 101,
120
+ 102,
121
+ 103,
122
+ 104,
123
+ 105,
124
+ 106,
125
+ 107,
126
+ 108,
127
+ 109,
128
+ 110,
129
+ 111,
130
+ 112,
131
+ 113,
132
+ 114,
133
+ 115,
134
+ 116,
135
+ 117,
136
+ 118,
137
+ 119,
138
+ 120,
139
+ 121,
140
+ 122,
141
+ 123,
142
+ 124,
143
+ 125,
144
+ 126,
145
+ 127,
146
+ 128,
147
+ 129,
148
+ 130,
149
+ 131,
150
+ 132,
151
+ 133,
152
+ 134,
153
+ 135,
154
+ 136,
155
+ 137,
156
+ 138,
157
+ 139,
158
+ 140,
159
+ 141,
160
+ 142,
161
+ 143,
162
+ 144,
163
+ 145,
164
+ 146,
165
+ 147,
166
+ 148,
167
+ 149,
168
+ 150,
169
+ 151,
170
+ 152,
171
+ 153,
172
+ 154,
173
+ 155,
174
+ 156,
175
+ 157,
176
+ 158,
177
+ 159,
178
+ 160,
179
+ 161,
180
+ 162,
181
+ 163,
182
+ 164,
183
+ 165,
184
+ 166,
185
+ 167,
186
+ 168,
187
+ 169,
188
+ 170,
189
+ 171,
190
+ 172,
191
+ 173,
192
+ 174,
193
+ 175,
194
+ 176,
195
+ 177,
196
+ 178,
197
+ 179,
198
+ 180,
199
+ 181,
200
+ 182,
201
+ 183,
202
+ 184,
203
+ 185,
204
+ 186,
205
+ 187,
206
+ 188,
207
+ 189,
208
+ 190,
209
+ 191,
210
+ 192,
211
+ 193,
212
+ 194,
213
+ 195,
214
+ 196,
215
+ 197,
216
+ 198,
217
+ 199,
218
+ 200,
219
+ 201,
220
+ 202,
221
+ 203,
222
+ 204,
223
+ 205,
224
+ 206,
225
+ 207,
226
+ 208,
227
+ 209,
228
+ 210,
229
+ 211,
230
+ 212,
231
+ 213,
232
+ 214,
233
+ 215,
234
+ 216,
235
+ 217,
236
+ 218,
237
+ 219,
238
+ 220,
239
+ 221,
240
+ 222,
241
+ 223,
242
+ 224,
243
+ 225,
244
+ 226,
245
+ 227,
246
+ 228,
247
+ 229,
248
+ 230,
249
+ 231,
250
+ 232,
251
+ 233,
252
+ 234,
253
+ 235,
254
+ 236,
255
+ 237,
256
+ 238,
257
+ 239,
258
+ 240,
259
+ 241,
260
+ 242,
261
+ 243,
262
+ 244,
263
+ 245,
264
+ 246,
265
+ 247,
266
+ 248,
267
+ 249,
268
+ 250,
269
+ 251,
270
+ 252,
271
+ 253,
272
+ 254,
273
+ 255,
274
+ 256,
275
+ 257,
276
+ 258,
277
+ 259,
278
+ 260,
279
+ 261,
280
+ 262,
281
+ 263,
282
+ 264,
283
+ 265,
284
+ 266,
285
+ 267,
286
+ 268,
287
+ 269,
288
+ 270,
289
+ 271,
290
+ 272,
291
+ 273,
292
+ 274,
293
+ 275,
294
+ 276,
295
+ 277,
296
+ 278,
297
+ 279,
298
+ 280,
299
+ 281,
300
+ 282,
301
+ 283,
302
+ 284,
303
+ 285,
304
+ 286,
305
+ 287,
306
+ 288,
307
+ 289,
308
+ 290,
309
+ 291,
310
+ 292,
311
+ 293,
312
+ 294,
313
+ 295,
314
+ 296,
315
+ 297,
316
+ 298,
317
+ 299,
318
+ 300,
319
+ 301,
320
+ 302,
321
+ 303,
322
+ 304,
323
+ 305,
324
+ 306,
325
+ 307,
326
+ 308,
327
+ 309,
328
+ 310,
329
+ 311,
330
+ 312,
331
+ 313,
332
+ 314,
333
+ 315,
334
+ 316,
335
+ 317,
336
+ 318,
337
+ 319,
338
+ 320,
339
+ 321,
340
+ 322,
341
+ 323,
342
+ 324,
343
+ 325,
344
+ 326,
345
+ 327,
346
+ 328,
347
+ 329,
348
+ 330,
349
+ 331,
350
+ 332,
351
+ 333,
352
+ 334,
353
+ 335,
354
+ 336,
355
+ 337,
356
+ 338,
357
+ 339,
358
+ 340,
359
+ 341,
360
+ 342,
361
+ 343,
362
+ 344,
363
+ 345,
364
+ 346,
365
+ 347,
366
+ 348,
367
+ 349,
368
+ 350,
369
+ 351,
370
+ 352,
371
+ 353,
372
+ 354,
373
+ 355,
374
+ 356,
375
+ 357,
376
+ 358,
377
+ 359,
378
+ 360,
379
+ 361,
380
+ 362,
381
+ 363,
382
+ 364,
383
+ 365,
384
+ 366,
385
+ 367,
386
+ 368,
387
+ 369,
388
+ 370,
389
+ 371,
390
+ 372,
391
+ 373,
392
+ 374,
393
+ 375,
394
+ 376,
395
+ 377,
396
+ 378,
397
+ 379,
398
+ 380,
399
+ 381,
400
+ 382,
401
+ 383,
402
+ 384,
403
+ 385,
404
+ 386,
405
+ 387,
406
+ 388,
407
+ 389,
408
+ 390,
409
+ 391,
410
+ 392,
411
+ 393,
412
+ 394,
413
+ 395,
414
+ 396,
415
+ 397,
416
+ 398,
417
+ 399,
418
+ 400,
419
+ 401,
420
+ 402,
421
+ 403,
422
+ 404,
423
+ 405,
424
+ 406,
425
+ 407,
426
+ 408,
427
+ 409,
428
+ 410,
429
+ 411,
430
+ 412,
431
+ 413,
432
+ 414,
433
+ 415,
434
+ 416,
435
+ 417,
436
+ 418,
437
+ 419,
438
+ 420,
439
+ 421,
440
+ 422,
441
+ 423,
442
+ 424,
443
+ 425,
444
+ 426,
445
+ 427,
446
+ 428,
447
+ 429,
448
+ 430,
449
+ 431,
450
+ 432,
451
+ 433,
452
+ 434,
453
+ 435,
454
+ 436,
455
+ 437,
456
+ 438,
457
+ 439,
458
+ 440,
459
+ 441,
460
+ 442,
461
+ 443,
462
+ 444,
463
+ 445,
464
+ 446,
465
+ 447,
466
+ 448,
467
+ 449,
468
+ 450,
469
+ 451,
470
+ 452,
471
+ 453,
472
+ 454,
473
+ 455,
474
+ 456,
475
+ 457,
476
+ 458,
477
+ 459,
478
+ 460,
479
+ 461,
480
+ 462,
481
+ 463,
482
+ 464,
483
+ 465,
484
+ 466,
485
+ 467,
486
+ 468,
487
+ 469,
488
+ 470,
489
+ 471,
490
+ 472,
491
+ 473,
492
+ 474,
493
+ 475,
494
+ 476,
495
+ 477,
496
+ 478,
497
+ 479,
498
+ 480,
499
+ 481,
500
+ 482,
501
+ 483,
502
+ 484,
503
+ 485,
504
+ 486,
505
+ 487,
506
+ 488,
507
+ 489,
508
+ 490,
509
+ 491,
510
+ 492,
511
+ 493,
512
+ 494,
513
+ 495,
514
+ 496,
515
+ 497,
516
+ 498,
517
+ 499,
518
+ 500,
519
+ 501,
520
+ 502,
521
+ 503,
522
+ 504,
523
+ 505,
524
+ 506,
525
+ 507,
526
+ 508,
527
+ 509,
528
+ 510,
529
+ 511,
530
+ 512,
531
+ 513,
532
+ 514,
533
+ 515,
534
+ 516,
535
+ 517,
536
+ 518,
537
+ 519,
538
+ 520,
539
+ 521,
540
+ 522,
541
+ 523,
542
+ 524,
543
+ 525,
544
+ 526,
545
+ 527,
546
+ 528,
547
+ 529,
548
+ 530,
549
+ 531,
550
+ 532,
551
+ 533,
552
+ 534,
553
+ 535,
554
+ 536,
555
+ 537,
556
+ 538,
557
+ 539,
558
+ 540,
559
+ 541,
560
+ 542,
561
+ 543,
562
+ 544,
563
+ 545,
564
+ 546,
565
+ 547,
566
+ 548,
567
+ 549,
568
+ 550,
569
+ 551,
570
+ 552,
571
+ 553,
572
+ 554,
573
+ 555,
574
+ 556,
575
+ 557,
576
+ 558,
577
+ 559,
578
+ 560,
579
+ 561,
580
+ 562,
581
+ 563,
582
+ 564,
583
+ 565,
584
+ 566,
585
+ 567,
586
+ 568,
587
+ 569,
588
+ 570,
589
+ 571,
590
+ 572,
591
+ 573,
592
+ 574,
593
+ 575,
594
+ 576,
595
+ 577,
596
+ 578,
597
+ 579,
598
+ 580,
599
+ 581,
600
+ 582,
601
+ 583,
602
+ 584,
603
+ 585,
604
+ 586,
605
+ 587,
606
+ 588,
607
+ 589,
608
+ 590,
609
+ 591,
610
+ 592,
611
+ 593,
612
+ 594,
613
+ 595,
614
+ 596,
615
+ 597,
616
+ 598,
617
+ 599,
618
+ 600,
619
+ 601,
620
+ 602,
621
+ 603,
622
+ 604,
623
+ 605,
624
+ 606,
625
+ 607,
626
+ 608,
627
+ 609,
628
+ 610,
629
+ 611,
630
+ 612,
631
+ 613,
632
+ 614,
633
+ 615,
634
+ 616,
635
+ 617,
636
+ 618,
637
+ 619,
638
+ 620,
639
+ 621,
640
+ 622,
641
+ 623,
642
+ 624,
643
+ 625,
644
+ 626,
645
+ 627,
646
+ 628,
647
+ 629,
648
+ 630,
649
+ 631,
650
+ 632,
651
+ 633,
652
+ 634,
653
+ 635,
654
+ 636,
655
+ 637,
656
+ 638,
657
+ 639,
658
+ 640,
659
+ 641,
660
+ 642,
661
+ 643,
662
+ 644,
663
+ 645,
664
+ 646,
665
+ 647,
666
+ 648,
667
+ 649,
668
+ 650,
669
+ 651,
670
+ 652,
671
+ 653,
672
+ 654,
673
+ 655,
674
+ 656,
675
+ 657,
676
+ 658,
677
+ 659,
678
+ 660,
679
+ 661,
680
+ 662,
681
+ 663,
682
+ 664,
683
+ 665,
684
+ 666,
685
+ 667,
686
+ 668,
687
+ 669,
688
+ 670,
689
+ 671,
690
+ 672,
691
+ 673,
692
+ 674,
693
+ 675,
694
+ 676,
695
+ 677,
696
+ 678,
697
+ 679,
698
+ 680,
699
+ 681,
700
+ 682,
701
+ 683,
702
+ 684,
703
+ 685,
704
+ 686,
705
+ 687,
706
+ 688,
707
+ 689,
708
+ 690,
709
+ 691,
710
+ 692,
711
+ 693,
712
+ 694,
713
+ 695,
714
+ 696,
715
+ 697,
716
+ 698,
717
+ 699,
718
+ 700,
719
+ 701,
720
+ 702,
721
+ 703,
722
+ 704,
723
+ 705,
724
+ 706,
725
+ 707,
726
+ 708,
727
+ 709,
728
+ 710,
729
+ 711,
730
+ 712,
731
+ 713,
732
+ 714,
733
+ 715,
734
+ 716,
735
+ 717,
736
+ 718,
737
+ 719,
738
+ 720,
739
+ 721,
740
+ 722,
741
+ 723,
742
+ 724,
743
+ 725,
744
+ 726,
745
+ 727,
746
+ 728,
747
+ 729,
748
+ 730,
749
+ 731,
750
+ 732,
751
+ 733,
752
+ 734,
753
+ 735,
754
+ 736,
755
+ 737,
756
+ 738,
757
+ 739,
758
+ 740,
759
+ 741,
760
+ 742,
761
+ 743,
762
+ 744,
763
+ 745,
764
+ 746,
765
+ 747,
766
+ 748,
767
+ 749,
768
+ 750,
769
+ 751,
770
+ 752,
771
+ 753,
772
+ 754,
773
+ 755,
774
+ 756,
775
+ 757,
776
+ 758,
777
+ 759,
778
+ 760,
779
+ 761,
780
+ 762,
781
+ 763,
782
+ 764,
783
+ 765,
784
+ 766,
785
+ 767,
786
+ 768,
787
+ 769,
788
+ 770,
789
+ 771,
790
+ 772,
791
+ 773,
792
+ 774,
793
+ 775,
794
+ 776,
795
+ 777,
796
+ 778,
797
+ 779,
798
+ 780,
799
+ 781,
800
+ 782,
801
+ 783,
802
+ 784,
803
+ 785,
804
+ 786,
805
+ 787,
806
+ 788,
807
+ 789,
808
+ 790,
809
+ 791,
810
+ 792,
811
+ 793,
812
+ 794,
813
+ 795,
814
+ 796,
815
+ 797,
816
+ 798,
817
+ 799,
818
+ 800,
819
+ 801,
820
+ 802,
821
+ 803,
822
+ 804,
823
+ 805,
824
+ 806,
825
+ 807,
826
+ 808,
827
+ 809,
828
+ 810,
829
+ 811,
830
+ 812
831
+ ]
832
+ }
833
+ ]
checkpoints/step_000500/training_state/rng_state.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c0759d2282f69bd10bd591e2fd9a63632e2c572b1b6943bf5225a4e27f1ba9f
3
+ size 15708
checkpoints/step_000500/training_state/scheduler_state.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "base_lrs": [
3
+ 2.5e-05
4
+ ],
5
+ "last_epoch": 500,
6
+ "verbose": false,
7
+ "_step_count": 501,
8
+ "_get_lr_called_within_step": false,
9
+ "_last_lr": [
10
+ 1.2512487512487514e-05
11
+ ],
12
+ "lr_lambdas": [
13
+ null
14
+ ]
15
+ }
checkpoints/step_000500/training_state/training_step.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "step": 500
3
+ }
logs/training_20260324_025549.log ADDED
@@ -0,0 +1,1136 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  ...timizer_state.safetensors: 0%| | 28.1kB / 2.20GB 
 
 
 
1
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
2
  ...timizer_state.safetensors: 0%| | 28.1kB / 2.20GB 
 
 
 
3
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
4
  ...timizer_state.safetensors: 1%| | 14.9MB / 2.20GB 
 
 
 
5
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
 
6
  ...timizer_state.safetensors: 3%|β–Ž | 64.0MB / 2.20GB 
 
 
 
7
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
 
8
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
 
 
 
9
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
 
10
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
 
 
 
11
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
12
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
 
 
 
13
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
14
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
 
 
 
15
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
16
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
 
 
 
17
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
18
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
 
 
 
19
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
20
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
 
 
 
21
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
22
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
 
 
 
23
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
24
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
 
 
 
25
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
 
 
26
  ...timizer_state.safetensors: 3%|β–Ž | 71.5MB / 2.20GB 
 
 
 
27
  ...d_model/model.safetensors: 0%| | 5.09MB / 9.35GB 
 
 
 
28
  ...timizer_state.safetensors: 5%|β–Œ | 119MB / 2.20GB 
 
 
 
29
  ...d_model/model.safetensors: 1%| | 47.8MB / 9.35GB 
 
 
 
30
  ...timizer_state.safetensors: 6%|β–Œ | 134MB / 2.20GB 
 
 
 
31
  ...d_model/model.safetensors: 1%| | 66.7MB / 9.35GB 
 
 
 
32
  ...timizer_state.safetensors: 6%|β–Œ | 134MB / 2.20GB 
 
 
 
33
  ...d_model/model.safetensors: 1%| | 66.7MB / 9.35GB 
 
 
34
  ...timizer_state.safetensors: 6%|β–Œ | 134MB / 2.20GB 
 
 
 
35
  ...d_model/model.safetensors: 1%| | 66.7MB / 9.35GB 
 
 
36
  ...timizer_state.safetensors: 6%|β–Œ | 134MB / 2.20GB 
 
 
 
37
  ...d_model/model.safetensors: 1%| | 67.1MB / 9.35GB 
 
 
 
38
  ...timizer_state.safetensors: 7%|β–‹ | 146MB / 2.20GB 
 
 
 
39
  ...d_model/model.safetensors: 1%| | 78.3MB / 9.35GB 
 
 
 
40
  ...timizer_state.safetensors: 9%|β–Š | 191MB / 2.20GB 
 
 
 
41
  ...d_model/model.safetensors: 1%|▏ | 125MB / 9.35GB 
 
 
 
42
  ...timizer_state.safetensors: 9%|β–‰ | 201MB / 2.20GB 
 
 
 
43
  ...d_model/model.safetensors: 2%|▏ | 169MB / 9.35GB 
 
 
 
44
  ...timizer_state.safetensors: 9%|β–‰ | 207MB / 2.20GB 
 
 
 
45
  ...d_model/model.safetensors: 2%|▏ | 201MB / 9.35GB 
 
 
 
46
  ...timizer_state.safetensors: 12%|β–ˆβ– | 256MB / 2.20GB 
 
 
 
47
  ...d_model/model.safetensors: 2%|▏ | 201MB / 9.35GB 
 
 
 
48
  ...timizer_state.safetensors: 12%|β–ˆβ– | 267MB / 2.20GB 
 
 
 
49
  ...d_model/model.safetensors: 2%|▏ | 201MB / 9.35GB 
 
 
 
50
  ...timizer_state.safetensors: 12%|β–ˆβ– | 272MB / 2.20GB 
 
 
 
51
  ...d_model/model.safetensors: 2%|▏ | 204MB / 9.35GB 
 
 
 
52
  ...timizer_state.safetensors: 14%|β–ˆβ– | 307MB / 2.20GB 
 
 
 
53
  ...d_model/model.safetensors: 2%|▏ | 214MB / 9.35GB 
 
 
 
54
  ...timizer_state.safetensors: 15%|β–ˆβ–Œ | 334MB / 2.20GB 
 
 
 
55
  ...d_model/model.safetensors: 3%|β–Ž | 264MB / 9.35GB 
 
 
 
56
  ...timizer_state.safetensors: 15%|β–ˆβ–Œ | 334MB / 2.20GB 
 
 
 
57
  ...d_model/model.safetensors: 3%|β–Ž | 295MB / 9.35GB 
 
 
 
58
  ...timizer_state.safetensors: 16%|β–ˆβ–Œ | 348MB / 2.20GB 
 
 
 
59
  ...d_model/model.safetensors: 3%|β–Ž | 306MB / 9.35GB 
 
 
 
60
  ...timizer_state.safetensors: 18%|β–ˆβ–Š | 397MB / 2.20GB 
 
 
 
61
  ...d_model/model.safetensors: 4%|β–Ž | 344MB / 9.35GB 
 
 
 
62
  ...timizer_state.safetensors: 18%|β–ˆβ–Š | 402MB / 2.20GB 
 
 
 
63
  ...d_model/model.safetensors: 4%|▍ | 392MB / 9.35GB 
 
 
 
64
  ...timizer_state.safetensors: 19%|β–ˆβ–‰ | 425MB / 2.20GB 
 
 
 
65
  ...d_model/model.safetensors: 4%|▍ | 402MB / 9.35GB 
 
 
 
66
  ...timizer_state.safetensors: 23%|β–ˆβ–ˆβ–Ž | 498MB / 2.20GB 
 
 
 
67
  ...d_model/model.safetensors: 4%|▍ | 402MB / 9.35GB 
 
 
 
68
  ...timizer_state.safetensors: 26%|β–ˆβ–ˆβ–Œ | 560MB / 2.20GB 
 
 
 
69
  ...d_model/model.safetensors: 5%|β–Œ | 495MB / 9.35GB 
 
 
 
70
  ...timizer_state.safetensors: 29%|β–ˆβ–ˆβ–‰ | 637MB / 2.20GB 
 
 
 
71
  ...d_model/model.safetensors: 8%|β–Š | 779MB / 9.35GB 
 
 
 
72
  ...timizer_state.safetensors: 32%|β–ˆβ–ˆβ–ˆβ– | 706MB / 2.20GB 
 
 
 
73
  ...d_model/model.safetensors: 11%|β–ˆ | 1.02GB / 9.35GB 
 
 
 
74
  ...timizer_state.safetensors: 36%|β–ˆβ–ˆβ–ˆβ–Œ | 793MB / 2.20GB 
 
 
 
75
  ...d_model/model.safetensors: 13%|β–ˆβ–Ž | 1.24GB / 9.35GB 
 
 
 
76
  ...timizer_state.safetensors: 38%|β–ˆβ–ˆβ–ˆβ–Š | 824MB / 2.20GB 
 
 
 
77
  ...d_model/model.safetensors: 15%|β–ˆβ–Œ | 1.43GB / 9.35GB 
 
 
 
78
  ...timizer_state.safetensors: 40%|β–ˆβ–ˆβ–ˆβ–ˆ | 884MB / 2.20GB 
 
 
 
79
  ...d_model/model.safetensors: 17%|β–ˆβ–‹ | 1.62GB / 9.35GB 
 
 
 
80
  ...timizer_state.safetensors: 43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 940MB / 2.20GB 
 
 
 
81
  ...d_model/model.safetensors: 19%|β–ˆβ–‰ | 1.82GB / 9.35GB 
 
 
 
82
  ...timizer_state.safetensors: 46%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 1.02GB / 2.20GB 
 
 
 
83
  ...d_model/model.safetensors: 21%|β–ˆβ–ˆβ– | 2.01GB / 9.35GB 
 
 
 
84
  ...timizer_state.safetensors: 50%|β–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 1.09GB / 2.20GB 
 
 
 
85
  ...d_model/model.safetensors: 22%|β–ˆβ–ˆβ– | 2.08GB / 9.35GB 
 
 
 
86
  ...timizer_state.safetensors: 53%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 1.17GB / 2.20GB 
 
 
 
87
  ...d_model/model.safetensors: 22%|β–ˆβ–ˆβ– | 2.08GB / 9.35GB 
 
 
 
88
  ...timizer_state.safetensors: 56%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 1.23GB / 2.20GB 
 
 
 
89
  ...d_model/model.safetensors: 24%|β–ˆβ–ˆβ–Ž | 2.22GB / 9.35GB 
 
 
 
90
  ...timizer_state.safetensors: 59%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 1.30GB / 2.20GB 
 
 
 
91
  ...d_model/model.safetensors: 24%|β–ˆβ–ˆβ–Ž | 2.22GB / 9.35GB 
 
 
 
92
  ...timizer_state.safetensors: 63%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 1.38GB / 2.20GB 
 
 
 
93
  ...d_model/model.safetensors: 24%|β–ˆβ–ˆβ– | 2.27GB / 9.35GB 
 
 
 
94
  ...timizer_state.safetensors: 66%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 1.44GB / 2.20GB 
 
 
 
95
  ...d_model/model.safetensors: 27%|β–ˆβ–ˆβ–‹ | 2.50GB / 9.35GB 
 
 
 
96
  ...timizer_state.safetensors: 68%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 1.50GB / 2.20GB 
 
 
 
97
  ...d_model/model.safetensors: 28%|β–ˆβ–ˆβ–Š | 2.61GB / 9.35GB 
 
 
 
98
  ...timizer_state.safetensors: 71%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 1.55GB / 2.20GB 
 
 
 
99
  ...d_model/model.safetensors: 28%|β–ˆβ–ˆβ–Š | 2.62GB / 9.35GB 
 
 
 
100
  ...timizer_state.safetensors: 74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 1.63GB / 2.20GB 
 
 
 
101
  ...d_model/model.safetensors: 28%|β–ˆβ–ˆβ–Š | 2.64GB / 9.35GB 
 
 
 
102
  ...timizer_state.safetensors: 78%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 1.71GB / 2.20GB 
 
 
 
103
  ...d_model/model.safetensors: 29%|β–ˆβ–ˆβ–‰ | 2.71GB / 9.35GB 
 
 
 
104
  ...timizer_state.safetensors: 81%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 1.77GB / 2.20GB 
 
 
 
105
  ...d_model/model.safetensors: 30%|β–ˆβ–ˆβ–‰ | 2.78GB / 9.35GB 
 
 
 
106
  ...timizer_state.safetensors: 84%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 1.84GB / 2.20GB 
 
 
 
107
  ...d_model/model.safetensors: 31%|β–ˆβ–ˆβ–ˆ | 2.86GB / 9.35GB 
 
 
 
108
  ...timizer_state.safetensors: 87%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 1.90GB / 2.20GB 
 
 
 
109
  ...d_model/model.safetensors: 31%|β–ˆβ–ˆβ–ˆ | 2.92GB / 9.35GB 
 
 
 
110
  ...timizer_state.safetensors: 90%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 1.97GB / 2.20GB 
 
 
 
111
  ...d_model/model.safetensors: 32%|β–ˆβ–ˆβ–ˆβ– | 2.98GB / 9.35GB 
 
 
112
  ...timizer_state.safetensors: 91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 1.99GB / 2.20GB 
 
 
 
113
  ...d_model/model.safetensors: 32%|β–ˆβ–ˆβ–ˆβ– | 3.02GB / 9.35GB 
 
 
114
  ...timizer_state.safetensors: 93%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž| 2.04GB / 2.20GB 
 
 
 
115
  ...d_model/model.safetensors: 33%|β–ˆβ–ˆβ–ˆβ–Ž | 3.08GB / 9.35GB 
 
 
 
116
  ...timizer_state.safetensors: 96%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ| 2.10GB / 2.20GB 
 
 
 
117
  ...d_model/model.safetensors: 33%|β–ˆβ–ˆβ–ˆβ–Ž | 3.09GB / 9.35GB 
 
 
 
118
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
119
  ...d_model/model.safetensors: 35%|β–ˆβ–ˆβ–ˆβ– | 3.23GB / 9.35GB 
 
 
 
120
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
121
  ...d_model/model.safetensors: 38%|β–ˆβ–ˆβ–ˆβ–Š | 3.53GB / 9.35GB 
 
 
 
122
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
123
  ...d_model/model.safetensors: 40%|β–ˆβ–ˆβ–ˆβ–ˆ | 3.78GB / 9.35GB 
 
 
 
124
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
125
  ...d_model/model.safetensors: 43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 4.03GB / 9.35GB 
 
 
 
126
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
127
  ...d_model/model.safetensors: 45%|β–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 4.23GB / 9.35GB 
 
 
 
128
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
129
  ...d_model/model.safetensors: 48%|β–ˆβ–ˆβ–ˆβ–ˆβ–Š | 4.46GB / 9.35GB 
 
 
 
130
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
131
  ...d_model/model.safetensors: 50%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 4.68GB / 9.35GB 
 
 
 
132
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
133
  ...d_model/model.safetensors: 52%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 4.86GB / 9.35GB 
 
 
 
134
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
135
  ...d_model/model.safetensors: 54%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 5.03GB / 9.35GB 
 
 
136
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
137
  ...d_model/model.safetensors: 56%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 5.22GB / 9.35GB 
 
 
138
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
139
  ...d_model/model.safetensors: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 5.38GB / 9.35GB 
 
 
140
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
141
  ...d_model/model.safetensors: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 5.38GB / 9.35GB 
 
 
142
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
143
  ...d_model/model.safetensors: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 5.38GB / 9.35GB 
 
 
144
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
145
  ...d_model/model.safetensors: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 5.39GB / 9.35GB 
 
 
 
146
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
147
  ...d_model/model.safetensors: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 5.41GB / 9.35GB 
 
 
 
148
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
149
  ...d_model/model.safetensors: 60%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 5.64GB / 9.35GB 
 
 
 
150
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
151
  ...d_model/model.safetensors: 63%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 5.87GB / 9.35GB 
 
 
 
152
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
153
  ...d_model/model.safetensors: 65%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 6.10GB / 9.35GB 
 
 
 
154
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
155
  ...d_model/model.safetensors: 67%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 6.31GB / 9.35GB 
 
 
 
156
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
157
  ...d_model/model.safetensors: 70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 6.51GB / 9.35GB 
 
 
158
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
159
  ...d_model/model.safetensors: 72%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 6.70GB / 9.35GB 
 
 
160
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
161
  ...d_model/model.safetensors: 74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 6.89GB / 9.35GB 
 
 
162
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
163
  ...d_model/model.safetensors: 75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 6.98GB / 9.35GB 
 
 
 
164
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
165
  ...d_model/model.safetensors: 75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 6.99GB / 9.35GB 
 
 
 
166
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
167
  ...d_model/model.safetensors: 75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 7.01GB / 9.35GB 
 
 
 
168
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
169
  ...d_model/model.safetensors: 75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 7.06GB / 9.35GB 
 
 
 
170
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
171
  ...d_model/model.safetensors: 77%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 7.24GB / 9.35GB 
 
 
 
172
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
173
  ...d_model/model.safetensors: 80%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 7.45GB / 9.35GB 
 
 
 
174
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
175
  ...d_model/model.safetensors: 82%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 7.65GB / 9.35GB 
 
 
 
176
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
177
  ...d_model/model.safetensors: 84%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 7.85GB / 9.35GB 
 
 
178
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
179
  ...d_model/model.safetensors: 86%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 8.05GB / 9.35GB 
 
 
 
180
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
181
  ...d_model/model.safetensors: 88%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 8.25GB / 9.35GB 
 
 
182
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
183
  ...d_model/model.safetensors: 90%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 8.45GB / 9.35GB 
 
 
184
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
185
  ...d_model/model.safetensors: 93%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž| 8.67GB / 9.35GB 
 
 
 
186
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
187
  ...d_model/model.safetensors: 95%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 8.86GB / 9.35GB 
 
 
188
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
189
  ...d_model/model.safetensors: 97%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹| 9.07GB / 9.35GB 
 
 
190
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
191
  ...d_model/model.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.27GB / 9.35GB 
 
 
192
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
 
 
 
193
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.34GB / 9.35GB 
 
 
 
 
194
  ...zer_processor.safetensors: 14%|β–ˆβ– | 109B / 768B 
 
 
 
 
 
195
  ...zer_processor.safetensors: 14%|β–ˆβ– | 109B / 768B 
 
 
 
 
 
 
196
  ...ate/rng_state.safetensors: 14%|β–ˆβ– | 2.23kB / 15.7kB 
 
 
197
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.16GB / 2.20GB 
 
 
 
198
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.34GB / 9.35GB 
 
 
 
 
199
  ...zer_processor.safetensors: 14%|β–ˆβ– | 109B / 768B 
 
 
 
 
 
200
  ...zer_processor.safetensors: 14%|β–ˆβ– | 109B / 768B 
 
 
 
 
 
 
201
  ...ate/rng_state.safetensors: 14%|β–ˆβ– | 2.23kB / 15.7kB 
 
 
 
202
  ...timizer_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.17GB / 2.20GB 
 
 
 
203
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.34GB / 9.35GB 
 
 
 
 
204
  ...zer_processor.safetensors: 43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 327B / 768B 
 
 
 
 
 
205
  ...zer_processor.safetensors: 43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 327B / 768B 
 
 
 
 
 
 
206
  ...ate/rng_state.safetensors: 43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 6.69kB / 15.7kB 
 
 
 
207
  ...timizer_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.18GB / 2.20GB 
 
 
 
208
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
209
  ...zer_processor.safetensors: 70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 537B / 768B 
 
 
 
 
 
210
  ...zer_processor.safetensors: 70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 537B / 768B 
 
 
 
 
 
 
211
  ...ate/rng_state.safetensors: 70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 11.0kB / 15.7kB 
 
 
 
212
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.19GB / 2.20GB 
 
 
 
213
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
214
  ...zer_processor.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 755B / 768B 
 
 
 
 
 
215
  ...zer_processor.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 755B / 768B 
 
 
 
 
 
 
216
  ...ate/rng_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 15.4kB / 15.7kB 
 
 
 
217
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.19GB / 2.20GB 
 
 
 
218
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
219
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
 
 
 
 
 
220
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
 
 
 
 
 
 
221
  ...ate/rng_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 15.6kB / 15.7kB 
 
 
 
222
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.19GB / 2.20GB 
 
 
 
223
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
224
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
 
 
 
 
 
225
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
 
 
 
 
 
 
226
  ...ate/rng_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 15.6kB / 15.7kB 
 
 
227
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.19GB / 2.20GB 
 
 
 
228
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
229
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
 
 
 
 
 
230
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
 
 
 
 
 
 
231
  ...ate/rng_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 15.6kB / 15.7kB 
 
 
232
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.19GB / 2.20GB 
 
 
 
233
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
234
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
 
 
 
 
 
235
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
 
 
 
 
 
 
236
  ...ate/rng_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 15.6kB / 15.7kB 
 
 
237
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
 
 
 
238
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
239
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
240
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
 
241
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
 
 
 
242
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
 
 
 
243
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
244
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
245
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
 
246
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
 
 
247
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
 
 
 
248
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
249
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
250
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
 
251
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
 
 
252
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
 
 
 
253
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
254
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
255
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
 
256
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
 
 
257
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
 
 
 
258
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
259
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
260
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
 
261
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
 
 
262
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
 
 
 
263
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
264
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
265
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
 
266
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
 
 
267
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
 
 
 
268
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
 
 
 
 
269
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
270
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
 
 
 
 
 
 
271
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
 
 
272
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB
 
273
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB
 
274
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B
 
275
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B
 
276
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ === Starting Training ===
2
+ The following values were not passed to `accelerate launch` and had defaults used instead:
3
+ `--num_processes` was set to a value of `1`
4
+ `--num_machines` was set to a value of `1`
5
+ `--mixed_precision` was set to a value of `'no'`
6
+ `--dynamo_backend` was set to a value of `'no'`
7
+ To avoid this warning pass in values for each of the problematic parameters or run `accelerate config`.
8
+ WARNING:lerobot.configs.policies:Device 'mps' is not available. Switching to 'cuda'.
9
+ WARNING:lerobot.configs.policies:Device 'mps' is not available. Switching to 'cuda'.
10
+ INFO 2026-03-24 02:55:56 ot_train.py:198 {'batch_size': 16,
11
+ 'checkpoint_path': None,
12
+ 'cudnn_deterministic': False,
13
+ 'dataset': {'episodes': None,
14
+ 'image_transforms': {'enable': False,
15
+ 'max_num_transforms': 3,
16
+ 'random_order': False,
17
+ 'tfs': {'affine': {'kwargs': {'degrees': [-5.0,
18
+ 5.0],
19
+ 'translate': [0.05,
20
+ 0.05]},
21
+ 'type': 'RandomAffine',
22
+ 'weight': 1.0},
23
+ 'brightness': {'kwargs': {'brightness': [0.8,
24
+ 1.2]},
25
+ 'type': 'ColorJitter',
26
+ 'weight': 1.0},
27
+ 'contrast': {'kwargs': {'contrast': [0.8,
28
+ 1.2]},
29
+ 'type': 'ColorJitter',
30
+ 'weight': 1.0},
31
+ 'hue': {'kwargs': {'hue': [-0.05,
32
+ 0.05]},
33
+ 'type': 'ColorJitter',
34
+ 'weight': 1.0},
35
+ 'saturation': {'kwargs': {'saturation': [0.5,
36
+ 1.5]},
37
+ 'type': 'ColorJitter',
38
+ 'weight': 1.0},
39
+ 'sharpness': {'kwargs': {'sharpness': [0.5,
40
+ 1.5]},
41
+ 'type': 'SharpnessJitter',
42
+ 'weight': 1.0}}},
43
+ 'repo_id': 'so100:/ephemeral/community_dataset_v3:/workspace/pi05-so100-diverse/filtered_index.json:/workspace/pi05-so100-diverse/norm_stats.json',
44
+ 'revision': None,
45
+ 'root': None,
46
+ 'streaming': False,
47
+ 'use_imagenet_stats': True,
48
+ 'video_backend': 'torchcodec'},
49
+ 'env': None,
50
+ 'eval': {'batch_size': 50, 'n_episodes': 50, 'use_async_envs': False},
51
+ 'eval_freq': 20000,
52
+ 'job_name': 'pi05',
53
+ 'log_freq': 50,
54
+ 'num_workers': 4,
55
+ 'optimizer': {'betas': [0.9, 0.95],
56
+ 'eps': 1e-08,
57
+ 'grad_clip_norm': 1.0,
58
+ 'lr': 2.5e-05,
59
+ 'type': 'adamw',
60
+ 'weight_decay': 0.01},
61
+ 'output_dir': '/ephemeral/production_run',
62
+ 'peft': None,
63
+ 'policy': {'action_expert_variant': 'gemma_300m',
64
+ 'chunk_size': 50,
65
+ 'compile_mode': 'max-autotune',
66
+ 'compile_model': False,
67
+ 'device': 'cuda',
68
+ 'dtype': 'bfloat16',
69
+ 'empty_cameras': 0,
70
+ 'freeze_vision_encoder': False,
71
+ 'gradient_checkpointing': False,
72
+ 'image_resolution': [224, 224],
73
+ 'input_features': {'observation.images.base_0_rgb': {'shape': [3,
74
+ 224,
75
+ 224],
76
+ 'type': <FeatureType.VISUAL: 'VISUAL'>},
77
+ 'observation.images.left_wrist_0_rgb': {'shape': [3,
78
+ 224,
79
+ 224],
80
+ 'type': <FeatureType.VISUAL: 'VISUAL'>},
81
+ 'observation.images.right_wrist_0_rgb': {'shape': [3,
82
+ 224,
83
+ 224],
84
+ 'type': <FeatureType.VISUAL: 'VISUAL'>},
85
+ 'observation.state': {'shape': [32],
86
+ 'type': <FeatureType.STATE: 'STATE'>}},
87
+ 'license': None,
88
+ 'max_action_dim': 32,
89
+ 'max_period': 4.0,
90
+ 'max_state_dim': 32,
91
+ 'min_period': 0.004,
92
+ 'n_action_steps': 50,
93
+ 'n_obs_steps': 1,
94
+ 'normalization_mapping': {'ACTION': <NormalizationMode.MEAN_STD: 'MEAN_STD'>,
95
+ 'STATE': <NormalizationMode.MEAN_STD: 'MEAN_STD'>,
96
+ 'VISUAL': <NormalizationMode.IDENTITY: 'IDENTITY'>},
97
+ 'num_inference_steps': 10,
98
+ 'optimizer_betas': [0.9, 0.95],
99
+ 'optimizer_eps': 1e-08,
100
+ 'optimizer_grad_clip_norm': 1.0,
101
+ 'optimizer_lr': 2.5e-05,
102
+ 'optimizer_weight_decay': 0.01,
103
+ 'output_features': {'action': {'shape': [32],
104
+ 'type': <FeatureType.ACTION: 'ACTION'>}},
105
+ 'paligemma_variant': 'gemma_2b',
106
+ 'pretrained_path': 'lerobot/pi05_base',
107
+ 'private': None,
108
+ 'push_to_hub': True,
109
+ 'repo_id': 'StrongRoboticsLab/pi05-so100-diverse',
110
+ 'rtc_config': None,
111
+ 'scheduler_decay_lr': 2.5e-06,
112
+ 'scheduler_decay_steps': 340000,
113
+ 'scheduler_warmup_steps': 1000,
114
+ 'tags': None,
115
+ 'time_sampling_beta_alpha': 1.5,
116
+ 'time_sampling_beta_beta': 1.0,
117
+ 'time_sampling_offset': 0.001,
118
+ 'time_sampling_scale': 0.999,
119
+ 'tokenizer_max_length': 200,
120
+ 'train_expert_only': True,
121
+ 'type': 'pi05',
122
+ 'use_amp': False,
123
+ 'use_peft': False},
124
+ 'rabc_epsilon': 1e-06,
125
+ 'rabc_head_mode': 'sparse',
126
+ 'rabc_kappa': 0.01,
127
+ 'rabc_progress_path': None,
128
+ 'rename_map': {'observation.images.image': 'observation.images.base_0_rgb',
129
+ 'observation.images.image2': 'observation.images.left_wrist_0_rgb'},
130
+ 'resume': False,
131
+ 'save_checkpoint': True,
132
+ 'save_freq': 500,
133
+ 'scheduler': {'decay_lr': 2.5e-06,
134
+ 'num_decay_steps': 340000,
135
+ 'num_warmup_steps': 1000,
136
+ 'peak_lr': 2.5e-05,
137
+ 'type': 'cosine_decay_with_warmup'},
138
+ 'seed': 1000,
139
+ 'steps': 340000,
140
+ 'tolerance_s': 0.0001,
141
+ 'use_policy_training_preset': True,
142
+ 'use_rabc': False,
143
+ 'wandb': {'add_tags': True,
144
+ 'disable_artifact': False,
145
+ 'enable': True,
146
+ 'entity': None,
147
+ 'mode': None,
148
+ 'notes': None,
149
+ 'project': 'pi05-so100-diverse',
150
+ 'run_id': None}}
151
+ INFO 2026-03-24 02:55:58 db_utils.py:117 Logs will be synced with wandb.
152
+ INFO 2026-03-24 02:55:58 db_utils.py:118 Track this run --> https://wandb.ai/gptjustin-strong-robotics-lab/pi05-so100-diverse/runs/7zuftzeh
153
+ INFO 2026-03-24 02:55:58 ot_train.py:222 Creating dataset
154
+ INFO 2026-03-24 02:56:01 ot_train.py:240 Creating policy
155
+ INFO 2026-03-24 02:57:56 _client.py:1025 HTTP Request: HEAD https://huggingface.co/lerobot/pi05_base/resolve/main/model.safetensors "HTTP/1.1 302 Found"
156
+ INFO 2026-03-24 02:57:56 _client.py:1025 HTTP Request: GET https://huggingface.co/api/models/lerobot/pi05_base/xet-read-token/9e55186ad36e66b95cda57bc47818d9e6237ae30 "HTTP/1.1 200 OK"
157
+ WARNING 2026-03-24 02:58:13 ng_pi05.py:1102 Vision embedding key might need handling: paligemma_with_expert.paligemma.model.vision_tower.vision_model.embeddings.patch_embedding.bias
158
+ WARNING 2026-03-24 02:58:13 ng_pi05.py:1102 Vision embedding key might need handling: paligemma_with_expert.paligemma.model.vision_tower.vision_model.embeddings.patch_embedding.weight
159
+ INFO 2026-03-24 02:58:18 _client.py:1025 HTTP Request: HEAD https://huggingface.co/lerobot/pi05_base/resolve/main/policy_preprocessor.json "HTTP/1.1 307 Temporary Redirect"
160
+ INFO 2026-03-24 02:58:18 _client.py:1025 HTTP Request: HEAD https://huggingface.co/api/resolve-cache/models/lerobot/pi05_base/9e55186ad36e66b95cda57bc47818d9e6237ae30/policy_preprocessor.json "HTTP/1.1 200 OK"
161
+ INFO 2026-03-24 02:58:18 _client.py:1025 HTTP Request: GET https://huggingface.co/api/resolve-cache/models/lerobot/pi05_base/9e55186ad36e66b95cda57bc47818d9e6237ae30/policy_preprocessor.json "HTTP/1.1 200 OK"
162
+ INFO 2026-03-24 02:58:18 _client.py:1025 HTTP Request: HEAD https://huggingface.co/google/paligemma-3b-pt-224/resolve/main/config.json "HTTP/1.1 200 OK"
163
+ INFO 2026-03-24 02:58:18 _client.py:1025 HTTP Request: GET https://huggingface.co/google/paligemma-3b-pt-224/resolve/main/config.json "HTTP/1.1 200 OK"
164
+ INFO 2026-03-24 02:58:18 _client.py:1025 HTTP Request: HEAD https://huggingface.co/google/paligemma-3b-pt-224/resolve/main/tokenizer_config.json "HTTP/1.1 200 OK"
165
+ INFO 2026-03-24 02:58:19 _client.py:1025 HTTP Request: GET https://huggingface.co/google/paligemma-3b-pt-224/resolve/main/tokenizer_config.json "HTTP/1.1 200 OK"
166
+ INFO 2026-03-24 02:58:19 _client.py:1025 HTTP Request: GET https://huggingface.co/api/models/google/paligemma-3b-pt-224/tree/main/additional_chat_templates?recursive=false&expand=false "HTTP/1.1 404 Not Found"
167
+ INFO 2026-03-24 02:58:19 _client.py:1025 HTTP Request: GET https://huggingface.co/api/models/google/paligemma-3b-pt-224/tree/main?recursive=true&expand=false "HTTP/1.1 200 OK"
168
+ INFO 2026-03-24 02:58:19 _client.py:1025 HTTP Request: HEAD https://huggingface.co/google/paligemma-3b-pt-224/resolve/main/tokenizer.json "HTTP/1.1 302 Found"
169
+ INFO 2026-03-24 02:58:19 _client.py:1025 HTTP Request: GET https://huggingface.co/api/models/google/paligemma-3b-pt-224/xet-read-token/35e4f46485b4d07967e7e9935bc3786aad50687c "HTTP/1.1 200 OK"
170
+ INFO 2026-03-24 02:58:19 _client.py:1025 HTTP Request: HEAD https://huggingface.co/google/paligemma-3b-pt-224/resolve/main/added_tokens.json "HTTP/1.1 200 OK"
171
+ INFO 2026-03-24 02:58:19 _client.py:1025 HTTP Request: GET https://huggingface.co/google/paligemma-3b-pt-224/resolve/main/added_tokens.json "HTTP/1.1 200 OK"
172
+ INFO 2026-03-24 02:58:19 _client.py:1025 HTTP Request: HEAD https://huggingface.co/google/paligemma-3b-pt-224/resolve/main/special_tokens_map.json "HTTP/1.1 200 OK"
173
+ INFO 2026-03-24 02:58:19 _client.py:1025 HTTP Request: GET https://huggingface.co/google/paligemma-3b-pt-224/resolve/main/special_tokens_map.json "HTTP/1.1 200 OK"
174
+ INFO 2026-03-24 02:58:19 _client.py:1025 HTTP Request: HEAD https://huggingface.co/google/paligemma-3b-pt-224/resolve/main/chat_template.jinja "HTTP/1.1 404 Not Found"
175
+ INFO 2026-03-24 02:58:21 _client.py:1025 HTTP Request: GET https://huggingface.co/api/models/google/paligemma-3b-pt-224 "HTTP/1.1 200 OK"
176
+ INFO 2026-03-24 02:58:21 _client.py:1025 HTTP Request: HEAD https://huggingface.co/lerobot/pi05_base/resolve/main/policy_postprocessor.json "HTTP/1.1 307 Temporary Redirect"
177
+ INFO 2026-03-24 02:58:21 _client.py:1025 HTTP Request: HEAD https://huggingface.co/api/resolve-cache/models/lerobot/pi05_base/9e55186ad36e66b95cda57bc47818d9e6237ae30/policy_postprocessor.json "HTTP/1.1 200 OK"
178
+ INFO 2026-03-24 02:58:21 _client.py:1025 HTTP Request: GET https://huggingface.co/api/resolve-cache/models/lerobot/pi05_base/9e55186ad36e66b95cda57bc47818d9e6237ae30/policy_postprocessor.json "HTTP/1.1 200 OK"
179
+ INFO 2026-03-24 02:58:21 ot_train.py:295 Creating optimizer and scheduler
180
+ INFO 2026-03-24 02:58:21 ot_train.py:330 Output dir: /ephemeral/production_run
181
+ INFO 2026-03-24 02:58:21 ot_train.py:337 cfg.steps=340000 (340K)
182
+ INFO 2026-03-24 02:58:21 ot_train.py:338 dataset.num_frames=4923840 (5M)
183
+ INFO 2026-03-24 02:58:21 ot_train.py:339 dataset.num_episodes=10155
184
+ INFO 2026-03-24 02:58:21 ot_train.py:342 Effective batch size: 16 x 1 = 16
185
+ INFO 2026-03-24 02:58:21 ot_train.py:343 num_learnable_params=693422112 (693M)
186
+ INFO 2026-03-24 02:58:21 ot_train.py:344 num_total_params=4143404816 (4B)
187
+ The PI05 model is a direct port of the OpenPI implementation.
188
+ This implementation follows the original OpenPI structure for compatibility.
189
+ Original implementation: https://github.com/Physical-Intelligence/openpi
190
+ Loading model from: lerobot/pi05_base
191
+ βœ“ Loaded state dict from model.safetensors
192
+ Remapped 812 state dict keys
193
+ All keys loaded successfully!
194
+
195
+
196
+ WARNING 2026-03-24 02:59:05 db_utils.py:181 WandB logging of key "loss_per_dim" was ignored as its type "<class 'list'>" is not handled by this wrapper.
197
+
198
+ WARNING 2026-03-24 02:59:47 db_utils.py:181 WandB logging of key "loss_per_dim" was ignored as its type "<class 'list'>" is not handled by this wrapper.
199
+
200
+ WARNING 2026-03-24 03:00:30 db_utils.py:181 WandB logging of key "loss_per_dim" was ignored as its type "<class 'list'>" is not handled by this wrapper.
201
+
202
+ WARNING 2026-03-24 03:01:13 db_utils.py:181 WandB logging of key "loss_per_dim" was ignored as its type "<class 'list'>" is not handled by this wrapper.
203
+
204
+ WARNING 2026-03-24 03:01:56 db_utils.py:181 WandB logging of key "loss_per_dim" was ignored as its type "<class 'list'>" is not handled by this wrapper.
205
+
206
+ WARNING 2026-03-24 03:02:39 db_utils.py:181 WandB logging of key "loss_per_dim" was ignored as its type "<class 'list'>" is not handled by this wrapper.
207
+
208
+ WARNING 2026-03-24 03:03:22 db_utils.py:181 WandB logging of key "loss_per_dim" was ignored as its type "<class 'list'>" is not handled by this wrapper.
209
+
210
+ WARNING 2026-03-24 03:04:05 db_utils.py:181 WandB logging of key "loss_per_dim" was ignored as its type "<class 'list'>" is not handled by this wrapper.
211
+
212
+ WARNING 2026-03-24 03:04:48 db_utils.py:181 WandB logging of key "loss_per_dim" was ignored as its type "<class 'list'>" is not handled by this wrapper.
213
+
214
+ WARNING 2026-03-24 03:05:31 db_utils.py:181 WandB logging of key "loss_per_dim" was ignored as its type "<class 'list'>" is not handled by this wrapper.
215
+ INFO 2026-03-24 03:05:31 ot_train.py:461 Checkpoint policy after step 500
216
+ INFO 2026-03-24 03:05:55 _client.py:1025 HTTP Request: POST https://huggingface.co/api/models/StrongRoboticsLab/pi05-so100-diverse/preupload/main "HTTP/1.1 200 OK"
217
+ INFO 2026-03-24 03:05:55 _client.py:1025 HTTP Request: POST https://huggingface.co/StrongRoboticsLab/pi05-so100-diverse.git/info/lfs/objects/batch "HTTP/1.1 200 OK"
218
+ INFO 2026-03-24 03:05:55 _client.py:1025 HTTP Request: GET https://huggingface.co/api/models/StrongRoboticsLab/pi05-so100-diverse/xet-write-token/main "HTTP/1.1 200 OK"
219
+
220
+
221
+
222
+
223
  ...timizer_state.safetensors: 0%| | 28.1kB / 2.20GB 
224
+
225
+
226
+
227
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
228
+
229
+
230
  ...timizer_state.safetensors: 0%| | 28.1kB / 2.20GB 
231
+
232
+
233
+
234
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
235
+
236
+
237
  ...timizer_state.safetensors: 1%| | 14.9MB / 2.20GB 
238
+
239
+
240
+
241
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
242
+
243
+
244
+
245
  ...timizer_state.safetensors: 3%|β–Ž | 64.0MB / 2.20GB 
246
+
247
+
248
+
249
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
250
+
251
+
252
+
253
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
254
+
255
+
256
+
257
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
258
+
259
+
260
+
261
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
262
+
263
+
264
+
265
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
266
+
267
+
268
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
269
+
270
+
271
+
272
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
273
+
274
+
275
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
276
+
277
+
278
+
279
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
280
+
281
+
282
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
283
+
284
+
285
+
286
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
287
+
288
+
289
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
290
+
291
+
292
+
293
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
294
+
295
+
296
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
297
+
298
+
299
+
300
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
301
+
302
+
303
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
304
+
305
+
306
+
307
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
308
+
309
+
310
  ...timizer_state.safetensors: 3%|β–Ž | 66.7MB / 2.20GB 
311
+
312
+
313
+
314
  ...d_model/model.safetensors: 0%| | 98.2kB / 9.35GB 
315
+
316
+
317
  ...timizer_state.safetensors: 3%|β–Ž | 71.5MB / 2.20GB 
318
+
319
+
320
+
321
  ...d_model/model.safetensors: 0%| | 5.09MB / 9.35GB 
322
+
323
+
324
+
325
  ...timizer_state.safetensors: 5%|β–Œ | 119MB / 2.20GB 
326
+
327
+
328
+
329
  ...d_model/model.safetensors: 1%| | 47.8MB / 9.35GB 
330
+
331
+
332
+
333
  ...timizer_state.safetensors: 6%|β–Œ | 134MB / 2.20GB 
334
+
335
+
336
+
337
  ...d_model/model.safetensors: 1%| | 66.7MB / 9.35GB 
338
+
339
+
340
+
341
  ...timizer_state.safetensors: 6%|β–Œ | 134MB / 2.20GB 
342
+
343
+
344
+
345
  ...d_model/model.safetensors: 1%| | 66.7MB / 9.35GB 
346
+
347
+
348
  ...timizer_state.safetensors: 6%|β–Œ | 134MB / 2.20GB 
349
+
350
+
351
+
352
  ...d_model/model.safetensors: 1%| | 66.7MB / 9.35GB 
353
+
354
+
355
  ...timizer_state.safetensors: 6%|β–Œ | 134MB / 2.20GB 
356
+
357
+
358
+
359
  ...d_model/model.safetensors: 1%| | 67.1MB / 9.35GB 
360
+
361
+
362
+
363
  ...timizer_state.safetensors: 7%|β–‹ | 146MB / 2.20GB 
364
+
365
+
366
+
367
  ...d_model/model.safetensors: 1%| | 78.3MB / 9.35GB 
368
+
369
+
370
+
371
  ...timizer_state.safetensors: 9%|β–Š | 191MB / 2.20GB 
372
+
373
+
374
+
375
  ...d_model/model.safetensors: 1%|▏ | 125MB / 9.35GB 
376
+
377
+
378
+
379
  ...timizer_state.safetensors: 9%|β–‰ | 201MB / 2.20GB 
380
+
381
+
382
+
383
  ...d_model/model.safetensors: 2%|▏ | 169MB / 9.35GB 
384
+
385
+
386
+
387
  ...timizer_state.safetensors: 9%|β–‰ | 207MB / 2.20GB 
388
+
389
+
390
+
391
  ...d_model/model.safetensors: 2%|▏ | 201MB / 9.35GB 
392
+
393
+
394
+
395
  ...timizer_state.safetensors: 12%|β–ˆβ– | 256MB / 2.20GB 
396
+
397
+
398
+
399
  ...d_model/model.safetensors: 2%|▏ | 201MB / 9.35GB 
400
+
401
+
402
+
403
  ...timizer_state.safetensors: 12%|β–ˆβ– | 267MB / 2.20GB 
404
+
405
+
406
+
407
  ...d_model/model.safetensors: 2%|▏ | 201MB / 9.35GB 
408
+
409
+
410
+
411
  ...timizer_state.safetensors: 12%|β–ˆβ– | 272MB / 2.20GB 
412
+
413
+
414
+
415
  ...d_model/model.safetensors: 2%|▏ | 204MB / 9.35GB 
416
+
417
+
418
+
419
  ...timizer_state.safetensors: 14%|β–ˆβ– | 307MB / 2.20GB 
420
+
421
+
422
+
423
  ...d_model/model.safetensors: 2%|▏ | 214MB / 9.35GB 
424
+
425
+
426
+
427
  ...timizer_state.safetensors: 15%|β–ˆβ–Œ | 334MB / 2.20GB 
428
+
429
+
430
+
431
  ...d_model/model.safetensors: 3%|β–Ž | 264MB / 9.35GB 
432
+
433
+
434
+
435
  ...timizer_state.safetensors: 15%|β–ˆβ–Œ | 334MB / 2.20GB 
436
+
437
+
438
+
439
  ...d_model/model.safetensors: 3%|β–Ž | 295MB / 9.35GB 
440
+
441
+
442
+
443
  ...timizer_state.safetensors: 16%|β–ˆβ–Œ | 348MB / 2.20GB 
444
+
445
+
446
+
447
  ...d_model/model.safetensors: 3%|β–Ž | 306MB / 9.35GB 
448
+
449
+
450
+
451
  ...timizer_state.safetensors: 18%|β–ˆβ–Š | 397MB / 2.20GB 
452
+
453
+
454
+
455
  ...d_model/model.safetensors: 4%|β–Ž | 344MB / 9.35GB 
456
+
457
+
458
+
459
  ...timizer_state.safetensors: 18%|β–ˆβ–Š | 402MB / 2.20GB 
460
+
461
+
462
+
463
  ...d_model/model.safetensors: 4%|▍ | 392MB / 9.35GB 
464
+
465
+
466
+
467
  ...timizer_state.safetensors: 19%|β–ˆβ–‰ | 425MB / 2.20GB 
468
+
469
+
470
+
471
  ...d_model/model.safetensors: 4%|▍ | 402MB / 9.35GB 
472
+
473
+
474
+
475
  ...timizer_state.safetensors: 23%|β–ˆβ–ˆβ–Ž | 498MB / 2.20GB 
476
+
477
+
478
+
479
  ...d_model/model.safetensors: 4%|▍ | 402MB / 9.35GB 
480
+
481
+
482
+
483
  ...timizer_state.safetensors: 26%|β–ˆβ–ˆβ–Œ | 560MB / 2.20GB 
484
+
485
+
486
+
487
  ...d_model/model.safetensors: 5%|β–Œ | 495MB / 9.35GB 
488
+
489
+
490
+
491
  ...timizer_state.safetensors: 29%|β–ˆβ–ˆβ–‰ | 637MB / 2.20GB 
492
+
493
+
494
+
495
  ...d_model/model.safetensors: 8%|β–Š | 779MB / 9.35GB 
496
+
497
+
498
+
499
  ...timizer_state.safetensors: 32%|β–ˆβ–ˆβ–ˆβ– | 706MB / 2.20GB 
500
+
501
+
502
+
503
  ...d_model/model.safetensors: 11%|β–ˆ | 1.02GB / 9.35GB 
504
+
505
+
506
+
507
  ...timizer_state.safetensors: 36%|β–ˆβ–ˆβ–ˆβ–Œ | 793MB / 2.20GB 
508
+
509
+
510
+
511
  ...d_model/model.safetensors: 13%|β–ˆβ–Ž | 1.24GB / 9.35GB 
512
+
513
+
514
+
515
  ...timizer_state.safetensors: 38%|β–ˆβ–ˆβ–ˆβ–Š | 824MB / 2.20GB 
516
+
517
+
518
+
519
  ...d_model/model.safetensors: 15%|β–ˆβ–Œ | 1.43GB / 9.35GB 
520
+
521
+
522
+
523
  ...timizer_state.safetensors: 40%|β–ˆβ–ˆβ–ˆβ–ˆ | 884MB / 2.20GB 
524
+
525
+
526
+
527
  ...d_model/model.safetensors: 17%|β–ˆβ–‹ | 1.62GB / 9.35GB 
528
+
529
+
530
+
531
  ...timizer_state.safetensors: 43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 940MB / 2.20GB 
532
+
533
+
534
+
535
  ...d_model/model.safetensors: 19%|β–ˆβ–‰ | 1.82GB / 9.35GB 
536
+
537
+
538
+
539
  ...timizer_state.safetensors: 46%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 1.02GB / 2.20GB 
540
+
541
+
542
+
543
  ...d_model/model.safetensors: 21%|β–ˆβ–ˆβ– | 2.01GB / 9.35GB 
544
+
545
+
546
+
547
  ...timizer_state.safetensors: 50%|β–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 1.09GB / 2.20GB 
548
+
549
+
550
+
551
  ...d_model/model.safetensors: 22%|β–ˆβ–ˆβ– | 2.08GB / 9.35GB 
552
+
553
+
554
+
555
  ...timizer_state.safetensors: 53%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 1.17GB / 2.20GB 
556
+
557
+
558
+
559
  ...d_model/model.safetensors: 22%|β–ˆβ–ˆβ– | 2.08GB / 9.35GB 
560
+
561
+
562
+
563
  ...timizer_state.safetensors: 56%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 1.23GB / 2.20GB 
564
+
565
+
566
+
567
  ...d_model/model.safetensors: 24%|β–ˆβ–ˆβ–Ž | 2.22GB / 9.35GB 
568
+
569
+
570
+
571
  ...timizer_state.safetensors: 59%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 1.30GB / 2.20GB 
572
+
573
+
574
+
575
  ...d_model/model.safetensors: 24%|β–ˆβ–ˆβ–Ž | 2.22GB / 9.35GB 
576
+
577
+
578
+
579
  ...timizer_state.safetensors: 63%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 1.38GB / 2.20GB 
580
+
581
+
582
+
583
  ...d_model/model.safetensors: 24%|β–ˆβ–ˆβ– | 2.27GB / 9.35GB 
584
+
585
+
586
+
587
  ...timizer_state.safetensors: 66%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 1.44GB / 2.20GB 
588
+
589
+
590
+
591
  ...d_model/model.safetensors: 27%|β–ˆβ–ˆβ–‹ | 2.50GB / 9.35GB 
592
+
593
+
594
+
595
  ...timizer_state.safetensors: 68%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 1.50GB / 2.20GB 
596
+
597
+
598
+
599
  ...d_model/model.safetensors: 28%|β–ˆβ–ˆβ–Š | 2.61GB / 9.35GB 
600
+
601
+
602
+
603
  ...timizer_state.safetensors: 71%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 1.55GB / 2.20GB 
604
+
605
+
606
+
607
  ...d_model/model.safetensors: 28%|β–ˆβ–ˆβ–Š | 2.62GB / 9.35GB 
608
+
609
+
610
+
611
  ...timizer_state.safetensors: 74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 1.63GB / 2.20GB 
612
+
613
+
614
+
615
  ...d_model/model.safetensors: 28%|β–ˆβ–ˆβ–Š | 2.64GB / 9.35GB 
616
+
617
+
618
+
619
  ...timizer_state.safetensors: 78%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 1.71GB / 2.20GB 
620
+
621
+
622
+
623
  ...d_model/model.safetensors: 29%|β–ˆβ–ˆβ–‰ | 2.71GB / 9.35GB 
624
+
625
+
626
+
627
  ...timizer_state.safetensors: 81%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 1.77GB / 2.20GB 
628
+
629
+
630
+
631
  ...d_model/model.safetensors: 30%|β–ˆβ–ˆβ–‰ | 2.78GB / 9.35GB 
632
+
633
+
634
+
635
  ...timizer_state.safetensors: 84%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 1.84GB / 2.20GB 
636
+
637
+
638
+
639
  ...d_model/model.safetensors: 31%|β–ˆβ–ˆβ–ˆ | 2.86GB / 9.35GB 
640
+
641
+
642
+
643
  ...timizer_state.safetensors: 87%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 1.90GB / 2.20GB 
644
+
645
+
646
+
647
  ...d_model/model.safetensors: 31%|β–ˆβ–ˆβ–ˆ | 2.92GB / 9.35GB 
648
+
649
+
650
+
651
  ...timizer_state.safetensors: 90%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 1.97GB / 2.20GB 
652
+
653
+
654
+
655
  ...d_model/model.safetensors: 32%|β–ˆβ–ˆβ–ˆβ– | 2.98GB / 9.35GB 
656
+
657
+
658
  ...timizer_state.safetensors: 91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 1.99GB / 2.20GB 
659
+
660
+
661
+
662
  ...d_model/model.safetensors: 32%|β–ˆβ–ˆβ–ˆβ– | 3.02GB / 9.35GB 
663
+
664
+
665
  ...timizer_state.safetensors: 93%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž| 2.04GB / 2.20GB 
666
+
667
+
668
+
669
  ...d_model/model.safetensors: 33%|β–ˆβ–ˆβ–ˆβ–Ž | 3.08GB / 9.35GB 
670
+
671
+
672
+
673
  ...timizer_state.safetensors: 96%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ| 2.10GB / 2.20GB 
674
+
675
+
676
+
677
  ...d_model/model.safetensors: 33%|β–ˆβ–ˆβ–ˆβ–Ž | 3.09GB / 9.35GB 
678
+
679
+
680
+
681
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
682
+
683
+
684
+
685
  ...d_model/model.safetensors: 35%|β–ˆβ–ˆβ–ˆβ– | 3.23GB / 9.35GB 
686
+
687
+
688
+
689
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
690
+
691
+
692
+
693
  ...d_model/model.safetensors: 38%|β–ˆβ–ˆβ–ˆβ–Š | 3.53GB / 9.35GB 
694
+
695
+
696
+
697
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
698
+
699
+
700
+
701
  ...d_model/model.safetensors: 40%|β–ˆβ–ˆβ–ˆβ–ˆ | 3.78GB / 9.35GB 
702
+
703
+
704
+
705
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
706
+
707
+
708
+
709
  ...d_model/model.safetensors: 43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 4.03GB / 9.35GB 
710
+
711
+
712
+
713
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
714
+
715
+
716
+
717
  ...d_model/model.safetensors: 45%|β–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 4.23GB / 9.35GB 
718
+
719
+
720
+
721
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
722
+
723
+
724
+
725
  ...d_model/model.safetensors: 48%|β–ˆβ–ˆβ–ˆβ–ˆβ–Š | 4.46GB / 9.35GB 
726
+
727
+
728
+
729
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
730
+
731
+
732
+
733
  ...d_model/model.safetensors: 50%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 4.68GB / 9.35GB 
734
+
735
+
736
+
737
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
738
+
739
+
740
+
741
  ...d_model/model.safetensors: 52%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 4.86GB / 9.35GB 
742
+
743
+
744
+
745
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
746
+
747
+
748
+
749
  ...d_model/model.safetensors: 54%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 5.03GB / 9.35GB 
750
+
751
+
752
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
753
+
754
+
755
+
756
  ...d_model/model.safetensors: 56%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 5.22GB / 9.35GB 
757
+
758
+
759
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
760
+
761
+
762
+
763
  ...d_model/model.safetensors: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 5.38GB / 9.35GB 
764
+
765
+
766
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
767
+
768
+
769
+
770
  ...d_model/model.safetensors: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 5.38GB / 9.35GB 
771
+
772
+
773
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
774
+
775
+
776
+
777
  ...d_model/model.safetensors: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 5.38GB / 9.35GB 
778
+
779
+
780
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
781
+
782
+
783
+
784
  ...d_model/model.safetensors: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 5.39GB / 9.35GB 
785
+
786
+
787
+
788
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
789
+
790
+
791
+
792
  ...d_model/model.safetensors: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 5.41GB / 9.35GB 
793
+
794
+
795
+
796
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
797
+
798
+
799
+
800
  ...d_model/model.safetensors: 60%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 5.64GB / 9.35GB 
801
+
802
+
803
+
804
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
805
+
806
+
807
+
808
  ...d_model/model.safetensors: 63%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 5.87GB / 9.35GB 
809
+
810
+
811
+
812
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
813
+
814
+
815
+
816
  ...d_model/model.safetensors: 65%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 6.10GB / 9.35GB 
817
+
818
+
819
+
820
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
821
+
822
+
823
+
824
  ...d_model/model.safetensors: 67%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 6.31GB / 9.35GB 
825
+
826
+
827
+
828
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
829
+
830
+
831
+
832
  ...d_model/model.safetensors: 70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 6.51GB / 9.35GB 
833
+
834
+
835
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
836
+
837
+
838
+
839
  ...d_model/model.safetensors: 72%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 6.70GB / 9.35GB 
840
+
841
+
842
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
843
+
844
+
845
+
846
  ...d_model/model.safetensors: 74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 6.89GB / 9.35GB 
847
+
848
+
849
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
850
+
851
+
852
+
853
  ...d_model/model.safetensors: 75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 6.98GB / 9.35GB 
854
+
855
+
856
+
857
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
858
+
859
+
860
+
861
  ...d_model/model.safetensors: 75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 6.99GB / 9.35GB 
862
+
863
+
864
+
865
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
866
+
867
+
868
+
869
  ...d_model/model.safetensors: 75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 7.01GB / 9.35GB 
870
+
871
+
872
+
873
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
874
+
875
+
876
+
877
  ...d_model/model.safetensors: 75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 7.06GB / 9.35GB 
878
+
879
+
880
+
881
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
882
+
883
+
884
+
885
  ...d_model/model.safetensors: 77%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 7.24GB / 9.35GB 
886
+
887
+
888
+
889
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
890
+
891
+
892
+
893
  ...d_model/model.safetensors: 80%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 7.45GB / 9.35GB 
894
+
895
+
896
+
897
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
898
+
899
+
900
+
901
  ...d_model/model.safetensors: 82%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 7.65GB / 9.35GB 
902
+
903
+
904
+
905
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
906
+
907
+
908
+
909
  ...d_model/model.safetensors: 84%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 7.85GB / 9.35GB 
910
+
911
+
912
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
913
+
914
+
915
+
916
  ...d_model/model.safetensors: 86%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 8.05GB / 9.35GB 
917
+
918
+
919
+
920
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
921
+
922
+
923
+
924
  ...d_model/model.safetensors: 88%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 8.25GB / 9.35GB 
925
+
926
+
927
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
928
+
929
+
930
+
931
  ...d_model/model.safetensors: 90%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 8.45GB / 9.35GB 
932
+
933
+
934
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
935
+
936
+
937
+
938
  ...d_model/model.safetensors: 93%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž| 8.67GB / 9.35GB 
939
+
940
+
941
+
942
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
943
+
944
+
945
+
946
  ...d_model/model.safetensors: 95%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 8.86GB / 9.35GB 
947
+
948
+
949
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
950
+
951
+
952
+
953
  ...d_model/model.safetensors: 97%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹| 9.07GB / 9.35GB 
954
+
955
+
956
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
957
+
958
+
959
+
960
  ...d_model/model.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.27GB / 9.35GB 
961
+
962
+
963
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.15GB / 2.20GB 
964
+
965
+
966
+
967
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.34GB / 9.35GB 
968
+
969
+
970
+
971
+
972
  ...zer_processor.safetensors: 14%|β–ˆβ– | 109B / 768B 
973
+
974
+
975
+
976
+
977
+
978
  ...zer_processor.safetensors: 14%|β–ˆβ– | 109B / 768B 
979
+
980
+
981
+
982
+
983
+
984
+
985
  ...ate/rng_state.safetensors: 14%|β–ˆβ– | 2.23kB / 15.7kB 
986
+
987
+
988
  ...timizer_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 2.16GB / 2.20GB 
989
+
990
+
991
+
992
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.34GB / 9.35GB 
993
+
994
+
995
+
996
+
997
  ...zer_processor.safetensors: 14%|β–ˆβ– | 109B / 768B 
998
+
999
+
1000
+
1001
+
1002
+
1003
  ...zer_processor.safetensors: 14%|β–ˆβ– | 109B / 768B 
1004
+
1005
+
1006
+
1007
+
1008
+
1009
+
1010
  ...ate/rng_state.safetensors: 14%|β–ˆβ– | 2.23kB / 15.7kB 
1011
+
1012
+
1013
+
1014
  ...timizer_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.17GB / 2.20GB 
1015
+
1016
+
1017
+
1018
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.34GB / 9.35GB 
1019
+
1020
+
1021
+
1022
+
1023
  ...zer_processor.safetensors: 43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 327B / 768B 
1024
+
1025
+
1026
+
1027
+
1028
+
1029
  ...zer_processor.safetensors: 43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 327B / 768B 
1030
+
1031
+
1032
+
1033
+
1034
+
1035
+
1036
  ...ate/rng_state.safetensors: 43%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 6.69kB / 15.7kB 
1037
+
1038
+
1039
+
1040
  ...timizer_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.18GB / 2.20GB 
1041
+
1042
+
1043
+
1044
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1045
+
1046
+
1047
+
1048
+
1049
  ...zer_processor.safetensors: 70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 537B / 768B 
1050
+
1051
+
1052
+
1053
+
1054
+
1055
  ...zer_processor.safetensors: 70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 537B / 768B 
1056
+
1057
+
1058
+
1059
+
1060
+
1061
+
1062
  ...ate/rng_state.safetensors: 70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 11.0kB / 15.7kB 
1063
+
1064
+
1065
+
1066
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.19GB / 2.20GB 
1067
+
1068
+
1069
+
1070
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1071
+
1072
+
1073
+
1074
+
1075
  ...zer_processor.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 755B / 768B 
1076
+
1077
+
1078
+
1079
+
1080
+
1081
  ...zer_processor.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 755B / 768B 
1082
+
1083
+
1084
+
1085
+
1086
+
1087
+
1088
  ...ate/rng_state.safetensors: 98%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š| 15.4kB / 15.7kB 
1089
+
1090
+
1091
+
1092
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.19GB / 2.20GB 
1093
+
1094
+
1095
+
1096
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1097
+
1098
+
1099
+
1100
+
1101
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
1102
+
1103
+
1104
+
1105
+
1106
+
1107
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
1108
+
1109
+
1110
+
1111
+
1112
+
1113
+
1114
  ...ate/rng_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 15.6kB / 15.7kB 
1115
+
1116
+
1117
+
1118
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.19GB / 2.20GB 
1119
+
1120
+
1121
+
1122
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1123
+
1124
+
1125
+
1126
+
1127
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
1128
+
1129
+
1130
+
1131
+
1132
+
1133
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
1134
+
1135
+
1136
+
1137
+
1138
+
1139
+
1140
  ...ate/rng_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 15.6kB / 15.7kB 
1141
+
1142
+
1143
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.19GB / 2.20GB 
1144
+
1145
+
1146
+
1147
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1148
+
1149
+
1150
+
1151
+
1152
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
1153
+
1154
+
1155
+
1156
+
1157
+
1158
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
1159
+
1160
+
1161
+
1162
+
1163
+
1164
+
1165
  ...ate/rng_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 15.6kB / 15.7kB 
1166
+
1167
+
1168
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 2.19GB / 2.20GB 
1169
+
1170
+
1171
+
1172
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1173
+
1174
+
1175
+
1176
+
1177
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
1178
+
1179
+
1180
+
1181
+
1182
+
1183
  ...zer_processor.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 763B / 768B 
1184
+
1185
+
1186
+
1187
+
1188
+
1189
+
1190
  ...ate/rng_state.safetensors: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 15.6kB / 15.7kB 
1191
+
1192
+
1193
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
1194
+
1195
+
1196
+
1197
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1198
+
1199
+
1200
+
1201
+
1202
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1203
+
1204
+
1205
+
1206
+
1207
+
1208
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1209
+
1210
+
1211
+
1212
+
1213
+
1214
+
1215
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
1216
+
1217
+
1218
+
1219
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
1220
+
1221
+
1222
+
1223
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1224
+
1225
+
1226
+
1227
+
1228
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1229
+
1230
+
1231
+
1232
+
1233
+
1234
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1235
+
1236
+
1237
+
1238
+
1239
+
1240
+
1241
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
1242
+
1243
+
1244
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
1245
+
1246
+
1247
+
1248
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1249
+
1250
+
1251
+
1252
+
1253
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1254
+
1255
+
1256
+
1257
+
1258
+
1259
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1260
+
1261
+
1262
+
1263
+
1264
+
1265
+
1266
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
1267
+
1268
+
1269
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
1270
+
1271
+
1272
+
1273
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1274
+
1275
+
1276
+
1277
+
1278
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1279
+
1280
+
1281
+
1282
+
1283
+
1284
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1285
+
1286
+
1287
+
1288
+
1289
+
1290
+
1291
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
1292
+
1293
+
1294
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
1295
+
1296
+
1297
+
1298
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1299
+
1300
+
1301
+
1302
+
1303
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1304
+
1305
+
1306
+
1307
+
1308
+
1309
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1310
+
1311
+
1312
+
1313
+
1314
+
1315
+
1316
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
1317
+
1318
+
1319
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
1320
+
1321
+
1322
+
1323
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1324
+
1325
+
1326
+
1327
+
1328
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1329
+
1330
+
1331
+
1332
+
1333
+
1334
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1335
+
1336
+
1337
+
1338
+
1339
+
1340
+
1341
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
1342
+
1343
+
1344
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB 
1345
+
1346
+
1347
+
1348
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB 
1349
+
1350
+
1351
+
1352
+
1353
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1354
+
1355
+
1356
+
1357
+
1358
+
1359
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B 
1360
+
1361
+
1362
+
1363
+
1364
+
1365
+
1366
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB 
1367
+
1368
+
1369
  ...timizer_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 2.20GB / 2.20GB
1370
+
1371
  ...d_model/model.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 9.35GB / 9.35GB
1372
+
1373
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B
1374
+
1375
  ...zer_processor.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 768B / 768B
1376
+
1377
  ...ate/rng_state.safetensors: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 15.7kB / 15.7kB
1378
+ INFO 2026-03-24 03:06:18 _client.py:1025 HTTP Request: POST https://huggingface.co/api/models/StrongRoboticsLab/pi05-so100-diverse/commit/main "HTTP/1.1 200 OK"
1379
+ INFO 2026-03-24 03:06:18 ot_train.py:485 Uploaded checkpoint step 500 to HF
1380
+ Traceback (most recent call last):
1381
+ File "<frozen runpy>", line 198, in _run_module_as_main
1382
+ File "<frozen runpy>", line 88, in _run_code
1383
+ File "/workspace/pi05-so100-diverse/lerobot/src/lerobot/scripts/lerobot_train.py", line 575, in <module>
1384
+ main()
1385
+ File "/workspace/pi05-so100-diverse/lerobot/src/lerobot/scripts/lerobot_train.py", line 571, in main
1386
+ train()
1387
+ File "/workspace/pi05-so100-diverse/lerobot/src/lerobot/configs/parser.py", line 233, in wrapper_inner
1388
+ response = fn(cfg, *args, **kwargs)
1389
+ ^^^^^^^^^^^^^^^^^^^^^^^^
1390
+ File "/workspace/pi05-so100-diverse/lerobot/src/lerobot/scripts/lerobot_train.py", line 493, in train
1391
+ wandb_logger.log_policy(checkpoint_dir)
1392
+ File "/workspace/pi05-so100-diverse/lerobot/src/lerobot/rl/wandb_utils.py", line 129, in log_policy
1393
+ artifact = self._wandb.Artifact(artifact_name, type="model")
1394
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
1395
+ File "/usr/local/lib/python3.12/dist-packages/wandb/sdk/artifacts/artifact.py", line 201, in __init__
1396
+ self._name: str = validate_artifact_name(name) # includes version after saving
1397
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^
1398
+ File "/usr/local/lib/python3.12/dist-packages/wandb/sdk/artifacts/_validators.py", line 72, in validate_artifact_name
1399
+ raise ValueError(
1400
+ ValueError: Artifact name is longer than 128 characters: 'policy_pi05-seed_1000-dataset_so100__ephemeral_community_dataset_v3__workspace_pi05-so100-diverse_filtered_index.json__workspace ...'
1401
+ Traceback (most recent call last):
1402
+ File "<frozen runpy>", line 198, in _run_module_as_main
1403
+ File "<frozen runpy>", line 88, in _run_code
1404
+ File "/usr/local/lib/python3.12/dist-packages/accelerate/commands/launch.py", line 1415, in <module>
1405
+ main()
1406
+ File "/usr/local/lib/python3.12/dist-packages/accelerate/commands/launch.py", line 1411, in main
1407
+ launch_command(args)
1408
+ File "/usr/local/lib/python3.12/dist-packages/accelerate/commands/launch.py", line 1405, in launch_command
1409
+ simple_launcher(args)
1410
+ File "/usr/local/lib/python3.12/dist-packages/accelerate/commands/launch.py", line 993, in simple_launcher
1411
+ raise subprocess.CalledProcessError(returncode=process.returncode, cmd=cmd)
1412
+ subprocess.CalledProcessError: Command '['/usr/bin/python3.12', '-m', 'lerobot.scripts.lerobot_train', '--dataset.repo_id=so100:/ephemeral/community_dataset_v3:/workspace/pi05-so100-diverse/filtered_index.json:/workspace/pi05-so100-diverse/norm_stats.json', '--policy.path=lerobot/pi05_base', '--policy.train_expert_only=true', '--policy.dtype=bfloat16', '--policy.gradient_checkpointing=false', '--policy.push_to_hub=true', '--policy.repo_id=StrongRoboticsLab/pi05-so100-diverse', '--policy.normalization_mapping={"VISUAL": "IDENTITY", "STATE": "MEAN_STD", "ACTION": "MEAN_STD"}', '--policy.scheduler_warmup_steps=1000', '--policy.scheduler_decay_steps=340000', '--rename_map={"observation.images.image": "observation.images.base_0_rgb", "observation.images.image2": "observation.images.left_wrist_0_rgb"}', '--batch_size=16', '--steps=340000', '--save_freq=500', '--log_freq=50', '--num_workers=4', '--wandb.enable=true', '--wandb.project=pi05-so100-diverse', '--output_dir=/ephemeral/production_run']' returned non-zero exit status 1.
1413
+ === Training Complete (exit: 1) ===
train_cloud.sh CHANGED
@@ -47,7 +47,6 @@ python3.12 -m accelerate.commands.launch $ACCEL_FLAGS \
47
  --save_freq=500 \
48
  --log_freq=50 \
49
  --num_workers=4 \
50
- --job_name=pi05-so100-diverse \
51
  --wandb.enable=true \
52
  --wandb.project=pi05-so100-diverse \
53
  --output_dir=/ephemeral/production_run \
 
47
  --save_freq=500 \
48
  --log_freq=50 \
49
  --num_workers=4 \
 
50
  --wandb.enable=true \
51
  --wandb.project=pi05-so100-diverse \
52
  --output_dir=/ephemeral/production_run \