Training in progress, step 52000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1193,6 +1193,10 @@ You can finetune this model on your own dataset.
|
|
| 1193 |
| 0.9136 | 51700 | 0.3088 |
|
| 1194 |
| 0.9145 | 51750 | 0.2287 |
|
| 1195 |
| 0.9153 | 51800 | 0.2067 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1196 |
|
| 1197 |
|
| 1198 |
### Framework Versions
|
|
|
|
| 1193 |
| 0.9136 | 51700 | 0.3088 |
|
| 1194 |
| 0.9145 | 51750 | 0.2287 |
|
| 1195 |
| 0.9153 | 51800 | 0.2067 |
|
| 1196 |
+
| 0.9162 | 51850 | 0.2735 |
|
| 1197 |
+
| 0.9171 | 51900 | 0.3976 |
|
| 1198 |
+
| 0.9180 | 51950 | 0.2939 |
|
| 1199 |
+
| 0.9189 | 52000 | 0.3193 |
|
| 1200 |
|
| 1201 |
|
| 1202 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64df739ab78548e5d75f993ab6041c207785adcb30fa9a57cf9234173976387d
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab3798d7d967dd27d94d9da8c3b443a2ae8d98157d0a447c72ba241256385ef3
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bf77e2ef33f60ef48f8a5fc09cb1943760ae6ba4d88634c23d14cfcf6cad117
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12597bbc3e3311f727af17ce6725c67e2c62ce8d20a5da4fcf3ead6fc2b4cd3a
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69967b924386ed794e36fcb2fe2f94715b55410c1d3076df0af1214b0c14df7b
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -7260,6 +7260,34 @@
|
|
| 7260 |
"learning_rate": 4.724038404900748e-06,
|
| 7261 |
"loss": 0.2067,
|
| 7262 |
"step": 51800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 7263 |
}
|
| 7264 |
],
|
| 7265 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.9188740259051793,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 52000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 7260 |
"learning_rate": 4.724038404900748e-06,
|
| 7261 |
"loss": 0.2067,
|
| 7262 |
"step": 51800
|
| 7263 |
+
},
|
| 7264 |
+
{
|
| 7265 |
+
"epoch": 0.9162234277535297,
|
| 7266 |
+
"grad_norm": 1.1146478652954102,
|
| 7267 |
+
"learning_rate": 4.674952386562212e-06,
|
| 7268 |
+
"loss": 0.2735,
|
| 7269 |
+
"step": 51850
|
| 7270 |
+
},
|
| 7271 |
+
{
|
| 7272 |
+
"epoch": 0.9171069604707462,
|
| 7273 |
+
"grad_norm": 2.2454397678375244,
|
| 7274 |
+
"learning_rate": 4.625866368223675e-06,
|
| 7275 |
+
"loss": 0.3976,
|
| 7276 |
+
"step": 51900
|
| 7277 |
+
},
|
| 7278 |
+
{
|
| 7279 |
+
"epoch": 0.9179904931879628,
|
| 7280 |
+
"grad_norm": 1.902377724647522,
|
| 7281 |
+
"learning_rate": 4.576780349885139e-06,
|
| 7282 |
+
"loss": 0.2939,
|
| 7283 |
+
"step": 51950
|
| 7284 |
+
},
|
| 7285 |
+
{
|
| 7286 |
+
"epoch": 0.9188740259051793,
|
| 7287 |
+
"grad_norm": 4.320808410644531,
|
| 7288 |
+
"learning_rate": 4.527694331546602e-06,
|
| 7289 |
+
"loss": 0.3193,
|
| 7290 |
+
"step": 52000
|
| 7291 |
}
|
| 7292 |
],
|
| 7293 |
"logging_steps": 50,
|