Training in progress, step 26000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1543,6 +1543,10 @@ You can finetune this model on your own dataset.
|
|
| 1543 |
| 0.4541 | 25700 | 0.2669 |
|
| 1544 |
| 0.4550 | 25750 | 0.3316 |
|
| 1545 |
| 0.4559 | 25800 | 0.3395 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1546 |
|
| 1547 |
</details>
|
| 1548 |
|
|
|
|
| 1543 |
| 0.4541 | 25700 | 0.2669 |
|
| 1544 |
| 0.4550 | 25750 | 0.3316 |
|
| 1545 |
| 0.4559 | 25800 | 0.3395 |
|
| 1546 |
+
| 0.4568 | 25850 | 0.3631 |
|
| 1547 |
+
| 0.4577 | 25900 | 0.3418 |
|
| 1548 |
+
| 0.4586 | 25950 | 0.3351 |
|
| 1549 |
+
| 0.4594 | 26000 | 0.3117 |
|
| 1550 |
|
| 1551 |
</details>
|
| 1552 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d9b275662690960867e4c5004de25c023e37f1f7c4ebe3e55950090be859db5
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccf58858fe88830e35307ea10b8a5b6180e3bcc733d316d0262f05ad1036e132
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa2ed85cbcfc26a558906734eea48312aeda57b3baa4220e882e04b5dde95173
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5a1824f2390986b90c617282d9a88df5bdc60e3f12c5d84551697fb36352fa3
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67c6214bd46d06bb31b87e2550447bf08cbff7452cc6c1e25562bc8a18251786
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -3620,6 +3620,34 @@
|
|
| 3620 |
"learning_rate": 3.0236987296538455e-05,
|
| 3621 |
"loss": 0.3395,
|
| 3622 |
"step": 25800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3623 |
}
|
| 3624 |
],
|
| 3625 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.45943701295258965,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 26000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 3620 |
"learning_rate": 3.0236987296538455e-05,
|
| 3621 |
"loss": 0.3395,
|
| 3622 |
"step": 25800
|
| 3623 |
+
},
|
| 3624 |
+
{
|
| 3625 |
+
"epoch": 0.45678641480094007,
|
| 3626 |
+
"grad_norm": 2.8250796794891357,
|
| 3627 |
+
"learning_rate": 3.018790127819992e-05,
|
| 3628 |
+
"loss": 0.3631,
|
| 3629 |
+
"step": 25850
|
| 3630 |
+
},
|
| 3631 |
+
{
|
| 3632 |
+
"epoch": 0.4576699475181566,
|
| 3633 |
+
"grad_norm": 1.1532173156738281,
|
| 3634 |
+
"learning_rate": 3.013881525986138e-05,
|
| 3635 |
+
"loss": 0.3418,
|
| 3636 |
+
"step": 25900
|
| 3637 |
+
},
|
| 3638 |
+
{
|
| 3639 |
+
"epoch": 0.4585534802353731,
|
| 3640 |
+
"grad_norm": 1.687465786933899,
|
| 3641 |
+
"learning_rate": 3.0089729241522846e-05,
|
| 3642 |
+
"loss": 0.3351,
|
| 3643 |
+
"step": 25950
|
| 3644 |
+
},
|
| 3645 |
+
{
|
| 3646 |
+
"epoch": 0.45943701295258965,
|
| 3647 |
+
"grad_norm": 4.05789852142334,
|
| 3648 |
+
"learning_rate": 3.004064322318431e-05,
|
| 3649 |
+
"loss": 0.3117,
|
| 3650 |
+
"step": 26000
|
| 3651 |
}
|
| 3652 |
],
|
| 3653 |
"logging_steps": 50,
|