Training in progress, step 49400, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1277,6 +1277,10 @@ You can finetune this model on your own dataset.
|
|
| 1277 |
| 0.8676 | 49100 | 0.3881 |
|
| 1278 |
| 0.8685 | 49150 | 0.253 |
|
| 1279 |
| 0.8694 | 49200 | 0.2827 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1280 |
|
| 1281 |
|
| 1282 |
### Framework Versions
|
|
|
|
| 1277 |
| 0.8676 | 49100 | 0.3881 |
|
| 1278 |
| 0.8685 | 49150 | 0.253 |
|
| 1279 |
| 0.8694 | 49200 | 0.2827 |
|
| 1280 |
+
| 0.8703 | 49250 | 0.266 |
|
| 1281 |
+
| 0.8712 | 49300 | 0.3008 |
|
| 1282 |
+
| 0.8720 | 49350 | 0.3406 |
|
| 1283 |
+
| 0.8729 | 49400 | 0.3348 |
|
| 1284 |
|
| 1285 |
|
| 1286 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d54875bf531798288ddb4b3fbae3f4ae380603d3b22e5d05230773e3c542f66
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf9cbc9f060e9473758fc47c31fa40ee4cde249f6a49d58103beecc7d51b4a81
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51c3b32231fb132bb00c65088bba338cce412cdb74ffd139a1f27a4b9e6c9314
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8d9e833107ed9942fa0d2735bf0fb4ceb0909143f01ecba6b48822116d17b49
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be95a1e2a9d21081dedb60183caea1d3c628d9f653733abb462690fc704b6522
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -6896,6 +6896,34 @@
|
|
| 6896 |
"learning_rate": 7.2755296381378734e-06,
|
| 6897 |
"loss": 0.2827,
|
| 6898 |
"step": 49200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6899 |
}
|
| 6900 |
],
|
| 6901 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.8729303246099203,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 49400,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 6896 |
"learning_rate": 7.2755296381378734e-06,
|
| 6897 |
"loss": 0.2827,
|
| 6898 |
"step": 49200
|
| 6899 |
+
},
|
| 6900 |
+
{
|
| 6901 |
+
"epoch": 0.8702797264582708,
|
| 6902 |
+
"grad_norm": 1.333967924118042,
|
| 6903 |
+
"learning_rate": 7.2264436197993364e-06,
|
| 6904 |
+
"loss": 0.266,
|
| 6905 |
+
"step": 49250
|
| 6906 |
+
},
|
| 6907 |
+
{
|
| 6908 |
+
"epoch": 0.8711632591754873,
|
| 6909 |
+
"grad_norm": 1.3817411661148071,
|
| 6910 |
+
"learning_rate": 7.1773576014608e-06,
|
| 6911 |
+
"loss": 0.3008,
|
| 6912 |
+
"step": 49300
|
| 6913 |
+
},
|
| 6914 |
+
{
|
| 6915 |
+
"epoch": 0.8720467918927037,
|
| 6916 |
+
"grad_norm": 1.269362211227417,
|
| 6917 |
+
"learning_rate": 7.128271583122263e-06,
|
| 6918 |
+
"loss": 0.3406,
|
| 6919 |
+
"step": 49350
|
| 6920 |
+
},
|
| 6921 |
+
{
|
| 6922 |
+
"epoch": 0.8729303246099203,
|
| 6923 |
+
"grad_norm": 1.5153824090957642,
|
| 6924 |
+
"learning_rate": 7.079185564783727e-06,
|
| 6925 |
+
"loss": 0.3348,
|
| 6926 |
+
"step": 49400
|
| 6927 |
}
|
| 6928 |
],
|
| 6929 |
"logging_steps": 50,
|