Training in progress, step 46200, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1213,6 +1213,10 @@ You can finetune this model on your own dataset.
|
|
| 1213 |
| 0.8111 | 45900 | 0.285 |
|
| 1214 |
| 0.8120 | 45950 | 0.3952 |
|
| 1215 |
| 0.8129 | 46000 | 0.2802 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1216 |
|
| 1217 |
|
| 1218 |
### Framework Versions
|
|
|
|
| 1213 |
| 0.8111 | 45900 | 0.285 |
|
| 1214 |
| 0.8120 | 45950 | 0.3952 |
|
| 1215 |
| 0.8129 | 46000 | 0.2802 |
|
| 1216 |
+
| 0.8137 | 46050 | 0.2687 |
|
| 1217 |
+
| 0.8146 | 46100 | 0.2787 |
|
| 1218 |
+
| 0.8155 | 46150 | 0.2943 |
|
| 1219 |
+
| 0.8164 | 46200 | 0.3386 |
|
| 1220 |
|
| 1221 |
|
| 1222 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:317dee7bdf4b84d46a50601403d19626cd472b80bda36741dc48bf64d5b51d05
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5717440dcd3e2f09e5f546818459b38ffae88bc9a9b8cb8d67aa113aebadabd8
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bb8a12ff0a64fc5ed6adc7345aa4a83fd87d261a05c853430ab076afe05a154
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:346548a4c17d9cad2c82496da0276965825c893a3342335d781b694e90a062d5
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32b13323b686f2ab7c5492467b0d1175f40fe477951600d7f6162cdddd7d92fb
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -6448,6 +6448,34 @@
|
|
| 6448 |
"learning_rate": 1.0415071371070664e-05,
|
| 6449 |
"loss": 0.2802,
|
| 6450 |
"step": 46000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6451 |
}
|
| 6452 |
],
|
| 6453 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.8163842307080631,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 46200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 6448 |
"learning_rate": 1.0415071371070664e-05,
|
| 6449 |
"loss": 0.2802,
|
| 6450 |
"step": 46000
|
| 6451 |
+
},
|
| 6452 |
+
{
|
| 6453 |
+
"epoch": 0.8137336325564135,
|
| 6454 |
+
"grad_norm": 0.8188498020172119,
|
| 6455 |
+
"learning_rate": 1.0365985352732128e-05,
|
| 6456 |
+
"loss": 0.2687,
|
| 6457 |
+
"step": 46050
|
| 6458 |
+
},
|
| 6459 |
+
{
|
| 6460 |
+
"epoch": 0.81461716527363,
|
| 6461 |
+
"grad_norm": 1.3656600713729858,
|
| 6462 |
+
"learning_rate": 1.0316899334393591e-05,
|
| 6463 |
+
"loss": 0.2787,
|
| 6464 |
+
"step": 46100
|
| 6465 |
+
},
|
| 6466 |
+
{
|
| 6467 |
+
"epoch": 0.8155006979908466,
|
| 6468 |
+
"grad_norm": 1.3830708265304565,
|
| 6469 |
+
"learning_rate": 1.0267813316055056e-05,
|
| 6470 |
+
"loss": 0.2943,
|
| 6471 |
+
"step": 46150
|
| 6472 |
+
},
|
| 6473 |
+
{
|
| 6474 |
+
"epoch": 0.8163842307080631,
|
| 6475 |
+
"grad_norm": 1.866623878479004,
|
| 6476 |
+
"learning_rate": 1.0218727297716519e-05,
|
| 6477 |
+
"loss": 0.3386,
|
| 6478 |
+
"step": 46200
|
| 6479 |
}
|
| 6480 |
],
|
| 6481 |
"logging_steps": 50,
|