Training in progress, step 42400, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1363,6 +1363,10 @@ You can finetune this model on your own dataset.
|
|
| 1363 |
| 0.7439 | 42100 | 0.3288 |
|
| 1364 |
| 0.7448 | 42150 | 0.3333 |
|
| 1365 |
| 0.7457 | 42200 | 0.3602 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1366 |
|
| 1367 |
</details>
|
| 1368 |
|
|
|
|
| 1363 |
| 0.7439 | 42100 | 0.3288 |
|
| 1364 |
| 0.7448 | 42150 | 0.3333 |
|
| 1365 |
| 0.7457 | 42200 | 0.3602 |
|
| 1366 |
+
| 0.7466 | 42250 | 0.3631 |
|
| 1367 |
+
| 0.7475 | 42300 | 0.2374 |
|
| 1368 |
+
| 0.7484 | 42350 | 0.3347 |
|
| 1369 |
+
| 0.7492 | 42400 | 0.3031 |
|
| 1370 |
|
| 1371 |
</details>
|
| 1372 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6aa92be7deea9d9fa0443a8e7ac43099edac64700ac1948c996c7d56587f9eab
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87b7fd53fc83dc52997172f5fd46299f5a9cb53791e47663db9b33ca688d8e9d
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c78cdd0913fe6a8bd516be3fa927565353e6ccb7f2abf432b224a447c2067b40
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:36ad923444303f7830b2be707d7167336797f0569cde414d2b04df5898c738d4
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c406d8129b27e63cb0cbf299bbeba9e703c540df5033871f11031330a77f043
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5916,6 +5916,34 @@
|
|
| 5916 |
"learning_rate": 1.4143645324065894e-05,
|
| 5917 |
"loss": 0.3602,
|
| 5918 |
"step": 42200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5919 |
}
|
| 5920 |
],
|
| 5921 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.7492357441996077,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 42400,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5916 |
"learning_rate": 1.4143645324065894e-05,
|
| 5917 |
"loss": 0.3602,
|
| 5918 |
"step": 42200
|
| 5919 |
+
},
|
| 5920 |
+
{
|
| 5921 |
+
"epoch": 0.7465851460479581,
|
| 5922 |
+
"grad_norm": 1.546533226966858,
|
| 5923 |
+
"learning_rate": 1.4094559305727355e-05,
|
| 5924 |
+
"loss": 0.3631,
|
| 5925 |
+
"step": 42250
|
| 5926 |
+
},
|
| 5927 |
+
{
|
| 5928 |
+
"epoch": 0.7474686787651746,
|
| 5929 |
+
"grad_norm": 1.3664302825927734,
|
| 5930 |
+
"learning_rate": 1.4045473287388822e-05,
|
| 5931 |
+
"loss": 0.2374,
|
| 5932 |
+
"step": 42300
|
| 5933 |
+
},
|
| 5934 |
+
{
|
| 5935 |
+
"epoch": 0.7483522114823912,
|
| 5936 |
+
"grad_norm": 4.161416053771973,
|
| 5937 |
+
"learning_rate": 1.3996387269050285e-05,
|
| 5938 |
+
"loss": 0.3347,
|
| 5939 |
+
"step": 42350
|
| 5940 |
+
},
|
| 5941 |
+
{
|
| 5942 |
+
"epoch": 0.7492357441996077,
|
| 5943 |
+
"grad_norm": 1.3883721828460693,
|
| 5944 |
+
"learning_rate": 1.3947301250711748e-05,
|
| 5945 |
+
"loss": 0.3031,
|
| 5946 |
+
"step": 42400
|
| 5947 |
}
|
| 5948 |
],
|
| 5949 |
"logging_steps": 50,
|