Training in progress, step 46400, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1217,6 +1217,10 @@ You can finetune this model on your own dataset.
|
|
| 1217 |
| 0.8146 | 46100 | 0.2787 |
|
| 1218 |
| 0.8155 | 46150 | 0.2943 |
|
| 1219 |
| 0.8164 | 46200 | 0.3386 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1220 |
|
| 1221 |
|
| 1222 |
### Framework Versions
|
|
|
|
| 1217 |
| 0.8146 | 46100 | 0.2787 |
|
| 1218 |
| 0.8155 | 46150 | 0.2943 |
|
| 1219 |
| 0.8164 | 46200 | 0.3386 |
|
| 1220 |
+
| 0.8173 | 46250 | 0.3227 |
|
| 1221 |
+
| 0.8182 | 46300 | 0.2582 |
|
| 1222 |
+
| 0.8190 | 46350 | 0.285 |
|
| 1223 |
+
| 0.8199 | 46400 | 0.2989 |
|
| 1224 |
|
| 1225 |
|
| 1226 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:627d2b4f8ecea5cdfb170d123ae59ee0402c361c798b4d5c0a5332e334584559
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef488a1aa99df1a7495ba789415dfd6ce209c02bba2a2c44e7bfe3c32f6adaaa
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6bc1e5c929cb8f54d58e9ee1847d7a0b3eca4210598cf360f322a008e7b3cfc7
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4443157a5e465be0625068722ad0be9b943ae7cfc578916594c92f0db7089d29
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:77c2f010939ae1c15c3c974f7d0a87bffdc388e9851106b282750c10255b68df
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -6476,6 +6476,34 @@
|
|
| 6476 |
"learning_rate": 1.0218727297716519e-05,
|
| 6477 |
"loss": 0.3386,
|
| 6478 |
"step": 46200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6479 |
}
|
| 6480 |
],
|
| 6481 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.8199183615769292,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 46400,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 6476 |
"learning_rate": 1.0218727297716519e-05,
|
| 6477 |
"loss": 0.3386,
|
| 6478 |
"step": 46200
|
| 6479 |
+
},
|
| 6480 |
+
{
|
| 6481 |
+
"epoch": 0.8172677634252796,
|
| 6482 |
+
"grad_norm": 1.5368878841400146,
|
| 6483 |
+
"learning_rate": 1.0169641279377982e-05,
|
| 6484 |
+
"loss": 0.3227,
|
| 6485 |
+
"step": 46250
|
| 6486 |
+
},
|
| 6487 |
+
{
|
| 6488 |
+
"epoch": 0.8181512961424962,
|
| 6489 |
+
"grad_norm": 3.281324625015259,
|
| 6490 |
+
"learning_rate": 1.0120555261039447e-05,
|
| 6491 |
+
"loss": 0.2582,
|
| 6492 |
+
"step": 46300
|
| 6493 |
+
},
|
| 6494 |
+
{
|
| 6495 |
+
"epoch": 0.8190348288597127,
|
| 6496 |
+
"grad_norm": 1.4477012157440186,
|
| 6497 |
+
"learning_rate": 1.007146924270091e-05,
|
| 6498 |
+
"loss": 0.285,
|
| 6499 |
+
"step": 46350
|
| 6500 |
+
},
|
| 6501 |
+
{
|
| 6502 |
+
"epoch": 0.8199183615769292,
|
| 6503 |
+
"grad_norm": 2.9229135513305664,
|
| 6504 |
+
"learning_rate": 1.0022383224362374e-05,
|
| 6505 |
+
"loss": 0.2989,
|
| 6506 |
+
"step": 46400
|
| 6507 |
}
|
| 6508 |
],
|
| 6509 |
"logging_steps": 50,
|