Training in progress, step 25200, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1527,6 +1527,10 @@ You can finetune this model on your own dataset.
|
|
| 1527 |
| 0.4400 | 24900 | 0.3627 |
|
| 1528 |
| 0.4409 | 24950 | 0.3403 |
|
| 1529 |
| 0.4418 | 25000 | 0.349 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1530 |
|
| 1531 |
</details>
|
| 1532 |
|
|
|
|
| 1527 |
| 0.4400 | 24900 | 0.3627 |
|
| 1528 |
| 0.4409 | 24950 | 0.3403 |
|
| 1529 |
| 0.4418 | 25000 | 0.349 |
|
| 1530 |
+
| 0.4426 | 25050 | 0.3527 |
|
| 1531 |
+
| 0.4435 | 25100 | 0.3773 |
|
| 1532 |
+
| 0.4444 | 25150 | 0.3372 |
|
| 1533 |
+
| 0.4453 | 25200 | 0.3178 |
|
| 1534 |
|
| 1535 |
</details>
|
| 1536 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:841fdf3c58c8f29d1dbc4b6aa518d6d4f0e4c702d0d79eae99a7a6f05440afb8
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d042b648040ac616e95ada7c18231cfcd360f4f2b7dea533dbe8440f0bfa84b
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3ad48efbb9bf93a84390a5aea5643acbd41bf262a8aa17ab3278f0f314a581a
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8f8fa593fe1292958817d4226b917c242a5dd7ed49104de560771ecc5cb6968
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8139c38e3bba457a10055977964d7aab9920cd7bb0ccf9d0c0ca174f5b19226
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -3508,6 +3508,34 @@
|
|
| 3508 |
"learning_rate": 3.1021381869588265e-05,
|
| 3509 |
"loss": 0.349,
|
| 3510 |
"step": 25000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3511 |
}
|
| 3512 |
],
|
| 3513 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.44530048947712536,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 25200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 3508 |
"learning_rate": 3.1021381869588265e-05,
|
| 3509 |
"loss": 0.349,
|
| 3510 |
"step": 25000
|
| 3511 |
+
},
|
| 3512 |
+
{
|
| 3513 |
+
"epoch": 0.4426498913254758,
|
| 3514 |
+
"grad_norm": 1.4080630540847778,
|
| 3515 |
+
"learning_rate": 3.0972295851249736e-05,
|
| 3516 |
+
"loss": 0.3527,
|
| 3517 |
+
"step": 25050
|
| 3518 |
+
},
|
| 3519 |
+
{
|
| 3520 |
+
"epoch": 0.4435334240426923,
|
| 3521 |
+
"grad_norm": 1.7197438478469849,
|
| 3522 |
+
"learning_rate": 3.0923209832911194e-05,
|
| 3523 |
+
"loss": 0.3773,
|
| 3524 |
+
"step": 25100
|
| 3525 |
+
},
|
| 3526 |
+
{
|
| 3527 |
+
"epoch": 0.44441695675990883,
|
| 3528 |
+
"grad_norm": 1.5831055641174316,
|
| 3529 |
+
"learning_rate": 3.087510553493943e-05,
|
| 3530 |
+
"loss": 0.3372,
|
| 3531 |
+
"step": 25150
|
| 3532 |
+
},
|
| 3533 |
+
{
|
| 3534 |
+
"epoch": 0.44530048947712536,
|
| 3535 |
+
"grad_norm": 1.7535090446472168,
|
| 3536 |
+
"learning_rate": 3.082601951660089e-05,
|
| 3537 |
+
"loss": 0.3178,
|
| 3538 |
+
"step": 25200
|
| 3539 |
}
|
| 3540 |
],
|
| 3541 |
"logging_steps": 50,
|