Training in progress, step 19000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1403,6 +1403,10 @@ You can finetune this model on your own dataset.
|
|
| 1403 |
| 0.3304 | 18700 | 0.3543 |
|
| 1404 |
| 0.3313 | 18750 | 0.3642 |
|
| 1405 |
| 0.3322 | 18800 | 0.3415 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1406 |
|
| 1407 |
</details>
|
| 1408 |
|
|
|
|
| 1403 |
| 0.3304 | 18700 | 0.3543 |
|
| 1404 |
| 0.3313 | 18750 | 0.3642 |
|
| 1405 |
| 0.3322 | 18800 | 0.3415 |
|
| 1406 |
+
| 0.3331 | 18850 | 0.3069 |
|
| 1407 |
+
| 0.3340 | 18900 | 0.2962 |
|
| 1408 |
+
| 0.3349 | 18950 | 0.3156 |
|
| 1409 |
+
| 0.3357 | 19000 | 0.3791 |
|
| 1410 |
|
| 1411 |
</details>
|
| 1412 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:123a3c7e068975f2d73a559688da89498d96c9f5f3906b2f60a8f55923c134f5
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e186b88037a18eebc7b613039df85cfc79c02be57538ce16444dea0485fdf79
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03af62e0682690ebbb7904f13bcb54bda8192bd3193a8746111a4da158c48b8c
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:10840146a6e19998f1fdbf028a41f37469dd8a3b8988531196e63b1251245096
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23958946bfe31c250bee11672fccb9ed52902b5ac707ac8090942157c16267c1
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -2640,6 +2640,34 @@
|
|
| 2640 |
"learning_rate": 3.710510298246648e-05,
|
| 2641 |
"loss": 0.3415,
|
| 2642 |
"step": 18800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2643 |
}
|
| 2644 |
],
|
| 2645 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.33574243254227704,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 19000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 2640 |
"learning_rate": 3.710510298246648e-05,
|
| 2641 |
"loss": 0.3415,
|
| 2642 |
"step": 18800
|
| 2643 |
+
},
|
| 2644 |
+
{
|
| 2645 |
+
"epoch": 0.3330918343906275,
|
| 2646 |
+
"grad_norm": 1.4388914108276367,
|
| 2647 |
+
"learning_rate": 3.7056016964127937e-05,
|
| 2648 |
+
"loss": 0.3069,
|
| 2649 |
+
"step": 18850
|
| 2650 |
+
},
|
| 2651 |
+
{
|
| 2652 |
+
"epoch": 0.333975367107844,
|
| 2653 |
+
"grad_norm": 1.5527664422988892,
|
| 2654 |
+
"learning_rate": 3.70069309457894e-05,
|
| 2655 |
+
"loss": 0.2962,
|
| 2656 |
+
"step": 18900
|
| 2657 |
+
},
|
| 2658 |
+
{
|
| 2659 |
+
"epoch": 0.3348588998250605,
|
| 2660 |
+
"grad_norm": 1.6680736541748047,
|
| 2661 |
+
"learning_rate": 3.6957844927450866e-05,
|
| 2662 |
+
"loss": 0.3156,
|
| 2663 |
+
"step": 18950
|
| 2664 |
+
},
|
| 2665 |
+
{
|
| 2666 |
+
"epoch": 0.33574243254227704,
|
| 2667 |
+
"grad_norm": 2.266108274459839,
|
| 2668 |
+
"learning_rate": 3.69097406294791e-05,
|
| 2669 |
+
"loss": 0.3791,
|
| 2670 |
+
"step": 19000
|
| 2671 |
}
|
| 2672 |
],
|
| 2673 |
"logging_steps": 50,
|