Training in progress, step 41000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1335,6 +1335,10 @@ You can finetune this model on your own dataset.
|
|
| 1335 |
| 0.7192 | 40700 | 0.2873 |
|
| 1336 |
| 0.7201 | 40750 | 0.3705 |
|
| 1337 |
| 0.7210 | 40800 | 0.2985 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1338 |
|
| 1339 |
</details>
|
| 1340 |
|
|
|
|
| 1335 |
| 0.7192 | 40700 | 0.2873 |
|
| 1336 |
| 0.7201 | 40750 | 0.3705 |
|
| 1337 |
| 0.7210 | 40800 | 0.2985 |
|
| 1338 |
+
| 0.7218 | 40850 | 0.3355 |
|
| 1339 |
+
| 0.7227 | 40900 | 0.3322 |
|
| 1340 |
+
| 0.7236 | 40950 | 0.3424 |
|
| 1341 |
+
| 0.7245 | 41000 | 0.2834 |
|
| 1342 |
|
| 1343 |
</details>
|
| 1344 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bad5fe2e60c5aa24260d1942f5fd36c57da4fa95b5377f04b02dcc5ceb9e653
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8fece1064662d61321c117cc1d24216b16971ad97b1195b94af13fb853181101
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d73c58855bdaef926976cbbf2d9665190e116bcc636d4b89a717f6e32bf6a98
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a4677c24f01289fca4e4e6cb6d863cf74dbec8f2665874e2aeb1133c6e53329
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d9861609e13b6dfba877602ae0e61dca8ad368849f8b20c6f7958302bb7e1b3b
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5720,6 +5720,34 @@
|
|
| 5720 |
"learning_rate": 1.5518053837544916e-05,
|
| 5721 |
"loss": 0.2985,
|
| 5722 |
"step": 40800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5723 |
}
|
| 5724 |
],
|
| 5725 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.7244968281175452,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 41000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5720 |
"learning_rate": 1.5518053837544916e-05,
|
| 5721 |
"loss": 0.2985,
|
| 5722 |
"step": 40800
|
| 5723 |
+
},
|
| 5724 |
+
{
|
| 5725 |
+
"epoch": 0.7218462299658956,
|
| 5726 |
+
"grad_norm": 1.8306645154953003,
|
| 5727 |
+
"learning_rate": 1.546896781920638e-05,
|
| 5728 |
+
"loss": 0.3355,
|
| 5729 |
+
"step": 40850
|
| 5730 |
+
},
|
| 5731 |
+
{
|
| 5732 |
+
"epoch": 0.7227297626831122,
|
| 5733 |
+
"grad_norm": 1.4840078353881836,
|
| 5734 |
+
"learning_rate": 1.541988180086784e-05,
|
| 5735 |
+
"loss": 0.3322,
|
| 5736 |
+
"step": 40900
|
| 5737 |
+
},
|
| 5738 |
+
{
|
| 5739 |
+
"epoch": 0.7236132954003287,
|
| 5740 |
+
"grad_norm": 2.7773265838623047,
|
| 5741 |
+
"learning_rate": 1.5370795782529303e-05,
|
| 5742 |
+
"loss": 0.3424,
|
| 5743 |
+
"step": 40950
|
| 5744 |
+
},
|
| 5745 |
+
{
|
| 5746 |
+
"epoch": 0.7244968281175452,
|
| 5747 |
+
"grad_norm": 1.3592840433120728,
|
| 5748 |
+
"learning_rate": 1.532170976419077e-05,
|
| 5749 |
+
"loss": 0.2834,
|
| 5750 |
+
"step": 41000
|
| 5751 |
}
|
| 5752 |
],
|
| 5753 |
"logging_steps": 50,
|