Training in progress, step 34200, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1197,6 +1197,10 @@ You can finetune this model on your own dataset.
|
|
| 1197 |
| 0.5990 | 33900 | 0.2361 |
|
| 1198 |
| 0.5999 | 33950 | 0.4459 |
|
| 1199 |
| 0.6008 | 34000 | 0.3169 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1200 |
|
| 1201 |
|
| 1202 |
### Framework Versions
|
|
|
|
| 1197 |
| 0.5990 | 33900 | 0.2361 |
|
| 1198 |
| 0.5999 | 33950 | 0.4459 |
|
| 1199 |
| 0.6008 | 34000 | 0.3169 |
|
| 1200 |
+
| 0.6017 | 34050 | 0.3146 |
|
| 1201 |
+
| 0.6026 | 34100 | 0.3125 |
|
| 1202 |
+
| 0.6035 | 34150 | 0.2738 |
|
| 1203 |
+
| 0.6043 | 34200 | 0.3062 |
|
| 1204 |
|
| 1205 |
|
| 1206 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bdca6c44be34b9e69175940da4b56167b7928c9d214c258d43c5b620bc91b46
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e8cce5c0114dfe6db2b221097701d4f63da8b0269ca76f1850aa97156719ebf
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed40b835a3a95c0d5caa9e2f9ac60fe5821207cfed755931f0a4c6a4e1bc7f9c
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:62c9791c94ed19713d54c258fa73c1747c3a24c92cf2d0108a3b66f313c783e0
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67100c483c5008bb6cb432330fcbe9399cb2dfd8372d624a774af533d43e3106
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4768,6 +4768,34 @@
|
|
| 4768 |
"learning_rate": 2.218982545011879e-05,
|
| 4769 |
"loss": 0.3169,
|
| 4770 |
"step": 34000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4771 |
}
|
| 4772 |
],
|
| 4773 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.6043363785760987,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 34200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4768 |
"learning_rate": 2.218982545011879e-05,
|
| 4769 |
"loss": 0.3169,
|
| 4770 |
"step": 34000
|
| 4771 |
+
},
|
| 4772 |
+
{
|
| 4773 |
+
"epoch": 0.6016857804244491,
|
| 4774 |
+
"grad_norm": 1.1555734872817993,
|
| 4775 |
+
"learning_rate": 2.2140739431780252e-05,
|
| 4776 |
+
"loss": 0.3146,
|
| 4777 |
+
"step": 34050
|
| 4778 |
+
},
|
| 4779 |
+
{
|
| 4780 |
+
"epoch": 0.6025693131416656,
|
| 4781 |
+
"grad_norm": 1.4827885627746582,
|
| 4782 |
+
"learning_rate": 2.2091653413441717e-05,
|
| 4783 |
+
"loss": 0.3125,
|
| 4784 |
+
"step": 34100
|
| 4785 |
+
},
|
| 4786 |
+
{
|
| 4787 |
+
"epoch": 0.6034528458588821,
|
| 4788 |
+
"grad_norm": 1.5724104642868042,
|
| 4789 |
+
"learning_rate": 2.204256739510318e-05,
|
| 4790 |
+
"loss": 0.2738,
|
| 4791 |
+
"step": 34150
|
| 4792 |
+
},
|
| 4793 |
+
{
|
| 4794 |
+
"epoch": 0.6043363785760987,
|
| 4795 |
+
"grad_norm": 1.5903054475784302,
|
| 4796 |
+
"learning_rate": 2.1993481376764643e-05,
|
| 4797 |
+
"loss": 0.3062,
|
| 4798 |
+
"step": 34200
|
| 4799 |
}
|
| 4800 |
],
|
| 4801 |
"logging_steps": 50,
|