Training in progress, step 27800, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1213,6 +1213,10 @@ You can finetune this model on your own dataset.
|
|
| 1213 |
| 0.4859 | 27500 | 0.3959 |
|
| 1214 |
| 0.4868 | 27550 | 0.3754 |
|
| 1215 |
| 0.4877 | 27600 | 0.3163 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1216 |
|
| 1217 |
|
| 1218 |
### Framework Versions
|
|
|
|
| 1213 |
| 0.4859 | 27500 | 0.3959 |
|
| 1214 |
| 0.4868 | 27550 | 0.3754 |
|
| 1215 |
| 0.4877 | 27600 | 0.3163 |
|
| 1216 |
+
| 0.4886 | 27650 | 0.35 |
|
| 1217 |
+
| 0.4895 | 27700 | 0.3397 |
|
| 1218 |
+
| 0.4904 | 27750 | 0.3853 |
|
| 1219 |
+
| 0.4912 | 27800 | 0.2568 |
|
| 1220 |
|
| 1221 |
|
| 1222 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cdfacab69b0182b267f66ce210afc2a929861f8a381fcb609abe7250efbad353
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d101e20d6391c1d00393694ed7c13a8ed5d54b7059e36795228521dd1687fa5d
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e6ca64734da2f01bf95a86973d81c98cfbac0699ced506e6f5d14bfc6d5da161
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e43246be50aae83c1910a5dc4ce6db1d2f843a5836c33c56704984643d301b0e
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e6ed64f7e529220ff21286b422216dac7ffe45f3b61319d3fedf56a8725ea92a
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -3872,6 +3872,34 @@
|
|
| 3872 |
"learning_rate": 2.8470872356717916e-05,
|
| 3873 |
"loss": 0.3163,
|
| 3874 |
"step": 27600
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3875 |
}
|
| 3876 |
],
|
| 3877 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.4912441907723843,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 27800,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 3872 |
"learning_rate": 2.8470872356717916e-05,
|
| 3873 |
"loss": 0.3163,
|
| 3874 |
"step": 27600
|
| 3875 |
+
},
|
| 3876 |
+
{
|
| 3877 |
+
"epoch": 0.48859359262073476,
|
| 3878 |
+
"grad_norm": 1.654520869255066,
|
| 3879 |
+
"learning_rate": 2.8421786338379374e-05,
|
| 3880 |
+
"loss": 0.35,
|
| 3881 |
+
"step": 27650
|
| 3882 |
+
},
|
| 3883 |
+
{
|
| 3884 |
+
"epoch": 0.4894771253379513,
|
| 3885 |
+
"grad_norm": 1.5777958631515503,
|
| 3886 |
+
"learning_rate": 2.8372700320040842e-05,
|
| 3887 |
+
"loss": 0.3397,
|
| 3888 |
+
"step": 27700
|
| 3889 |
+
},
|
| 3890 |
+
{
|
| 3891 |
+
"epoch": 0.49036065805516776,
|
| 3892 |
+
"grad_norm": 1.4474226236343384,
|
| 3893 |
+
"learning_rate": 2.8323614301702307e-05,
|
| 3894 |
+
"loss": 0.3853,
|
| 3895 |
+
"step": 27750
|
| 3896 |
+
},
|
| 3897 |
+
{
|
| 3898 |
+
"epoch": 0.4912441907723843,
|
| 3899 |
+
"grad_norm": 1.603667140007019,
|
| 3900 |
+
"learning_rate": 2.8274528283363765e-05,
|
| 3901 |
+
"loss": 0.2568,
|
| 3902 |
+
"step": 27800
|
| 3903 |
}
|
| 3904 |
],
|
| 3905 |
"logging_steps": 50,
|