Training in progress, step 48600, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1261,6 +1261,10 @@ You can finetune this model on your own dataset.
|
|
| 1261 |
| 0.8535 | 48300 | 0.2645 |
|
| 1262 |
| 0.8544 | 48350 | 0.3358 |
|
| 1263 |
| 0.8553 | 48400 | 0.2939 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1264 |
|
| 1265 |
|
| 1266 |
### Framework Versions
|
|
|
|
| 1261 |
| 0.8535 | 48300 | 0.2645 |
|
| 1262 |
| 0.8544 | 48350 | 0.3358 |
|
| 1263 |
| 0.8553 | 48400 | 0.2939 |
|
| 1264 |
+
| 0.8561 | 48450 | 0.4063 |
|
| 1265 |
+
| 0.8570 | 48500 | 0.3492 |
|
| 1266 |
+
| 0.8579 | 48550 | 0.2794 |
|
| 1267 |
+
| 0.8588 | 48600 | 0.2854 |
|
| 1268 |
|
| 1269 |
|
| 1270 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3f97e4be59707659beabd834e11f6a65a7292265dfb49c2caf9bc89b0c6716a
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:48984ae26e348d11908c5f2745c34cd2def85ea7c810d9fbea301d1fb62f8737
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7b99c2c71b3197a1fb7e795c175200808e384737d0136671189f7f54df62c39
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05d2345a7bbddb12fb6a365e62bd73e47296785a601a5379725821a73d3794f3
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:53bf9eae9141600b1f20ec91bc52ae342d59856e71a200d65bc37505fde53a5f
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -6784,6 +6784,34 @@
|
|
| 6784 |
"learning_rate": 8.059924211187687e-06,
|
| 6785 |
"loss": 0.2939,
|
| 6786 |
"step": 48400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6787 |
}
|
| 6788 |
],
|
| 6789 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.858793801134456,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 48600,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 6784 |
"learning_rate": 8.059924211187687e-06,
|
| 6785 |
"loss": 0.2939,
|
| 6786 |
"step": 48400
|
| 6787 |
+
},
|
| 6788 |
+
{
|
| 6789 |
+
"epoch": 0.8561432029828064,
|
| 6790 |
+
"grad_norm": 4.159787654876709,
|
| 6791 |
+
"learning_rate": 8.010838192849148e-06,
|
| 6792 |
+
"loss": 0.4063,
|
| 6793 |
+
"step": 48450
|
| 6794 |
+
},
|
| 6795 |
+
{
|
| 6796 |
+
"epoch": 0.857026735700023,
|
| 6797 |
+
"grad_norm": 2.129241466522217,
|
| 6798 |
+
"learning_rate": 7.961752174510613e-06,
|
| 6799 |
+
"loss": 0.3492,
|
| 6800 |
+
"step": 48500
|
| 6801 |
+
},
|
| 6802 |
+
{
|
| 6803 |
+
"epoch": 0.8579102684172395,
|
| 6804 |
+
"grad_norm": 1.48981511592865,
|
| 6805 |
+
"learning_rate": 7.912666156172076e-06,
|
| 6806 |
+
"loss": 0.2794,
|
| 6807 |
+
"step": 48550
|
| 6808 |
+
},
|
| 6809 |
+
{
|
| 6810 |
+
"epoch": 0.858793801134456,
|
| 6811 |
+
"grad_norm": 2.017918348312378,
|
| 6812 |
+
"learning_rate": 7.86358013783354e-06,
|
| 6813 |
+
"loss": 0.2854,
|
| 6814 |
+
"step": 48600
|
| 6815 |
}
|
| 6816 |
],
|
| 6817 |
"logging_steps": 50,
|