Training in progress, step 41600, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1347,6 +1347,10 @@ You can finetune this model on your own dataset.
|
|
| 1347 |
| 0.7298 | 41300 | 0.3289 |
|
| 1348 |
| 0.7307 | 41350 | 0.3119 |
|
| 1349 |
| 0.7316 | 41400 | 0.3007 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1350 |
|
| 1351 |
</details>
|
| 1352 |
|
|
|
|
| 1347 |
| 0.7298 | 41300 | 0.3289 |
|
| 1348 |
| 0.7307 | 41350 | 0.3119 |
|
| 1349 |
| 0.7316 | 41400 | 0.3007 |
|
| 1350 |
+
| 0.7324 | 41450 | 0.3499 |
|
| 1351 |
+
| 0.7333 | 41500 | 0.3016 |
|
| 1352 |
+
| 0.7342 | 41550 | 0.3232 |
|
| 1353 |
+
| 0.7351 | 41600 | 0.2577 |
|
| 1354 |
|
| 1355 |
</details>
|
| 1356 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5968fa9233e27ceab0b50d025526b14878df9c3a5cc0dd8ab8e3bfb4e8731159
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f9b287a89c14a672aa169e1144107274fac0f234f450dc15728e411970cfec4
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29c7015785925a4c92109508d00189934d2658c038f9a9b3126f34a88d70d109
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd530e72b22c1ce77a70b73b0e2553d90cdc69cb660d5df5b7ea28fe660cd767
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:36751f2c6aca47874fa4d1553b1d00dffae813bb24cca7967068d98d45a147e3
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5804,6 +5804,34 @@
|
|
| 5804 |
"learning_rate": 1.4929021617482478e-05,
|
| 5805 |
"loss": 0.3007,
|
| 5806 |
"step": 41400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5807 |
}
|
| 5808 |
],
|
| 5809 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.7350992207241435,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 41600,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5804 |
"learning_rate": 1.4929021617482478e-05,
|
| 5805 |
"loss": 0.3007,
|
| 5806 |
"step": 41400
|
| 5807 |
+
},
|
| 5808 |
+
{
|
| 5809 |
+
"epoch": 0.7324486225724939,
|
| 5810 |
+
"grad_norm": 2.910383939743042,
|
| 5811 |
+
"learning_rate": 1.4879935599143941e-05,
|
| 5812 |
+
"loss": 0.3499,
|
| 5813 |
+
"step": 41450
|
| 5814 |
+
},
|
| 5815 |
+
{
|
| 5816 |
+
"epoch": 0.7333321552897104,
|
| 5817 |
+
"grad_norm": 1.0191997289657593,
|
| 5818 |
+
"learning_rate": 1.4830849580805404e-05,
|
| 5819 |
+
"loss": 0.3016,
|
| 5820 |
+
"step": 41500
|
| 5821 |
+
},
|
| 5822 |
+
{
|
| 5823 |
+
"epoch": 0.7342156880069269,
|
| 5824 |
+
"grad_norm": 0.9859305620193481,
|
| 5825 |
+
"learning_rate": 1.4781763562466869e-05,
|
| 5826 |
+
"loss": 0.3232,
|
| 5827 |
+
"step": 41550
|
| 5828 |
+
},
|
| 5829 |
+
{
|
| 5830 |
+
"epoch": 0.7350992207241435,
|
| 5831 |
+
"grad_norm": 1.4275975227355957,
|
| 5832 |
+
"learning_rate": 1.4732677544128332e-05,
|
| 5833 |
+
"loss": 0.2577,
|
| 5834 |
+
"step": 41600
|
| 5835 |
}
|
| 5836 |
],
|
| 5837 |
"logging_steps": 50,
|