Training in progress, step 38200, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1277,6 +1277,10 @@ You can finetune this model on your own dataset.
|
|
| 1277 |
| 0.6697 | 37900 | 0.287 |
|
| 1278 |
| 0.6706 | 37950 | 0.267 |
|
| 1279 |
| 0.6715 | 38000 | 0.2862 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1280 |
|
| 1281 |
|
| 1282 |
### Framework Versions
|
|
|
|
| 1277 |
| 0.6697 | 37900 | 0.287 |
|
| 1278 |
| 0.6706 | 37950 | 0.267 |
|
| 1279 |
| 0.6715 | 38000 | 0.2862 |
|
| 1280 |
+
| 0.6724 | 38050 | 0.2931 |
|
| 1281 |
+
| 0.6733 | 38100 | 0.3039 |
|
| 1282 |
+
| 0.6741 | 38150 | 0.3067 |
|
| 1283 |
+
| 0.6750 | 38200 | 0.3072 |
|
| 1284 |
|
| 1285 |
|
| 1286 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75ff9aaaf5100bcdf47810c9aef74f277666d0563b69786a02f96d2765837422
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e4f4dca1f6c69a542bde78c0327dd4270176a1625067e2256ceced634a93d6c
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:21df5a3de36303453637c6260c11dc60608b83605f06af49a76c4215097f965f
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:254ca1be196224bf5f7fb5303e3156f8228d188caec22f35ae76f9309a50e396
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8546f3abee9c0d442ca93d26c327328480bf0ee1f8248e94c717f8d8cb3ba4b
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5328,6 +5328,34 @@
|
|
| 5328 |
"learning_rate": 1.8264907423769416e-05,
|
| 5329 |
"loss": 0.2862,
|
| 5330 |
"step": 38000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5331 |
}
|
| 5332 |
],
|
| 5333 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.6750189959534202,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 38200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5328 |
"learning_rate": 1.8264907423769416e-05,
|
| 5329 |
"loss": 0.2862,
|
| 5330 |
"step": 38000
|
| 5331 |
+
},
|
| 5332 |
+
{
|
| 5333 |
+
"epoch": 0.6723683978017706,
|
| 5334 |
+
"grad_norm": 1.389864444732666,
|
| 5335 |
+
"learning_rate": 1.8215821405430877e-05,
|
| 5336 |
+
"loss": 0.2931,
|
| 5337 |
+
"step": 38050
|
| 5338 |
+
},
|
| 5339 |
+
{
|
| 5340 |
+
"epoch": 0.6732519305189871,
|
| 5341 |
+
"grad_norm": 1.2709695100784302,
|
| 5342 |
+
"learning_rate": 1.816673538709234e-05,
|
| 5343 |
+
"loss": 0.3039,
|
| 5344 |
+
"step": 38100
|
| 5345 |
+
},
|
| 5346 |
+
{
|
| 5347 |
+
"epoch": 0.6741354632362037,
|
| 5348 |
+
"grad_norm": 1.2036606073379517,
|
| 5349 |
+
"learning_rate": 1.8117649368753806e-05,
|
| 5350 |
+
"loss": 0.3067,
|
| 5351 |
+
"step": 38150
|
| 5352 |
+
},
|
| 5353 |
+
{
|
| 5354 |
+
"epoch": 0.6750189959534202,
|
| 5355 |
+
"grad_norm": 1.3336296081542969,
|
| 5356 |
+
"learning_rate": 1.8068563350415268e-05,
|
| 5357 |
+
"loss": 0.3072,
|
| 5358 |
+
"step": 38200
|
| 5359 |
}
|
| 5360 |
],
|
| 5361 |
"logging_steps": 50,
|