Training in progress, step 38000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1273,6 +1273,10 @@ You can finetune this model on your own dataset.
|
|
| 1273 |
| 0.6662 | 37700 | 0.3 |
|
| 1274 |
| 0.6671 | 37750 | 0.3147 |
|
| 1275 |
| 0.6680 | 37800 | 0.2895 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1276 |
|
| 1277 |
|
| 1278 |
### Framework Versions
|
|
|
|
| 1273 |
| 0.6662 | 37700 | 0.3 |
|
| 1274 |
| 0.6671 | 37750 | 0.3147 |
|
| 1275 |
| 0.6680 | 37800 | 0.2895 |
|
| 1276 |
+
| 0.6688 | 37850 | 0.2649 |
|
| 1277 |
+
| 0.6697 | 37900 | 0.287 |
|
| 1278 |
+
| 0.6706 | 37950 | 0.267 |
|
| 1279 |
+
| 0.6715 | 38000 | 0.2862 |
|
| 1280 |
|
| 1281 |
|
| 1282 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0d08023f1bb62ce1d0130d07526322a2c5fda70606088482affec032e342b5c
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8b44bc19e6a23e08867d09cb20779d3a37e861123bffe86f50954d881ed4c90
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28b8300b2a2312e0bd0c6c541da810ac2f229a1e589baac1c616b441c52c2040
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c9e92d7ca7e11f8c8280a110c0e95f7fc8368104e07cf4940880e3ea39426da
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:604774c1c43f2a9fc2aaee736abd7cd490fcb173a1997d86fd932e858e22ca53
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5300,6 +5300,34 @@
|
|
| 5300 |
"learning_rate": 1.846125149712356e-05,
|
| 5301 |
"loss": 0.2895,
|
| 5302 |
"step": 37800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5303 |
}
|
| 5304 |
],
|
| 5305 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.6714848650845541,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 38000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5300 |
"learning_rate": 1.846125149712356e-05,
|
| 5301 |
"loss": 0.2895,
|
| 5302 |
"step": 37800
|
| 5303 |
+
},
|
| 5304 |
+
{
|
| 5305 |
+
"epoch": 0.6688342669329045,
|
| 5306 |
+
"grad_norm": 1.7297286987304688,
|
| 5307 |
+
"learning_rate": 1.8412165478785025e-05,
|
| 5308 |
+
"loss": 0.2649,
|
| 5309 |
+
"step": 37850
|
| 5310 |
+
},
|
| 5311 |
+
{
|
| 5312 |
+
"epoch": 0.669717799650121,
|
| 5313 |
+
"grad_norm": 1.2361524105072021,
|
| 5314 |
+
"learning_rate": 1.8363079460446486e-05,
|
| 5315 |
+
"loss": 0.287,
|
| 5316 |
+
"step": 37900
|
| 5317 |
+
},
|
| 5318 |
+
{
|
| 5319 |
+
"epoch": 0.6706013323673375,
|
| 5320 |
+
"grad_norm": 1.472721815109253,
|
| 5321 |
+
"learning_rate": 1.831399344210795e-05,
|
| 5322 |
+
"loss": 0.267,
|
| 5323 |
+
"step": 37950
|
| 5324 |
+
},
|
| 5325 |
+
{
|
| 5326 |
+
"epoch": 0.6714848650845541,
|
| 5327 |
+
"grad_norm": 1.7498071193695068,
|
| 5328 |
+
"learning_rate": 1.8264907423769416e-05,
|
| 5329 |
+
"loss": 0.2862,
|
| 5330 |
+
"step": 38000
|
| 5331 |
}
|
| 5332 |
],
|
| 5333 |
"logging_steps": 50,
|