Training in progress, step 40400, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1323,6 +1323,10 @@ You can finetune this model on your own dataset.
|
|
| 1323 |
| 0.7086 | 40100 | 0.2649 |
|
| 1324 |
| 0.7095 | 40150 | 0.3184 |
|
| 1325 |
| 0.7104 | 40200 | 0.334 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1326 |
|
| 1327 |
</details>
|
| 1328 |
|
|
|
|
| 1323 |
| 0.7086 | 40100 | 0.2649 |
|
| 1324 |
| 0.7095 | 40150 | 0.3184 |
|
| 1325 |
| 0.7104 | 40200 | 0.334 |
|
| 1326 |
+
| 0.7112 | 40250 | 0.3609 |
|
| 1327 |
+
| 0.7121 | 40300 | 0.306 |
|
| 1328 |
+
| 0.7130 | 40350 | 0.2629 |
|
| 1329 |
+
| 0.7139 | 40400 | 0.2311 |
|
| 1330 |
|
| 1331 |
</details>
|
| 1332 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a50f06d6c0fd8326af39a398662f171a8273231c42342726a949dca804e1fec3
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a31f8e8daa44a5969c8468131e422d3890bd1b3dfc09e140da75d5ff08dd8929
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8789e63d322628b9bf8ef047af43291db3bd5935067320bb834f1fe83567f97
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f096ecf59986ddd611fd8ea1bd90586f9039a1554c47a1316352f4e9e8082419
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8fca1118641eb340cc4f5e2369cd22f797bffa655fc6d743b877326b0bf15332
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5636,6 +5636,34 @@
|
|
| 5636 |
"learning_rate": 1.6106104337240583e-05,
|
| 5637 |
"loss": 0.334,
|
| 5638 |
"step": 40200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5639 |
}
|
| 5640 |
],
|
| 5641 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.713894435510947,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 40400,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5636 |
"learning_rate": 1.6106104337240583e-05,
|
| 5637 |
"loss": 0.334,
|
| 5638 |
"step": 40200
|
| 5639 |
+
},
|
| 5640 |
+
{
|
| 5641 |
+
"epoch": 0.7112438373592974,
|
| 5642 |
+
"grad_norm": 1.348560094833374,
|
| 5643 |
+
"learning_rate": 1.6057018318902045e-05,
|
| 5644 |
+
"loss": 0.3609,
|
| 5645 |
+
"step": 40250
|
| 5646 |
+
},
|
| 5647 |
+
{
|
| 5648 |
+
"epoch": 0.7121273700765139,
|
| 5649 |
+
"grad_norm": 0.9920164942741394,
|
| 5650 |
+
"learning_rate": 1.600793230056351e-05,
|
| 5651 |
+
"loss": 0.306,
|
| 5652 |
+
"step": 40300
|
| 5653 |
+
},
|
| 5654 |
+
{
|
| 5655 |
+
"epoch": 0.7130109027937305,
|
| 5656 |
+
"grad_norm": 1.3321669101715088,
|
| 5657 |
+
"learning_rate": 1.595884628222497e-05,
|
| 5658 |
+
"loss": 0.2629,
|
| 5659 |
+
"step": 40350
|
| 5660 |
+
},
|
| 5661 |
+
{
|
| 5662 |
+
"epoch": 0.713894435510947,
|
| 5663 |
+
"grad_norm": 1.257283329963684,
|
| 5664 |
+
"learning_rate": 1.5909760263886435e-05,
|
| 5665 |
+
"loss": 0.2311,
|
| 5666 |
+
"step": 40400
|
| 5667 |
}
|
| 5668 |
],
|
| 5669 |
"logging_steps": 50,
|