Training in progress, step 27400, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1205,6 +1205,10 @@ You can finetune this model on your own dataset.
|
|
| 1205 |
| 0.4789 | 27100 | 0.2753 |
|
| 1206 |
| 0.4798 | 27150 | 0.35 |
|
| 1207 |
| 0.4806 | 27200 | 0.3143 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1208 |
|
| 1209 |
|
| 1210 |
### Framework Versions
|
|
|
|
| 1205 |
| 0.4789 | 27100 | 0.2753 |
|
| 1206 |
| 0.4798 | 27150 | 0.35 |
|
| 1207 |
| 0.4806 | 27200 | 0.3143 |
|
| 1208 |
+
| 0.4815 | 27250 | 0.3968 |
|
| 1209 |
+
| 0.4824 | 27300 | 0.3246 |
|
| 1210 |
+
| 0.4833 | 27350 | 0.3131 |
|
| 1211 |
+
| 0.4842 | 27400 | 0.3078 |
|
| 1212 |
|
| 1213 |
|
| 1214 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e42bafc26f64fc942eebe9b36d05cb9ebd690bc7e84350aba5ef5927bebd23aa
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86493a89e1b924fce58823b6948f096f29423c5ce2b1e2b2de815c28e7f95699
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f1ffba3c8137c0af09582c28fee3245b77ce6875ddb2ff1a79f1003af6257b2b
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d79db97c4b1cd4a4d432cc88a5b1b07dc74a6838264e86b10e57ab5d0be29f45
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:10c98a9a1e72b7cb62494c74d5b84c2a61b0c8fb7089e16aa24c2bd64d181a5f
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -3816,6 +3816,34 @@
|
|
| 3816 |
"learning_rate": 2.8863560503426205e-05,
|
| 3817 |
"loss": 0.3143,
|
| 3818 |
"step": 27200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3819 |
}
|
| 3820 |
],
|
| 3821 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.4841759290346522,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 27400,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 3816 |
"learning_rate": 2.8863560503426205e-05,
|
| 3817 |
"loss": 0.3143,
|
| 3818 |
"step": 27200
|
| 3819 |
+
},
|
| 3820 |
+
{
|
| 3821 |
+
"epoch": 0.4815253308830026,
|
| 3822 |
+
"grad_norm": 1.6409038305282593,
|
| 3823 |
+
"learning_rate": 2.8814474485087667e-05,
|
| 3824 |
+
"loss": 0.3968,
|
| 3825 |
+
"step": 27250
|
| 3826 |
+
},
|
| 3827 |
+
{
|
| 3828 |
+
"epoch": 0.4824088636002191,
|
| 3829 |
+
"grad_norm": 1.4830607175827026,
|
| 3830 |
+
"learning_rate": 2.876538846674913e-05,
|
| 3831 |
+
"loss": 0.3246,
|
| 3832 |
+
"step": 27300
|
| 3833 |
+
},
|
| 3834 |
+
{
|
| 3835 |
+
"epoch": 0.48329239631743565,
|
| 3836 |
+
"grad_norm": 1.6359367370605469,
|
| 3837 |
+
"learning_rate": 2.87163024484106e-05,
|
| 3838 |
+
"loss": 0.3131,
|
| 3839 |
+
"step": 27350
|
| 3840 |
+
},
|
| 3841 |
+
{
|
| 3842 |
+
"epoch": 0.4841759290346522,
|
| 3843 |
+
"grad_norm": 1.1834681034088135,
|
| 3844 |
+
"learning_rate": 2.8667216430072057e-05,
|
| 3845 |
+
"loss": 0.3078,
|
| 3846 |
+
"step": 27400
|
| 3847 |
}
|
| 3848 |
],
|
| 3849 |
"logging_steps": 50,
|