Training in progress, step 43800, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1391,6 +1391,10 @@ You can finetune this model on your own dataset.
|
|
| 1391 |
| 0.7687 | 43500 | 0.2443 |
|
| 1392 |
| 0.7696 | 43550 | 0.2998 |
|
| 1393 |
| 0.7704 | 43600 | 0.3619 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1394 |
|
| 1395 |
</details>
|
| 1396 |
|
|
|
|
| 1391 |
| 0.7687 | 43500 | 0.2443 |
|
| 1392 |
| 0.7696 | 43550 | 0.2998 |
|
| 1393 |
| 0.7704 | 43600 | 0.3619 |
|
| 1394 |
+
| 0.7713 | 43650 | 0.2586 |
|
| 1395 |
+
| 0.7722 | 43700 | 0.251 |
|
| 1396 |
+
| 0.7731 | 43750 | 0.3154 |
|
| 1397 |
+
| 0.7740 | 43800 | 0.3309 |
|
| 1398 |
|
| 1399 |
</details>
|
| 1400 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87245a00c511204e0c66583191ab9429ad97c78538541227c616f90b8381119e
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b6c1541af87dcd1797f9d736a3cac898e50e3ecafd501e98798ccab543ede07
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69c36e80b730b2d3f19367fe96dc275025a093a975c30683cdcf06771c2e520f
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c2a170b686e6b3841063ec2a8f0cf18b4985f4986723acd35709abf15d5c19e
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1960f4f5d6f42011bfc954842f6c57ccfbbc8ac7380b9fbe5cdcbb8bd1b0029
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -6112,6 +6112,34 @@
|
|
| 6112 |
"learning_rate": 1.2770218530953642e-05,
|
| 6113 |
"loss": 0.3619,
|
| 6114 |
"step": 43600
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6115 |
}
|
| 6116 |
],
|
| 6117 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.7739746602816703,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 43800,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 6112 |
"learning_rate": 1.2770218530953642e-05,
|
| 6113 |
"loss": 0.3619,
|
| 6114 |
"step": 43600
|
| 6115 |
+
},
|
| 6116 |
+
{
|
| 6117 |
+
"epoch": 0.7713240621300207,
|
| 6118 |
+
"grad_norm": 2.726393461227417,
|
| 6119 |
+
"learning_rate": 1.2721132512615109e-05,
|
| 6120 |
+
"loss": 0.2586,
|
| 6121 |
+
"step": 43650
|
| 6122 |
+
},
|
| 6123 |
+
{
|
| 6124 |
+
"epoch": 0.7722075948472372,
|
| 6125 |
+
"grad_norm": 1.146583080291748,
|
| 6126 |
+
"learning_rate": 1.2672046494276572e-05,
|
| 6127 |
+
"loss": 0.251,
|
| 6128 |
+
"step": 43700
|
| 6129 |
+
},
|
| 6130 |
+
{
|
| 6131 |
+
"epoch": 0.7730911275644538,
|
| 6132 |
+
"grad_norm": 1.2839117050170898,
|
| 6133 |
+
"learning_rate": 1.2622960475938033e-05,
|
| 6134 |
+
"loss": 0.3154,
|
| 6135 |
+
"step": 43750
|
| 6136 |
+
},
|
| 6137 |
+
{
|
| 6138 |
+
"epoch": 0.7739746602816703,
|
| 6139 |
+
"grad_norm": 1.3681036233901978,
|
| 6140 |
+
"learning_rate": 1.25738744575995e-05,
|
| 6141 |
+
"loss": 0.3309,
|
| 6142 |
+
"step": 43800
|
| 6143 |
}
|
| 6144 |
],
|
| 6145 |
"logging_steps": 50,
|