Training in progress, step 35600, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1225,6 +1225,10 @@ You can finetune this model on your own dataset.
|
|
| 1225 |
| 0.6238 | 35300 | 0.3355 |
|
| 1226 |
| 0.6247 | 35350 | 0.3626 |
|
| 1227 |
| 0.6255 | 35400 | 0.2542 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1228 |
|
| 1229 |
|
| 1230 |
### Framework Versions
|
|
|
|
| 1225 |
| 0.6238 | 35300 | 0.3355 |
|
| 1226 |
| 0.6247 | 35350 | 0.3626 |
|
| 1227 |
| 0.6255 | 35400 | 0.2542 |
|
| 1228 |
+
| 0.6264 | 35450 | 0.2555 |
|
| 1229 |
+
| 0.6273 | 35500 | 0.3418 |
|
| 1230 |
+
| 0.6282 | 35550 | 0.3118 |
|
| 1231 |
+
| 0.6291 | 35600 | 0.2889 |
|
| 1232 |
|
| 1233 |
|
| 1234 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20174b6b2c2d93226ddeb321dbabd4bc1c8af76305e7d7148c8cc355e3d7cd60
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5a9d9a1fa3ca8642b4bdf418f1c296a72f8625176479edd5bcdc2533d1bdf26
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f3288273f695a1df0217fae4938baee576d7a5a6d2a38836aee6bceb6a8de02
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8450c711e1de0810b6e36b835decaee09acd21b4ab25d2432aa749fd8de4d2d4
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41e3f9784f622226c37c073ce2a64e597153fe7fa7c42f2778e8d0d5f771e26e
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4964,6 +4964,34 @@
|
|
| 4964 |
"learning_rate": 2.0816398657006537e-05,
|
| 4965 |
"loss": 0.2542,
|
| 4966 |
"step": 35400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4967 |
}
|
| 4968 |
],
|
| 4969 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.6290752946581611,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 35600,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4964 |
"learning_rate": 2.0816398657006537e-05,
|
| 4965 |
"loss": 0.2542,
|
| 4966 |
"step": 35400
|
| 4967 |
+
},
|
| 4968 |
+
{
|
| 4969 |
+
"epoch": 0.6264246965065117,
|
| 4970 |
+
"grad_norm": 1.4315252304077148,
|
| 4971 |
+
"learning_rate": 2.0767312638668002e-05,
|
| 4972 |
+
"loss": 0.2555,
|
| 4973 |
+
"step": 35450
|
| 4974 |
+
},
|
| 4975 |
+
{
|
| 4976 |
+
"epoch": 0.6273082292237282,
|
| 4977 |
+
"grad_norm": 2.861154079437256,
|
| 4978 |
+
"learning_rate": 2.0718226620329467e-05,
|
| 4979 |
+
"loss": 0.3418,
|
| 4980 |
+
"step": 35500
|
| 4981 |
+
},
|
| 4982 |
+
{
|
| 4983 |
+
"epoch": 0.6281917619409447,
|
| 4984 |
+
"grad_norm": 1.378416895866394,
|
| 4985 |
+
"learning_rate": 2.066914060199093e-05,
|
| 4986 |
+
"loss": 0.3118,
|
| 4987 |
+
"step": 35550
|
| 4988 |
+
},
|
| 4989 |
+
{
|
| 4990 |
+
"epoch": 0.6290752946581611,
|
| 4991 |
+
"grad_norm": 4.129642486572266,
|
| 4992 |
+
"learning_rate": 2.0620054583652393e-05,
|
| 4993 |
+
"loss": 0.2889,
|
| 4994 |
+
"step": 35600
|
| 4995 |
}
|
| 4996 |
],
|
| 4997 |
"logging_steps": 50,
|