Training in progress, step 49600, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1281,6 +1281,10 @@ You can finetune this model on your own dataset.
|
|
| 1281 |
| 0.8712 | 49300 | 0.3008 |
|
| 1282 |
| 0.8720 | 49350 | 0.3406 |
|
| 1283 |
| 0.8729 | 49400 | 0.3348 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1284 |
|
| 1285 |
|
| 1286 |
### Framework Versions
|
|
|
|
| 1281 |
| 0.8712 | 49300 | 0.3008 |
|
| 1282 |
| 0.8720 | 49350 | 0.3406 |
|
| 1283 |
| 0.8729 | 49400 | 0.3348 |
|
| 1284 |
+
| 0.8738 | 49450 | 0.3021 |
|
| 1285 |
+
| 0.8747 | 49500 | 0.3182 |
|
| 1286 |
+
| 0.8756 | 49550 | 0.3063 |
|
| 1287 |
+
| 0.8765 | 49600 | 0.2385 |
|
| 1288 |
|
| 1289 |
|
| 1290 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8131e17a996f8828e5a4d3b270f9fd8ff6e941e36a00908536ef7a5e8550aaba
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e1ac75d8f0e3ef9befe27d47520e773ab09b8e31d1344e3def76ce5cd49eb10
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:281a95f6afaa2c9511c5ed8a9ce2381872188baca75f43c1972f2ab2f8eef316
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8cac657ef6092bde192981138bb915fe2e134b5e72b8ef8fc2e6cf2847fb45f5
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81093c41fdabf9a6d7f304a197f461407189d93225316dffdaf89ead0f00b3f5
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -6924,6 +6924,34 @@
|
|
| 6924 |
"learning_rate": 7.079185564783727e-06,
|
| 6925 |
"loss": 0.3348,
|
| 6926 |
"step": 49400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6927 |
}
|
| 6928 |
],
|
| 6929 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.8764644554787864,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 49600,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 6924 |
"learning_rate": 7.079185564783727e-06,
|
| 6925 |
"loss": 0.3348,
|
| 6926 |
"step": 49400
|
| 6927 |
+
},
|
| 6928 |
+
{
|
| 6929 |
+
"epoch": 0.8738138573271368,
|
| 6930 |
+
"grad_norm": 1.6337603330612183,
|
| 6931 |
+
"learning_rate": 7.03009954644519e-06,
|
| 6932 |
+
"loss": 0.3021,
|
| 6933 |
+
"step": 49450
|
| 6934 |
+
},
|
| 6935 |
+
{
|
| 6936 |
+
"epoch": 0.8746973900443533,
|
| 6937 |
+
"grad_norm": 1.4994523525238037,
|
| 6938 |
+
"learning_rate": 6.981013528106655e-06,
|
| 6939 |
+
"loss": 0.3182,
|
| 6940 |
+
"step": 49500
|
| 6941 |
+
},
|
| 6942 |
+
{
|
| 6943 |
+
"epoch": 0.8755809227615698,
|
| 6944 |
+
"grad_norm": 1.2485002279281616,
|
| 6945 |
+
"learning_rate": 6.9319275097681185e-06,
|
| 6946 |
+
"loss": 0.3063,
|
| 6947 |
+
"step": 49550
|
| 6948 |
+
},
|
| 6949 |
+
{
|
| 6950 |
+
"epoch": 0.8764644554787864,
|
| 6951 |
+
"grad_norm": 1.538524866104126,
|
| 6952 |
+
"learning_rate": 6.8828414914295815e-06,
|
| 6953 |
+
"loss": 0.2385,
|
| 6954 |
+
"step": 49600
|
| 6955 |
}
|
| 6956 |
],
|
| 6957 |
"logging_steps": 50,
|