Training in progress, step 28000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1217,6 +1217,10 @@ You can finetune this model on your own dataset.
|
|
| 1217 |
| 0.4895 | 27700 | 0.3397 |
|
| 1218 |
| 0.4904 | 27750 | 0.3853 |
|
| 1219 |
| 0.4912 | 27800 | 0.2568 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1220 |
|
| 1221 |
|
| 1222 |
### Framework Versions
|
|
|
|
| 1217 |
| 0.4895 | 27700 | 0.3397 |
|
| 1218 |
| 0.4904 | 27750 | 0.3853 |
|
| 1219 |
| 0.4912 | 27800 | 0.2568 |
|
| 1220 |
+
| 0.4921 | 27850 | 0.3108 |
|
| 1221 |
+
| 0.4930 | 27900 | 0.4098 |
|
| 1222 |
+
| 0.4939 | 27950 | 0.3364 |
|
| 1223 |
+
| 0.4948 | 28000 | 0.3354 |
|
| 1224 |
|
| 1225 |
|
| 1226 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de68ecb62cb177a69e2ea7a2d8815c238cc32cec342188055a5fefa4de66dcc5
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e99ec639b3e9bec0cbb3889051137c9795f5cf34c03f83c5e27e4203004378a8
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b2bb1065a03f3a3cc81b13be34dd1b158c384419d61db5c56d91448ea10ea2e
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b46b4db6042cc9cc0d2e82b27079ac2205bbc9a103068ad0178d3c56c11b3021
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b4cd14cf09830d2d2a5966f0c329a3b566132e79593057303cd71a113d5be9d
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -3900,6 +3900,34 @@
|
|
| 3900 |
"learning_rate": 2.8274528283363765e-05,
|
| 3901 |
"loss": 0.2568,
|
| 3902 |
"step": 27800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3903 |
}
|
| 3904 |
],
|
| 3905 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.49477832164125035,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 28000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 3900 |
"learning_rate": 2.8274528283363765e-05,
|
| 3901 |
"loss": 0.2568,
|
| 3902 |
"step": 27800
|
| 3903 |
+
},
|
| 3904 |
+
{
|
| 3905 |
+
"epoch": 0.4921277234896008,
|
| 3906 |
+
"grad_norm": 1.727280855178833,
|
| 3907 |
+
"learning_rate": 2.8225442265025233e-05,
|
| 3908 |
+
"loss": 0.3108,
|
| 3909 |
+
"step": 27850
|
| 3910 |
+
},
|
| 3911 |
+
{
|
| 3912 |
+
"epoch": 0.49301125620681735,
|
| 3913 |
+
"grad_norm": 1.4632737636566162,
|
| 3914 |
+
"learning_rate": 2.8176356246686697e-05,
|
| 3915 |
+
"loss": 0.4098,
|
| 3916 |
+
"step": 27900
|
| 3917 |
+
},
|
| 3918 |
+
{
|
| 3919 |
+
"epoch": 0.4938947889240339,
|
| 3920 |
+
"grad_norm": 1.5443991422653198,
|
| 3921 |
+
"learning_rate": 2.812727022834816e-05,
|
| 3922 |
+
"loss": 0.3364,
|
| 3923 |
+
"step": 27950
|
| 3924 |
+
},
|
| 3925 |
+
{
|
| 3926 |
+
"epoch": 0.49477832164125035,
|
| 3927 |
+
"grad_norm": 1.7304097414016724,
|
| 3928 |
+
"learning_rate": 2.8078184210009623e-05,
|
| 3929 |
+
"loss": 0.3354,
|
| 3930 |
+
"step": 28000
|
| 3931 |
}
|
| 3932 |
],
|
| 3933 |
"logging_steps": 50,
|