Training in progress, step 16600, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1355,6 +1355,10 @@ You can finetune this model on your own dataset.
|
|
| 1355 |
| 0.2880 | 16300 | 0.3508 |
|
| 1356 |
| 0.2889 | 16350 | 0.3443 |
|
| 1357 |
| 0.2898 | 16400 | 0.4346 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1358 |
|
| 1359 |
</details>
|
| 1360 |
|
|
|
|
| 1355 |
| 0.2880 | 16300 | 0.3508 |
|
| 1356 |
| 0.2889 | 16350 | 0.3443 |
|
| 1357 |
| 0.2898 | 16400 | 0.4346 |
|
| 1358 |
+
| 0.2907 | 16450 | 0.4262 |
|
| 1359 |
+
| 0.2916 | 16500 | 0.3065 |
|
| 1360 |
+
| 0.2924 | 16550 | 0.4003 |
|
| 1361 |
+
| 0.2933 | 16600 | 0.5295 |
|
| 1362 |
|
| 1363 |
</details>
|
| 1364 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bdc8b58e69308ebfbfc0eb50f8d94cc9702cadcdc42e3254287236a6a1b09a4e
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:705df85026bb51643b710bf960103e3bb1661185afb2f1e06a383d34dc56e4bf
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f891a9e7af458bc02af6e87abb160c7f8d056d1f22f1437aa987e99557c38c6d
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ec9685408ff856249d18165c59f9d1d95d1e000415171f3550ac55d011d4b84
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4750d7049889a8742682de7ab1e907cdb0b4e5ab032bf6b9deca530e9913b39d
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -2304,6 +2304,34 @@
|
|
| 2304 |
"learning_rate": 3.946025014234945e-05,
|
| 2305 |
"loss": 0.4346,
|
| 2306 |
"step": 16400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2307 |
}
|
| 2308 |
],
|
| 2309 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.29333286211588416,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 16600,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 2304 |
"learning_rate": 3.946025014234945e-05,
|
| 2305 |
"loss": 0.4346,
|
| 2306 |
"step": 16400
|
| 2307 |
+
},
|
| 2308 |
+
{
|
| 2309 |
+
"epoch": 0.2906822639642346,
|
| 2310 |
+
"grad_norm": 1.9500783681869507,
|
| 2311 |
+
"learning_rate": 3.941116412401092e-05,
|
| 2312 |
+
"loss": 0.4262,
|
| 2313 |
+
"step": 16450
|
| 2314 |
+
},
|
| 2315 |
+
{
|
| 2316 |
+
"epoch": 0.2915657966814511,
|
| 2317 |
+
"grad_norm": 1.344519853591919,
|
| 2318 |
+
"learning_rate": 3.936207810567238e-05,
|
| 2319 |
+
"loss": 0.3065,
|
| 2320 |
+
"step": 16500
|
| 2321 |
+
},
|
| 2322 |
+
{
|
| 2323 |
+
"epoch": 0.29244932939866763,
|
| 2324 |
+
"grad_norm": 1.4747456312179565,
|
| 2325 |
+
"learning_rate": 3.9312992087333846e-05,
|
| 2326 |
+
"loss": 0.4003,
|
| 2327 |
+
"step": 16550
|
| 2328 |
+
},
|
| 2329 |
+
{
|
| 2330 |
+
"epoch": 0.29333286211588416,
|
| 2331 |
+
"grad_norm": 1.5639158487319946,
|
| 2332 |
+
"learning_rate": 3.926390606899531e-05,
|
| 2333 |
+
"loss": 0.5295,
|
| 2334 |
+
"step": 16600
|
| 2335 |
}
|
| 2336 |
],
|
| 2337 |
"logging_steps": 50,
|