Training in progress, step 19400, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1411,6 +1411,10 @@ You can finetune this model on your own dataset.
|
|
| 1411 |
| 0.3375 | 19100 | 0.4034 |
|
| 1412 |
| 0.3384 | 19150 | 0.3476 |
|
| 1413 |
| 0.3393 | 19200 | 0.363 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1414 |
|
| 1415 |
</details>
|
| 1416 |
|
|
|
|
| 1411 |
| 0.3375 | 19100 | 0.4034 |
|
| 1412 |
| 0.3384 | 19150 | 0.3476 |
|
| 1413 |
| 0.3393 | 19200 | 0.363 |
|
| 1414 |
+
| 0.3402 | 19250 | 0.3182 |
|
| 1415 |
+
| 0.3410 | 19300 | 0.3238 |
|
| 1416 |
+
| 0.3419 | 19350 | 0.3043 |
|
| 1417 |
+
| 0.3428 | 19400 | 0.3902 |
|
| 1418 |
|
| 1419 |
</details>
|
| 1420 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c809593a4e810558b7888d3e612f15efc51c5db37b7d0556584318528272574d
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:415abbc1cb409cdbfc5f39cef8004307a437f7f9f53d32a212cdbb581c0e45e1
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d2ab8a0a44cb42f1e8599f3d83384df303f90a2cb7c743c1865d9517262e7ef
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1362f5572f2c24512c1a63574772877b23a9cc814bbc44fff72e3cde5341c40a
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:404504f0a70dc9bf558ab7039928bcb08279726175fd39a9b8bf44633e9ee073
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -2696,6 +2696,34 @@
|
|
| 2696 |
"learning_rate": 3.671339655612496e-05,
|
| 2697 |
"loss": 0.363,
|
| 2698 |
"step": 19200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2699 |
}
|
| 2700 |
],
|
| 2701 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.3428106942800092,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 19400,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 2696 |
"learning_rate": 3.671339655612496e-05,
|
| 2697 |
"loss": 0.363,
|
| 2698 |
"step": 19200
|
| 2699 |
+
},
|
| 2700 |
+
{
|
| 2701 |
+
"epoch": 0.3401600961283596,
|
| 2702 |
+
"grad_norm": 1.965834379196167,
|
| 2703 |
+
"learning_rate": 3.666431053778642e-05,
|
| 2704 |
+
"loss": 0.3182,
|
| 2705 |
+
"step": 19250
|
| 2706 |
+
},
|
| 2707 |
+
{
|
| 2708 |
+
"epoch": 0.34104362884557615,
|
| 2709 |
+
"grad_norm": 1.607900857925415,
|
| 2710 |
+
"learning_rate": 3.661522451944788e-05,
|
| 2711 |
+
"loss": 0.3238,
|
| 2712 |
+
"step": 19300
|
| 2713 |
+
},
|
| 2714 |
+
{
|
| 2715 |
+
"epoch": 0.3419271615627927,
|
| 2716 |
+
"grad_norm": 1.4051165580749512,
|
| 2717 |
+
"learning_rate": 3.6566138501109346e-05,
|
| 2718 |
+
"loss": 0.3043,
|
| 2719 |
+
"step": 19350
|
| 2720 |
+
},
|
| 2721 |
+
{
|
| 2722 |
+
"epoch": 0.3428106942800092,
|
| 2723 |
+
"grad_norm": 1.4679523706436157,
|
| 2724 |
+
"learning_rate": 3.651705248277081e-05,
|
| 2725 |
+
"loss": 0.3902,
|
| 2726 |
+
"step": 19400
|
| 2727 |
}
|
| 2728 |
],
|
| 2729 |
"logging_steps": 50,
|