Training in progress, step 42800, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1371,6 +1371,10 @@ You can finetune this model on your own dataset.
|
|
| 1371 |
| 0.7510 | 42500 | 0.3433 |
|
| 1372 |
| 0.7519 | 42550 | 0.3273 |
|
| 1373 |
| 0.7528 | 42600 | 0.3123 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1374 |
|
| 1375 |
</details>
|
| 1376 |
|
|
|
|
| 1371 |
| 0.7510 | 42500 | 0.3433 |
|
| 1372 |
| 0.7519 | 42550 | 0.3273 |
|
| 1373 |
| 0.7528 | 42600 | 0.3123 |
|
| 1374 |
+
| 0.7537 | 42650 | 0.29 |
|
| 1375 |
+
| 0.7545 | 42700 | 0.3352 |
|
| 1376 |
+
| 0.7554 | 42750 | 0.3143 |
|
| 1377 |
+
| 0.7563 | 42800 | 0.2833 |
|
| 1378 |
|
| 1379 |
</details>
|
| 1380 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:947ad26bf0a1ea98a40d7847b1d4081968d0ea03f777dd415d118a3341c7d595
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fbe6b037eef5d6174a1e64a06f40631b730395d9ff0774dfc1245b870b5a756f
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a0a70fc822cbf0577f57f474f054d71e07e1660e7791d186284f5053153721d
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31395f18239b3bc788fb9174ae1acda597a1a3b63f5595848ade3391438691e5
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff01474c5f0e5dbd5aec03f387f08f61e0a9ae8d77c69168920103f17f16f317
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5972,6 +5972,34 @@
|
|
| 5972 |
"learning_rate": 1.3750957177357601e-05,
|
| 5973 |
"loss": 0.3123,
|
| 5974 |
"step": 42600
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5975 |
}
|
| 5976 |
],
|
| 5977 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.7563040059373398,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 42800,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5972 |
"learning_rate": 1.3750957177357601e-05,
|
| 5973 |
"loss": 0.3123,
|
| 5974 |
"step": 42600
|
| 5975 |
+
},
|
| 5976 |
+
{
|
| 5977 |
+
"epoch": 0.7536534077856903,
|
| 5978 |
+
"grad_norm": 4.600383758544922,
|
| 5979 |
+
"learning_rate": 1.3701871159019066e-05,
|
| 5980 |
+
"loss": 0.29,
|
| 5981 |
+
"step": 42650
|
| 5982 |
+
},
|
| 5983 |
+
{
|
| 5984 |
+
"epoch": 0.7545369405029069,
|
| 5985 |
+
"grad_norm": 4.080932140350342,
|
| 5986 |
+
"learning_rate": 1.3652785140680529e-05,
|
| 5987 |
+
"loss": 0.3352,
|
| 5988 |
+
"step": 42700
|
| 5989 |
+
},
|
| 5990 |
+
{
|
| 5991 |
+
"epoch": 0.7554204732201233,
|
| 5992 |
+
"grad_norm": 1.4026703834533691,
|
| 5993 |
+
"learning_rate": 1.3603699122341992e-05,
|
| 5994 |
+
"loss": 0.3143,
|
| 5995 |
+
"step": 42750
|
| 5996 |
+
},
|
| 5997 |
+
{
|
| 5998 |
+
"epoch": 0.7563040059373398,
|
| 5999 |
+
"grad_norm": 1.4037362337112427,
|
| 6000 |
+
"learning_rate": 1.3555594824370226e-05,
|
| 6001 |
+
"loss": 0.2833,
|
| 6002 |
+
"step": 42800
|
| 6003 |
}
|
| 6004 |
],
|
| 6005 |
"logging_steps": 50,
|