Training in progress, step 37600, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1265,6 +1265,10 @@ You can finetune this model on your own dataset.
|
|
| 1265 |
| 0.6591 | 37300 | 0.2822 |
|
| 1266 |
| 0.6600 | 37350 | 0.2538 |
|
| 1267 |
| 0.6609 | 37400 | 0.2212 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1268 |
|
| 1269 |
|
| 1270 |
### Framework Versions
|
|
|
|
| 1265 |
| 0.6591 | 37300 | 0.2822 |
|
| 1266 |
| 0.6600 | 37350 | 0.2538 |
|
| 1267 |
| 0.6609 | 37400 | 0.2212 |
|
| 1268 |
+
| 0.6618 | 37450 | 0.2687 |
|
| 1269 |
+
| 0.6626 | 37500 | 0.3288 |
|
| 1270 |
+
| 0.6635 | 37550 | 0.4221 |
|
| 1271 |
+
| 0.6644 | 37600 | 0.3711 |
|
| 1272 |
|
| 1273 |
|
| 1274 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:49cc2b93728e49de217dc60cd367d1893bf2f9bed3ceb4afe515eabf48f6ed08
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:336c01379450b237f69846bbca72ce99e84b15f94ed370646502b855f060fb86
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d1e5086acf3138ad2715b1b0217454786680720f4c61739eebdb529556b78ae
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa03be736ad2e04b4837e2c32a43b6b3386812b76663243651e6e6a4bb8fb202
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:188c2cbd8075ea7a1b7865239bd6d95b63ebe7d536a5366864b0e98bf73e24a0
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5244,6 +5244,34 @@
|
|
| 5244 |
"learning_rate": 1.8853939643831853e-05,
|
| 5245 |
"loss": 0.2212,
|
| 5246 |
"step": 37400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5247 |
}
|
| 5248 |
],
|
| 5249 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.664416603346822,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 37600,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5244 |
"learning_rate": 1.8853939643831853e-05,
|
| 5245 |
"loss": 0.2212,
|
| 5246 |
"step": 37400
|
| 5247 |
+
},
|
| 5248 |
+
{
|
| 5249 |
+
"epoch": 0.6617660051951724,
|
| 5250 |
+
"grad_norm": 1.2916769981384277,
|
| 5251 |
+
"learning_rate": 1.8804853625493314e-05,
|
| 5252 |
+
"loss": 0.2687,
|
| 5253 |
+
"step": 37450
|
| 5254 |
+
},
|
| 5255 |
+
{
|
| 5256 |
+
"epoch": 0.6626495379123889,
|
| 5257 |
+
"grad_norm": 1.5212571620941162,
|
| 5258 |
+
"learning_rate": 1.875576760715478e-05,
|
| 5259 |
+
"loss": 0.3288,
|
| 5260 |
+
"step": 37500
|
| 5261 |
+
},
|
| 5262 |
+
{
|
| 5263 |
+
"epoch": 0.6635330706296054,
|
| 5264 |
+
"grad_norm": 1.5829190015792847,
|
| 5265 |
+
"learning_rate": 1.870668158881624e-05,
|
| 5266 |
+
"loss": 0.4221,
|
| 5267 |
+
"step": 37550
|
| 5268 |
+
},
|
| 5269 |
+
{
|
| 5270 |
+
"epoch": 0.664416603346822,
|
| 5271 |
+
"grad_norm": 1.4784077405929565,
|
| 5272 |
+
"learning_rate": 1.8657595570477705e-05,
|
| 5273 |
+
"loss": 0.3711,
|
| 5274 |
+
"step": 37600
|
| 5275 |
}
|
| 5276 |
],
|
| 5277 |
"logging_steps": 50,
|