Training in progress, step 34800, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1209,6 +1209,10 @@ You can finetune this model on your own dataset.
|
|
| 1209 |
| 0.6096 | 34500 | 0.4175 |
|
| 1210 |
| 0.6105 | 34550 | 0.3104 |
|
| 1211 |
| 0.6114 | 34600 | 0.3305 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1212 |
|
| 1213 |
|
| 1214 |
### Framework Versions
|
|
|
|
| 1209 |
| 0.6096 | 34500 | 0.4175 |
|
| 1210 |
| 0.6105 | 34550 | 0.3104 |
|
| 1211 |
| 0.6114 | 34600 | 0.3305 |
|
| 1212 |
+
| 0.6123 | 34650 | 0.2832 |
|
| 1213 |
+
| 0.6132 | 34700 | 0.3007 |
|
| 1214 |
+
| 0.6141 | 34750 | 0.3932 |
|
| 1215 |
+
| 0.6149 | 34800 | 0.3 |
|
| 1216 |
|
| 1217 |
|
| 1218 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:78346a0c56430d22fa1490f284416b4aeee8fb9539989a398220c805d75e2e61
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:332311a89c1a8130797191a2ad7878850bf8a5f8687fb07aa8ce26dd6bf3aca2
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:663998c1aaed54adecb3878007dbade857c46ba6a1c5eaffb67717a822135458
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:480efcc1d108b2db853c5d91deb1ed2fd305f7b9cbbdf50854f3a85cc79a1117
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e917b101e0be67dbb3890bb4d8dceac22ecd3870c266a2b20cb6488727437a58
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4852,6 +4852,34 @@
|
|
| 4852 |
"learning_rate": 2.1601774950423123e-05,
|
| 4853 |
"loss": 0.3305,
|
| 4854 |
"step": 34600
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4855 |
}
|
| 4856 |
],
|
| 4857 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.6149387711826969,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 34800,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4852 |
"learning_rate": 2.1601774950423123e-05,
|
| 4853 |
"loss": 0.3305,
|
| 4854 |
"step": 34600
|
| 4855 |
+
},
|
| 4856 |
+
{
|
| 4857 |
+
"epoch": 0.6122881730310473,
|
| 4858 |
+
"grad_norm": 1.416923999786377,
|
| 4859 |
+
"learning_rate": 2.1552688932084584e-05,
|
| 4860 |
+
"loss": 0.2832,
|
| 4861 |
+
"step": 34650
|
| 4862 |
+
},
|
| 4863 |
+
{
|
| 4864 |
+
"epoch": 0.6131717057482639,
|
| 4865 |
+
"grad_norm": 1.7992863655090332,
|
| 4866 |
+
"learning_rate": 2.150360291374605e-05,
|
| 4867 |
+
"loss": 0.3007,
|
| 4868 |
+
"step": 34700
|
| 4869 |
+
},
|
| 4870 |
+
{
|
| 4871 |
+
"epoch": 0.6140552384654804,
|
| 4872 |
+
"grad_norm": 1.3988946676254272,
|
| 4873 |
+
"learning_rate": 2.1454516895407514e-05,
|
| 4874 |
+
"loss": 0.3932,
|
| 4875 |
+
"step": 34750
|
| 4876 |
+
},
|
| 4877 |
+
{
|
| 4878 |
+
"epoch": 0.6149387711826969,
|
| 4879 |
+
"grad_norm": 1.7125048637390137,
|
| 4880 |
+
"learning_rate": 2.1405430877068978e-05,
|
| 4881 |
+
"loss": 0.3,
|
| 4882 |
+
"step": 34800
|
| 4883 |
}
|
| 4884 |
],
|
| 4885 |
"logging_steps": 50,
|