Training in progress, step 30000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1257,6 +1257,10 @@ You can finetune this model on your own dataset.
|
|
| 1257 |
| 0.5248 | 29700 | 0.3791 |
|
| 1258 |
| 0.5257 | 29750 | 0.3346 |
|
| 1259 |
| 0.5266 | 29800 | 0.2743 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1260 |
|
| 1261 |
|
| 1262 |
### Framework Versions
|
|
|
|
| 1257 |
| 0.5248 | 29700 | 0.3791 |
|
| 1258 |
| 0.5257 | 29750 | 0.3346 |
|
| 1259 |
| 0.5266 | 29800 | 0.2743 |
|
| 1260 |
+
| 0.5275 | 29850 | 0.2927 |
|
| 1261 |
+
| 0.5284 | 29900 | 0.3775 |
|
| 1262 |
+
| 0.5292 | 29950 | 0.3114 |
|
| 1263 |
+
| 0.5301 | 30000 | 0.2383 |
|
| 1264 |
|
| 1265 |
|
| 1266 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7bb95ae4ccdc1225fa61fa51177153a06dac70457a68aef666cd0a1eed08ba1a
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71a7aa1c487fa54454696db788c6e152307a22042949edfa76090e98becd066e
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb7e98986a27a407adbceaabeb5013a890ed1e6ec34d83926bcddbcf669ec678
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:571d19b834362983e79e52affef058f87dcf5429e544d22e5fa9121931e62b84
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9f6718e4a878b8d1ac645f468a8f963dffffaa70e597cacccbc9fdb9c7011a3
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4180,6 +4180,34 @@
|
|
| 4180 |
"learning_rate": 2.631108754982231e-05,
|
| 4181 |
"loss": 0.2743,
|
| 4182 |
"step": 29800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4183 |
}
|
| 4184 |
],
|
| 4185 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.5301196303299112,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 30000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4180 |
"learning_rate": 2.631108754982231e-05,
|
| 4181 |
"loss": 0.2743,
|
| 4182 |
"step": 29800
|
| 4183 |
+
},
|
| 4184 |
+
{
|
| 4185 |
+
"epoch": 0.5274690321782616,
|
| 4186 |
+
"grad_norm": 1.63582181930542,
|
| 4187 |
+
"learning_rate": 2.6262001531483772e-05,
|
| 4188 |
+
"loss": 0.2927,
|
| 4189 |
+
"step": 29850
|
| 4190 |
+
},
|
| 4191 |
+
{
|
| 4192 |
+
"epoch": 0.5283525648954781,
|
| 4193 |
+
"grad_norm": 1.843386173248291,
|
| 4194 |
+
"learning_rate": 2.6212915513145237e-05,
|
| 4195 |
+
"loss": 0.3775,
|
| 4196 |
+
"step": 29900
|
| 4197 |
+
},
|
| 4198 |
+
{
|
| 4199 |
+
"epoch": 0.5292360976126946,
|
| 4200 |
+
"grad_norm": 1.236327886581421,
|
| 4201 |
+
"learning_rate": 2.61638294948067e-05,
|
| 4202 |
+
"loss": 0.3114,
|
| 4203 |
+
"step": 29950
|
| 4204 |
+
},
|
| 4205 |
+
{
|
| 4206 |
+
"epoch": 0.5301196303299112,
|
| 4207 |
+
"grad_norm": 1.5327879190444946,
|
| 4208 |
+
"learning_rate": 2.6114743476468162e-05,
|
| 4209 |
+
"loss": 0.2383,
|
| 4210 |
+
"step": 30000
|
| 4211 |
}
|
| 4212 |
],
|
| 4213 |
"logging_steps": 50,
|