Training in progress, epoch 18
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +18 -3
- pytorch_model.bin +1 -1
- runs/Apr30_07-42-25_943994db1dae/events.out.tfevents.1682840548.943994db1dae.1004.2 +2 -2
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 875994245
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc75999f1d0b091bfa41f436063ea648c8e517d8f5a2a215556cf7ddf81f38b8
|
| 3 |
size 875994245
|
last-checkpoint/pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 438010997
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5a6721f39f29d90b1b921202ae0d43aeffbd63a6e49d9985bd9654450952a99
|
| 3 |
size 438010997
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14575
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a25fb43cfa33d769c422622e784efab40303fdcf63ac58682a09fe2fe56544db
|
| 3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 627
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22a47655b61fd105c4795e613c42d120578086bc058f22f5c8b742b10d62284e
|
| 3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": 0.508567750453949,
|
| 3 |
"best_model_checkpoint": "bert_final_model/checkpoint-430",
|
| 4 |
-
"epoch":
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -243,11 +243,26 @@
|
|
| 243 |
"eval_samples_per_second": 239.124,
|
| 244 |
"eval_steps_per_second": 3.789,
|
| 245 |
"step": 7310
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 246 |
}
|
| 247 |
],
|
| 248 |
"max_steps": 8600,
|
| 249 |
"num_train_epochs": 20,
|
| 250 |
-
"total_flos": 2.
|
| 251 |
"trial_name": null,
|
| 252 |
"trial_params": null
|
| 253 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": 0.508567750453949,
|
| 3 |
"best_model_checkpoint": "bert_final_model/checkpoint-430",
|
| 4 |
+
"epoch": 18.0,
|
| 5 |
+
"global_step": 7740,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 243 |
"eval_samples_per_second": 239.124,
|
| 244 |
"eval_steps_per_second": 3.789,
|
| 245 |
"step": 7310
|
| 246 |
+
},
|
| 247 |
+
{
|
| 248 |
+
"epoch": 17.44,
|
| 249 |
+
"learning_rate": 1.2790697674418605e-06,
|
| 250 |
+
"loss": 0.0421,
|
| 251 |
+
"step": 7500
|
| 252 |
+
},
|
| 253 |
+
{
|
| 254 |
+
"epoch": 18.0,
|
| 255 |
+
"eval_accuracy": 0.787209960384833,
|
| 256 |
+
"eval_loss": 1.2152066230773926,
|
| 257 |
+
"eval_runtime": 14.8521,
|
| 258 |
+
"eval_samples_per_second": 237.946,
|
| 259 |
+
"eval_steps_per_second": 3.771,
|
| 260 |
+
"step": 7740
|
| 261 |
}
|
| 262 |
],
|
| 263 |
"max_steps": 8600,
|
| 264 |
"num_train_epochs": 20,
|
| 265 |
+
"total_flos": 2.796216263381772e+16,
|
| 266 |
"trial_name": null,
|
| 267 |
"trial_params": null
|
| 268 |
}
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 438010997
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5a6721f39f29d90b1b921202ae0d43aeffbd63a6e49d9985bd9654450952a99
|
| 3 |
size 438010997
|
runs/Apr30_07-42-25_943994db1dae/events.out.tfevents.1682840548.943994db1dae.1004.2
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5aedacc08a356b09f03d2c8cea007707c9d120534279fddab8e01e5fd86d6aa
|
| 3 |
+
size 12362
|