Training in progress, step 1800
Browse files- last-checkpoint/model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +3 -36
- last-checkpoint/training_args.bin +1 -1
- model.safetensors +1 -1
- runs/Dec04_19-45-12_1328ad249ece/events.out.tfevents.1701719133.1328ad249ece.5627.0 +3 -0
- training_args.bin +1 -1
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 966995080
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2ea132becf87dc52197cf8a159e74b0528f1247ff978154da29acbbc2518801
|
| 3 |
size 966995080
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1925064044
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6fc2acc2a6470bfc38326462621d18c5f641b87e8c17fb748004af842c9e4d6c
|
| 3 |
size 1925064044
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:153f4050e22e2494e5c9cdfc54488cbdedf363e2e2f8bc78cef38c7af2fa76ee
|
| 3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3466ad5bf04d87f27e472dda1dbd8f7524011eeb345f9a73787480c172c7321
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": 70.1955074875208,
|
| 3 |
"best_model_checkpoint": "./whisper-it/checkpoint-300",
|
| 4 |
-
"epoch": 3.
|
| 5 |
"eval_steps": 100,
|
| 6 |
-
"global_step":
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
@@ -535,39 +535,6 @@
|
|
| 535 |
"eval_steps_per_second": 0.11,
|
| 536 |
"eval_wer": 166.51414309484193,
|
| 537 |
"step": 1600
|
| 538 |
-
},
|
| 539 |
-
{
|
| 540 |
-
"epoch": 3.1,
|
| 541 |
-
"learning_rate": 6.8028571428571434e-06,
|
| 542 |
-
"loss": 0.0353,
|
| 543 |
-
"step": 1625
|
| 544 |
-
},
|
| 545 |
-
{
|
| 546 |
-
"epoch": 3.15,
|
| 547 |
-
"learning_rate": 6.7314285714285724e-06,
|
| 548 |
-
"loss": 0.0366,
|
| 549 |
-
"step": 1650
|
| 550 |
-
},
|
| 551 |
-
{
|
| 552 |
-
"epoch": 3.2,
|
| 553 |
-
"learning_rate": 6.660000000000001e-06,
|
| 554 |
-
"loss": 0.034,
|
| 555 |
-
"step": 1675
|
| 556 |
-
},
|
| 557 |
-
{
|
| 558 |
-
"epoch": 3.24,
|
| 559 |
-
"learning_rate": 6.588571428571429e-06,
|
| 560 |
-
"loss": 0.0324,
|
| 561 |
-
"step": 1700
|
| 562 |
-
},
|
| 563 |
-
{
|
| 564 |
-
"epoch": 3.24,
|
| 565 |
-
"eval_loss": 0.3962928354740143,
|
| 566 |
-
"eval_runtime": 1676.3692,
|
| 567 |
-
"eval_samples_per_second": 0.895,
|
| 568 |
-
"eval_steps_per_second": 0.112,
|
| 569 |
-
"eval_wer": 170.93039378813089,
|
| 570 |
-
"step": 1700
|
| 571 |
}
|
| 572 |
],
|
| 573 |
"logging_steps": 25,
|
|
@@ -575,7 +542,7 @@
|
|
| 575 |
"num_input_tokens_seen": 0,
|
| 576 |
"num_train_epochs": 8,
|
| 577 |
"save_steps": 100,
|
| 578 |
-
"total_flos": 1.
|
| 579 |
"trial_name": null,
|
| 580 |
"trial_params": null
|
| 581 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": 70.1955074875208,
|
| 3 |
"best_model_checkpoint": "./whisper-it/checkpoint-300",
|
| 4 |
+
"epoch": 3.053435114503817,
|
| 5 |
"eval_steps": 100,
|
| 6 |
+
"global_step": 1600,
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
|
|
| 535 |
"eval_steps_per_second": 0.11,
|
| 536 |
"eval_wer": 166.51414309484193,
|
| 537 |
"step": 1600
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 538 |
}
|
| 539 |
],
|
| 540 |
"logging_steps": 25,
|
|
|
|
| 542 |
"num_input_tokens_seen": 0,
|
| 543 |
"num_train_epochs": 8,
|
| 544 |
"save_steps": 100,
|
| 545 |
+
"total_flos": 1.476951220297728e+19,
|
| 546 |
"trial_name": null,
|
| 547 |
"trial_params": null
|
| 548 |
}
|
last-checkpoint/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4856
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:671df0b935ce81783da8e41ef1c633553d21543422fa2f0117e9c7591df7d4f5
|
| 3 |
size 4856
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 966995080
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:53b109faeebfa0c0ba61658697fa9237074126c445642641b79158eb7ba30739
|
| 3 |
size 966995080
|
runs/Dec04_19-45-12_1328ad249ece/events.out.tfevents.1701719133.1328ad249ece.5627.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e83979b98d97b44e6be12eee19eeb7a9394eb5fbee9f7de514b49294a44c70e5
|
| 3 |
+
size 7065
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4856
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56b1eae5bcb377ffc0d4c8ff2741201cd456f48425776cda068ae6f4f3917a46
|
| 3 |
size 4856
|