"auto-commit"
Browse files- model-bin/finetune/base/{checkpoint-88857 β checkpoint-92342}/config.json +0 -0
- model-bin/finetune/base/{checkpoint-88857 β checkpoint-92342}/optimizer.pt +1 -1
- model-bin/finetune/base/{checkpoint-88857 β checkpoint-92342}/preprocessor_config.json +0 -0
- model-bin/finetune/base/{checkpoint-92092 β checkpoint-92342}/pytorch_model.bin +1 -1
- model-bin/finetune/base/{checkpoint-92092 β checkpoint-92342}/rng_state.pth +1 -1
- model-bin/finetune/base/{checkpoint-92092 β checkpoint-92342}/scaler.pt +1 -1
- model-bin/finetune/base/{checkpoint-88857 β checkpoint-92342}/scheduler.pt +1 -1
- model-bin/finetune/base/{checkpoint-92092 β checkpoint-92342}/trainer_state.json +323 -5
- model-bin/finetune/base/{checkpoint-88857 β checkpoint-92342}/training_args.bin +0 -0
- model-bin/finetune/base/{checkpoint-92092 β checkpoint-92716}/config.json +0 -0
- model-bin/finetune/base/{checkpoint-92092 β checkpoint-92716}/optimizer.pt +1 -1
- model-bin/finetune/base/{checkpoint-92092 β checkpoint-92716}/preprocessor_config.json +0 -0
- model-bin/finetune/base/{checkpoint-88857 β checkpoint-92716}/pytorch_model.bin +1 -1
- model-bin/finetune/base/{checkpoint-88857 β checkpoint-92716}/rng_state.pth +1 -1
- model-bin/finetune/base/{checkpoint-88857 β checkpoint-92716}/scaler.pt +1 -1
- model-bin/finetune/base/{checkpoint-92092 β checkpoint-92716}/scheduler.pt +1 -1
- model-bin/finetune/base/{checkpoint-88857 β checkpoint-92716}/trainer_state.json +0 -0
- model-bin/finetune/base/{checkpoint-92092 β checkpoint-92716}/training_args.bin +0 -0
- model-bin/finetune/base/log/1629953182.9450378/events.out.tfevents.1629953182.8e89bd551565.924.61 +3 -0
- model-bin/finetune/base/log/1629953612.4487836/events.out.tfevents.1629953612.8e89bd551565.924.63 +3 -0
- model-bin/finetune/base/log/1629954051.5022223/events.out.tfevents.1629954051.8e89bd551565.924.65 +3 -0
- model-bin/finetune/base/log/1629954491.5162795/events.out.tfevents.1629954491.8e89bd551565.924.67 +3 -0
- model-bin/finetune/base/log/1629954926.9743078/events.out.tfevents.1629954926.8e89bd551565.924.69 +3 -0
- model-bin/finetune/base/log/events.out.tfevents.1629953182.8e89bd551565.924.60 +3 -0
- model-bin/finetune/base/log/events.out.tfevents.1629953611.8e89bd551565.924.62 +3 -0
- model-bin/finetune/base/log/events.out.tfevents.1629954051.8e89bd551565.924.64 +3 -0
- model-bin/finetune/base/log/events.out.tfevents.1629954491.8e89bd551565.924.66 +3 -0
- model-bin/finetune/base/log/events.out.tfevents.1629954926.8e89bd551565.924.68 +3 -0
model-bin/finetune/base/{checkpoint-88857 β checkpoint-92342}/config.json
RENAMED
|
File without changes
|
model-bin/finetune/base/{checkpoint-88857 β checkpoint-92342}/optimizer.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 722165393
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:460104b948102228d8f4e44ca5432f12ce434c92aefcae8151f6b0f67025b393
|
| 3 |
size 722165393
|
model-bin/finetune/base/{checkpoint-88857 β checkpoint-92342}/preprocessor_config.json
RENAMED
|
File without changes
|
model-bin/finetune/base/{checkpoint-92092 β checkpoint-92342}/pytorch_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 377909911
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20a10c1e3eaed90b158c748dacb3658dddf5d6b2d6783ea01e464fad88e3e2ef
|
| 3 |
size 377909911
|
model-bin/finetune/base/{checkpoint-92092 β checkpoint-92342}/rng_state.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76e556530c6adc43805be97155f9e3f38e205e502190f575068d2af435e78eb9
|
| 3 |
size 14503
|
model-bin/finetune/base/{checkpoint-92092 β checkpoint-92342}/scaler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 559
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:402fb8096e67cd128a68844dd405d89a5f73be58935a2a425532e62a90e6c743
|
| 3 |
size 559
|
model-bin/finetune/base/{checkpoint-88857 β checkpoint-92342}/scheduler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 623
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d1d6ed993918c34b8e318045ece9a61bad704f813c84d295cde72741ddbfdfe
|
| 3 |
size 623
|
model-bin/finetune/base/{checkpoint-92092 β checkpoint-92342}/trainer_state.json
RENAMED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
-
"best_metric": 0.
|
| 3 |
-
"best_model_checkpoint": "./model-bin/finetune/base/checkpoint-
|
| 4 |
-
"epoch":
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -216534,11 +216534,329 @@
|
|
| 216534 |
"eval_steps_per_second": 0.718,
|
| 216535 |
"eval_wer": 0.1839959593044231,
|
| 216536 |
"step": 92092
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 216537 |
}
|
| 216538 |
],
|
| 216539 |
"max_steps": 625000,
|
| 216540 |
"num_train_epochs": 5000,
|
| 216541 |
-
"total_flos": 2.
|
| 216542 |
"trial_name": null,
|
| 216543 |
"trial_params": null
|
| 216544 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"best_metric": 0.17637692697401752,
|
| 3 |
+
"best_model_checkpoint": "./model-bin/finetune/base/checkpoint-92342",
|
| 4 |
+
"epoch": 737.9960159362549,
|
| 5 |
+
"global_step": 92342,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 216534 |
"eval_steps_per_second": 0.718,
|
| 216535 |
"eval_wer": 0.1839959593044231,
|
| 216536 |
"step": 92092
|
| 216537 |
+
},
|
| 216538 |
+
{
|
| 216539 |
+
"epoch": 736.02,
|
| 216540 |
+
"learning_rate": 8.540721153846154e-06,
|
| 216541 |
+
"loss": 0.3209,
|
| 216542 |
+
"step": 92095
|
| 216543 |
+
},
|
| 216544 |
+
{
|
| 216545 |
+
"epoch": 736.06,
|
| 216546 |
+
"learning_rate": 8.540641025641027e-06,
|
| 216547 |
+
"loss": 0.31,
|
| 216548 |
+
"step": 92100
|
| 216549 |
+
},
|
| 216550 |
+
{
|
| 216551 |
+
"epoch": 736.1,
|
| 216552 |
+
"learning_rate": 8.540560897435898e-06,
|
| 216553 |
+
"loss": 0.319,
|
| 216554 |
+
"step": 92105
|
| 216555 |
+
},
|
| 216556 |
+
{
|
| 216557 |
+
"epoch": 736.14,
|
| 216558 |
+
"learning_rate": 8.54048076923077e-06,
|
| 216559 |
+
"loss": 0.3606,
|
| 216560 |
+
"step": 92110
|
| 216561 |
+
},
|
| 216562 |
+
{
|
| 216563 |
+
"epoch": 736.18,
|
| 216564 |
+
"learning_rate": 8.540400641025641e-06,
|
| 216565 |
+
"loss": 0.7215,
|
| 216566 |
+
"step": 92115
|
| 216567 |
+
},
|
| 216568 |
+
{
|
| 216569 |
+
"epoch": 736.22,
|
| 216570 |
+
"learning_rate": 8.540336538461538e-06,
|
| 216571 |
+
"loss": 1.2349,
|
| 216572 |
+
"step": 92120
|
| 216573 |
+
},
|
| 216574 |
+
{
|
| 216575 |
+
"epoch": 736.26,
|
| 216576 |
+
"learning_rate": 8.540256410256412e-06,
|
| 216577 |
+
"loss": 0.2743,
|
| 216578 |
+
"step": 92125
|
| 216579 |
+
},
|
| 216580 |
+
{
|
| 216581 |
+
"epoch": 736.3,
|
| 216582 |
+
"learning_rate": 8.540176282051283e-06,
|
| 216583 |
+
"loss": 0.2852,
|
| 216584 |
+
"step": 92130
|
| 216585 |
+
},
|
| 216586 |
+
{
|
| 216587 |
+
"epoch": 736.34,
|
| 216588 |
+
"learning_rate": 8.540096153846154e-06,
|
| 216589 |
+
"loss": 0.3859,
|
| 216590 |
+
"step": 92135
|
| 216591 |
+
},
|
| 216592 |
+
{
|
| 216593 |
+
"epoch": 736.38,
|
| 216594 |
+
"learning_rate": 8.540016025641026e-06,
|
| 216595 |
+
"loss": 0.6902,
|
| 216596 |
+
"step": 92140
|
| 216597 |
+
},
|
| 216598 |
+
{
|
| 216599 |
+
"epoch": 736.42,
|
| 216600 |
+
"learning_rate": 8.539935897435899e-06,
|
| 216601 |
+
"loss": 0.9061,
|
| 216602 |
+
"step": 92145
|
| 216603 |
+
},
|
| 216604 |
+
{
|
| 216605 |
+
"epoch": 736.46,
|
| 216606 |
+
"learning_rate": 8.53985576923077e-06,
|
| 216607 |
+
"loss": 0.2886,
|
| 216608 |
+
"step": 92150
|
| 216609 |
+
},
|
| 216610 |
+
{
|
| 216611 |
+
"epoch": 736.5,
|
| 216612 |
+
"learning_rate": 8.539775641025641e-06,
|
| 216613 |
+
"loss": 0.2821,
|
| 216614 |
+
"step": 92155
|
| 216615 |
+
},
|
| 216616 |
+
{
|
| 216617 |
+
"epoch": 736.54,
|
| 216618 |
+
"learning_rate": 8.539695512820514e-06,
|
| 216619 |
+
"loss": 0.4494,
|
| 216620 |
+
"step": 92160
|
| 216621 |
+
},
|
| 216622 |
+
{
|
| 216623 |
+
"epoch": 736.58,
|
| 216624 |
+
"learning_rate": 8.539615384615386e-06,
|
| 216625 |
+
"loss": 0.8264,
|
| 216626 |
+
"step": 92165
|
| 216627 |
+
},
|
| 216628 |
+
{
|
| 216629 |
+
"epoch": 736.62,
|
| 216630 |
+
"learning_rate": 8.539535256410257e-06,
|
| 216631 |
+
"loss": 0.8041,
|
| 216632 |
+
"step": 92170
|
| 216633 |
+
},
|
| 216634 |
+
{
|
| 216635 |
+
"epoch": 736.66,
|
| 216636 |
+
"learning_rate": 8.539455128205129e-06,
|
| 216637 |
+
"loss": 0.4122,
|
| 216638 |
+
"step": 92175
|
| 216639 |
+
},
|
| 216640 |
+
{
|
| 216641 |
+
"epoch": 736.7,
|
| 216642 |
+
"learning_rate": 8.539375000000002e-06,
|
| 216643 |
+
"loss": 0.291,
|
| 216644 |
+
"step": 92180
|
| 216645 |
+
},
|
| 216646 |
+
{
|
| 216647 |
+
"epoch": 736.74,
|
| 216648 |
+
"learning_rate": 8.539294871794871e-06,
|
| 216649 |
+
"loss": 0.4323,
|
| 216650 |
+
"step": 92185
|
| 216651 |
+
},
|
| 216652 |
+
{
|
| 216653 |
+
"epoch": 736.78,
|
| 216654 |
+
"learning_rate": 8.539214743589744e-06,
|
| 216655 |
+
"loss": 0.9154,
|
| 216656 |
+
"step": 92190
|
| 216657 |
+
},
|
| 216658 |
+
{
|
| 216659 |
+
"epoch": 736.82,
|
| 216660 |
+
"learning_rate": 8.539134615384617e-06,
|
| 216661 |
+
"loss": 1.0553,
|
| 216662 |
+
"step": 92195
|
| 216663 |
+
},
|
| 216664 |
+
{
|
| 216665 |
+
"epoch": 736.86,
|
| 216666 |
+
"learning_rate": 8.539054487179487e-06,
|
| 216667 |
+
"loss": 0.2851,
|
| 216668 |
+
"step": 92200
|
| 216669 |
+
},
|
| 216670 |
+
{
|
| 216671 |
+
"epoch": 736.9,
|
| 216672 |
+
"learning_rate": 8.53897435897436e-06,
|
| 216673 |
+
"loss": 0.3103,
|
| 216674 |
+
"step": 92205
|
| 216675 |
+
},
|
| 216676 |
+
{
|
| 216677 |
+
"epoch": 736.94,
|
| 216678 |
+
"learning_rate": 8.538894230769231e-06,
|
| 216679 |
+
"loss": 0.3377,
|
| 216680 |
+
"step": 92210
|
| 216681 |
+
},
|
| 216682 |
+
{
|
| 216683 |
+
"epoch": 736.98,
|
| 216684 |
+
"learning_rate": 8.538814102564103e-06,
|
| 216685 |
+
"loss": 0.9135,
|
| 216686 |
+
"step": 92215
|
| 216687 |
+
},
|
| 216688 |
+
{
|
| 216689 |
+
"epoch": 737.0,
|
| 216690 |
+
"eval_loss": 0.457086443901062,
|
| 216691 |
+
"eval_runtime": 38.6091,
|
| 216692 |
+
"eval_samples_per_second": 21.705,
|
| 216693 |
+
"eval_steps_per_second": 0.699,
|
| 216694 |
+
"eval_wer": 0.1959658421672556,
|
| 216695 |
+
"step": 92217
|
| 216696 |
+
},
|
| 216697 |
+
{
|
| 216698 |
+
"epoch": 737.02,
|
| 216699 |
+
"learning_rate": 8.538733974358974e-06,
|
| 216700 |
+
"loss": 0.339,
|
| 216701 |
+
"step": 92220
|
| 216702 |
+
},
|
| 216703 |
+
{
|
| 216704 |
+
"epoch": 737.06,
|
| 216705 |
+
"learning_rate": 8.538653846153847e-06,
|
| 216706 |
+
"loss": 0.2819,
|
| 216707 |
+
"step": 92225
|
| 216708 |
+
},
|
| 216709 |
+
{
|
| 216710 |
+
"epoch": 737.1,
|
| 216711 |
+
"learning_rate": 8.538573717948719e-06,
|
| 216712 |
+
"loss": 0.2901,
|
| 216713 |
+
"step": 92230
|
| 216714 |
+
},
|
| 216715 |
+
{
|
| 216716 |
+
"epoch": 737.14,
|
| 216717 |
+
"learning_rate": 8.53849358974359e-06,
|
| 216718 |
+
"loss": 0.3861,
|
| 216719 |
+
"step": 92235
|
| 216720 |
+
},
|
| 216721 |
+
{
|
| 216722 |
+
"epoch": 737.18,
|
| 216723 |
+
"learning_rate": 8.538413461538461e-06,
|
| 216724 |
+
"loss": 0.8026,
|
| 216725 |
+
"step": 92240
|
| 216726 |
+
},
|
| 216727 |
+
{
|
| 216728 |
+
"epoch": 737.22,
|
| 216729 |
+
"learning_rate": 8.538333333333334e-06,
|
| 216730 |
+
"loss": 1.0275,
|
| 216731 |
+
"step": 92245
|
| 216732 |
+
},
|
| 216733 |
+
{
|
| 216734 |
+
"epoch": 737.26,
|
| 216735 |
+
"learning_rate": 8.538253205128206e-06,
|
| 216736 |
+
"loss": 0.2957,
|
| 216737 |
+
"step": 92250
|
| 216738 |
+
},
|
| 216739 |
+
{
|
| 216740 |
+
"epoch": 737.3,
|
| 216741 |
+
"learning_rate": 8.538173076923077e-06,
|
| 216742 |
+
"loss": 0.2704,
|
| 216743 |
+
"step": 92255
|
| 216744 |
+
},
|
| 216745 |
+
{
|
| 216746 |
+
"epoch": 737.34,
|
| 216747 |
+
"learning_rate": 8.53809294871795e-06,
|
| 216748 |
+
"loss": 0.403,
|
| 216749 |
+
"step": 92260
|
| 216750 |
+
},
|
| 216751 |
+
{
|
| 216752 |
+
"epoch": 737.38,
|
| 216753 |
+
"learning_rate": 8.538012820512821e-06,
|
| 216754 |
+
"loss": 0.7417,
|
| 216755 |
+
"step": 92265
|
| 216756 |
+
},
|
| 216757 |
+
{
|
| 216758 |
+
"epoch": 737.42,
|
| 216759 |
+
"learning_rate": 8.537932692307693e-06,
|
| 216760 |
+
"loss": 0.9031,
|
| 216761 |
+
"step": 92270
|
| 216762 |
+
},
|
| 216763 |
+
{
|
| 216764 |
+
"epoch": 737.46,
|
| 216765 |
+
"learning_rate": 8.537852564102564e-06,
|
| 216766 |
+
"loss": 0.264,
|
| 216767 |
+
"step": 92275
|
| 216768 |
+
},
|
| 216769 |
+
{
|
| 216770 |
+
"epoch": 737.5,
|
| 216771 |
+
"learning_rate": 8.537772435897437e-06,
|
| 216772 |
+
"loss": 0.3321,
|
| 216773 |
+
"step": 92280
|
| 216774 |
+
},
|
| 216775 |
+
{
|
| 216776 |
+
"epoch": 737.54,
|
| 216777 |
+
"learning_rate": 8.537692307692309e-06,
|
| 216778 |
+
"loss": 0.3582,
|
| 216779 |
+
"step": 92285
|
| 216780 |
+
},
|
| 216781 |
+
{
|
| 216782 |
+
"epoch": 737.58,
|
| 216783 |
+
"learning_rate": 8.53761217948718e-06,
|
| 216784 |
+
"loss": 0.7083,
|
| 216785 |
+
"step": 92290
|
| 216786 |
+
},
|
| 216787 |
+
{
|
| 216788 |
+
"epoch": 737.62,
|
| 216789 |
+
"learning_rate": 8.537532051282053e-06,
|
| 216790 |
+
"loss": 0.8834,
|
| 216791 |
+
"step": 92295
|
| 216792 |
+
},
|
| 216793 |
+
{
|
| 216794 |
+
"epoch": 737.66,
|
| 216795 |
+
"learning_rate": 8.537451923076924e-06,
|
| 216796 |
+
"loss": 0.3581,
|
| 216797 |
+
"step": 92300
|
| 216798 |
+
},
|
| 216799 |
+
{
|
| 216800 |
+
"epoch": 737.7,
|
| 216801 |
+
"learning_rate": 8.537371794871796e-06,
|
| 216802 |
+
"loss": 0.2924,
|
| 216803 |
+
"step": 92305
|
| 216804 |
+
},
|
| 216805 |
+
{
|
| 216806 |
+
"epoch": 737.74,
|
| 216807 |
+
"learning_rate": 8.537291666666667e-06,
|
| 216808 |
+
"loss": 0.3176,
|
| 216809 |
+
"step": 92310
|
| 216810 |
+
},
|
| 216811 |
+
{
|
| 216812 |
+
"epoch": 737.78,
|
| 216813 |
+
"learning_rate": 8.53721153846154e-06,
|
| 216814 |
+
"loss": 0.7043,
|
| 216815 |
+
"step": 92315
|
| 216816 |
+
},
|
| 216817 |
+
{
|
| 216818 |
+
"epoch": 737.82,
|
| 216819 |
+
"learning_rate": 8.537131410256411e-06,
|
| 216820 |
+
"loss": 0.9477,
|
| 216821 |
+
"step": 92320
|
| 216822 |
+
},
|
| 216823 |
+
{
|
| 216824 |
+
"epoch": 737.86,
|
| 216825 |
+
"learning_rate": 8.537051282051283e-06,
|
| 216826 |
+
"loss": 0.3398,
|
| 216827 |
+
"step": 92325
|
| 216828 |
+
},
|
| 216829 |
+
{
|
| 216830 |
+
"epoch": 737.9,
|
| 216831 |
+
"learning_rate": 8.536971153846154e-06,
|
| 216832 |
+
"loss": 0.2718,
|
| 216833 |
+
"step": 92330
|
| 216834 |
+
},
|
| 216835 |
+
{
|
| 216836 |
+
"epoch": 737.94,
|
| 216837 |
+
"learning_rate": 8.536891025641027e-06,
|
| 216838 |
+
"loss": 0.4498,
|
| 216839 |
+
"step": 92335
|
| 216840 |
+
},
|
| 216841 |
+
{
|
| 216842 |
+
"epoch": 737.98,
|
| 216843 |
+
"learning_rate": 8.536810897435897e-06,
|
| 216844 |
+
"loss": 0.7016,
|
| 216845 |
+
"step": 92340
|
| 216846 |
+
},
|
| 216847 |
+
{
|
| 216848 |
+
"epoch": 738.0,
|
| 216849 |
+
"eval_loss": 0.36441364884376526,
|
| 216850 |
+
"eval_runtime": 38.395,
|
| 216851 |
+
"eval_samples_per_second": 21.826,
|
| 216852 |
+
"eval_steps_per_second": 0.703,
|
| 216853 |
+
"eval_wer": 0.17637692697401752,
|
| 216854 |
+
"step": 92342
|
| 216855 |
}
|
| 216856 |
],
|
| 216857 |
"max_steps": 625000,
|
| 216858 |
"num_train_epochs": 5000,
|
| 216859 |
+
"total_flos": 2.5986190372093516e+20,
|
| 216860 |
"trial_name": null,
|
| 216861 |
"trial_params": null
|
| 216862 |
}
|
model-bin/finetune/base/{checkpoint-88857 β checkpoint-92342}/training_args.bin
RENAMED
|
File without changes
|
model-bin/finetune/base/{checkpoint-92092 β checkpoint-92716}/config.json
RENAMED
|
File without changes
|
model-bin/finetune/base/{checkpoint-92092 β checkpoint-92716}/optimizer.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 722165393
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b86d347e2ac850a06a739fb250cca46ccf7413c38a373a94aa8a9fe5480612c
|
| 3 |
size 722165393
|
model-bin/finetune/base/{checkpoint-92092 β checkpoint-92716}/preprocessor_config.json
RENAMED
|
File without changes
|
model-bin/finetune/base/{checkpoint-88857 β checkpoint-92716}/pytorch_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 377909911
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d4e00c3aca057fc06951c90e1ba26c2a0b3e92dc34823ed7e416768166200a8
|
| 3 |
size 377909911
|
model-bin/finetune/base/{checkpoint-88857 β checkpoint-92716}/rng_state.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14503
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b419e9f9ee202e4bd0541e9a9ca2050c78eed10785c5d57dbf485edd535e5845
|
| 3 |
size 14503
|
model-bin/finetune/base/{checkpoint-88857 β checkpoint-92716}/scaler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 559
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0f9e297a360c24f890998e23df50e902eeb8189c56a4a57dedacdb8e2c40578
|
| 3 |
size 559
|
model-bin/finetune/base/{checkpoint-92092 β checkpoint-92716}/scheduler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 623
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64acd86ad63a962b0845061b96348fbe0b268b9e0d38b9c0e468f17a33d8275b
|
| 3 |
size 623
|
model-bin/finetune/base/{checkpoint-88857 β checkpoint-92716}/trainer_state.json
RENAMED
|
The diff for this file is too large to render.
See raw diff
|
|
|
model-bin/finetune/base/{checkpoint-92092 β checkpoint-92716}/training_args.bin
RENAMED
|
File without changes
|
model-bin/finetune/base/log/1629953182.9450378/events.out.tfevents.1629953182.8e89bd551565.924.61
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3276415366a4ac47501efb15fe42aac2c3310d121703804984d9ebbfa2efe8e0
|
| 3 |
+
size 4194
|
model-bin/finetune/base/log/1629953612.4487836/events.out.tfevents.1629953612.8e89bd551565.924.63
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba36c58c7c072c47e7a927032bbcf095c95856bcb399ebb1beb74c7393a2a012
|
| 3 |
+
size 4194
|
model-bin/finetune/base/log/1629954051.5022223/events.out.tfevents.1629954051.8e89bd551565.924.65
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c2d41f47998c260381eacd035447b8e2171d91d18eed5eae8a9fe8fab96d8bf
|
| 3 |
+
size 4194
|
model-bin/finetune/base/log/1629954491.5162795/events.out.tfevents.1629954491.8e89bd551565.924.67
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a60d419ef9dab9ea82872042000ebc5f051b29473494e4b3a7b7571b30712d1
|
| 3 |
+
size 4194
|
model-bin/finetune/base/log/1629954926.9743078/events.out.tfevents.1629954926.8e89bd551565.924.69
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a299ae1902307d11ad027a37a0aa571bf2f099e35e98c81476629f47d9ec633
|
| 3 |
+
size 4194
|
model-bin/finetune/base/log/events.out.tfevents.1629953182.8e89bd551565.924.60
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:72ef2da38fa34b847ce53ae9b30ea841a76cf7479999716be6c380af4740fc60
|
| 3 |
+
size 8622
|
model-bin/finetune/base/log/events.out.tfevents.1629953611.8e89bd551565.924.62
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97e7aa845b37467c614a4079377aa9601c24aded3c9afbb8a12a8ace304464c1
|
| 3 |
+
size 8622
|
model-bin/finetune/base/log/events.out.tfevents.1629954051.8e89bd551565.924.64
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3d0839704f6d799bde22f49f819ad4457efde21373f921747241c9a001747e2d
|
| 3 |
+
size 8622
|
model-bin/finetune/base/log/events.out.tfevents.1629954491.8e89bd551565.924.66
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f76303b3db8bc0a3909b04e3ca0588f0c127ccc10519cf5e6633ff8998f176c3
|
| 3 |
+
size 8622
|
model-bin/finetune/base/log/events.out.tfevents.1629954926.8e89bd551565.924.68
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:637c7c70f9630615bf272f9deebd62e97984495343a440e46627969ab35c5451
|
| 3 |
+
size 8622
|