| { | |
| "best_global_step": 5000, | |
| "best_metric": 63.25362763131004, | |
| "best_model_checkpoint": "./whisper-tiny-ml-2/checkpoint-5000", | |
| "epoch": 14.0424, | |
| "eval_steps": 500, | |
| "global_step": 5000, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0316, | |
| "grad_norm": 16.492067337036133, | |
| "learning_rate": 3.7275e-05, | |
| "loss": 1.25, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 1.0316, | |
| "eval_loss": 0.5131270885467529, | |
| "eval_runtime": 464.8494, | |
| "eval_samples_per_second": 0.809, | |
| "eval_steps_per_second": 0.404, | |
| "eval_wer": 99.85693848354794, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 2.0632, | |
| "grad_norm": 6.0215654373168945, | |
| "learning_rate": 3.335833333333333e-05, | |
| "loss": 0.29, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 2.0632, | |
| "eval_loss": 0.184208482503891, | |
| "eval_runtime": 453.1356, | |
| "eval_samples_per_second": 0.83, | |
| "eval_steps_per_second": 0.415, | |
| "eval_wer": 75.1277334968322, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 4.0264, | |
| "grad_norm": 4.435523986816406, | |
| "learning_rate": 2.9191666666666667e-05, | |
| "loss": 0.1325, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 4.0264, | |
| "eval_loss": 0.18078354001045227, | |
| "eval_runtime": 469.9597, | |
| "eval_samples_per_second": 0.8, | |
| "eval_steps_per_second": 0.4, | |
| "eval_wer": 73.65624361332516, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 5.058, | |
| "grad_norm": 3.5488216876983643, | |
| "learning_rate": 2.5025e-05, | |
| "loss": 0.0741, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 5.058, | |
| "eval_loss": 0.19534532725811005, | |
| "eval_runtime": 452.9853, | |
| "eval_samples_per_second": 0.83, | |
| "eval_steps_per_second": 0.415, | |
| "eval_wer": 71.71469446147557, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 7.0212, | |
| "grad_norm": 2.182008743286133, | |
| "learning_rate": 2.085833333333333e-05, | |
| "loss": 0.0424, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 7.0212, | |
| "eval_loss": 0.2104445993900299, | |
| "eval_runtime": 452.8543, | |
| "eval_samples_per_second": 0.83, | |
| "eval_steps_per_second": 0.415, | |
| "eval_wer": 66.13529531984467, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 8.0528, | |
| "grad_norm": 1.6725220680236816, | |
| "learning_rate": 1.6691666666666665e-05, | |
| "loss": 0.0241, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 8.0528, | |
| "eval_loss": 0.2327151745557785, | |
| "eval_runtime": 461.1495, | |
| "eval_samples_per_second": 0.815, | |
| "eval_steps_per_second": 0.408, | |
| "eval_wer": 66.17617003883099, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 10.016, | |
| "grad_norm": 2.495150089263916, | |
| "learning_rate": 1.2525e-05, | |
| "loss": 0.0122, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 10.016, | |
| "eval_loss": 0.24628408253192902, | |
| "eval_runtime": 457.1775, | |
| "eval_samples_per_second": 0.822, | |
| "eval_steps_per_second": 0.411, | |
| "eval_wer": 66.46229307173513, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 11.0476, | |
| "grad_norm": 0.36194851994514465, | |
| "learning_rate": 8.358333333333333e-06, | |
| "loss": 0.0054, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 11.0476, | |
| "eval_loss": 0.2554023861885071, | |
| "eval_runtime": 457.1667, | |
| "eval_samples_per_second": 0.822, | |
| "eval_steps_per_second": 0.411, | |
| "eval_wer": 64.41855712241978, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 13.0108, | |
| "grad_norm": 0.10494792461395264, | |
| "learning_rate": 4.191666666666667e-06, | |
| "loss": 0.002, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 13.0108, | |
| "eval_loss": 0.2660194933414459, | |
| "eval_runtime": 457.2487, | |
| "eval_samples_per_second": 0.822, | |
| "eval_steps_per_second": 0.411, | |
| "eval_wer": 64.05068465154302, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 14.0424, | |
| "grad_norm": 0.12081502377986908, | |
| "learning_rate": 2.4999999999999996e-08, | |
| "loss": 0.0007, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 14.0424, | |
| "eval_loss": 0.2695574164390564, | |
| "eval_runtime": 455.3759, | |
| "eval_samples_per_second": 0.826, | |
| "eval_steps_per_second": 0.413, | |
| "eval_wer": 63.25362763131004, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 14.0424, | |
| "step": 5000, | |
| "total_flos": 9.8544473358336e+17, | |
| "train_loss": 0.18335246599316596, | |
| "train_runtime": 6674.7567, | |
| "train_samples_per_second": 5.993, | |
| "train_steps_per_second": 0.749 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 5000, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 9223372036854775807, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": true | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 9.8544473358336e+17, | |
| "train_batch_size": 2, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |