{ "best_metric": null, "best_model_checkpoint": null, "epoch": 24.0, "global_step": 1500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.99, "eval_loss": 2.6419124603271484, "eval_runtime": 3.6969, "eval_samples_per_second": 185.289, "eval_steps_per_second": 23.263, "eval_wer": 1.0, "step": 62 }, { "epoch": 2.0, "eval_loss": 2.58249568939209, "eval_runtime": 3.6751, "eval_samples_per_second": 186.389, "eval_steps_per_second": 23.401, "eval_wer": 1.0, "step": 125 }, { "epoch": 2.99, "eval_loss": 2.574338436126709, "eval_runtime": 3.7046, "eval_samples_per_second": 184.905, "eval_steps_per_second": 23.214, "eval_wer": 1.0, "step": 187 }, { "epoch": 4.0, "eval_loss": 2.5320825576782227, "eval_runtime": 3.7133, "eval_samples_per_second": 184.472, "eval_steps_per_second": 23.16, "eval_wer": 0.9994711792702274, "step": 250 }, { "epoch": 4.99, "eval_loss": 2.2844398021698, "eval_runtime": 3.7345, "eval_samples_per_second": 183.424, "eval_steps_per_second": 23.028, "eval_wer": 1.0, "step": 312 }, { "epoch": 6.0, "eval_loss": 1.7816661596298218, "eval_runtime": 3.7402, "eval_samples_per_second": 183.147, "eval_steps_per_second": 22.994, "eval_wer": 0.9640401903754627, "step": 375 }, { "epoch": 6.99, "eval_loss": 1.4727487564086914, "eval_runtime": 3.7405, "eval_samples_per_second": 183.132, "eval_steps_per_second": 22.992, "eval_wer": 0.9299312533051296, "step": 437 }, { "epoch": 8.0, "learning_rate": 0.0002193548387096774, "loss": 2.3698, "step": 500 }, { "epoch": 8.0, "eval_loss": 1.7388513088226318, "eval_runtime": 3.735, "eval_samples_per_second": 183.399, "eval_steps_per_second": 23.025, "eval_wer": 0.9227921734531994, "step": 500 }, { "epoch": 8.99, "eval_loss": 1.5088895559310913, "eval_runtime": 3.7383, "eval_samples_per_second": 183.241, "eval_steps_per_second": 23.005, "eval_wer": 0.9021681649920676, "step": 562 }, { "epoch": 10.0, "eval_loss": 1.6695538759231567, "eval_runtime": 3.7391, "eval_samples_per_second": 183.201, "eval_steps_per_second": 23.0, "eval_wer": 0.8802221047065045, "step": 625 }, { "epoch": 10.99, "eval_loss": 1.8177894353866577, "eval_runtime": 3.7376, "eval_samples_per_second": 183.272, "eval_steps_per_second": 23.009, "eval_wer": 0.9471179270227393, "step": 687 }, { "epoch": 12.0, "eval_loss": 1.5107115507125854, "eval_runtime": 3.7409, "eval_samples_per_second": 183.109, "eval_steps_per_second": 22.989, "eval_wer": 0.8791644632469593, "step": 750 }, { "epoch": 12.99, "eval_loss": 1.704025149345398, "eval_runtime": 3.7269, "eval_samples_per_second": 183.796, "eval_steps_per_second": 23.075, "eval_wer": 0.8799576943416182, "step": 812 }, { "epoch": 14.0, "eval_loss": 1.6209287643432617, "eval_runtime": 3.73, "eval_samples_per_second": 183.648, "eval_steps_per_second": 23.057, "eval_wer": 0.8860391327340031, "step": 875 }, { "epoch": 14.99, "eval_loss": 1.7103419303894043, "eval_runtime": 3.8137, "eval_samples_per_second": 179.615, "eval_steps_per_second": 22.55, "eval_wer": 0.920676890534109, "step": 937 }, { "epoch": 16.0, "learning_rate": 0.0001387096774193548, "loss": 0.7913, "step": 1000 }, { "epoch": 16.0, "eval_loss": 1.8196772336959839, "eval_runtime": 3.7484, "eval_samples_per_second": 182.743, "eval_steps_per_second": 22.943, "eval_wer": 0.891062929666843, "step": 1000 }, { "epoch": 16.99, "eval_loss": 1.871021032333374, "eval_runtime": 3.739, "eval_samples_per_second": 183.206, "eval_steps_per_second": 23.001, "eval_wer": 0.9138022210470651, "step": 1062 }, { "epoch": 18.0, "eval_loss": 2.0114657878875732, "eval_runtime": 3.7597, "eval_samples_per_second": 182.194, "eval_steps_per_second": 22.874, "eval_wer": 0.9138022210470651, "step": 1125 }, { "epoch": 18.99, "eval_loss": 2.164022922515869, "eval_runtime": 3.7353, "eval_samples_per_second": 183.384, "eval_steps_per_second": 23.023, "eval_wer": 0.9180327868852459, "step": 1187 }, { "epoch": 20.0, "eval_loss": 2.1961405277252197, "eval_runtime": 3.7569, "eval_samples_per_second": 182.332, "eval_steps_per_second": 22.891, "eval_wer": 0.9214701216287678, "step": 1250 }, { "epoch": 20.99, "eval_loss": 2.2560768127441406, "eval_runtime": 3.7531, "eval_samples_per_second": 182.517, "eval_steps_per_second": 22.915, "eval_wer": 0.905076679005817, "step": 1312 }, { "epoch": 22.0, "eval_loss": 2.2624008655548096, "eval_runtime": 3.7599, "eval_samples_per_second": 182.187, "eval_steps_per_second": 22.873, "eval_wer": 0.905076679005817, "step": 1375 }, { "epoch": 22.99, "eval_loss": 2.3477489948272705, "eval_runtime": 3.7551, "eval_samples_per_second": 182.418, "eval_steps_per_second": 22.902, "eval_wer": 0.9026969857218403, "step": 1437 }, { "epoch": 24.0, "learning_rate": 5.806451612903225e-05, "loss": 0.284, "step": 1500 } ], "max_steps": 1860, "num_train_epochs": 30, "total_flos": 6.874539672176118e+18, "trial_name": null, "trial_params": null }