{ "best_metric": null, "best_model_checkpoint": null, "epoch": 25.12562814070352, "global_step": 2500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.99, "eval_loss": 2.7764203548431396, "eval_runtime": 34.2112, "eval_samples_per_second": 24.612, "eval_steps_per_second": 3.098, "eval_wer": 1.0, "step": 99 }, { "epoch": 2.0, "eval_loss": 2.762573003768921, "eval_runtime": 33.9987, "eval_samples_per_second": 24.766, "eval_steps_per_second": 3.118, "eval_wer": 1.0, "step": 199 }, { "epoch": 2.99, "eval_loss": 1.5485457181930542, "eval_runtime": 34.1904, "eval_samples_per_second": 24.627, "eval_steps_per_second": 3.1, "eval_wer": 0.9983126781870018, "step": 298 }, { "epoch": 4.0, "eval_loss": 0.4536263048648834, "eval_runtime": 34.3008, "eval_samples_per_second": 24.548, "eval_steps_per_second": 3.09, "eval_wer": 0.6440914644789667, "step": 398 }, { "epoch": 4.99, "eval_loss": 0.32973894476890564, "eval_runtime": 34.0188, "eval_samples_per_second": 24.751, "eval_steps_per_second": 3.116, "eval_wer": 0.5054983417699423, "step": 497 }, { "epoch": 5.03, "learning_rate": 0.0002497979797979798, "loss": 2.1303, "step": 500 }, { "epoch": 6.0, "eval_loss": 0.27073708176612854, "eval_runtime": 33.9387, "eval_samples_per_second": 24.809, "eval_steps_per_second": 3.123, "eval_wer": 0.3777273520684238, "step": 597 }, { "epoch": 6.99, "eval_loss": 0.2596016526222229, "eval_runtime": 33.9444, "eval_samples_per_second": 24.805, "eval_steps_per_second": 3.123, "eval_wer": 0.3815092802699715, "step": 696 }, { "epoch": 8.0, "eval_loss": 0.25216805934906006, "eval_runtime": 33.8461, "eval_samples_per_second": 24.877, "eval_steps_per_second": 3.132, "eval_wer": 0.2978413917495782, "step": 796 }, { "epoch": 8.99, "eval_loss": 0.22613081336021423, "eval_runtime": 33.8906, "eval_samples_per_second": 24.845, "eval_steps_per_second": 3.128, "eval_wer": 0.30965264444056556, "step": 895 }, { "epoch": 10.0, "eval_loss": 0.23950138688087463, "eval_runtime": 33.9858, "eval_samples_per_second": 24.775, "eval_steps_per_second": 3.119, "eval_wer": 0.2646767905975447, "step": 995 }, { "epoch": 10.05, "learning_rate": 0.00019929292929292926, "loss": 0.2057, "step": 1000 }, { "epoch": 10.99, "eval_loss": 0.21791674196720123, "eval_runtime": 33.9224, "eval_samples_per_second": 24.821, "eval_steps_per_second": 3.125, "eval_wer": 0.2613603304823413, "step": 1094 }, { "epoch": 12.0, "eval_loss": 0.21110226213932037, "eval_runtime": 33.8358, "eval_samples_per_second": 24.885, "eval_steps_per_second": 3.133, "eval_wer": 0.25903299005061964, "step": 1194 }, { "epoch": 12.99, "eval_loss": 0.22310343384742737, "eval_runtime": 33.7767, "eval_samples_per_second": 24.928, "eval_steps_per_second": 3.138, "eval_wer": 0.25368010705765986, "step": 1293 }, { "epoch": 14.0, "eval_loss": 0.2454575151205063, "eval_runtime": 33.8201, "eval_samples_per_second": 24.896, "eval_steps_per_second": 3.134, "eval_wer": 0.2483854075754931, "step": 1393 }, { "epoch": 14.99, "eval_loss": 0.24834834039211273, "eval_runtime": 33.7913, "eval_samples_per_second": 24.918, "eval_steps_per_second": 3.137, "eval_wer": 0.23663233839529876, "step": 1492 }, { "epoch": 15.08, "learning_rate": 0.00014878787878787875, "loss": 0.0945, "step": 1500 }, { "epoch": 16.0, "eval_loss": 0.259757936000824, "eval_runtime": 33.8499, "eval_samples_per_second": 24.875, "eval_steps_per_second": 3.131, "eval_wer": 0.22348286495607145, "step": 1592 }, { "epoch": 16.99, "eval_loss": 0.26361608505249023, "eval_runtime": 33.9334, "eval_samples_per_second": 24.813, "eval_steps_per_second": 3.124, "eval_wer": 0.21935183568976552, "step": 1691 }, { "epoch": 18.0, "eval_loss": 0.2598336637020111, "eval_runtime": 33.8712, "eval_samples_per_second": 24.859, "eval_steps_per_second": 3.13, "eval_wer": 0.21964275324373073, "step": 1791 }, { "epoch": 18.99, "eval_loss": 0.24791987240314484, "eval_runtime": 33.8138, "eval_samples_per_second": 24.901, "eval_steps_per_second": 3.135, "eval_wer": 0.20882062023622505, "step": 1890 }, { "epoch": 20.0, "eval_loss": 0.24469724297523499, "eval_runtime": 33.9448, "eval_samples_per_second": 24.805, "eval_steps_per_second": 3.123, "eval_wer": 0.2091697213009833, "step": 1990 }, { "epoch": 20.1, "learning_rate": 9.828282828282828e-05, "loss": 0.0567, "step": 2000 }, { "epoch": 20.99, "eval_loss": 0.25630325078964233, "eval_runtime": 33.677, "eval_samples_per_second": 25.002, "eval_steps_per_second": 3.148, "eval_wer": 0.20463140745912609, "step": 2089 }, { "epoch": 22.0, "eval_loss": 0.2675672173500061, "eval_runtime": 33.7312, "eval_samples_per_second": 24.962, "eval_steps_per_second": 3.142, "eval_wer": 0.198871239890615, "step": 2189 }, { "epoch": 22.99, "eval_loss": 0.25741901993751526, "eval_runtime": 33.6669, "eval_samples_per_second": 25.01, "eval_steps_per_second": 3.148, "eval_wer": 0.19951125850933846, "step": 2288 }, { "epoch": 24.0, "eval_loss": 0.2615770101547241, "eval_runtime": 33.8091, "eval_samples_per_second": 24.905, "eval_steps_per_second": 3.135, "eval_wer": 0.1961947983941351, "step": 2388 }, { "epoch": 24.99, "eval_loss": 0.257935494184494, "eval_runtime": 33.8705, "eval_samples_per_second": 24.859, "eval_steps_per_second": 3.13, "eval_wer": 0.1956129632862047, "step": 2487 }, { "epoch": 25.13, "learning_rate": 4.777777777777778e-05, "loss": 0.0418, "step": 2500 } ], "max_steps": 2970, "num_train_epochs": 30, "total_flos": 6.454758338809764e+19, "trial_name": null, "trial_params": null }