| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 24.0, | |
| "global_step": 1500, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.99, | |
| "eval_loss": 2.6419124603271484, | |
| "eval_runtime": 3.6969, | |
| "eval_samples_per_second": 185.289, | |
| "eval_steps_per_second": 23.263, | |
| "eval_wer": 1.0, | |
| "step": 62 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_loss": 2.58249568939209, | |
| "eval_runtime": 3.6751, | |
| "eval_samples_per_second": 186.389, | |
| "eval_steps_per_second": 23.401, | |
| "eval_wer": 1.0, | |
| "step": 125 | |
| }, | |
| { | |
| "epoch": 2.99, | |
| "eval_loss": 2.574338436126709, | |
| "eval_runtime": 3.7046, | |
| "eval_samples_per_second": 184.905, | |
| "eval_steps_per_second": 23.214, | |
| "eval_wer": 1.0, | |
| "step": 187 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_loss": 2.5320825576782227, | |
| "eval_runtime": 3.7133, | |
| "eval_samples_per_second": 184.472, | |
| "eval_steps_per_second": 23.16, | |
| "eval_wer": 0.9994711792702274, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 4.99, | |
| "eval_loss": 2.2844398021698, | |
| "eval_runtime": 3.7345, | |
| "eval_samples_per_second": 183.424, | |
| "eval_steps_per_second": 23.028, | |
| "eval_wer": 1.0, | |
| "step": 312 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_loss": 1.7816661596298218, | |
| "eval_runtime": 3.7402, | |
| "eval_samples_per_second": 183.147, | |
| "eval_steps_per_second": 22.994, | |
| "eval_wer": 0.9640401903754627, | |
| "step": 375 | |
| }, | |
| { | |
| "epoch": 6.99, | |
| "eval_loss": 1.4727487564086914, | |
| "eval_runtime": 3.7405, | |
| "eval_samples_per_second": 183.132, | |
| "eval_steps_per_second": 22.992, | |
| "eval_wer": 0.9299312533051296, | |
| "step": 437 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "learning_rate": 0.0002193548387096774, | |
| "loss": 2.3698, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_loss": 1.7388513088226318, | |
| "eval_runtime": 3.735, | |
| "eval_samples_per_second": 183.399, | |
| "eval_steps_per_second": 23.025, | |
| "eval_wer": 0.9227921734531994, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 8.99, | |
| "eval_loss": 1.5088895559310913, | |
| "eval_runtime": 3.7383, | |
| "eval_samples_per_second": 183.241, | |
| "eval_steps_per_second": 23.005, | |
| "eval_wer": 0.9021681649920676, | |
| "step": 562 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_loss": 1.6695538759231567, | |
| "eval_runtime": 3.7391, | |
| "eval_samples_per_second": 183.201, | |
| "eval_steps_per_second": 23.0, | |
| "eval_wer": 0.8802221047065045, | |
| "step": 625 | |
| }, | |
| { | |
| "epoch": 10.99, | |
| "eval_loss": 1.8177894353866577, | |
| "eval_runtime": 3.7376, | |
| "eval_samples_per_second": 183.272, | |
| "eval_steps_per_second": 23.009, | |
| "eval_wer": 0.9471179270227393, | |
| "step": 687 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_loss": 1.5107115507125854, | |
| "eval_runtime": 3.7409, | |
| "eval_samples_per_second": 183.109, | |
| "eval_steps_per_second": 22.989, | |
| "eval_wer": 0.8791644632469593, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 12.99, | |
| "eval_loss": 1.704025149345398, | |
| "eval_runtime": 3.7269, | |
| "eval_samples_per_second": 183.796, | |
| "eval_steps_per_second": 23.075, | |
| "eval_wer": 0.8799576943416182, | |
| "step": 812 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_loss": 1.6209287643432617, | |
| "eval_runtime": 3.73, | |
| "eval_samples_per_second": 183.648, | |
| "eval_steps_per_second": 23.057, | |
| "eval_wer": 0.8860391327340031, | |
| "step": 875 | |
| }, | |
| { | |
| "epoch": 14.99, | |
| "eval_loss": 1.7103419303894043, | |
| "eval_runtime": 3.8137, | |
| "eval_samples_per_second": 179.615, | |
| "eval_steps_per_second": 22.55, | |
| "eval_wer": 0.920676890534109, | |
| "step": 937 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "learning_rate": 0.0001387096774193548, | |
| "loss": 0.7913, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_loss": 1.8196772336959839, | |
| "eval_runtime": 3.7484, | |
| "eval_samples_per_second": 182.743, | |
| "eval_steps_per_second": 22.943, | |
| "eval_wer": 0.891062929666843, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 16.99, | |
| "eval_loss": 1.871021032333374, | |
| "eval_runtime": 3.739, | |
| "eval_samples_per_second": 183.206, | |
| "eval_steps_per_second": 23.001, | |
| "eval_wer": 0.9138022210470651, | |
| "step": 1062 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_loss": 2.0114657878875732, | |
| "eval_runtime": 3.7597, | |
| "eval_samples_per_second": 182.194, | |
| "eval_steps_per_second": 22.874, | |
| "eval_wer": 0.9138022210470651, | |
| "step": 1125 | |
| }, | |
| { | |
| "epoch": 18.99, | |
| "eval_loss": 2.164022922515869, | |
| "eval_runtime": 3.7353, | |
| "eval_samples_per_second": 183.384, | |
| "eval_steps_per_second": 23.023, | |
| "eval_wer": 0.9180327868852459, | |
| "step": 1187 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_loss": 2.1961405277252197, | |
| "eval_runtime": 3.7569, | |
| "eval_samples_per_second": 182.332, | |
| "eval_steps_per_second": 22.891, | |
| "eval_wer": 0.9214701216287678, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 20.99, | |
| "eval_loss": 2.2560768127441406, | |
| "eval_runtime": 3.7531, | |
| "eval_samples_per_second": 182.517, | |
| "eval_steps_per_second": 22.915, | |
| "eval_wer": 0.905076679005817, | |
| "step": 1312 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "eval_loss": 2.2624008655548096, | |
| "eval_runtime": 3.7599, | |
| "eval_samples_per_second": 182.187, | |
| "eval_steps_per_second": 22.873, | |
| "eval_wer": 0.905076679005817, | |
| "step": 1375 | |
| }, | |
| { | |
| "epoch": 22.99, | |
| "eval_loss": 2.3477489948272705, | |
| "eval_runtime": 3.7551, | |
| "eval_samples_per_second": 182.418, | |
| "eval_steps_per_second": 22.902, | |
| "eval_wer": 0.9026969857218403, | |
| "step": 1437 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "learning_rate": 5.806451612903225e-05, | |
| "loss": 0.284, | |
| "step": 1500 | |
| } | |
| ], | |
| "max_steps": 1860, | |
| "num_train_epochs": 30, | |
| "total_flos": 6.874539672176118e+18, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |