| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 2.9242372300308537, | |
| "global_step": 4264, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.22, | |
| "learning_rate": 6.115909912286932e-07, | |
| "loss": 1.0478, | |
| "step": 328 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "eval_loss": 0.20066721737384796, | |
| "eval_runtime": 421.2422, | |
| "eval_samples_per_second": 7.122, | |
| "eval_steps_per_second": 0.89, | |
| "eval_wer": 0.2669276913682244, | |
| "step": 328 | |
| }, | |
| { | |
| "epoch": 0.45, | |
| "learning_rate": 9.100780032860387e-07, | |
| "loss": 1.0471, | |
| "step": 656 | |
| }, | |
| { | |
| "epoch": 0.45, | |
| "eval_loss": 0.2007066309452057, | |
| "eval_runtime": 420.7757, | |
| "eval_samples_per_second": 7.13, | |
| "eval_steps_per_second": 0.891, | |
| "eval_wer": 0.26699953302920365, | |
| "step": 656 | |
| }, | |
| { | |
| "epoch": 0.67, | |
| "learning_rate": 8.2992075702454e-07, | |
| "loss": 1.031, | |
| "step": 984 | |
| }, | |
| { | |
| "epoch": 0.67, | |
| "eval_loss": 0.20067130029201508, | |
| "eval_runtime": 419.7329, | |
| "eval_samples_per_second": 7.147, | |
| "eval_steps_per_second": 0.893, | |
| "eval_wer": 0.266245195588922, | |
| "step": 984 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "learning_rate": 7.497635107630415e-07, | |
| "loss": 1.044, | |
| "step": 1312 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "eval_loss": 0.20047353208065033, | |
| "eval_runtime": 419.6669, | |
| "eval_samples_per_second": 7.149, | |
| "eval_steps_per_second": 0.894, | |
| "eval_wer": 0.265885987284026, | |
| "step": 1312 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "learning_rate": 6.698506463499012e-07, | |
| "loss": 1.0448, | |
| "step": 1640 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "eval_loss": 0.2001875340938568, | |
| "eval_runtime": 423.812, | |
| "eval_samples_per_second": 7.079, | |
| "eval_steps_per_second": 0.885, | |
| "eval_wer": 0.2658141456230468, | |
| "step": 1640 | |
| }, | |
| { | |
| "epoch": 1.35, | |
| "learning_rate": 5.896934000884026e-07, | |
| "loss": 1.0489, | |
| "step": 1968 | |
| }, | |
| { | |
| "epoch": 1.35, | |
| "eval_loss": 0.2000104784965515, | |
| "eval_runtime": 432.0862, | |
| "eval_samples_per_second": 6.943, | |
| "eval_steps_per_second": 0.868, | |
| "eval_wer": 0.2658500664535364, | |
| "step": 1968 | |
| }, | |
| { | |
| "epoch": 1.57, | |
| "learning_rate": 5.09536153826904e-07, | |
| "loss": 1.0277, | |
| "step": 2296 | |
| }, | |
| { | |
| "epoch": 1.57, | |
| "eval_loss": 0.200164794921875, | |
| "eval_runtime": 428.8208, | |
| "eval_samples_per_second": 6.996, | |
| "eval_steps_per_second": 0.874, | |
| "eval_wer": 0.26552677897913, | |
| "step": 2296 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "learning_rate": 4.2937890756540545e-07, | |
| "loss": 1.0364, | |
| "step": 2624 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "eval_loss": 0.2002057284116745, | |
| "eval_runtime": 426.0723, | |
| "eval_samples_per_second": 7.041, | |
| "eval_steps_per_second": 0.88, | |
| "eval_wer": 0.2659578289450052, | |
| "step": 2624 | |
| }, | |
| { | |
| "epoch": 2.02, | |
| "learning_rate": 3.492216613039069e-07, | |
| "loss": 1.035, | |
| "step": 2952 | |
| }, | |
| { | |
| "epoch": 2.02, | |
| "eval_loss": 0.20034705102443695, | |
| "eval_runtime": 425.252, | |
| "eval_samples_per_second": 7.055, | |
| "eval_steps_per_second": 0.882, | |
| "eval_wer": 0.26635295808039083, | |
| "step": 2952 | |
| }, | |
| { | |
| "epoch": 2.25, | |
| "learning_rate": 2.690644150424083e-07, | |
| "loss": 1.0306, | |
| "step": 3280 | |
| }, | |
| { | |
| "epoch": 2.25, | |
| "eval_loss": 0.20014077425003052, | |
| "eval_runtime": 418.7166, | |
| "eval_samples_per_second": 7.165, | |
| "eval_steps_per_second": 0.896, | |
| "eval_wer": 0.2662092747584324, | |
| "step": 3280 | |
| }, | |
| { | |
| "epoch": 2.47, | |
| "learning_rate": 1.8890716878090973e-07, | |
| "loss": 1.0395, | |
| "step": 3608 | |
| }, | |
| { | |
| "epoch": 2.47, | |
| "eval_loss": 0.2000894397497177, | |
| "eval_runtime": 418.0797, | |
| "eval_samples_per_second": 7.176, | |
| "eval_steps_per_second": 0.897, | |
| "eval_wer": 0.2654908581486404, | |
| "step": 3608 | |
| }, | |
| { | |
| "epoch": 2.7, | |
| "learning_rate": 1.0874992251941118e-07, | |
| "loss": 1.0426, | |
| "step": 3936 | |
| }, | |
| { | |
| "epoch": 2.7, | |
| "eval_loss": 0.20004504919052124, | |
| "eval_runtime": 416.8848, | |
| "eval_samples_per_second": 7.196, | |
| "eval_steps_per_second": 0.9, | |
| "eval_wer": 0.2658141456230468, | |
| "step": 3936 | |
| }, | |
| { | |
| "epoch": 2.92, | |
| "learning_rate": 2.883705810627083e-08, | |
| "loss": 1.0431, | |
| "step": 4264 | |
| }, | |
| { | |
| "epoch": 2.92, | |
| "eval_loss": 0.20020076632499695, | |
| "eval_runtime": 419.7762, | |
| "eval_samples_per_second": 7.147, | |
| "eval_steps_per_second": 0.893, | |
| "eval_wer": 0.2656345414705988, | |
| "step": 4264 | |
| } | |
| ], | |
| "max_steps": 4374, | |
| "num_train_epochs": 3, | |
| "total_flos": 1.8745213924829307e+19, | |
| "trial_name": null, | |
| "trial_params": null | |
| } |