| { |
| "best_metric": 0.2075, |
| "best_model_checkpoint": "/content/model_asr/checkpoint-1100", |
| "epoch": 80.0, |
| "global_step": 1200, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 3.33, |
| "learning_rate": 4.600000000000001e-05, |
| "loss": 8.6183, |
| "step": 50 |
| }, |
| { |
| "epoch": 3.33, |
| "eval_loss": 4.025334358215332, |
| "eval_runtime": 15.3335, |
| "eval_samples_per_second": 31.304, |
| "eval_steps_per_second": 3.913, |
| "eval_wer": 1.0, |
| "step": 50 |
| }, |
| { |
| "epoch": 6.67, |
| "learning_rate": 9.6e-05, |
| "loss": 3.2794, |
| "step": 100 |
| }, |
| { |
| "epoch": 6.67, |
| "eval_loss": 3.0245492458343506, |
| "eval_runtime": 15.5923, |
| "eval_samples_per_second": 30.784, |
| "eval_steps_per_second": 3.848, |
| "eval_wer": 1.0, |
| "step": 100 |
| }, |
| { |
| "epoch": 10.0, |
| "learning_rate": 9.956913093678348e-05, |
| "loss": 2.9692, |
| "step": 150 |
| }, |
| { |
| "epoch": 10.0, |
| "eval_loss": 2.8865509033203125, |
| "eval_runtime": 15.6178, |
| "eval_samples_per_second": 30.734, |
| "eval_steps_per_second": 3.842, |
| "eval_wer": 1.0, |
| "step": 150 |
| }, |
| { |
| "epoch": 13.33, |
| "learning_rate": 9.813243995692098e-05, |
| "loss": 2.8042, |
| "step": 200 |
| }, |
| { |
| "epoch": 13.33, |
| "eval_loss": 2.635584831237793, |
| "eval_runtime": 15.4284, |
| "eval_samples_per_second": 31.112, |
| "eval_steps_per_second": 3.889, |
| "eval_wer": 1.0, |
| "step": 200 |
| }, |
| { |
| "epoch": 16.67, |
| "learning_rate": 9.57159113020304e-05, |
| "loss": 2.5114, |
| "step": 250 |
| }, |
| { |
| "epoch": 16.67, |
| "eval_loss": 2.116630792617798, |
| "eval_runtime": 15.5962, |
| "eval_samples_per_second": 30.777, |
| "eval_steps_per_second": 3.847, |
| "eval_wer": 1.0, |
| "step": 250 |
| }, |
| { |
| "epoch": 20.0, |
| "learning_rate": 9.236873852683213e-05, |
| "loss": 1.7677, |
| "step": 300 |
| }, |
| { |
| "epoch": 20.0, |
| "eval_loss": 1.0035134553909302, |
| "eval_runtime": 15.4247, |
| "eval_samples_per_second": 31.119, |
| "eval_steps_per_second": 3.89, |
| "eval_wer": 0.89375, |
| "step": 300 |
| }, |
| { |
| "epoch": 23.33, |
| "learning_rate": 8.815906041658002e-05, |
| "loss": 0.8802, |
| "step": 350 |
| }, |
| { |
| "epoch": 23.33, |
| "eval_loss": 0.3643040060997009, |
| "eval_runtime": 15.6657, |
| "eval_samples_per_second": 30.64, |
| "eval_steps_per_second": 3.83, |
| "eval_wer": 0.5025, |
| "step": 350 |
| }, |
| { |
| "epoch": 26.67, |
| "learning_rate": 8.31725738778896e-05, |
| "loss": 0.4318, |
| "step": 400 |
| }, |
| { |
| "epoch": 26.67, |
| "eval_loss": 0.14456388354301453, |
| "eval_runtime": 15.4959, |
| "eval_samples_per_second": 30.976, |
| "eval_steps_per_second": 3.872, |
| "eval_wer": 0.3075, |
| "step": 400 |
| }, |
| { |
| "epoch": 30.0, |
| "learning_rate": 7.751078939684885e-05, |
| "loss": 0.2275, |
| "step": 450 |
| }, |
| { |
| "epoch": 30.0, |
| "eval_loss": 0.07944890111684799, |
| "eval_runtime": 16.2382, |
| "eval_samples_per_second": 29.56, |
| "eval_steps_per_second": 3.695, |
| "eval_wer": 0.25, |
| "step": 450 |
| }, |
| { |
| "epoch": 33.33, |
| "learning_rate": 7.128896457825364e-05, |
| "loss": 0.1407, |
| "step": 500 |
| }, |
| { |
| "epoch": 33.33, |
| "eval_loss": 0.05435527116060257, |
| "eval_runtime": 15.4181, |
| "eval_samples_per_second": 31.132, |
| "eval_steps_per_second": 3.892, |
| "eval_wer": 0.22125, |
| "step": 500 |
| }, |
| { |
| "epoch": 36.67, |
| "learning_rate": 6.463375783314937e-05, |
| "loss": 0.1191, |
| "step": 550 |
| }, |
| { |
| "epoch": 36.67, |
| "eval_loss": 0.046384669840335846, |
| "eval_runtime": 15.8291, |
| "eval_samples_per_second": 30.324, |
| "eval_steps_per_second": 3.79, |
| "eval_wer": 0.23375, |
| "step": 550 |
| }, |
| { |
| "epoch": 40.0, |
| "learning_rate": 5.768064997883498e-05, |
| "loss": 0.0825, |
| "step": 600 |
| }, |
| { |
| "epoch": 40.0, |
| "eval_loss": 0.03952096030116081, |
| "eval_runtime": 15.4288, |
| "eval_samples_per_second": 31.111, |
| "eval_steps_per_second": 3.889, |
| "eval_wer": 0.25625, |
| "step": 600 |
| }, |
| { |
| "epoch": 43.33, |
| "learning_rate": 5.057118624011702e-05, |
| "loss": 0.0699, |
| "step": 650 |
| }, |
| { |
| "epoch": 43.33, |
| "eval_loss": 0.03604818880558014, |
| "eval_runtime": 15.4828, |
| "eval_samples_per_second": 31.002, |
| "eval_steps_per_second": 3.875, |
| "eval_wer": 0.2125, |
| "step": 650 |
| }, |
| { |
| "epoch": 46.67, |
| "learning_rate": 4.345009479671536e-05, |
| "loss": 0.0592, |
| "step": 700 |
| }, |
| { |
| "epoch": 46.67, |
| "eval_loss": 0.02805432118475437, |
| "eval_runtime": 15.5578, |
| "eval_samples_per_second": 30.853, |
| "eval_steps_per_second": 3.857, |
| "eval_wer": 0.23875, |
| "step": 700 |
| }, |
| { |
| "epoch": 50.0, |
| "learning_rate": 3.646234053488574e-05, |
| "loss": 0.0546, |
| "step": 750 |
| }, |
| { |
| "epoch": 50.0, |
| "eval_loss": 0.023771686479449272, |
| "eval_runtime": 15.8929, |
| "eval_samples_per_second": 30.202, |
| "eval_steps_per_second": 3.775, |
| "eval_wer": 0.26375, |
| "step": 750 |
| }, |
| { |
| "epoch": 53.33, |
| "learning_rate": 2.9750173980379736e-05, |
| "loss": 0.0455, |
| "step": 800 |
| }, |
| { |
| "epoch": 53.33, |
| "eval_loss": 0.021949028596282005, |
| "eval_runtime": 15.824, |
| "eval_samples_per_second": 30.334, |
| "eval_steps_per_second": 3.792, |
| "eval_wer": 0.24125, |
| "step": 800 |
| }, |
| { |
| "epoch": 56.67, |
| "learning_rate": 2.3450235487957135e-05, |
| "loss": 0.0391, |
| "step": 850 |
| }, |
| { |
| "epoch": 56.67, |
| "eval_loss": 0.020865805447101593, |
| "eval_runtime": 16.0515, |
| "eval_samples_per_second": 29.904, |
| "eval_steps_per_second": 3.738, |
| "eval_wer": 0.24375, |
| "step": 850 |
| }, |
| { |
| "epoch": 60.0, |
| "learning_rate": 1.7690773637801294e-05, |
| "loss": 0.0367, |
| "step": 900 |
| }, |
| { |
| "epoch": 60.0, |
| "eval_loss": 0.022958721965551376, |
| "eval_runtime": 15.4228, |
| "eval_samples_per_second": 31.123, |
| "eval_steps_per_second": 3.89, |
| "eval_wer": 0.21625, |
| "step": 900 |
| }, |
| { |
| "epoch": 63.33, |
| "learning_rate": 1.2589034464264932e-05, |
| "loss": 0.0333, |
| "step": 950 |
| }, |
| { |
| "epoch": 63.33, |
| "eval_loss": 0.021822014823555946, |
| "eval_runtime": 15.5217, |
| "eval_samples_per_second": 30.924, |
| "eval_steps_per_second": 3.866, |
| "eval_wer": 0.23, |
| "step": 950 |
| }, |
| { |
| "epoch": 66.67, |
| "learning_rate": 8.248874664720375e-06, |
| "loss": 0.0327, |
| "step": 1000 |
| }, |
| { |
| "epoch": 66.67, |
| "eval_loss": 0.02000792883336544, |
| "eval_runtime": 15.8435, |
| "eval_samples_per_second": 30.296, |
| "eval_steps_per_second": 3.787, |
| "eval_wer": 0.21625, |
| "step": 1000 |
| }, |
| { |
| "epoch": 70.0, |
| "learning_rate": 4.758647376699032e-06, |
| "loss": 0.0306, |
| "step": 1050 |
| }, |
| { |
| "epoch": 70.0, |
| "eval_loss": 0.02014043927192688, |
| "eval_runtime": 15.7796, |
| "eval_samples_per_second": 30.419, |
| "eval_steps_per_second": 3.802, |
| "eval_wer": 0.21625, |
| "step": 1050 |
| }, |
| { |
| "epoch": 73.33, |
| "learning_rate": 2.1894035628006517e-06, |
| "loss": 0.0269, |
| "step": 1100 |
| }, |
| { |
| "epoch": 73.33, |
| "eval_loss": 0.02098565548658371, |
| "eval_runtime": 16.1184, |
| "eval_samples_per_second": 29.78, |
| "eval_steps_per_second": 3.722, |
| "eval_wer": 0.2075, |
| "step": 1100 |
| }, |
| { |
| "epoch": 76.67, |
| "learning_rate": 5.934456179888804e-07, |
| "loss": 0.0288, |
| "step": 1150 |
| }, |
| { |
| "epoch": 76.67, |
| "eval_loss": 0.021614952012896538, |
| "eval_runtime": 15.8598, |
| "eval_samples_per_second": 30.265, |
| "eval_steps_per_second": 3.783, |
| "eval_wer": 0.21625, |
| "step": 1150 |
| }, |
| { |
| "epoch": 80.0, |
| "learning_rate": 3.262643657425679e-09, |
| "loss": 0.0289, |
| "step": 1200 |
| }, |
| { |
| "epoch": 80.0, |
| "eval_loss": 0.02152070961892605, |
| "eval_runtime": 16.1024, |
| "eval_samples_per_second": 29.809, |
| "eval_steps_per_second": 3.726, |
| "eval_wer": 0.21625, |
| "step": 1200 |
| } |
| ], |
| "max_steps": 1200, |
| "num_train_epochs": 80, |
| "total_flos": 3.3688058529081743e+18, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|