{ "best_metric": 0.03376658633351326, "best_model_checkpoint": "./wav2vec2-base-demo/checkpoint-4000", "epoch": 13.513513513513514, "eval_steps": 500, "global_step": 6500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0395010395010396, "grad_norm": 1.9346532821655273, "learning_rate": 4.99e-05, "loss": 0.0523, "step": 500 }, { "epoch": 1.0395010395010396, "eval_cer": 0.029377520894839703, "eval_loss": 0.04082171246409416, "eval_mer": 0.09753672187970566, "eval_runtime": 69.2746, "eval_samples_per_second": 44.36, "eval_steps_per_second": 5.558, "eval_wer": 0.0977199624263471, "eval_wil": 0.17927306635544427, "eval_wip": 0.8207269336445557, "step": 500 }, { "epoch": 2.079002079002079, "grad_norm": 2.06243634223938, "learning_rate": 4.726425438596491e-05, "loss": 0.1255, "step": 1000 }, { "epoch": 2.079002079002079, "eval_cer": 0.031144746143290783, "eval_loss": 0.04166610538959503, "eval_mer": 0.09972456484084391, "eval_runtime": 68.8885, "eval_samples_per_second": 44.608, "eval_steps_per_second": 5.589, "eval_wer": 0.09996868862258404, "eval_wil": 0.1818749372014863, "eval_wip": 0.8181250627985137, "step": 1000 }, { "epoch": 3.1185031185031185, "grad_norm": 1.8282793760299683, "learning_rate": 4.452302631578947e-05, "loss": 0.1456, "step": 1500 }, { "epoch": 3.1185031185031185, "eval_cer": 0.030666555781945194, "eval_loss": 0.04946601018309593, "eval_mer": 0.09887519172868262, "eval_runtime": 69.4551, "eval_samples_per_second": 44.244, "eval_steps_per_second": 5.543, "eval_wer": 0.09908627707722524, "eval_wil": 0.18065502190864302, "eval_wip": 0.819344978091357, "step": 1500 }, { "epoch": 4.158004158004158, "grad_norm": 1.501983880996704, "learning_rate": 4.178728070175439e-05, "loss": 0.1348, "step": 2000 }, { "epoch": 4.158004158004158, "eval_cer": 0.031241770274578293, "eval_loss": 0.04532551020383835, "eval_mer": 0.09941786170665909, "eval_runtime": 69.1184, "eval_samples_per_second": 44.46, "eval_steps_per_second": 5.57, "eval_wer": 0.09965557484842447, "eval_wil": 0.18122310589648583, "eval_wip": 0.8187768941035142, "step": 2000 }, { "epoch": 5.197505197505198, "grad_norm": 2.2279298305511475, "learning_rate": 3.904605263157895e-05, "loss": 0.1328, "step": 2500 }, { "epoch": 5.197505197505198, "eval_cer": 0.030694276962313055, "eval_loss": 0.043331652879714966, "eval_mer": 0.09920499716070415, "eval_runtime": 69.2256, "eval_samples_per_second": 44.391, "eval_steps_per_second": 5.562, "eval_wer": 0.09945632062850474, "eval_wil": 0.1809313141913549, "eval_wip": 0.8190686858086451, "step": 2500 }, { "epoch": 6.237006237006237, "grad_norm": 3.002439498901367, "learning_rate": 3.6321271929824565e-05, "loss": 0.1179, "step": 3000 }, { "epoch": 6.237006237006237, "eval_cer": 0.030153713945139785, "eval_loss": 0.03851901367306709, "eval_mer": 0.09771598808341608, "eval_runtime": 68.9837, "eval_samples_per_second": 44.547, "eval_steps_per_second": 5.581, "eval_wer": 0.09803307620050668, "eval_wil": 0.17836955409428712, "eval_wip": 0.8216304459057129, "step": 3000 }, { "epoch": 7.276507276507276, "grad_norm": 2.6515450477600098, "learning_rate": 3.358004385964912e-05, "loss": 0.1162, "step": 3500 }, { "epoch": 7.276507276507276, "eval_cer": 0.029925014207104937, "eval_loss": 0.03501337394118309, "eval_mer": 0.09821960984751682, "eval_runtime": 69.3123, "eval_samples_per_second": 44.336, "eval_steps_per_second": 5.555, "eval_wer": 0.0984600495289061, "eval_wil": 0.1797471797395056, "eval_wip": 0.8202528202604944, "step": 3500 }, { "epoch": 8.316008316008316, "grad_norm": 1.6817522048950195, "learning_rate": 3.0838815789473685e-05, "loss": 0.1365, "step": 4000 }, { "epoch": 8.316008316008316, "eval_cer": 0.03011906246967996, "eval_loss": 0.03376658633351326, "eval_mer": 0.09842117219445706, "eval_runtime": 68.9641, "eval_samples_per_second": 44.559, "eval_steps_per_second": 5.583, "eval_wer": 0.09865930374882582, "eval_wil": 0.18011352865946695, "eval_wip": 0.819886471340533, "step": 4000 }, { "epoch": 9.355509355509355, "grad_norm": 0.6051247119903564, "learning_rate": 2.81030701754386e-05, "loss": 0.1347, "step": 4500 }, { "epoch": 9.355509355509355, "eval_cer": 0.029703244764162057, "eval_loss": 0.03462997451424599, "eval_mer": 0.09795732833319129, "eval_runtime": 69.4003, "eval_samples_per_second": 44.279, "eval_steps_per_second": 5.548, "eval_wer": 0.09814693575474652, "eval_wil": 0.17949922019601927, "eval_wip": 0.8205007798039807, "step": 4500 }, { "epoch": 10.395010395010395, "grad_norm": 1.5656287670135498, "learning_rate": 2.536732456140351e-05, "loss": 0.1068, "step": 5000 }, { "epoch": 10.395010395010395, "eval_cer": 0.029682453878886163, "eval_loss": 0.037345826625823975, "eval_mer": 0.09753812079393474, "eval_runtime": 69.4802, "eval_samples_per_second": 44.228, "eval_steps_per_second": 5.541, "eval_wer": 0.09777689220346703, "eval_wil": 0.1784365366866959, "eval_wip": 0.8215634633133041, "step": 5000 }, { "epoch": 11.434511434511435, "grad_norm": 2.0051817893981934, "learning_rate": 2.2631578947368423e-05, "loss": 0.1137, "step": 5500 }, { "epoch": 11.434511434511435, "eval_cer": 0.02954384797704686, "eval_loss": 0.03467037156224251, "eval_mer": 0.09743283921167717, "eval_runtime": 68.8824, "eval_samples_per_second": 44.612, "eval_steps_per_second": 5.589, "eval_wer": 0.09766303264922718, "eval_wil": 0.178736836050011, "eval_wip": 0.821263163949989, "step": 5500 }, { "epoch": 12.474012474012474, "grad_norm": 1.0739721059799194, "learning_rate": 1.9890350877192984e-05, "loss": 0.1172, "step": 6000 }, { "epoch": 12.474012474012474, "eval_cer": 0.02943989355066739, "eval_loss": 0.03584234416484833, "eval_mer": 0.09757691105871659, "eval_runtime": 69.0922, "eval_samples_per_second": 44.477, "eval_steps_per_second": 5.572, "eval_wer": 0.09777689220346703, "eval_wil": 0.17892556337428467, "eval_wip": 0.8210744366257153, "step": 6000 }, { "epoch": 13.513513513513514, "grad_norm": 2.266472339630127, "learning_rate": 1.7154605263157897e-05, "loss": 0.1115, "step": 6500 }, { "epoch": 13.513513513513514, "eval_cer": 0.02930821794392005, "eval_loss": 0.034342650324106216, "eval_mer": 0.09706725718990432, "eval_runtime": 69.2359, "eval_samples_per_second": 44.384, "eval_steps_per_second": 5.561, "eval_wer": 0.09732145398650764, "eval_wil": 0.17795643596108135, "eval_wip": 0.8220435640389187, "step": 6500 } ], "logging_steps": 500, "max_steps": 9620, "num_input_tokens_seen": 0, "num_train_epochs": 20, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 4.1652748241888937e+18, "train_batch_size": 16, "trial_name": null, "trial_params": null }