| { | |
| "best_metric": 0.03376658633351326, | |
| "best_model_checkpoint": "./wav2vec2-base-demo/checkpoint-4000", | |
| "epoch": 13.513513513513514, | |
| "eval_steps": 500, | |
| "global_step": 6500, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0395010395010396, | |
| "grad_norm": 1.9346532821655273, | |
| "learning_rate": 4.99e-05, | |
| "loss": 0.0523, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 1.0395010395010396, | |
| "eval_cer": 0.029377520894839703, | |
| "eval_loss": 0.04082171246409416, | |
| "eval_mer": 0.09753672187970566, | |
| "eval_runtime": 69.2746, | |
| "eval_samples_per_second": 44.36, | |
| "eval_steps_per_second": 5.558, | |
| "eval_wer": 0.0977199624263471, | |
| "eval_wil": 0.17927306635544427, | |
| "eval_wip": 0.8207269336445557, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 2.079002079002079, | |
| "grad_norm": 2.06243634223938, | |
| "learning_rate": 4.726425438596491e-05, | |
| "loss": 0.1255, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 2.079002079002079, | |
| "eval_cer": 0.031144746143290783, | |
| "eval_loss": 0.04166610538959503, | |
| "eval_mer": 0.09972456484084391, | |
| "eval_runtime": 68.8885, | |
| "eval_samples_per_second": 44.608, | |
| "eval_steps_per_second": 5.589, | |
| "eval_wer": 0.09996868862258404, | |
| "eval_wil": 0.1818749372014863, | |
| "eval_wip": 0.8181250627985137, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 3.1185031185031185, | |
| "grad_norm": 1.8282793760299683, | |
| "learning_rate": 4.452302631578947e-05, | |
| "loss": 0.1456, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 3.1185031185031185, | |
| "eval_cer": 0.030666555781945194, | |
| "eval_loss": 0.04946601018309593, | |
| "eval_mer": 0.09887519172868262, | |
| "eval_runtime": 69.4551, | |
| "eval_samples_per_second": 44.244, | |
| "eval_steps_per_second": 5.543, | |
| "eval_wer": 0.09908627707722524, | |
| "eval_wil": 0.18065502190864302, | |
| "eval_wip": 0.819344978091357, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 4.158004158004158, | |
| "grad_norm": 1.501983880996704, | |
| "learning_rate": 4.178728070175439e-05, | |
| "loss": 0.1348, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 4.158004158004158, | |
| "eval_cer": 0.031241770274578293, | |
| "eval_loss": 0.04532551020383835, | |
| "eval_mer": 0.09941786170665909, | |
| "eval_runtime": 69.1184, | |
| "eval_samples_per_second": 44.46, | |
| "eval_steps_per_second": 5.57, | |
| "eval_wer": 0.09965557484842447, | |
| "eval_wil": 0.18122310589648583, | |
| "eval_wip": 0.8187768941035142, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 5.197505197505198, | |
| "grad_norm": 2.2279298305511475, | |
| "learning_rate": 3.904605263157895e-05, | |
| "loss": 0.1328, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 5.197505197505198, | |
| "eval_cer": 0.030694276962313055, | |
| "eval_loss": 0.043331652879714966, | |
| "eval_mer": 0.09920499716070415, | |
| "eval_runtime": 69.2256, | |
| "eval_samples_per_second": 44.391, | |
| "eval_steps_per_second": 5.562, | |
| "eval_wer": 0.09945632062850474, | |
| "eval_wil": 0.1809313141913549, | |
| "eval_wip": 0.8190686858086451, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 6.237006237006237, | |
| "grad_norm": 3.002439498901367, | |
| "learning_rate": 3.6321271929824565e-05, | |
| "loss": 0.1179, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 6.237006237006237, | |
| "eval_cer": 0.030153713945139785, | |
| "eval_loss": 0.03851901367306709, | |
| "eval_mer": 0.09771598808341608, | |
| "eval_runtime": 68.9837, | |
| "eval_samples_per_second": 44.547, | |
| "eval_steps_per_second": 5.581, | |
| "eval_wer": 0.09803307620050668, | |
| "eval_wil": 0.17836955409428712, | |
| "eval_wip": 0.8216304459057129, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 7.276507276507276, | |
| "grad_norm": 2.6515450477600098, | |
| "learning_rate": 3.358004385964912e-05, | |
| "loss": 0.1162, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 7.276507276507276, | |
| "eval_cer": 0.029925014207104937, | |
| "eval_loss": 0.03501337394118309, | |
| "eval_mer": 0.09821960984751682, | |
| "eval_runtime": 69.3123, | |
| "eval_samples_per_second": 44.336, | |
| "eval_steps_per_second": 5.555, | |
| "eval_wer": 0.0984600495289061, | |
| "eval_wil": 0.1797471797395056, | |
| "eval_wip": 0.8202528202604944, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 8.316008316008316, | |
| "grad_norm": 1.6817522048950195, | |
| "learning_rate": 3.0838815789473685e-05, | |
| "loss": 0.1365, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 8.316008316008316, | |
| "eval_cer": 0.03011906246967996, | |
| "eval_loss": 0.03376658633351326, | |
| "eval_mer": 0.09842117219445706, | |
| "eval_runtime": 68.9641, | |
| "eval_samples_per_second": 44.559, | |
| "eval_steps_per_second": 5.583, | |
| "eval_wer": 0.09865930374882582, | |
| "eval_wil": 0.18011352865946695, | |
| "eval_wip": 0.819886471340533, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 9.355509355509355, | |
| "grad_norm": 0.6051247119903564, | |
| "learning_rate": 2.81030701754386e-05, | |
| "loss": 0.1347, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 9.355509355509355, | |
| "eval_cer": 0.029703244764162057, | |
| "eval_loss": 0.03462997451424599, | |
| "eval_mer": 0.09795732833319129, | |
| "eval_runtime": 69.4003, | |
| "eval_samples_per_second": 44.279, | |
| "eval_steps_per_second": 5.548, | |
| "eval_wer": 0.09814693575474652, | |
| "eval_wil": 0.17949922019601927, | |
| "eval_wip": 0.8205007798039807, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 10.395010395010395, | |
| "grad_norm": 1.5656287670135498, | |
| "learning_rate": 2.536732456140351e-05, | |
| "loss": 0.1068, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 10.395010395010395, | |
| "eval_cer": 0.029682453878886163, | |
| "eval_loss": 0.037345826625823975, | |
| "eval_mer": 0.09753812079393474, | |
| "eval_runtime": 69.4802, | |
| "eval_samples_per_second": 44.228, | |
| "eval_steps_per_second": 5.541, | |
| "eval_wer": 0.09777689220346703, | |
| "eval_wil": 0.1784365366866959, | |
| "eval_wip": 0.8215634633133041, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 11.434511434511435, | |
| "grad_norm": 2.0051817893981934, | |
| "learning_rate": 2.2631578947368423e-05, | |
| "loss": 0.1137, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 11.434511434511435, | |
| "eval_cer": 0.02954384797704686, | |
| "eval_loss": 0.03467037156224251, | |
| "eval_mer": 0.09743283921167717, | |
| "eval_runtime": 68.8824, | |
| "eval_samples_per_second": 44.612, | |
| "eval_steps_per_second": 5.589, | |
| "eval_wer": 0.09766303264922718, | |
| "eval_wil": 0.178736836050011, | |
| "eval_wip": 0.821263163949989, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 12.474012474012474, | |
| "grad_norm": 1.0739721059799194, | |
| "learning_rate": 1.9890350877192984e-05, | |
| "loss": 0.1172, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 12.474012474012474, | |
| "eval_cer": 0.02943989355066739, | |
| "eval_loss": 0.03584234416484833, | |
| "eval_mer": 0.09757691105871659, | |
| "eval_runtime": 69.0922, | |
| "eval_samples_per_second": 44.477, | |
| "eval_steps_per_second": 5.572, | |
| "eval_wer": 0.09777689220346703, | |
| "eval_wil": 0.17892556337428467, | |
| "eval_wip": 0.8210744366257153, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 13.513513513513514, | |
| "grad_norm": 2.266472339630127, | |
| "learning_rate": 1.7154605263157897e-05, | |
| "loss": 0.1115, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 13.513513513513514, | |
| "eval_cer": 0.02930821794392005, | |
| "eval_loss": 0.034342650324106216, | |
| "eval_mer": 0.09706725718990432, | |
| "eval_runtime": 69.2359, | |
| "eval_samples_per_second": 44.384, | |
| "eval_steps_per_second": 5.561, | |
| "eval_wer": 0.09732145398650764, | |
| "eval_wil": 0.17795643596108135, | |
| "eval_wip": 0.8220435640389187, | |
| "step": 6500 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 9620, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 20, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": false | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 4.1652748241888937e+18, | |
| "train_batch_size": 16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |