{ "best_metric": 0.8212058967880319, "best_model_checkpoint": "./outputs/facebook/wav2vec2-xls-r-1b/checkpoint-6716", "epoch": 29.969293756397136, "eval_steps": 500, "global_step": 18300, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 6.07e-05, "loss": 4.5214, "step": 610 }, { "epoch": 1.0, "eval_loss": 2.5036747455596924, "eval_runtime": 53.3547, "eval_samples_per_second": 139.182, "eval_steps_per_second": 4.367, "eval_wer": 0.9721338592696271, "step": 610 }, { "epoch": 2.0, "learning_rate": 9.873988439306359e-05, "loss": 0.5588, "step": 1221 }, { "epoch": 2.0, "eval_loss": 2.375758171081543, "eval_runtime": 52.8335, "eval_samples_per_second": 140.555, "eval_steps_per_second": 4.41, "eval_wer": 0.9198734844491302, "step": 1221 }, { "epoch": 3.0, "learning_rate": 9.521387283236995e-05, "loss": 0.4547, "step": 1831 }, { "epoch": 3.0, "eval_loss": 2.2466094493865967, "eval_runtime": 53.1764, "eval_samples_per_second": 139.648, "eval_steps_per_second": 4.382, "eval_wer": 0.9418864631996073, "step": 1831 }, { "epoch": 4.0, "learning_rate": 9.16820809248555e-05, "loss": 0.4025, "step": 2442 }, { "epoch": 4.0, "eval_loss": 2.2312777042388916, "eval_runtime": 54.1165, "eval_samples_per_second": 137.223, "eval_steps_per_second": 4.306, "eval_wer": 0.8876083834729973, "step": 2442 }, { "epoch": 5.0, "learning_rate": 8.815606936416185e-05, "loss": 0.3789, "step": 3053 }, { "epoch": 5.0, "eval_loss": 2.244392156600952, "eval_runtime": 52.4474, "eval_samples_per_second": 141.589, "eval_steps_per_second": 4.443, "eval_wer": 0.8844636722229291, "step": 3053 }, { "epoch": 6.0, "learning_rate": 8.463005780346821e-05, "loss": 0.3542, "step": 3663 }, { "epoch": 6.0, "eval_loss": 1.9893066883087158, "eval_runtime": 54.83, "eval_samples_per_second": 135.437, "eval_steps_per_second": 4.249, "eval_wer": 0.8913711304600731, "step": 3663 }, { "epoch": 7.0, "learning_rate": 8.109826589595376e-05, "loss": 0.3383, "step": 4274 }, { "epoch": 7.0, "eval_loss": 1.3484952449798584, "eval_runtime": 53.4092, "eval_samples_per_second": 139.04, "eval_steps_per_second": 4.363, "eval_wer": 0.8356752040426808, "step": 4274 }, { "epoch": 8.0, "learning_rate": 7.756647398843931e-05, "loss": 0.3239, "step": 4885 }, { "epoch": 8.0, "eval_loss": 1.98879075050354, "eval_runtime": 53.1444, "eval_samples_per_second": 139.732, "eval_steps_per_second": 4.384, "eval_wer": 0.8775743915074619, "step": 4885 }, { "epoch": 9.0, "learning_rate": 7.404624277456647e-05, "loss": 0.3074, "step": 5495 }, { "epoch": 9.0, "eval_loss": 1.9461687803268433, "eval_runtime": 53.2785, "eval_samples_per_second": 139.381, "eval_steps_per_second": 4.373, "eval_wer": 0.8689400687110319, "step": 5495 }, { "epoch": 10.0, "learning_rate": 7.051445086705202e-05, "loss": 0.2883, "step": 6106 }, { "epoch": 10.0, "eval_loss": 1.5767468214035034, "eval_runtime": 53.0357, "eval_samples_per_second": 140.019, "eval_steps_per_second": 4.393, "eval_wer": 0.8871357679094032, "step": 6106 }, { "epoch": 11.0, "learning_rate": 6.698843930635838e-05, "loss": 0.2749, "step": 6716 }, { "epoch": 11.0, "eval_loss": 1.3259695768356323, "eval_runtime": 53.7403, "eval_samples_per_second": 138.183, "eval_steps_per_second": 4.336, "eval_wer": 0.8212058967880319, "step": 6716 }, { "epoch": 12.0, "learning_rate": 6.345664739884394e-05, "loss": 0.2563, "step": 7327 }, { "epoch": 12.0, "eval_loss": 1.8269567489624023, "eval_runtime": 53.4539, "eval_samples_per_second": 138.923, "eval_steps_per_second": 4.359, "eval_wer": 0.844000508970607, "step": 7327 }, { "epoch": 13.0, "learning_rate": 5.992485549132948e-05, "loss": 0.2474, "step": 7938 }, { "epoch": 13.0, "eval_loss": 1.8218885660171509, "eval_runtime": 53.3104, "eval_samples_per_second": 139.297, "eval_steps_per_second": 4.371, "eval_wer": 0.8676676421936633, "step": 7938 }, { "epoch": 14.0, "learning_rate": 5.6398843930635835e-05, "loss": 0.2347, "step": 8548 }, { "epoch": 14.0, "eval_loss": 1.5345903635025024, "eval_runtime": 53.5574, "eval_samples_per_second": 138.655, "eval_steps_per_second": 4.35, "eval_wer": 0.8634504571646702, "step": 8548 }, { "epoch": 15.0, "learning_rate": 5.28728323699422e-05, "loss": 0.2211, "step": 9159 }, { "epoch": 15.0, "eval_loss": 1.7185391187667847, "eval_runtime": 53.0996, "eval_samples_per_second": 139.85, "eval_steps_per_second": 4.388, "eval_wer": 0.8636140548597604, "step": 9159 }, { "epoch": 16.0, "learning_rate": 4.934104046242775e-05, "loss": 0.2117, "step": 9770 }, { "epoch": 16.0, "eval_loss": 1.8662818670272827, "eval_runtime": 54.2061, "eval_samples_per_second": 136.996, "eval_steps_per_second": 4.298, "eval_wer": 0.8696671695780998, "step": 9770 }, { "epoch": 17.0, "learning_rate": 4.582080924855491e-05, "loss": 0.1987, "step": 10380 }, { "epoch": 17.0, "eval_loss": 1.4298427104949951, "eval_runtime": 53.5752, "eval_samples_per_second": 138.609, "eval_steps_per_second": 4.349, "eval_wer": 0.8686674058858815, "step": 10380 }, { "epoch": 18.0, "learning_rate": 4.228901734104046e-05, "loss": 0.1814, "step": 10991 }, { "epoch": 18.0, "eval_loss": 1.5630472898483276, "eval_runtime": 54.0558, "eval_samples_per_second": 137.377, "eval_steps_per_second": 4.31, "eval_wer": 0.8680130151055205, "step": 10991 }, { "epoch": 19.0, "learning_rate": 3.8763005780346824e-05, "loss": 0.1694, "step": 11601 }, { "epoch": 19.0, "eval_loss": 1.3626692295074463, "eval_runtime": 53.8757, "eval_samples_per_second": 137.836, "eval_steps_per_second": 4.325, "eval_wer": 0.8573246323596241, "step": 11601 }, { "epoch": 20.0, "learning_rate": 3.523121387283237e-05, "loss": 0.1597, "step": 12212 }, { "epoch": 20.0, "eval_loss": 1.7108192443847656, "eval_runtime": 54.0651, "eval_samples_per_second": 137.353, "eval_steps_per_second": 4.31, "eval_wer": 0.8641775580317379, "step": 12212 }, { "epoch": 21.0, "learning_rate": 3.169942196531792e-05, "loss": 0.1517, "step": 12823 }, { "epoch": 21.0, "eval_loss": 1.8344017267227173, "eval_runtime": 53.2307, "eval_samples_per_second": 139.506, "eval_steps_per_second": 4.377, "eval_wer": 0.8794466762401614, "step": 12823 }, { "epoch": 22.0, "learning_rate": 2.817341040462428e-05, "loss": 0.1405, "step": 13433 }, { "epoch": 22.0, "eval_loss": 1.4837909936904907, "eval_runtime": 52.8743, "eval_samples_per_second": 140.446, "eval_steps_per_second": 4.407, "eval_wer": 0.8508352571210441, "step": 13433 }, { "epoch": 23.0, "learning_rate": 2.4641618497109827e-05, "loss": 0.1262, "step": 14044 }, { "epoch": 23.0, "eval_loss": 1.5321871042251587, "eval_runtime": 57.0975, "eval_samples_per_second": 130.058, "eval_steps_per_second": 4.081, "eval_wer": 0.8415283660225765, "step": 14044 }, { "epoch": 24.0, "learning_rate": 2.1109826589595376e-05, "loss": 0.1171, "step": 14655 }, { "epoch": 24.0, "eval_loss": 1.7094522714614868, "eval_runtime": 54.2703, "eval_samples_per_second": 136.834, "eval_steps_per_second": 4.293, "eval_wer": 0.8682493228873176, "step": 14655 }, { "epoch": 25.0, "learning_rate": 1.7589595375722546e-05, "loss": 0.1079, "step": 15265 }, { "epoch": 25.0, "eval_loss": 1.744529128074646, "eval_runtime": 53.2445, "eval_samples_per_second": 139.47, "eval_steps_per_second": 4.376, "eval_wer": 0.8719211822660099, "step": 15265 }, { "epoch": 26.0, "learning_rate": 1.4057803468208095e-05, "loss": 0.0996, "step": 15876 }, { "epoch": 26.0, "eval_loss": 1.73218834400177, "eval_runtime": 55.182, "eval_samples_per_second": 134.573, "eval_steps_per_second": 4.222, "eval_wer": 0.8501808663406831, "step": 15876 }, { "epoch": 27.0, "learning_rate": 1.0537572254335262e-05, "loss": 0.0922, "step": 16486 }, { "epoch": 27.0, "eval_loss": 1.8349395990371704, "eval_runtime": 55.3784, "eval_samples_per_second": 134.096, "eval_steps_per_second": 4.207, "eval_wer": 0.862450693472452, "step": 16486 }, { "epoch": 28.0, "learning_rate": 7.00578034682081e-06, "loss": 0.0855, "step": 17097 }, { "epoch": 28.0, "eval_loss": 1.8259180784225464, "eval_runtime": 52.9961, "eval_samples_per_second": 140.124, "eval_steps_per_second": 4.397, "eval_wer": 0.8645592859869485, "step": 17097 }, { "epoch": 29.0, "learning_rate": 3.473988439306359e-06, "loss": 0.081, "step": 17708 }, { "epoch": 29.0, "eval_loss": 1.818723440170288, "eval_runtime": 53.212, "eval_samples_per_second": 139.555, "eval_steps_per_second": 4.379, "eval_wer": 0.8650864341155727, "step": 17708 }, { "epoch": 29.97, "learning_rate": 5.2023121387283234e-08, "loss": 0.0771, "step": 18300 }, { "epoch": 29.97, "eval_loss": 1.842650055885315, "eval_runtime": 54.1155, "eval_samples_per_second": 137.225, "eval_steps_per_second": 4.306, "eval_wer": 0.8623598058640685, "step": 18300 }, { "epoch": 29.97, "step": 18300, "total_flos": 2.0400693356246094e+21, "train_loss": 0.372250930494298, "train_runtime": 52675.4843, "train_samples_per_second": 89.021, "train_steps_per_second": 0.347 } ], "logging_steps": 500, "max_steps": 18300, "num_train_epochs": 30, "save_steps": 500, "total_flos": 2.0400693356246094e+21, "trial_name": null, "trial_params": null }