{ "best_global_step": 9000, "best_metric": 0.3495483628152051, "best_model_checkpoint": "/content/drive/MyDrive/Model-Finetuning/wav2vec2/model/zu_wav2vec2/checkpoint-9000", "epoch": 10.0, "eval_steps": 500, "global_step": 9380, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.5333333333333333, "grad_norm": 2.2490434646606445, "learning_rate": 0.00029939999999999996, "loss": 5.3513, "step": 500 }, { "epoch": 0.5333333333333333, "eval_loss": 3.067410707473755, "eval_runtime": 142.738, "eval_samples_per_second": 21.018, "eval_steps_per_second": 2.627, "eval_wer": 1.0, "step": 500 }, { "epoch": 1.0661333333333334, "grad_norm": 1.0280228853225708, "learning_rate": 0.0002831418918918919, "loss": 2.4793, "step": 1000 }, { "epoch": 1.0661333333333334, "eval_loss": 1.1224186420440674, "eval_runtime": 144.1294, "eval_samples_per_second": 20.815, "eval_steps_per_second": 2.602, "eval_wer": 0.992002258185924, "step": 1000 }, { "epoch": 1.5994666666666668, "grad_norm": 1.6041176319122314, "learning_rate": 0.00026624999999999994, "loss": 0.9637, "step": 1500 }, { "epoch": 1.5994666666666668, "eval_loss": 0.6741820573806763, "eval_runtime": 143.9596, "eval_samples_per_second": 20.839, "eval_steps_per_second": 2.605, "eval_wer": 0.7161272111403839, "step": 1500 }, { "epoch": 2.1322666666666668, "grad_norm": 1.4150700569152832, "learning_rate": 0.00024935810810810806, "loss": 0.717, "step": 2000 }, { "epoch": 2.1322666666666668, "eval_loss": 0.5053547620773315, "eval_runtime": 145.0264, "eval_samples_per_second": 20.686, "eval_steps_per_second": 2.586, "eval_wer": 0.620530673692134, "step": 2000 }, { "epoch": 2.6656, "grad_norm": 1.3749128580093384, "learning_rate": 0.0002324662162162162, "loss": 0.5979, "step": 2500 }, { "epoch": 2.6656, "eval_loss": 0.4564489424228668, "eval_runtime": 145.9072, "eval_samples_per_second": 20.561, "eval_steps_per_second": 2.57, "eval_wer": 0.5550432818968761, "step": 2500 }, { "epoch": 3.1984, "grad_norm": 1.1167936325073242, "learning_rate": 0.00021557432432432432, "loss": 0.5388, "step": 3000 }, { "epoch": 3.1984, "eval_loss": 0.4222851097583771, "eval_runtime": 146.8407, "eval_samples_per_second": 20.43, "eval_steps_per_second": 2.554, "eval_wer": 0.5333082423786225, "step": 3000 }, { "epoch": 3.7317333333333336, "grad_norm": 1.713294267654419, "learning_rate": 0.00019868243243243244, "loss": 0.4762, "step": 3500 }, { "epoch": 3.7317333333333336, "eval_loss": 0.3905419409275055, "eval_runtime": 146.5994, "eval_samples_per_second": 20.464, "eval_steps_per_second": 2.558, "eval_wer": 0.4974595408355288, "step": 3500 }, { "epoch": 4.2645333333333335, "grad_norm": 2.082676887512207, "learning_rate": 0.0001817905405405405, "loss": 0.4398, "step": 4000 }, { "epoch": 4.2645333333333335, "eval_loss": 0.3778238892555237, "eval_runtime": 145.863, "eval_samples_per_second": 20.567, "eval_steps_per_second": 2.571, "eval_wer": 0.48692133985698155, "step": 4000 }, { "epoch": 4.797866666666667, "grad_norm": 2.2089028358459473, "learning_rate": 0.00016489864864864862, "loss": 0.4098, "step": 4500 }, { "epoch": 4.797866666666667, "eval_loss": 0.35478344559669495, "eval_runtime": 146.045, "eval_samples_per_second": 20.542, "eval_steps_per_second": 2.568, "eval_wer": 0.4574708317651487, "step": 4500 }, { "epoch": 5.330666666666667, "grad_norm": 1.058657169342041, "learning_rate": 0.00014800675675675674, "loss": 0.3823, "step": 5000 }, { "epoch": 5.330666666666667, "eval_loss": 0.3355245292186737, "eval_runtime": 145.8678, "eval_samples_per_second": 20.567, "eval_steps_per_second": 2.571, "eval_wer": 0.45079036507339104, "step": 5000 }, { "epoch": 5.864, "grad_norm": 1.4570820331573486, "learning_rate": 0.00013111486486486486, "loss": 0.3513, "step": 5500 }, { "epoch": 5.864, "eval_loss": 0.32364729046821594, "eval_runtime": 147.2305, "eval_samples_per_second": 20.376, "eval_steps_per_second": 2.547, "eval_wer": 0.4314076025592774, "step": 5500 }, { "epoch": 6.3968, "grad_norm": 2.4523627758026123, "learning_rate": 0.00011422297297297297, "loss": 0.3111, "step": 6000 }, { "epoch": 6.3968, "eval_loss": 0.3129761517047882, "eval_runtime": 146.9224, "eval_samples_per_second": 20.419, "eval_steps_per_second": 2.552, "eval_wer": 0.4113662024840045, "step": 6000 }, { "epoch": 6.930133333333333, "grad_norm": 1.3307918310165405, "learning_rate": 9.733108108108107e-05, "loss": 0.3032, "step": 6500 }, { "epoch": 6.930133333333333, "eval_loss": 0.301826536655426, "eval_runtime": 147.6721, "eval_samples_per_second": 20.315, "eval_steps_per_second": 2.539, "eval_wer": 0.4039330071509221, "step": 6500 }, { "epoch": 7.462933333333333, "grad_norm": 1.828587532043457, "learning_rate": 8.043918918918918e-05, "loss": 0.2698, "step": 7000 }, { "epoch": 7.462933333333333, "eval_loss": 0.29749611020088196, "eval_runtime": 146.8529, "eval_samples_per_second": 20.429, "eval_steps_per_second": 2.554, "eval_wer": 0.3873729770417764, "step": 7000 }, { "epoch": 7.996266666666667, "grad_norm": 1.7805229425430298, "learning_rate": 6.354729729729729e-05, "loss": 0.2661, "step": 7500 }, { "epoch": 7.996266666666667, "eval_loss": 0.2899162769317627, "eval_runtime": 147.9735, "eval_samples_per_second": 20.274, "eval_steps_per_second": 2.534, "eval_wer": 0.3744824990590892, "step": 7500 }, { "epoch": 8.529066666666667, "grad_norm": 1.059174656867981, "learning_rate": 4.66554054054054e-05, "loss": 0.233, "step": 8000 }, { "epoch": 8.529066666666667, "eval_loss": 0.2895633280277252, "eval_runtime": 147.1645, "eval_samples_per_second": 20.385, "eval_steps_per_second": 2.548, "eval_wer": 0.36356793375987956, "step": 8000 }, { "epoch": 9.061866666666667, "grad_norm": 0.938797116279602, "learning_rate": 2.976351351351351e-05, "loss": 0.2336, "step": 8500 }, { "epoch": 9.061866666666667, "eval_loss": 0.2831208407878876, "eval_runtime": 147.624, "eval_samples_per_second": 20.322, "eval_steps_per_second": 2.54, "eval_wer": 0.35641701166729395, "step": 8500 }, { "epoch": 9.5952, "grad_norm": 6.92275333404541, "learning_rate": 1.287162162162162e-05, "loss": 0.2137, "step": 9000 }, { "epoch": 9.5952, "eval_loss": 0.27855604887008667, "eval_runtime": 146.2994, "eval_samples_per_second": 20.506, "eval_steps_per_second": 2.563, "eval_wer": 0.3495483628152051, "step": 9000 } ], "logging_steps": 500, "max_steps": 9380, "num_input_tokens_seen": 0, "num_train_epochs": 10, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.167851661799376e+19, "train_batch_size": 8, "trial_name": null, "trial_params": null }