{ "best_global_step": 9000, "best_metric": 0.2908235294117647, "best_model_checkpoint": "/content/drive/MyDrive/Model-Finetuning/wav2vec2/model/nbl_wav2vec2/checkpoint-9000", "epoch": 10.0, "eval_steps": 500, "global_step": 9380, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.5333333333333333, "grad_norm": 2.6857900619506836, "learning_rate": 0.00029939999999999996, "loss": 5.2283, "step": 500 }, { "epoch": 0.5333333333333333, "eval_loss": 2.025707721710205, "eval_runtime": 148.4202, "eval_samples_per_second": 20.213, "eval_steps_per_second": 2.527, "eval_wer": 1.0111372549019608, "step": 500 }, { "epoch": 1.0661333333333334, "grad_norm": 1.386874794960022, "learning_rate": 0.0002831418918918919, "loss": 0.9713, "step": 1000 }, { "epoch": 1.0661333333333334, "eval_loss": 0.5391530394554138, "eval_runtime": 148.3623, "eval_samples_per_second": 20.221, "eval_steps_per_second": 2.528, "eval_wer": 0.6509019607843137, "step": 1000 }, { "epoch": 1.5994666666666668, "grad_norm": 2.7049543857574463, "learning_rate": 0.00026624999999999994, "loss": 0.6379, "step": 1500 }, { "epoch": 1.5994666666666668, "eval_loss": 0.42855554819107056, "eval_runtime": 148.347, "eval_samples_per_second": 20.223, "eval_steps_per_second": 2.528, "eval_wer": 0.5332549019607843, "step": 1500 }, { "epoch": 2.1322666666666668, "grad_norm": 1.8714250326156616, "learning_rate": 0.00024935810810810806, "loss": 0.5595, "step": 2000 }, { "epoch": 2.1322666666666668, "eval_loss": 0.39198794960975647, "eval_runtime": 149.3713, "eval_samples_per_second": 20.084, "eval_steps_per_second": 2.511, "eval_wer": 0.5109803921568628, "step": 2000 }, { "epoch": 2.6656, "grad_norm": 1.8362187147140503, "learning_rate": 0.0002324662162162162, "loss": 0.4807, "step": 2500 }, { "epoch": 2.6656, "eval_loss": 0.3563985228538513, "eval_runtime": 149.1684, "eval_samples_per_second": 20.112, "eval_steps_per_second": 2.514, "eval_wer": 0.46658823529411764, "step": 2500 }, { "epoch": 3.1984, "grad_norm": 1.0880553722381592, "learning_rate": 0.00021557432432432432, "loss": 0.4404, "step": 3000 }, { "epoch": 3.1984, "eval_loss": 0.3388464152812958, "eval_runtime": 149.8437, "eval_samples_per_second": 20.021, "eval_steps_per_second": 2.503, "eval_wer": 0.42486274509803923, "step": 3000 }, { "epoch": 3.7317333333333336, "grad_norm": 10.404922485351562, "learning_rate": 0.00019868243243243244, "loss": 0.4022, "step": 3500 }, { "epoch": 3.7317333333333336, "eval_loss": 0.3252636194229126, "eval_runtime": 150.8413, "eval_samples_per_second": 19.888, "eval_steps_per_second": 2.486, "eval_wer": 0.4043921568627451, "step": 3500 }, { "epoch": 4.2645333333333335, "grad_norm": 4.443390846252441, "learning_rate": 0.0001817905405405405, "loss": 0.3754, "step": 4000 }, { "epoch": 4.2645333333333335, "eval_loss": 0.3209179937839508, "eval_runtime": 150.4901, "eval_samples_per_second": 19.935, "eval_steps_per_second": 2.492, "eval_wer": 0.4051764705882353, "step": 4000 }, { "epoch": 4.797866666666667, "grad_norm": 1.9804564714431763, "learning_rate": 0.00016489864864864862, "loss": 0.3379, "step": 4500 }, { "epoch": 4.797866666666667, "eval_loss": 0.30479735136032104, "eval_runtime": 149.6398, "eval_samples_per_second": 20.048, "eval_steps_per_second": 2.506, "eval_wer": 0.3894901960784314, "step": 4500 }, { "epoch": 5.330666666666667, "grad_norm": 1.1342227458953857, "learning_rate": 0.00014800675675675674, "loss": 0.3184, "step": 5000 }, { "epoch": 5.330666666666667, "eval_loss": 0.28083688020706177, "eval_runtime": 150.4194, "eval_samples_per_second": 19.944, "eval_steps_per_second": 2.493, "eval_wer": 0.3618823529411765, "step": 5000 }, { "epoch": 5.864, "grad_norm": 0.6732638478279114, "learning_rate": 0.00013111486486486486, "loss": 0.3003, "step": 5500 }, { "epoch": 5.864, "eval_loss": 0.27100080251693726, "eval_runtime": 150.5926, "eval_samples_per_second": 19.921, "eval_steps_per_second": 2.49, "eval_wer": 0.3436078431372549, "step": 5500 }, { "epoch": 6.3968, "grad_norm": 4.13991117477417, "learning_rate": 0.00011422297297297297, "loss": 0.264, "step": 6000 }, { "epoch": 6.3968, "eval_loss": 0.264404833316803, "eval_runtime": 151.1359, "eval_samples_per_second": 19.85, "eval_steps_per_second": 2.481, "eval_wer": 0.33356862745098037, "step": 6000 }, { "epoch": 6.930133333333333, "grad_norm": 3.0504963397979736, "learning_rate": 9.733108108108107e-05, "loss": 0.2574, "step": 6500 }, { "epoch": 6.930133333333333, "eval_loss": 0.24905848503112793, "eval_runtime": 151.2904, "eval_samples_per_second": 19.829, "eval_steps_per_second": 2.479, "eval_wer": 0.3235294117647059, "step": 6500 }, { "epoch": 7.462933333333333, "grad_norm": 1.2022693157196045, "learning_rate": 8.043918918918918e-05, "loss": 0.2319, "step": 7000 }, { "epoch": 7.462933333333333, "eval_loss": 0.26013123989105225, "eval_runtime": 150.0311, "eval_samples_per_second": 19.996, "eval_steps_per_second": 2.499, "eval_wer": 0.31301960784313726, "step": 7000 }, { "epoch": 7.996266666666667, "grad_norm": 0.9905935525894165, "learning_rate": 6.354729729729729e-05, "loss": 0.2194, "step": 7500 }, { "epoch": 7.996266666666667, "eval_loss": 0.24855607748031616, "eval_runtime": 151.4319, "eval_samples_per_second": 19.811, "eval_steps_per_second": 2.476, "eval_wer": 0.3060392156862745, "step": 7500 }, { "epoch": 8.529066666666667, "grad_norm": 1.2119730710983276, "learning_rate": 4.66554054054054e-05, "loss": 0.1958, "step": 8000 }, { "epoch": 8.529066666666667, "eval_loss": 0.24899743497371674, "eval_runtime": 151.042, "eval_samples_per_second": 19.862, "eval_steps_per_second": 2.483, "eval_wer": 0.30227450980392156, "step": 8000 }, { "epoch": 9.061866666666667, "grad_norm": 0.6335813999176025, "learning_rate": 2.976351351351351e-05, "loss": 0.1912, "step": 8500 }, { "epoch": 9.061866666666667, "eval_loss": 0.23850028216838837, "eval_runtime": 152.7072, "eval_samples_per_second": 19.645, "eval_steps_per_second": 2.456, "eval_wer": 0.2931764705882353, "step": 8500 }, { "epoch": 9.5952, "grad_norm": 2.9868931770324707, "learning_rate": 1.287162162162162e-05, "loss": 0.1749, "step": 9000 }, { "epoch": 9.5952, "eval_loss": 0.2415107637643814, "eval_runtime": 150.7897, "eval_samples_per_second": 19.895, "eval_steps_per_second": 2.487, "eval_wer": 0.2908235294117647, "step": 9000 } ], "logging_steps": 500, "max_steps": 9380, "num_input_tokens_seen": 0, "num_train_epochs": 10, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.270554818805736e+19, "train_batch_size": 8, "trial_name": null, "trial_params": null }