| { | |
| "best_global_step": 9000, | |
| "best_metric": 0.3495483628152051, | |
| "best_model_checkpoint": "/content/drive/MyDrive/Model-Finetuning/wav2vec2/model/zu_wav2vec2/checkpoint-9000", | |
| "epoch": 10.0, | |
| "eval_steps": 500, | |
| "global_step": 9380, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.5333333333333333, | |
| "grad_norm": 2.2490434646606445, | |
| "learning_rate": 0.00029939999999999996, | |
| "loss": 5.3513, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.5333333333333333, | |
| "eval_loss": 3.067410707473755, | |
| "eval_runtime": 142.738, | |
| "eval_samples_per_second": 21.018, | |
| "eval_steps_per_second": 2.627, | |
| "eval_wer": 1.0, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 1.0661333333333334, | |
| "grad_norm": 1.0280228853225708, | |
| "learning_rate": 0.0002831418918918919, | |
| "loss": 2.4793, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 1.0661333333333334, | |
| "eval_loss": 1.1224186420440674, | |
| "eval_runtime": 144.1294, | |
| "eval_samples_per_second": 20.815, | |
| "eval_steps_per_second": 2.602, | |
| "eval_wer": 0.992002258185924, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 1.5994666666666668, | |
| "grad_norm": 1.6041176319122314, | |
| "learning_rate": 0.00026624999999999994, | |
| "loss": 0.9637, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 1.5994666666666668, | |
| "eval_loss": 0.6741820573806763, | |
| "eval_runtime": 143.9596, | |
| "eval_samples_per_second": 20.839, | |
| "eval_steps_per_second": 2.605, | |
| "eval_wer": 0.7161272111403839, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 2.1322666666666668, | |
| "grad_norm": 1.4150700569152832, | |
| "learning_rate": 0.00024935810810810806, | |
| "loss": 0.717, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 2.1322666666666668, | |
| "eval_loss": 0.5053547620773315, | |
| "eval_runtime": 145.0264, | |
| "eval_samples_per_second": 20.686, | |
| "eval_steps_per_second": 2.586, | |
| "eval_wer": 0.620530673692134, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 2.6656, | |
| "grad_norm": 1.3749128580093384, | |
| "learning_rate": 0.0002324662162162162, | |
| "loss": 0.5979, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 2.6656, | |
| "eval_loss": 0.4564489424228668, | |
| "eval_runtime": 145.9072, | |
| "eval_samples_per_second": 20.561, | |
| "eval_steps_per_second": 2.57, | |
| "eval_wer": 0.5550432818968761, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 3.1984, | |
| "grad_norm": 1.1167936325073242, | |
| "learning_rate": 0.00021557432432432432, | |
| "loss": 0.5388, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 3.1984, | |
| "eval_loss": 0.4222851097583771, | |
| "eval_runtime": 146.8407, | |
| "eval_samples_per_second": 20.43, | |
| "eval_steps_per_second": 2.554, | |
| "eval_wer": 0.5333082423786225, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 3.7317333333333336, | |
| "grad_norm": 1.713294267654419, | |
| "learning_rate": 0.00019868243243243244, | |
| "loss": 0.4762, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 3.7317333333333336, | |
| "eval_loss": 0.3905419409275055, | |
| "eval_runtime": 146.5994, | |
| "eval_samples_per_second": 20.464, | |
| "eval_steps_per_second": 2.558, | |
| "eval_wer": 0.4974595408355288, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 4.2645333333333335, | |
| "grad_norm": 2.082676887512207, | |
| "learning_rate": 0.0001817905405405405, | |
| "loss": 0.4398, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 4.2645333333333335, | |
| "eval_loss": 0.3778238892555237, | |
| "eval_runtime": 145.863, | |
| "eval_samples_per_second": 20.567, | |
| "eval_steps_per_second": 2.571, | |
| "eval_wer": 0.48692133985698155, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 4.797866666666667, | |
| "grad_norm": 2.2089028358459473, | |
| "learning_rate": 0.00016489864864864862, | |
| "loss": 0.4098, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 4.797866666666667, | |
| "eval_loss": 0.35478344559669495, | |
| "eval_runtime": 146.045, | |
| "eval_samples_per_second": 20.542, | |
| "eval_steps_per_second": 2.568, | |
| "eval_wer": 0.4574708317651487, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 5.330666666666667, | |
| "grad_norm": 1.058657169342041, | |
| "learning_rate": 0.00014800675675675674, | |
| "loss": 0.3823, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 5.330666666666667, | |
| "eval_loss": 0.3355245292186737, | |
| "eval_runtime": 145.8678, | |
| "eval_samples_per_second": 20.567, | |
| "eval_steps_per_second": 2.571, | |
| "eval_wer": 0.45079036507339104, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 5.864, | |
| "grad_norm": 1.4570820331573486, | |
| "learning_rate": 0.00013111486486486486, | |
| "loss": 0.3513, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 5.864, | |
| "eval_loss": 0.32364729046821594, | |
| "eval_runtime": 147.2305, | |
| "eval_samples_per_second": 20.376, | |
| "eval_steps_per_second": 2.547, | |
| "eval_wer": 0.4314076025592774, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 6.3968, | |
| "grad_norm": 2.4523627758026123, | |
| "learning_rate": 0.00011422297297297297, | |
| "loss": 0.3111, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 6.3968, | |
| "eval_loss": 0.3129761517047882, | |
| "eval_runtime": 146.9224, | |
| "eval_samples_per_second": 20.419, | |
| "eval_steps_per_second": 2.552, | |
| "eval_wer": 0.4113662024840045, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 6.930133333333333, | |
| "grad_norm": 1.3307918310165405, | |
| "learning_rate": 9.733108108108107e-05, | |
| "loss": 0.3032, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 6.930133333333333, | |
| "eval_loss": 0.301826536655426, | |
| "eval_runtime": 147.6721, | |
| "eval_samples_per_second": 20.315, | |
| "eval_steps_per_second": 2.539, | |
| "eval_wer": 0.4039330071509221, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 7.462933333333333, | |
| "grad_norm": 1.828587532043457, | |
| "learning_rate": 8.043918918918918e-05, | |
| "loss": 0.2698, | |
| "step": 7000 | |
| }, | |
| { | |
| "epoch": 7.462933333333333, | |
| "eval_loss": 0.29749611020088196, | |
| "eval_runtime": 146.8529, | |
| "eval_samples_per_second": 20.429, | |
| "eval_steps_per_second": 2.554, | |
| "eval_wer": 0.3873729770417764, | |
| "step": 7000 | |
| }, | |
| { | |
| "epoch": 7.996266666666667, | |
| "grad_norm": 1.7805229425430298, | |
| "learning_rate": 6.354729729729729e-05, | |
| "loss": 0.2661, | |
| "step": 7500 | |
| }, | |
| { | |
| "epoch": 7.996266666666667, | |
| "eval_loss": 0.2899162769317627, | |
| "eval_runtime": 147.9735, | |
| "eval_samples_per_second": 20.274, | |
| "eval_steps_per_second": 2.534, | |
| "eval_wer": 0.3744824990590892, | |
| "step": 7500 | |
| }, | |
| { | |
| "epoch": 8.529066666666667, | |
| "grad_norm": 1.059174656867981, | |
| "learning_rate": 4.66554054054054e-05, | |
| "loss": 0.233, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 8.529066666666667, | |
| "eval_loss": 0.2895633280277252, | |
| "eval_runtime": 147.1645, | |
| "eval_samples_per_second": 20.385, | |
| "eval_steps_per_second": 2.548, | |
| "eval_wer": 0.36356793375987956, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 9.061866666666667, | |
| "grad_norm": 0.938797116279602, | |
| "learning_rate": 2.976351351351351e-05, | |
| "loss": 0.2336, | |
| "step": 8500 | |
| }, | |
| { | |
| "epoch": 9.061866666666667, | |
| "eval_loss": 0.2831208407878876, | |
| "eval_runtime": 147.624, | |
| "eval_samples_per_second": 20.322, | |
| "eval_steps_per_second": 2.54, | |
| "eval_wer": 0.35641701166729395, | |
| "step": 8500 | |
| }, | |
| { | |
| "epoch": 9.5952, | |
| "grad_norm": 6.92275333404541, | |
| "learning_rate": 1.287162162162162e-05, | |
| "loss": 0.2137, | |
| "step": 9000 | |
| }, | |
| { | |
| "epoch": 9.5952, | |
| "eval_loss": 0.27855604887008667, | |
| "eval_runtime": 146.2994, | |
| "eval_samples_per_second": 20.506, | |
| "eval_steps_per_second": 2.563, | |
| "eval_wer": 0.3495483628152051, | |
| "step": 9000 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 9380, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 10, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": true | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 2.167851661799376e+19, | |
| "train_batch_size": 8, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |