{ "best_global_step": 4200, "best_metric": 0.27899159663865547, "best_model_checkpoint": "/content/drive/MyDrive/Model-Finetuning/wav2vec2/model/ssw_wav2vec2/checkpoint-4200", "epoch": 9.0, "eval_steps": 200, "global_step": 4221, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.42643923240938164, "eval_loss": 3.127868413925171, "eval_runtime": 142.7527, "eval_samples_per_second": 21.015, "eval_steps_per_second": 2.627, "eval_wer": 1.0, "step": 200 }, { "epoch": 0.8528784648187633, "grad_norm": 0.9250941276550293, "learning_rate": 0.0002394, "loss": 6.4279, "step": 400 }, { "epoch": 0.8528784648187633, "eval_loss": 3.041430950164795, "eval_runtime": 139.9604, "eval_samples_per_second": 21.435, "eval_steps_per_second": 2.679, "eval_wer": 1.0, "step": 400 }, { "epoch": 1.279317697228145, "eval_loss": 0.7837706804275513, "eval_runtime": 142.266, "eval_samples_per_second": 21.087, "eval_steps_per_second": 2.636, "eval_wer": 0.8429013710747457, "step": 600 }, { "epoch": 1.7057569296375266, "grad_norm": 1.504073977470398, "learning_rate": 0.00027589357699543134, "loss": 1.5163, "step": 800 }, { "epoch": 1.7057569296375266, "eval_loss": 0.43869534134864807, "eval_runtime": 142.8144, "eval_samples_per_second": 21.006, "eval_steps_per_second": 2.626, "eval_wer": 0.572578505086245, "step": 800 }, { "epoch": 2.1321961620469083, "eval_loss": 0.3610222041606903, "eval_runtime": 142.7562, "eval_samples_per_second": 21.015, "eval_steps_per_second": 2.627, "eval_wer": 0.49570986289252544, "step": 1000 }, { "epoch": 2.55863539445629, "grad_norm": 0.7447084784507751, "learning_rate": 0.00024364418167159365, "loss": 0.5075, "step": 1200 }, { "epoch": 2.55863539445629, "eval_loss": 0.31982430815696716, "eval_runtime": 143.4945, "eval_samples_per_second": 20.907, "eval_steps_per_second": 2.613, "eval_wer": 0.443343653250774, "step": 1200 }, { "epoch": 2.9850746268656714, "eval_loss": 0.3008059561252594, "eval_runtime": 143.8433, "eval_samples_per_second": 20.856, "eval_steps_per_second": 2.607, "eval_wer": 0.4136222910216718, "step": 1400 }, { "epoch": 3.411513859275053, "grad_norm": 1.511812448501587, "learning_rate": 0.00021139478634775596, "loss": 0.3842, "step": 1600 }, { "epoch": 3.411513859275053, "eval_loss": 0.28225278854370117, "eval_runtime": 143.5383, "eval_samples_per_second": 20.9, "eval_steps_per_second": 2.613, "eval_wer": 0.3946926138876603, "step": 1600 }, { "epoch": 3.837953091684435, "eval_loss": 0.2640756368637085, "eval_runtime": 143.3526, "eval_samples_per_second": 20.927, "eval_steps_per_second": 2.616, "eval_wer": 0.3823971693940734, "step": 1800 }, { "epoch": 4.264392324093817, "grad_norm": 0.5882211327552795, "learning_rate": 0.0001791453910239183, "loss": 0.3314, "step": 2000 }, { "epoch": 4.264392324093817, "eval_loss": 0.25088655948638916, "eval_runtime": 142.3146, "eval_samples_per_second": 21.08, "eval_steps_per_second": 2.635, "eval_wer": 0.36134453781512604, "step": 2000 }, { "epoch": 4.690831556503198, "eval_loss": 0.23431462049484253, "eval_runtime": 143.7921, "eval_samples_per_second": 20.863, "eval_steps_per_second": 2.608, "eval_wer": 0.3430340557275542, "step": 2200 }, { "epoch": 5.11727078891258, "grad_norm": 0.9549380540847778, "learning_rate": 0.00014689599570008062, "loss": 0.2881, "step": 2400 }, { "epoch": 5.11727078891258, "eval_loss": 0.238094761967659, "eval_runtime": 144.6143, "eval_samples_per_second": 20.745, "eval_steps_per_second": 2.593, "eval_wer": 0.3442724458204334, "step": 2400 }, { "epoch": 5.543710021321962, "eval_loss": 0.23333857953548431, "eval_runtime": 145.5196, "eval_samples_per_second": 20.616, "eval_steps_per_second": 2.577, "eval_wer": 0.32596196373286157, "step": 2600 }, { "epoch": 5.970149253731344, "grad_norm": 0.9989615678787231, "learning_rate": 0.00011464660037624293, "loss": 0.254, "step": 2800 }, { "epoch": 5.970149253731344, "eval_loss": 0.21401432156562805, "eval_runtime": 145.1881, "eval_samples_per_second": 20.663, "eval_steps_per_second": 2.583, "eval_wer": 0.3229544449358691, "step": 2800 }, { "epoch": 6.396588486140725, "eval_loss": 0.2184174358844757, "eval_runtime": 144.6886, "eval_samples_per_second": 20.734, "eval_steps_per_second": 2.592, "eval_wer": 0.3101282618310482, "step": 3000 }, { "epoch": 6.823027718550106, "grad_norm": 1.2803609371185303, "learning_rate": 8.239720505240526e-05, "loss": 0.2216, "step": 3200 }, { "epoch": 6.823027718550106, "eval_loss": 0.20931990444660187, "eval_runtime": 147.2603, "eval_samples_per_second": 20.372, "eval_steps_per_second": 2.547, "eval_wer": 0.2998673153471915, "step": 3200 }, { "epoch": 7.249466950959488, "eval_loss": 0.2027914673089981, "eval_runtime": 147.0408, "eval_samples_per_second": 20.403, "eval_steps_per_second": 2.55, "eval_wer": 0.2978328173374613, "step": 3400 }, { "epoch": 7.67590618336887, "grad_norm": 0.5627148151397705, "learning_rate": 5.014780972856759e-05, "loss": 0.2088, "step": 3600 }, { "epoch": 7.67590618336887, "eval_loss": 0.20001129806041718, "eval_runtime": 147.1699, "eval_samples_per_second": 20.385, "eval_steps_per_second": 2.548, "eval_wer": 0.28907563025210087, "step": 3600 }, { "epoch": 8.102345415778252, "eval_loss": 0.20037885010242462, "eval_runtime": 147.1466, "eval_samples_per_second": 20.388, "eval_steps_per_second": 2.548, "eval_wer": 0.2854489164086687, "step": 3800 }, { "epoch": 8.528784648187633, "grad_norm": 1.2863858938217163, "learning_rate": 1.789841440472991e-05, "loss": 0.181, "step": 4000 }, { "epoch": 8.528784648187633, "eval_loss": 0.1965806633234024, "eval_runtime": 146.72, "eval_samples_per_second": 20.447, "eval_steps_per_second": 2.556, "eval_wer": 0.2815568332596196, "step": 4000 }, { "epoch": 8.955223880597014, "eval_loss": 0.19471502304077148, "eval_runtime": 146.2668, "eval_samples_per_second": 20.51, "eval_steps_per_second": 2.564, "eval_wer": 0.27899159663865547, "step": 4200 } ], "logging_steps": 400, "max_steps": 4221, "num_input_tokens_seen": 0, "num_train_epochs": 9, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.0631810349421126e+19, "train_batch_size": 16, "trial_name": null, "trial_params": null }