model3FromWav2vec / checkpoint-2400 /trainer_state.json
fkHug's picture
Update from
6566740
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 30.0,
"global_step": 2400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 5.0,
"learning_rate": 8e-05,
"loss": 9.4971,
"step": 400
},
{
"epoch": 5.0,
"eval_loss": 3.1448328495025635,
"eval_runtime": 45.2941,
"eval_samples_per_second": 14.13,
"eval_wer": 1.0,
"step": 400
},
{
"epoch": 10.0,
"learning_rate": 8.421052631578948e-05,
"loss": 2.4507,
"step": 800
},
{
"epoch": 10.0,
"eval_loss": 1.3176685571670532,
"eval_runtime": 45.3981,
"eval_samples_per_second": 14.098,
"eval_wer": 1.029591836734694,
"step": 800
},
{
"epoch": 15.0,
"learning_rate": 6.31578947368421e-05,
"loss": 0.6394,
"step": 1200
},
{
"epoch": 15.0,
"eval_loss": 1.0083409547805786,
"eval_runtime": 45.4018,
"eval_samples_per_second": 14.096,
"eval_wer": 0.7188775510204082,
"step": 1200
},
{
"epoch": 20.0,
"learning_rate": 4.210526315789474e-05,
"loss": 0.3395,
"step": 1600
},
{
"epoch": 20.0,
"eval_loss": 1.0249711275100708,
"eval_runtime": 45.9714,
"eval_samples_per_second": 13.922,
"eval_wer": 0.6642857142857143,
"step": 1600
},
{
"epoch": 25.0,
"learning_rate": 2.105263157894737e-05,
"loss": 0.2434,
"step": 2000
},
{
"epoch": 25.0,
"eval_loss": 1.1575790643692017,
"eval_runtime": 46.2674,
"eval_samples_per_second": 13.833,
"eval_wer": 0.6357142857142857,
"step": 2000
},
{
"epoch": 30.0,
"learning_rate": 0.0,
"loss": 0.2048,
"step": 2400
},
{
"epoch": 30.0,
"eval_loss": 1.2169420719146729,
"eval_runtime": 49.8509,
"eval_samples_per_second": 12.838,
"eval_wer": 0.625,
"step": 2400
}
],
"max_steps": 2400,
"num_train_epochs": 30,
"total_flos": 7.003249081477079e+18,
"trial_name": null,
"trial_params": null
}