w2v-Morisyen / trainer_state.json
eleferrand's picture
Upload folder using huggingface_hub
e565b52 verified
{
"best_metric": 0.4995602462620932,
"best_model_checkpoint": "/scratch/leferran/model_computel/Morisyen_xlsr53_2phase_mapped_French/checkpoint-830",
"epoch": 10.0,
"global_step": 830,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_loss": 0.7071983218193054,
"eval_runtime": 0.6963,
"eval_samples_per_second": 231.238,
"eval_steps_per_second": 30.162,
"eval_wer": 0.6086191732629728,
"step": 83
},
{
"epoch": 2.0,
"eval_loss": 0.6636466383934021,
"eval_runtime": 0.6661,
"eval_samples_per_second": 241.713,
"eval_steps_per_second": 31.528,
"eval_wer": 0.5593667546174143,
"step": 166
},
{
"epoch": 3.0,
"eval_loss": 0.7175659537315369,
"eval_runtime": 0.6672,
"eval_samples_per_second": 241.298,
"eval_steps_per_second": 31.474,
"eval_wer": 0.5461741424802111,
"step": 249
},
{
"epoch": 4.0,
"eval_loss": 0.7306005954742432,
"eval_runtime": 0.6669,
"eval_samples_per_second": 241.429,
"eval_steps_per_second": 31.491,
"eval_wer": 0.5285839929639402,
"step": 332
},
{
"epoch": 5.0,
"eval_loss": 0.7698836326599121,
"eval_runtime": 0.6667,
"eval_samples_per_second": 241.506,
"eval_steps_per_second": 31.501,
"eval_wer": 0.5461741424802111,
"step": 415
},
{
"epoch": 6.0,
"eval_loss": 0.7805858254432678,
"eval_runtime": 0.6659,
"eval_samples_per_second": 241.763,
"eval_steps_per_second": 31.534,
"eval_wer": 0.5576077396657871,
"step": 498
},
{
"epoch": 6.02,
"learning_rate": 0.00023987951807228914,
"loss": 0.6806,
"step": 500
},
{
"epoch": 7.0,
"eval_loss": 0.8358508944511414,
"eval_runtime": 0.668,
"eval_samples_per_second": 241.027,
"eval_steps_per_second": 31.438,
"eval_wer": 0.5417766051011433,
"step": 581
},
{
"epoch": 8.0,
"eval_loss": 0.9229233860969543,
"eval_runtime": 0.6689,
"eval_samples_per_second": 240.71,
"eval_steps_per_second": 31.397,
"eval_wer": 0.5408970976253298,
"step": 664
},
{
"epoch": 9.0,
"eval_loss": 0.9406667947769165,
"eval_runtime": 0.6681,
"eval_samples_per_second": 240.977,
"eval_steps_per_second": 31.432,
"eval_wer": 0.5074758135444152,
"step": 747
},
{
"epoch": 10.0,
"eval_loss": 0.9393610954284668,
"eval_runtime": 0.6679,
"eval_samples_per_second": 241.051,
"eval_steps_per_second": 31.441,
"eval_wer": 0.4995602462620932,
"step": 830
}
],
"max_steps": 2490,
"num_train_epochs": 30,
"total_flos": 3.21639689183166e+18,
"trial_name": null,
"trial_params": null
}