devvanshhh's picture
Training in progress, epoch 5, checkpoint
d95e6cf
{
"best_metric": 0.3688497543334961,
"best_model_checkpoint": "flanT5-description-generation/checkpoint-495",
"epoch": 5.0,
"eval_steps": 500,
"global_step": 495,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_gen_len": 2.4263959390862944,
"eval_loss": 3.9740889072418213,
"eval_rouge1": 7.1174,
"eval_rouge2": 6.3701,
"eval_rougeL": 6.7345,
"eval_rougeLsum": 6.7347,
"eval_runtime": 14.6896,
"eval_samples_per_second": 13.411,
"eval_steps_per_second": 1.702,
"step": 99
},
{
"epoch": 2.0,
"eval_gen_len": 2.6142131979695433,
"eval_loss": 1.633987307548523,
"eval_rouge1": 7.0189,
"eval_rouge2": 6.2738,
"eval_rougeL": 6.6359,
"eval_rougeLsum": 6.6379,
"eval_runtime": 16.099,
"eval_samples_per_second": 12.237,
"eval_steps_per_second": 1.553,
"step": 198
},
{
"epoch": 3.0,
"eval_gen_len": 3.0406091370558377,
"eval_loss": 0.7071468234062195,
"eval_rouge1": 6.887,
"eval_rouge2": 6.1128,
"eval_rougeL": 6.512,
"eval_rougeLsum": 6.515,
"eval_runtime": 12.3043,
"eval_samples_per_second": 16.011,
"eval_steps_per_second": 2.032,
"step": 297
},
{
"epoch": 4.0,
"eval_gen_len": 5.5786802030456855,
"eval_loss": 0.42786499857902527,
"eval_rouge1": 6.0645,
"eval_rouge2": 5.1995,
"eval_rougeL": 5.6723,
"eval_rougeLsum": 5.6926,
"eval_runtime": 16.8779,
"eval_samples_per_second": 11.672,
"eval_steps_per_second": 1.481,
"step": 396
},
{
"epoch": 5.0,
"eval_gen_len": 4.604060913705584,
"eval_loss": 0.3688497543334961,
"eval_rouge1": 6.3055,
"eval_rouge2": 5.5351,
"eval_rougeL": 5.9301,
"eval_rougeLsum": 5.9371,
"eval_runtime": 15.2339,
"eval_samples_per_second": 12.932,
"eval_steps_per_second": 1.641,
"step": 495
}
],
"logging_steps": 500,
"max_steps": 495,
"num_train_epochs": 5,
"save_steps": 500,
"total_flos": 731479136010240.0,
"trial_name": null,
"trial_params": null
}