add_BERT_24_mrpc / trainer_state.json
gokuls's picture
End of training
fef580f
{
"best_metric": 0.584678053855896,
"best_model_checkpoint": "add_BERT_24_mrpc/checkpoint-29",
"epoch": 6.0,
"global_step": 174,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 3.9200000000000004e-05,
"loss": 0.6554,
"step": 29
},
{
"epoch": 1.0,
"eval_accuracy": 0.7009803921568627,
"eval_combined_score": 0.7572180248246088,
"eval_f1": 0.8134556574923548,
"eval_loss": 0.584678053855896,
"eval_runtime": 0.7789,
"eval_samples_per_second": 523.804,
"eval_steps_per_second": 5.135,
"step": 29
},
{
"epoch": 2.0,
"learning_rate": 3.8400000000000005e-05,
"loss": 0.6027,
"step": 58
},
{
"epoch": 2.0,
"eval_accuracy": 0.6985294117647058,
"eval_combined_score": 0.7567835028748342,
"eval_f1": 0.8150375939849624,
"eval_loss": 0.592502772808075,
"eval_runtime": 0.7816,
"eval_samples_per_second": 522.024,
"eval_steps_per_second": 5.118,
"step": 58
},
{
"epoch": 3.0,
"learning_rate": 3.76e-05,
"loss": 0.5423,
"step": 87
},
{
"epoch": 3.0,
"eval_accuracy": 0.6887254901960784,
"eval_combined_score": 0.7468205023945063,
"eval_f1": 0.804915514592934,
"eval_loss": 0.6009986996650696,
"eval_runtime": 0.7825,
"eval_samples_per_second": 521.386,
"eval_steps_per_second": 5.112,
"step": 87
},
{
"epoch": 4.0,
"learning_rate": 3.680000000000001e-05,
"loss": 0.4401,
"step": 116
},
{
"epoch": 4.0,
"eval_accuracy": 0.696078431372549,
"eval_combined_score": 0.7505549389567148,
"eval_f1": 0.8050314465408805,
"eval_loss": 0.6617496609687805,
"eval_runtime": 0.7798,
"eval_samples_per_second": 523.205,
"eval_steps_per_second": 5.129,
"step": 116
},
{
"epoch": 5.0,
"learning_rate": 3.6e-05,
"loss": 0.2731,
"step": 145
},
{
"epoch": 5.0,
"eval_accuracy": 0.6348039215686274,
"eval_combined_score": 0.674954542046264,
"eval_f1": 0.7151051625239007,
"eval_loss": 0.9531154036521912,
"eval_runtime": 0.7861,
"eval_samples_per_second": 519.042,
"eval_steps_per_second": 5.089,
"step": 145
},
{
"epoch": 6.0,
"learning_rate": 3.52e-05,
"loss": 0.16,
"step": 174
},
{
"epoch": 6.0,
"eval_accuracy": 0.6985294117647058,
"eval_combined_score": 0.7514904610492845,
"eval_f1": 0.8044515103338632,
"eval_loss": 1.0282580852508545,
"eval_runtime": 0.7848,
"eval_samples_per_second": 519.861,
"eval_steps_per_second": 5.097,
"step": 174
},
{
"epoch": 6.0,
"step": 174,
"total_flos": 3143269802311680.0,
"train_loss": 0.44560779374221277,
"train_runtime": 154.5382,
"train_samples_per_second": 1186.762,
"train_steps_per_second": 9.383
}
],
"max_steps": 1450,
"num_train_epochs": 50,
"total_flos": 3143269802311680.0,
"trial_name": null,
"trial_params": null
}