grammar-anarchist's picture
Upload trainer_state.json with huggingface_hub
2e50a9c
{
"best_metric": 0.27009761333465576,
"best_model_checkpoint": "./models/results_semeval_2021_task_7_47/checkpoint-125",
"epoch": 1.0,
"global_step": 125,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.06,
"learning_rate": 4.000000000000001e-06,
"loss": 0.6826,
"step": 8
},
{
"epoch": 0.13,
"learning_rate": 8.000000000000001e-06,
"loss": 0.6743,
"step": 16
},
{
"epoch": 0.19,
"learning_rate": 1.2e-05,
"loss": 0.6628,
"step": 24
},
{
"epoch": 0.2,
"eval_accuracy": 0.632,
"eval_f1": 0.7745098039215685,
"eval_loss": 0.6330053806304932,
"eval_precision": 0.632,
"eval_recall": 1.0,
"eval_runtime": 5.3505,
"eval_samples_per_second": 186.899,
"eval_steps_per_second": 23.362,
"step": 25
},
{
"epoch": 0.26,
"learning_rate": 1.55e-05,
"loss": 0.6508,
"step": 32
},
{
"epoch": 0.32,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.6273,
"step": 40
},
{
"epoch": 0.38,
"learning_rate": 2.35e-05,
"loss": 0.4721,
"step": 48
},
{
"epoch": 0.4,
"eval_accuracy": 0.866,
"eval_f1": 0.8962848297213623,
"eval_loss": 0.34409669041633606,
"eval_precision": 0.8772727272727273,
"eval_recall": 0.9161392405063291,
"eval_runtime": 5.3938,
"eval_samples_per_second": 185.399,
"eval_steps_per_second": 23.175,
"step": 50
},
{
"epoch": 0.45,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.3121,
"step": 56
},
{
"epoch": 0.51,
"learning_rate": 3.15e-05,
"loss": 0.3055,
"step": 64
},
{
"epoch": 0.58,
"learning_rate": 3.55e-05,
"loss": 0.2453,
"step": 72
},
{
"epoch": 0.6,
"eval_accuracy": 0.88,
"eval_f1": 0.904153354632588,
"eval_loss": 0.28931811451911926,
"eval_precision": 0.9129032258064517,
"eval_recall": 0.8955696202531646,
"eval_runtime": 5.3384,
"eval_samples_per_second": 187.324,
"eval_steps_per_second": 23.415,
"step": 75
},
{
"epoch": 0.64,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.1981,
"step": 80
},
{
"epoch": 0.7,
"learning_rate": 4.35e-05,
"loss": 0.2172,
"step": 88
},
{
"epoch": 0.77,
"learning_rate": 4.75e-05,
"loss": 0.1548,
"step": 96
},
{
"epoch": 0.8,
"eval_accuracy": 0.886,
"eval_f1": 0.9053156146179402,
"eval_loss": 0.2869994044303894,
"eval_precision": 0.9527972027972028,
"eval_recall": 0.8623417721518988,
"eval_runtime": 5.3401,
"eval_samples_per_second": 187.263,
"eval_steps_per_second": 23.408,
"step": 100
},
{
"epoch": 0.83,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1933,
"step": 104
},
{
"epoch": 0.9,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.1873,
"step": 112
},
{
"epoch": 0.96,
"learning_rate": 1.2e-05,
"loss": 0.184,
"step": 120
},
{
"epoch": 1.0,
"eval_accuracy": 0.897,
"eval_f1": 0.9203402938901779,
"eval_loss": 0.27009761333465576,
"eval_precision": 0.9001512859304085,
"eval_recall": 0.9414556962025317,
"eval_runtime": 5.3512,
"eval_samples_per_second": 186.874,
"eval_steps_per_second": 23.359,
"step": 125
}
],
"max_steps": 125,
"num_train_epochs": 1,
"total_flos": 546777661920000.0,
"trial_name": null,
"trial_params": null
}