grammar-anarchist's picture
Upload trainer_state.json with huggingface_hub
f5037fc
{
"best_metric": 0.2773796319961548,
"best_model_checkpoint": "./models/results_semeval_2017_task_7_693/checkpoint-40",
"epoch": 0.9078014184397163,
"global_step": 40,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.11,
"eval_accuracy": 0.7047146401985112,
"eval_f1": 0.826783114992722,
"eval_loss": 0.5785936117172241,
"eval_precision": 0.7047146401985112,
"eval_recall": 1.0,
"eval_runtime": 2.1163,
"eval_samples_per_second": 190.428,
"eval_steps_per_second": 24.099,
"step": 5
},
{
"epoch": 0.18,
"learning_rate": 4.0909090909090915e-05,
"loss": 0.6121,
"step": 8
},
{
"epoch": 0.23,
"eval_accuracy": 0.7047146401985112,
"eval_f1": 0.826783114992722,
"eval_loss": 0.512681782245636,
"eval_precision": 0.7047146401985112,
"eval_recall": 1.0,
"eval_runtime": 2.1906,
"eval_samples_per_second": 183.972,
"eval_steps_per_second": 23.282,
"step": 10
},
{
"epoch": 0.34,
"eval_accuracy": 0.7047146401985112,
"eval_f1": 0.826783114992722,
"eval_loss": 0.41043248772621155,
"eval_precision": 0.7047146401985112,
"eval_recall": 1.0,
"eval_runtime": 2.1431,
"eval_samples_per_second": 188.049,
"eval_steps_per_second": 23.798,
"step": 15
},
{
"epoch": 0.36,
"learning_rate": 3.181818181818182e-05,
"loss": 0.5116,
"step": 16
},
{
"epoch": 0.45,
"eval_accuracy": 0.7568238213399504,
"eval_f1": 0.8515151515151514,
"eval_loss": 0.37497952580451965,
"eval_precision": 0.7473404255319149,
"eval_recall": 0.9894366197183099,
"eval_runtime": 2.1596,
"eval_samples_per_second": 186.61,
"eval_steps_per_second": 23.616,
"step": 20
},
{
"epoch": 0.54,
"learning_rate": 2.272727272727273e-05,
"loss": 0.3673,
"step": 24
},
{
"epoch": 0.57,
"eval_accuracy": 0.8883374689826302,
"eval_f1": 0.9189189189189191,
"eval_loss": 0.28403061628341675,
"eval_precision": 0.940959409594096,
"eval_recall": 0.897887323943662,
"eval_runtime": 2.1799,
"eval_samples_per_second": 184.873,
"eval_steps_per_second": 23.396,
"step": 25
},
{
"epoch": 0.68,
"eval_accuracy": 0.8957816377171216,
"eval_f1": 0.9275862068965517,
"eval_loss": 0.3391099274158478,
"eval_precision": 0.9087837837837838,
"eval_recall": 0.9471830985915493,
"eval_runtime": 2.1847,
"eval_samples_per_second": 184.465,
"eval_steps_per_second": 23.344,
"step": 30
},
{
"epoch": 0.73,
"learning_rate": 1.4772727272727274e-05,
"loss": 0.3116,
"step": 32
},
{
"epoch": 0.79,
"eval_accuracy": 0.890818858560794,
"eval_f1": 0.9230769230769231,
"eval_loss": 0.31251412630081177,
"eval_precision": 0.9166666666666666,
"eval_recall": 0.9295774647887324,
"eval_runtime": 2.1117,
"eval_samples_per_second": 190.845,
"eval_steps_per_second": 24.152,
"step": 35
},
{
"epoch": 0.91,
"learning_rate": 5.681818181818182e-06,
"loss": 0.2684,
"step": 40
},
{
"epoch": 0.91,
"eval_accuracy": 0.890818858560794,
"eval_f1": 0.9225352112676056,
"eval_loss": 0.2773796319961548,
"eval_precision": 0.9225352112676056,
"eval_recall": 0.9225352112676056,
"eval_runtime": 2.1762,
"eval_samples_per_second": 185.184,
"eval_steps_per_second": 23.435,
"step": 40
}
],
"max_steps": 44,
"num_train_epochs": 1,
"total_flos": 111822198528000.0,
"trial_name": null,
"trial_params": null
}