roberta-large-bne-finetuned-ner / trainer_state.json
josecannete's picture
adding model finetuned on NER
744886d
{
"best_metric": 0.24747222661972046,
"best_model_checkpoint": "/home/jcanete/ft-data/all_results/ner/roberta_large_bne/epochs_2_bs_16_lr_5e-5/checkpoint-1000",
"epoch": 2.0,
"global_step": 1042,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.19,
"eval_accuracy": 0.8513695074658768,
"eval_f1": 0.1648726699921239,
"eval_loss": 0.5836164951324463,
"eval_precision": 0.4988085782366958,
"eval_recall": 0.09875766629973266,
"eval_runtime": 3.7205,
"eval_samples_per_second": 514.978,
"eval_steps_per_second": 32.253,
"step": 100
},
{
"epoch": 0.38,
"eval_accuracy": 0.8838590491312712,
"eval_f1": 0.3543647363872084,
"eval_loss": 0.40415123105049133,
"eval_precision": 0.45510606808090776,
"eval_recall": 0.2901399591130681,
"eval_runtime": 3.5735,
"eval_samples_per_second": 536.167,
"eval_steps_per_second": 33.58,
"step": 200
},
{
"epoch": 0.58,
"eval_accuracy": 0.8917982228464991,
"eval_f1": 0.4051617172636281,
"eval_loss": 0.37282565236091614,
"eval_precision": 0.4273996509598604,
"eval_recall": 0.38512344708287466,
"eval_runtime": 3.5615,
"eval_samples_per_second": 537.975,
"eval_steps_per_second": 33.694,
"step": 300
},
{
"epoch": 0.77,
"eval_accuracy": 0.9021496839598155,
"eval_f1": 0.441752880814198,
"eval_loss": 0.3306070864200592,
"eval_precision": 0.47486437613019894,
"eval_recall": 0.4129580122660796,
"eval_runtime": 3.5725,
"eval_samples_per_second": 536.317,
"eval_steps_per_second": 33.59,
"step": 400
},
{
"epoch": 0.96,
"learning_rate": 2.6199616122840692e-05,
"loss": 0.3639,
"step": 500
},
{
"epoch": 0.96,
"eval_accuracy": 0.9098293077651226,
"eval_f1": 0.4915268248326031,
"eval_loss": 0.3107258975505829,
"eval_precision": 0.5181247821540607,
"eval_recall": 0.46752634061959425,
"eval_runtime": 3.5465,
"eval_samples_per_second": 540.25,
"eval_steps_per_second": 33.836,
"step": 500
},
{
"epoch": 1.15,
"eval_accuracy": 0.9191425692387554,
"eval_f1": 0.5334455195624738,
"eval_loss": 0.28400444984436035,
"eval_precision": 0.573651827723489,
"eval_recall": 0.49850605441107093,
"eval_runtime": 3.6566,
"eval_samples_per_second": 523.984,
"eval_steps_per_second": 32.817,
"step": 600
},
{
"epoch": 1.34,
"eval_accuracy": 0.9191273015969953,
"eval_f1": 0.5345680983554207,
"eval_loss": 0.27888885140419006,
"eval_precision": 0.5428895735365656,
"eval_recall": 0.5264978770246894,
"eval_runtime": 3.5531,
"eval_samples_per_second": 539.251,
"eval_steps_per_second": 33.774,
"step": 700
},
{
"epoch": 1.54,
"eval_accuracy": 0.9216464624874042,
"eval_f1": 0.5420696324951644,
"eval_loss": 0.27768683433532715,
"eval_precision": 0.5559596627541742,
"eval_recall": 0.5288567384808932,
"eval_runtime": 3.6668,
"eval_samples_per_second": 522.526,
"eval_steps_per_second": 32.726,
"step": 800
},
{
"epoch": 1.73,
"eval_accuracy": 0.9239213411096522,
"eval_f1": 0.5558622929522572,
"eval_loss": 0.2659355401992798,
"eval_precision": 0.5746180963572268,
"eval_recall": 0.5382921843057085,
"eval_runtime": 3.5615,
"eval_samples_per_second": 537.969,
"eval_steps_per_second": 33.693,
"step": 900
},
{
"epoch": 1.92,
"learning_rate": 2.2072936660268714e-06,
"loss": 0.1284,
"step": 1000
},
{
"epoch": 1.92,
"eval_accuracy": 0.9300131301719137,
"eval_f1": 0.5886271324126726,
"eval_loss": 0.24747222661972046,
"eval_precision": 0.6088052428163334,
"eval_recall": 0.5697436703884259,
"eval_runtime": 3.5563,
"eval_samples_per_second": 538.768,
"eval_steps_per_second": 33.743,
"step": 1000
},
{
"epoch": 2.0,
"step": 1042,
"total_flos": 2679034988917632.0,
"train_loss": 0.2408974696944634,
"train_runtime": 222.5517,
"train_samples_per_second": 74.805,
"train_steps_per_second": 4.682
}
],
"max_steps": 1042,
"num_train_epochs": 2,
"total_flos": 2679034988917632.0,
"trial_name": null,
"trial_params": null
}