nerugm-base-2 / trainer_state.json
apwic's picture
End of training
fbc67b1 verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 2.7315826416015625,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.3629,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.6941176470588235,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6210526315789474,
"eval_ORGANIZATION_recall": 0.7866666666666666,
"eval_PERSON_f1": 0.8888888888888888,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.5396825396825397,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.425,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.721311475409836,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6285714285714286,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.1598740667104721,
"eval_overall_accuracy": 0.9482111583687766,
"eval_overall_f1": 0.7839999999999999,
"eval_overall_precision": 0.7153284671532847,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.3626,
"eval_samples_per_second": 515.737,
"eval_steps_per_second": 8.274,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.3484944105148315,
"learning_rate": 4.9e-05,
"loss": 0.128,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.7922077922077924,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.782122905027933,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6730769230769231,
"eval_ORGANIZATION_recall": 0.9333333333333333,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8076923076923077,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8076923076923077,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.13682067394256592,
"eval_overall_accuracy": 0.9567175381536153,
"eval_overall_f1": 0.8238482384823848,
"eval_overall_precision": 0.7619047619047619,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3665,
"eval_samples_per_second": 510.258,
"eval_steps_per_second": 8.186,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 2.2102744579315186,
"learning_rate": 4.85e-05,
"loss": 0.0841,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.8028169014084506,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8142857142857143,
"eval_LOCATION_recall": 0.7916666666666666,
"eval_ORGANIZATION_f1": 0.7810650887573964,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7021276595744681,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8918032786885245,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8395061728395061,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8333333333333333,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.9090909090909091,
"eval_TIME_recall": 0.7692307692307693,
"eval_loss": 0.1551402360200882,
"eval_overall_accuracy": 0.9547160370277709,
"eval_overall_f1": 0.8256624825662482,
"eval_overall_precision": 0.783068783068783,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.3569,
"eval_samples_per_second": 523.957,
"eval_steps_per_second": 8.406,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 8.499090194702148,
"learning_rate": 4.8e-05,
"loss": 0.0533,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.8053691275167787,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7719298245614036,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6875,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8778877887788779,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.83125,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5806451612903226,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7540983606557377,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6571428571428571,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.17204634845256805,
"eval_overall_accuracy": 0.9552164123092319,
"eval_overall_f1": 0.8130081300813008,
"eval_overall_precision": 0.7518796992481203,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3715,
"eval_samples_per_second": 503.365,
"eval_steps_per_second": 8.075,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 10.976715087890625,
"learning_rate": 4.75e-05,
"loss": 0.0359,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7784431137724551,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7065217391304348,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9049180327868852,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.6785714285714286,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5757575757575758,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.20843125879764557,
"eval_overall_accuracy": 0.9564673505128847,
"eval_overall_f1": 0.8310626702997276,
"eval_overall_precision": 0.7721518987341772,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3572,
"eval_samples_per_second": 523.556,
"eval_steps_per_second": 8.399,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 0.3230496346950531,
"learning_rate": 4.7e-05,
"loss": 0.0256,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7597765363128492,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6538461538461539,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5588235294117647,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7368421052631579,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6774193548387096,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.2402852177619934,
"eval_overall_accuracy": 0.9539654741055792,
"eval_overall_f1": 0.8194070080862534,
"eval_overall_precision": 0.7543424317617866,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3663,
"eval_samples_per_second": 510.497,
"eval_steps_per_second": 8.19,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.021450912579894066,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.0188,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7624309392265193,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.6509433962264151,
"eval_ORGANIZATION_recall": 0.92,
"eval_PERSON_f1": 0.8926174496644295,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8580645161290322,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7118644067796609,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.6363636363636364,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.22656874358654022,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8162162162162162,
"eval_overall_precision": 0.7531172069825436,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.356,
"eval_samples_per_second": 525.333,
"eval_steps_per_second": 8.428,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.026271946728229523,
"learning_rate": 4.600000000000001e-05,
"loss": 0.0134,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7891156462585034,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7733333333333333,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7530864197530864,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7011494252873564,
"eval_ORGANIZATION_recall": 0.8133333333333334,
"eval_PERSON_f1": 0.9066666666666667,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8662420382165605,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7719298245614036,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7096774193548387,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.24617096781730652,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8178025034770514,
"eval_overall_precision": 0.7736842105263158,
"eval_overall_recall": 0.8672566371681416,
"eval_runtime": 0.3558,
"eval_samples_per_second": 525.577,
"eval_steps_per_second": 8.432,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 0.6316163539886475,
"learning_rate": 4.55e-05,
"loss": 0.0135,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7972027972027971,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8028169014084507,
"eval_LOCATION_recall": 0.7916666666666666,
"eval_ORGANIZATION_f1": 0.8098159509202455,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8829431438127091,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8461538461538461,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.2374754250049591,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.829817158931083,
"eval_overall_precision": 0.793010752688172,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.3585,
"eval_samples_per_second": 521.613,
"eval_steps_per_second": 8.368,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 0.20594312250614166,
"learning_rate": 4.5e-05,
"loss": 0.0082,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7904191616766466,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.717391304347826,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.27111825346946716,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8269230769230769,
"eval_overall_precision": 0.7737789203084833,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3597,
"eval_samples_per_second": 519.941,
"eval_steps_per_second": 8.341,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.010851857252418995,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.0079,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7878787878787877,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7222222222222222,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.27776339650154114,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.825,
"eval_overall_precision": 0.7795275590551181,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3586,
"eval_samples_per_second": 521.408,
"eval_steps_per_second": 8.365,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 4.9953837394714355,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.0105,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7916666666666666,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7916666666666666,
"eval_LOCATION_recall": 0.7916666666666666,
"eval_ORGANIZATION_f1": 0.8101265822784811,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7710843373493976,
"eval_ORGANIZATION_recall": 0.8533333333333334,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.28447094559669495,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8373408769448375,
"eval_overall_precision": 0.8043478260869565,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.3599,
"eval_samples_per_second": 519.532,
"eval_steps_per_second": 8.335,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.2857362926006317,
"learning_rate": 4.35e-05,
"loss": 0.0103,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.7891156462585034,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7733333333333333,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.8170731707317072,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7528089887640449,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8926174496644295,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8580645161290322,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7037037037037037,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6129032258064516,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.9019607843137256,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.92,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.2690028250217438,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8403361344537816,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3608,
"eval_samples_per_second": 518.338,
"eval_steps_per_second": 8.316,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 0.11683321744203568,
"learning_rate": 4.3e-05,
"loss": 0.0045,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7887323943661971,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.7777777777777778,
"eval_ORGANIZATION_f1": 0.809248554913295,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.9333333333333333,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6545454545454547,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5625,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7636363636363636,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7241379310344828,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.304815411567688,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8248275862068966,
"eval_overall_precision": 0.7746113989637305,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3586,
"eval_samples_per_second": 521.439,
"eval_steps_per_second": 8.365,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.15561413764953613,
"learning_rate": 4.25e-05,
"loss": 0.005,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.8000000000000002,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.775,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9054054054054055,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8758169934640523,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.27857497334480286,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8397163120567377,
"eval_overall_precision": 0.8087431693989071,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.3743,
"eval_samples_per_second": 499.656,
"eval_steps_per_second": 8.016,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.24679070711135864,
"learning_rate": 4.2e-05,
"loss": 0.0041,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.8170731707317072,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7528089887640449,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8903654485049833,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8481012658227848,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.30642324686050415,
"eval_overall_accuracy": 0.9572179134350763,
"eval_overall_f1": 0.8349514563106795,
"eval_overall_precision": 0.7879581151832461,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3572,
"eval_samples_per_second": 523.51,
"eval_steps_per_second": 8.399,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.17553383111953735,
"learning_rate": 4.15e-05,
"loss": 0.0061,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7733333333333334,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7701863354037267,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7209302325581395,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.300820916891098,
"eval_overall_accuracy": 0.9574681010758068,
"eval_overall_f1": 0.8205841446453408,
"eval_overall_precision": 0.7763157894736842,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.3595,
"eval_samples_per_second": 520.18,
"eval_steps_per_second": 8.345,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.004105593077838421,
"learning_rate": 4.1e-05,
"loss": 0.0036,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8129032258064516,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7875,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8993288590604027,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.864516129032258,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.29750457406044006,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.8434414668547249,
"eval_overall_precision": 0.8081081081081081,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3588,
"eval_samples_per_second": 521.143,
"eval_steps_per_second": 8.361,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.007032826077193022,
"learning_rate": 4.05e-05,
"loss": 0.0025,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8513513513513513,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.834355828220859,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7727272727272727,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3171651363372803,
"eval_overall_accuracy": 0.9622216662496873,
"eval_overall_f1": 0.8599439775910364,
"eval_overall_precision": 0.8186666666666667,
"eval_overall_recall": 0.9056047197640118,
"eval_runtime": 0.3602,
"eval_samples_per_second": 519.212,
"eval_steps_per_second": 8.33,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 1.055253505706787,
"learning_rate": 4e-05,
"loss": 0.0039,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8098159509202455,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3097495436668396,
"eval_overall_accuracy": 0.9622216662496873,
"eval_overall_f1": 0.8475524475524475,
"eval_overall_precision": 0.8058510638297872,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3569,
"eval_samples_per_second": 524.015,
"eval_steps_per_second": 8.407,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 0.4885401129722595,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0031,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.781456953642384,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.7974683544303797,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7590361445783133,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.32485198974609375,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.83008356545961,
"eval_overall_precision": 0.7862796833773087,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3689,
"eval_samples_per_second": 506.94,
"eval_steps_per_second": 8.133,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.03123115934431553,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0037,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.7972972972972973,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.8263473053892216,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.92,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3308863937854767,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8386206896551724,
"eval_overall_precision": 0.7875647668393783,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3591,
"eval_samples_per_second": 520.739,
"eval_steps_per_second": 8.354,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.8348985314369202,
"learning_rate": 3.85e-05,
"loss": 0.0015,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8176100628930819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7738095238095238,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7692307692307693,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6896551724137931,
"eval_QUANTITY_recall": 0.8695652173913043,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.32765087485313416,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8423988842398884,
"eval_overall_precision": 0.798941798941799,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3569,
"eval_samples_per_second": 523.957,
"eval_steps_per_second": 8.406,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 0.006436940282583237,
"learning_rate": 3.8e-05,
"loss": 0.0027,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.8076923076923077,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7777777777777778,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3232249617576599,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8345120226308345,
"eval_overall_precision": 0.8016304347826086,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.3705,
"eval_samples_per_second": 504.719,
"eval_steps_per_second": 8.097,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.9054812788963318,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0035,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.8227848101265823,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7831325301204819,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8926174496644295,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8580645161290322,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6428571428571429,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5454545454545454,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.35135143995285034,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8337950138504155,
"eval_overall_precision": 0.7859007832898173,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3594,
"eval_samples_per_second": 520.314,
"eval_steps_per_second": 8.347,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.010295592248439789,
"learning_rate": 3.7e-05,
"loss": 0.0028,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7831325301204819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8979591836734694,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8741721854304636,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3200477361679077,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8344923504867873,
"eval_overall_precision": 0.7894736842105263,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3624,
"eval_samples_per_second": 516.068,
"eval_steps_per_second": 8.279,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.0034800188150256872,
"learning_rate": 3.65e-05,
"loss": 0.0023,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7831325301204819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.8837209302325583,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8417721518987342,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6538461538461539,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5862068965517241,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3428550064563751,
"eval_overall_accuracy": 0.9569677257943457,
"eval_overall_f1": 0.8238557558945908,
"eval_overall_precision": 0.7774869109947644,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3592,
"eval_samples_per_second": 520.564,
"eval_steps_per_second": 8.351,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 0.001987306633964181,
"learning_rate": 3.6e-05,
"loss": 0.0031,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7777777777777777,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7241379310344828,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8983606557377047,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.845679012345679,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8070175438596492,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7419354838709677,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3218757212162018,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.828060522696011,
"eval_overall_precision": 0.7757731958762887,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3703,
"eval_samples_per_second": 504.962,
"eval_steps_per_second": 8.101,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.021353095769882202,
"learning_rate": 3.55e-05,
"loss": 0.0028,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8057553956834532,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.835820895522388,
"eval_LOCATION_recall": 0.7777777777777778,
"eval_ORGANIZATION_f1": 0.8076923076923077,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7777777777777778,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8800000000000001,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8407643312101911,
"eval_PERSON_recall": 0.9230769230769231,
"eval_QUANTITY_f1": 0.6415094339622641,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5666666666666667,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.35811248421669006,
"eval_overall_accuracy": 0.9562171628721541,
"eval_overall_f1": 0.8273894436519258,
"eval_overall_precision": 0.8011049723756906,
"eval_overall_recall": 0.855457227138643,
"eval_runtime": 0.3735,
"eval_samples_per_second": 500.719,
"eval_steps_per_second": 8.033,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.0009840091224759817,
"learning_rate": 3.5e-05,
"loss": 0.0031,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.830188679245283,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7857142857142857,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9163879598662208,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3134097754955292,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.8503496503496504,
"eval_overall_precision": 0.8085106382978723,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3742,
"eval_samples_per_second": 499.673,
"eval_steps_per_second": 8.016,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 1.1641939878463745,
"learning_rate": 3.45e-05,
"loss": 0.0035,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.751592356687898,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.6941176470588235,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.8387096774193549,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.8125,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9133333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.31325557827949524,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8372739916550764,
"eval_overall_precision": 0.7921052631578948,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3607,
"eval_samples_per_second": 518.406,
"eval_steps_per_second": 8.317,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.0497661791741848,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0028,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.8214285714285714,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7419354838709677,
"eval_ORGANIZATION_recall": 0.92,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7755102040816326,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7307692307692307,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.32023829221725464,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8491620111731844,
"eval_overall_precision": 0.8063660477453581,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3634,
"eval_samples_per_second": 514.539,
"eval_steps_per_second": 8.255,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.0015366391744464636,
"learning_rate": 3.35e-05,
"loss": 0.0013,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7898089171974522,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7560975609756098,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8926174496644295,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8580645161290322,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3315739035606384,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8368794326241135,
"eval_overall_precision": 0.8060109289617486,
"eval_overall_recall": 0.8702064896755162,
"eval_runtime": 0.3575,
"eval_samples_per_second": 523.126,
"eval_steps_per_second": 8.392,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.05237346515059471,
"learning_rate": 3.3e-05,
"loss": 0.0018,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.8048780487804879,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7415730337078652,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.36692577600479126,
"eval_overall_accuracy": 0.9622216662496873,
"eval_overall_f1": 0.8495821727019498,
"eval_overall_precision": 0.8047493403693932,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3644,
"eval_samples_per_second": 513.118,
"eval_steps_per_second": 8.232,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.002315772697329521,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0022,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.8378378378378377,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8198757763975156,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7674418604651163,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.91156462585034,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8874172185430463,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.9230769230769231,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.3101156949996948,
"eval_overall_accuracy": 0.9649737302977233,
"eval_overall_f1": 0.8628005657708627,
"eval_overall_precision": 0.8288043478260869,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3638,
"eval_samples_per_second": 514.005,
"eval_steps_per_second": 8.246,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.0013785570627078414,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.002,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8198757763975156,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7674418604651163,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8933333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3521296977996826,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.8435754189944135,
"eval_overall_precision": 0.8010610079575596,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3743,
"eval_samples_per_second": 499.566,
"eval_steps_per_second": 8.014,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.002585264155641198,
"learning_rate": 3.15e-05,
"loss": 0.0019,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8148148148148148,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7586206896551724,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8956228956228957,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8636363636363636,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.34240958094596863,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8435754189944135,
"eval_overall_precision": 0.8010610079575596,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3616,
"eval_samples_per_second": 517.085,
"eval_steps_per_second": 8.295,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 4.613161563873291,
"learning_rate": 3.1e-05,
"loss": 0.0012,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.825,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7764705882352941,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8926174496644295,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8580645161290322,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.6923076923076923,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6206896551724138,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3519201874732971,
"eval_overall_accuracy": 0.957968476357268,
"eval_overall_f1": 0.8396094839609484,
"eval_overall_precision": 0.7962962962962963,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3618,
"eval_samples_per_second": 516.793,
"eval_steps_per_second": 8.291,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.0017957445234060287,
"learning_rate": 3.05e-05,
"loss": 0.0012,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.825,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7764705882352941,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8926174496644295,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8580645161290322,
"eval_PERSON_recall": 0.9300699300699301,
"eval_QUANTITY_f1": 0.7169811320754716,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6333333333333333,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.7777777777777779,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.3654736876487732,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8419580419580419,
"eval_overall_precision": 0.800531914893617,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3617,
"eval_samples_per_second": 517.022,
"eval_steps_per_second": 8.294,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.001596860121935606,
"learning_rate": 3e-05,
"loss": 0.001,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7945205479452054,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.7948717948717949,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7654320987654321,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7755102040816326,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7307692307692307,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.34077638387680054,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8457142857142858,
"eval_overall_precision": 0.8199445983379502,
"eval_overall_recall": 0.8731563421828908,
"eval_runtime": 0.3642,
"eval_samples_per_second": 513.453,
"eval_steps_per_second": 8.237,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.0034711004700511694,
"learning_rate": 2.95e-05,
"loss": 0.0025,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8157894736842106,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.7898089171974522,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7560975609756098,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.912751677852349,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8774193548387097,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.340951144695282,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8415147265077138,
"eval_overall_precision": 0.8021390374331551,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.361,
"eval_samples_per_second": 518.055,
"eval_steps_per_second": 8.311,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.02040654979646206,
"learning_rate": 2.9e-05,
"loss": 0.0012,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8025477707006369,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7682926829268293,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.76,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.7037037037037037,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8076923076923077,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8076923076923077,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.3626217842102051,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8486562942008488,
"eval_overall_precision": 0.8152173913043478,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3631,
"eval_samples_per_second": 515.064,
"eval_steps_per_second": 8.263,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.001348801888525486,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.003,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7951807228915663,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7252747252747253,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.3544086813926697,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8391608391608392,
"eval_overall_precision": 0.7978723404255319,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3593,
"eval_samples_per_second": 520.389,
"eval_steps_per_second": 8.348,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 4.9029974937438965,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0027,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7999999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7157894736842105,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.8940397350993377,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8490566037735849,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7307692307692308,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6551724137931034,
"eval_QUANTITY_recall": 0.8260869565217391,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3703295886516571,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8356164383561644,
"eval_overall_precision": 0.7800511508951407,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3623,
"eval_samples_per_second": 516.147,
"eval_steps_per_second": 8.28,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 0.2568044662475586,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0015,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.8354430379746836,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7951807228915663,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8076923076923077,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8076923076923077,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.34526732563972473,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8438818565400844,
"eval_overall_precision": 0.8064516129032258,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3579,
"eval_samples_per_second": 522.551,
"eval_steps_per_second": 8.383,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.0012396867386996746,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0018,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.8170731707317072,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7528089887640449,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.693877551020408,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6538461538461539,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8235294117647058,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.84,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.3448871970176697,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.846262341325811,
"eval_overall_precision": 0.8108108108108109,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3635,
"eval_samples_per_second": 514.485,
"eval_steps_per_second": 8.254,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 1.6906110048294067,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0028,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8137931034482759,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8082191780821918,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.8148148148148148,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7586206896551724,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.37111541628837585,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8474576271186441,
"eval_overall_precision": 0.8130081300813008,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3591,
"eval_samples_per_second": 520.775,
"eval_steps_per_second": 8.355,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.029315035790205002,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0014,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8251748251748252,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8309859154929577,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.8198757763975156,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7674418604651163,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3521229922771454,
"eval_overall_accuracy": 0.9632224168126094,
"eval_overall_f1": 0.8522727272727273,
"eval_overall_precision": 0.821917808219178,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3694,
"eval_samples_per_second": 506.192,
"eval_steps_per_second": 8.121,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.02477916330099106,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0023,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8129032258064516,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7875,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.8874172185430464,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8427672955974843,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.36508724093437195,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.8394366197183099,
"eval_overall_precision": 0.8032345013477089,
"eval_overall_recall": 0.8790560471976401,
"eval_runtime": 0.3605,
"eval_samples_per_second": 518.761,
"eval_steps_per_second": 8.322,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.017422163859009743,
"learning_rate": 2.5e-05,
"loss": 0.0027,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9096989966555185,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.9230769230769231,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.3326910436153412,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8607594936708861,
"eval_overall_precision": 0.8225806451612904,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.3722,
"eval_samples_per_second": 502.368,
"eval_steps_per_second": 8.059,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.00688315462321043,
"learning_rate": 2.45e-05,
"loss": 0.0009,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8137931034482759,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8082191780821918,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.8387096774193549,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.8125,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.912751677852349,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8774193548387097,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7083333333333334,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.68,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.9230769230769231,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.9230769230769231,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.33154383301734924,
"eval_overall_accuracy": 0.9659744808606455,
"eval_overall_f1": 0.8624641833810888,
"eval_overall_precision": 0.8384401114206128,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.358,
"eval_samples_per_second": 522.281,
"eval_steps_per_second": 8.379,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.0005034964415244758,
"learning_rate": 2.4e-05,
"loss": 0.001,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.7945205479452055,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7837837837837838,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.912751677852349,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8774193548387097,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.9056603773584906,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8888888888888888,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.3466086983680725,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8531073446327683,
"eval_overall_precision": 0.8184281842818428,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3715,
"eval_samples_per_second": 503.309,
"eval_steps_per_second": 8.074,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.021436743438243866,
"learning_rate": 2.35e-05,
"loss": 0.0014,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.8271604938271604,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7701149425287356,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9133333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.32782742381095886,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8515406162464986,
"eval_overall_precision": 0.8106666666666666,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3599,
"eval_samples_per_second": 519.612,
"eval_steps_per_second": 8.336,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.0009922637837007642,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0007,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.7976190476190477,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7204301075268817,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8910891089108911,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.84375,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.36466336250305176,
"eval_overall_accuracy": 0.9589692269201902,
"eval_overall_f1": 0.8406593406593406,
"eval_overall_precision": 0.7866323907455013,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.36,
"eval_samples_per_second": 519.408,
"eval_steps_per_second": 8.333,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.003993849270045757,
"learning_rate": 2.25e-05,
"loss": 0.0017,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.7947019867549668,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.7948717948717949,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7654320987654321,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.9072847682119206,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8616352201257862,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6274509803921569,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5714285714285714,
"eval_QUANTITY_recall": 0.6956521739130435,
"eval_TIME_f1": 0.7857142857142856,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7333333333333333,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3635990619659424,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8296089385474861,
"eval_overall_precision": 0.7877984084880637,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3593,
"eval_samples_per_second": 520.494,
"eval_steps_per_second": 8.35,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.0005980022251605988,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0004,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.778523489932886,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.8516129032258064,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.825,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9042904290429041,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6792452830188679,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8235294117647058,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.84,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.3733396530151367,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8438818565400844,
"eval_overall_precision": 0.8064516129032258,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.3652,
"eval_samples_per_second": 512.007,
"eval_steps_per_second": 8.214,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.0007011191919445992,
"learning_rate": 2.15e-05,
"loss": 0.0009,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.858974358974359,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.8271604938271605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3640208840370178,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.849929873772791,
"eval_overall_precision": 0.8101604278074866,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3606,
"eval_samples_per_second": 518.592,
"eval_steps_per_second": 8.32,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.0015956854913383722,
"learning_rate": 2.1e-05,
"loss": 0.0003,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8220858895705522,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7613636363636364,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9023569023569024,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8701298701298701,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3814009130001068,
"eval_overall_accuracy": 0.9582186639979985,
"eval_overall_f1": 0.8440111420612812,
"eval_overall_precision": 0.7994722955145118,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3599,
"eval_samples_per_second": 519.642,
"eval_steps_per_second": 8.337,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.0003817932156380266,
"learning_rate": 2.05e-05,
"loss": 0.0005,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.8194444444444444,
"eval_ORGANIZATION_f1": 0.8441558441558442,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.8227848101265823,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9096989966555185,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.888888888888889,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.9230769230769231,
"eval_loss": 0.3739457130432129,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.8567375886524823,
"eval_overall_precision": 0.825136612021858,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3596,
"eval_samples_per_second": 520.068,
"eval_steps_per_second": 8.343,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.00037515757139772177,
"learning_rate": 2e-05,
"loss": 0.0005,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8219178082191781,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.8354430379746836,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7951807228915663,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3766981363296509,
"eval_overall_accuracy": 0.9604703527645734,
"eval_overall_f1": 0.8547249647390691,
"eval_overall_precision": 0.8189189189189189,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3687,
"eval_samples_per_second": 507.159,
"eval_steps_per_second": 8.136,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.00191974185872823,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0008,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.8333333333333334,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.8024691358024691,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.903654485049834,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8607594936708861,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.36986875534057617,
"eval_overall_accuracy": 0.9622216662496873,
"eval_overall_f1": 0.849507735583685,
"eval_overall_precision": 0.8118279569892473,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3616,
"eval_samples_per_second": 517.178,
"eval_steps_per_second": 8.297,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 1.7503353357315063,
"learning_rate": 1.9e-05,
"loss": 0.0016,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.825,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7764705882352941,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8838709677419354,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8203592814371258,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.34973686933517456,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8437067773167358,
"eval_overall_precision": 0.7942708333333334,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.364,
"eval_samples_per_second": 513.749,
"eval_steps_per_second": 8.242,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.0005617731949314475,
"learning_rate": 1.85e-05,
"loss": 0.0004,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8299319727891157,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.834355828220859,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7727272727272727,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.9210526315789473,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9790209790209791,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.7796610169491526,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.696969696969697,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3623858094215393,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.856353591160221,
"eval_overall_precision": 0.8051948051948052,
"eval_overall_recall": 0.9144542772861357,
"eval_runtime": 0.3601,
"eval_samples_per_second": 519.319,
"eval_steps_per_second": 8.331,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.04498714208602905,
"learning_rate": 1.8e-05,
"loss": 0.0009,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8435374149659863,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8266666666666667,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8374999999999999,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.788235294117647,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.37043052911758423,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8583450210378682,
"eval_overall_precision": 0.8181818181818182,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.36,
"eval_samples_per_second": 519.423,
"eval_steps_per_second": 8.333,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.0003102279151789844,
"learning_rate": 1.75e-05,
"loss": 0.001,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8220858895705522,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7613636363636364,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9144736842105262,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.972027972027972,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3582930862903595,
"eval_overall_accuracy": 0.96347260445334,
"eval_overall_f1": 0.8583333333333333,
"eval_overall_precision": 0.8110236220472441,
"eval_overall_recall": 0.911504424778761,
"eval_runtime": 0.3574,
"eval_samples_per_second": 523.156,
"eval_steps_per_second": 8.393,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.023364154621958733,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0001,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.8387096774193549,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.8125,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9139072847682119,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8679245283018868,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.35251596570014954,
"eval_overall_accuracy": 0.9627220415311484,
"eval_overall_f1": 0.8523206751054851,
"eval_overall_precision": 0.8145161290322581,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3673,
"eval_samples_per_second": 509.16,
"eval_steps_per_second": 8.168,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.0011218636063858867,
"learning_rate": 1.65e-05,
"loss": 0.0015,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.8121212121212122,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7444444444444445,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9078947368421052,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.965034965034965,
"eval_QUANTITY_f1": 0.72,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.8679245283018868,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8518518518518519,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.37641996145248413,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8524137931034482,
"eval_overall_precision": 0.8005181347150259,
"eval_overall_recall": 0.911504424778761,
"eval_runtime": 0.3613,
"eval_samples_per_second": 517.565,
"eval_steps_per_second": 8.303,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.0007424333016388118,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0006,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8356164383561645,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.7878787878787877,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7222222222222222,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9133333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.782608695652174,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3496319651603699,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8475524475524475,
"eval_overall_precision": 0.8058510638297872,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3711,
"eval_samples_per_second": 503.904,
"eval_steps_per_second": 8.084,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.008528614416718483,
"learning_rate": 1.55e-05,
"loss": 0.0008,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8000000000000002,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.775,
"eval_ORGANIZATION_recall": 0.8266666666666667,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.693877551020408,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6538461538461539,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.34753233194351196,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8401697312588402,
"eval_overall_precision": 0.8070652173913043,
"eval_overall_recall": 0.8761061946902655,
"eval_runtime": 0.3588,
"eval_samples_per_second": 521.137,
"eval_steps_per_second": 8.36,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.014132479205727577,
"learning_rate": 1.5e-05,
"loss": 0.0,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8356164383561645,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8121212121212122,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7444444444444445,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.8844884488448846,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8375,
"eval_PERSON_recall": 0.9370629370629371,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3662912845611572,
"eval_overall_accuracy": 0.9592194145609206,
"eval_overall_f1": 0.8388888888888889,
"eval_overall_precision": 0.7926509186351706,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.4097,
"eval_samples_per_second": 456.444,
"eval_steps_per_second": 7.323,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.0005066086887381971,
"learning_rate": 1.45e-05,
"loss": 0.0002,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8055555555555556,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8055555555555556,
"eval_LOCATION_recall": 0.8055555555555556,
"eval_ORGANIZATION_f1": 0.8170731707317072,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7528089887640449,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9194630872483223,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8838709677419355,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3715399205684662,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.849507735583685,
"eval_overall_precision": 0.8118279569892473,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3561,
"eval_samples_per_second": 525.071,
"eval_steps_per_second": 8.424,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.00028915383154526353,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0001,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.8435374149659863,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8266666666666667,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8072289156626506,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7362637362637363,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9163879598662208,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8214285714285715,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3853207230567932,
"eval_overall_accuracy": 0.9587190392794596,
"eval_overall_f1": 0.8523676880222841,
"eval_overall_precision": 0.8073878627968337,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.362,
"eval_samples_per_second": 516.586,
"eval_steps_per_second": 8.287,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.0008943734574131668,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0007,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.821917808219178,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.8198757763975156,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7674418604651163,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9060402684563759,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8709677419354839,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.35061854124069214,
"eval_overall_accuracy": 0.9599699774831123,
"eval_overall_f1": 0.8498583569405098,
"eval_overall_precision": 0.8174386920980926,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.357,
"eval_samples_per_second": 523.747,
"eval_steps_per_second": 8.402,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.0004187956510577351,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0002,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8095238095238095,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7311827956989247,
"eval_ORGANIZATION_recall": 0.9066666666666666,
"eval_PERSON_f1": 0.9163879598662208,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8782051282051282,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6538461538461539,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5862068965517241,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8148148148148148,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7857142857142857,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.4027647078037262,
"eval_overall_accuracy": 0.9584688516387291,
"eval_overall_f1": 0.847645429362881,
"eval_overall_precision": 0.7989556135770235,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.3573,
"eval_samples_per_second": 523.424,
"eval_steps_per_second": 8.397,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.0005983862793073058,
"learning_rate": 1.25e-05,
"loss": 0.0,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.816326530612245,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8333333333333334,
"eval_ORGANIZATION_f1": 0.825,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7764705882352941,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9096989966555185,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3929165005683899,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8478873239436621,
"eval_overall_precision": 0.8113207547169812,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3576,
"eval_samples_per_second": 522.919,
"eval_steps_per_second": 8.389,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.00021465642203111202,
"learning_rate": 1.2e-05,
"loss": 0.0002,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8181818181818181,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.8271604938271604,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7701149425287356,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9194630872483223,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8838709677419355,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.4091399908065796,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8527777777777777,
"eval_overall_precision": 0.8057742782152231,
"eval_overall_recall": 0.9056047197640118,
"eval_runtime": 0.3609,
"eval_samples_per_second": 518.107,
"eval_steps_per_second": 8.312,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.00041957717621698976,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.8271604938271604,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7701149425287356,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3996489346027374,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8491620111731844,
"eval_overall_precision": 0.8063660477453581,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3555,
"eval_samples_per_second": 526.025,
"eval_steps_per_second": 8.439,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.0018605925142765045,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8198757763975156,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7674418604651163,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3973155617713928,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8447552447552448,
"eval_overall_precision": 0.8031914893617021,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3588,
"eval_samples_per_second": 521.17,
"eval_steps_per_second": 8.361,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.0009037918644025922,
"learning_rate": 1.05e-05,
"loss": 0.0,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.825,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7764705882352941,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3981226086616516,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.84593837535014,
"eval_overall_precision": 0.8053333333333333,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3579,
"eval_samples_per_second": 522.564,
"eval_steps_per_second": 8.383,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.0010246345773339272,
"learning_rate": 1e-05,
"loss": 0.0,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.875,
"eval_ORGANIZATION_f1": 0.8198757763975156,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7674418604651163,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.4011876583099365,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8475524475524475,
"eval_overall_precision": 0.8058510638297872,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.061,
"eval_steps_per_second": 7.894,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.00019219562818761915,
"learning_rate": 9.5e-06,
"loss": 0.0006,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8271604938271604,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7701149425287356,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6538461538461539,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.5862068965517241,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.4144229590892792,
"eval_overall_accuracy": 0.9597197898423818,
"eval_overall_f1": 0.8467966573816156,
"eval_overall_precision": 0.8021108179419525,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3556,
"eval_samples_per_second": 525.889,
"eval_steps_per_second": 8.437,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.000247513729846105,
"learning_rate": 9e-06,
"loss": 0.0,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8227848101265823,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7831325301204819,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8598726114649682,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.40510478615760803,
"eval_overall_accuracy": 0.9594696022016512,
"eval_overall_f1": 0.8455056179775281,
"eval_overall_precision": 0.806970509383378,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3705,
"eval_samples_per_second": 504.754,
"eval_steps_per_second": 8.098,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.0001593719352968037,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0006,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8048780487804879,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7415730337078652,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.8970099667774087,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8544303797468354,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8518518518518519,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8214285714285714,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.4076941907405853,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8381742738589212,
"eval_overall_precision": 0.7890625,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3564,
"eval_samples_per_second": 524.736,
"eval_steps_per_second": 8.418,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.0038378555327653885,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0004,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8280254777070064,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7926829268292683,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.903010033444816,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8653846153846154,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.39616209268569946,
"eval_overall_accuracy": 0.960720540405304,
"eval_overall_f1": 0.8474576271186441,
"eval_overall_precision": 0.8130081300813008,
"eval_overall_recall": 0.8849557522123894,
"eval_runtime": 0.359,
"eval_samples_per_second": 520.922,
"eval_steps_per_second": 8.357,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.0006832346552982926,
"learning_rate": 7.5e-06,
"loss": 0.0005,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8235294117647058,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.8076923076923077,
"eval_ORGANIZATION_recall": 0.84,
"eval_PERSON_f1": 0.9158249158249158,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8831168831168831,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8461538461538461,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.38612908124923706,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8542857142857142,
"eval_overall_precision": 0.8282548476454293,
"eval_overall_recall": 0.8820058997050148,
"eval_runtime": 0.3569,
"eval_samples_per_second": 523.906,
"eval_steps_per_second": 8.405,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.0012918419670313597,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8187919463087249,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8176100628930819,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7738095238095238,
"eval_ORGANIZATION_recall": 0.8666666666666667,
"eval_PERSON_f1": 0.9096989966555185,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8717948717948718,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.693877551020408,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6538461538461539,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.39533165097236633,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.8490832157968972,
"eval_overall_precision": 0.8135135135135135,
"eval_overall_recall": 0.887905604719764,
"eval_runtime": 0.3669,
"eval_samples_per_second": 509.639,
"eval_steps_per_second": 8.176,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.00013653105997946113,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0003,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8220858895705522,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7613636363636364,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9042904290429041,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.85625,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.41302046179771423,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8432732316227461,
"eval_overall_precision": 0.7958115183246073,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3613,
"eval_samples_per_second": 517.561,
"eval_steps_per_second": 8.303,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.0001936595799634233,
"learning_rate": 6e-06,
"loss": 0.0004,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8220858895705522,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7613636363636364,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.41551852226257324,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8416666666666667,
"eval_overall_precision": 0.7952755905511811,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3626,
"eval_samples_per_second": 515.716,
"eval_steps_per_second": 8.274,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.000983737176284194,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8220858895705522,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7613636363636364,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9006622516556291,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8553459119496856,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.7924528301886792,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.8076923076923077,
"eval_loss": 0.4156357944011688,
"eval_overall_accuracy": 0.9602201651238429,
"eval_overall_f1": 0.8416666666666667,
"eval_overall_precision": 0.7952755905511811,
"eval_overall_recall": 0.8938053097345132,
"eval_runtime": 0.3581,
"eval_samples_per_second": 522.251,
"eval_steps_per_second": 8.378,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.001763033214956522,
"learning_rate": 5e-06,
"loss": 0.0002,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8198757763975156,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7674418604651163,
"eval_ORGANIZATION_recall": 0.88,
"eval_PERSON_f1": 0.9090909090909092,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8766233766233766,
"eval_PERSON_recall": 0.9440559440559441,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.404066801071167,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.849507735583685,
"eval_overall_precision": 0.8118279569892473,
"eval_overall_recall": 0.8908554572271387,
"eval_runtime": 0.3736,
"eval_samples_per_second": 500.522,
"eval_steps_per_second": 8.03,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.0002766927646007389,
"learning_rate": 4.5e-06,
"loss": 0.0002,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9158249158249158,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8831168831168831,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3980797231197357,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8551336146272857,
"eval_overall_precision": 0.8172043010752689,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3573,
"eval_samples_per_second": 523.342,
"eval_steps_per_second": 8.396,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.0008579469285905361,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9158249158249158,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8831168831168831,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.693877551020408,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6538461538461539,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.830188679245283,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.8148148148148148,
"eval_TIME_recall": 0.8461538461538461,
"eval_loss": 0.3970873951911926,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8575458392101551,
"eval_overall_precision": 0.8216216216216217,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3615,
"eval_samples_per_second": 517.255,
"eval_steps_per_second": 8.298,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.00014306257071439177,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8266666666666667,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9194630872483223,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8838709677419355,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.4024323523044586,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8559440559440559,
"eval_overall_precision": 0.8138297872340425,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.3607,
"eval_samples_per_second": 518.421,
"eval_steps_per_second": 8.317,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.00042846077121794224,
"learning_rate": 3e-06,
"loss": 0.0,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9194630872483223,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8838709677419355,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.3985014855861664,
"eval_overall_accuracy": 0.9619714786089567,
"eval_overall_f1": 0.8583450210378682,
"eval_overall_precision": 0.8181818181818182,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.3651,
"eval_samples_per_second": 512.194,
"eval_steps_per_second": 8.217,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.000827198673505336,
"learning_rate": 2.5e-06,
"loss": 0.0,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8322147651006712,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8611111111111112,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9194630872483223,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8838709677419355,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6071428571428571,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.39939987659454346,
"eval_overall_accuracy": 0.9617212909682261,
"eval_overall_f1": 0.8571428571428571,
"eval_overall_precision": 0.816,
"eval_overall_recall": 0.9026548672566371,
"eval_runtime": 0.358,
"eval_samples_per_second": 522.401,
"eval_steps_per_second": 8.381,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.0002911574556492269,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0003,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.912751677852349,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8774193548387097,
"eval_PERSON_recall": 0.951048951048951,
"eval_QUANTITY_f1": 0.693877551020408,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6538461538461539,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.39506107568740845,
"eval_overall_accuracy": 0.961220915686765,
"eval_overall_f1": 0.8551336146272857,
"eval_overall_precision": 0.8172043010752689,
"eval_overall_recall": 0.8967551622418879,
"eval_runtime": 0.3613,
"eval_samples_per_second": 517.554,
"eval_steps_per_second": 8.303,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.0003046900383196771,
"learning_rate": 1.5e-06,
"loss": 0.0005,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9133333333333333,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8726114649681529,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.4083447754383087,
"eval_overall_accuracy": 0.9609707280460346,
"eval_overall_f1": 0.854341736694678,
"eval_overall_precision": 0.8133333333333334,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3599,
"eval_samples_per_second": 519.582,
"eval_steps_per_second": 8.336,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.00015339584206230938,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9194630872483223,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8838709677419355,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.407378226518631,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8567415730337079,
"eval_overall_precision": 0.8176943699731903,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3669,
"eval_samples_per_second": 509.703,
"eval_steps_per_second": 8.177,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.0002479134127497673,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9194630872483223,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8838709677419355,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.4076772630214691,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8567415730337079,
"eval_overall_precision": 0.8176943699731903,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3589,
"eval_samples_per_second": 521.056,
"eval_steps_per_second": 8.359,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.00025577095220796764,
"learning_rate": 0.0,
"loss": 0.0001,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8243243243243243,
"eval_LOCATION_number": 72,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8472222222222222,
"eval_ORGANIZATION_f1": 0.8322981366459627,
"eval_ORGANIZATION_number": 75,
"eval_ORGANIZATION_precision": 0.7790697674418605,
"eval_ORGANIZATION_recall": 0.8933333333333333,
"eval_PERSON_f1": 0.9194630872483223,
"eval_PERSON_number": 143,
"eval_PERSON_precision": 0.8838709677419355,
"eval_PERSON_recall": 0.958041958041958,
"eval_QUANTITY_f1": 0.68,
"eval_QUANTITY_number": 23,
"eval_QUANTITY_precision": 0.6296296296296297,
"eval_QUANTITY_recall": 0.7391304347826086,
"eval_TIME_f1": 0.8363636363636363,
"eval_TIME_number": 26,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8846153846153846,
"eval_loss": 0.40795865654945374,
"eval_overall_accuracy": 0.9614711033274956,
"eval_overall_f1": 0.8567415730337079,
"eval_overall_precision": 0.8176943699731903,
"eval_overall_recall": 0.8997050147492626,
"eval_runtime": 0.3623,
"eval_samples_per_second": 516.187,
"eval_steps_per_second": 8.281,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4502314993613766.0,
"train_loss": 0.008934246277599155,
"train_runtime": 970.249,
"train_samples_per_second": 173.873,
"train_steps_per_second": 10.925
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4502314993613766.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}