nerugm-base-1 / trainer_state.json
apwic's picture
End of training
b36a17e verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 3.2015111446380615,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.3254,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.5901639344262295,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5901639344262295,
"eval_ORGANIZATION_recall": 0.5901639344262295,
"eval_PERSON_f1": 0.89937106918239,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8666666666666667,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.12376317381858826,
"eval_overall_accuracy": 0.9581372306167947,
"eval_overall_f1": 0.8072122052704577,
"eval_overall_precision": 0.776,
"eval_overall_recall": 0.8410404624277457,
"eval_runtime": 0.3597,
"eval_samples_per_second": 519.816,
"eval_steps_per_second": 8.339,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 3.5055294036865234,
"learning_rate": 4.9e-05,
"loss": 0.1103,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.8028169014084506,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7808219178082192,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.6918238993710693,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5612244897959183,
"eval_ORGANIZATION_recall": 0.9016393442622951,
"eval_PERSON_f1": 0.89375,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8562874251497006,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7647058823529411,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7027027027027027,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14232417941093445,
"eval_overall_accuracy": 0.9556601436710429,
"eval_overall_f1": 0.8089591567852438,
"eval_overall_precision": 0.7433414043583535,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3736,
"eval_samples_per_second": 500.519,
"eval_steps_per_second": 8.03,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 3.338141918182373,
"learning_rate": 4.85e-05,
"loss": 0.0719,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.7945205479452054,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6749999999999999,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5454545454545454,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.909657320872274,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8690476190476191,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14947976171970367,
"eval_overall_accuracy": 0.9593757740896706,
"eval_overall_f1": 0.8194993412384717,
"eval_overall_precision": 0.7530266343825666,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3603,
"eval_samples_per_second": 519.072,
"eval_steps_per_second": 8.327,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.6828668117523193,
"learning_rate": 4.8e-05,
"loss": 0.0492,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7552447552447552,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.9130434782608696,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8698224852071006,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7605633802816901,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.675,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1601407825946808,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8351063829787234,
"eval_overall_precision": 0.7733990147783252,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3697,
"eval_samples_per_second": 505.814,
"eval_steps_per_second": 8.115,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.3032749891281128,
"learning_rate": 4.75e-05,
"loss": 0.0315,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.7619047619047619,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.717948717948718,
"eval_LOCATION_recall": 0.8115942028985508,
"eval_ORGANIZATION_f1": 0.6423357664233578,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5789473684210527,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9216300940438872,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8855421686746988,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7575757575757576,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8064516129032258,
"eval_loss": 0.1780991554260254,
"eval_overall_accuracy": 0.9583849393113698,
"eval_overall_f1": 0.8086838534599727,
"eval_overall_precision": 0.7621483375959079,
"eval_overall_recall": 0.861271676300578,
"eval_runtime": 0.3628,
"eval_samples_per_second": 515.381,
"eval_steps_per_second": 8.268,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.877514362335205,
"learning_rate": 4.7e-05,
"loss": 0.0217,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7724137931034482,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7368421052631579,
"eval_LOCATION_recall": 0.8115942028985508,
"eval_ORGANIZATION_f1": 0.7397260273972602,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6352941176470588,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.9245283018867925,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8909090909090909,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7941176470588235,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7297297297297297,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.17554225027561188,
"eval_overall_accuracy": 0.9606143175625464,
"eval_overall_f1": 0.8277703604806409,
"eval_overall_precision": 0.7692307692307693,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3662,
"eval_samples_per_second": 510.654,
"eval_steps_per_second": 8.192,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.2853144705295563,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.0168,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.7777777777777779,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7466666666666667,
"eval_LOCATION_recall": 0.8115942028985508,
"eval_ORGANIZATION_f1": 0.6901408450704226,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6049382716049383,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.915360501567398,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8795180722891566,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8253968253968254,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.19883674383163452,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.8244897959183674,
"eval_overall_precision": 0.7789203084832905,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3599,
"eval_samples_per_second": 519.614,
"eval_steps_per_second": 8.336,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.052625108510255814,
"learning_rate": 4.600000000000001e-05,
"loss": 0.0134,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6857142857142857,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6075949367088608,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9216300940438872,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8855421686746988,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7575757575757576,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.8115942028985507,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7368421052631579,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.19897328317165375,
"eval_overall_accuracy": 0.9601189001733961,
"eval_overall_f1": 0.8297297297297296,
"eval_overall_precision": 0.7791878172588832,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3619,
"eval_samples_per_second": 516.738,
"eval_steps_per_second": 8.29,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 0.2537504732608795,
"learning_rate": 4.55e-05,
"loss": 0.0101,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.8211920529801324,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6929133858267716,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9311475409836065,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9342105263157895,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.20098058879375458,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8400556328233658,
"eval_overall_precision": 0.8096514745308311,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.3599,
"eval_samples_per_second": 519.595,
"eval_steps_per_second": 8.336,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 0.2351408451795578,
"learning_rate": 4.5e-05,
"loss": 0.0101,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.8513513513513514,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6710526315789473,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9148264984227129,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8841463414634146,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2193160206079483,
"eval_overall_accuracy": 0.9638345305920237,
"eval_overall_f1": 0.8509485094850948,
"eval_overall_precision": 0.8010204081632653,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3607,
"eval_samples_per_second": 518.462,
"eval_steps_per_second": 8.318,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.03327617421746254,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.0063,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.8226950354609929,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8055555555555556,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7205882352941175,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6533333333333333,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9303797468354431,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.901840490797546,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.782608695652174,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7105263157894737,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22587580978870392,
"eval_overall_accuracy": 0.9628436958137231,
"eval_overall_f1": 0.8426812585499317,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3625,
"eval_samples_per_second": 515.878,
"eval_steps_per_second": 8.276,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 5.140894412994385,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.0059,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7517730496453902,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7361111111111112,
"eval_LOCATION_recall": 0.7681159420289855,
"eval_ORGANIZATION_f1": 0.6714285714285714,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5949367088607594,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9235668789808917,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9006211180124224,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.84375,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.84375,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.23827865719795227,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8271092669432919,
"eval_overall_precision": 0.7931034482758621,
"eval_overall_recall": 0.8641618497109826,
"eval_runtime": 0.3692,
"eval_samples_per_second": 506.502,
"eval_steps_per_second": 8.126,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 3.8915011882781982,
"learning_rate": 4.35e-05,
"loss": 0.007,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.7894736842105263,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6329113924050633,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9303797468354431,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.901840490797546,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6585365853658537,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2511149048805237,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.8304405874499332,
"eval_overall_precision": 0.771712158808933,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3685,
"eval_samples_per_second": 507.422,
"eval_steps_per_second": 8.14,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 0.0344400629401207,
"learning_rate": 4.3e-05,
"loss": 0.0058,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7763157894736842,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7352941176470588,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9396825396825397,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9135802469135802,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.24048586189746857,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8451086956521738,
"eval_overall_precision": 0.7974358974358975,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3742,
"eval_samples_per_second": 499.756,
"eval_steps_per_second": 8.017,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.006385091692209244,
"learning_rate": 4.25e-05,
"loss": 0.0053,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7972972972972974,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7407407407407408,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6756756756756757,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.93125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8922155688622755,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.823529411764706,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7777777777777778,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.7714285714285716,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6923076923076923,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.25498369336128235,
"eval_overall_accuracy": 0.9623482784245727,
"eval_overall_f1": 0.844804318488529,
"eval_overall_precision": 0.7924050632911392,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.367,
"eval_samples_per_second": 509.472,
"eval_steps_per_second": 8.173,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.007103159092366695,
"learning_rate": 4.2e-05,
"loss": 0.0045,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.71875,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6865671641791045,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9367088607594937,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9079754601226994,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8615384615384615,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8484848484848485,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2411327213048935,
"eval_overall_accuracy": 0.9663116175377756,
"eval_overall_f1": 0.8559556786703602,
"eval_overall_precision": 0.8218085106382979,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.367,
"eval_samples_per_second": 509.544,
"eval_steps_per_second": 8.175,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.005618996452540159,
"learning_rate": 4.15e-05,
"loss": 0.0044,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7218045112781954,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8615384615384615,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8484848484848485,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.23781569302082062,
"eval_overall_accuracy": 0.9663116175377756,
"eval_overall_f1": 0.8496551724137931,
"eval_overall_precision": 0.8126649076517151,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3633,
"eval_samples_per_second": 514.728,
"eval_steps_per_second": 8.258,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.00691909808665514,
"learning_rate": 4.1e-05,
"loss": 0.004,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.7891156462585034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7205882352941175,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6533333333333333,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9211356466876972,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8902439024390244,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8115942028985507,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7368421052631579,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.28217267990112305,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.8346883468834689,
"eval_overall_precision": 0.7857142857142857,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3659,
"eval_samples_per_second": 511.052,
"eval_steps_per_second": 8.199,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.018693506717681885,
"learning_rate": 4.05e-05,
"loss": 0.0043,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7058823529411764,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9426751592356687,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9192546583850931,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.823529411764706,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7777777777777778,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.23565581440925598,
"eval_overall_accuracy": 0.9658162001486252,
"eval_overall_f1": 0.8547945205479451,
"eval_overall_precision": 0.8125,
"eval_overall_recall": 0.9017341040462428,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.787,
"eval_steps_per_second": 8.05,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.0034094720613211393,
"learning_rate": 4e-05,
"loss": 0.0032,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.7702702702702703,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7215189873417721,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.7301587301587301,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7076923076923077,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9201277955271565,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8615384615384616,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8235294117647058,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.24556776881217957,
"eval_overall_accuracy": 0.9635868218974486,
"eval_overall_f1": 0.8388888888888889,
"eval_overall_precision": 0.8074866310160428,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.3742,
"eval_samples_per_second": 499.754,
"eval_steps_per_second": 8.017,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 0.006027919240295887,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0036,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6986301369863014,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9126213592233009,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9038461538461539,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8253968253968254,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.27808642387390137,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.828804347826087,
"eval_overall_precision": 0.782051282051282,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3671,
"eval_samples_per_second": 509.462,
"eval_steps_per_second": 8.173,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.08943280577659607,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0029,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7464788732394366,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.930817610062893,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.896969696969697,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.782608695652174,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7105263157894737,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.3044780194759369,
"eval_overall_accuracy": 0.9635868218974486,
"eval_overall_f1": 0.8506056527590848,
"eval_overall_precision": 0.7959697732997482,
"eval_overall_recall": 0.9132947976878613,
"eval_runtime": 0.3751,
"eval_samples_per_second": 498.515,
"eval_steps_per_second": 7.998,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.008143425919115543,
"learning_rate": 3.85e-05,
"loss": 0.0023,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8551724137931034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6911764705882353,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6266666666666667,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9367088607594937,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9079754601226994,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2635738253593445,
"eval_overall_accuracy": 0.9663116175377756,
"eval_overall_f1": 0.8520547945205479,
"eval_overall_precision": 0.8098958333333334,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3625,
"eval_samples_per_second": 515.906,
"eval_steps_per_second": 8.277,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 14.303221702575684,
"learning_rate": 3.8e-05,
"loss": 0.0059,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.786206896551724,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.7,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.620253164556962,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9426751592356687,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9192546583850931,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.272360235452652,
"eval_overall_accuracy": 0.9633391132028735,
"eval_overall_f1": 0.8392370572207084,
"eval_overall_precision": 0.7938144329896907,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3692,
"eval_samples_per_second": 506.476,
"eval_steps_per_second": 8.125,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.13158877193927765,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.002,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8137931034482757,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5875,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9389067524115756,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9240506329113924,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8615384615384616,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8235294117647058,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.25297293066978455,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8372093023255814,
"eval_overall_precision": 0.7948051948051948,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3604,
"eval_samples_per_second": 518.829,
"eval_steps_per_second": 8.323,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 1.7319470643997192,
"learning_rate": 3.7e-05,
"loss": 0.0037,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.7517730496453902,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7361111111111112,
"eval_LOCATION_recall": 0.7681159420289855,
"eval_ORGANIZATION_f1": 0.7007299270072993,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.631578947368421,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9299363057324841,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.906832298136646,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7887323943661971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8115942028985507,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7368421052631579,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2652280628681183,
"eval_overall_accuracy": 0.9601189001733961,
"eval_overall_f1": 0.8278688524590163,
"eval_overall_precision": 0.7849740932642487,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3664,
"eval_samples_per_second": 510.378,
"eval_steps_per_second": 8.188,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.21630139648914337,
"learning_rate": 3.65e-05,
"loss": 0.0052,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8026315789473685,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6993006993006993,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6097560975609756,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9396825396825397,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9135802469135802,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8615384615384615,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8484848484848485,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.25186625123023987,
"eval_overall_accuracy": 0.9663116175377756,
"eval_overall_f1": 0.8463611859838275,
"eval_overall_precision": 0.7929292929292929,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3644,
"eval_samples_per_second": 513.133,
"eval_steps_per_second": 8.232,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 0.007407509256154299,
"learning_rate": 3.6e-05,
"loss": 0.0023,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8489208633093526,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8428571428571429,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7230769230769231,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6811594202898551,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9456869009584665,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.925,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7714285714285716,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6923076923076923,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.25416678190231323,
"eval_overall_accuracy": 0.9692841218726778,
"eval_overall_f1": 0.8575418994413407,
"eval_overall_precision": 0.8297297297297297,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3685,
"eval_samples_per_second": 507.471,
"eval_steps_per_second": 8.141,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 85.30389404296875,
"learning_rate": 3.55e-05,
"loss": 0.0042,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7441860465116278,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7058823529411765,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9551282051282051,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9371069182389937,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.24519670009613037,
"eval_overall_accuracy": 0.9687887044835274,
"eval_overall_f1": 0.8678720445062588,
"eval_overall_precision": 0.8364611260053619,
"eval_overall_recall": 0.9017341040462428,
"eval_runtime": 0.3665,
"eval_samples_per_second": 510.289,
"eval_steps_per_second": 8.186,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.044042494148015976,
"learning_rate": 3.5e-05,
"loss": 0.0016,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.851063829787234,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8333333333333334,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6976744186046512,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6617647058823529,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9490445859872612,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9254658385093167,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2484143078327179,
"eval_overall_accuracy": 0.9695318305672529,
"eval_overall_f1": 0.8603351955307263,
"eval_overall_precision": 0.8324324324324325,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3654,
"eval_samples_per_second": 511.826,
"eval_steps_per_second": 8.211,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.03026013821363449,
"learning_rate": 3.45e-05,
"loss": 0.0017,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7480916030534351,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9430379746835442,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9141104294478528,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.29129624366760254,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8559670781893004,
"eval_overall_precision": 0.814621409921671,
"eval_overall_recall": 0.9017341040462428,
"eval_runtime": 0.3674,
"eval_samples_per_second": 508.961,
"eval_steps_per_second": 8.165,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 1.4942476749420166,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0033,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.855072463768116,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.855072463768116,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7819548872180451,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7222222222222222,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9487179487179488,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9308176100628931,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.84375,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.84375,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.23277780413627625,
"eval_overall_accuracy": 0.9722566262075799,
"eval_overall_f1": 0.880450070323488,
"eval_overall_precision": 0.8575342465753425,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.3786,
"eval_samples_per_second": 493.877,
"eval_steps_per_second": 7.923,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.0030820919200778008,
"learning_rate": 3.35e-05,
"loss": 0.0021,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7310344827586208,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6309523809523809,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.9245283018867925,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8909090909090909,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8484848484848485,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8235294117647058,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.28664737939834595,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8486486486486486,
"eval_overall_precision": 0.7969543147208121,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3626,
"eval_samples_per_second": 515.746,
"eval_steps_per_second": 8.274,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.013372019864618778,
"learning_rate": 3.3e-05,
"loss": 0.0034,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8450704225352113,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.821917808219178,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7536231884057972,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6753246753246753,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9363057324840764,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9130434782608695,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.24620448052883148,
"eval_overall_accuracy": 0.9705226653455536,
"eval_overall_f1": 0.8622589531680441,
"eval_overall_precision": 0.8236842105263158,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.3647,
"eval_samples_per_second": 512.754,
"eval_steps_per_second": 8.226,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.00117175851482898,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0018,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.851063829787234,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8333333333333334,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7536231884057972,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6753246753246753,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.930817610062893,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.896969696969697,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8615384615384615,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8484848484848485,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2648729979991913,
"eval_overall_accuracy": 0.9685409957889521,
"eval_overall_f1": 0.8665749656121046,
"eval_overall_precision": 0.8267716535433071,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3621,
"eval_samples_per_second": 516.468,
"eval_steps_per_second": 8.286,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.004863755311816931,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0015,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8652482269503546,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8472222222222222,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7741935483870968,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7619047619047619,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9333333333333333,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9074074074074074,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7941176470588235,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7297297297297297,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2638514041900635,
"eval_overall_accuracy": 0.9677978697052266,
"eval_overall_f1": 0.8667601683029452,
"eval_overall_precision": 0.8419618528610354,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.3838,
"eval_samples_per_second": 487.261,
"eval_steps_per_second": 7.817,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.002965473337098956,
"learning_rate": 3.15e-05,
"loss": 0.0029,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.8413793103448277,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7633587786259541,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9274447949526814,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8963414634146342,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2825859487056732,
"eval_overall_accuracy": 0.9670547436215011,
"eval_overall_f1": 0.8606896551724139,
"eval_overall_precision": 0.8232189973614775,
"eval_overall_recall": 0.9017341040462428,
"eval_runtime": 0.3647,
"eval_samples_per_second": 512.726,
"eval_steps_per_second": 8.226,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.022443190217018127,
"learning_rate": 3.1e-05,
"loss": 0.0027,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8413793103448277,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7391304347826089,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6623376623376623,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9456869009584665,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.925,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.7647058823529411,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.26482775807380676,
"eval_overall_accuracy": 0.9660639088432004,
"eval_overall_f1": 0.8598901098901098,
"eval_overall_precision": 0.819371727748691,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.377,
"eval_samples_per_second": 496.079,
"eval_steps_per_second": 7.958,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.018067799508571625,
"learning_rate": 3.05e-05,
"loss": 0.0028,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8611111111111112,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8266666666666667,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7969924812030076,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7361111111111112,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.9367088607594937,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9079754601226994,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8405797101449276,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7631578947368421,
"eval_TIME_recall": 0.9354838709677419,
"eval_loss": 0.2490389049053192,
"eval_overall_accuracy": 0.9687887044835274,
"eval_overall_f1": 0.8724279835390947,
"eval_overall_precision": 0.8302872062663186,
"eval_overall_recall": 0.9190751445086706,
"eval_runtime": 0.3616,
"eval_samples_per_second": 517.153,
"eval_steps_per_second": 8.297,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.012262631207704544,
"learning_rate": 3e-05,
"loss": 0.0015,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8695652173913043,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8695652173913043,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7323943661971831,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6419753086419753,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9456869009584665,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.925,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.23013749718666077,
"eval_overall_accuracy": 0.9712657914292792,
"eval_overall_f1": 0.8698060941828255,
"eval_overall_precision": 0.8351063829787234,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3684,
"eval_samples_per_second": 507.649,
"eval_steps_per_second": 8.144,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.0009043277241289616,
"learning_rate": 2.95e-05,
"loss": 0.0024,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.853146853146853,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7591240875912408,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9430379746835442,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9141104294478528,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2405707687139511,
"eval_overall_accuracy": 0.9677978697052266,
"eval_overall_f1": 0.8677685950413223,
"eval_overall_precision": 0.8289473684210527,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3649,
"eval_samples_per_second": 512.484,
"eval_steps_per_second": 8.222,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.08815114200115204,
"learning_rate": 2.9e-05,
"loss": 0.0015,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.851063829787234,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8333333333333334,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7704918032786885,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7704918032786885,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9456869009584665,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.925,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2553688883781433,
"eval_overall_accuracy": 0.9695318305672529,
"eval_overall_f1": 0.8781869688385271,
"eval_overall_precision": 0.8611111111111112,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3688,
"eval_samples_per_second": 507.104,
"eval_steps_per_second": 8.135,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.0011932431953027844,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0008,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8591549295774648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8356164383561644,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7538461538461538,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7101449275362319,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9303797468354431,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.901840490797546,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.26496070623397827,
"eval_overall_accuracy": 0.9690364131781025,
"eval_overall_f1": 0.8666666666666667,
"eval_overall_precision": 0.8342245989304813,
"eval_overall_recall": 0.9017341040462428,
"eval_runtime": 0.3652,
"eval_samples_per_second": 512.034,
"eval_steps_per_second": 8.214,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 3.7293193340301514,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0017,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8333333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6710526315789473,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9423076923076923,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9245283018867925,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7575757575757576,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.8615384615384616,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8235294117647058,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.26268908381462097,
"eval_overall_accuracy": 0.9677978697052266,
"eval_overall_f1": 0.8603042876901797,
"eval_overall_precision": 0.8249336870026526,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3678,
"eval_samples_per_second": 508.483,
"eval_steps_per_second": 8.157,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 0.6390479803085327,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0013,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8732394366197183,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8493150684931506,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7464788732394366,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.9363057324840764,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9130434782608695,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.25916871428489685,
"eval_overall_accuracy": 0.9695318305672529,
"eval_overall_f1": 0.8684931506849316,
"eval_overall_precision": 0.8255208333333334,
"eval_overall_recall": 0.9161849710982659,
"eval_runtime": 0.3656,
"eval_samples_per_second": 511.447,
"eval_steps_per_second": 8.205,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.010238826274871826,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0026,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.9216300940438872,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8855421686746988,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.823529411764706,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2907452881336212,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8521505376344086,
"eval_overall_precision": 0.7964824120603015,
"eval_overall_recall": 0.9161849710982659,
"eval_runtime": 0.3653,
"eval_samples_per_second": 511.904,
"eval_steps_per_second": 8.212,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.0005274274735711515,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0018,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8611111111111112,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8266666666666667,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7591240875912408,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.930817610062893,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.896969696969697,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.7462686567164178,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.2971247136592865,
"eval_overall_accuracy": 0.9658162001486252,
"eval_overall_f1": 0.8567530695770805,
"eval_overall_precision": 0.8113695090439277,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3657,
"eval_samples_per_second": 511.396,
"eval_steps_per_second": 8.204,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.014134509488940239,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0014,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8571428571428571,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8450704225352113,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7445255474452555,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6710526315789473,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.935897435897436,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9182389937106918,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2763230800628662,
"eval_overall_accuracy": 0.9680455783998019,
"eval_overall_f1": 0.8659217877094972,
"eval_overall_precision": 0.8378378378378378,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3626,
"eval_samples_per_second": 515.776,
"eval_steps_per_second": 8.274,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.01190261635929346,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0019,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.8450704225352113,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.821917808219178,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7058823529411764,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9294871794871795,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9119496855345912,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.8307692307692308,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8709677419354839,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8709677419354839,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.27485761046409607,
"eval_overall_accuracy": 0.9677978697052266,
"eval_overall_f1": 0.8563458856345887,
"eval_overall_precision": 0.8274932614555256,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3612,
"eval_samples_per_second": 517.682,
"eval_steps_per_second": 8.305,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.1005834341049194,
"learning_rate": 2.5e-05,
"loss": 0.0014,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7205882352941175,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6533333333333333,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9517684887459807,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9367088607594937,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8615384615384616,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8235294117647058,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.29507261514663696,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8571428571428571,
"eval_overall_precision": 0.8167539267015707,
"eval_overall_recall": 0.9017341040462428,
"eval_runtime": 0.3618,
"eval_samples_per_second": 516.881,
"eval_steps_per_second": 8.292,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.0018566737417131662,
"learning_rate": 2.45e-05,
"loss": 0.0017,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6962962962962963,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6351351351351351,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9329073482428115,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9125,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.28224554657936096,
"eval_overall_accuracy": 0.9630914045082982,
"eval_overall_f1": 0.8468965517241379,
"eval_overall_precision": 0.8100263852242744,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3638,
"eval_samples_per_second": 514.07,
"eval_steps_per_second": 8.247,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.00030757131753489375,
"learning_rate": 2.4e-05,
"loss": 0.0015,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8322147651006713,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7142857142857143,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6329113924050633,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9423076923076923,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9245283018867925,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.29711785912513733,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8528610354223434,
"eval_overall_precision": 0.8067010309278351,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.362,
"eval_samples_per_second": 516.559,
"eval_steps_per_second": 8.287,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.012948980554938316,
"learning_rate": 2.35e-05,
"loss": 0.0013,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6956521739130435,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6233766233766234,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9040247678018575,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8588235294117647,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.3104041516780853,
"eval_overall_accuracy": 0.9630914045082982,
"eval_overall_f1": 0.8340080971659919,
"eval_overall_precision": 0.7822784810126582,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.3612,
"eval_samples_per_second": 517.74,
"eval_steps_per_second": 8.306,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.00616478780284524,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0014,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.746031746031746,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7230769230769231,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.923076923076923,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9056603773584906,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7575757575757576,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.28169548511505127,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8559440559440559,
"eval_overall_precision": 0.8292682926829268,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3661,
"eval_samples_per_second": 510.754,
"eval_steps_per_second": 8.194,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.0019178962102159858,
"learning_rate": 2.25e-05,
"loss": 0.0005,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.711111111111111,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6486486486486487,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9453376205787781,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.930379746835443,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.9032258064516129,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.9032258064516129,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.29151037335395813,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8623087621696801,
"eval_overall_precision": 0.8310991957104558,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3686,
"eval_samples_per_second": 507.352,
"eval_steps_per_second": 8.139,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.0005920439143665135,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0009,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8413793103448277,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8026315789473685,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7299270072992702,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6578947368421053,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9487179487179488,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9308176100628931,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.9032258064516129,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.9032258064516129,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.30188778042793274,
"eval_overall_accuracy": 0.9663116175377756,
"eval_overall_f1": 0.8670360110803323,
"eval_overall_precision": 0.8324468085106383,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.3652,
"eval_samples_per_second": 512.012,
"eval_steps_per_second": 8.214,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.0004883262445218861,
"learning_rate": 2.15e-05,
"loss": 0.0009,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8450704225352113,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.821917808219178,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7164179104477612,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.939297124600639,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.91875,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.9032258064516129,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.9032258064516129,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2943618893623352,
"eval_overall_accuracy": 0.9665593262323507,
"eval_overall_f1": 0.8631284916201116,
"eval_overall_precision": 0.8351351351351352,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.3709,
"eval_samples_per_second": 504.197,
"eval_steps_per_second": 8.089,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.0014432142488658428,
"learning_rate": 2.1e-05,
"loss": 0.0006,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8368794326241135,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8194444444444444,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7230769230769231,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6811594202898551,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9363057324840764,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9130434782608695,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.9032258064516129,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.9032258064516129,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.28986239433288574,
"eval_overall_accuracy": 0.9663116175377756,
"eval_overall_f1": 0.8623595505617977,
"eval_overall_precision": 0.8387978142076503,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3712,
"eval_samples_per_second": 503.757,
"eval_steps_per_second": 8.082,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.0014531804481521249,
"learning_rate": 2.05e-05,
"loss": 0.0005,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8472222222222223,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7375886524822695,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9517684887459807,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9367088607594937,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.29187676310539246,
"eval_overall_accuracy": 0.9677978697052266,
"eval_overall_f1": 0.8653846153846154,
"eval_overall_precision": 0.824607329842932,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3703,
"eval_samples_per_second": 505.003,
"eval_steps_per_second": 8.102,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.000528964155819267,
"learning_rate": 2e-05,
"loss": 0.0006,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.68,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9426751592356687,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9192546583850931,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.3160874545574188,
"eval_overall_accuracy": 0.9638345305920237,
"eval_overall_f1": 0.8579234972677596,
"eval_overall_precision": 0.8134715025906736,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3784,
"eval_samples_per_second": 494.206,
"eval_steps_per_second": 7.928,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.001857202616520226,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0017,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7518796992481204,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6944444444444444,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9396825396825397,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9135802469135802,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.84375,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.84375,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2975999414920807,
"eval_overall_accuracy": 0.9658162001486252,
"eval_overall_f1": 0.8638239339752408,
"eval_overall_precision": 0.8241469816272966,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3649,
"eval_samples_per_second": 512.529,
"eval_steps_per_second": 8.222,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.0003795857774093747,
"learning_rate": 1.9e-05,
"loss": 0.0004,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.746031746031746,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7230769230769231,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9456869009584665,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.925,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.3019534647464752,
"eval_overall_accuracy": 0.9638345305920237,
"eval_overall_f1": 0.8599167822468794,
"eval_overall_precision": 0.8266666666666667,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3666,
"eval_samples_per_second": 510.155,
"eval_steps_per_second": 8.184,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.00042081772699020803,
"learning_rate": 1.85e-05,
"loss": 0.0004,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.821917808219178,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.762589928057554,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6794871794871795,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.9453376205787781,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.930379746835443,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2791728079319,
"eval_overall_accuracy": 0.966807034926926,
"eval_overall_f1": 0.861454046639232,
"eval_overall_precision": 0.8198433420365535,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3576,
"eval_samples_per_second": 522.878,
"eval_steps_per_second": 8.388,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.015575162135064602,
"learning_rate": 1.8e-05,
"loss": 0.001,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8137931034482757,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6235294117647059,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.946031746031746,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9197530864197531,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2865269184112549,
"eval_overall_accuracy": 0.9665593262323507,
"eval_overall_f1": 0.8598639455782313,
"eval_overall_precision": 0.8123393316195373,
"eval_overall_recall": 0.9132947976878613,
"eval_runtime": 0.3652,
"eval_samples_per_second": 512.011,
"eval_steps_per_second": 8.214,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.0011894090566784143,
"learning_rate": 1.75e-05,
"loss": 0.0011,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8201438848920863,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8142857142857143,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.732824427480916,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6857142857142857,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9490445859872612,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9254658385093167,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.291652649641037,
"eval_overall_accuracy": 0.9680455783998019,
"eval_overall_f1": 0.8639551192145861,
"eval_overall_precision": 0.8392370572207084,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.361,
"eval_samples_per_second": 518.053,
"eval_steps_per_second": 8.311,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.0299760140478611,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0014,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.8055555555555556,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7733333333333333,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7375886524822695,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.946031746031746,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9197530864197531,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.27525565028190613,
"eval_overall_accuracy": 0.9685409957889521,
"eval_overall_f1": 0.8598901098901098,
"eval_overall_precision": 0.819371727748691,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.3758,
"eval_samples_per_second": 497.654,
"eval_steps_per_second": 7.984,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.0006641316576860845,
"learning_rate": 1.65e-05,
"loss": 0.0005,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7361111111111112,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6385542168674698,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.9400630914826499,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9085365853658537,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.288452684879303,
"eval_overall_accuracy": 0.9663116175377756,
"eval_overall_f1": 0.8583106267029972,
"eval_overall_precision": 0.8118556701030928,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3617,
"eval_samples_per_second": 516.981,
"eval_steps_per_second": 8.294,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.0003661834343802184,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0004,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7647058823529411,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6933333333333334,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9551282051282051,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9371069182389937,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2738393545150757,
"eval_overall_accuracy": 0.971018082734704,
"eval_overall_f1": 0.8750000000000001,
"eval_overall_precision": 0.8422459893048129,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3691,
"eval_samples_per_second": 506.591,
"eval_steps_per_second": 8.127,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.00032552139600738883,
"learning_rate": 1.55e-05,
"loss": 0.0002,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8333333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7555555555555555,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6891891891891891,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9551282051282051,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9371069182389937,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.9032258064516129,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.9032258064516129,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2714591920375824,
"eval_overall_accuracy": 0.971018082734704,
"eval_overall_f1": 0.8758716875871689,
"eval_overall_precision": 0.8463611859838275,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3611,
"eval_samples_per_second": 517.91,
"eval_steps_per_second": 8.309,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.0012234537862241268,
"learning_rate": 1.5e-05,
"loss": 0.0003,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8333333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7761194029850746,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7123287671232876,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.946031746031746,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9197530864197531,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.9032258064516129,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.9032258064516129,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2793043553829193,
"eval_overall_accuracy": 0.9705226653455536,
"eval_overall_f1": 0.8750000000000001,
"eval_overall_precision": 0.8422459893048129,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3626,
"eval_samples_per_second": 515.737,
"eval_steps_per_second": 8.274,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.00031636914354749024,
"learning_rate": 1.45e-05,
"loss": 0.0001,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8333333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7761194029850746,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7123287671232876,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9430379746835442,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9141104294478528,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.9032258064516129,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.9032258064516129,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.29805585741996765,
"eval_overall_accuracy": 0.9690364131781025,
"eval_overall_f1": 0.8737864077669903,
"eval_overall_precision": 0.84,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3626,
"eval_samples_per_second": 515.664,
"eval_steps_per_second": 8.273,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.003590099047869444,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0005,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.8260869565217391,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8260869565217391,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.7633587786259541,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9430379746835442,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9141104294478528,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8307692307692308,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.9032258064516129,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.9032258064516129,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.27618908882141113,
"eval_overall_accuracy": 0.9707703740401288,
"eval_overall_f1": 0.8735955056179775,
"eval_overall_precision": 0.8497267759562842,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3699,
"eval_samples_per_second": 505.485,
"eval_steps_per_second": 8.109,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.00027959441649727523,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0002,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8391608391608392,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.68,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.946031746031746,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9197530864197531,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.9032258064516129,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.9032258064516129,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.28340503573417664,
"eval_overall_accuracy": 0.9685409957889521,
"eval_overall_f1": 0.8698060941828255,
"eval_overall_precision": 0.8351063829787234,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.362,
"eval_samples_per_second": 516.608,
"eval_steps_per_second": 8.288,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.00044001045171171427,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0002,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7681159420289856,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6883116883116883,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.9551282051282051,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9371069182389937,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.27885836362838745,
"eval_overall_accuracy": 0.9695318305672529,
"eval_overall_f1": 0.8756906077348067,
"eval_overall_precision": 0.8386243386243386,
"eval_overall_recall": 0.9161849710982659,
"eval_runtime": 0.3657,
"eval_samples_per_second": 511.381,
"eval_steps_per_second": 8.204,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.00027540308656170964,
"learning_rate": 1.25e-05,
"loss": 0.0001,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.821917808219178,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7737226277372262,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6973684210526315,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.9430379746835442,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9141104294478528,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7941176470588235,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2948344945907593,
"eval_overall_accuracy": 0.9673024523160763,
"eval_overall_f1": 0.8708791208791209,
"eval_overall_precision": 0.8298429319371727,
"eval_overall_recall": 0.9161849710982659,
"eval_runtime": 0.3634,
"eval_samples_per_second": 514.56,
"eval_steps_per_second": 8.255,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.007422334514558315,
"learning_rate": 1.2e-05,
"loss": 0.0004,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7067669172932329,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6527777777777778,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9400630914826499,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9085365853658537,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8307692307692308,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.3101661205291748,
"eval_overall_accuracy": 0.966807034926926,
"eval_overall_f1": 0.8587257617728532,
"eval_overall_precision": 0.824468085106383,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3638,
"eval_samples_per_second": 513.997,
"eval_steps_per_second": 8.246,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.0005564504535868764,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0005,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7391304347826089,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6623376623376623,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9430379746835442,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9141104294478528,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.29981571435928345,
"eval_overall_accuracy": 0.9663116175377756,
"eval_overall_f1": 0.8618331053351572,
"eval_overall_precision": 0.8181818181818182,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3758,
"eval_samples_per_second": 497.657,
"eval_steps_per_second": 7.984,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.003542252816259861,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0002,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7703703703703704,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7027027027027027,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.946031746031746,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9197530864197531,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.28981682658195496,
"eval_overall_accuracy": 0.9675501610106515,
"eval_overall_f1": 0.8686030428769017,
"eval_overall_precision": 0.8328912466843501,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3708,
"eval_samples_per_second": 504.361,
"eval_steps_per_second": 8.091,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.0004401499463710934,
"learning_rate": 1.05e-05,
"loss": 0.0003,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.8169014084507042,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7945205479452054,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7538461538461538,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7101449275362319,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.952076677316294,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.93125,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.84375,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.84375,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2755199670791626,
"eval_overall_accuracy": 0.9695318305672529,
"eval_overall_f1": 0.8735955056179775,
"eval_overall_precision": 0.8497267759562842,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3648,
"eval_samples_per_second": 512.67,
"eval_steps_per_second": 8.225,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.00034126470563933253,
"learning_rate": 1e-05,
"loss": 0.0004,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7424242424242424,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6901408450704225,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9371069182389938,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9030303030303031,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.787878787878788,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2898205518722534,
"eval_overall_accuracy": 0.96556849145405,
"eval_overall_f1": 0.8532235939643347,
"eval_overall_precision": 0.8120104438642297,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3951,
"eval_samples_per_second": 473.261,
"eval_steps_per_second": 7.592,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.000562498637009412,
"learning_rate": 9.5e-06,
"loss": 0.0003,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8251748251748252,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7972972972972973,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.68,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9337539432176657,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9024390243902439,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.84375,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.84375,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.28580695390701294,
"eval_overall_accuracy": 0.9687887044835274,
"eval_overall_f1": 0.8646408839779005,
"eval_overall_precision": 0.828042328042328,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.3627,
"eval_samples_per_second": 515.648,
"eval_steps_per_second": 8.272,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.0003717710787896067,
"learning_rate": 9e-06,
"loss": 0.0004,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.765625,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7313432835820896,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9430379746835442,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9141104294478528,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.28542497754096985,
"eval_overall_accuracy": 0.9695318305672529,
"eval_overall_f1": 0.8650904033379694,
"eval_overall_precision": 0.8337801608579088,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3698,
"eval_samples_per_second": 505.716,
"eval_steps_per_second": 8.113,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.0019057561876252294,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0004,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7941176470588235,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.72,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.9400630914826499,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9085365853658537,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2824600636959076,
"eval_overall_accuracy": 0.9692841218726778,
"eval_overall_f1": 0.8688524590163936,
"eval_overall_precision": 0.8238341968911918,
"eval_overall_recall": 0.9190751445086706,
"eval_runtime": 0.3654,
"eval_samples_per_second": 511.741,
"eval_steps_per_second": 8.21,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.001229365007020533,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0006,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8226950354609929,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8055555555555556,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7874015748031497,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7575757575757576,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.952076677316294,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.93125,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.26607078313827515,
"eval_overall_accuracy": 0.9720089175130047,
"eval_overall_f1": 0.876056338028169,
"eval_overall_precision": 0.8543956043956044,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3766,
"eval_samples_per_second": 496.598,
"eval_steps_per_second": 7.967,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.00014708787784911692,
"learning_rate": 7.5e-06,
"loss": 0.0003,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8333333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7559055118110236,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7272727272727273,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9400630914826499,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9085365853658537,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.293227881193161,
"eval_overall_accuracy": 0.9677978697052266,
"eval_overall_f1": 0.8638888888888889,
"eval_overall_precision": 0.8315508021390374,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.364,
"eval_samples_per_second": 513.774,
"eval_steps_per_second": 8.242,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.003805099753662944,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0006,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8345323741007195,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8285714285714286,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.768,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.946031746031746,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9197530864197531,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8307692307692308,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2930375337600708,
"eval_overall_accuracy": 0.9685409957889521,
"eval_overall_f1": 0.8732394366197184,
"eval_overall_precision": 0.8516483516483516,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3668,
"eval_samples_per_second": 509.746,
"eval_steps_per_second": 8.178,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.04100840538740158,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0005,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8169014084507042,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7945205479452054,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7559055118110236,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7272727272727273,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.93125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8922155688622755,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.823529411764706,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.3029007911682129,
"eval_overall_accuracy": 0.9663116175377756,
"eval_overall_f1": 0.8559556786703602,
"eval_overall_precision": 0.8218085106382979,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.3762,
"eval_samples_per_second": 497.075,
"eval_steps_per_second": 7.974,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.0002212318213423714,
"learning_rate": 6e-06,
"loss": 0.0003,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8251748251748252,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7972972972972973,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7786259541984734,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.93125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8922155688622755,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8115942028985507,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7368421052631579,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.30660566687583923,
"eval_overall_accuracy": 0.9665593262323507,
"eval_overall_f1": 0.8598901098901098,
"eval_overall_precision": 0.819371727748691,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.3705,
"eval_samples_per_second": 504.729,
"eval_steps_per_second": 8.097,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.000250909011811018,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0001,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8137931034482757,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7692307692307692,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7246376811594203,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9341692789968652,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8975903614457831,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8115942028985507,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7368421052631579,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.30867499113082886,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8571428571428571,
"eval_overall_precision": 0.8167539267015707,
"eval_overall_recall": 0.9017341040462428,
"eval_runtime": 0.3615,
"eval_samples_per_second": 517.307,
"eval_steps_per_second": 8.299,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.00021638131875079125,
"learning_rate": 5e-06,
"loss": 0.0001,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8266666666666668,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7633587786259541,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9216300940438872,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8855421686746988,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.31429383158683777,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8551912568306012,
"eval_overall_precision": 0.810880829015544,
"eval_overall_recall": 0.9046242774566474,
"eval_runtime": 0.3713,
"eval_samples_per_second": 503.676,
"eval_steps_per_second": 8.08,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.00013644745922647417,
"learning_rate": 4.5e-06,
"loss": 0.0001,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7786259541984734,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.930817610062893,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.896969696969697,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.2944120168685913,
"eval_overall_accuracy": 0.968293287094377,
"eval_overall_f1": 0.861454046639232,
"eval_overall_precision": 0.8198433420365535,
"eval_overall_recall": 0.9075144508670521,
"eval_runtime": 0.3632,
"eval_samples_per_second": 514.858,
"eval_steps_per_second": 8.26,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.0009539081365801394,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0002,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8322147651006713,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7727272727272727,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7183098591549296,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9249999999999999,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8862275449101796,
"eval_PERSON_recall": 0.9673202614379085,
"eval_QUANTITY_f1": 0.8307692307692308,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.823529411764706,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.31182703375816345,
"eval_overall_accuracy": 0.9670547436215011,
"eval_overall_f1": 0.8610354223433242,
"eval_overall_precision": 0.8144329896907216,
"eval_overall_recall": 0.9132947976878613,
"eval_runtime": 0.3679,
"eval_samples_per_second": 508.226,
"eval_steps_per_second": 8.153,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.00018770851602312177,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0003,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7786259541984734,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.93125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8922155688622755,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8307692307692308,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.30489107966423035,
"eval_overall_accuracy": 0.968293287094377,
"eval_overall_f1": 0.8684931506849316,
"eval_overall_precision": 0.8255208333333334,
"eval_overall_recall": 0.9161849710982659,
"eval_runtime": 0.3644,
"eval_samples_per_second": 513.217,
"eval_steps_per_second": 8.233,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.0019927462562918663,
"learning_rate": 3e-06,
"loss": 0.0001,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7786259541984734,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.93125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8922155688622755,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8307692307692308,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8181818181818182,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.3039020299911499,
"eval_overall_accuracy": 0.968293287094377,
"eval_overall_f1": 0.8657534246575342,
"eval_overall_precision": 0.8229166666666666,
"eval_overall_recall": 0.9132947976878613,
"eval_runtime": 0.3778,
"eval_samples_per_second": 494.941,
"eval_steps_per_second": 7.94,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.00036656216252595186,
"learning_rate": 2.5e-06,
"loss": 0.0003,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7786259541984734,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9371069182389938,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.9030303030303031,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.30329030752182007,
"eval_overall_accuracy": 0.968293287094377,
"eval_overall_f1": 0.8641975308641975,
"eval_overall_precision": 0.8224543080939948,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3655,
"eval_samples_per_second": 511.653,
"eval_steps_per_second": 8.208,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.00014269202074501663,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0005,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7786259541984734,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.93125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8922155688622755,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.30583375692367554,
"eval_overall_accuracy": 0.9675501610106515,
"eval_overall_f1": 0.8618331053351572,
"eval_overall_precision": 0.8181818181818182,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3755,
"eval_samples_per_second": 497.939,
"eval_steps_per_second": 7.988,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.0001223723666043952,
"learning_rate": 1.5e-06,
"loss": 0.0001,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7786259541984734,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9341692789968652,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8975903614457831,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.3053462505340576,
"eval_overall_accuracy": 0.9677978697052266,
"eval_overall_f1": 0.863013698630137,
"eval_overall_precision": 0.8203125,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3619,
"eval_samples_per_second": 516.75,
"eval_steps_per_second": 8.29,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.0004060152277816087,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0001,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7786259541984734,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9341692789968652,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8975903614457831,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.3043583929538727,
"eval_overall_accuracy": 0.9677978697052266,
"eval_overall_f1": 0.863013698630137,
"eval_overall_precision": 0.8203125,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3759,
"eval_samples_per_second": 497.529,
"eval_steps_per_second": 7.982,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.00019621806859504431,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0001,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7786259541984734,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.93125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8922155688622755,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.3064700961112976,
"eval_overall_accuracy": 0.9675501610106515,
"eval_overall_f1": 0.8618331053351572,
"eval_overall_precision": 0.8181818181818182,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3646,
"eval_samples_per_second": 512.932,
"eval_steps_per_second": 8.229,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.0006661502993665636,
"learning_rate": 0.0,
"loss": 0.0001,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7786259541984734,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.7285714285714285,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.93125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8922155688622755,
"eval_PERSON_recall": 0.9738562091503268,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.3065154552459717,
"eval_overall_accuracy": 0.9675501610106515,
"eval_overall_f1": 0.8618331053351572,
"eval_overall_precision": 0.8181818181818182,
"eval_overall_recall": 0.9104046242774566,
"eval_runtime": 0.3714,
"eval_samples_per_second": 503.447,
"eval_steps_per_second": 8.077,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4560509291304846.0,
"train_loss": 0.008112131665891283,
"train_runtime": 974.3295,
"train_samples_per_second": 173.145,
"train_steps_per_second": 10.879
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4560509291304846.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}