{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 3.2015111446380615, "learning_rate": 4.9500000000000004e-05, "loss": 0.3254, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.8082191780821918, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7662337662337663, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.5901639344262295, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5901639344262295, "eval_ORGANIZATION_recall": 0.5901639344262295, "eval_PERSON_f1": 0.89937106918239, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8666666666666667, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.12376317381858826, "eval_overall_accuracy": 0.9581372306167947, "eval_overall_f1": 0.8072122052704577, "eval_overall_precision": 0.776, "eval_overall_recall": 0.8410404624277457, "eval_runtime": 0.3597, "eval_samples_per_second": 519.816, "eval_steps_per_second": 8.339, "step": 106 }, { "epoch": 2.0, "grad_norm": 3.5055294036865234, "learning_rate": 4.9e-05, "loss": 0.1103, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.8028169014084506, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7808219178082192, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.6918238993710693, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5612244897959183, "eval_ORGANIZATION_recall": 0.9016393442622951, "eval_PERSON_f1": 0.89375, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8562874251497006, "eval_PERSON_recall": 0.934640522875817, "eval_QUANTITY_f1": 0.742857142857143, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.6842105263157895, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7647058823529411, "eval_TIME_number": 31, "eval_TIME_precision": 0.7027027027027027, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.14232417941093445, "eval_overall_accuracy": 0.9556601436710429, "eval_overall_f1": 0.8089591567852438, "eval_overall_precision": 0.7433414043583535, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3736, "eval_samples_per_second": 500.519, "eval_steps_per_second": 8.03, "step": 212 }, { "epoch": 3.0, "grad_norm": 3.338141918182373, "learning_rate": 4.85e-05, "loss": 0.0719, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.7945205479452054, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7532467532467533, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.6749999999999999, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5454545454545454, "eval_ORGANIZATION_recall": 0.8852459016393442, "eval_PERSON_f1": 0.909657320872274, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8690476190476191, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 31, "eval_TIME_precision": 0.84375, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.14947976171970367, "eval_overall_accuracy": 0.9593757740896706, "eval_overall_f1": 0.8194993412384717, "eval_overall_precision": 0.7530266343825666, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3603, "eval_samples_per_second": 519.072, "eval_steps_per_second": 8.327, "step": 318 }, { "epoch": 4.0, "grad_norm": 1.6828668117523193, "learning_rate": 4.8e-05, "loss": 0.0492, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.8194444444444444, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7866666666666666, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7552447552447552, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6585365853658537, "eval_ORGANIZATION_recall": 0.8852459016393442, "eval_PERSON_f1": 0.9130434782608696, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8698224852071006, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.75, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.675, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.7605633802816901, "eval_TIME_number": 31, "eval_TIME_precision": 0.675, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.1601407825946808, "eval_overall_accuracy": 0.9621005697299975, "eval_overall_f1": 0.8351063829787234, "eval_overall_precision": 0.7733990147783252, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3697, "eval_samples_per_second": 505.814, "eval_steps_per_second": 8.115, "step": 424 }, { "epoch": 5.0, "grad_norm": 1.3032749891281128, "learning_rate": 4.75e-05, "loss": 0.0315, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.7619047619047619, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.717948717948718, "eval_LOCATION_recall": 0.8115942028985508, "eval_ORGANIZATION_f1": 0.6423357664233578, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5789473684210527, "eval_ORGANIZATION_recall": 0.7213114754098361, "eval_PERSON_f1": 0.9216300940438872, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8855421686746988, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7575757575757576, "eval_TIME_number": 31, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.8064516129032258, "eval_loss": 0.1780991554260254, "eval_overall_accuracy": 0.9583849393113698, "eval_overall_f1": 0.8086838534599727, "eval_overall_precision": 0.7621483375959079, "eval_overall_recall": 0.861271676300578, "eval_runtime": 0.3628, "eval_samples_per_second": 515.381, "eval_steps_per_second": 8.268, "step": 530 }, { "epoch": 6.0, "grad_norm": 1.877514362335205, "learning_rate": 4.7e-05, "loss": 0.0217, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7724137931034482, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7368421052631579, "eval_LOCATION_recall": 0.8115942028985508, "eval_ORGANIZATION_f1": 0.7397260273972602, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6352941176470588, "eval_ORGANIZATION_recall": 0.8852459016393442, "eval_PERSON_f1": 0.9245283018867925, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8909090909090909, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7222222222222223, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.65, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.17554225027561188, "eval_overall_accuracy": 0.9606143175625464, "eval_overall_f1": 0.8277703604806409, "eval_overall_precision": 0.7692307692307693, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3662, "eval_samples_per_second": 510.654, "eval_steps_per_second": 8.192, "step": 636 }, { "epoch": 7.0, "grad_norm": 0.2853144705295563, "learning_rate": 4.6500000000000005e-05, "loss": 0.0168, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7777777777777779, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7466666666666667, "eval_LOCATION_recall": 0.8115942028985508, "eval_ORGANIZATION_f1": 0.6901408450704226, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6049382716049383, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.915360501567398, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8795180722891566, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8253968253968254, "eval_TIME_number": 31, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.19883674383163452, "eval_overall_accuracy": 0.9608620262571216, "eval_overall_f1": 0.8244897959183674, "eval_overall_precision": 0.7789203084832905, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3599, "eval_samples_per_second": 519.614, "eval_steps_per_second": 8.336, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.052625108510255814, "learning_rate": 4.600000000000001e-05, "loss": 0.0134, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.8082191780821918, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7662337662337663, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6857142857142857, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6075949367088608, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9216300940438872, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8855421686746988, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7575757575757576, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7352941176470589, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.8115942028985507, "eval_TIME_number": 31, "eval_TIME_precision": 0.7368421052631579, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.19897328317165375, "eval_overall_accuracy": 0.9601189001733961, "eval_overall_f1": 0.8297297297297296, "eval_overall_precision": 0.7791878172588832, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3619, "eval_samples_per_second": 516.738, "eval_steps_per_second": 8.29, "step": 848 }, { "epoch": 9.0, "grad_norm": 0.2537504732608795, "learning_rate": 4.55e-05, "loss": 0.0101, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.8211920529801324, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.6929133858267716, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7213114754098361, "eval_PERSON_f1": 0.9311475409836065, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9342105263157895, "eval_PERSON_recall": 0.9281045751633987, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.20098058879375458, "eval_overall_accuracy": 0.9643299479811741, "eval_overall_f1": 0.8400556328233658, "eval_overall_precision": 0.8096514745308311, "eval_overall_recall": 0.8728323699421965, "eval_runtime": 0.3599, "eval_samples_per_second": 519.595, "eval_steps_per_second": 8.336, "step": 954 }, { "epoch": 10.0, "grad_norm": 0.2351408451795578, "learning_rate": 4.5e-05, "loss": 0.0101, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.8513513513513514, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7974683544303798, "eval_LOCATION_recall": 0.9130434782608695, "eval_ORGANIZATION_f1": 0.7445255474452555, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6710526315789473, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9148264984227129, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8841463414634146, "eval_PERSON_recall": 0.9477124183006536, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2193160206079483, "eval_overall_accuracy": 0.9638345305920237, "eval_overall_f1": 0.8509485094850948, "eval_overall_precision": 0.8010204081632653, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3607, "eval_samples_per_second": 518.462, "eval_steps_per_second": 8.318, "step": 1060 }, { "epoch": 11.0, "grad_norm": 0.03327617421746254, "learning_rate": 4.4500000000000004e-05, "loss": 0.0063, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.8226950354609929, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8055555555555556, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7205882352941175, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6533333333333333, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9303797468354431, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.901840490797546, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.782608695652174, "eval_TIME_number": 31, "eval_TIME_precision": 0.7105263157894737, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.22587580978870392, "eval_overall_accuracy": 0.9628436958137231, "eval_overall_f1": 0.8426812585499317, "eval_overall_precision": 0.8, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3625, "eval_samples_per_second": 515.878, "eval_steps_per_second": 8.276, "step": 1166 }, { "epoch": 12.0, "grad_norm": 5.140894412994385, "learning_rate": 4.4000000000000006e-05, "loss": 0.0059, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.7517730496453902, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7361111111111112, "eval_LOCATION_recall": 0.7681159420289855, "eval_ORGANIZATION_f1": 0.6714285714285714, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5949367088607594, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9235668789808917, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9006211180124224, "eval_PERSON_recall": 0.9477124183006536, "eval_QUANTITY_f1": 0.84375, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.84375, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.23827865719795227, "eval_overall_accuracy": 0.9650730740648997, "eval_overall_f1": 0.8271092669432919, "eval_overall_precision": 0.7931034482758621, "eval_overall_recall": 0.8641618497109826, "eval_runtime": 0.3692, "eval_samples_per_second": 506.502, "eval_steps_per_second": 8.126, "step": 1272 }, { "epoch": 13.0, "grad_norm": 3.8915011882781982, "learning_rate": 4.35e-05, "loss": 0.007, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.7894736842105263, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9303797468354431, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.901840490797546, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.75, "eval_TIME_number": 31, "eval_TIME_precision": 0.6585365853658537, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.2511149048805237, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.8304405874499332, "eval_overall_precision": 0.771712158808933, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3685, "eval_samples_per_second": 507.422, "eval_steps_per_second": 8.14, "step": 1378 }, { "epoch": 14.0, "grad_norm": 0.0344400629401207, "learning_rate": 4.3e-05, "loss": 0.0058, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.7763157894736842, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7352941176470588, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7941176470588235, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.24048586189746857, "eval_overall_accuracy": 0.9648253653703245, "eval_overall_f1": 0.8451086956521738, "eval_overall_precision": 0.7974358974358975, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3742, "eval_samples_per_second": 499.756, "eval_steps_per_second": 8.017, "step": 1484 }, { "epoch": 15.0, "grad_norm": 0.006385091692209244, "learning_rate": 4.25e-05, "loss": 0.0053, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.7972972972972974, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7407407407407408, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6756756756756757, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.93125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8922155688622755, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.823529411764706, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7777777777777778, "eval_QUANTITY_recall": 0.875, "eval_TIME_f1": 0.7714285714285716, "eval_TIME_number": 31, "eval_TIME_precision": 0.6923076923076923, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.25498369336128235, "eval_overall_accuracy": 0.9623482784245727, "eval_overall_f1": 0.844804318488529, "eval_overall_precision": 0.7924050632911392, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.367, "eval_samples_per_second": 509.472, "eval_steps_per_second": 8.173, "step": 1590 }, { "epoch": 16.0, "grad_norm": 0.007103159092366695, "learning_rate": 4.2e-05, "loss": 0.0045, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.71875, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6865671641791045, "eval_ORGANIZATION_recall": 0.7540983606557377, "eval_PERSON_f1": 0.9367088607594937, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9079754601226994, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8615384615384615, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8484848484848485, "eval_QUANTITY_recall": 0.875, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.2411327213048935, "eval_overall_accuracy": 0.9663116175377756, "eval_overall_f1": 0.8559556786703602, "eval_overall_precision": 0.8218085106382979, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.367, "eval_samples_per_second": 509.544, "eval_steps_per_second": 8.175, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.005618996452540159, "learning_rate": 4.15e-05, "loss": 0.0044, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.8194444444444444, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7866666666666666, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7218045112781954, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9240506329113924, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8957055214723927, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.8615384615384615, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8484848484848485, "eval_QUANTITY_recall": 0.875, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.23781569302082062, "eval_overall_accuracy": 0.9663116175377756, "eval_overall_f1": 0.8496551724137931, "eval_overall_precision": 0.8126649076517151, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3633, "eval_samples_per_second": 514.728, "eval_steps_per_second": 8.258, "step": 1802 }, { "epoch": 18.0, "grad_norm": 0.00691909808665514, "learning_rate": 4.1e-05, "loss": 0.004, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.7891156462585034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7205882352941175, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6533333333333333, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9211356466876972, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8902439024390244, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8115942028985507, "eval_TIME_number": 31, "eval_TIME_precision": 0.7368421052631579, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.28217267990112305, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.8346883468834689, "eval_overall_precision": 0.7857142857142857, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3659, "eval_samples_per_second": 511.052, "eval_steps_per_second": 8.199, "step": 1908 }, { "epoch": 19.0, "grad_norm": 0.018693506717681885, "learning_rate": 4.05e-05, "loss": 0.0043, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.8275862068965517, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7894736842105263, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7058823529411764, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.64, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9426751592356687, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9192546583850931, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.823529411764706, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7777777777777778, "eval_QUANTITY_recall": 0.875, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.23565581440925598, "eval_overall_accuracy": 0.9658162001486252, "eval_overall_f1": 0.8547945205479451, "eval_overall_precision": 0.8125, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3727, "eval_samples_per_second": 501.787, "eval_steps_per_second": 8.05, "step": 2014 }, { "epoch": 20.0, "grad_norm": 0.0034094720613211393, "learning_rate": 4e-05, "loss": 0.0032, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.7702702702702703, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7215189873417721, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.7301587301587301, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7076923076923077, "eval_ORGANIZATION_recall": 0.7540983606557377, "eval_PERSON_f1": 0.9201277955271565, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9, "eval_PERSON_recall": 0.9411764705882353, "eval_QUANTITY_f1": 0.7941176470588235, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8615384615384616, "eval_TIME_number": 31, "eval_TIME_precision": 0.8235294117647058, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.24556776881217957, "eval_overall_accuracy": 0.9635868218974486, "eval_overall_f1": 0.8388888888888889, "eval_overall_precision": 0.8074866310160428, "eval_overall_recall": 0.8728323699421965, "eval_runtime": 0.3742, "eval_samples_per_second": 499.754, "eval_steps_per_second": 8.017, "step": 2120 }, { "epoch": 21.0, "grad_norm": 0.006027919240295887, "learning_rate": 3.9500000000000005e-05, "loss": 0.0036, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6986301369863014, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9126213592233009, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9038461538461539, "eval_PERSON_recall": 0.9215686274509803, "eval_QUANTITY_f1": 0.7714285714285714, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7105263157894737, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8253968253968254, "eval_TIME_number": 31, "eval_TIME_precision": 0.8125, "eval_TIME_recall": 0.8387096774193549, "eval_loss": 0.27808642387390137, "eval_overall_accuracy": 0.9618528610354223, "eval_overall_f1": 0.828804347826087, "eval_overall_precision": 0.782051282051282, "eval_overall_recall": 0.8815028901734104, "eval_runtime": 0.3671, "eval_samples_per_second": 509.462, "eval_steps_per_second": 8.173, "step": 2226 }, { "epoch": 22.0, "grad_norm": 0.08943280577659607, "learning_rate": 3.9000000000000006e-05, "loss": 0.0029, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.8356164383561644, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7922077922077922, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7464788732394366, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.654320987654321, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.930817610062893, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.896969696969697, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7941176470588235, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.782608695652174, "eval_TIME_number": 31, "eval_TIME_precision": 0.7105263157894737, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.3044780194759369, "eval_overall_accuracy": 0.9635868218974486, "eval_overall_f1": 0.8506056527590848, "eval_overall_precision": 0.7959697732997482, "eval_overall_recall": 0.9132947976878613, "eval_runtime": 0.3751, "eval_samples_per_second": 498.515, "eval_steps_per_second": 7.998, "step": 2332 }, { "epoch": 23.0, "grad_norm": 0.008143425919115543, "learning_rate": 3.85e-05, "loss": 0.0023, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.8551724137931034, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8157894736842105, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.6911764705882353, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6266666666666667, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9367088607594937, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9079754601226994, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7941176470588235, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.2635738253593445, "eval_overall_accuracy": 0.9663116175377756, "eval_overall_f1": 0.8520547945205479, "eval_overall_precision": 0.8098958333333334, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3625, "eval_samples_per_second": 515.906, "eval_steps_per_second": 8.277, "step": 2438 }, { "epoch": 24.0, "grad_norm": 14.303221702575684, "learning_rate": 3.8e-05, "loss": 0.0059, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.786206896551724, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.7, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.620253164556962, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9426751592356687, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9192546583850931, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7826086956521738, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7297297297297297, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.272360235452652, "eval_overall_accuracy": 0.9633391132028735, "eval_overall_f1": 0.8392370572207084, "eval_overall_precision": 0.7938144329896907, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3692, "eval_samples_per_second": 506.476, "eval_steps_per_second": 8.125, "step": 2544 }, { "epoch": 25.0, "grad_norm": 0.13158877193927765, "learning_rate": 3.7500000000000003e-05, "loss": 0.002, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.8137931034482757, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7763157894736842, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.6666666666666666, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.5875, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9389067524115756, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9240506329113924, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.7536231884057971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7027027027027027, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8615384615384616, "eval_TIME_number": 31, "eval_TIME_precision": 0.8235294117647058, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.25297293066978455, "eval_overall_accuracy": 0.9648253653703245, "eval_overall_f1": 0.8372093023255814, "eval_overall_precision": 0.7948051948051948, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3604, "eval_samples_per_second": 518.829, "eval_steps_per_second": 8.323, "step": 2650 }, { "epoch": 26.0, "grad_norm": 1.7319470643997192, "learning_rate": 3.7e-05, "loss": 0.0037, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.7517730496453902, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7361111111111112, "eval_LOCATION_recall": 0.7681159420289855, "eval_ORGANIZATION_f1": 0.7007299270072993, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.631578947368421, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9299363057324841, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.906832298136646, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.7887323943661971, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.875, "eval_TIME_f1": 0.8115942028985507, "eval_TIME_number": 31, "eval_TIME_precision": 0.7368421052631579, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2652280628681183, "eval_overall_accuracy": 0.9601189001733961, "eval_overall_f1": 0.8278688524590163, "eval_overall_precision": 0.7849740932642487, "eval_overall_recall": 0.8757225433526011, "eval_runtime": 0.3664, "eval_samples_per_second": 510.378, "eval_steps_per_second": 8.188, "step": 2756 }, { "epoch": 27.0, "grad_norm": 0.21630139648914337, "learning_rate": 3.65e-05, "loss": 0.0052, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.8026315789473685, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.6993006993006993, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6097560975609756, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8615384615384615, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8484848484848485, "eval_QUANTITY_recall": 0.875, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.25186625123023987, "eval_overall_accuracy": 0.9663116175377756, "eval_overall_f1": 0.8463611859838275, "eval_overall_precision": 0.7929292929292929, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3644, "eval_samples_per_second": 513.133, "eval_steps_per_second": 8.232, "step": 2862 }, { "epoch": 28.0, "grad_norm": 0.007407509256154299, "learning_rate": 3.6e-05, "loss": 0.0023, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.8489208633093526, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8428571428571429, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7230769230769231, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6811594202898551, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9456869009584665, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.925, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8125, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7714285714285716, "eval_TIME_number": 31, "eval_TIME_precision": 0.6923076923076923, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.25416678190231323, "eval_overall_accuracy": 0.9692841218726778, "eval_overall_f1": 0.8575418994413407, "eval_overall_precision": 0.8297297297297297, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3685, "eval_samples_per_second": 507.471, "eval_steps_per_second": 8.141, "step": 2968 }, { "epoch": 29.0, "grad_norm": 85.30389404296875, "learning_rate": 3.55e-05, "loss": 0.0042, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.8356164383561644, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7922077922077922, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7441860465116278, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7058823529411765, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9551282051282051, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9371069182389937, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8059701492537314, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7714285714285715, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.24519670009613037, "eval_overall_accuracy": 0.9687887044835274, "eval_overall_f1": 0.8678720445062588, "eval_overall_precision": 0.8364611260053619, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3665, "eval_samples_per_second": 510.289, "eval_steps_per_second": 8.186, "step": 3074 }, { "epoch": 30.0, "grad_norm": 0.044042494148015976, "learning_rate": 3.5e-05, "loss": 0.0016, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.851063829787234, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8333333333333334, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6976744186046512, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6617647058823529, "eval_ORGANIZATION_recall": 0.7377049180327869, "eval_PERSON_f1": 0.9490445859872612, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9254658385093167, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8059701492537314, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7714285714285715, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.2484143078327179, "eval_overall_accuracy": 0.9695318305672529, "eval_overall_f1": 0.8603351955307263, "eval_overall_precision": 0.8324324324324325, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.3654, "eval_samples_per_second": 511.826, "eval_steps_per_second": 8.211, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.03026013821363449, "learning_rate": 3.45e-05, "loss": 0.0017, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7480916030534351, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.29129624366760254, "eval_overall_accuracy": 0.9643299479811741, "eval_overall_f1": 0.8559670781893004, "eval_overall_precision": 0.814621409921671, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3674, "eval_samples_per_second": 508.961, "eval_steps_per_second": 8.165, "step": 3286 }, { "epoch": 32.0, "grad_norm": 1.4942476749420166, "learning_rate": 3.4000000000000007e-05, "loss": 0.0033, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.855072463768116, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.855072463768116, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7819548872180451, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7222222222222222, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9487179487179488, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9308176100628931, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.84375, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.84375, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.23277780413627625, "eval_overall_accuracy": 0.9722566262075799, "eval_overall_f1": 0.880450070323488, "eval_overall_precision": 0.8575342465753425, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3786, "eval_samples_per_second": 493.877, "eval_steps_per_second": 7.923, "step": 3392 }, { "epoch": 33.0, "grad_norm": 0.0030820919200778008, "learning_rate": 3.35e-05, "loss": 0.0021, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.8194444444444444, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7866666666666666, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7310344827586208, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6309523809523809, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9245283018867925, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8909090909090909, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.8484848484848485, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8235294117647058, "eval_QUANTITY_recall": 0.875, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.28664737939834595, "eval_overall_accuracy": 0.9650730740648997, "eval_overall_f1": 0.8486486486486486, "eval_overall_precision": 0.7969543147208121, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3626, "eval_samples_per_second": 515.746, "eval_steps_per_second": 8.274, "step": 3498 }, { "epoch": 34.0, "grad_norm": 0.013372019864618778, "learning_rate": 3.3e-05, "loss": 0.0034, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.8450704225352113, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.821917808219178, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7536231884057972, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6753246753246753, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7941176470588235, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.24620448052883148, "eval_overall_accuracy": 0.9705226653455536, "eval_overall_f1": 0.8622589531680441, "eval_overall_precision": 0.8236842105263158, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3647, "eval_samples_per_second": 512.754, "eval_steps_per_second": 8.226, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.00117175851482898, "learning_rate": 3.2500000000000004e-05, "loss": 0.0018, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.851063829787234, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8333333333333334, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7536231884057972, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6753246753246753, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.930817610062893, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.896969696969697, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8615384615384615, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8484848484848485, "eval_QUANTITY_recall": 0.875, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.2648729979991913, "eval_overall_accuracy": 0.9685409957889521, "eval_overall_f1": 0.8665749656121046, "eval_overall_precision": 0.8267716535433071, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3621, "eval_samples_per_second": 516.468, "eval_steps_per_second": 8.286, "step": 3710 }, { "epoch": 36.0, "grad_norm": 0.004863755311816931, "learning_rate": 3.2000000000000005e-05, "loss": 0.0015, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.8652482269503546, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8472222222222222, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7741935483870968, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7619047619047619, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9333333333333333, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9074074074074074, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.7941176470588235, "eval_TIME_number": 31, "eval_TIME_precision": 0.7297297297297297, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.2638514041900635, "eval_overall_accuracy": 0.9677978697052266, "eval_overall_f1": 0.8667601683029452, "eval_overall_precision": 0.8419618528610354, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3838, "eval_samples_per_second": 487.261, "eval_steps_per_second": 7.817, "step": 3816 }, { "epoch": 37.0, "grad_norm": 0.002965473337098956, "learning_rate": 3.15e-05, "loss": 0.0029, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.8413793103448277, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8026315789473685, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7633587786259541, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9274447949526814, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8963414634146342, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.8059701492537314, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7714285714285715, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8307692307692308, "eval_TIME_number": 31, "eval_TIME_precision": 0.7941176470588235, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.2825859487056732, "eval_overall_accuracy": 0.9670547436215011, "eval_overall_f1": 0.8606896551724139, "eval_overall_precision": 0.8232189973614775, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3647, "eval_samples_per_second": 512.726, "eval_steps_per_second": 8.226, "step": 3922 }, { "epoch": 38.0, "grad_norm": 0.022443190217018127, "learning_rate": 3.1e-05, "loss": 0.0027, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8413793103448277, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8026315789473685, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7391304347826089, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6623376623376623, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9456869009584665, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.925, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7647058823529411, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7222222222222222, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.26482775807380676, "eval_overall_accuracy": 0.9660639088432004, "eval_overall_f1": 0.8598901098901098, "eval_overall_precision": 0.819371727748691, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.377, "eval_samples_per_second": 496.079, "eval_steps_per_second": 7.958, "step": 4028 }, { "epoch": 39.0, "grad_norm": 0.018067799508571625, "learning_rate": 3.05e-05, "loss": 0.0028, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8266666666666667, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7969924812030076, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7361111111111112, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9367088607594937, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9079754601226994, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8405797101449276, "eval_TIME_number": 31, "eval_TIME_precision": 0.7631578947368421, "eval_TIME_recall": 0.9354838709677419, "eval_loss": 0.2490389049053192, "eval_overall_accuracy": 0.9687887044835274, "eval_overall_f1": 0.8724279835390947, "eval_overall_precision": 0.8302872062663186, "eval_overall_recall": 0.9190751445086706, "eval_runtime": 0.3616, "eval_samples_per_second": 517.153, "eval_steps_per_second": 8.297, "step": 4134 }, { "epoch": 40.0, "grad_norm": 0.012262631207704544, "learning_rate": 3e-05, "loss": 0.0015, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.8695652173913043, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8695652173913043, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7323943661971831, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6419753086419753, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9456869009584665, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.925, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.875, "eval_TIME_number": 31, "eval_TIME_precision": 0.8484848484848485, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.23013749718666077, "eval_overall_accuracy": 0.9712657914292792, "eval_overall_f1": 0.8698060941828255, "eval_overall_precision": 0.8351063829787234, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3684, "eval_samples_per_second": 507.649, "eval_steps_per_second": 8.144, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.0009043277241289616, "learning_rate": 2.95e-05, "loss": 0.0024, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.853146853146853, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8243243243243243, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7591240875912408, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6842105263157895, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.84375, "eval_TIME_number": 31, "eval_TIME_precision": 0.8181818181818182, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.2405707687139511, "eval_overall_accuracy": 0.9677978697052266, "eval_overall_f1": 0.8677685950413223, "eval_overall_precision": 0.8289473684210527, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3649, "eval_samples_per_second": 512.484, "eval_steps_per_second": 8.222, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.08815114200115204, "learning_rate": 2.9e-05, "loss": 0.0015, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.851063829787234, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8333333333333334, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7704918032786885, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7704918032786885, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9456869009584665, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.925, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7941176470588235, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.875, "eval_TIME_number": 31, "eval_TIME_precision": 0.8484848484848485, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2553688883781433, "eval_overall_accuracy": 0.9695318305672529, "eval_overall_f1": 0.8781869688385271, "eval_overall_precision": 0.8611111111111112, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3688, "eval_samples_per_second": 507.104, "eval_steps_per_second": 8.135, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.0011932431953027844, "learning_rate": 2.8499999999999998e-05, "loss": 0.0008, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.8591549295774648, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8356164383561644, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7538461538461538, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7101449275362319, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9303797468354431, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.901840490797546, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7941176470588235, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.75, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.875, "eval_TIME_number": 31, "eval_TIME_precision": 0.8484848484848485, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.26496070623397827, "eval_overall_accuracy": 0.9690364131781025, "eval_overall_f1": 0.8666666666666667, "eval_overall_precision": 0.8342245989304813, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3652, "eval_samples_per_second": 512.034, "eval_steps_per_second": 8.214, "step": 4558 }, { "epoch": 44.0, "grad_norm": 3.7293193340301514, "learning_rate": 2.8000000000000003e-05, "loss": 0.0017, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.8333333333333333, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7445255474452555, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6710526315789473, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9423076923076923, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9245283018867925, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.8615384615384616, "eval_TIME_number": 31, "eval_TIME_precision": 0.8235294117647058, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.26268908381462097, "eval_overall_accuracy": 0.9677978697052266, "eval_overall_f1": 0.8603042876901797, "eval_overall_precision": 0.8249336870026526, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3678, "eval_samples_per_second": 508.483, "eval_steps_per_second": 8.157, "step": 4664 }, { "epoch": 45.0, "grad_norm": 0.6390479803085327, "learning_rate": 2.7500000000000004e-05, "loss": 0.0013, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.8732394366197183, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8493150684931506, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7464788732394366, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.654320987654321, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7941176470588235, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.25916871428489685, "eval_overall_accuracy": 0.9695318305672529, "eval_overall_f1": 0.8684931506849316, "eval_overall_precision": 0.8255208333333334, "eval_overall_recall": 0.9161849710982659, "eval_runtime": 0.3656, "eval_samples_per_second": 511.447, "eval_steps_per_second": 8.205, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.010238826274871826, "learning_rate": 2.7000000000000002e-05, "loss": 0.0026, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.8356164383561644, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7922077922077922, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6506024096385542, "eval_ORGANIZATION_recall": 0.8852459016393442, "eval_PERSON_f1": 0.9216300940438872, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8855421686746988, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.8059701492537314, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7714285714285715, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.823529411764706, "eval_TIME_number": 31, "eval_TIME_precision": 0.7567567567567568, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2907452881336212, "eval_overall_accuracy": 0.9648253653703245, "eval_overall_f1": 0.8521505376344086, "eval_overall_precision": 0.7964824120603015, "eval_overall_recall": 0.9161849710982659, "eval_runtime": 0.3653, "eval_samples_per_second": 511.904, "eval_steps_per_second": 8.212, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.0005274274735711515, "learning_rate": 2.6500000000000004e-05, "loss": 0.0018, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.8611111111111112, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8266666666666667, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7591240875912408, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6842105263157895, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.930817610062893, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.896969696969697, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7462686567164178, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7142857142857143, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.8059701492537312, "eval_TIME_number": 31, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.2971247136592865, "eval_overall_accuracy": 0.9658162001486252, "eval_overall_f1": 0.8567530695770805, "eval_overall_precision": 0.8113695090439277, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3657, "eval_samples_per_second": 511.396, "eval_steps_per_second": 8.204, "step": 4982 }, { "epoch": 48.0, "grad_norm": 0.014134509488940239, "learning_rate": 2.6000000000000002e-05, "loss": 0.0014, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.8571428571428571, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8450704225352113, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7445255474452555, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6710526315789473, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.935897435897436, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9182389937106918, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.78125, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.78125, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2763230800628662, "eval_overall_accuracy": 0.9680455783998019, "eval_overall_f1": 0.8659217877094972, "eval_overall_precision": 0.8378378378378378, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3626, "eval_samples_per_second": 515.776, "eval_steps_per_second": 8.274, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.01190261635929346, "learning_rate": 2.5500000000000003e-05, "loss": 0.0019, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.8450704225352113, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.821917808219178, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7058823529411764, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.64, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9294871794871795, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9119496855345912, "eval_PERSON_recall": 0.9477124183006536, "eval_QUANTITY_f1": 0.8307692307692308, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8181818181818182, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8709677419354839, "eval_TIME_number": 31, "eval_TIME_precision": 0.8709677419354839, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.27485761046409607, "eval_overall_accuracy": 0.9677978697052266, "eval_overall_f1": 0.8563458856345887, "eval_overall_precision": 0.8274932614555256, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3612, "eval_samples_per_second": 517.682, "eval_steps_per_second": 8.305, "step": 5194 }, { "epoch": 50.0, "grad_norm": 1.1005834341049194, "learning_rate": 2.5e-05, "loss": 0.0014, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.8133333333333332, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7205882352941175, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6533333333333333, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9517684887459807, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9367088607594937, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8615384615384616, "eval_TIME_number": 31, "eval_TIME_precision": 0.8235294117647058, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.29507261514663696, "eval_overall_accuracy": 0.9643299479811741, "eval_overall_f1": 0.8571428571428571, "eval_overall_precision": 0.8167539267015707, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3618, "eval_samples_per_second": 516.881, "eval_steps_per_second": 8.292, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.0018566737417131662, "learning_rate": 2.45e-05, "loss": 0.0017, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.8275862068965517, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7894736842105263, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6962962962962963, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6351351351351351, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9329073482428115, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9125, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7941176470588235, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8181818181818182, "eval_TIME_number": 31, "eval_TIME_precision": 0.7714285714285715, "eval_TIME_recall": 0.8709677419354839, "eval_loss": 0.28224554657936096, "eval_overall_accuracy": 0.9630914045082982, "eval_overall_f1": 0.8468965517241379, "eval_overall_precision": 0.8100263852242744, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3638, "eval_samples_per_second": 514.07, "eval_steps_per_second": 8.247, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.00030757131753489375, "learning_rate": 2.4e-05, "loss": 0.0015, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.8322147651006713, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.775, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7142857142857143, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6329113924050633, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9423076923076923, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9245283018867925, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.29711785912513733, "eval_overall_accuracy": 0.9650730740648997, "eval_overall_f1": 0.8528610354223434, "eval_overall_precision": 0.8067010309278351, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.362, "eval_samples_per_second": 516.559, "eval_steps_per_second": 8.287, "step": 5512 }, { "epoch": 53.0, "grad_norm": 0.012948980554938316, "learning_rate": 2.35e-05, "loss": 0.0013, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.8108108108108109, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.6956521739130435, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6233766233766234, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9040247678018575, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8588235294117647, "eval_PERSON_recall": 0.954248366013072, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7941176470588235, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.3104041516780853, "eval_overall_accuracy": 0.9630914045082982, "eval_overall_f1": 0.8340080971659919, "eval_overall_precision": 0.7822784810126582, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3612, "eval_samples_per_second": 517.74, "eval_steps_per_second": 8.306, "step": 5618 }, { "epoch": 54.0, "grad_norm": 0.00616478780284524, "learning_rate": 2.3000000000000003e-05, "loss": 0.0014, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.8378378378378378, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.746031746031746, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7230769230769231, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.923076923076923, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9056603773584906, "eval_PERSON_recall": 0.9411764705882353, "eval_QUANTITY_f1": 0.7692307692307692, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7575757575757576, "eval_QUANTITY_recall": 0.78125, "eval_TIME_f1": 0.875, "eval_TIME_number": 31, "eval_TIME_precision": 0.8484848484848485, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.28169548511505127, "eval_overall_accuracy": 0.9645776566757494, "eval_overall_f1": 0.8559440559440559, "eval_overall_precision": 0.8292682926829268, "eval_overall_recall": 0.884393063583815, "eval_runtime": 0.3661, "eval_samples_per_second": 510.754, "eval_steps_per_second": 8.194, "step": 5724 }, { "epoch": 55.0, "grad_norm": 0.0019178962102159858, "learning_rate": 2.25e-05, "loss": 0.0005, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.8356164383561644, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7922077922077922, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.711111111111111, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6486486486486487, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9453376205787781, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.930379746835443, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.9032258064516129, "eval_TIME_number": 31, "eval_TIME_precision": 0.9032258064516129, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.29151037335395813, "eval_overall_accuracy": 0.9648253653703245, "eval_overall_f1": 0.8623087621696801, "eval_overall_precision": 0.8310991957104558, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3686, "eval_samples_per_second": 507.352, "eval_steps_per_second": 8.139, "step": 5830 }, { "epoch": 56.0, "grad_norm": 0.0005920439143665135, "learning_rate": 2.2000000000000003e-05, "loss": 0.0009, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.8413793103448277, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8026315789473685, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7299270072992702, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6578947368421053, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9487179487179488, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9308176100628931, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.9032258064516129, "eval_TIME_number": 31, "eval_TIME_precision": 0.9032258064516129, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.30188778042793274, "eval_overall_accuracy": 0.9663116175377756, "eval_overall_f1": 0.8670360110803323, "eval_overall_precision": 0.8324468085106383, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3652, "eval_samples_per_second": 512.012, "eval_steps_per_second": 8.214, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.0004883262445218861, "learning_rate": 2.15e-05, "loss": 0.0009, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.8450704225352113, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.821917808219178, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7164179104477612, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6575342465753424, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.939297124600639, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.91875, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.9032258064516129, "eval_TIME_number": 31, "eval_TIME_precision": 0.9032258064516129, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2943618893623352, "eval_overall_accuracy": 0.9665593262323507, "eval_overall_f1": 0.8631284916201116, "eval_overall_precision": 0.8351351351351352, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3709, "eval_samples_per_second": 504.197, "eval_steps_per_second": 8.089, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.0014432142488658428, "learning_rate": 2.1e-05, "loss": 0.0006, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.8368794326241135, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8194444444444444, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7230769230769231, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6811594202898551, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9363057324840764, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9130434782608695, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.9032258064516129, "eval_TIME_number": 31, "eval_TIME_precision": 0.9032258064516129, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.28986239433288574, "eval_overall_accuracy": 0.9663116175377756, "eval_overall_f1": 0.8623595505617977, "eval_overall_precision": 0.8387978142076503, "eval_overall_recall": 0.8872832369942196, "eval_runtime": 0.3712, "eval_samples_per_second": 503.757, "eval_steps_per_second": 8.082, "step": 6148 }, { "epoch": 59.0, "grad_norm": 0.0014531804481521249, "learning_rate": 2.05e-05, "loss": 0.0005, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.8472222222222223, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8133333333333334, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7375886524822695, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.65, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9517684887459807, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9367088607594937, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.29187676310539246, "eval_overall_accuracy": 0.9677978697052266, "eval_overall_f1": 0.8653846153846154, "eval_overall_precision": 0.824607329842932, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3703, "eval_samples_per_second": 505.003, "eval_steps_per_second": 8.102, "step": 6254 }, { "epoch": 60.0, "grad_norm": 0.000528964155819267, "learning_rate": 2e-05, "loss": 0.0006, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7500000000000001, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.68, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9426751592356687, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9192546583850931, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.3160874545574188, "eval_overall_accuracy": 0.9638345305920237, "eval_overall_f1": 0.8579234972677596, "eval_overall_precision": 0.8134715025906736, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3784, "eval_samples_per_second": 494.206, "eval_steps_per_second": 7.928, "step": 6360 }, { "epoch": 61.0, "grad_norm": 0.001857202616520226, "learning_rate": 1.9500000000000003e-05, "loss": 0.0017, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.8243243243243245, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7518796992481204, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6944444444444444, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9396825396825397, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9135802469135802, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.84375, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.84375, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2975999414920807, "eval_overall_accuracy": 0.9658162001486252, "eval_overall_f1": 0.8638239339752408, "eval_overall_precision": 0.8241469816272966, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3649, "eval_samples_per_second": 512.529, "eval_steps_per_second": 8.222, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.0003795857774093747, "learning_rate": 1.9e-05, "loss": 0.0004, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.8243243243243245, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.746031746031746, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7230769230769231, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9456869009584665, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.925, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.7761194029850748, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7428571428571429, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.3019534647464752, "eval_overall_accuracy": 0.9638345305920237, "eval_overall_f1": 0.8599167822468794, "eval_overall_precision": 0.8266666666666667, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3666, "eval_samples_per_second": 510.155, "eval_steps_per_second": 8.184, "step": 6572 }, { "epoch": 63.0, "grad_norm": 0.00042081772699020803, "learning_rate": 1.85e-05, "loss": 0.0004, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.821917808219178, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7792207792207793, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.762589928057554, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6794871794871795, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9453376205787781, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.930379746835443, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2791728079319, "eval_overall_accuracy": 0.966807034926926, "eval_overall_f1": 0.861454046639232, "eval_overall_precision": 0.8198433420365535, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3576, "eval_samples_per_second": 522.878, "eval_steps_per_second": 8.388, "step": 6678 }, { "epoch": 64.0, "grad_norm": 0.015575162135064602, "learning_rate": 1.8e-05, "loss": 0.001, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.8137931034482757, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7763157894736842, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.726027397260274, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6235294117647059, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.946031746031746, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9197530864197531, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7941176470588235, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2865269184112549, "eval_overall_accuracy": 0.9665593262323507, "eval_overall_f1": 0.8598639455782313, "eval_overall_precision": 0.8123393316195373, "eval_overall_recall": 0.9132947976878613, "eval_runtime": 0.3652, "eval_samples_per_second": 512.011, "eval_steps_per_second": 8.214, "step": 6784 }, { "epoch": 65.0, "grad_norm": 0.0011894090566784143, "learning_rate": 1.75e-05, "loss": 0.0011, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.8201438848920863, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8142857142857143, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.732824427480916, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6857142857142857, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9490445859872612, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9254658385093167, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.291652649641037, "eval_overall_accuracy": 0.9680455783998019, "eval_overall_f1": 0.8639551192145861, "eval_overall_precision": 0.8392370572207084, "eval_overall_recall": 0.8901734104046243, "eval_runtime": 0.361, "eval_samples_per_second": 518.053, "eval_steps_per_second": 8.311, "step": 6890 }, { "epoch": 66.0, "grad_norm": 0.0299760140478611, "learning_rate": 1.7000000000000003e-05, "loss": 0.0014, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.8055555555555556, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7733333333333333, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7375886524822695, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.65, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.946031746031746, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9197530864197531, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.27525565028190613, "eval_overall_accuracy": 0.9685409957889521, "eval_overall_f1": 0.8598901098901098, "eval_overall_precision": 0.819371727748691, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3758, "eval_samples_per_second": 497.654, "eval_steps_per_second": 7.984, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.0006641316576860845, "learning_rate": 1.65e-05, "loss": 0.0005, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.8194444444444444, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7866666666666666, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7361111111111112, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6385542168674698, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9400630914826499, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9085365853658537, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.288452684879303, "eval_overall_accuracy": 0.9663116175377756, "eval_overall_f1": 0.8583106267029972, "eval_overall_precision": 0.8118556701030928, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3617, "eval_samples_per_second": 516.981, "eval_steps_per_second": 8.294, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.0003661834343802184, "learning_rate": 1.6000000000000003e-05, "loss": 0.0004, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.8275862068965517, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7894736842105263, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7647058823529411, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6933333333333334, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9551282051282051, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9371069182389937, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8125, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2738393545150757, "eval_overall_accuracy": 0.971018082734704, "eval_overall_f1": 0.8750000000000001, "eval_overall_precision": 0.8422459893048129, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3691, "eval_samples_per_second": 506.591, "eval_steps_per_second": 8.127, "step": 7208 }, { "epoch": 69.0, "grad_norm": 0.00032552139600738883, "learning_rate": 1.55e-05, "loss": 0.0002, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.8333333333333333, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7555555555555555, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6891891891891891, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9551282051282051, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9371069182389937, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8125, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.9032258064516129, "eval_TIME_number": 31, "eval_TIME_precision": 0.9032258064516129, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2714591920375824, "eval_overall_accuracy": 0.971018082734704, "eval_overall_f1": 0.8758716875871689, "eval_overall_precision": 0.8463611859838275, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3611, "eval_samples_per_second": 517.91, "eval_steps_per_second": 8.309, "step": 7314 }, { "epoch": 70.0, "grad_norm": 0.0012234537862241268, "learning_rate": 1.5e-05, "loss": 0.0003, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.8333333333333333, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7761194029850746, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7123287671232876, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.946031746031746, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9197530864197531, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.9032258064516129, "eval_TIME_number": 31, "eval_TIME_precision": 0.9032258064516129, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2793043553829193, "eval_overall_accuracy": 0.9705226653455536, "eval_overall_f1": 0.8750000000000001, "eval_overall_precision": 0.8422459893048129, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3626, "eval_samples_per_second": 515.737, "eval_steps_per_second": 8.274, "step": 7420 }, { "epoch": 71.0, "grad_norm": 0.00031636914354749024, "learning_rate": 1.45e-05, "loss": 0.0001, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.8333333333333333, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7761194029850746, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7123287671232876, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.9032258064516129, "eval_TIME_number": 31, "eval_TIME_precision": 0.9032258064516129, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.29805585741996765, "eval_overall_accuracy": 0.9690364131781025, "eval_overall_f1": 0.8737864077669903, "eval_overall_precision": 0.84, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3626, "eval_samples_per_second": 515.664, "eval_steps_per_second": 8.273, "step": 7526 }, { "epoch": 72.0, "grad_norm": 0.003590099047869444, "learning_rate": 1.4000000000000001e-05, "loss": 0.0005, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.8260869565217391, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8260869565217391, "eval_LOCATION_recall": 0.8260869565217391, "eval_ORGANIZATION_f1": 0.7633587786259541, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8307692307692308, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8181818181818182, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.9032258064516129, "eval_TIME_number": 31, "eval_TIME_precision": 0.9032258064516129, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.27618908882141113, "eval_overall_accuracy": 0.9707703740401288, "eval_overall_f1": 0.8735955056179775, "eval_overall_precision": 0.8497267759562842, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3699, "eval_samples_per_second": 505.485, "eval_steps_per_second": 8.109, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.00027959441649727523, "learning_rate": 1.3500000000000001e-05, "loss": 0.0002, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.8391608391608392, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8108108108108109, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7500000000000001, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.68, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.946031746031746, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9197530864197531, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.9032258064516129, "eval_TIME_number": 31, "eval_TIME_precision": 0.9032258064516129, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.28340503573417664, "eval_overall_accuracy": 0.9685409957889521, "eval_overall_f1": 0.8698060941828255, "eval_overall_precision": 0.8351063829787234, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.362, "eval_samples_per_second": 516.608, "eval_steps_per_second": 8.288, "step": 7738 }, { "epoch": 74.0, "grad_norm": 0.00044001045171171427, "learning_rate": 1.3000000000000001e-05, "loss": 0.0002, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.8275862068965517, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7894736842105263, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7681159420289856, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6883116883116883, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9551282051282051, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9371069182389937, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7941176470588235, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.27885836362838745, "eval_overall_accuracy": 0.9695318305672529, "eval_overall_f1": 0.8756906077348067, "eval_overall_precision": 0.8386243386243386, "eval_overall_recall": 0.9161849710982659, "eval_runtime": 0.3657, "eval_samples_per_second": 511.381, "eval_steps_per_second": 8.204, "step": 7844 }, { "epoch": 75.0, "grad_norm": 0.00027540308656170964, "learning_rate": 1.25e-05, "loss": 0.0001, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.821917808219178, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7792207792207793, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7737226277372262, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6973684210526315, "eval_ORGANIZATION_recall": 0.8688524590163934, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8181818181818182, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7941176470588235, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2948344945907593, "eval_overall_accuracy": 0.9673024523160763, "eval_overall_f1": 0.8708791208791209, "eval_overall_precision": 0.8298429319371727, "eval_overall_recall": 0.9161849710982659, "eval_runtime": 0.3634, "eval_samples_per_second": 514.56, "eval_steps_per_second": 8.255, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.007422334514558315, "learning_rate": 1.2e-05, "loss": 0.0004, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.8194444444444444, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7866666666666666, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7067669172932329, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6527777777777778, "eval_ORGANIZATION_recall": 0.7704918032786885, "eval_PERSON_f1": 0.9400630914826499, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9085365853658537, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8307692307692308, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8181818181818182, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.3101661205291748, "eval_overall_accuracy": 0.966807034926926, "eval_overall_f1": 0.8587257617728532, "eval_overall_precision": 0.824468085106383, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3638, "eval_samples_per_second": 513.997, "eval_steps_per_second": 8.246, "step": 8056 }, { "epoch": 77.0, "grad_norm": 0.0005564504535868764, "learning_rate": 1.1500000000000002e-05, "loss": 0.0005, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.8299319727891156, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.782051282051282, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7391304347826089, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6623376623376623, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.875, "eval_TIME_number": 31, "eval_TIME_precision": 0.8484848484848485, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.29981571435928345, "eval_overall_accuracy": 0.9663116175377756, "eval_overall_f1": 0.8618331053351572, "eval_overall_precision": 0.8181818181818182, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3758, "eval_samples_per_second": 497.657, "eval_steps_per_second": 7.984, "step": 8162 }, { "epoch": 78.0, "grad_norm": 0.003542252816259861, "learning_rate": 1.1000000000000001e-05, "loss": 0.0002, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.8194444444444444, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7866666666666666, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7703703703703704, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7027027027027027, "eval_ORGANIZATION_recall": 0.8524590163934426, "eval_PERSON_f1": 0.946031746031746, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9197530864197531, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.875, "eval_TIME_number": 31, "eval_TIME_precision": 0.8484848484848485, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.28981682658195496, "eval_overall_accuracy": 0.9675501610106515, "eval_overall_f1": 0.8686030428769017, "eval_overall_precision": 0.8328912466843501, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3708, "eval_samples_per_second": 504.361, "eval_steps_per_second": 8.091, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.0004401499463710934, "learning_rate": 1.05e-05, "loss": 0.0003, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.8169014084507042, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7945205479452054, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7538461538461538, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7101449275362319, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.952076677316294, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.93125, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.84375, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.84375, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8888888888888888, "eval_TIME_number": 31, "eval_TIME_precision": 0.875, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2755199670791626, "eval_overall_accuracy": 0.9695318305672529, "eval_overall_f1": 0.8735955056179775, "eval_overall_precision": 0.8497267759562842, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3648, "eval_samples_per_second": 512.67, "eval_steps_per_second": 8.225, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.00034126470563933253, "learning_rate": 1e-05, "loss": 0.0004, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.8082191780821918, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7662337662337663, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7424242424242424, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.6901408450704225, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9371069182389938, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9030303030303031, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.787878787878788, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7647058823529411, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2898205518722534, "eval_overall_accuracy": 0.96556849145405, "eval_overall_f1": 0.8532235939643347, "eval_overall_precision": 0.8120104438642297, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3951, "eval_samples_per_second": 473.261, "eval_steps_per_second": 7.592, "step": 8480 }, { "epoch": 81.0, "grad_norm": 0.000562498637009412, "learning_rate": 9.5e-06, "loss": 0.0003, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.8251748251748252, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7972972972972973, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7500000000000001, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.68, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9337539432176657, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9024390243902439, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.84375, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.84375, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.875, "eval_TIME_number": 31, "eval_TIME_precision": 0.8484848484848485, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.28580695390701294, "eval_overall_accuracy": 0.9687887044835274, "eval_overall_f1": 0.8646408839779005, "eval_overall_precision": 0.828042328042328, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3627, "eval_samples_per_second": 515.648, "eval_steps_per_second": 8.272, "step": 8586 }, { "epoch": 82.0, "grad_norm": 0.0003717710787896067, "learning_rate": 9e-06, "loss": 0.0004, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.802721088435374, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7564102564102564, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.765625, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7313432835820896, "eval_ORGANIZATION_recall": 0.8032786885245902, "eval_PERSON_f1": 0.9430379746835442, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9141104294478528, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8125, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8125, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.875, "eval_TIME_number": 31, "eval_TIME_precision": 0.8484848484848485, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.28542497754096985, "eval_overall_accuracy": 0.9695318305672529, "eval_overall_f1": 0.8650904033379694, "eval_overall_precision": 0.8337801608579088, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3698, "eval_samples_per_second": 505.716, "eval_steps_per_second": 8.113, "step": 8692 }, { "epoch": 83.0, "grad_norm": 0.0019057561876252294, "learning_rate": 8.500000000000002e-06, "loss": 0.0004, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.8243243243243245, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7941176470588235, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.72, "eval_ORGANIZATION_recall": 0.8852459016393442, "eval_PERSON_f1": 0.9400630914826499, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9085365853658537, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2824600636959076, "eval_overall_accuracy": 0.9692841218726778, "eval_overall_f1": 0.8688524590163936, "eval_overall_precision": 0.8238341968911918, "eval_overall_recall": 0.9190751445086706, "eval_runtime": 0.3654, "eval_samples_per_second": 511.741, "eval_steps_per_second": 8.21, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.001229365007020533, "learning_rate": 8.000000000000001e-06, "loss": 0.0006, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.8226950354609929, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8055555555555556, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7874015748031497, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7575757575757576, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.952076677316294, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.93125, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.875, "eval_TIME_number": 31, "eval_TIME_precision": 0.8484848484848485, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.26607078313827515, "eval_overall_accuracy": 0.9720089175130047, "eval_overall_f1": 0.876056338028169, "eval_overall_precision": 0.8543956043956044, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.3766, "eval_samples_per_second": 496.598, "eval_steps_per_second": 7.967, "step": 8904 }, { "epoch": 85.0, "grad_norm": 0.00014708787784911692, "learning_rate": 7.5e-06, "loss": 0.0003, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.8333333333333333, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8, "eval_LOCATION_recall": 0.8695652173913043, "eval_ORGANIZATION_f1": 0.7559055118110236, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7272727272727273, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.9400630914826499, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9085365853658537, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.293227881193161, "eval_overall_accuracy": 0.9677978697052266, "eval_overall_f1": 0.8638888888888889, "eval_overall_precision": 0.8315508021390374, "eval_overall_recall": 0.8988439306358381, "eval_runtime": 0.364, "eval_samples_per_second": 513.774, "eval_steps_per_second": 8.242, "step": 9010 }, { "epoch": 86.0, "grad_norm": 0.003805099753662944, "learning_rate": 7.000000000000001e-06, "loss": 0.0006, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.8345323741007195, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.8285714285714286, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.768, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.75, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.946031746031746, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9197530864197531, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8307692307692308, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8181818181818182, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2930375337600708, "eval_overall_accuracy": 0.9685409957889521, "eval_overall_f1": 0.8732394366197184, "eval_overall_precision": 0.8516483516483516, "eval_overall_recall": 0.8959537572254336, "eval_runtime": 0.3668, "eval_samples_per_second": 509.746, "eval_steps_per_second": 8.178, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.04100840538740158, "learning_rate": 6.5000000000000004e-06, "loss": 0.0005, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.8169014084507042, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7945205479452054, "eval_LOCATION_recall": 0.8405797101449275, "eval_ORGANIZATION_f1": 0.7559055118110236, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7272727272727273, "eval_ORGANIZATION_recall": 0.7868852459016393, "eval_PERSON_f1": 0.93125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8922155688622755, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.823529411764706, "eval_TIME_number": 31, "eval_TIME_precision": 0.7567567567567568, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.3029007911682129, "eval_overall_accuracy": 0.9663116175377756, "eval_overall_f1": 0.8559556786703602, "eval_overall_precision": 0.8218085106382979, "eval_overall_recall": 0.8930635838150289, "eval_runtime": 0.3762, "eval_samples_per_second": 497.075, "eval_steps_per_second": 7.974, "step": 9222 }, { "epoch": 88.0, "grad_norm": 0.0002212318213423714, "learning_rate": 6e-06, "loss": 0.0003, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.8251748251748252, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7972972972972973, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7786259541984734, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7285714285714285, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.93125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8922155688622755, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8115942028985507, "eval_TIME_number": 31, "eval_TIME_precision": 0.7368421052631579, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.30660566687583923, "eval_overall_accuracy": 0.9665593262323507, "eval_overall_f1": 0.8598901098901098, "eval_overall_precision": 0.819371727748691, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3705, "eval_samples_per_second": 504.729, "eval_steps_per_second": 8.097, "step": 9328 }, { "epoch": 89.0, "grad_norm": 0.000250909011811018, "learning_rate": 5.500000000000001e-06, "loss": 0.0001, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.8137931034482757, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7763157894736842, "eval_LOCATION_recall": 0.855072463768116, "eval_ORGANIZATION_f1": 0.7692307692307692, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7246376811594203, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9341692789968652, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8975903614457831, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8115942028985507, "eval_TIME_number": 31, "eval_TIME_precision": 0.7368421052631579, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.30867499113082886, "eval_overall_accuracy": 0.9650730740648997, "eval_overall_f1": 0.8571428571428571, "eval_overall_precision": 0.8167539267015707, "eval_overall_recall": 0.9017341040462428, "eval_runtime": 0.3615, "eval_samples_per_second": 517.307, "eval_steps_per_second": 8.299, "step": 9434 }, { "epoch": 90.0, "grad_norm": 0.00021638131875079125, "learning_rate": 5e-06, "loss": 0.0001, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.8266666666666668, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7654320987654321, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7633587786259541, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7142857142857143, "eval_ORGANIZATION_recall": 0.819672131147541, "eval_PERSON_f1": 0.9216300940438872, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8855421686746988, "eval_PERSON_recall": 0.9607843137254902, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.31429383158683777, "eval_overall_accuracy": 0.9653207827594749, "eval_overall_f1": 0.8551912568306012, "eval_overall_precision": 0.810880829015544, "eval_overall_recall": 0.9046242774566474, "eval_runtime": 0.3713, "eval_samples_per_second": 503.676, "eval_steps_per_second": 8.08, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.00013644745922647417, "learning_rate": 4.5e-06, "loss": 0.0001, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.8243243243243245, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7786259541984734, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7285714285714285, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.930817610062893, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.896969696969697, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.835820895522388, "eval_TIME_number": 31, "eval_TIME_precision": 0.7777777777777778, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.2944120168685913, "eval_overall_accuracy": 0.968293287094377, "eval_overall_f1": 0.861454046639232, "eval_overall_precision": 0.8198433420365535, "eval_overall_recall": 0.9075144508670521, "eval_runtime": 0.3632, "eval_samples_per_second": 514.858, "eval_steps_per_second": 8.26, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.0009539081365801394, "learning_rate": 4.000000000000001e-06, "loss": 0.0002, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.8322147651006713, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.775, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7727272727272727, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7183098591549296, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9249999999999999, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8862275449101796, "eval_PERSON_recall": 0.9673202614379085, "eval_QUANTITY_f1": 0.8307692307692308, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8181818181818182, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.823529411764706, "eval_TIME_number": 31, "eval_TIME_precision": 0.7567567567567568, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.31182703375816345, "eval_overall_accuracy": 0.9670547436215011, "eval_overall_f1": 0.8610354223433242, "eval_overall_precision": 0.8144329896907216, "eval_overall_recall": 0.9132947976878613, "eval_runtime": 0.3679, "eval_samples_per_second": 508.226, "eval_steps_per_second": 8.153, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.00018770851602312177, "learning_rate": 3.5000000000000004e-06, "loss": 0.0003, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.8378378378378378, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7848101265822784, "eval_LOCATION_recall": 0.8985507246376812, "eval_ORGANIZATION_f1": 0.7786259541984734, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7285714285714285, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.93125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8922155688622755, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8307692307692308, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8181818181818182, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.30489107966423035, "eval_overall_accuracy": 0.968293287094377, "eval_overall_f1": 0.8684931506849316, "eval_overall_precision": 0.8255208333333334, "eval_overall_recall": 0.9161849710982659, "eval_runtime": 0.3644, "eval_samples_per_second": 513.217, "eval_steps_per_second": 8.233, "step": 9858 }, { "epoch": 94.0, "grad_norm": 0.0019927462562918663, "learning_rate": 3e-06, "loss": 0.0001, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.8243243243243245, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7786259541984734, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7285714285714285, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.93125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8922155688622755, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8307692307692308, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.8181818181818182, "eval_QUANTITY_recall": 0.84375, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.3039020299911499, "eval_overall_accuracy": 0.968293287094377, "eval_overall_f1": 0.8657534246575342, "eval_overall_precision": 0.8229166666666666, "eval_overall_recall": 0.9132947976878613, "eval_runtime": 0.3778, "eval_samples_per_second": 494.941, "eval_steps_per_second": 7.94, "step": 9964 }, { "epoch": 95.0, "grad_norm": 0.00036656216252595186, "learning_rate": 2.5e-06, "loss": 0.0003, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7786259541984734, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7285714285714285, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9371069182389938, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.9030303030303031, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.30329030752182007, "eval_overall_accuracy": 0.968293287094377, "eval_overall_f1": 0.8641975308641975, "eval_overall_precision": 0.8224543080939948, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3655, "eval_samples_per_second": 511.653, "eval_steps_per_second": 8.208, "step": 10070 }, { "epoch": 96.0, "grad_norm": 0.00014269202074501663, "learning_rate": 2.0000000000000003e-06, "loss": 0.0005, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7786259541984734, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7285714285714285, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.93125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8922155688622755, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.30583375692367554, "eval_overall_accuracy": 0.9675501610106515, "eval_overall_f1": 0.8618331053351572, "eval_overall_precision": 0.8181818181818182, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3755, "eval_samples_per_second": 497.939, "eval_steps_per_second": 7.988, "step": 10176 }, { "epoch": 97.0, "grad_norm": 0.0001223723666043952, "learning_rate": 1.5e-06, "loss": 0.0001, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7786259541984734, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7285714285714285, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9341692789968652, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8975903614457831, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.3053462505340576, "eval_overall_accuracy": 0.9677978697052266, "eval_overall_f1": 0.863013698630137, "eval_overall_precision": 0.8203125, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3619, "eval_samples_per_second": 516.75, "eval_steps_per_second": 8.29, "step": 10282 }, { "epoch": 98.0, "grad_norm": 0.0004060152277816087, "learning_rate": 1.0000000000000002e-06, "loss": 0.0001, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7786259541984734, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7285714285714285, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.9341692789968652, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8975903614457831, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.3043583929538727, "eval_overall_accuracy": 0.9677978697052266, "eval_overall_f1": 0.863013698630137, "eval_overall_precision": 0.8203125, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3759, "eval_samples_per_second": 497.529, "eval_steps_per_second": 7.982, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.00019621806859504431, "learning_rate": 5.000000000000001e-07, "loss": 0.0001, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7786259541984734, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7285714285714285, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.93125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8922155688622755, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.3064700961112976, "eval_overall_accuracy": 0.9675501610106515, "eval_overall_f1": 0.8618331053351572, "eval_overall_precision": 0.8181818181818182, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3646, "eval_samples_per_second": 512.932, "eval_steps_per_second": 8.229, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.0006661502993665636, "learning_rate": 0.0, "loss": 0.0001, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.8187919463087248, "eval_LOCATION_number": 69, "eval_LOCATION_precision": 0.7625, "eval_LOCATION_recall": 0.8840579710144928, "eval_ORGANIZATION_f1": 0.7786259541984734, "eval_ORGANIZATION_number": 61, "eval_ORGANIZATION_precision": 0.7285714285714285, "eval_ORGANIZATION_recall": 0.8360655737704918, "eval_PERSON_f1": 0.93125, "eval_PERSON_number": 153, "eval_PERSON_precision": 0.8922155688622755, "eval_PERSON_recall": 0.9738562091503268, "eval_QUANTITY_f1": 0.8, "eval_QUANTITY_number": 32, "eval_QUANTITY_precision": 0.7878787878787878, "eval_QUANTITY_recall": 0.8125, "eval_TIME_f1": 0.8484848484848486, "eval_TIME_number": 31, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.9032258064516129, "eval_loss": 0.3065154552459717, "eval_overall_accuracy": 0.9675501610106515, "eval_overall_f1": 0.8618331053351572, "eval_overall_precision": 0.8181818181818182, "eval_overall_recall": 0.9104046242774566, "eval_runtime": 0.3714, "eval_samples_per_second": 503.447, "eval_steps_per_second": 8.077, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 4560509291304846.0, "train_loss": 0.008112131665891283, "train_runtime": 974.3295, "train_samples_per_second": 173.145, "train_steps_per_second": 10.879 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 4560509291304846.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }