| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 100.0, | |
| "eval_steps": 500, | |
| "global_step": 10600, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "grad_norm": 3.2015111446380615, | |
| "learning_rate": 4.9500000000000004e-05, | |
| "loss": 0.3254, | |
| "step": 106 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_LOCATION_f1": 0.8082191780821918, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7662337662337663, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.5901639344262295, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.5901639344262295, | |
| "eval_ORGANIZATION_recall": 0.5901639344262295, | |
| "eval_PERSON_f1": 0.89937106918239, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8666666666666667, | |
| "eval_PERSON_recall": 0.934640522875817, | |
| "eval_QUANTITY_f1": 0.742857142857143, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.6842105263157895, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8307692307692308, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7941176470588235, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.12376317381858826, | |
| "eval_overall_accuracy": 0.9581372306167947, | |
| "eval_overall_f1": 0.8072122052704577, | |
| "eval_overall_precision": 0.776, | |
| "eval_overall_recall": 0.8410404624277457, | |
| "eval_runtime": 0.3597, | |
| "eval_samples_per_second": 519.816, | |
| "eval_steps_per_second": 8.339, | |
| "step": 106 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "grad_norm": 3.5055294036865234, | |
| "learning_rate": 4.9e-05, | |
| "loss": 0.1103, | |
| "step": 212 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_LOCATION_f1": 0.8028169014084506, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7808219178082192, | |
| "eval_LOCATION_recall": 0.8260869565217391, | |
| "eval_ORGANIZATION_f1": 0.6918238993710693, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.5612244897959183, | |
| "eval_ORGANIZATION_recall": 0.9016393442622951, | |
| "eval_PERSON_f1": 0.89375, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8562874251497006, | |
| "eval_PERSON_recall": 0.934640522875817, | |
| "eval_QUANTITY_f1": 0.742857142857143, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.6842105263157895, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.7647058823529411, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7027027027027027, | |
| "eval_TIME_recall": 0.8387096774193549, | |
| "eval_loss": 0.14232417941093445, | |
| "eval_overall_accuracy": 0.9556601436710429, | |
| "eval_overall_f1": 0.8089591567852438, | |
| "eval_overall_precision": 0.7433414043583535, | |
| "eval_overall_recall": 0.8872832369942196, | |
| "eval_runtime": 0.3736, | |
| "eval_samples_per_second": 500.519, | |
| "eval_steps_per_second": 8.03, | |
| "step": 212 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "grad_norm": 3.338141918182373, | |
| "learning_rate": 4.85e-05, | |
| "loss": 0.0719, | |
| "step": 318 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_LOCATION_f1": 0.7945205479452054, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7532467532467533, | |
| "eval_LOCATION_recall": 0.8405797101449275, | |
| "eval_ORGANIZATION_f1": 0.6749999999999999, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.5454545454545454, | |
| "eval_ORGANIZATION_recall": 0.8852459016393442, | |
| "eval_PERSON_f1": 0.909657320872274, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8690476190476191, | |
| "eval_PERSON_recall": 0.954248366013072, | |
| "eval_QUANTITY_f1": 0.7536231884057971, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7027027027027027, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8571428571428571, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.84375, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.14947976171970367, | |
| "eval_overall_accuracy": 0.9593757740896706, | |
| "eval_overall_f1": 0.8194993412384717, | |
| "eval_overall_precision": 0.7530266343825666, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.3603, | |
| "eval_samples_per_second": 519.072, | |
| "eval_steps_per_second": 8.327, | |
| "step": 318 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "grad_norm": 1.6828668117523193, | |
| "learning_rate": 4.8e-05, | |
| "loss": 0.0492, | |
| "step": 424 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_LOCATION_f1": 0.8194444444444444, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7866666666666666, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7552447552447552, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6585365853658537, | |
| "eval_ORGANIZATION_recall": 0.8852459016393442, | |
| "eval_PERSON_f1": 0.9130434782608696, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8698224852071006, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.75, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.675, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.7605633802816901, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.675, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.1601407825946808, | |
| "eval_overall_accuracy": 0.9621005697299975, | |
| "eval_overall_f1": 0.8351063829787234, | |
| "eval_overall_precision": 0.7733990147783252, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3697, | |
| "eval_samples_per_second": 505.814, | |
| "eval_steps_per_second": 8.115, | |
| "step": 424 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "grad_norm": 1.3032749891281128, | |
| "learning_rate": 4.75e-05, | |
| "loss": 0.0315, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_LOCATION_f1": 0.7619047619047619, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.717948717948718, | |
| "eval_LOCATION_recall": 0.8115942028985508, | |
| "eval_ORGANIZATION_f1": 0.6423357664233578, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.5789473684210527, | |
| "eval_ORGANIZATION_recall": 0.7213114754098361, | |
| "eval_PERSON_f1": 0.9216300940438872, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8855421686746988, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.7647058823529411, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7222222222222222, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.7575757575757576, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7142857142857143, | |
| "eval_TIME_recall": 0.8064516129032258, | |
| "eval_loss": 0.1780991554260254, | |
| "eval_overall_accuracy": 0.9583849393113698, | |
| "eval_overall_f1": 0.8086838534599727, | |
| "eval_overall_precision": 0.7621483375959079, | |
| "eval_overall_recall": 0.861271676300578, | |
| "eval_runtime": 0.3628, | |
| "eval_samples_per_second": 515.381, | |
| "eval_steps_per_second": 8.268, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "grad_norm": 1.877514362335205, | |
| "learning_rate": 4.7e-05, | |
| "loss": 0.0217, | |
| "step": 636 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_LOCATION_f1": 0.7724137931034482, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7368421052631579, | |
| "eval_LOCATION_recall": 0.8115942028985508, | |
| "eval_ORGANIZATION_f1": 0.7397260273972602, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6352941176470588, | |
| "eval_ORGANIZATION_recall": 0.8852459016393442, | |
| "eval_PERSON_f1": 0.9245283018867925, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8909090909090909, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.7222222222222223, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.65, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.7941176470588235, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7297297297297297, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.17554225027561188, | |
| "eval_overall_accuracy": 0.9606143175625464, | |
| "eval_overall_f1": 0.8277703604806409, | |
| "eval_overall_precision": 0.7692307692307693, | |
| "eval_overall_recall": 0.8959537572254336, | |
| "eval_runtime": 0.3662, | |
| "eval_samples_per_second": 510.654, | |
| "eval_steps_per_second": 8.192, | |
| "step": 636 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "grad_norm": 0.2853144705295563, | |
| "learning_rate": 4.6500000000000005e-05, | |
| "loss": 0.0168, | |
| "step": 742 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_LOCATION_f1": 0.7777777777777779, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7466666666666667, | |
| "eval_LOCATION_recall": 0.8115942028985508, | |
| "eval_ORGANIZATION_f1": 0.6901408450704226, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6049382716049383, | |
| "eval_ORGANIZATION_recall": 0.8032786885245902, | |
| "eval_PERSON_f1": 0.915360501567398, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8795180722891566, | |
| "eval_PERSON_recall": 0.954248366013072, | |
| "eval_QUANTITY_f1": 0.7761194029850748, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7428571428571429, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8253968253968254, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8125, | |
| "eval_TIME_recall": 0.8387096774193549, | |
| "eval_loss": 0.19883674383163452, | |
| "eval_overall_accuracy": 0.9608620262571216, | |
| "eval_overall_f1": 0.8244897959183674, | |
| "eval_overall_precision": 0.7789203084832905, | |
| "eval_overall_recall": 0.8757225433526011, | |
| "eval_runtime": 0.3599, | |
| "eval_samples_per_second": 519.614, | |
| "eval_steps_per_second": 8.336, | |
| "step": 742 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "grad_norm": 0.052625108510255814, | |
| "learning_rate": 4.600000000000001e-05, | |
| "loss": 0.0134, | |
| "step": 848 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_LOCATION_f1": 0.8082191780821918, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7662337662337663, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.6857142857142857, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6075949367088608, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9216300940438872, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8855421686746988, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.7575757575757576, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.78125, | |
| "eval_TIME_f1": 0.8115942028985507, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7368421052631579, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.19897328317165375, | |
| "eval_overall_accuracy": 0.9601189001733961, | |
| "eval_overall_f1": 0.8297297297297296, | |
| "eval_overall_precision": 0.7791878172588832, | |
| "eval_overall_recall": 0.8872832369942196, | |
| "eval_runtime": 0.3619, | |
| "eval_samples_per_second": 516.738, | |
| "eval_steps_per_second": 8.29, | |
| "step": 848 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "grad_norm": 0.2537504732608795, | |
| "learning_rate": 4.55e-05, | |
| "loss": 0.0101, | |
| "step": 954 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_LOCATION_f1": 0.8211920529801324, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7560975609756098, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.6929133858267716, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.7213114754098361, | |
| "eval_PERSON_f1": 0.9311475409836065, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9342105263157895, | |
| "eval_PERSON_recall": 0.9281045751633987, | |
| "eval_QUANTITY_f1": 0.7536231884057971, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7027027027027027, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.20098058879375458, | |
| "eval_overall_accuracy": 0.9643299479811741, | |
| "eval_overall_f1": 0.8400556328233658, | |
| "eval_overall_precision": 0.8096514745308311, | |
| "eval_overall_recall": 0.8728323699421965, | |
| "eval_runtime": 0.3599, | |
| "eval_samples_per_second": 519.595, | |
| "eval_steps_per_second": 8.336, | |
| "step": 954 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "grad_norm": 0.2351408451795578, | |
| "learning_rate": 4.5e-05, | |
| "loss": 0.0101, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_LOCATION_f1": 0.8513513513513514, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7974683544303798, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.7445255474452555, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6710526315789473, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9148264984227129, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8841463414634146, | |
| "eval_PERSON_recall": 0.9477124183006536, | |
| "eval_QUANTITY_f1": 0.7714285714285714, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7105263157894737, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2193160206079483, | |
| "eval_overall_accuracy": 0.9638345305920237, | |
| "eval_overall_f1": 0.8509485094850948, | |
| "eval_overall_precision": 0.8010204081632653, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3607, | |
| "eval_samples_per_second": 518.462, | |
| "eval_steps_per_second": 8.318, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "grad_norm": 0.03327617421746254, | |
| "learning_rate": 4.4500000000000004e-05, | |
| "loss": 0.0063, | |
| "step": 1166 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_LOCATION_f1": 0.8226950354609929, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8055555555555556, | |
| "eval_LOCATION_recall": 0.8405797101449275, | |
| "eval_ORGANIZATION_f1": 0.7205882352941175, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6533333333333333, | |
| "eval_ORGANIZATION_recall": 0.8032786885245902, | |
| "eval_PERSON_f1": 0.9303797468354431, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.901840490797546, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.7826086956521738, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7297297297297297, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.782608695652174, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7105263157894737, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.22587580978870392, | |
| "eval_overall_accuracy": 0.9628436958137231, | |
| "eval_overall_f1": 0.8426812585499317, | |
| "eval_overall_precision": 0.8, | |
| "eval_overall_recall": 0.8901734104046243, | |
| "eval_runtime": 0.3625, | |
| "eval_samples_per_second": 515.878, | |
| "eval_steps_per_second": 8.276, | |
| "step": 1166 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "grad_norm": 5.140894412994385, | |
| "learning_rate": 4.4000000000000006e-05, | |
| "loss": 0.0059, | |
| "step": 1272 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_LOCATION_f1": 0.7517730496453902, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7361111111111112, | |
| "eval_LOCATION_recall": 0.7681159420289855, | |
| "eval_ORGANIZATION_f1": 0.6714285714285714, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.5949367088607594, | |
| "eval_ORGANIZATION_recall": 0.7704918032786885, | |
| "eval_PERSON_f1": 0.9235668789808917, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9006211180124224, | |
| "eval_PERSON_recall": 0.9477124183006536, | |
| "eval_QUANTITY_f1": 0.84375, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.84375, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.84375, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8181818181818182, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.23827865719795227, | |
| "eval_overall_accuracy": 0.9650730740648997, | |
| "eval_overall_f1": 0.8271092669432919, | |
| "eval_overall_precision": 0.7931034482758621, | |
| "eval_overall_recall": 0.8641618497109826, | |
| "eval_runtime": 0.3692, | |
| "eval_samples_per_second": 506.502, | |
| "eval_steps_per_second": 8.126, | |
| "step": 1272 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "grad_norm": 3.8915011882781982, | |
| "learning_rate": 4.35e-05, | |
| "loss": 0.007, | |
| "step": 1378 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_LOCATION_f1": 0.7894736842105263, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7228915662650602, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7142857142857143, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6329113924050633, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.9303797468354431, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.901840490797546, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.7826086956521738, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7297297297297297, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.75, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.6585365853658537, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.2511149048805237, | |
| "eval_overall_accuracy": 0.9618528610354223, | |
| "eval_overall_f1": 0.8304405874499332, | |
| "eval_overall_precision": 0.771712158808933, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.3685, | |
| "eval_samples_per_second": 507.422, | |
| "eval_steps_per_second": 8.14, | |
| "step": 1378 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "grad_norm": 0.0344400629401207, | |
| "learning_rate": 4.3e-05, | |
| "loss": 0.0058, | |
| "step": 1484 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_LOCATION_f1": 0.7763157894736842, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7108433734939759, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7352941176470588, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.9396825396825397, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9135802469135802, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.7941176470588235, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.75, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8307692307692308, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7941176470588235, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.24048586189746857, | |
| "eval_overall_accuracy": 0.9648253653703245, | |
| "eval_overall_f1": 0.8451086956521738, | |
| "eval_overall_precision": 0.7974358974358975, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.3742, | |
| "eval_samples_per_second": 499.756, | |
| "eval_steps_per_second": 8.017, | |
| "step": 1484 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "grad_norm": 0.006385091692209244, | |
| "learning_rate": 4.25e-05, | |
| "loss": 0.0053, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_LOCATION_f1": 0.7972972972972974, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7468354430379747, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7407407407407408, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6756756756756757, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.93125, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8922155688622755, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.823529411764706, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7777777777777778, | |
| "eval_QUANTITY_recall": 0.875, | |
| "eval_TIME_f1": 0.7714285714285716, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.6923076923076923, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.25498369336128235, | |
| "eval_overall_accuracy": 0.9623482784245727, | |
| "eval_overall_f1": 0.844804318488529, | |
| "eval_overall_precision": 0.7924050632911392, | |
| "eval_overall_recall": 0.9046242774566474, | |
| "eval_runtime": 0.367, | |
| "eval_samples_per_second": 509.472, | |
| "eval_steps_per_second": 8.173, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "grad_norm": 0.007103159092366695, | |
| "learning_rate": 4.2e-05, | |
| "loss": 0.0045, | |
| "step": 1696 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_LOCATION_f1": 0.8108108108108109, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.759493670886076, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.71875, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6865671641791045, | |
| "eval_ORGANIZATION_recall": 0.7540983606557377, | |
| "eval_PERSON_f1": 0.9367088607594937, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9079754601226994, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.8615384615384615, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8484848484848485, | |
| "eval_QUANTITY_recall": 0.875, | |
| "eval_TIME_f1": 0.8307692307692308, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7941176470588235, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.2411327213048935, | |
| "eval_overall_accuracy": 0.9663116175377756, | |
| "eval_overall_f1": 0.8559556786703602, | |
| "eval_overall_precision": 0.8218085106382979, | |
| "eval_overall_recall": 0.8930635838150289, | |
| "eval_runtime": 0.367, | |
| "eval_samples_per_second": 509.544, | |
| "eval_steps_per_second": 8.175, | |
| "step": 1696 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "grad_norm": 0.005618996452540159, | |
| "learning_rate": 4.15e-05, | |
| "loss": 0.0044, | |
| "step": 1802 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "eval_LOCATION_f1": 0.8194444444444444, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7866666666666666, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7218045112781954, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9240506329113924, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8957055214723927, | |
| "eval_PERSON_recall": 0.954248366013072, | |
| "eval_QUANTITY_f1": 0.8615384615384615, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8484848484848485, | |
| "eval_QUANTITY_recall": 0.875, | |
| "eval_TIME_f1": 0.8059701492537312, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.75, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.23781569302082062, | |
| "eval_overall_accuracy": 0.9663116175377756, | |
| "eval_overall_f1": 0.8496551724137931, | |
| "eval_overall_precision": 0.8126649076517151, | |
| "eval_overall_recall": 0.8901734104046243, | |
| "eval_runtime": 0.3633, | |
| "eval_samples_per_second": 514.728, | |
| "eval_steps_per_second": 8.258, | |
| "step": 1802 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "grad_norm": 0.00691909808665514, | |
| "learning_rate": 4.1e-05, | |
| "loss": 0.004, | |
| "step": 1908 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_LOCATION_f1": 0.7891156462585034, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7435897435897436, | |
| "eval_LOCATION_recall": 0.8405797101449275, | |
| "eval_ORGANIZATION_f1": 0.7205882352941175, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6533333333333333, | |
| "eval_ORGANIZATION_recall": 0.8032786885245902, | |
| "eval_PERSON_f1": 0.9211356466876972, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8902439024390244, | |
| "eval_PERSON_recall": 0.954248366013072, | |
| "eval_QUANTITY_f1": 0.7826086956521738, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7297297297297297, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8115942028985507, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7368421052631579, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.28217267990112305, | |
| "eval_overall_accuracy": 0.9618528610354223, | |
| "eval_overall_f1": 0.8346883468834689, | |
| "eval_overall_precision": 0.7857142857142857, | |
| "eval_overall_recall": 0.8901734104046243, | |
| "eval_runtime": 0.3659, | |
| "eval_samples_per_second": 511.052, | |
| "eval_steps_per_second": 8.199, | |
| "step": 1908 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "grad_norm": 0.018693506717681885, | |
| "learning_rate": 4.05e-05, | |
| "loss": 0.0043, | |
| "step": 2014 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "eval_LOCATION_f1": 0.8275862068965517, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7894736842105263, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7058823529411764, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.64, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9426751592356687, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9192546583850931, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.823529411764706, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7777777777777778, | |
| "eval_QUANTITY_recall": 0.875, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.23565581440925598, | |
| "eval_overall_accuracy": 0.9658162001486252, | |
| "eval_overall_f1": 0.8547945205479451, | |
| "eval_overall_precision": 0.8125, | |
| "eval_overall_recall": 0.9017341040462428, | |
| "eval_runtime": 0.3727, | |
| "eval_samples_per_second": 501.787, | |
| "eval_steps_per_second": 8.05, | |
| "step": 2014 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "grad_norm": 0.0034094720613211393, | |
| "learning_rate": 4e-05, | |
| "loss": 0.0032, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_LOCATION_f1": 0.7702702702702703, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7215189873417721, | |
| "eval_LOCATION_recall": 0.8260869565217391, | |
| "eval_ORGANIZATION_f1": 0.7301587301587301, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7076923076923077, | |
| "eval_ORGANIZATION_recall": 0.7540983606557377, | |
| "eval_PERSON_f1": 0.9201277955271565, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9, | |
| "eval_PERSON_recall": 0.9411764705882353, | |
| "eval_QUANTITY_f1": 0.7941176470588235, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.75, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8615384615384616, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8235294117647058, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.24556776881217957, | |
| "eval_overall_accuracy": 0.9635868218974486, | |
| "eval_overall_f1": 0.8388888888888889, | |
| "eval_overall_precision": 0.8074866310160428, | |
| "eval_overall_recall": 0.8728323699421965, | |
| "eval_runtime": 0.3742, | |
| "eval_samples_per_second": 499.754, | |
| "eval_steps_per_second": 8.017, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "grad_norm": 0.006027919240295887, | |
| "learning_rate": 3.9500000000000005e-05, | |
| "loss": 0.0036, | |
| "step": 2226 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "eval_LOCATION_f1": 0.8108108108108109, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.759493670886076, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.6986301369863014, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9126213592233009, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9038461538461539, | |
| "eval_PERSON_recall": 0.9215686274509803, | |
| "eval_QUANTITY_f1": 0.7714285714285714, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7105263157894737, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8253968253968254, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8125, | |
| "eval_TIME_recall": 0.8387096774193549, | |
| "eval_loss": 0.27808642387390137, | |
| "eval_overall_accuracy": 0.9618528610354223, | |
| "eval_overall_f1": 0.828804347826087, | |
| "eval_overall_precision": 0.782051282051282, | |
| "eval_overall_recall": 0.8815028901734104, | |
| "eval_runtime": 0.3671, | |
| "eval_samples_per_second": 509.462, | |
| "eval_steps_per_second": 8.173, | |
| "step": 2226 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "grad_norm": 0.08943280577659607, | |
| "learning_rate": 3.9000000000000006e-05, | |
| "loss": 0.0029, | |
| "step": 2332 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "eval_LOCATION_f1": 0.8356164383561644, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7464788732394366, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.654320987654321, | |
| "eval_ORGANIZATION_recall": 0.8688524590163934, | |
| "eval_PERSON_f1": 0.930817610062893, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.896969696969697, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.7941176470588235, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.75, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.782608695652174, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7105263157894737, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.3044780194759369, | |
| "eval_overall_accuracy": 0.9635868218974486, | |
| "eval_overall_f1": 0.8506056527590848, | |
| "eval_overall_precision": 0.7959697732997482, | |
| "eval_overall_recall": 0.9132947976878613, | |
| "eval_runtime": 0.3751, | |
| "eval_samples_per_second": 498.515, | |
| "eval_steps_per_second": 7.998, | |
| "step": 2332 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "grad_norm": 0.008143425919115543, | |
| "learning_rate": 3.85e-05, | |
| "loss": 0.0023, | |
| "step": 2438 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "eval_LOCATION_f1": 0.8551724137931034, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8157894736842105, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.6911764705882353, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6266666666666667, | |
| "eval_ORGANIZATION_recall": 0.7704918032786885, | |
| "eval_PERSON_f1": 0.9367088607594937, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9079754601226994, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.8181818181818182, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7941176470588235, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8059701492537312, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.75, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.2635738253593445, | |
| "eval_overall_accuracy": 0.9663116175377756, | |
| "eval_overall_f1": 0.8520547945205479, | |
| "eval_overall_precision": 0.8098958333333334, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.3625, | |
| "eval_samples_per_second": 515.906, | |
| "eval_steps_per_second": 8.277, | |
| "step": 2438 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "grad_norm": 14.303221702575684, | |
| "learning_rate": 3.8e-05, | |
| "loss": 0.0059, | |
| "step": 2544 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "eval_LOCATION_f1": 0.786206896551724, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.75, | |
| "eval_LOCATION_recall": 0.8260869565217391, | |
| "eval_ORGANIZATION_f1": 0.7, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.620253164556962, | |
| "eval_ORGANIZATION_recall": 0.8032786885245902, | |
| "eval_PERSON_f1": 0.9426751592356687, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9192546583850931, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.7826086956521738, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7297297297297297, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8181818181818182, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7714285714285715, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.272360235452652, | |
| "eval_overall_accuracy": 0.9633391132028735, | |
| "eval_overall_f1": 0.8392370572207084, | |
| "eval_overall_precision": 0.7938144329896907, | |
| "eval_overall_recall": 0.8901734104046243, | |
| "eval_runtime": 0.3692, | |
| "eval_samples_per_second": 506.476, | |
| "eval_steps_per_second": 8.125, | |
| "step": 2544 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "grad_norm": 0.13158877193927765, | |
| "learning_rate": 3.7500000000000003e-05, | |
| "loss": 0.002, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "eval_LOCATION_f1": 0.8137931034482757, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7763157894736842, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.6666666666666666, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.5875, | |
| "eval_ORGANIZATION_recall": 0.7704918032786885, | |
| "eval_PERSON_f1": 0.9389067524115756, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9240506329113924, | |
| "eval_PERSON_recall": 0.954248366013072, | |
| "eval_QUANTITY_f1": 0.7536231884057971, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7027027027027027, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8615384615384616, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8235294117647058, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.25297293066978455, | |
| "eval_overall_accuracy": 0.9648253653703245, | |
| "eval_overall_f1": 0.8372093023255814, | |
| "eval_overall_precision": 0.7948051948051948, | |
| "eval_overall_recall": 0.884393063583815, | |
| "eval_runtime": 0.3604, | |
| "eval_samples_per_second": 518.829, | |
| "eval_steps_per_second": 8.323, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "grad_norm": 1.7319470643997192, | |
| "learning_rate": 3.7e-05, | |
| "loss": 0.0037, | |
| "step": 2756 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "eval_LOCATION_f1": 0.7517730496453902, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7361111111111112, | |
| "eval_LOCATION_recall": 0.7681159420289855, | |
| "eval_ORGANIZATION_f1": 0.7007299270072993, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.631578947368421, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9299363057324841, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.906832298136646, | |
| "eval_PERSON_recall": 0.954248366013072, | |
| "eval_QUANTITY_f1": 0.7887323943661971, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.717948717948718, | |
| "eval_QUANTITY_recall": 0.875, | |
| "eval_TIME_f1": 0.8115942028985507, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7368421052631579, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2652280628681183, | |
| "eval_overall_accuracy": 0.9601189001733961, | |
| "eval_overall_f1": 0.8278688524590163, | |
| "eval_overall_precision": 0.7849740932642487, | |
| "eval_overall_recall": 0.8757225433526011, | |
| "eval_runtime": 0.3664, | |
| "eval_samples_per_second": 510.378, | |
| "eval_steps_per_second": 8.188, | |
| "step": 2756 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "grad_norm": 0.21630139648914337, | |
| "learning_rate": 3.65e-05, | |
| "loss": 0.0052, | |
| "step": 2862 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "eval_LOCATION_f1": 0.8026315789473685, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7349397590361446, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.6993006993006993, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6097560975609756, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.9396825396825397, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9135802469135802, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.8615384615384615, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8484848484848485, | |
| "eval_QUANTITY_recall": 0.875, | |
| "eval_TIME_f1": 0.8059701492537312, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.75, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.25186625123023987, | |
| "eval_overall_accuracy": 0.9663116175377756, | |
| "eval_overall_f1": 0.8463611859838275, | |
| "eval_overall_precision": 0.7929292929292929, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3644, | |
| "eval_samples_per_second": 513.133, | |
| "eval_steps_per_second": 8.232, | |
| "step": 2862 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "grad_norm": 0.007407509256154299, | |
| "learning_rate": 3.6e-05, | |
| "loss": 0.0023, | |
| "step": 2968 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "eval_LOCATION_f1": 0.8489208633093526, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8428571428571429, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7230769230769231, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6811594202898551, | |
| "eval_ORGANIZATION_recall": 0.7704918032786885, | |
| "eval_PERSON_f1": 0.9456869009584665, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.925, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8125, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.7714285714285716, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.6923076923076923, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.25416678190231323, | |
| "eval_overall_accuracy": 0.9692841218726778, | |
| "eval_overall_f1": 0.8575418994413407, | |
| "eval_overall_precision": 0.8297297297297297, | |
| "eval_overall_recall": 0.8872832369942196, | |
| "eval_runtime": 0.3685, | |
| "eval_samples_per_second": 507.471, | |
| "eval_steps_per_second": 8.141, | |
| "step": 2968 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "grad_norm": 85.30389404296875, | |
| "learning_rate": 3.55e-05, | |
| "loss": 0.0042, | |
| "step": 3074 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "eval_LOCATION_f1": 0.8356164383561644, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7441860465116278, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7058823529411765, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9551282051282051, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9371069182389937, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8059701492537314, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7714285714285715, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8307692307692308, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7941176470588235, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.24519670009613037, | |
| "eval_overall_accuracy": 0.9687887044835274, | |
| "eval_overall_f1": 0.8678720445062588, | |
| "eval_overall_precision": 0.8364611260053619, | |
| "eval_overall_recall": 0.9017341040462428, | |
| "eval_runtime": 0.3665, | |
| "eval_samples_per_second": 510.289, | |
| "eval_steps_per_second": 8.186, | |
| "step": 3074 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "grad_norm": 0.044042494148015976, | |
| "learning_rate": 3.5e-05, | |
| "loss": 0.0016, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "eval_LOCATION_f1": 0.851063829787234, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8333333333333334, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.6976744186046512, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6617647058823529, | |
| "eval_ORGANIZATION_recall": 0.7377049180327869, | |
| "eval_PERSON_f1": 0.9490445859872612, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9254658385093167, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8059701492537314, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7714285714285715, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8307692307692308, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7941176470588235, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.2484143078327179, | |
| "eval_overall_accuracy": 0.9695318305672529, | |
| "eval_overall_f1": 0.8603351955307263, | |
| "eval_overall_precision": 0.8324324324324325, | |
| "eval_overall_recall": 0.8901734104046243, | |
| "eval_runtime": 0.3654, | |
| "eval_samples_per_second": 511.826, | |
| "eval_steps_per_second": 8.211, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "grad_norm": 0.03026013821363449, | |
| "learning_rate": 3.45e-05, | |
| "loss": 0.0017, | |
| "step": 3286 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "eval_LOCATION_f1": 0.8187919463087248, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7625, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7480916030534351, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7, | |
| "eval_ORGANIZATION_recall": 0.8032786885245902, | |
| "eval_PERSON_f1": 0.9430379746835442, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9141104294478528, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.7761194029850748, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7428571428571429, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8181818181818182, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7714285714285715, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.29129624366760254, | |
| "eval_overall_accuracy": 0.9643299479811741, | |
| "eval_overall_f1": 0.8559670781893004, | |
| "eval_overall_precision": 0.814621409921671, | |
| "eval_overall_recall": 0.9017341040462428, | |
| "eval_runtime": 0.3674, | |
| "eval_samples_per_second": 508.961, | |
| "eval_steps_per_second": 8.165, | |
| "step": 3286 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "grad_norm": 1.4942476749420166, | |
| "learning_rate": 3.4000000000000007e-05, | |
| "loss": 0.0033, | |
| "step": 3392 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "eval_LOCATION_f1": 0.855072463768116, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.855072463768116, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7819548872180451, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7222222222222222, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.9487179487179488, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9308176100628931, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.84375, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.84375, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.84375, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8181818181818182, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.23277780413627625, | |
| "eval_overall_accuracy": 0.9722566262075799, | |
| "eval_overall_f1": 0.880450070323488, | |
| "eval_overall_precision": 0.8575342465753425, | |
| "eval_overall_recall": 0.9046242774566474, | |
| "eval_runtime": 0.3786, | |
| "eval_samples_per_second": 493.877, | |
| "eval_steps_per_second": 7.923, | |
| "step": 3392 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "grad_norm": 0.0030820919200778008, | |
| "learning_rate": 3.35e-05, | |
| "loss": 0.0021, | |
| "step": 3498 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "eval_LOCATION_f1": 0.8194444444444444, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7866666666666666, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7310344827586208, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6309523809523809, | |
| "eval_ORGANIZATION_recall": 0.8688524590163934, | |
| "eval_PERSON_f1": 0.9245283018867925, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8909090909090909, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.8484848484848485, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8235294117647058, | |
| "eval_QUANTITY_recall": 0.875, | |
| "eval_TIME_f1": 0.8059701492537312, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.75, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.28664737939834595, | |
| "eval_overall_accuracy": 0.9650730740648997, | |
| "eval_overall_f1": 0.8486486486486486, | |
| "eval_overall_precision": 0.7969543147208121, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3626, | |
| "eval_samples_per_second": 515.746, | |
| "eval_steps_per_second": 8.274, | |
| "step": 3498 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "grad_norm": 0.013372019864618778, | |
| "learning_rate": 3.3e-05, | |
| "loss": 0.0034, | |
| "step": 3604 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "eval_LOCATION_f1": 0.8450704225352113, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.821917808219178, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7536231884057972, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6753246753246753, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.9363057324840764, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9130434782608695, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.8181818181818182, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7941176470588235, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8181818181818182, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7714285714285715, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.24620448052883148, | |
| "eval_overall_accuracy": 0.9705226653455536, | |
| "eval_overall_f1": 0.8622589531680441, | |
| "eval_overall_precision": 0.8236842105263158, | |
| "eval_overall_recall": 0.9046242774566474, | |
| "eval_runtime": 0.3647, | |
| "eval_samples_per_second": 512.754, | |
| "eval_steps_per_second": 8.226, | |
| "step": 3604 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "grad_norm": 0.00117175851482898, | |
| "learning_rate": 3.2500000000000004e-05, | |
| "loss": 0.0018, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "eval_LOCATION_f1": 0.851063829787234, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8333333333333334, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7536231884057972, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6753246753246753, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.930817610062893, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.896969696969697, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.8615384615384615, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8484848484848485, | |
| "eval_QUANTITY_recall": 0.875, | |
| "eval_TIME_f1": 0.8307692307692308, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7941176470588235, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.2648729979991913, | |
| "eval_overall_accuracy": 0.9685409957889521, | |
| "eval_overall_f1": 0.8665749656121046, | |
| "eval_overall_precision": 0.8267716535433071, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3621, | |
| "eval_samples_per_second": 516.468, | |
| "eval_steps_per_second": 8.286, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "grad_norm": 0.004863755311816931, | |
| "learning_rate": 3.2000000000000005e-05, | |
| "loss": 0.0015, | |
| "step": 3816 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "eval_LOCATION_f1": 0.8652482269503546, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8472222222222222, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7741935483870968, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7619047619047619, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9333333333333333, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9074074074074074, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.7941176470588235, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7297297297297297, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.2638514041900635, | |
| "eval_overall_accuracy": 0.9677978697052266, | |
| "eval_overall_f1": 0.8667601683029452, | |
| "eval_overall_precision": 0.8419618528610354, | |
| "eval_overall_recall": 0.8930635838150289, | |
| "eval_runtime": 0.3838, | |
| "eval_samples_per_second": 487.261, | |
| "eval_steps_per_second": 7.817, | |
| "step": 3816 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "grad_norm": 0.002965473337098956, | |
| "learning_rate": 3.15e-05, | |
| "loss": 0.0029, | |
| "step": 3922 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "eval_LOCATION_f1": 0.8413793103448277, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8026315789473685, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7633587786259541, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7142857142857143, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.9274447949526814, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8963414634146342, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.8059701492537314, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7714285714285715, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8307692307692308, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7941176470588235, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.2825859487056732, | |
| "eval_overall_accuracy": 0.9670547436215011, | |
| "eval_overall_f1": 0.8606896551724139, | |
| "eval_overall_precision": 0.8232189973614775, | |
| "eval_overall_recall": 0.9017341040462428, | |
| "eval_runtime": 0.3647, | |
| "eval_samples_per_second": 512.726, | |
| "eval_steps_per_second": 8.226, | |
| "step": 3922 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "grad_norm": 0.022443190217018127, | |
| "learning_rate": 3.1e-05, | |
| "loss": 0.0027, | |
| "step": 4028 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "eval_LOCATION_f1": 0.8413793103448277, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8026315789473685, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7391304347826089, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6623376623376623, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9456869009584665, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.925, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.7647058823529411, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7222222222222222, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.84375, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8181818181818182, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.26482775807380676, | |
| "eval_overall_accuracy": 0.9660639088432004, | |
| "eval_overall_f1": 0.8598901098901098, | |
| "eval_overall_precision": 0.819371727748691, | |
| "eval_overall_recall": 0.9046242774566474, | |
| "eval_runtime": 0.377, | |
| "eval_samples_per_second": 496.079, | |
| "eval_steps_per_second": 7.958, | |
| "step": 4028 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "grad_norm": 0.018067799508571625, | |
| "learning_rate": 3.05e-05, | |
| "loss": 0.0028, | |
| "step": 4134 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "eval_LOCATION_f1": 0.8611111111111112, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8266666666666667, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.7969924812030076, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7361111111111112, | |
| "eval_ORGANIZATION_recall": 0.8688524590163934, | |
| "eval_PERSON_f1": 0.9367088607594937, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9079754601226994, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.7761194029850748, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7428571428571429, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8405797101449276, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.9354838709677419, | |
| "eval_loss": 0.2490389049053192, | |
| "eval_overall_accuracy": 0.9687887044835274, | |
| "eval_overall_f1": 0.8724279835390947, | |
| "eval_overall_precision": 0.8302872062663186, | |
| "eval_overall_recall": 0.9190751445086706, | |
| "eval_runtime": 0.3616, | |
| "eval_samples_per_second": 517.153, | |
| "eval_steps_per_second": 8.297, | |
| "step": 4134 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "grad_norm": 0.012262631207704544, | |
| "learning_rate": 3e-05, | |
| "loss": 0.0015, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "eval_LOCATION_f1": 0.8695652173913043, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8695652173913043, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7323943661971831, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6419753086419753, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.9456869009584665, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.925, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.875, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8484848484848485, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.23013749718666077, | |
| "eval_overall_accuracy": 0.9712657914292792, | |
| "eval_overall_f1": 0.8698060941828255, | |
| "eval_overall_precision": 0.8351063829787234, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3684, | |
| "eval_samples_per_second": 507.649, | |
| "eval_steps_per_second": 8.144, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 41.0, | |
| "grad_norm": 0.0009043277241289616, | |
| "learning_rate": 2.95e-05, | |
| "loss": 0.0024, | |
| "step": 4346 | |
| }, | |
| { | |
| "epoch": 41.0, | |
| "eval_LOCATION_f1": 0.853146853146853, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8243243243243243, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7591240875912408, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6842105263157895, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.9430379746835442, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9141104294478528, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.84375, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8181818181818182, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.2405707687139511, | |
| "eval_overall_accuracy": 0.9677978697052266, | |
| "eval_overall_f1": 0.8677685950413223, | |
| "eval_overall_precision": 0.8289473684210527, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3649, | |
| "eval_samples_per_second": 512.484, | |
| "eval_steps_per_second": 8.222, | |
| "step": 4346 | |
| }, | |
| { | |
| "epoch": 42.0, | |
| "grad_norm": 0.08815114200115204, | |
| "learning_rate": 2.9e-05, | |
| "loss": 0.0015, | |
| "step": 4452 | |
| }, | |
| { | |
| "epoch": 42.0, | |
| "eval_LOCATION_f1": 0.851063829787234, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8333333333333334, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7704918032786885, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7704918032786885, | |
| "eval_ORGANIZATION_recall": 0.7704918032786885, | |
| "eval_PERSON_f1": 0.9456869009584665, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.925, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.8181818181818182, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7941176470588235, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.875, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8484848484848485, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2553688883781433, | |
| "eval_overall_accuracy": 0.9695318305672529, | |
| "eval_overall_f1": 0.8781869688385271, | |
| "eval_overall_precision": 0.8611111111111112, | |
| "eval_overall_recall": 0.8959537572254336, | |
| "eval_runtime": 0.3688, | |
| "eval_samples_per_second": 507.104, | |
| "eval_steps_per_second": 8.135, | |
| "step": 4452 | |
| }, | |
| { | |
| "epoch": 43.0, | |
| "grad_norm": 0.0011932431953027844, | |
| "learning_rate": 2.8499999999999998e-05, | |
| "loss": 0.0008, | |
| "step": 4558 | |
| }, | |
| { | |
| "epoch": 43.0, | |
| "eval_LOCATION_f1": 0.8591549295774648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8356164383561644, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7538461538461538, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7101449275362319, | |
| "eval_ORGANIZATION_recall": 0.8032786885245902, | |
| "eval_PERSON_f1": 0.9303797468354431, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.901840490797546, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.7941176470588235, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.75, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.875, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8484848484848485, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.26496070623397827, | |
| "eval_overall_accuracy": 0.9690364131781025, | |
| "eval_overall_f1": 0.8666666666666667, | |
| "eval_overall_precision": 0.8342245989304813, | |
| "eval_overall_recall": 0.9017341040462428, | |
| "eval_runtime": 0.3652, | |
| "eval_samples_per_second": 512.034, | |
| "eval_steps_per_second": 8.214, | |
| "step": 4558 | |
| }, | |
| { | |
| "epoch": 44.0, | |
| "grad_norm": 3.7293193340301514, | |
| "learning_rate": 2.8000000000000003e-05, | |
| "loss": 0.0017, | |
| "step": 4664 | |
| }, | |
| { | |
| "epoch": 44.0, | |
| "eval_LOCATION_f1": 0.8333333333333333, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7445255474452555, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6710526315789473, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9423076923076923, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9245283018867925, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.78125, | |
| "eval_TIME_f1": 0.8615384615384616, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8235294117647058, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.26268908381462097, | |
| "eval_overall_accuracy": 0.9677978697052266, | |
| "eval_overall_f1": 0.8603042876901797, | |
| "eval_overall_precision": 0.8249336870026526, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.3678, | |
| "eval_samples_per_second": 508.483, | |
| "eval_steps_per_second": 8.157, | |
| "step": 4664 | |
| }, | |
| { | |
| "epoch": 45.0, | |
| "grad_norm": 0.6390479803085327, | |
| "learning_rate": 2.7500000000000004e-05, | |
| "loss": 0.0013, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 45.0, | |
| "eval_LOCATION_f1": 0.8732394366197183, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8493150684931506, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.7464788732394366, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.654320987654321, | |
| "eval_ORGANIZATION_recall": 0.8688524590163934, | |
| "eval_PERSON_f1": 0.9363057324840764, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9130434782608695, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.8181818181818182, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7941176470588235, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.25916871428489685, | |
| "eval_overall_accuracy": 0.9695318305672529, | |
| "eval_overall_f1": 0.8684931506849316, | |
| "eval_overall_precision": 0.8255208333333334, | |
| "eval_overall_recall": 0.9161849710982659, | |
| "eval_runtime": 0.3656, | |
| "eval_samples_per_second": 511.447, | |
| "eval_steps_per_second": 8.205, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 46.0, | |
| "grad_norm": 0.010238826274871826, | |
| "learning_rate": 2.7000000000000002e-05, | |
| "loss": 0.0026, | |
| "step": 4876 | |
| }, | |
| { | |
| "epoch": 46.0, | |
| "eval_LOCATION_f1": 0.8356164383561644, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.75, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6506024096385542, | |
| "eval_ORGANIZATION_recall": 0.8852459016393442, | |
| "eval_PERSON_f1": 0.9216300940438872, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8855421686746988, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.8059701492537314, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7714285714285715, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.823529411764706, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7567567567567568, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2907452881336212, | |
| "eval_overall_accuracy": 0.9648253653703245, | |
| "eval_overall_f1": 0.8521505376344086, | |
| "eval_overall_precision": 0.7964824120603015, | |
| "eval_overall_recall": 0.9161849710982659, | |
| "eval_runtime": 0.3653, | |
| "eval_samples_per_second": 511.904, | |
| "eval_steps_per_second": 8.212, | |
| "step": 4876 | |
| }, | |
| { | |
| "epoch": 47.0, | |
| "grad_norm": 0.0005274274735711515, | |
| "learning_rate": 2.6500000000000004e-05, | |
| "loss": 0.0018, | |
| "step": 4982 | |
| }, | |
| { | |
| "epoch": 47.0, | |
| "eval_LOCATION_f1": 0.8611111111111112, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8266666666666667, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.7591240875912408, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6842105263157895, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.930817610062893, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.896969696969697, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.7462686567164178, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.78125, | |
| "eval_TIME_f1": 0.8059701492537312, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.75, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.2971247136592865, | |
| "eval_overall_accuracy": 0.9658162001486252, | |
| "eval_overall_f1": 0.8567530695770805, | |
| "eval_overall_precision": 0.8113695090439277, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3657, | |
| "eval_samples_per_second": 511.396, | |
| "eval_steps_per_second": 8.204, | |
| "step": 4982 | |
| }, | |
| { | |
| "epoch": 48.0, | |
| "grad_norm": 0.014134509488940239, | |
| "learning_rate": 2.6000000000000002e-05, | |
| "loss": 0.0014, | |
| "step": 5088 | |
| }, | |
| { | |
| "epoch": 48.0, | |
| "eval_LOCATION_f1": 0.8571428571428571, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8450704225352113, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7445255474452555, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6710526315789473, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.935897435897436, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9182389937106918, | |
| "eval_PERSON_recall": 0.954248366013072, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.78125, | |
| "eval_QUANTITY_recall": 0.78125, | |
| "eval_TIME_f1": 0.8888888888888888, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2763230800628662, | |
| "eval_overall_accuracy": 0.9680455783998019, | |
| "eval_overall_f1": 0.8659217877094972, | |
| "eval_overall_precision": 0.8378378378378378, | |
| "eval_overall_recall": 0.8959537572254336, | |
| "eval_runtime": 0.3626, | |
| "eval_samples_per_second": 515.776, | |
| "eval_steps_per_second": 8.274, | |
| "step": 5088 | |
| }, | |
| { | |
| "epoch": 49.0, | |
| "grad_norm": 0.01190261635929346, | |
| "learning_rate": 2.5500000000000003e-05, | |
| "loss": 0.0019, | |
| "step": 5194 | |
| }, | |
| { | |
| "epoch": 49.0, | |
| "eval_LOCATION_f1": 0.8450704225352113, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.821917808219178, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7058823529411764, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.64, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9294871794871795, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9119496855345912, | |
| "eval_PERSON_recall": 0.9477124183006536, | |
| "eval_QUANTITY_f1": 0.8307692307692308, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8181818181818182, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8709677419354839, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8709677419354839, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.27485761046409607, | |
| "eval_overall_accuracy": 0.9677978697052266, | |
| "eval_overall_f1": 0.8563458856345887, | |
| "eval_overall_precision": 0.8274932614555256, | |
| "eval_overall_recall": 0.8872832369942196, | |
| "eval_runtime": 0.3612, | |
| "eval_samples_per_second": 517.682, | |
| "eval_steps_per_second": 8.305, | |
| "step": 5194 | |
| }, | |
| { | |
| "epoch": 50.0, | |
| "grad_norm": 1.1005834341049194, | |
| "learning_rate": 2.5e-05, | |
| "loss": 0.0014, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 50.0, | |
| "eval_LOCATION_f1": 0.8133333333333332, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7530864197530864, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7205882352941175, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6533333333333333, | |
| "eval_ORGANIZATION_recall": 0.8032786885245902, | |
| "eval_PERSON_f1": 0.9517684887459807, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9367088607594937, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8615384615384616, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8235294117647058, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.29507261514663696, | |
| "eval_overall_accuracy": 0.9643299479811741, | |
| "eval_overall_f1": 0.8571428571428571, | |
| "eval_overall_precision": 0.8167539267015707, | |
| "eval_overall_recall": 0.9017341040462428, | |
| "eval_runtime": 0.3618, | |
| "eval_samples_per_second": 516.881, | |
| "eval_steps_per_second": 8.292, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 51.0, | |
| "grad_norm": 0.0018566737417131662, | |
| "learning_rate": 2.45e-05, | |
| "loss": 0.0017, | |
| "step": 5406 | |
| }, | |
| { | |
| "epoch": 51.0, | |
| "eval_LOCATION_f1": 0.8275862068965517, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7894736842105263, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.6962962962962963, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6351351351351351, | |
| "eval_ORGANIZATION_recall": 0.7704918032786885, | |
| "eval_PERSON_f1": 0.9329073482428115, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9125, | |
| "eval_PERSON_recall": 0.954248366013072, | |
| "eval_QUANTITY_f1": 0.8181818181818182, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7941176470588235, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8181818181818182, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7714285714285715, | |
| "eval_TIME_recall": 0.8709677419354839, | |
| "eval_loss": 0.28224554657936096, | |
| "eval_overall_accuracy": 0.9630914045082982, | |
| "eval_overall_f1": 0.8468965517241379, | |
| "eval_overall_precision": 0.8100263852242744, | |
| "eval_overall_recall": 0.8872832369942196, | |
| "eval_runtime": 0.3638, | |
| "eval_samples_per_second": 514.07, | |
| "eval_steps_per_second": 8.247, | |
| "step": 5406 | |
| }, | |
| { | |
| "epoch": 52.0, | |
| "grad_norm": 0.00030757131753489375, | |
| "learning_rate": 2.4e-05, | |
| "loss": 0.0015, | |
| "step": 5512 | |
| }, | |
| { | |
| "epoch": 52.0, | |
| "eval_LOCATION_f1": 0.8322147651006713, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.775, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.7142857142857143, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6329113924050633, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.9423076923076923, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9245283018867925, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.29711785912513733, | |
| "eval_overall_accuracy": 0.9650730740648997, | |
| "eval_overall_f1": 0.8528610354223434, | |
| "eval_overall_precision": 0.8067010309278351, | |
| "eval_overall_recall": 0.9046242774566474, | |
| "eval_runtime": 0.362, | |
| "eval_samples_per_second": 516.559, | |
| "eval_steps_per_second": 8.287, | |
| "step": 5512 | |
| }, | |
| { | |
| "epoch": 53.0, | |
| "grad_norm": 0.012948980554938316, | |
| "learning_rate": 2.35e-05, | |
| "loss": 0.0013, | |
| "step": 5618 | |
| }, | |
| { | |
| "epoch": 53.0, | |
| "eval_LOCATION_f1": 0.8108108108108109, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.759493670886076, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.6956521739130435, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6233766233766234, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9040247678018575, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8588235294117647, | |
| "eval_PERSON_recall": 0.954248366013072, | |
| "eval_QUANTITY_f1": 0.8181818181818182, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7941176470588235, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.3104041516780853, | |
| "eval_overall_accuracy": 0.9630914045082982, | |
| "eval_overall_f1": 0.8340080971659919, | |
| "eval_overall_precision": 0.7822784810126582, | |
| "eval_overall_recall": 0.8930635838150289, | |
| "eval_runtime": 0.3612, | |
| "eval_samples_per_second": 517.74, | |
| "eval_steps_per_second": 8.306, | |
| "step": 5618 | |
| }, | |
| { | |
| "epoch": 54.0, | |
| "grad_norm": 0.00616478780284524, | |
| "learning_rate": 2.3000000000000003e-05, | |
| "loss": 0.0014, | |
| "step": 5724 | |
| }, | |
| { | |
| "epoch": 54.0, | |
| "eval_LOCATION_f1": 0.8378378378378378, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7848101265822784, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.746031746031746, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7230769230769231, | |
| "eval_ORGANIZATION_recall": 0.7704918032786885, | |
| "eval_PERSON_f1": 0.923076923076923, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9056603773584906, | |
| "eval_PERSON_recall": 0.9411764705882353, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.78125, | |
| "eval_TIME_f1": 0.875, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8484848484848485, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.28169548511505127, | |
| "eval_overall_accuracy": 0.9645776566757494, | |
| "eval_overall_f1": 0.8559440559440559, | |
| "eval_overall_precision": 0.8292682926829268, | |
| "eval_overall_recall": 0.884393063583815, | |
| "eval_runtime": 0.3661, | |
| "eval_samples_per_second": 510.754, | |
| "eval_steps_per_second": 8.194, | |
| "step": 5724 | |
| }, | |
| { | |
| "epoch": 55.0, | |
| "grad_norm": 0.0019178962102159858, | |
| "learning_rate": 2.25e-05, | |
| "loss": 0.0005, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 55.0, | |
| "eval_LOCATION_f1": 0.8356164383561644, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.711111111111111, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6486486486486487, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9453376205787781, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.930379746835443, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.9032258064516129, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.9032258064516129, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.29151037335395813, | |
| "eval_overall_accuracy": 0.9648253653703245, | |
| "eval_overall_f1": 0.8623087621696801, | |
| "eval_overall_precision": 0.8310991957104558, | |
| "eval_overall_recall": 0.8959537572254336, | |
| "eval_runtime": 0.3686, | |
| "eval_samples_per_second": 507.352, | |
| "eval_steps_per_second": 8.139, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 56.0, | |
| "grad_norm": 0.0005920439143665135, | |
| "learning_rate": 2.2000000000000003e-05, | |
| "loss": 0.0009, | |
| "step": 5936 | |
| }, | |
| { | |
| "epoch": 56.0, | |
| "eval_LOCATION_f1": 0.8413793103448277, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8026315789473685, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7299270072992702, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6578947368421053, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.9487179487179488, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9308176100628931, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.9032258064516129, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.9032258064516129, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.30188778042793274, | |
| "eval_overall_accuracy": 0.9663116175377756, | |
| "eval_overall_f1": 0.8670360110803323, | |
| "eval_overall_precision": 0.8324468085106383, | |
| "eval_overall_recall": 0.9046242774566474, | |
| "eval_runtime": 0.3652, | |
| "eval_samples_per_second": 512.012, | |
| "eval_steps_per_second": 8.214, | |
| "step": 5936 | |
| }, | |
| { | |
| "epoch": 57.0, | |
| "grad_norm": 0.0004883262445218861, | |
| "learning_rate": 2.15e-05, | |
| "loss": 0.0009, | |
| "step": 6042 | |
| }, | |
| { | |
| "epoch": 57.0, | |
| "eval_LOCATION_f1": 0.8450704225352113, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.821917808219178, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7164179104477612, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6575342465753424, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.939297124600639, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.91875, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.9032258064516129, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.9032258064516129, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2943618893623352, | |
| "eval_overall_accuracy": 0.9665593262323507, | |
| "eval_overall_f1": 0.8631284916201116, | |
| "eval_overall_precision": 0.8351351351351352, | |
| "eval_overall_recall": 0.8930635838150289, | |
| "eval_runtime": 0.3709, | |
| "eval_samples_per_second": 504.197, | |
| "eval_steps_per_second": 8.089, | |
| "step": 6042 | |
| }, | |
| { | |
| "epoch": 58.0, | |
| "grad_norm": 0.0014432142488658428, | |
| "learning_rate": 2.1e-05, | |
| "loss": 0.0006, | |
| "step": 6148 | |
| }, | |
| { | |
| "epoch": 58.0, | |
| "eval_LOCATION_f1": 0.8368794326241135, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8194444444444444, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7230769230769231, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6811594202898551, | |
| "eval_ORGANIZATION_recall": 0.7704918032786885, | |
| "eval_PERSON_f1": 0.9363057324840764, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9130434782608695, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.9032258064516129, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.9032258064516129, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.28986239433288574, | |
| "eval_overall_accuracy": 0.9663116175377756, | |
| "eval_overall_f1": 0.8623595505617977, | |
| "eval_overall_precision": 0.8387978142076503, | |
| "eval_overall_recall": 0.8872832369942196, | |
| "eval_runtime": 0.3712, | |
| "eval_samples_per_second": 503.757, | |
| "eval_steps_per_second": 8.082, | |
| "step": 6148 | |
| }, | |
| { | |
| "epoch": 59.0, | |
| "grad_norm": 0.0014531804481521249, | |
| "learning_rate": 2.05e-05, | |
| "loss": 0.0005, | |
| "step": 6254 | |
| }, | |
| { | |
| "epoch": 59.0, | |
| "eval_LOCATION_f1": 0.8472222222222223, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8133333333333334, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7375886524822695, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.65, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.9517684887459807, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9367088607594937, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.29187676310539246, | |
| "eval_overall_accuracy": 0.9677978697052266, | |
| "eval_overall_f1": 0.8653846153846154, | |
| "eval_overall_precision": 0.824607329842932, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3703, | |
| "eval_samples_per_second": 505.003, | |
| "eval_steps_per_second": 8.102, | |
| "step": 6254 | |
| }, | |
| { | |
| "epoch": 60.0, | |
| "grad_norm": 0.000528964155819267, | |
| "learning_rate": 2e-05, | |
| "loss": 0.0006, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 60.0, | |
| "eval_LOCATION_f1": 0.8187919463087248, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7625, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7500000000000001, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.68, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9426751592356687, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9192546583850931, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.3160874545574188, | |
| "eval_overall_accuracy": 0.9638345305920237, | |
| "eval_overall_f1": 0.8579234972677596, | |
| "eval_overall_precision": 0.8134715025906736, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3784, | |
| "eval_samples_per_second": 494.206, | |
| "eval_steps_per_second": 7.928, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 61.0, | |
| "grad_norm": 0.001857202616520226, | |
| "learning_rate": 1.9500000000000003e-05, | |
| "loss": 0.0017, | |
| "step": 6466 | |
| }, | |
| { | |
| "epoch": 61.0, | |
| "eval_LOCATION_f1": 0.8243243243243245, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7721518987341772, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7518796992481204, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6944444444444444, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.9396825396825397, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9135802469135802, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.84375, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.84375, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2975999414920807, | |
| "eval_overall_accuracy": 0.9658162001486252, | |
| "eval_overall_f1": 0.8638239339752408, | |
| "eval_overall_precision": 0.8241469816272966, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3649, | |
| "eval_samples_per_second": 512.529, | |
| "eval_steps_per_second": 8.222, | |
| "step": 6466 | |
| }, | |
| { | |
| "epoch": 62.0, | |
| "grad_norm": 0.0003795857774093747, | |
| "learning_rate": 1.9e-05, | |
| "loss": 0.0004, | |
| "step": 6572 | |
| }, | |
| { | |
| "epoch": 62.0, | |
| "eval_LOCATION_f1": 0.8243243243243245, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7721518987341772, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.746031746031746, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7230769230769231, | |
| "eval_ORGANIZATION_recall": 0.7704918032786885, | |
| "eval_PERSON_f1": 0.9456869009584665, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.925, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.7761194029850748, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7428571428571429, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.3019534647464752, | |
| "eval_overall_accuracy": 0.9638345305920237, | |
| "eval_overall_f1": 0.8599167822468794, | |
| "eval_overall_precision": 0.8266666666666667, | |
| "eval_overall_recall": 0.8959537572254336, | |
| "eval_runtime": 0.3666, | |
| "eval_samples_per_second": 510.155, | |
| "eval_steps_per_second": 8.184, | |
| "step": 6572 | |
| }, | |
| { | |
| "epoch": 63.0, | |
| "grad_norm": 0.00042081772699020803, | |
| "learning_rate": 1.85e-05, | |
| "loss": 0.0004, | |
| "step": 6678 | |
| }, | |
| { | |
| "epoch": 63.0, | |
| "eval_LOCATION_f1": 0.821917808219178, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7792207792207793, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.762589928057554, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6794871794871795, | |
| "eval_ORGANIZATION_recall": 0.8688524590163934, | |
| "eval_PERSON_f1": 0.9453376205787781, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.930379746835443, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2791728079319, | |
| "eval_overall_accuracy": 0.966807034926926, | |
| "eval_overall_f1": 0.861454046639232, | |
| "eval_overall_precision": 0.8198433420365535, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3576, | |
| "eval_samples_per_second": 522.878, | |
| "eval_steps_per_second": 8.388, | |
| "step": 6678 | |
| }, | |
| { | |
| "epoch": 64.0, | |
| "grad_norm": 0.015575162135064602, | |
| "learning_rate": 1.8e-05, | |
| "loss": 0.001, | |
| "step": 6784 | |
| }, | |
| { | |
| "epoch": 64.0, | |
| "eval_LOCATION_f1": 0.8137931034482757, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7763157894736842, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.726027397260274, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6235294117647059, | |
| "eval_ORGANIZATION_recall": 0.8688524590163934, | |
| "eval_PERSON_f1": 0.946031746031746, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9197530864197531, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8181818181818182, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7941176470588235, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8888888888888888, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2865269184112549, | |
| "eval_overall_accuracy": 0.9665593262323507, | |
| "eval_overall_f1": 0.8598639455782313, | |
| "eval_overall_precision": 0.8123393316195373, | |
| "eval_overall_recall": 0.9132947976878613, | |
| "eval_runtime": 0.3652, | |
| "eval_samples_per_second": 512.011, | |
| "eval_steps_per_second": 8.214, | |
| "step": 6784 | |
| }, | |
| { | |
| "epoch": 65.0, | |
| "grad_norm": 0.0011894090566784143, | |
| "learning_rate": 1.75e-05, | |
| "loss": 0.0011, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 65.0, | |
| "eval_LOCATION_f1": 0.8201438848920863, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8142857142857143, | |
| "eval_LOCATION_recall": 0.8260869565217391, | |
| "eval_ORGANIZATION_f1": 0.732824427480916, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6857142857142857, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9490445859872612, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9254658385093167, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8888888888888888, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.291652649641037, | |
| "eval_overall_accuracy": 0.9680455783998019, | |
| "eval_overall_f1": 0.8639551192145861, | |
| "eval_overall_precision": 0.8392370572207084, | |
| "eval_overall_recall": 0.8901734104046243, | |
| "eval_runtime": 0.361, | |
| "eval_samples_per_second": 518.053, | |
| "eval_steps_per_second": 8.311, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 66.0, | |
| "grad_norm": 0.0299760140478611, | |
| "learning_rate": 1.7000000000000003e-05, | |
| "loss": 0.0014, | |
| "step": 6996 | |
| }, | |
| { | |
| "epoch": 66.0, | |
| "eval_LOCATION_f1": 0.8055555555555556, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7733333333333333, | |
| "eval_LOCATION_recall": 0.8405797101449275, | |
| "eval_ORGANIZATION_f1": 0.7375886524822695, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.65, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.946031746031746, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9197530864197531, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8888888888888888, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.27525565028190613, | |
| "eval_overall_accuracy": 0.9685409957889521, | |
| "eval_overall_f1": 0.8598901098901098, | |
| "eval_overall_precision": 0.819371727748691, | |
| "eval_overall_recall": 0.9046242774566474, | |
| "eval_runtime": 0.3758, | |
| "eval_samples_per_second": 497.654, | |
| "eval_steps_per_second": 7.984, | |
| "step": 6996 | |
| }, | |
| { | |
| "epoch": 67.0, | |
| "grad_norm": 0.0006641316576860845, | |
| "learning_rate": 1.65e-05, | |
| "loss": 0.0005, | |
| "step": 7102 | |
| }, | |
| { | |
| "epoch": 67.0, | |
| "eval_LOCATION_f1": 0.8194444444444444, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7866666666666666, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7361111111111112, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6385542168674698, | |
| "eval_ORGANIZATION_recall": 0.8688524590163934, | |
| "eval_PERSON_f1": 0.9400630914826499, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9085365853658537, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8888888888888888, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.288452684879303, | |
| "eval_overall_accuracy": 0.9663116175377756, | |
| "eval_overall_f1": 0.8583106267029972, | |
| "eval_overall_precision": 0.8118556701030928, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3617, | |
| "eval_samples_per_second": 516.981, | |
| "eval_steps_per_second": 8.294, | |
| "step": 7102 | |
| }, | |
| { | |
| "epoch": 68.0, | |
| "grad_norm": 0.0003661834343802184, | |
| "learning_rate": 1.6000000000000003e-05, | |
| "loss": 0.0004, | |
| "step": 7208 | |
| }, | |
| { | |
| "epoch": 68.0, | |
| "eval_LOCATION_f1": 0.8275862068965517, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7894736842105263, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7647058823529411, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6933333333333334, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.9551282051282051, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9371069182389937, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8125, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8888888888888888, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2738393545150757, | |
| "eval_overall_accuracy": 0.971018082734704, | |
| "eval_overall_f1": 0.8750000000000001, | |
| "eval_overall_precision": 0.8422459893048129, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3691, | |
| "eval_samples_per_second": 506.591, | |
| "eval_steps_per_second": 8.127, | |
| "step": 7208 | |
| }, | |
| { | |
| "epoch": 69.0, | |
| "grad_norm": 0.00032552139600738883, | |
| "learning_rate": 1.55e-05, | |
| "loss": 0.0002, | |
| "step": 7314 | |
| }, | |
| { | |
| "epoch": 69.0, | |
| "eval_LOCATION_f1": 0.8333333333333333, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7555555555555555, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6891891891891891, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9551282051282051, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9371069182389937, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8125, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.9032258064516129, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.9032258064516129, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2714591920375824, | |
| "eval_overall_accuracy": 0.971018082734704, | |
| "eval_overall_f1": 0.8758716875871689, | |
| "eval_overall_precision": 0.8463611859838275, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3611, | |
| "eval_samples_per_second": 517.91, | |
| "eval_steps_per_second": 8.309, | |
| "step": 7314 | |
| }, | |
| { | |
| "epoch": 70.0, | |
| "grad_norm": 0.0012234537862241268, | |
| "learning_rate": 1.5e-05, | |
| "loss": 0.0003, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 70.0, | |
| "eval_LOCATION_f1": 0.8333333333333333, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7761194029850746, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7123287671232876, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.946031746031746, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9197530864197531, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.9032258064516129, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.9032258064516129, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2793043553829193, | |
| "eval_overall_accuracy": 0.9705226653455536, | |
| "eval_overall_f1": 0.8750000000000001, | |
| "eval_overall_precision": 0.8422459893048129, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3626, | |
| "eval_samples_per_second": 515.737, | |
| "eval_steps_per_second": 8.274, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 71.0, | |
| "grad_norm": 0.00031636914354749024, | |
| "learning_rate": 1.45e-05, | |
| "loss": 0.0001, | |
| "step": 7526 | |
| }, | |
| { | |
| "epoch": 71.0, | |
| "eval_LOCATION_f1": 0.8333333333333333, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7761194029850746, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7123287671232876, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.9430379746835442, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9141104294478528, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.9032258064516129, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.9032258064516129, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.29805585741996765, | |
| "eval_overall_accuracy": 0.9690364131781025, | |
| "eval_overall_f1": 0.8737864077669903, | |
| "eval_overall_precision": 0.84, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3626, | |
| "eval_samples_per_second": 515.664, | |
| "eval_steps_per_second": 8.273, | |
| "step": 7526 | |
| }, | |
| { | |
| "epoch": 72.0, | |
| "grad_norm": 0.003590099047869444, | |
| "learning_rate": 1.4000000000000001e-05, | |
| "loss": 0.0005, | |
| "step": 7632 | |
| }, | |
| { | |
| "epoch": 72.0, | |
| "eval_LOCATION_f1": 0.8260869565217391, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8260869565217391, | |
| "eval_LOCATION_recall": 0.8260869565217391, | |
| "eval_ORGANIZATION_f1": 0.7633587786259541, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7142857142857143, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.9430379746835442, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9141104294478528, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8307692307692308, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8181818181818182, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.9032258064516129, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.9032258064516129, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.27618908882141113, | |
| "eval_overall_accuracy": 0.9707703740401288, | |
| "eval_overall_f1": 0.8735955056179775, | |
| "eval_overall_precision": 0.8497267759562842, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.3699, | |
| "eval_samples_per_second": 505.485, | |
| "eval_steps_per_second": 8.109, | |
| "step": 7632 | |
| }, | |
| { | |
| "epoch": 73.0, | |
| "grad_norm": 0.00027959441649727523, | |
| "learning_rate": 1.3500000000000001e-05, | |
| "loss": 0.0002, | |
| "step": 7738 | |
| }, | |
| { | |
| "epoch": 73.0, | |
| "eval_LOCATION_f1": 0.8391608391608392, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8108108108108109, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7500000000000001, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.68, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.946031746031746, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9197530864197531, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.9032258064516129, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.9032258064516129, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.28340503573417664, | |
| "eval_overall_accuracy": 0.9685409957889521, | |
| "eval_overall_f1": 0.8698060941828255, | |
| "eval_overall_precision": 0.8351063829787234, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.362, | |
| "eval_samples_per_second": 516.608, | |
| "eval_steps_per_second": 8.288, | |
| "step": 7738 | |
| }, | |
| { | |
| "epoch": 74.0, | |
| "grad_norm": 0.00044001045171171427, | |
| "learning_rate": 1.3000000000000001e-05, | |
| "loss": 0.0002, | |
| "step": 7844 | |
| }, | |
| { | |
| "epoch": 74.0, | |
| "eval_LOCATION_f1": 0.8275862068965517, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7894736842105263, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7681159420289856, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6883116883116883, | |
| "eval_ORGANIZATION_recall": 0.8688524590163934, | |
| "eval_PERSON_f1": 0.9551282051282051, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9371069182389937, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8181818181818182, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7941176470588235, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8888888888888888, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.27885836362838745, | |
| "eval_overall_accuracy": 0.9695318305672529, | |
| "eval_overall_f1": 0.8756906077348067, | |
| "eval_overall_precision": 0.8386243386243386, | |
| "eval_overall_recall": 0.9161849710982659, | |
| "eval_runtime": 0.3657, | |
| "eval_samples_per_second": 511.381, | |
| "eval_steps_per_second": 8.204, | |
| "step": 7844 | |
| }, | |
| { | |
| "epoch": 75.0, | |
| "grad_norm": 0.00027540308656170964, | |
| "learning_rate": 1.25e-05, | |
| "loss": 0.0001, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 75.0, | |
| "eval_LOCATION_f1": 0.821917808219178, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7792207792207793, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7737226277372262, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6973684210526315, | |
| "eval_ORGANIZATION_recall": 0.8688524590163934, | |
| "eval_PERSON_f1": 0.9430379746835442, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9141104294478528, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8181818181818182, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7941176470588235, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8888888888888888, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2948344945907593, | |
| "eval_overall_accuracy": 0.9673024523160763, | |
| "eval_overall_f1": 0.8708791208791209, | |
| "eval_overall_precision": 0.8298429319371727, | |
| "eval_overall_recall": 0.9161849710982659, | |
| "eval_runtime": 0.3634, | |
| "eval_samples_per_second": 514.56, | |
| "eval_steps_per_second": 8.255, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 76.0, | |
| "grad_norm": 0.007422334514558315, | |
| "learning_rate": 1.2e-05, | |
| "loss": 0.0004, | |
| "step": 8056 | |
| }, | |
| { | |
| "epoch": 76.0, | |
| "eval_LOCATION_f1": 0.8194444444444444, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7866666666666666, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7067669172932329, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6527777777777778, | |
| "eval_ORGANIZATION_recall": 0.7704918032786885, | |
| "eval_PERSON_f1": 0.9400630914826499, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9085365853658537, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8307692307692308, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8181818181818182, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8888888888888888, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.3101661205291748, | |
| "eval_overall_accuracy": 0.966807034926926, | |
| "eval_overall_f1": 0.8587257617728532, | |
| "eval_overall_precision": 0.824468085106383, | |
| "eval_overall_recall": 0.8959537572254336, | |
| "eval_runtime": 0.3638, | |
| "eval_samples_per_second": 513.997, | |
| "eval_steps_per_second": 8.246, | |
| "step": 8056 | |
| }, | |
| { | |
| "epoch": 77.0, | |
| "grad_norm": 0.0005564504535868764, | |
| "learning_rate": 1.1500000000000002e-05, | |
| "loss": 0.0005, | |
| "step": 8162 | |
| }, | |
| { | |
| "epoch": 77.0, | |
| "eval_LOCATION_f1": 0.8299319727891156, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.782051282051282, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7391304347826089, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6623376623376623, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9430379746835442, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9141104294478528, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.875, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8484848484848485, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.29981571435928345, | |
| "eval_overall_accuracy": 0.9663116175377756, | |
| "eval_overall_f1": 0.8618331053351572, | |
| "eval_overall_precision": 0.8181818181818182, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3758, | |
| "eval_samples_per_second": 497.657, | |
| "eval_steps_per_second": 7.984, | |
| "step": 8162 | |
| }, | |
| { | |
| "epoch": 78.0, | |
| "grad_norm": 0.003542252816259861, | |
| "learning_rate": 1.1000000000000001e-05, | |
| "loss": 0.0002, | |
| "step": 8268 | |
| }, | |
| { | |
| "epoch": 78.0, | |
| "eval_LOCATION_f1": 0.8194444444444444, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7866666666666666, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7703703703703704, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7027027027027027, | |
| "eval_ORGANIZATION_recall": 0.8524590163934426, | |
| "eval_PERSON_f1": 0.946031746031746, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9197530864197531, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.875, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8484848484848485, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.28981682658195496, | |
| "eval_overall_accuracy": 0.9675501610106515, | |
| "eval_overall_f1": 0.8686030428769017, | |
| "eval_overall_precision": 0.8328912466843501, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3708, | |
| "eval_samples_per_second": 504.361, | |
| "eval_steps_per_second": 8.091, | |
| "step": 8268 | |
| }, | |
| { | |
| "epoch": 79.0, | |
| "grad_norm": 0.0004401499463710934, | |
| "learning_rate": 1.05e-05, | |
| "loss": 0.0003, | |
| "step": 8374 | |
| }, | |
| { | |
| "epoch": 79.0, | |
| "eval_LOCATION_f1": 0.8169014084507042, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7945205479452054, | |
| "eval_LOCATION_recall": 0.8405797101449275, | |
| "eval_ORGANIZATION_f1": 0.7538461538461538, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7101449275362319, | |
| "eval_ORGANIZATION_recall": 0.8032786885245902, | |
| "eval_PERSON_f1": 0.952076677316294, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.93125, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.84375, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.84375, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8888888888888888, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2755199670791626, | |
| "eval_overall_accuracy": 0.9695318305672529, | |
| "eval_overall_f1": 0.8735955056179775, | |
| "eval_overall_precision": 0.8497267759562842, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.3648, | |
| "eval_samples_per_second": 512.67, | |
| "eval_steps_per_second": 8.225, | |
| "step": 8374 | |
| }, | |
| { | |
| "epoch": 80.0, | |
| "grad_norm": 0.00034126470563933253, | |
| "learning_rate": 1e-05, | |
| "loss": 0.0004, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 80.0, | |
| "eval_LOCATION_f1": 0.8082191780821918, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7662337662337663, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7424242424242424, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.6901408450704225, | |
| "eval_ORGANIZATION_recall": 0.8032786885245902, | |
| "eval_PERSON_f1": 0.9371069182389938, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9030303030303031, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.787878787878788, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2898205518722534, | |
| "eval_overall_accuracy": 0.96556849145405, | |
| "eval_overall_f1": 0.8532235939643347, | |
| "eval_overall_precision": 0.8120104438642297, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.3951, | |
| "eval_samples_per_second": 473.261, | |
| "eval_steps_per_second": 7.592, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 81.0, | |
| "grad_norm": 0.000562498637009412, | |
| "learning_rate": 9.5e-06, | |
| "loss": 0.0003, | |
| "step": 8586 | |
| }, | |
| { | |
| "epoch": 81.0, | |
| "eval_LOCATION_f1": 0.8251748251748252, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7972972972972973, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7500000000000001, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.68, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9337539432176657, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9024390243902439, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.84375, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.84375, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.875, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8484848484848485, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.28580695390701294, | |
| "eval_overall_accuracy": 0.9687887044835274, | |
| "eval_overall_f1": 0.8646408839779005, | |
| "eval_overall_precision": 0.828042328042328, | |
| "eval_overall_recall": 0.9046242774566474, | |
| "eval_runtime": 0.3627, | |
| "eval_samples_per_second": 515.648, | |
| "eval_steps_per_second": 8.272, | |
| "step": 8586 | |
| }, | |
| { | |
| "epoch": 82.0, | |
| "grad_norm": 0.0003717710787896067, | |
| "learning_rate": 9e-06, | |
| "loss": 0.0004, | |
| "step": 8692 | |
| }, | |
| { | |
| "epoch": 82.0, | |
| "eval_LOCATION_f1": 0.802721088435374, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7564102564102564, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.765625, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7313432835820896, | |
| "eval_ORGANIZATION_recall": 0.8032786885245902, | |
| "eval_PERSON_f1": 0.9430379746835442, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9141104294478528, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8125, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.875, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8484848484848485, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.28542497754096985, | |
| "eval_overall_accuracy": 0.9695318305672529, | |
| "eval_overall_f1": 0.8650904033379694, | |
| "eval_overall_precision": 0.8337801608579088, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.3698, | |
| "eval_samples_per_second": 505.716, | |
| "eval_steps_per_second": 8.113, | |
| "step": 8692 | |
| }, | |
| { | |
| "epoch": 83.0, | |
| "grad_norm": 0.0019057561876252294, | |
| "learning_rate": 8.500000000000002e-06, | |
| "loss": 0.0004, | |
| "step": 8798 | |
| }, | |
| { | |
| "epoch": 83.0, | |
| "eval_LOCATION_f1": 0.8243243243243245, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7721518987341772, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7941176470588235, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.72, | |
| "eval_ORGANIZATION_recall": 0.8852459016393442, | |
| "eval_PERSON_f1": 0.9400630914826499, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9085365853658537, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2824600636959076, | |
| "eval_overall_accuracy": 0.9692841218726778, | |
| "eval_overall_f1": 0.8688524590163936, | |
| "eval_overall_precision": 0.8238341968911918, | |
| "eval_overall_recall": 0.9190751445086706, | |
| "eval_runtime": 0.3654, | |
| "eval_samples_per_second": 511.741, | |
| "eval_steps_per_second": 8.21, | |
| "step": 8798 | |
| }, | |
| { | |
| "epoch": 84.0, | |
| "grad_norm": 0.001229365007020533, | |
| "learning_rate": 8.000000000000001e-06, | |
| "loss": 0.0006, | |
| "step": 8904 | |
| }, | |
| { | |
| "epoch": 84.0, | |
| "eval_LOCATION_f1": 0.8226950354609929, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8055555555555556, | |
| "eval_LOCATION_recall": 0.8405797101449275, | |
| "eval_ORGANIZATION_f1": 0.7874015748031497, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7575757575757576, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.952076677316294, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.93125, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.875, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8484848484848485, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.26607078313827515, | |
| "eval_overall_accuracy": 0.9720089175130047, | |
| "eval_overall_f1": 0.876056338028169, | |
| "eval_overall_precision": 0.8543956043956044, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.3766, | |
| "eval_samples_per_second": 496.598, | |
| "eval_steps_per_second": 7.967, | |
| "step": 8904 | |
| }, | |
| { | |
| "epoch": 85.0, | |
| "grad_norm": 0.00014708787784911692, | |
| "learning_rate": 7.5e-06, | |
| "loss": 0.0003, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 85.0, | |
| "eval_LOCATION_f1": 0.8333333333333333, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.7559055118110236, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7272727272727273, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.9400630914826499, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9085365853658537, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.293227881193161, | |
| "eval_overall_accuracy": 0.9677978697052266, | |
| "eval_overall_f1": 0.8638888888888889, | |
| "eval_overall_precision": 0.8315508021390374, | |
| "eval_overall_recall": 0.8988439306358381, | |
| "eval_runtime": 0.364, | |
| "eval_samples_per_second": 513.774, | |
| "eval_steps_per_second": 8.242, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 86.0, | |
| "grad_norm": 0.003805099753662944, | |
| "learning_rate": 7.000000000000001e-06, | |
| "loss": 0.0006, | |
| "step": 9116 | |
| }, | |
| { | |
| "epoch": 86.0, | |
| "eval_LOCATION_f1": 0.8345323741007195, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8285714285714286, | |
| "eval_LOCATION_recall": 0.8405797101449275, | |
| "eval_ORGANIZATION_f1": 0.768, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.75, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.946031746031746, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9197530864197531, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8307692307692308, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8181818181818182, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2930375337600708, | |
| "eval_overall_accuracy": 0.9685409957889521, | |
| "eval_overall_f1": 0.8732394366197184, | |
| "eval_overall_precision": 0.8516483516483516, | |
| "eval_overall_recall": 0.8959537572254336, | |
| "eval_runtime": 0.3668, | |
| "eval_samples_per_second": 509.746, | |
| "eval_steps_per_second": 8.178, | |
| "step": 9116 | |
| }, | |
| { | |
| "epoch": 87.0, | |
| "grad_norm": 0.04100840538740158, | |
| "learning_rate": 6.5000000000000004e-06, | |
| "loss": 0.0005, | |
| "step": 9222 | |
| }, | |
| { | |
| "epoch": 87.0, | |
| "eval_LOCATION_f1": 0.8169014084507042, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7945205479452054, | |
| "eval_LOCATION_recall": 0.8405797101449275, | |
| "eval_ORGANIZATION_f1": 0.7559055118110236, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7272727272727273, | |
| "eval_ORGANIZATION_recall": 0.7868852459016393, | |
| "eval_PERSON_f1": 0.93125, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8922155688622755, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.823529411764706, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7567567567567568, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.3029007911682129, | |
| "eval_overall_accuracy": 0.9663116175377756, | |
| "eval_overall_f1": 0.8559556786703602, | |
| "eval_overall_precision": 0.8218085106382979, | |
| "eval_overall_recall": 0.8930635838150289, | |
| "eval_runtime": 0.3762, | |
| "eval_samples_per_second": 497.075, | |
| "eval_steps_per_second": 7.974, | |
| "step": 9222 | |
| }, | |
| { | |
| "epoch": 88.0, | |
| "grad_norm": 0.0002212318213423714, | |
| "learning_rate": 6e-06, | |
| "loss": 0.0003, | |
| "step": 9328 | |
| }, | |
| { | |
| "epoch": 88.0, | |
| "eval_LOCATION_f1": 0.8251748251748252, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7972972972972973, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7786259541984734, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7285714285714285, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.93125, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8922155688622755, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8115942028985507, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7368421052631579, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.30660566687583923, | |
| "eval_overall_accuracy": 0.9665593262323507, | |
| "eval_overall_f1": 0.8598901098901098, | |
| "eval_overall_precision": 0.819371727748691, | |
| "eval_overall_recall": 0.9046242774566474, | |
| "eval_runtime": 0.3705, | |
| "eval_samples_per_second": 504.729, | |
| "eval_steps_per_second": 8.097, | |
| "step": 9328 | |
| }, | |
| { | |
| "epoch": 89.0, | |
| "grad_norm": 0.000250909011811018, | |
| "learning_rate": 5.500000000000001e-06, | |
| "loss": 0.0001, | |
| "step": 9434 | |
| }, | |
| { | |
| "epoch": 89.0, | |
| "eval_LOCATION_f1": 0.8137931034482757, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7763157894736842, | |
| "eval_LOCATION_recall": 0.855072463768116, | |
| "eval_ORGANIZATION_f1": 0.7692307692307692, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7246376811594203, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.9341692789968652, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8975903614457831, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8115942028985507, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7368421052631579, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.30867499113082886, | |
| "eval_overall_accuracy": 0.9650730740648997, | |
| "eval_overall_f1": 0.8571428571428571, | |
| "eval_overall_precision": 0.8167539267015707, | |
| "eval_overall_recall": 0.9017341040462428, | |
| "eval_runtime": 0.3615, | |
| "eval_samples_per_second": 517.307, | |
| "eval_steps_per_second": 8.299, | |
| "step": 9434 | |
| }, | |
| { | |
| "epoch": 90.0, | |
| "grad_norm": 0.00021638131875079125, | |
| "learning_rate": 5e-06, | |
| "loss": 0.0001, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 90.0, | |
| "eval_LOCATION_f1": 0.8266666666666668, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7654320987654321, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.7633587786259541, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7142857142857143, | |
| "eval_ORGANIZATION_recall": 0.819672131147541, | |
| "eval_PERSON_f1": 0.9216300940438872, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8855421686746988, | |
| "eval_PERSON_recall": 0.9607843137254902, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.31429383158683777, | |
| "eval_overall_accuracy": 0.9653207827594749, | |
| "eval_overall_f1": 0.8551912568306012, | |
| "eval_overall_precision": 0.810880829015544, | |
| "eval_overall_recall": 0.9046242774566474, | |
| "eval_runtime": 0.3713, | |
| "eval_samples_per_second": 503.676, | |
| "eval_steps_per_second": 8.08, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 91.0, | |
| "grad_norm": 0.00013644745922647417, | |
| "learning_rate": 4.5e-06, | |
| "loss": 0.0001, | |
| "step": 9646 | |
| }, | |
| { | |
| "epoch": 91.0, | |
| "eval_LOCATION_f1": 0.8243243243243245, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7721518987341772, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7786259541984734, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7285714285714285, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.930817610062893, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.896969696969697, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.835820895522388, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.2944120168685913, | |
| "eval_overall_accuracy": 0.968293287094377, | |
| "eval_overall_f1": 0.861454046639232, | |
| "eval_overall_precision": 0.8198433420365535, | |
| "eval_overall_recall": 0.9075144508670521, | |
| "eval_runtime": 0.3632, | |
| "eval_samples_per_second": 514.858, | |
| "eval_steps_per_second": 8.26, | |
| "step": 9646 | |
| }, | |
| { | |
| "epoch": 92.0, | |
| "grad_norm": 0.0009539081365801394, | |
| "learning_rate": 4.000000000000001e-06, | |
| "loss": 0.0002, | |
| "step": 9752 | |
| }, | |
| { | |
| "epoch": 92.0, | |
| "eval_LOCATION_f1": 0.8322147651006713, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.775, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.7727272727272727, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7183098591549296, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9249999999999999, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8862275449101796, | |
| "eval_PERSON_recall": 0.9673202614379085, | |
| "eval_QUANTITY_f1": 0.8307692307692308, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8181818181818182, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.823529411764706, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.7567567567567568, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.31182703375816345, | |
| "eval_overall_accuracy": 0.9670547436215011, | |
| "eval_overall_f1": 0.8610354223433242, | |
| "eval_overall_precision": 0.8144329896907216, | |
| "eval_overall_recall": 0.9132947976878613, | |
| "eval_runtime": 0.3679, | |
| "eval_samples_per_second": 508.226, | |
| "eval_steps_per_second": 8.153, | |
| "step": 9752 | |
| }, | |
| { | |
| "epoch": 93.0, | |
| "grad_norm": 0.00018770851602312177, | |
| "learning_rate": 3.5000000000000004e-06, | |
| "loss": 0.0003, | |
| "step": 9858 | |
| }, | |
| { | |
| "epoch": 93.0, | |
| "eval_LOCATION_f1": 0.8378378378378378, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7848101265822784, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.7786259541984734, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7285714285714285, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.93125, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8922155688622755, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8307692307692308, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8181818181818182, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.30489107966423035, | |
| "eval_overall_accuracy": 0.968293287094377, | |
| "eval_overall_f1": 0.8684931506849316, | |
| "eval_overall_precision": 0.8255208333333334, | |
| "eval_overall_recall": 0.9161849710982659, | |
| "eval_runtime": 0.3644, | |
| "eval_samples_per_second": 513.217, | |
| "eval_steps_per_second": 8.233, | |
| "step": 9858 | |
| }, | |
| { | |
| "epoch": 94.0, | |
| "grad_norm": 0.0019927462562918663, | |
| "learning_rate": 3e-06, | |
| "loss": 0.0001, | |
| "step": 9964 | |
| }, | |
| { | |
| "epoch": 94.0, | |
| "eval_LOCATION_f1": 0.8243243243243245, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7721518987341772, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7786259541984734, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7285714285714285, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.93125, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8922155688622755, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8307692307692308, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.8181818181818182, | |
| "eval_QUANTITY_recall": 0.84375, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.3039020299911499, | |
| "eval_overall_accuracy": 0.968293287094377, | |
| "eval_overall_f1": 0.8657534246575342, | |
| "eval_overall_precision": 0.8229166666666666, | |
| "eval_overall_recall": 0.9132947976878613, | |
| "eval_runtime": 0.3778, | |
| "eval_samples_per_second": 494.941, | |
| "eval_steps_per_second": 7.94, | |
| "step": 9964 | |
| }, | |
| { | |
| "epoch": 95.0, | |
| "grad_norm": 0.00036656216252595186, | |
| "learning_rate": 2.5e-06, | |
| "loss": 0.0003, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 95.0, | |
| "eval_LOCATION_f1": 0.8187919463087248, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7625, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7786259541984734, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7285714285714285, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9371069182389938, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.9030303030303031, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.30329030752182007, | |
| "eval_overall_accuracy": 0.968293287094377, | |
| "eval_overall_f1": 0.8641975308641975, | |
| "eval_overall_precision": 0.8224543080939948, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3655, | |
| "eval_samples_per_second": 511.653, | |
| "eval_steps_per_second": 8.208, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 96.0, | |
| "grad_norm": 0.00014269202074501663, | |
| "learning_rate": 2.0000000000000003e-06, | |
| "loss": 0.0005, | |
| "step": 10176 | |
| }, | |
| { | |
| "epoch": 96.0, | |
| "eval_LOCATION_f1": 0.8187919463087248, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7625, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7786259541984734, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7285714285714285, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.93125, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8922155688622755, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.30583375692367554, | |
| "eval_overall_accuracy": 0.9675501610106515, | |
| "eval_overall_f1": 0.8618331053351572, | |
| "eval_overall_precision": 0.8181818181818182, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3755, | |
| "eval_samples_per_second": 497.939, | |
| "eval_steps_per_second": 7.988, | |
| "step": 10176 | |
| }, | |
| { | |
| "epoch": 97.0, | |
| "grad_norm": 0.0001223723666043952, | |
| "learning_rate": 1.5e-06, | |
| "loss": 0.0001, | |
| "step": 10282 | |
| }, | |
| { | |
| "epoch": 97.0, | |
| "eval_LOCATION_f1": 0.8187919463087248, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7625, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7786259541984734, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7285714285714285, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9341692789968652, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8975903614457831, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.3053462505340576, | |
| "eval_overall_accuracy": 0.9677978697052266, | |
| "eval_overall_f1": 0.863013698630137, | |
| "eval_overall_precision": 0.8203125, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3619, | |
| "eval_samples_per_second": 516.75, | |
| "eval_steps_per_second": 8.29, | |
| "step": 10282 | |
| }, | |
| { | |
| "epoch": 98.0, | |
| "grad_norm": 0.0004060152277816087, | |
| "learning_rate": 1.0000000000000002e-06, | |
| "loss": 0.0001, | |
| "step": 10388 | |
| }, | |
| { | |
| "epoch": 98.0, | |
| "eval_LOCATION_f1": 0.8187919463087248, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7625, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7786259541984734, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7285714285714285, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.9341692789968652, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8975903614457831, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.3043583929538727, | |
| "eval_overall_accuracy": 0.9677978697052266, | |
| "eval_overall_f1": 0.863013698630137, | |
| "eval_overall_precision": 0.8203125, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3759, | |
| "eval_samples_per_second": 497.529, | |
| "eval_steps_per_second": 7.982, | |
| "step": 10388 | |
| }, | |
| { | |
| "epoch": 99.0, | |
| "grad_norm": 0.00019621806859504431, | |
| "learning_rate": 5.000000000000001e-07, | |
| "loss": 0.0001, | |
| "step": 10494 | |
| }, | |
| { | |
| "epoch": 99.0, | |
| "eval_LOCATION_f1": 0.8187919463087248, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7625, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7786259541984734, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7285714285714285, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.93125, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8922155688622755, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.3064700961112976, | |
| "eval_overall_accuracy": 0.9675501610106515, | |
| "eval_overall_f1": 0.8618331053351572, | |
| "eval_overall_precision": 0.8181818181818182, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3646, | |
| "eval_samples_per_second": 512.932, | |
| "eval_steps_per_second": 8.229, | |
| "step": 10494 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "grad_norm": 0.0006661502993665636, | |
| "learning_rate": 0.0, | |
| "loss": 0.0001, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "eval_LOCATION_f1": 0.8187919463087248, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7625, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.7786259541984734, | |
| "eval_ORGANIZATION_number": 61, | |
| "eval_ORGANIZATION_precision": 0.7285714285714285, | |
| "eval_ORGANIZATION_recall": 0.8360655737704918, | |
| "eval_PERSON_f1": 0.93125, | |
| "eval_PERSON_number": 153, | |
| "eval_PERSON_precision": 0.8922155688622755, | |
| "eval_PERSON_recall": 0.9738562091503268, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 32, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8125, | |
| "eval_TIME_f1": 0.8484848484848486, | |
| "eval_TIME_number": 31, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.9032258064516129, | |
| "eval_loss": 0.3065154552459717, | |
| "eval_overall_accuracy": 0.9675501610106515, | |
| "eval_overall_f1": 0.8618331053351572, | |
| "eval_overall_precision": 0.8181818181818182, | |
| "eval_overall_recall": 0.9104046242774566, | |
| "eval_runtime": 0.3714, | |
| "eval_samples_per_second": 503.447, | |
| "eval_steps_per_second": 8.077, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "step": 10600, | |
| "total_flos": 4560509291304846.0, | |
| "train_loss": 0.008112131665891283, | |
| "train_runtime": 974.3295, | |
| "train_samples_per_second": 173.145, | |
| "train_steps_per_second": 10.879 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 10600, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 100, | |
| "save_steps": 500, | |
| "total_flos": 4560509291304846.0, | |
| "train_batch_size": 16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |