| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 100.0, | |
| "eval_steps": 500, | |
| "global_step": 10600, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "grad_norm": 2.184743642807007, | |
| "learning_rate": 4.9500000000000004e-05, | |
| "loss": 0.9441, | |
| "step": 106 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_LOCATION_f1": 0.0, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.0, | |
| "eval_LOCATION_recall": 0.0, | |
| "eval_ORGANIZATION_f1": 0.0, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.0, | |
| "eval_ORGANIZATION_recall": 0.0, | |
| "eval_PERSON_f1": 0.013071895424836602, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.3333333333333333, | |
| "eval_PERSON_recall": 0.006666666666666667, | |
| "eval_QUANTITY_f1": 0.0, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.0, | |
| "eval_QUANTITY_recall": 0.0, | |
| "eval_TIME_f1": 0.0, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.0, | |
| "eval_TIME_recall": 0.0, | |
| "eval_loss": 0.6184682846069336, | |
| "eval_overall_accuracy": 0.8414161008729389, | |
| "eval_overall_f1": 0.005714285714285714, | |
| "eval_overall_precision": 0.3333333333333333, | |
| "eval_overall_recall": 0.002881844380403458, | |
| "eval_runtime": 0.3345, | |
| "eval_samples_per_second": 558.979, | |
| "eval_steps_per_second": 8.968, | |
| "step": 106 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "grad_norm": 1.0305746793746948, | |
| "learning_rate": 4.9e-05, | |
| "loss": 0.5645, | |
| "step": 212 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_LOCATION_f1": 0.22916666666666669, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.44, | |
| "eval_LOCATION_recall": 0.15492957746478872, | |
| "eval_ORGANIZATION_f1": 0.04, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.05714285714285714, | |
| "eval_ORGANIZATION_recall": 0.03076923076923077, | |
| "eval_PERSON_f1": 0.5449438202247192, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.470873786407767, | |
| "eval_PERSON_recall": 0.6466666666666666, | |
| "eval_QUANTITY_f1": 0.0, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.0, | |
| "eval_QUANTITY_recall": 0.0, | |
| "eval_TIME_f1": 0.43478260869565216, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.5555555555555556, | |
| "eval_TIME_recall": 0.35714285714285715, | |
| "eval_loss": 0.41943466663360596, | |
| "eval_overall_accuracy": 0.8877303588748787, | |
| "eval_overall_f1": 0.3803486529318542, | |
| "eval_overall_precision": 0.4225352112676056, | |
| "eval_overall_recall": 0.345821325648415, | |
| "eval_runtime": 0.3265, | |
| "eval_samples_per_second": 572.669, | |
| "eval_steps_per_second": 9.187, | |
| "step": 212 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "grad_norm": 1.2039958238601685, | |
| "learning_rate": 4.85e-05, | |
| "loss": 0.3968, | |
| "step": 318 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_LOCATION_f1": 0.5153374233128835, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.45652173913043476, | |
| "eval_LOCATION_recall": 0.5915492957746479, | |
| "eval_ORGANIZATION_f1": 0.3278688524590164, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.3508771929824561, | |
| "eval_ORGANIZATION_recall": 0.3076923076923077, | |
| "eval_PERSON_f1": 0.6829268292682927, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.5753424657534246, | |
| "eval_PERSON_recall": 0.84, | |
| "eval_QUANTITY_f1": 0.1846153846153846, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.1875, | |
| "eval_QUANTITY_recall": 0.18181818181818182, | |
| "eval_TIME_f1": 0.8076923076923077, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.875, | |
| "eval_TIME_recall": 0.75, | |
| "eval_loss": 0.30941861867904663, | |
| "eval_overall_accuracy": 0.9202230843840931, | |
| "eval_overall_f1": 0.5577172503242542, | |
| "eval_overall_precision": 0.5070754716981132, | |
| "eval_overall_recall": 0.6195965417867435, | |
| "eval_runtime": 0.3361, | |
| "eval_samples_per_second": 556.318, | |
| "eval_steps_per_second": 8.925, | |
| "step": 318 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "grad_norm": 4.7056145668029785, | |
| "learning_rate": 4.8e-05, | |
| "loss": 0.2937, | |
| "step": 424 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_LOCATION_f1": 0.5465116279069767, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.46534653465346537, | |
| "eval_LOCATION_recall": 0.6619718309859155, | |
| "eval_ORGANIZATION_f1": 0.4878048780487805, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5172413793103449, | |
| "eval_ORGANIZATION_recall": 0.46153846153846156, | |
| "eval_PERSON_f1": 0.8036809815950918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.7443181818181818, | |
| "eval_PERSON_recall": 0.8733333333333333, | |
| "eval_QUANTITY_f1": 0.47368421052631576, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.4186046511627907, | |
| "eval_QUANTITY_recall": 0.5454545454545454, | |
| "eval_TIME_f1": 0.8363636363636364, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8518518518518519, | |
| "eval_TIME_recall": 0.8214285714285714, | |
| "eval_loss": 0.2222605049610138, | |
| "eval_overall_accuracy": 0.9369544131910766, | |
| "eval_overall_f1": 0.6622340425531915, | |
| "eval_overall_precision": 0.6148148148148148, | |
| "eval_overall_recall": 0.7175792507204611, | |
| "eval_runtime": 0.3341, | |
| "eval_samples_per_second": 559.672, | |
| "eval_steps_per_second": 8.979, | |
| "step": 424 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "grad_norm": 1.303191900253296, | |
| "learning_rate": 4.75e-05, | |
| "loss": 0.2294, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_LOCATION_f1": 0.6496815286624205, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.5930232558139535, | |
| "eval_LOCATION_recall": 0.7183098591549296, | |
| "eval_ORGANIZATION_f1": 0.562962962962963, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5428571428571428, | |
| "eval_ORGANIZATION_recall": 0.5846153846153846, | |
| "eval_PERSON_f1": 0.8176100628930819, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.7738095238095238, | |
| "eval_PERSON_recall": 0.8666666666666667, | |
| "eval_QUANTITY_f1": 0.5316455696202532, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.45652173913043476, | |
| "eval_QUANTITY_recall": 0.6363636363636364, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.18041133880615234, | |
| "eval_overall_accuracy": 0.9427740058195926, | |
| "eval_overall_f1": 0.7106325706594886, | |
| "eval_overall_precision": 0.6666666666666666, | |
| "eval_overall_recall": 0.760806916426513, | |
| "eval_runtime": 0.3273, | |
| "eval_samples_per_second": 571.404, | |
| "eval_steps_per_second": 9.167, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "grad_norm": 1.6567788124084473, | |
| "learning_rate": 4.7e-05, | |
| "loss": 0.1955, | |
| "step": 636 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_LOCATION_f1": 0.7052023121387284, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.5980392156862745, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.5903614457831325, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.48514851485148514, | |
| "eval_ORGANIZATION_recall": 0.7538461538461538, | |
| "eval_PERSON_f1": 0.8109756097560976, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.7471910112359551, | |
| "eval_PERSON_recall": 0.8866666666666667, | |
| "eval_QUANTITY_f1": 0.5517241379310345, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.4444444444444444, | |
| "eval_QUANTITY_recall": 0.7272727272727273, | |
| "eval_TIME_f1": 0.793103448275862, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.7666666666666667, | |
| "eval_TIME_recall": 0.8214285714285714, | |
| "eval_loss": 0.19565138220787048, | |
| "eval_overall_accuracy": 0.9396217264791464, | |
| "eval_overall_f1": 0.7142857142857143, | |
| "eval_overall_precision": 0.6236559139784946, | |
| "eval_overall_recall": 0.8357348703170029, | |
| "eval_runtime": 0.3286, | |
| "eval_samples_per_second": 569.125, | |
| "eval_steps_per_second": 9.13, | |
| "step": 636 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "grad_norm": 2.8131422996520996, | |
| "learning_rate": 4.6500000000000005e-05, | |
| "loss": 0.1799, | |
| "step": 742 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_LOCATION_f1": 0.7374999999999999, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.6629213483146067, | |
| "eval_LOCATION_recall": 0.8309859154929577, | |
| "eval_ORGANIZATION_f1": 0.6482758620689656, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5875, | |
| "eval_ORGANIZATION_recall": 0.7230769230769231, | |
| "eval_PERSON_f1": 0.81875, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.7705882352941177, | |
| "eval_PERSON_recall": 0.8733333333333333, | |
| "eval_QUANTITY_f1": 0.6585365853658536, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.5510204081632653, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8275862068965518, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16057299077510834, | |
| "eval_overall_accuracy": 0.9468962172647915, | |
| "eval_overall_f1": 0.7529411764705883, | |
| "eval_overall_precision": 0.6889952153110048, | |
| "eval_overall_recall": 0.829971181556196, | |
| "eval_runtime": 0.3352, | |
| "eval_samples_per_second": 557.891, | |
| "eval_steps_per_second": 8.95, | |
| "step": 742 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "grad_norm": 0.7265537977218628, | |
| "learning_rate": 4.600000000000001e-05, | |
| "loss": 0.1628, | |
| "step": 848 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_LOCATION_f1": 0.7349397590361445, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.6421052631578947, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.6451612903225806, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5555555555555556, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8275862068965518, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.7810650887573964, | |
| "eval_PERSON_recall": 0.88, | |
| "eval_QUANTITY_f1": 0.6923076923076923, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8421052631578947, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8275862068965517, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15270720422267914, | |
| "eval_overall_accuracy": 0.9510184287099903, | |
| "eval_overall_f1": 0.7587096774193549, | |
| "eval_overall_precision": 0.6869158878504673, | |
| "eval_overall_recall": 0.8472622478386167, | |
| "eval_runtime": 0.3301, | |
| "eval_samples_per_second": 566.514, | |
| "eval_steps_per_second": 9.088, | |
| "step": 848 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "grad_norm": 1.15663743019104, | |
| "learning_rate": 4.55e-05, | |
| "loss": 0.1528, | |
| "step": 954 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_LOCATION_f1": 0.7564102564102564, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.6941176470588235, | |
| "eval_LOCATION_recall": 0.8309859154929577, | |
| "eval_ORGANIZATION_f1": 0.6351351351351351, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5662650602409639, | |
| "eval_ORGANIZATION_recall": 0.7230769230769231, | |
| "eval_PERSON_f1": 0.8397435897435898, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.808641975308642, | |
| "eval_PERSON_recall": 0.8733333333333333, | |
| "eval_QUANTITY_f1": 0.7200000000000001, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8771929824561403, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8620689655172413, | |
| "eval_TIME_recall": 0.8928571428571429, | |
| "eval_loss": 0.14164027571678162, | |
| "eval_overall_accuracy": 0.9522308438409312, | |
| "eval_overall_f1": 0.7727272727272728, | |
| "eval_overall_precision": 0.7206982543640897, | |
| "eval_overall_recall": 0.8328530259365994, | |
| "eval_runtime": 0.334, | |
| "eval_samples_per_second": 559.91, | |
| "eval_steps_per_second": 8.983, | |
| "step": 954 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "grad_norm": 1.8798385858535767, | |
| "learning_rate": 4.5e-05, | |
| "loss": 0.1466, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_LOCATION_f1": 0.7307692307692307, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.6705882352941176, | |
| "eval_LOCATION_recall": 0.8028169014084507, | |
| "eval_ORGANIZATION_f1": 0.625, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.569620253164557, | |
| "eval_ORGANIZATION_recall": 0.6923076923076923, | |
| "eval_PERSON_f1": 0.8387096774193549, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8125, | |
| "eval_PERSON_recall": 0.8666666666666667, | |
| "eval_QUANTITY_f1": 0.736842105263158, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6511627906976745, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8620689655172413, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8928571428571429, | |
| "eval_loss": 0.14073340594768524, | |
| "eval_overall_accuracy": 0.9522308438409312, | |
| "eval_overall_f1": 0.7661290322580645, | |
| "eval_overall_precision": 0.7178841309823678, | |
| "eval_overall_recall": 0.8213256484149856, | |
| "eval_runtime": 0.3345, | |
| "eval_samples_per_second": 559.025, | |
| "eval_steps_per_second": 8.968, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "grad_norm": 0.9395531415939331, | |
| "learning_rate": 4.4500000000000004e-05, | |
| "loss": 0.138, | |
| "step": 1166 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_LOCATION_f1": 0.775, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.6966292134831461, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.6666666666666666, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5975609756097561, | |
| "eval_ORGANIZATION_recall": 0.7538461538461538, | |
| "eval_PERSON_f1": 0.8360128617363344, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8074534161490683, | |
| "eval_PERSON_recall": 0.8666666666666667, | |
| "eval_QUANTITY_f1": 0.736842105263158, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6511627906976745, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8620689655172413, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8928571428571429, | |
| "eval_loss": 0.14058995246887207, | |
| "eval_overall_accuracy": 0.9536857419980601, | |
| "eval_overall_f1": 0.7819148936170213, | |
| "eval_overall_precision": 0.725925925925926, | |
| "eval_overall_recall": 0.8472622478386167, | |
| "eval_runtime": 0.3346, | |
| "eval_samples_per_second": 558.811, | |
| "eval_steps_per_second": 8.965, | |
| "step": 1166 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "grad_norm": 1.2153416872024536, | |
| "learning_rate": 4.4000000000000006e-05, | |
| "loss": 0.1314, | |
| "step": 1272 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_LOCATION_f1": 0.775, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.6966292134831461, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.6578947368421053, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5747126436781609, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8407643312101911, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8048780487804879, | |
| "eval_PERSON_recall": 0.88, | |
| "eval_QUANTITY_f1": 0.736842105263158, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6511627906976745, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.75, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14196860790252686, | |
| "eval_overall_accuracy": 0.953443258971872, | |
| "eval_overall_f1": 0.7769028871391075, | |
| "eval_overall_precision": 0.7132530120481928, | |
| "eval_overall_recall": 0.8530259365994236, | |
| "eval_runtime": 0.335, | |
| "eval_samples_per_second": 558.284, | |
| "eval_steps_per_second": 8.956, | |
| "step": 1272 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "grad_norm": 0.6423377990722656, | |
| "learning_rate": 4.35e-05, | |
| "loss": 0.1285, | |
| "step": 1378 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_LOCATION_f1": 0.7261146496815286, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.6627906976744186, | |
| "eval_LOCATION_recall": 0.8028169014084507, | |
| "eval_ORGANIZATION_f1": 0.6493506493506495, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5617977528089888, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8461538461538461, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8148148148148148, | |
| "eval_PERSON_recall": 0.88, | |
| "eval_QUANTITY_f1": 0.7466666666666666, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.9090909090909091, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9259259259259259, | |
| "eval_TIME_recall": 0.8928571428571429, | |
| "eval_loss": 0.13416315615177155, | |
| "eval_overall_accuracy": 0.954898157129001, | |
| "eval_overall_f1": 0.7755644090305446, | |
| "eval_overall_precision": 0.7192118226600985, | |
| "eval_overall_recall": 0.8414985590778098, | |
| "eval_runtime": 0.3287, | |
| "eval_samples_per_second": 568.933, | |
| "eval_steps_per_second": 9.127, | |
| "step": 1378 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "grad_norm": 3.325246572494507, | |
| "learning_rate": 4.3e-05, | |
| "loss": 0.1301, | |
| "step": 1484 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_LOCATION_f1": 0.7792207792207793, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7228915662650602, | |
| "eval_LOCATION_recall": 0.8450704225352113, | |
| "eval_ORGANIZATION_f1": 0.5915492957746479, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5454545454545454, | |
| "eval_ORGANIZATION_recall": 0.6461538461538462, | |
| "eval_PERSON_f1": 0.8488745980707395, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8198757763975155, | |
| "eval_PERSON_recall": 0.88, | |
| "eval_QUANTITY_f1": 0.7777777777777778, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.717948717948718, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8620689655172413, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8928571428571429, | |
| "eval_loss": 0.12784981727600098, | |
| "eval_overall_accuracy": 0.95635305528613, | |
| "eval_overall_f1": 0.778833107191316, | |
| "eval_overall_precision": 0.735897435897436, | |
| "eval_overall_recall": 0.8270893371757925, | |
| "eval_runtime": 0.3278, | |
| "eval_samples_per_second": 570.447, | |
| "eval_steps_per_second": 9.152, | |
| "step": 1484 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "grad_norm": 1.1983723640441895, | |
| "learning_rate": 4.25e-05, | |
| "loss": 0.1197, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_LOCATION_f1": 0.779874213836478, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7045454545454546, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7012987012987013, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6067415730337079, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8471337579617835, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8109756097560976, | |
| "eval_PERSON_recall": 0.8866666666666667, | |
| "eval_QUANTITY_f1": 0.7012987012987013, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6136363636363636, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8275862068965518, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1395217925310135, | |
| "eval_overall_accuracy": 0.9539282250242483, | |
| "eval_overall_f1": 0.7874015748031495, | |
| "eval_overall_precision": 0.7228915662650602, | |
| "eval_overall_recall": 0.8645533141210374, | |
| "eval_runtime": 0.3345, | |
| "eval_samples_per_second": 559.04, | |
| "eval_steps_per_second": 8.969, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "grad_norm": 2.9908885955810547, | |
| "learning_rate": 4.2e-05, | |
| "loss": 0.1147, | |
| "step": 1696 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7380952380952381, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.6853146853146853, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6282051282051282, | |
| "eval_ORGANIZATION_recall": 0.7538461538461538, | |
| "eval_PERSON_f1": 0.8461538461538461, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8148148148148148, | |
| "eval_PERSON_recall": 0.88, | |
| "eval_QUANTITY_f1": 0.7088607594936709, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6086956521739131, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.75, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13548891246318817, | |
| "eval_overall_accuracy": 0.9556256062075654, | |
| "eval_overall_f1": 0.787716955941255, | |
| "eval_overall_precision": 0.7338308457711443, | |
| "eval_overall_recall": 0.8501440922190202, | |
| "eval_runtime": 0.3346, | |
| "eval_samples_per_second": 558.836, | |
| "eval_steps_per_second": 8.965, | |
| "step": 1696 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "grad_norm": 0.7757030129432678, | |
| "learning_rate": 4.15e-05, | |
| "loss": 0.1134, | |
| "step": 1802 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "eval_LOCATION_f1": 0.7922077922077921, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7349397590361446, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.6618705035971223, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6216216216216216, | |
| "eval_ORGANIZATION_recall": 0.7076923076923077, | |
| "eval_PERSON_f1": 0.8498402555910542, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8159509202453987, | |
| "eval_PERSON_recall": 0.8866666666666667, | |
| "eval_QUANTITY_f1": 0.7105263157894738, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.627906976744186, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8421052631578947, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8275862068965517, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.12935349345207214, | |
| "eval_overall_accuracy": 0.95635305528613, | |
| "eval_overall_f1": 0.7875507442489851, | |
| "eval_overall_precision": 0.7423469387755102, | |
| "eval_overall_recall": 0.8386167146974063, | |
| "eval_runtime": 0.3338, | |
| "eval_samples_per_second": 560.266, | |
| "eval_steps_per_second": 8.988, | |
| "step": 1802 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "grad_norm": 1.1819586753845215, | |
| "learning_rate": 4.1e-05, | |
| "loss": 0.1103, | |
| "step": 1908 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7380952380952381, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7162162162162162, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6385542168674698, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8507936507936508, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8121212121212121, | |
| "eval_PERSON_recall": 0.8933333333333333, | |
| "eval_QUANTITY_f1": 0.736842105263158, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6511627906976745, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8421052631578947, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8275862068965517, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13496747612953186, | |
| "eval_overall_accuracy": 0.9568380213385063, | |
| "eval_overall_f1": 0.8015978695073236, | |
| "eval_overall_precision": 0.745049504950495, | |
| "eval_overall_recall": 0.8674351585014409, | |
| "eval_runtime": 0.329, | |
| "eval_samples_per_second": 568.336, | |
| "eval_steps_per_second": 9.118, | |
| "step": 1908 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "grad_norm": 1.253257393836975, | |
| "learning_rate": 4.05e-05, | |
| "loss": 0.1078, | |
| "step": 2014 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "eval_LOCATION_f1": 0.7973856209150327, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7439024390243902, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7162162162162162, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6385542168674698, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8498402555910542, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8159509202453987, | |
| "eval_PERSON_recall": 0.8866666666666667, | |
| "eval_QUANTITY_f1": 0.7200000000000001, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8571428571428571, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8571428571428571, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13079425692558289, | |
| "eval_overall_accuracy": 0.957807953443259, | |
| "eval_overall_f1": 0.7999999999999999, | |
| "eval_overall_precision": 0.7487437185929648, | |
| "eval_overall_recall": 0.8587896253602305, | |
| "eval_runtime": 0.3276, | |
| "eval_samples_per_second": 570.782, | |
| "eval_steps_per_second": 9.157, | |
| "step": 2014 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "grad_norm": 1.522292137145996, | |
| "learning_rate": 4e-05, | |
| "loss": 0.1051, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_LOCATION_f1": 0.7948717948717949, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7294117647058823, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.6814814814814816, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6571428571428571, | |
| "eval_ORGANIZATION_recall": 0.7076923076923077, | |
| "eval_PERSON_f1": 0.858974358974359, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8271604938271605, | |
| "eval_PERSON_recall": 0.8933333333333333, | |
| "eval_QUANTITY_f1": 0.7777777777777778, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.717948717948718, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.12830358743667603, | |
| "eval_overall_accuracy": 0.9587778855480117, | |
| "eval_overall_f1": 0.8054794520547945, | |
| "eval_overall_precision": 0.7676240208877284, | |
| "eval_overall_recall": 0.8472622478386167, | |
| "eval_runtime": 0.3338, | |
| "eval_samples_per_second": 560.26, | |
| "eval_steps_per_second": 8.988, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "grad_norm": 1.3046311140060425, | |
| "learning_rate": 3.9500000000000005e-05, | |
| "loss": 0.1013, | |
| "step": 2226 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7380952380952381, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7210884353741497, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6463414634146342, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8507936507936508, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8121212121212121, | |
| "eval_PERSON_recall": 0.8933333333333333, | |
| "eval_QUANTITY_f1": 0.736842105263158, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6511627906976745, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1330733597278595, | |
| "eval_overall_accuracy": 0.9585354025218235, | |
| "eval_overall_f1": 0.8048128342245989, | |
| "eval_overall_precision": 0.7506234413965087, | |
| "eval_overall_recall": 0.8674351585014409, | |
| "eval_runtime": 0.3364, | |
| "eval_samples_per_second": 555.954, | |
| "eval_steps_per_second": 8.919, | |
| "step": 2226 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "grad_norm": 1.648231863975525, | |
| "learning_rate": 3.9000000000000006e-05, | |
| "loss": 0.1015, | |
| "step": 2332 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "eval_LOCATION_f1": 0.7625, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.6853932584269663, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7044025157232704, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5957446808510638, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8481012658227848, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8072289156626506, | |
| "eval_PERSON_recall": 0.8933333333333333, | |
| "eval_QUANTITY_f1": 0.736842105263158, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6511627906976745, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8571428571428571, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8571428571428571, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1461816430091858, | |
| "eval_overall_accuracy": 0.9529582929194956, | |
| "eval_overall_f1": 0.7900912646675358, | |
| "eval_overall_precision": 0.7214285714285714, | |
| "eval_overall_recall": 0.8731988472622478, | |
| "eval_runtime": 0.3289, | |
| "eval_samples_per_second": 568.49, | |
| "eval_steps_per_second": 9.12, | |
| "step": 2332 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "grad_norm": 1.236881136894226, | |
| "learning_rate": 3.85e-05, | |
| "loss": 0.0952, | |
| "step": 2438 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "eval_LOCATION_f1": 0.8157894736842104, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7654320987654321, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7375886524822695, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6842105263157895, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8525641025641025, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8209876543209876, | |
| "eval_PERSON_recall": 0.8866666666666667, | |
| "eval_QUANTITY_f1": 0.7777777777777778, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.717948717948718, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.12616348266601562, | |
| "eval_overall_accuracy": 0.9612027158098934, | |
| "eval_overall_f1": 0.8180574555403557, | |
| "eval_overall_precision": 0.7786458333333334, | |
| "eval_overall_recall": 0.861671469740634, | |
| "eval_runtime": 0.3343, | |
| "eval_samples_per_second": 559.416, | |
| "eval_steps_per_second": 8.975, | |
| "step": 2438 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "grad_norm": 1.727121353149414, | |
| "learning_rate": 3.8e-05, | |
| "loss": 0.0957, | |
| "step": 2544 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "eval_LOCATION_f1": 0.7870967741935485, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7261904761904762, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7105263157894737, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6206896551724138, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8454258675078864, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8023952095808383, | |
| "eval_PERSON_recall": 0.8933333333333333, | |
| "eval_QUANTITY_f1": 0.736842105263158, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6511627906976745, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8571428571428571, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8571428571428571, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14105214178562164, | |
| "eval_overall_accuracy": 0.9556256062075654, | |
| "eval_overall_f1": 0.7962962962962963, | |
| "eval_overall_precision": 0.7359413202933985, | |
| "eval_overall_recall": 0.8674351585014409, | |
| "eval_runtime": 0.3271, | |
| "eval_samples_per_second": 571.627, | |
| "eval_steps_per_second": 9.17, | |
| "step": 2544 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "grad_norm": 1.6316332817077637, | |
| "learning_rate": 3.7500000000000003e-05, | |
| "loss": 0.0913, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7560975609756098, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7534246575342466, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6790123456790124, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8544303797468354, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8132530120481928, | |
| "eval_PERSON_recall": 0.9, | |
| "eval_QUANTITY_f1": 0.7272727272727273, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6363636363636364, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8421052631578947, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8275862068965517, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13811782002449036, | |
| "eval_overall_accuracy": 0.9582929194956353, | |
| "eval_overall_f1": 0.8117489986648865, | |
| "eval_overall_precision": 0.7562189054726368, | |
| "eval_overall_recall": 0.8760806916426513, | |
| "eval_runtime": 0.3283, | |
| "eval_samples_per_second": 569.644, | |
| "eval_steps_per_second": 9.139, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "grad_norm": 0.5518941879272461, | |
| "learning_rate": 3.7e-05, | |
| "loss": 0.091, | |
| "step": 2756 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "eval_LOCATION_f1": 0.782051282051282, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7176470588235294, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7361111111111112, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6708860759493671, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8643533123028392, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8203592814371258, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7179487179487178, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6222222222222222, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13771426677703857, | |
| "eval_overall_accuracy": 0.9575654704170709, | |
| "eval_overall_f1": 0.808, | |
| "eval_overall_precision": 0.7518610421836228, | |
| "eval_overall_recall": 0.8731988472622478, | |
| "eval_runtime": 0.3284, | |
| "eval_samples_per_second": 569.498, | |
| "eval_steps_per_second": 9.136, | |
| "step": 2756 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "grad_norm": 1.4636467695236206, | |
| "learning_rate": 3.65e-05, | |
| "loss": 0.0902, | |
| "step": 2862 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "eval_LOCATION_f1": 0.7770700636942676, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7093023255813954, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7248322147651007, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6428571428571429, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8517350157728706, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8083832335329342, | |
| "eval_PERSON_recall": 0.9, | |
| "eval_QUANTITY_f1": 0.6582278481012658, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.5652173913043478, | |
| "eval_QUANTITY_recall": 0.7878787878787878, | |
| "eval_TIME_f1": 0.8275862068965518, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14399109780788422, | |
| "eval_overall_accuracy": 0.9546556741028128, | |
| "eval_overall_f1": 0.7894736842105263, | |
| "eval_overall_precision": 0.7263922518159807, | |
| "eval_overall_recall": 0.8645533141210374, | |
| "eval_runtime": 0.3285, | |
| "eval_samples_per_second": 569.277, | |
| "eval_steps_per_second": 9.133, | |
| "step": 2862 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "grad_norm": 1.3473738431930542, | |
| "learning_rate": 3.6e-05, | |
| "loss": 0.087, | |
| "step": 2968 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "eval_LOCATION_f1": 0.794701986754967, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.75, | |
| "eval_LOCATION_recall": 0.8450704225352113, | |
| "eval_ORGANIZATION_f1": 0.7142857142857143, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6179775280898876, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8626198083067093, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8282208588957055, | |
| "eval_PERSON_recall": 0.9, | |
| "eval_QUANTITY_f1": 0.7777777777777778, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.717948717948718, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1355486363172531, | |
| "eval_overall_accuracy": 0.9582929194956353, | |
| "eval_overall_f1": 0.8118279569892473, | |
| "eval_overall_precision": 0.760705289672544, | |
| "eval_overall_recall": 0.8703170028818443, | |
| "eval_runtime": 0.3358, | |
| "eval_samples_per_second": 556.936, | |
| "eval_steps_per_second": 8.935, | |
| "step": 2968 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "grad_norm": 0.5319921970367432, | |
| "learning_rate": 3.55e-05, | |
| "loss": 0.0849, | |
| "step": 3074 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "eval_LOCATION_f1": 0.7922077922077921, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7349397590361446, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.6923076923076923, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5934065934065934, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8507936507936508, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8121212121212121, | |
| "eval_PERSON_recall": 0.8933333333333333, | |
| "eval_QUANTITY_f1": 0.7500000000000001, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6923076923076923, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13350827991962433, | |
| "eval_overall_accuracy": 0.9585354025218235, | |
| "eval_overall_f1": 0.7989347536617842, | |
| "eval_overall_precision": 0.7425742574257426, | |
| "eval_overall_recall": 0.8645533141210374, | |
| "eval_runtime": 0.3355, | |
| "eval_samples_per_second": 557.411, | |
| "eval_steps_per_second": 8.942, | |
| "step": 3074 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "grad_norm": 1.0683906078338623, | |
| "learning_rate": 3.5e-05, | |
| "loss": 0.0815, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "eval_LOCATION_f1": 0.7973856209150327, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7439024390243902, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7310344827586207, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6625, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7567567567567567, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6829268292682927, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13375303149223328, | |
| "eval_overall_accuracy": 0.9612027158098934, | |
| "eval_overall_f1": 0.8184281842818427, | |
| "eval_overall_precision": 0.7723785166240409, | |
| "eval_overall_recall": 0.8703170028818443, | |
| "eval_runtime": 0.3265, | |
| "eval_samples_per_second": 572.734, | |
| "eval_steps_per_second": 9.188, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "grad_norm": 0.8525239825248718, | |
| "learning_rate": 3.45e-05, | |
| "loss": 0.0838, | |
| "step": 3286 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "eval_LOCATION_f1": 0.782051282051282, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7176470588235294, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7333333333333334, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6470588235294118, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8670886075949367, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8253012048192772, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7567567567567567, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6829268292682927, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13723136484622955, | |
| "eval_overall_accuracy": 0.9587778855480117, | |
| "eval_overall_f1": 0.8133333333333335, | |
| "eval_overall_precision": 0.7568238213399504, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3342, | |
| "eval_samples_per_second": 559.545, | |
| "eval_steps_per_second": 8.977, | |
| "step": 3286 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "grad_norm": 1.4616408348083496, | |
| "learning_rate": 3.4000000000000007e-05, | |
| "loss": 0.076, | |
| "step": 3392 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "eval_LOCATION_f1": 0.7770700636942676, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7093023255813954, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.708860759493671, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6021505376344086, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8643533123028392, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8203592814371258, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7088607594936709, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6086956521739131, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1504770815372467, | |
| "eval_overall_accuracy": 0.954898157129001, | |
| "eval_overall_f1": 0.7989556135770235, | |
| "eval_overall_precision": 0.7303102625298329, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3276, | |
| "eval_samples_per_second": 570.905, | |
| "eval_steps_per_second": 9.159, | |
| "step": 3392 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "grad_norm": 2.1258466243743896, | |
| "learning_rate": 3.35e-05, | |
| "loss": 0.0775, | |
| "step": 3498 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7560975609756098, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.72992700729927, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6944444444444444, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.8000000000000002, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7567567567567568, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13078542053699493, | |
| "eval_overall_accuracy": 0.9633850630455868, | |
| "eval_overall_f1": 0.8264462809917356, | |
| "eval_overall_precision": 0.7915567282321899, | |
| "eval_overall_recall": 0.8645533141210374, | |
| "eval_runtime": 0.3335, | |
| "eval_samples_per_second": 560.709, | |
| "eval_steps_per_second": 8.995, | |
| "step": 3498 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "grad_norm": 1.6660958528518677, | |
| "learning_rate": 3.3e-05, | |
| "loss": 0.0768, | |
| "step": 3604 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7560975609756098, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7516778523489933, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8681672025723473, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8385093167701864, | |
| "eval_PERSON_recall": 0.9, | |
| "eval_QUANTITY_f1": 0.7777777777777778, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.717948717948718, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13354364037513733, | |
| "eval_overall_accuracy": 0.9612027158098934, | |
| "eval_overall_f1": 0.8254397834912043, | |
| "eval_overall_precision": 0.7780612244897959, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3334, | |
| "eval_samples_per_second": 560.904, | |
| "eval_steps_per_second": 8.998, | |
| "step": 3604 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "grad_norm": 0.7892407774925232, | |
| "learning_rate": 3.2500000000000004e-05, | |
| "loss": 0.0746, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "eval_LOCATION_f1": 0.7870967741935485, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7261904761904762, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7549668874172185, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6627906976744186, | |
| "eval_ORGANIZATION_recall": 0.8769230769230769, | |
| "eval_PERSON_f1": 0.8745980707395499, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84472049689441, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7671232876712328, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1393873244524002, | |
| "eval_overall_accuracy": 0.9587778855480117, | |
| "eval_overall_f1": 0.8225806451612904, | |
| "eval_overall_precision": 0.7707808564231738, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3336, | |
| "eval_samples_per_second": 560.581, | |
| "eval_steps_per_second": 8.993, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "grad_norm": 1.38412344455719, | |
| "learning_rate": 3.2000000000000005e-05, | |
| "loss": 0.0724, | |
| "step": 3816 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "eval_LOCATION_f1": 0.7948717948717949, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7294117647058823, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7051282051282052, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6043956043956044, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8589341692789968, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8106508875739645, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.8169014084507042, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7631578947368421, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14194774627685547, | |
| "eval_overall_accuracy": 0.957807953443259, | |
| "eval_overall_f1": 0.8110964332892999, | |
| "eval_overall_precision": 0.748780487804878, | |
| "eval_overall_recall": 0.8847262247838616, | |
| "eval_runtime": 0.328, | |
| "eval_samples_per_second": 570.085, | |
| "eval_steps_per_second": 9.146, | |
| "step": 3816 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "grad_norm": 1.6571606397628784, | |
| "learning_rate": 3.15e-05, | |
| "loss": 0.0703, | |
| "step": 3922 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "eval_LOCATION_f1": 0.7672955974842768, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.6931818181818182, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.708860759493671, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6021505376344086, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8698412698412699, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8303030303030303, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.6923076923076923, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15663577616214752, | |
| "eval_overall_accuracy": 0.9517458777885548, | |
| "eval_overall_f1": 0.7973856209150326, | |
| "eval_overall_precision": 0.7296650717703349, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3335, | |
| "eval_samples_per_second": 560.721, | |
| "eval_steps_per_second": 8.996, | |
| "step": 3922 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "grad_norm": 0.8099401593208313, | |
| "learning_rate": 3.1e-05, | |
| "loss": 0.07, | |
| "step": 4028 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "eval_LOCATION_f1": 0.7770700636942676, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7093023255813954, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7432432432432433, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6626506024096386, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.6835443037974683, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.5869565217391305, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8571428571428571, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8571428571428571, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14580821990966797, | |
| "eval_overall_accuracy": 0.9570805043646945, | |
| "eval_overall_f1": 0.8090185676392573, | |
| "eval_overall_precision": 0.7493857493857494, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3339, | |
| "eval_samples_per_second": 560.024, | |
| "eval_steps_per_second": 8.984, | |
| "step": 4028 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "grad_norm": 1.7465280294418335, | |
| "learning_rate": 3.05e-05, | |
| "loss": 0.0688, | |
| "step": 4134 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "eval_LOCATION_f1": 0.7721518987341772, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7011494252873564, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.713375796178344, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6086956521739131, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.8055555555555556, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7435897435897436, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14488695561885834, | |
| "eval_overall_accuracy": 0.9582929194956353, | |
| "eval_overall_f1": 0.8158940397350992, | |
| "eval_overall_precision": 0.7549019607843137, | |
| "eval_overall_recall": 0.8876080691642652, | |
| "eval_runtime": 0.3336, | |
| "eval_samples_per_second": 560.606, | |
| "eval_steps_per_second": 8.994, | |
| "step": 4134 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "grad_norm": 0.8754693269729614, | |
| "learning_rate": 3e-05, | |
| "loss": 0.0691, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7380952380952381, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7448275862068966, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.675, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7887323943661972, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7368421052631579, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.13563859462738037, | |
| "eval_overall_accuracy": 0.9614451988360815, | |
| "eval_overall_f1": 0.8281461434370772, | |
| "eval_overall_precision": 0.7806122448979592, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3276, | |
| "eval_samples_per_second": 570.796, | |
| "eval_steps_per_second": 9.157, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 41.0, | |
| "grad_norm": 0.3340809941291809, | |
| "learning_rate": 2.95e-05, | |
| "loss": 0.0673, | |
| "step": 4346 | |
| }, | |
| { | |
| "epoch": 41.0, | |
| "eval_LOCATION_f1": 0.7721518987341772, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7011494252873564, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.6962025316455697, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5913978494623656, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8698412698412699, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8303030303030303, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7012987012987013, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6136363636363636, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8571428571428571, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8571428571428571, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15314164757728577, | |
| "eval_overall_accuracy": 0.9539282250242483, | |
| "eval_overall_f1": 0.7958115183246073, | |
| "eval_overall_precision": 0.7290167865707434, | |
| "eval_overall_recall": 0.8760806916426513, | |
| "eval_runtime": 0.334, | |
| "eval_samples_per_second": 559.906, | |
| "eval_steps_per_second": 8.982, | |
| "step": 4346 | |
| }, | |
| { | |
| "epoch": 42.0, | |
| "grad_norm": 0.9933107495307922, | |
| "learning_rate": 2.9e-05, | |
| "loss": 0.0663, | |
| "step": 4452 | |
| }, | |
| { | |
| "epoch": 42.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7380952380952381, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7320261437908497, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6363636363636364, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8653846153846153, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8333333333333334, | |
| "eval_PERSON_recall": 0.9, | |
| "eval_QUANTITY_f1": 0.7466666666666666, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1424974650144577, | |
| "eval_overall_accuracy": 0.9580504364694471, | |
| "eval_overall_f1": 0.8144192256341789, | |
| "eval_overall_precision": 0.7587064676616916, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3347, | |
| "eval_samples_per_second": 558.702, | |
| "eval_steps_per_second": 8.963, | |
| "step": 4452 | |
| }, | |
| { | |
| "epoch": 43.0, | |
| "grad_norm": 0.6678488254547119, | |
| "learning_rate": 2.8499999999999998e-05, | |
| "loss": 0.0639, | |
| "step": 4558 | |
| }, | |
| { | |
| "epoch": 43.0, | |
| "eval_LOCATION_f1": 0.7948717948717949, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7294117647058823, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7285714285714285, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.68, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8562300319488818, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8220858895705522, | |
| "eval_PERSON_recall": 0.8933333333333333, | |
| "eval_QUANTITY_f1": 0.7671232876712328, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1413319855928421, | |
| "eval_overall_accuracy": 0.9592628516003879, | |
| "eval_overall_f1": 0.8113975576662144, | |
| "eval_overall_precision": 0.7666666666666667, | |
| "eval_overall_recall": 0.861671469740634, | |
| "eval_runtime": 0.3343, | |
| "eval_samples_per_second": 559.306, | |
| "eval_steps_per_second": 8.973, | |
| "step": 4558 | |
| }, | |
| { | |
| "epoch": 44.0, | |
| "grad_norm": 0.8438284993171692, | |
| "learning_rate": 2.8000000000000003e-05, | |
| "loss": 0.064, | |
| "step": 4664 | |
| }, | |
| { | |
| "epoch": 44.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7560975609756098, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7152317880794703, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.627906976744186, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8698412698412699, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8303030303030303, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7777777777777778, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.717948717948718, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14022959768772125, | |
| "eval_overall_accuracy": 0.9604752667313288, | |
| "eval_overall_f1": 0.8187919463087249, | |
| "eval_overall_precision": 0.7663316582914573, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3348, | |
| "eval_samples_per_second": 558.615, | |
| "eval_steps_per_second": 8.962, | |
| "step": 4664 | |
| }, | |
| { | |
| "epoch": 45.0, | |
| "grad_norm": 3.699862241744995, | |
| "learning_rate": 2.7500000000000004e-05, | |
| "loss": 0.0615, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 45.0, | |
| "eval_LOCATION_f1": 0.7721518987341772, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7011494252873564, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7189542483660131, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.625, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8782051282051282, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.845679012345679, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.6923076923076923, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15338602662086487, | |
| "eval_overall_accuracy": 0.9553831231813773, | |
| "eval_overall_f1": 0.8042328042328041, | |
| "eval_overall_precision": 0.7432762836185819, | |
| "eval_overall_recall": 0.8760806916426513, | |
| "eval_runtime": 0.3274, | |
| "eval_samples_per_second": 571.112, | |
| "eval_steps_per_second": 9.162, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 46.0, | |
| "grad_norm": 0.7766585946083069, | |
| "learning_rate": 2.7000000000000002e-05, | |
| "loss": 0.0614, | |
| "step": 4876 | |
| }, | |
| { | |
| "epoch": 46.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7560975609756098, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7236842105263158, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.632183908045977, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7887323943661972, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7368421052631579, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14268124103546143, | |
| "eval_overall_accuracy": 0.9612027158098934, | |
| "eval_overall_f1": 0.8221024258760108, | |
| "eval_overall_precision": 0.7721518987341772, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3351, | |
| "eval_samples_per_second": 558.121, | |
| "eval_steps_per_second": 8.954, | |
| "step": 4876 | |
| }, | |
| { | |
| "epoch": 47.0, | |
| "grad_norm": 1.664536476135254, | |
| "learning_rate": 2.6500000000000004e-05, | |
| "loss": 0.0595, | |
| "step": 4982 | |
| }, | |
| { | |
| "epoch": 47.0, | |
| "eval_LOCATION_f1": 0.7924528301886792, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7320261437908497, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6363636363636364, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8761904761904761, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8363636363636363, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7671232876712328, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8571428571428571, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8571428571428571, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.154044508934021, | |
| "eval_overall_accuracy": 0.9573229873908826, | |
| "eval_overall_f1": 0.8174603174603176, | |
| "eval_overall_precision": 0.7555012224938875, | |
| "eval_overall_recall": 0.8904899135446686, | |
| "eval_runtime": 0.334, | |
| "eval_samples_per_second": 559.845, | |
| "eval_steps_per_second": 8.981, | |
| "step": 4982 | |
| }, | |
| { | |
| "epoch": 48.0, | |
| "grad_norm": 1.3004956245422363, | |
| "learning_rate": 2.6000000000000002e-05, | |
| "loss": 0.0594, | |
| "step": 5088 | |
| }, | |
| { | |
| "epoch": 48.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7189542483660131, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.625, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8690095846645367, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1491357684135437, | |
| "eval_overall_accuracy": 0.9587778855480117, | |
| "eval_overall_f1": 0.8154050464807437, | |
| "eval_overall_precision": 0.7561576354679803, | |
| "eval_overall_recall": 0.8847262247838616, | |
| "eval_runtime": 0.3339, | |
| "eval_samples_per_second": 560.064, | |
| "eval_steps_per_second": 8.985, | |
| "step": 5088 | |
| }, | |
| { | |
| "epoch": 49.0, | |
| "grad_norm": 1.524907112121582, | |
| "learning_rate": 2.5500000000000003e-05, | |
| "loss": 0.0579, | |
| "step": 5194 | |
| }, | |
| { | |
| "epoch": 49.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.697986577181208, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6190476190476191, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8726114649681529, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7466666666666666, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14881013333797455, | |
| "eval_overall_accuracy": 0.957807953443259, | |
| "eval_overall_f1": 0.8095872170439414, | |
| "eval_overall_precision": 0.7524752475247525, | |
| "eval_overall_recall": 0.8760806916426513, | |
| "eval_runtime": 0.3328, | |
| "eval_samples_per_second": 561.968, | |
| "eval_steps_per_second": 9.016, | |
| "step": 5194 | |
| }, | |
| { | |
| "epoch": 50.0, | |
| "grad_norm": 1.4106496572494507, | |
| "learning_rate": 2.5e-05, | |
| "loss": 0.0561, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 50.0, | |
| "eval_LOCATION_f1": 0.8051948051948051, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7469879518072289, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.6933333333333334, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.611764705882353, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7887323943661972, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7368421052631579, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1435040831565857, | |
| "eval_overall_accuracy": 0.9604752667313288, | |
| "eval_overall_f1": 0.8151147098515519, | |
| "eval_overall_precision": 0.766497461928934, | |
| "eval_overall_recall": 0.8703170028818443, | |
| "eval_runtime": 0.334, | |
| "eval_samples_per_second": 559.829, | |
| "eval_steps_per_second": 8.981, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 51.0, | |
| "grad_norm": 0.9782974123954773, | |
| "learning_rate": 2.45e-05, | |
| "loss": 0.056, | |
| "step": 5406 | |
| }, | |
| { | |
| "epoch": 51.0, | |
| "eval_LOCATION_f1": 0.7924528301886792, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6891891891891891, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6144578313253012, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8670886075949367, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8253012048192772, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7777777777777778, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.717948717948718, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15163768827915192, | |
| "eval_overall_accuracy": 0.9573229873908826, | |
| "eval_overall_f1": 0.808, | |
| "eval_overall_precision": 0.7518610421836228, | |
| "eval_overall_recall": 0.8731988472622478, | |
| "eval_runtime": 0.3287, | |
| "eval_samples_per_second": 568.941, | |
| "eval_steps_per_second": 9.127, | |
| "step": 5406 | |
| }, | |
| { | |
| "epoch": 52.0, | |
| "grad_norm": 0.8598395586013794, | |
| "learning_rate": 2.4e-05, | |
| "loss": 0.0547, | |
| "step": 5512 | |
| }, | |
| { | |
| "epoch": 52.0, | |
| "eval_LOCATION_f1": 0.8051948051948051, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7469879518072289, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7019867549668873, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6162790697674418, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.870967741935484, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84375, | |
| "eval_PERSON_recall": 0.9, | |
| "eval_QUANTITY_f1": 0.7297297297297297, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6585365853658537, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15105435252189636, | |
| "eval_overall_accuracy": 0.9587778855480117, | |
| "eval_overall_f1": 0.8091397849462366, | |
| "eval_overall_precision": 0.7581863979848866, | |
| "eval_overall_recall": 0.8674351585014409, | |
| "eval_runtime": 0.3281, | |
| "eval_samples_per_second": 569.979, | |
| "eval_steps_per_second": 9.144, | |
| "step": 5512 | |
| }, | |
| { | |
| "epoch": 53.0, | |
| "grad_norm": 1.4993176460266113, | |
| "learning_rate": 2.35e-05, | |
| "loss": 0.0534, | |
| "step": 5618 | |
| }, | |
| { | |
| "epoch": 53.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.713375796178344, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6086956521739131, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8670886075949367, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8253012048192772, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7200000000000001, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16154761612415314, | |
| "eval_overall_accuracy": 0.9553831231813773, | |
| "eval_overall_f1": 0.8068331143232589, | |
| "eval_overall_precision": 0.7415458937198067, | |
| "eval_overall_recall": 0.8847262247838616, | |
| "eval_runtime": 0.334, | |
| "eval_samples_per_second": 559.852, | |
| "eval_steps_per_second": 8.982, | |
| "step": 5618 | |
| }, | |
| { | |
| "epoch": 54.0, | |
| "grad_norm": 1.0407500267028809, | |
| "learning_rate": 2.3000000000000003e-05, | |
| "loss": 0.0526, | |
| "step": 5724 | |
| }, | |
| { | |
| "epoch": 54.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7380952380952381, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.6967741935483871, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.8055555555555556, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7435897435897436, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15213675796985626, | |
| "eval_overall_accuracy": 0.9580504364694471, | |
| "eval_overall_f1": 0.8155080213903744, | |
| "eval_overall_precision": 0.7605985037406484, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3336, | |
| "eval_samples_per_second": 560.594, | |
| "eval_steps_per_second": 8.993, | |
| "step": 5724 | |
| }, | |
| { | |
| "epoch": 55.0, | |
| "grad_norm": 0.6406387686729431, | |
| "learning_rate": 2.25e-05, | |
| "loss": 0.0538, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 55.0, | |
| "eval_LOCATION_f1": 0.7875000000000001, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7078651685393258, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7051282051282052, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6043956043956044, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.6923076923076923, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15997092425823212, | |
| "eval_overall_accuracy": 0.9551406401551892, | |
| "eval_overall_f1": 0.8015768725361366, | |
| "eval_overall_precision": 0.7367149758454107, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3333, | |
| "eval_samples_per_second": 561.061, | |
| "eval_steps_per_second": 9.001, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 56.0, | |
| "grad_norm": 2.387361526489258, | |
| "learning_rate": 2.2000000000000003e-05, | |
| "loss": 0.0529, | |
| "step": 5936 | |
| }, | |
| { | |
| "epoch": 56.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7096774193548387, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6111111111111112, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8726114649681529, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7200000000000001, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1578657031059265, | |
| "eval_overall_accuracy": 0.9570805043646945, | |
| "eval_overall_f1": 0.8095238095238096, | |
| "eval_overall_precision": 0.7481662591687042, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3341, | |
| "eval_samples_per_second": 559.763, | |
| "eval_steps_per_second": 8.98, | |
| "step": 5936 | |
| }, | |
| { | |
| "epoch": 57.0, | |
| "grad_norm": 1.3003697395324707, | |
| "learning_rate": 2.15e-05, | |
| "loss": 0.05, | |
| "step": 6042 | |
| }, | |
| { | |
| "epoch": 57.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7380952380952381, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.6950354609929077, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6447368421052632, | |
| "eval_ORGANIZATION_recall": 0.7538461538461538, | |
| "eval_PERSON_f1": 0.8745980707395499, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84472049689441, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.8055555555555556, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7435897435897436, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14940249919891357, | |
| "eval_overall_accuracy": 0.9602327837051406, | |
| "eval_overall_f1": 0.8185538881309686, | |
| "eval_overall_precision": 0.7772020725388601, | |
| "eval_overall_recall": 0.8645533141210374, | |
| "eval_runtime": 0.3288, | |
| "eval_samples_per_second": 568.755, | |
| "eval_steps_per_second": 9.124, | |
| "step": 6042 | |
| }, | |
| { | |
| "epoch": 58.0, | |
| "grad_norm": 0.7399232387542725, | |
| "learning_rate": 2.1e-05, | |
| "loss": 0.0512, | |
| "step": 6148 | |
| }, | |
| { | |
| "epoch": 58.0, | |
| "eval_LOCATION_f1": 0.7948717948717949, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7294117647058823, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7042253521126761, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6493506493506493, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7887323943661972, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7368421052631579, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.14740602672100067, | |
| "eval_overall_accuracy": 0.9597478176527643, | |
| "eval_overall_f1": 0.8163265306122449, | |
| "eval_overall_precision": 0.7731958762886598, | |
| "eval_overall_recall": 0.8645533141210374, | |
| "eval_runtime": 0.334, | |
| "eval_samples_per_second": 559.957, | |
| "eval_steps_per_second": 8.983, | |
| "step": 6148 | |
| }, | |
| { | |
| "epoch": 59.0, | |
| "grad_norm": 1.4280949831008911, | |
| "learning_rate": 2.05e-05, | |
| "loss": 0.047, | |
| "step": 6254 | |
| }, | |
| { | |
| "epoch": 59.0, | |
| "eval_LOCATION_f1": 0.7848101265822784, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7126436781609196, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7248322147651007, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6428571428571429, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8782051282051282, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.845679012345679, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7777777777777778, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.717948717948718, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15319204330444336, | |
| "eval_overall_accuracy": 0.9595053346265762, | |
| "eval_overall_f1": 0.8187919463087249, | |
| "eval_overall_precision": 0.7663316582914573, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3339, | |
| "eval_samples_per_second": 559.992, | |
| "eval_steps_per_second": 8.984, | |
| "step": 6254 | |
| }, | |
| { | |
| "epoch": 60.0, | |
| "grad_norm": 1.479651689529419, | |
| "learning_rate": 2e-05, | |
| "loss": 0.047, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 60.0, | |
| "eval_LOCATION_f1": 0.7948717948717949, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7294117647058823, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7096774193548387, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6111111111111112, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.870967741935484, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84375, | |
| "eval_PERSON_recall": 0.9, | |
| "eval_QUANTITY_f1": 0.8169014084507042, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7631578947368421, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15390989184379578, | |
| "eval_overall_accuracy": 0.9590203685741998, | |
| "eval_overall_f1": 0.8176943699731903, | |
| "eval_overall_precision": 0.7644110275689223, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3333, | |
| "eval_samples_per_second": 560.986, | |
| "eval_steps_per_second": 9.0, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 61.0, | |
| "grad_norm": 0.868341326713562, | |
| "learning_rate": 1.9500000000000003e-05, | |
| "loss": 0.0465, | |
| "step": 6466 | |
| }, | |
| { | |
| "epoch": 61.0, | |
| "eval_LOCATION_f1": 0.7924528301886792, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7105263157894737, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6206896551724138, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8726114649681529, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7887323943661972, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7368421052631579, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15987202525138855, | |
| "eval_overall_accuracy": 0.9585354025218235, | |
| "eval_overall_f1": 0.816, | |
| "eval_overall_precision": 0.7593052109181141, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3345, | |
| "eval_samples_per_second": 559.074, | |
| "eval_steps_per_second": 8.969, | |
| "step": 6466 | |
| }, | |
| { | |
| "epoch": 62.0, | |
| "grad_norm": 1.9663652181625366, | |
| "learning_rate": 1.9e-05, | |
| "loss": 0.045, | |
| "step": 6572 | |
| }, | |
| { | |
| "epoch": 62.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7380952380952381, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.6973684210526315, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6091954022988506, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8753993610223643, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8404907975460123, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.8055555555555556, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7435897435897436, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1569298505783081, | |
| "eval_overall_accuracy": 0.9595053346265762, | |
| "eval_overall_f1": 0.8176943699731903, | |
| "eval_overall_precision": 0.7644110275689223, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3337, | |
| "eval_samples_per_second": 560.452, | |
| "eval_steps_per_second": 8.991, | |
| "step": 6572 | |
| }, | |
| { | |
| "epoch": 63.0, | |
| "grad_norm": 4.453447341918945, | |
| "learning_rate": 1.85e-05, | |
| "loss": 0.0468, | |
| "step": 6678 | |
| }, | |
| { | |
| "epoch": 63.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7560975609756098, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7114093959731543, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6309523809523809, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.870967741935484, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84375, | |
| "eval_PERSON_recall": 0.9, | |
| "eval_QUANTITY_f1": 0.7887323943661972, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7368421052631579, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1518780142068863, | |
| "eval_overall_accuracy": 0.9612027158098934, | |
| "eval_overall_f1": 0.8195386702849389, | |
| "eval_overall_precision": 0.7743589743589744, | |
| "eval_overall_recall": 0.8703170028818443, | |
| "eval_runtime": 0.334, | |
| "eval_samples_per_second": 559.932, | |
| "eval_steps_per_second": 8.983, | |
| "step": 6678 | |
| }, | |
| { | |
| "epoch": 64.0, | |
| "grad_norm": 0.6715424656867981, | |
| "learning_rate": 1.8e-05, | |
| "loss": 0.0446, | |
| "step": 6784 | |
| }, | |
| { | |
| "epoch": 64.0, | |
| "eval_LOCATION_f1": 0.7922077922077921, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7349397590361446, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7272727272727272, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8782051282051282, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.845679012345679, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7605633802816901, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7105263157894737, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.15471045672893524, | |
| "eval_overall_accuracy": 0.9609602327837051, | |
| "eval_overall_f1": 0.8201634877384196, | |
| "eval_overall_precision": 0.7777777777777778, | |
| "eval_overall_recall": 0.8674351585014409, | |
| "eval_runtime": 0.3347, | |
| "eval_samples_per_second": 558.627, | |
| "eval_steps_per_second": 8.962, | |
| "step": 6784 | |
| }, | |
| { | |
| "epoch": 65.0, | |
| "grad_norm": 1.4069435596466064, | |
| "learning_rate": 1.75e-05, | |
| "loss": 0.0452, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 65.0, | |
| "eval_LOCATION_f1": 0.7948717948717949, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7294117647058823, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7051282051282052, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6043956043956044, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8810289389067525, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8509316770186336, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7567567567567567, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6829268292682927, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16312921047210693, | |
| "eval_overall_accuracy": 0.9575654704170709, | |
| "eval_overall_f1": 0.8149134487350199, | |
| "eval_overall_precision": 0.7574257425742574, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3332, | |
| "eval_samples_per_second": 561.176, | |
| "eval_steps_per_second": 9.003, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 66.0, | |
| "grad_norm": 0.9711624383926392, | |
| "learning_rate": 1.7000000000000003e-05, | |
| "loss": 0.0442, | |
| "step": 6996 | |
| }, | |
| { | |
| "epoch": 66.0, | |
| "eval_LOCATION_f1": 0.7948717948717949, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7294117647058823, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7051282051282052, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6043956043956044, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8838709677419355, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.85625, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1615941822528839, | |
| "eval_overall_accuracy": 0.957807953443259, | |
| "eval_overall_f1": 0.8175765645805593, | |
| "eval_overall_precision": 0.7599009900990099, | |
| "eval_overall_recall": 0.8847262247838616, | |
| "eval_runtime": 0.3281, | |
| "eval_samples_per_second": 569.904, | |
| "eval_steps_per_second": 9.143, | |
| "step": 6996 | |
| }, | |
| { | |
| "epoch": 67.0, | |
| "grad_norm": 0.3948928415775299, | |
| "learning_rate": 1.65e-05, | |
| "loss": 0.0431, | |
| "step": 7102 | |
| }, | |
| { | |
| "epoch": 67.0, | |
| "eval_LOCATION_f1": 0.7898089171974522, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7209302325581395, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7019867549668873, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6162790697674418, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8690095846645367, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16082525253295898, | |
| "eval_overall_accuracy": 0.9582929194956353, | |
| "eval_overall_f1": 0.8117489986648865, | |
| "eval_overall_precision": 0.7562189054726368, | |
| "eval_overall_recall": 0.8760806916426513, | |
| "eval_runtime": 0.3276, | |
| "eval_samples_per_second": 570.856, | |
| "eval_steps_per_second": 9.158, | |
| "step": 7102 | |
| }, | |
| { | |
| "epoch": 68.0, | |
| "grad_norm": 1.975942611694336, | |
| "learning_rate": 1.6000000000000003e-05, | |
| "loss": 0.0427, | |
| "step": 7208 | |
| }, | |
| { | |
| "epoch": 68.0, | |
| "eval_LOCATION_f1": 0.7924528301886792, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7142857142857143, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6179775280898876, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8690095846645367, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7012987012987013, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6136363636363636, | |
| "eval_QUANTITY_recall": 0.8181818181818182, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16873115301132202, | |
| "eval_overall_accuracy": 0.9556256062075654, | |
| "eval_overall_f1": 0.8047493403693932, | |
| "eval_overall_precision": 0.7420924574209246, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.333, | |
| "eval_samples_per_second": 561.488, | |
| "eval_steps_per_second": 9.008, | |
| "step": 7208 | |
| }, | |
| { | |
| "epoch": 69.0, | |
| "grad_norm": 0.47350606322288513, | |
| "learning_rate": 1.55e-05, | |
| "loss": 0.043, | |
| "step": 7314 | |
| }, | |
| { | |
| "epoch": 69.0, | |
| "eval_LOCATION_f1": 0.7924528301886792, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7012987012987013, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6067415730337079, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7945205479452054, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.725, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16365033388137817, | |
| "eval_overall_accuracy": 0.9573229873908826, | |
| "eval_overall_f1": 0.8138297872340426, | |
| "eval_overall_precision": 0.7555555555555555, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3339, | |
| "eval_samples_per_second": 560.112, | |
| "eval_steps_per_second": 8.986, | |
| "step": 7314 | |
| }, | |
| { | |
| "epoch": 70.0, | |
| "grad_norm": 0.45649945735931396, | |
| "learning_rate": 1.5e-05, | |
| "loss": 0.0426, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 70.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7058823529411765, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6136363636363636, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7945205479452054, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.725, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16292014718055725, | |
| "eval_overall_accuracy": 0.9580504364694471, | |
| "eval_overall_f1": 0.816, | |
| "eval_overall_precision": 0.7593052109181141, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3349, | |
| "eval_samples_per_second": 558.384, | |
| "eval_steps_per_second": 8.958, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 71.0, | |
| "grad_norm": 2.033871650695801, | |
| "learning_rate": 1.45e-05, | |
| "loss": 0.0439, | |
| "step": 7526 | |
| }, | |
| { | |
| "epoch": 71.0, | |
| "eval_LOCATION_f1": 0.775, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.6966292134831461, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7080745341614907, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.59375, | |
| "eval_ORGANIZATION_recall": 0.8769230769230769, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7631578947368421, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6744186046511628, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1787422150373459, | |
| "eval_overall_accuracy": 0.9541707080504365, | |
| "eval_overall_f1": 0.81151832460733, | |
| "eval_overall_precision": 0.7434052757793765, | |
| "eval_overall_recall": 0.8933717579250721, | |
| "eval_runtime": 0.3334, | |
| "eval_samples_per_second": 560.921, | |
| "eval_steps_per_second": 8.999, | |
| "step": 7526 | |
| }, | |
| { | |
| "epoch": 72.0, | |
| "grad_norm": 1.839992642402649, | |
| "learning_rate": 1.4000000000000001e-05, | |
| "loss": 0.0409, | |
| "step": 7632 | |
| }, | |
| { | |
| "epoch": 72.0, | |
| "eval_LOCATION_f1": 0.7922077922077921, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7349397590361446, | |
| "eval_LOCATION_recall": 0.8591549295774648, | |
| "eval_ORGANIZATION_f1": 0.7105263157894737, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6206896551724138, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8745980707395499, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84472049689441, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7945205479452054, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.725, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16144876182079315, | |
| "eval_overall_accuracy": 0.9590203685741998, | |
| "eval_overall_f1": 0.8172043010752689, | |
| "eval_overall_precision": 0.7657430730478589, | |
| "eval_overall_recall": 0.8760806916426513, | |
| "eval_runtime": 0.3281, | |
| "eval_samples_per_second": 570.003, | |
| "eval_steps_per_second": 9.144, | |
| "step": 7632 | |
| }, | |
| { | |
| "epoch": 73.0, | |
| "grad_norm": 0.7383960485458374, | |
| "learning_rate": 1.3500000000000001e-05, | |
| "loss": 0.0404, | |
| "step": 7738 | |
| }, | |
| { | |
| "epoch": 73.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6928104575163399, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6022727272727273, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16545303165912628, | |
| "eval_overall_accuracy": 0.957807953443259, | |
| "eval_overall_f1": 0.8122503328894807, | |
| "eval_overall_precision": 0.754950495049505, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3344, | |
| "eval_samples_per_second": 559.187, | |
| "eval_steps_per_second": 8.971, | |
| "step": 7738 | |
| }, | |
| { | |
| "epoch": 74.0, | |
| "grad_norm": 1.1772239208221436, | |
| "learning_rate": 1.3000000000000001e-05, | |
| "loss": 0.0399, | |
| "step": 7844 | |
| }, | |
| { | |
| "epoch": 74.0, | |
| "eval_LOCATION_f1": 0.8076923076923077, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7411764705882353, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6883116883116883, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5955056179775281, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16691727936267853, | |
| "eval_overall_accuracy": 0.9585354025218235, | |
| "eval_overall_f1": 0.8133333333333335, | |
| "eval_overall_precision": 0.7568238213399504, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3273, | |
| "eval_samples_per_second": 571.302, | |
| "eval_steps_per_second": 9.165, | |
| "step": 7844 | |
| }, | |
| { | |
| "epoch": 75.0, | |
| "grad_norm": 0.3011506497859955, | |
| "learning_rate": 1.25e-05, | |
| "loss": 0.04, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 75.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7105263157894737, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6206896551724138, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8774193548387097, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.85, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16395699977874756, | |
| "eval_overall_accuracy": 0.9582929194956353, | |
| "eval_overall_f1": 0.8181818181818181, | |
| "eval_overall_precision": 0.7630922693266833, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3336, | |
| "eval_samples_per_second": 560.492, | |
| "eval_steps_per_second": 8.992, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 76.0, | |
| "grad_norm": 1.2410697937011719, | |
| "learning_rate": 1.2e-05, | |
| "loss": 0.0402, | |
| "step": 8056 | |
| }, | |
| { | |
| "epoch": 76.0, | |
| "eval_LOCATION_f1": 0.7924528301886792, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7012987012987013, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6067415730337079, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16832870244979858, | |
| "eval_overall_accuracy": 0.957807953443259, | |
| "eval_overall_f1": 0.8127490039840637, | |
| "eval_overall_precision": 0.7536945812807881, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3277, | |
| "eval_samples_per_second": 570.614, | |
| "eval_steps_per_second": 9.154, | |
| "step": 8056 | |
| }, | |
| { | |
| "epoch": 77.0, | |
| "grad_norm": 1.8908904790878296, | |
| "learning_rate": 1.1500000000000002e-05, | |
| "loss": 0.0402, | |
| "step": 8162 | |
| }, | |
| { | |
| "epoch": 77.0, | |
| "eval_LOCATION_f1": 0.7875000000000001, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7078651685393258, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7066666666666667, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6235294117647059, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8690095846645367, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7567567567567567, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6829268292682927, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17024052143096924, | |
| "eval_overall_accuracy": 0.9575654704170709, | |
| "eval_overall_f1": 0.8095872170439414, | |
| "eval_overall_precision": 0.7524752475247525, | |
| "eval_overall_recall": 0.8760806916426513, | |
| "eval_runtime": 0.3331, | |
| "eval_samples_per_second": 561.412, | |
| "eval_steps_per_second": 9.007, | |
| "step": 8162 | |
| }, | |
| { | |
| "epoch": 78.0, | |
| "grad_norm": 0.9162412881851196, | |
| "learning_rate": 1.1000000000000001e-05, | |
| "loss": 0.0379, | |
| "step": 8268 | |
| }, | |
| { | |
| "epoch": 78.0, | |
| "eval_LOCATION_f1": 0.7924528301886792, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6928104575163399, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6022727272727273, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8653846153846153, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8333333333333334, | |
| "eval_PERSON_recall": 0.9, | |
| "eval_QUANTITY_f1": 0.7945205479452054, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.725, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16936184465885162, | |
| "eval_overall_accuracy": 0.9582929194956353, | |
| "eval_overall_f1": 0.8095872170439414, | |
| "eval_overall_precision": 0.7524752475247525, | |
| "eval_overall_recall": 0.8760806916426513, | |
| "eval_runtime": 0.3269, | |
| "eval_samples_per_second": 572.008, | |
| "eval_steps_per_second": 9.177, | |
| "step": 8268 | |
| }, | |
| { | |
| "epoch": 79.0, | |
| "grad_norm": 0.6435752511024475, | |
| "learning_rate": 1.05e-05, | |
| "loss": 0.0371, | |
| "step": 8374 | |
| }, | |
| { | |
| "epoch": 79.0, | |
| "eval_LOCATION_f1": 0.7924528301886792, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6883116883116883, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5955056179775281, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8810289389067525, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8509316770186336, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7567567567567567, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6829268292682927, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1731194704771042, | |
| "eval_overall_accuracy": 0.9575654704170709, | |
| "eval_overall_f1": 0.8100929614873836, | |
| "eval_overall_precision": 0.7512315270935961, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3342, | |
| "eval_samples_per_second": 559.625, | |
| "eval_steps_per_second": 8.978, | |
| "step": 8374 | |
| }, | |
| { | |
| "epoch": 80.0, | |
| "grad_norm": 0.5504117608070374, | |
| "learning_rate": 1e-05, | |
| "loss": 0.0375, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 80.0, | |
| "eval_LOCATION_f1": 0.8025477707006369, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7325581395348837, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6883116883116883, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5955056179775281, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8810289389067525, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8509316770186336, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7671232876712328, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17014098167419434, | |
| "eval_overall_accuracy": 0.9575654704170709, | |
| "eval_overall_f1": 0.8144192256341789, | |
| "eval_overall_precision": 0.7587064676616916, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3341, | |
| "eval_samples_per_second": 559.673, | |
| "eval_steps_per_second": 8.979, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 81.0, | |
| "grad_norm": 0.46581876277923584, | |
| "learning_rate": 9.5e-06, | |
| "loss": 0.0367, | |
| "step": 8586 | |
| }, | |
| { | |
| "epoch": 81.0, | |
| "eval_LOCATION_f1": 0.7898089171974522, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7209302325581395, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.6883116883116883, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5955056179775281, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8726114649681529, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16831910610198975, | |
| "eval_overall_accuracy": 0.9575654704170709, | |
| "eval_overall_f1": 0.8100929614873836, | |
| "eval_overall_precision": 0.7512315270935961, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3339, | |
| "eval_samples_per_second": 560.13, | |
| "eval_steps_per_second": 8.986, | |
| "step": 8586 | |
| }, | |
| { | |
| "epoch": 82.0, | |
| "grad_norm": 1.1437621116638184, | |
| "learning_rate": 9e-06, | |
| "loss": 0.0369, | |
| "step": 8692 | |
| }, | |
| { | |
| "epoch": 82.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6794871794871795, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5824175824175825, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17457380890846252, | |
| "eval_overall_accuracy": 0.9570805043646945, | |
| "eval_overall_f1": 0.8132450331125827, | |
| "eval_overall_precision": 0.7524509803921569, | |
| "eval_overall_recall": 0.8847262247838616, | |
| "eval_runtime": 0.3282, | |
| "eval_samples_per_second": 569.833, | |
| "eval_steps_per_second": 9.142, | |
| "step": 8692 | |
| }, | |
| { | |
| "epoch": 83.0, | |
| "grad_norm": 1.673567771911621, | |
| "learning_rate": 8.500000000000002e-06, | |
| "loss": 0.0382, | |
| "step": 8798 | |
| }, | |
| { | |
| "epoch": 83.0, | |
| "eval_LOCATION_f1": 0.7848101265822784, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7126436781609196, | |
| "eval_LOCATION_recall": 0.8732394366197183, | |
| "eval_ORGANIZATION_f1": 0.7019867549668873, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6162790697674418, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8690095846645367, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16617552936077118, | |
| "eval_overall_accuracy": 0.9580504364694471, | |
| "eval_overall_f1": 0.8106666666666668, | |
| "eval_overall_precision": 0.7543424317617866, | |
| "eval_overall_recall": 0.8760806916426513, | |
| "eval_runtime": 0.334, | |
| "eval_samples_per_second": 559.883, | |
| "eval_steps_per_second": 8.982, | |
| "step": 8798 | |
| }, | |
| { | |
| "epoch": 84.0, | |
| "grad_norm": 0.8704581260681152, | |
| "learning_rate": 8.000000000000001e-06, | |
| "loss": 0.0376, | |
| "step": 8904 | |
| }, | |
| { | |
| "epoch": 84.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6973684210526315, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6091954022988506, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8782051282051282, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.845679012345679, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7567567567567567, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.6829268292682927, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16935382783412933, | |
| "eval_overall_accuracy": 0.9582929194956353, | |
| "eval_overall_f1": 0.8133333333333335, | |
| "eval_overall_precision": 0.7568238213399504, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3338, | |
| "eval_samples_per_second": 560.19, | |
| "eval_steps_per_second": 8.987, | |
| "step": 8904 | |
| }, | |
| { | |
| "epoch": 85.0, | |
| "grad_norm": 2.838458299636841, | |
| "learning_rate": 7.5e-06, | |
| "loss": 0.0372, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 85.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7006369426751592, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5978260869565217, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8810289389067525, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8509316770186336, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7671232876712328, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7, | |
| "eval_QUANTITY_recall": 0.8484848484848485, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17407700419425964, | |
| "eval_overall_accuracy": 0.9570805043646945, | |
| "eval_overall_f1": 0.8143236074270557, | |
| "eval_overall_precision": 0.7542997542997543, | |
| "eval_overall_recall": 0.8847262247838616, | |
| "eval_runtime": 0.3291, | |
| "eval_samples_per_second": 568.226, | |
| "eval_steps_per_second": 9.116, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 86.0, | |
| "grad_norm": 0.5828319191932678, | |
| "learning_rate": 7.000000000000001e-06, | |
| "loss": 0.0351, | |
| "step": 9116 | |
| }, | |
| { | |
| "epoch": 86.0, | |
| "eval_LOCATION_f1": 0.7924528301886792, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6928104575163399, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6022727272727273, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8745980707395499, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84472049689441, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17182248830795288, | |
| "eval_overall_accuracy": 0.957807953443259, | |
| "eval_overall_f1": 0.8111702127659575, | |
| "eval_overall_precision": 0.7530864197530864, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3342, | |
| "eval_samples_per_second": 559.566, | |
| "eval_steps_per_second": 8.977, | |
| "step": 9116 | |
| }, | |
| { | |
| "epoch": 87.0, | |
| "grad_norm": 0.9350789189338684, | |
| "learning_rate": 6.5000000000000004e-06, | |
| "loss": 0.0348, | |
| "step": 9222 | |
| }, | |
| { | |
| "epoch": 87.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6838709677419356, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5888888888888889, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17128072679042816, | |
| "eval_overall_accuracy": 0.9580504364694471, | |
| "eval_overall_f1": 0.8100929614873836, | |
| "eval_overall_precision": 0.7512315270935961, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3342, | |
| "eval_samples_per_second": 559.586, | |
| "eval_steps_per_second": 8.977, | |
| "step": 9222 | |
| }, | |
| { | |
| "epoch": 88.0, | |
| "grad_norm": 1.2203199863433838, | |
| "learning_rate": 6e-06, | |
| "loss": 0.0363, | |
| "step": 9328 | |
| }, | |
| { | |
| "epoch": 88.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6973684210526315, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6091954022988506, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8745980707395499, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84472049689441, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17074672877788544, | |
| "eval_overall_accuracy": 0.9585354025218235, | |
| "eval_overall_f1": 0.8144192256341789, | |
| "eval_overall_precision": 0.7587064676616916, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3335, | |
| "eval_samples_per_second": 560.724, | |
| "eval_steps_per_second": 8.996, | |
| "step": 9328 | |
| }, | |
| { | |
| "epoch": 89.0, | |
| "grad_norm": 0.67624431848526, | |
| "learning_rate": 5.500000000000001e-06, | |
| "loss": 0.0371, | |
| "step": 9434 | |
| }, | |
| { | |
| "epoch": 89.0, | |
| "eval_LOCATION_f1": 0.7924528301886792, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6883116883116883, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5955056179775281, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8753993610223643, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8404907975460123, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17176063358783722, | |
| "eval_overall_accuracy": 0.9575654704170709, | |
| "eval_overall_f1": 0.8116710875331565, | |
| "eval_overall_precision": 0.7518427518427518, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.327, | |
| "eval_samples_per_second": 571.803, | |
| "eval_steps_per_second": 9.173, | |
| "step": 9434 | |
| }, | |
| { | |
| "epoch": 90.0, | |
| "grad_norm": 1.9259661436080933, | |
| "learning_rate": 5e-06, | |
| "loss": 0.0367, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 90.0, | |
| "eval_LOCATION_f1": 0.8025477707006369, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7325581395348837, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6973684210526315, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6091954022988506, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.887459807073955, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8571428571428571, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17073224484920502, | |
| "eval_overall_accuracy": 0.9590203685741998, | |
| "eval_overall_f1": 0.820855614973262, | |
| "eval_overall_precision": 0.7655860349127181, | |
| "eval_overall_recall": 0.8847262247838616, | |
| "eval_runtime": 0.3283, | |
| "eval_samples_per_second": 569.578, | |
| "eval_steps_per_second": 9.138, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 91.0, | |
| "grad_norm": 0.5366353392601013, | |
| "learning_rate": 4.5e-06, | |
| "loss": 0.0349, | |
| "step": 9646 | |
| }, | |
| { | |
| "epoch": 91.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7096774193548387, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6111111111111112, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8717948717948718, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17369931936264038, | |
| "eval_overall_accuracy": 0.957807953443259, | |
| "eval_overall_f1": 0.8154050464807437, | |
| "eval_overall_precision": 0.7561576354679803, | |
| "eval_overall_recall": 0.8847262247838616, | |
| "eval_runtime": 0.3271, | |
| "eval_samples_per_second": 571.651, | |
| "eval_steps_per_second": 9.171, | |
| "step": 9646 | |
| }, | |
| { | |
| "epoch": 92.0, | |
| "grad_norm": 0.7619331479072571, | |
| "learning_rate": 4.000000000000001e-06, | |
| "loss": 0.0357, | |
| "step": 9752 | |
| }, | |
| { | |
| "epoch": 92.0, | |
| "eval_LOCATION_f1": 0.8025477707006369, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7325581395348837, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7066666666666667, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6235294117647059, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8782051282051282, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.845679012345679, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.16904906928539276, | |
| "eval_overall_accuracy": 0.9590203685741998, | |
| "eval_overall_f1": 0.8192771084337349, | |
| "eval_overall_precision": 0.765, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3276, | |
| "eval_samples_per_second": 570.837, | |
| "eval_steps_per_second": 9.158, | |
| "step": 9752 | |
| }, | |
| { | |
| "epoch": 93.0, | |
| "grad_norm": 0.7772564888000488, | |
| "learning_rate": 3.5000000000000004e-06, | |
| "loss": 0.0345, | |
| "step": 9858 | |
| }, | |
| { | |
| "epoch": 93.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.7019867549668873, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6162790697674418, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8782051282051282, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.845679012345679, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17138922214508057, | |
| "eval_overall_accuracy": 0.9585354025218235, | |
| "eval_overall_f1": 0.8170894526034712, | |
| "eval_overall_precision": 0.7611940298507462, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3295, | |
| "eval_samples_per_second": 567.54, | |
| "eval_steps_per_second": 9.105, | |
| "step": 9858 | |
| }, | |
| { | |
| "epoch": 94.0, | |
| "grad_norm": 1.5932378768920898, | |
| "learning_rate": 3e-06, | |
| "loss": 0.0349, | |
| "step": 9964 | |
| }, | |
| { | |
| "epoch": 94.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6838709677419356, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5888888888888889, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8810289389067525, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8509316770186336, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1765890270471573, | |
| "eval_overall_accuracy": 0.9575654704170709, | |
| "eval_overall_f1": 0.8138297872340426, | |
| "eval_overall_precision": 0.7555555555555555, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3276, | |
| "eval_samples_per_second": 570.847, | |
| "eval_steps_per_second": 9.158, | |
| "step": 9964 | |
| }, | |
| { | |
| "epoch": 95.0, | |
| "grad_norm": 0.8269696235656738, | |
| "learning_rate": 2.5e-06, | |
| "loss": 0.0352, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 95.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6838709677419356, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5888888888888889, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8810289389067525, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8509316770186336, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.8727272727272727, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17644113302230835, | |
| "eval_overall_accuracy": 0.9575654704170709, | |
| "eval_overall_f1": 0.8127490039840637, | |
| "eval_overall_precision": 0.7536945812807881, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3293, | |
| "eval_samples_per_second": 567.897, | |
| "eval_steps_per_second": 9.111, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 96.0, | |
| "grad_norm": 1.2851319313049316, | |
| "learning_rate": 2.0000000000000003e-06, | |
| "loss": 0.0367, | |
| "step": 10176 | |
| }, | |
| { | |
| "epoch": 96.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6973684210526315, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6091954022988506, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8782051282051282, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.845679012345679, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17299894988536835, | |
| "eval_overall_accuracy": 0.9582929194956353, | |
| "eval_overall_f1": 0.816, | |
| "eval_overall_precision": 0.7593052109181141, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3337, | |
| "eval_samples_per_second": 560.433, | |
| "eval_steps_per_second": 8.991, | |
| "step": 10176 | |
| }, | |
| { | |
| "epoch": 97.0, | |
| "grad_norm": 1.469909906387329, | |
| "learning_rate": 1.5e-06, | |
| "loss": 0.0352, | |
| "step": 10282 | |
| }, | |
| { | |
| "epoch": 97.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6928104575163399, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6022727272727273, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8838709677419355, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.85625, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1724460870027542, | |
| "eval_overall_accuracy": 0.9580504364694471, | |
| "eval_overall_f1": 0.8170894526034712, | |
| "eval_overall_precision": 0.7611940298507462, | |
| "eval_overall_recall": 0.8818443804034583, | |
| "eval_runtime": 0.3335, | |
| "eval_samples_per_second": 560.658, | |
| "eval_steps_per_second": 8.995, | |
| "step": 10282 | |
| }, | |
| { | |
| "epoch": 98.0, | |
| "grad_norm": 0.9896478652954102, | |
| "learning_rate": 1.0000000000000002e-06, | |
| "loss": 0.0341, | |
| "step": 10388 | |
| }, | |
| { | |
| "epoch": 98.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6794871794871795, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5824175824175825, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8745980707395499, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84472049689441, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.1747630089521408, | |
| "eval_overall_accuracy": 0.9570805043646945, | |
| "eval_overall_f1": 0.8100929614873836, | |
| "eval_overall_precision": 0.7512315270935961, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3347, | |
| "eval_samples_per_second": 558.646, | |
| "eval_steps_per_second": 8.962, | |
| "step": 10388 | |
| }, | |
| { | |
| "epoch": 99.0, | |
| "grad_norm": 1.395708441734314, | |
| "learning_rate": 5.000000000000001e-07, | |
| "loss": 0.0331, | |
| "step": 10494 | |
| }, | |
| { | |
| "epoch": 99.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6928104575163399, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6022727272727273, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8745980707395499, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84472049689441, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17256887257099152, | |
| "eval_overall_accuracy": 0.9580504364694471, | |
| "eval_overall_f1": 0.8133333333333335, | |
| "eval_overall_precision": 0.7568238213399504, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.3341, | |
| "eval_samples_per_second": 559.765, | |
| "eval_steps_per_second": 8.98, | |
| "step": 10494 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "grad_norm": 0.4935811758041382, | |
| "learning_rate": 0.0, | |
| "loss": 0.0347, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "eval_LOCATION_f1": 0.7974683544303797, | |
| "eval_LOCATION_number": 71, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.8873239436619719, | |
| "eval_ORGANIZATION_f1": 0.6928104575163399, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6022727272727273, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8745980707395499, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.84472049689441, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7837837837837839, | |
| "eval_QUANTITY_number": 33, | |
| "eval_QUANTITY_precision": 0.7073170731707317, | |
| "eval_QUANTITY_recall": 0.8787878787878788, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 28, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.8571428571428571, | |
| "eval_loss": 0.17283295094966888, | |
| "eval_overall_accuracy": 0.9580504364694471, | |
| "eval_overall_f1": 0.8133333333333335, | |
| "eval_overall_precision": 0.7568238213399504, | |
| "eval_overall_recall": 0.8789625360230547, | |
| "eval_runtime": 0.336, | |
| "eval_samples_per_second": 556.513, | |
| "eval_steps_per_second": 8.928, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "step": 10600, | |
| "total_flos": 4639858441347408.0, | |
| "train_loss": 0.08816910017211482, | |
| "train_runtime": 623.006, | |
| "train_samples_per_second": 270.944, | |
| "train_steps_per_second": 17.014 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 10600, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 100, | |
| "save_steps": 500, | |
| "total_flos": 4639858441347408.0, | |
| "train_batch_size": 16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |