| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 100.0, | |
| "eval_steps": 500, | |
| "global_step": 10600, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "grad_norm": 1.5824520587921143, | |
| "learning_rate": 4.9500000000000004e-05, | |
| "loss": 0.9315, | |
| "step": 106 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_LOCATION_f1": 0.0, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.0, | |
| "eval_LOCATION_recall": 0.0, | |
| "eval_ORGANIZATION_f1": 0.0, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.0, | |
| "eval_ORGANIZATION_recall": 0.0, | |
| "eval_PERSON_f1": 0.012987012987012988, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.25, | |
| "eval_PERSON_recall": 0.006666666666666667, | |
| "eval_QUANTITY_f1": 0.0, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.0, | |
| "eval_QUANTITY_recall": 0.0, | |
| "eval_TIME_f1": 0.0, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.0, | |
| "eval_TIME_recall": 0.0, | |
| "eval_loss": 0.6119179725646973, | |
| "eval_overall_accuracy": 0.8370662072360325, | |
| "eval_overall_f1": 0.005633802816901409, | |
| "eval_overall_precision": 0.25, | |
| "eval_overall_recall": 0.002849002849002849, | |
| "eval_runtime": 0.3369, | |
| "eval_samples_per_second": 555.024, | |
| "eval_steps_per_second": 8.904, | |
| "step": 106 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "grad_norm": 1.5226932764053345, | |
| "learning_rate": 4.9e-05, | |
| "loss": 0.5353, | |
| "step": 212 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_LOCATION_f1": 0.40983606557377056, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.5102040816326531, | |
| "eval_LOCATION_recall": 0.3424657534246575, | |
| "eval_ORGANIZATION_f1": 0.08695652173913043, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.1, | |
| "eval_ORGANIZATION_recall": 0.07692307692307693, | |
| "eval_PERSON_f1": 0.574468085106383, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.4778761061946903, | |
| "eval_PERSON_recall": 0.72, | |
| "eval_QUANTITY_f1": 0.0, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.0, | |
| "eval_QUANTITY_recall": 0.0, | |
| "eval_TIME_f1": 0.5483870967741935, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.6071428571428571, | |
| "eval_TIME_recall": 0.5, | |
| "eval_loss": 0.411459743976593, | |
| "eval_overall_accuracy": 0.8924440068914595, | |
| "eval_overall_f1": 0.4397163120567376, | |
| "eval_overall_precision": 0.4378531073446328, | |
| "eval_overall_recall": 0.4415954415954416, | |
| "eval_runtime": 0.3252, | |
| "eval_samples_per_second": 574.99, | |
| "eval_steps_per_second": 9.224, | |
| "step": 212 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "grad_norm": 1.2673431634902954, | |
| "learning_rate": 4.85e-05, | |
| "loss": 0.3686, | |
| "step": 318 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_LOCATION_f1": 0.5747126436781609, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.49504950495049505, | |
| "eval_LOCATION_recall": 0.684931506849315, | |
| "eval_ORGANIZATION_f1": 0.45528455284552843, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.4827586206896552, | |
| "eval_ORGANIZATION_recall": 0.4307692307692308, | |
| "eval_PERSON_f1": 0.7507163323782233, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.6582914572864321, | |
| "eval_PERSON_recall": 0.8733333333333333, | |
| "eval_QUANTITY_f1": 0.3934426229508197, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.375, | |
| "eval_QUANTITY_recall": 0.41379310344827586, | |
| "eval_TIME_f1": 0.8115942028985507, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.8235294117647058, | |
| "eval_loss": 0.29026341438293457, | |
| "eval_overall_accuracy": 0.9288702928870293, | |
| "eval_overall_f1": 0.6417525773195876, | |
| "eval_overall_precision": 0.5858823529411765, | |
| "eval_overall_recall": 0.7094017094017094, | |
| "eval_runtime": 0.3326, | |
| "eval_samples_per_second": 562.209, | |
| "eval_steps_per_second": 9.019, | |
| "step": 318 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "grad_norm": 1.4100310802459717, | |
| "learning_rate": 4.8e-05, | |
| "loss": 0.2668, | |
| "step": 424 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_LOCATION_f1": 0.5664739884393063, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.49, | |
| "eval_LOCATION_recall": 0.6712328767123288, | |
| "eval_ORGANIZATION_f1": 0.4878048780487805, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5172413793103449, | |
| "eval_ORGANIZATION_recall": 0.46153846153846156, | |
| "eval_PERSON_f1": 0.8246153846153845, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.7657142857142857, | |
| "eval_PERSON_recall": 0.8933333333333333, | |
| "eval_QUANTITY_f1": 0.5245901639344263, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.5, | |
| "eval_QUANTITY_recall": 0.5517241379310345, | |
| "eval_TIME_f1": 0.8823529411764706, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.8823529411764706, | |
| "eval_TIME_recall": 0.8823529411764706, | |
| "eval_loss": 0.207948699593544, | |
| "eval_overall_accuracy": 0.9401919763721388, | |
| "eval_overall_f1": 0.6906666666666667, | |
| "eval_overall_precision": 0.6491228070175439, | |
| "eval_overall_recall": 0.7378917378917379, | |
| "eval_runtime": 0.3333, | |
| "eval_samples_per_second": 560.99, | |
| "eval_steps_per_second": 9.0, | |
| "step": 424 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "grad_norm": 2.0687103271484375, | |
| "learning_rate": 4.75e-05, | |
| "loss": 0.2091, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_LOCATION_f1": 0.7195121951219512, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.6483516483516484, | |
| "eval_LOCATION_recall": 0.8082191780821918, | |
| "eval_ORGANIZATION_f1": 0.5714285714285715, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5588235294117647, | |
| "eval_ORGANIZATION_recall": 0.5846153846153846, | |
| "eval_PERSON_f1": 0.8369230769230769, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.7771428571428571, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.5846153846153845, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.5277777777777778, | |
| "eval_QUANTITY_recall": 0.6551724137931034, | |
| "eval_TIME_f1": 0.8333333333333333, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7894736842105263, | |
| "eval_TIME_recall": 0.8823529411764706, | |
| "eval_loss": 0.17728105187416077, | |
| "eval_overall_accuracy": 0.9451144474526212, | |
| "eval_overall_f1": 0.7430830039525692, | |
| "eval_overall_precision": 0.6911764705882353, | |
| "eval_overall_recall": 0.8034188034188035, | |
| "eval_runtime": 0.3284, | |
| "eval_samples_per_second": 569.476, | |
| "eval_steps_per_second": 9.136, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "grad_norm": 2.4117839336395264, | |
| "learning_rate": 4.7e-05, | |
| "loss": 0.1833, | |
| "step": 636 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_LOCATION_f1": 0.6971428571428572, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.5980392156862745, | |
| "eval_LOCATION_recall": 0.8356164383561644, | |
| "eval_ORGANIZATION_f1": 0.5818181818181819, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.48, | |
| "eval_ORGANIZATION_recall": 0.7384615384615385, | |
| "eval_PERSON_f1": 0.8353658536585366, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.7696629213483146, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.5555555555555556, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.46511627906976744, | |
| "eval_QUANTITY_recall": 0.6896551724137931, | |
| "eval_TIME_f1": 0.7837837837837837, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.725, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.189751997590065, | |
| "eval_overall_accuracy": 0.9424070883583558, | |
| "eval_overall_f1": 0.7248157248157246, | |
| "eval_overall_precision": 0.6371490280777538, | |
| "eval_overall_recall": 0.8404558404558404, | |
| "eval_runtime": 0.3281, | |
| "eval_samples_per_second": 569.94, | |
| "eval_steps_per_second": 9.143, | |
| "step": 636 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "grad_norm": 1.2822880744934082, | |
| "learning_rate": 4.6500000000000005e-05, | |
| "loss": 0.1653, | |
| "step": 742 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_LOCATION_f1": 0.7607361963190183, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.6888888888888889, | |
| "eval_LOCATION_recall": 0.8493150684931506, | |
| "eval_ORGANIZATION_f1": 0.5857142857142857, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5466666666666666, | |
| "eval_ORGANIZATION_recall": 0.6307692307692307, | |
| "eval_PERSON_f1": 0.8616352201257862, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8154761904761905, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.6666666666666667, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.5945945945945946, | |
| "eval_QUANTITY_recall": 0.7586206896551724, | |
| "eval_TIME_f1": 0.8450704225352113, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.8108108108108109, | |
| "eval_TIME_recall": 0.8823529411764706, | |
| "eval_loss": 0.15423187613487244, | |
| "eval_overall_accuracy": 0.9512675363032242, | |
| "eval_overall_f1": 0.770448548812665, | |
| "eval_overall_precision": 0.7174447174447175, | |
| "eval_overall_recall": 0.8319088319088319, | |
| "eval_runtime": 0.3338, | |
| "eval_samples_per_second": 560.152, | |
| "eval_steps_per_second": 8.986, | |
| "step": 742 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "grad_norm": 1.469247817993164, | |
| "learning_rate": 4.600000000000001e-05, | |
| "loss": 0.1529, | |
| "step": 848 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_LOCATION_f1": 0.7590361445783131, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.6774193548387096, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.5915492957746479, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5454545454545454, | |
| "eval_ORGANIZATION_recall": 0.6461538461538462, | |
| "eval_PERSON_f1": 0.8500000000000001, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.7619047619047619, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.7058823529411765, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.861111111111111, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.8157894736842105, | |
| "eval_TIME_recall": 0.9117647058823529, | |
| "eval_loss": 0.14763768017292023, | |
| "eval_overall_accuracy": 0.9527442776273689, | |
| "eval_overall_f1": 0.7758846657929228, | |
| "eval_overall_precision": 0.7184466019417476, | |
| "eval_overall_recall": 0.8433048433048433, | |
| "eval_runtime": 0.3346, | |
| "eval_samples_per_second": 558.898, | |
| "eval_steps_per_second": 8.966, | |
| "step": 848 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "grad_norm": 1.5628341436386108, | |
| "learning_rate": 4.55e-05, | |
| "loss": 0.1428, | |
| "step": 954 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_LOCATION_f1": 0.7544910179640719, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.6702127659574468, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.6225165562913907, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5465116279069767, | |
| "eval_ORGANIZATION_recall": 0.7230769230769231, | |
| "eval_PERSON_f1": 0.879746835443038, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8373493975903614, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.575, | |
| "eval_QUANTITY_recall": 0.7931034482758621, | |
| "eval_TIME_f1": 0.8266666666666665, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7560975609756098, | |
| "eval_TIME_recall": 0.9117647058823529, | |
| "eval_loss": 0.14981509745121002, | |
| "eval_overall_accuracy": 0.9497907949790795, | |
| "eval_overall_f1": 0.7789203084832904, | |
| "eval_overall_precision": 0.7096018735362998, | |
| "eval_overall_recall": 0.8632478632478633, | |
| "eval_runtime": 0.3338, | |
| "eval_samples_per_second": 560.163, | |
| "eval_steps_per_second": 8.987, | |
| "step": 954 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "grad_norm": 1.2276618480682373, | |
| "learning_rate": 4.5e-05, | |
| "loss": 0.132, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_LOCATION_f1": 0.779874213836478, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7209302325581395, | |
| "eval_LOCATION_recall": 0.8493150684931506, | |
| "eval_ORGANIZATION_f1": 0.5925925925925927, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5714285714285714, | |
| "eval_ORGANIZATION_recall": 0.6153846153846154, | |
| "eval_PERSON_f1": 0.8616352201257862, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8154761904761905, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8108108108108107, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.75, | |
| "eval_TIME_recall": 0.8823529411764706, | |
| "eval_loss": 0.14296573400497437, | |
| "eval_overall_accuracy": 0.9532365247354172, | |
| "eval_overall_f1": 0.7808764940239045, | |
| "eval_overall_precision": 0.7313432835820896, | |
| "eval_overall_recall": 0.8376068376068376, | |
| "eval_runtime": 0.3274, | |
| "eval_samples_per_second": 571.224, | |
| "eval_steps_per_second": 9.164, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "grad_norm": 1.8262553215026855, | |
| "learning_rate": 4.4500000000000004e-05, | |
| "loss": 0.1288, | |
| "step": 1166 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_LOCATION_f1": 0.7515151515151515, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.6739130434782609, | |
| "eval_LOCATION_recall": 0.8493150684931506, | |
| "eval_ORGANIZATION_f1": 0.6330935251798562, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5945945945945946, | |
| "eval_ORGANIZATION_recall": 0.676923076923077, | |
| "eval_PERSON_f1": 0.8698412698412699, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8303030303030303, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.6956521739130435, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.7631578947368423, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.6904761904761905, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1460973471403122, | |
| "eval_overall_accuracy": 0.9515136598572483, | |
| "eval_overall_f1": 0.774869109947644, | |
| "eval_overall_precision": 0.7167070217917676, | |
| "eval_overall_recall": 0.8433048433048433, | |
| "eval_runtime": 0.3342, | |
| "eval_samples_per_second": 559.473, | |
| "eval_steps_per_second": 8.976, | |
| "step": 1166 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "grad_norm": 1.1676838397979736, | |
| "learning_rate": 4.4000000000000006e-05, | |
| "loss": 0.1219, | |
| "step": 1272 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_LOCATION_f1": 0.7590361445783131, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.6774193548387096, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.6433566433566433, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5897435897435898, | |
| "eval_ORGANIZATION_recall": 0.7076923076923077, | |
| "eval_PERSON_f1": 0.8734177215189873, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8313253012048193, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6153846153846154, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.7631578947368423, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.6904761904761905, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14986908435821533, | |
| "eval_overall_accuracy": 0.9502830420871278, | |
| "eval_overall_f1": 0.7802340702210663, | |
| "eval_overall_precision": 0.7177033492822966, | |
| "eval_overall_recall": 0.8547008547008547, | |
| "eval_runtime": 0.333, | |
| "eval_samples_per_second": 561.614, | |
| "eval_steps_per_second": 9.01, | |
| "step": 1272 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "grad_norm": 1.25841224193573, | |
| "learning_rate": 4.35e-05, | |
| "loss": 0.1176, | |
| "step": 1378 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_LOCATION_f1": 0.7820512820512822, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7349397590361446, | |
| "eval_LOCATION_recall": 0.8356164383561644, | |
| "eval_ORGANIZATION_f1": 0.6666666666666666, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5975609756097561, | |
| "eval_ORGANIZATION_recall": 0.7538461538461538, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6410256410256411, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7945205479452054, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7435897435897436, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.13805125653743744, | |
| "eval_overall_accuracy": 0.9547132660595619, | |
| "eval_overall_f1": 0.7968337730870712, | |
| "eval_overall_precision": 0.742014742014742, | |
| "eval_overall_recall": 0.8603988603988604, | |
| "eval_runtime": 0.3326, | |
| "eval_samples_per_second": 562.243, | |
| "eval_steps_per_second": 9.02, | |
| "step": 1378 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "grad_norm": 1.1619478464126587, | |
| "learning_rate": 4.3e-05, | |
| "loss": 0.1161, | |
| "step": 1484 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_LOCATION_f1": 0.782608695652174, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7159090909090909, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.6666666666666666, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5975609756097561, | |
| "eval_ORGANIZATION_recall": 0.7538461538461538, | |
| "eval_PERSON_f1": 0.8761904761904761, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8363636363636363, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7536231884057972, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.65, | |
| "eval_QUANTITY_recall": 0.896551724137931, | |
| "eval_TIME_f1": 0.7631578947368423, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.6904761904761905, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14077436923980713, | |
| "eval_overall_accuracy": 0.9532365247354172, | |
| "eval_overall_f1": 0.7942708333333333, | |
| "eval_overall_precision": 0.7314148681055156, | |
| "eval_overall_recall": 0.8689458689458689, | |
| "eval_runtime": 0.3264, | |
| "eval_samples_per_second": 572.885, | |
| "eval_steps_per_second": 9.191, | |
| "step": 1484 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "grad_norm": 1.547819972038269, | |
| "learning_rate": 4.25e-05, | |
| "loss": 0.1148, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_LOCATION_f1": 0.7777777777777778, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7078651685393258, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7058823529411765, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6136363636363636, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8726114649681529, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7246376811594203, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.625, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7733333333333334, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7073170731707317, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1482475847005844, | |
| "eval_overall_accuracy": 0.9537287718434654, | |
| "eval_overall_f1": 0.7968952134540751, | |
| "eval_overall_precision": 0.7298578199052133, | |
| "eval_overall_recall": 0.8774928774928775, | |
| "eval_runtime": 0.3273, | |
| "eval_samples_per_second": 571.301, | |
| "eval_steps_per_second": 9.165, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "grad_norm": 3.2295055389404297, | |
| "learning_rate": 4.2e-05, | |
| "loss": 0.1075, | |
| "step": 1696 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_LOCATION_f1": 0.8076923076923077, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7590361445783133, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.6268656716417911, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6086956521739131, | |
| "eval_ORGANIZATION_recall": 0.6461538461538462, | |
| "eval_PERSON_f1": 0.8753993610223643, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8404907975460123, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7142857142857144, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6097560975609756, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7733333333333334, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7073170731707317, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14014115929603577, | |
| "eval_overall_accuracy": 0.9554516367216342, | |
| "eval_overall_f1": 0.7914438502673797, | |
| "eval_overall_precision": 0.7455919395465995, | |
| "eval_overall_recall": 0.8433048433048433, | |
| "eval_runtime": 0.3353, | |
| "eval_samples_per_second": 557.692, | |
| "eval_steps_per_second": 8.947, | |
| "step": 1696 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "grad_norm": 0.9571211934089661, | |
| "learning_rate": 4.15e-05, | |
| "loss": 0.1058, | |
| "step": 1802 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "eval_LOCATION_f1": 0.7875, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7199999999999999, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6352941176470588, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8761904761904761, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8363636363636363, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7575757575757576, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6756756756756757, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7631578947368423, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.6904761904761905, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14074338972568512, | |
| "eval_overall_accuracy": 0.9542210189515137, | |
| "eval_overall_f1": 0.8057366362451107, | |
| "eval_overall_precision": 0.7427884615384616, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.3268, | |
| "eval_samples_per_second": 572.193, | |
| "eval_steps_per_second": 9.18, | |
| "step": 1802 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "grad_norm": 1.2484526634216309, | |
| "learning_rate": 4.1e-05, | |
| "loss": 0.1021, | |
| "step": 1908 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_LOCATION_f1": 0.8076923076923077, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7590361445783133, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.6433566433566433, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.5897435897435898, | |
| "eval_ORGANIZATION_recall": 0.7076923076923077, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.6956521739130435, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.7837837837837837, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.725, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.13723434507846832, | |
| "eval_overall_accuracy": 0.9561900073837066, | |
| "eval_overall_f1": 0.7936507936507937, | |
| "eval_overall_precision": 0.7407407407407407, | |
| "eval_overall_recall": 0.8547008547008547, | |
| "eval_runtime": 0.3273, | |
| "eval_samples_per_second": 571.38, | |
| "eval_steps_per_second": 9.167, | |
| "step": 1908 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "grad_norm": 0.977418839931488, | |
| "learning_rate": 4.05e-05, | |
| "loss": 0.1032, | |
| "step": 2014 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "eval_LOCATION_f1": 0.8026315789473685, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7721518987341772, | |
| "eval_LOCATION_recall": 0.8356164383561644, | |
| "eval_ORGANIZATION_f1": 0.7066666666666667, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6235294117647059, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7812500000000001, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7733333333333334, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7073170731707317, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.13176140189170837, | |
| "eval_overall_accuracy": 0.958897366477972, | |
| "eval_overall_f1": 0.8116710875331565, | |
| "eval_overall_precision": 0.7593052109181141, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.3289, | |
| "eval_samples_per_second": 568.639, | |
| "eval_steps_per_second": 9.123, | |
| "step": 2014 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "grad_norm": 1.2055819034576416, | |
| "learning_rate": 4e-05, | |
| "loss": 0.0979, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_LOCATION_f1": 0.7974683544303799, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7411764705882353, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7412587412587412, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6794871794871795, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.7945205479452054, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7435897435897436, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1400451809167862, | |
| "eval_overall_accuracy": 0.956928378045779, | |
| "eval_overall_f1": 0.8132450331125828, | |
| "eval_overall_precision": 0.7599009900990099, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.3266, | |
| "eval_samples_per_second": 572.647, | |
| "eval_steps_per_second": 9.187, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "grad_norm": 2.198835611343384, | |
| "learning_rate": 3.9500000000000005e-05, | |
| "loss": 0.098, | |
| "step": 2226 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "eval_LOCATION_f1": 0.8181818181818182, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7777777777777778, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.725925925925926, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.7, | |
| "eval_ORGANIZATION_recall": 0.7538461538461538, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7945205479452054, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7435897435897436, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.13511410355567932, | |
| "eval_overall_accuracy": 0.9593896135860202, | |
| "eval_overall_f1": 0.8194070080862534, | |
| "eval_overall_precision": 0.7774936061381074, | |
| "eval_overall_recall": 0.8660968660968661, | |
| "eval_runtime": 0.3268, | |
| "eval_samples_per_second": 572.204, | |
| "eval_steps_per_second": 9.18, | |
| "step": 2226 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "grad_norm": 3.7243123054504395, | |
| "learning_rate": 3.9000000000000006e-05, | |
| "loss": 0.0942, | |
| "step": 2332 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "eval_LOCATION_f1": 0.7820512820512822, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7349397590361446, | |
| "eval_LOCATION_recall": 0.8356164383561644, | |
| "eval_ORGANIZATION_f1": 0.7027027027027027, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6265060240963856, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8810289389067525, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8509316770186336, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1375378519296646, | |
| "eval_overall_accuracy": 0.9574206251538272, | |
| "eval_overall_f1": 0.8085106382978723, | |
| "eval_overall_precision": 0.7581047381546134, | |
| "eval_overall_recall": 0.8660968660968661, | |
| "eval_runtime": 0.3271, | |
| "eval_samples_per_second": 571.696, | |
| "eval_steps_per_second": 9.172, | |
| "step": 2332 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "grad_norm": 1.6769466400146484, | |
| "learning_rate": 3.85e-05, | |
| "loss": 0.0943, | |
| "step": 2438 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.775, | |
| "eval_LOCATION_recall": 0.8493150684931506, | |
| "eval_ORGANIZATION_f1": 0.76, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6705882352941176, | |
| "eval_ORGANIZATION_recall": 0.8769230769230769, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7945205479452054, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7435897435897436, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.13511058688163757, | |
| "eval_overall_accuracy": 0.9591434900319961, | |
| "eval_overall_f1": 0.8249336870026525, | |
| "eval_overall_precision": 0.771712158808933, | |
| "eval_overall_recall": 0.886039886039886, | |
| "eval_runtime": 0.3273, | |
| "eval_samples_per_second": 571.272, | |
| "eval_steps_per_second": 9.165, | |
| "step": 2438 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "grad_norm": 1.9959501028060913, | |
| "learning_rate": 3.8e-05, | |
| "loss": 0.091, | |
| "step": 2544 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "eval_LOCATION_f1": 0.8050314465408805, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7441860465116279, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7682119205298013, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6744186046511628, | |
| "eval_ORGANIZATION_recall": 0.8923076923076924, | |
| "eval_PERSON_f1": 0.8753993610223643, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8404907975460123, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6410256410256411, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7837837837837837, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.725, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14082586765289307, | |
| "eval_overall_accuracy": 0.9579128722618755, | |
| "eval_overall_f1": 0.8183006535947712, | |
| "eval_overall_precision": 0.7560386473429952, | |
| "eval_overall_recall": 0.8917378917378918, | |
| "eval_runtime": 0.3276, | |
| "eval_samples_per_second": 570.878, | |
| "eval_steps_per_second": 9.158, | |
| "step": 2544 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "grad_norm": 2.225444793701172, | |
| "learning_rate": 3.7500000000000003e-05, | |
| "loss": 0.089, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "eval_LOCATION_f1": 0.8076923076923077, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7590361445783133, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7464788732394366, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6883116883116883, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8810289389067525, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8509316770186336, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7246376811594203, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.625, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1414780169725418, | |
| "eval_overall_accuracy": 0.9584051193699237, | |
| "eval_overall_f1": 0.8186666666666667, | |
| "eval_overall_precision": 0.7694235588972431, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.3266, | |
| "eval_samples_per_second": 572.607, | |
| "eval_steps_per_second": 9.186, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "grad_norm": 1.2359886169433594, | |
| "learning_rate": 3.7e-05, | |
| "loss": 0.0862, | |
| "step": 2756 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "eval_LOCATION_f1": 0.7898089171974523, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7380952380952381, | |
| "eval_LOCATION_recall": 0.8493150684931506, | |
| "eval_ORGANIZATION_f1": 0.7194244604316546, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6756756756756757, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7142857142857144, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6097560975609756, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7733333333333334, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7073170731707317, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14282022416591644, | |
| "eval_overall_accuracy": 0.9561900073837066, | |
| "eval_overall_f1": 0.8052980132450331, | |
| "eval_overall_precision": 0.7524752475247525, | |
| "eval_overall_recall": 0.8660968660968661, | |
| "eval_runtime": 0.3275, | |
| "eval_samples_per_second": 570.999, | |
| "eval_steps_per_second": 9.16, | |
| "step": 2756 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "grad_norm": 1.0968230962753296, | |
| "learning_rate": 3.65e-05, | |
| "loss": 0.0836, | |
| "step": 2862 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "eval_LOCATION_f1": 0.7950310559006212, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7272727272727273, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7323943661971831, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6753246753246753, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.676056338028169, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.5714285714285714, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.7733333333333334, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7073170731707317, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14485140144824982, | |
| "eval_overall_accuracy": 0.9556977602756583, | |
| "eval_overall_f1": 0.8068331143232589, | |
| "eval_overall_precision": 0.748780487804878, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.3284, | |
| "eval_samples_per_second": 569.433, | |
| "eval_steps_per_second": 9.135, | |
| "step": 2862 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "grad_norm": 1.7558865547180176, | |
| "learning_rate": 3.6e-05, | |
| "loss": 0.0801, | |
| "step": 2968 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.775, | |
| "eval_LOCATION_recall": 0.8493150684931506, | |
| "eval_ORGANIZATION_f1": 0.7338129496402878, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6891891891891891, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8774193548387097, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.85, | |
| "eval_PERSON_recall": 0.9066666666666666, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7837837837837837, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.725, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.13724297285079956, | |
| "eval_overall_accuracy": 0.9579128722618755, | |
| "eval_overall_f1": 0.8156123822341856, | |
| "eval_overall_precision": 0.7729591836734694, | |
| "eval_overall_recall": 0.8632478632478633, | |
| "eval_runtime": 0.3346, | |
| "eval_samples_per_second": 558.811, | |
| "eval_steps_per_second": 8.965, | |
| "step": 2968 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "grad_norm": 1.0294597148895264, | |
| "learning_rate": 3.55e-05, | |
| "loss": 0.0779, | |
| "step": 3074 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "eval_LOCATION_f1": 0.7974683544303799, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7411764705882353, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7682119205298013, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6744186046511628, | |
| "eval_ORGANIZATION_recall": 0.8923076923076924, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7837837837837837, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.725, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1392383724451065, | |
| "eval_overall_accuracy": 0.958897366477972, | |
| "eval_overall_f1": 0.8236842105263158, | |
| "eval_overall_precision": 0.7652811735941321, | |
| "eval_overall_recall": 0.8917378917378918, | |
| "eval_runtime": 0.3338, | |
| "eval_samples_per_second": 560.248, | |
| "eval_steps_per_second": 8.988, | |
| "step": 3074 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "grad_norm": 1.9617377519607544, | |
| "learning_rate": 3.5e-05, | |
| "loss": 0.0776, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.725925925925926, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.7, | |
| "eval_ORGANIZATION_recall": 0.7538461538461538, | |
| "eval_PERSON_f1": 0.8853503184713376, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8475609756097561, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7945205479452054, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7435897435897436, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.13599379360675812, | |
| "eval_overall_accuracy": 0.9593896135860202, | |
| "eval_overall_f1": 0.8236877523553163, | |
| "eval_overall_precision": 0.7806122448979592, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.332, | |
| "eval_samples_per_second": 563.281, | |
| "eval_steps_per_second": 9.037, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "grad_norm": 0.6533139944076538, | |
| "learning_rate": 3.45e-05, | |
| "loss": 0.0764, | |
| "step": 3286 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "eval_LOCATION_f1": 0.8101265822784809, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7529411764705882, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7586206896551724, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6875, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7246376811594203, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.625, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7733333333333334, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7073170731707317, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14058609306812286, | |
| "eval_overall_accuracy": 0.9598818606940684, | |
| "eval_overall_f1": 0.8173455978975033, | |
| "eval_overall_precision": 0.7585365853658537, | |
| "eval_overall_recall": 0.886039886039886, | |
| "eval_runtime": 0.3334, | |
| "eval_samples_per_second": 560.883, | |
| "eval_steps_per_second": 8.998, | |
| "step": 3286 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "grad_norm": 0.820826530456543, | |
| "learning_rate": 3.4000000000000007e-05, | |
| "loss": 0.0745, | |
| "step": 3392 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "eval_LOCATION_f1": 0.7974683544303799, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7411764705882353, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7567567567567568, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6746987951807228, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.6857142857142856, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.5853658536585366, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8169014084507041, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7837837837837838, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1464959979057312, | |
| "eval_overall_accuracy": 0.9576667487078513, | |
| "eval_overall_f1": 0.8157894736842105, | |
| "eval_overall_precision": 0.7579462102689487, | |
| "eval_overall_recall": 0.8831908831908832, | |
| "eval_runtime": 0.3329, | |
| "eval_samples_per_second": 561.647, | |
| "eval_steps_per_second": 9.01, | |
| "step": 3392 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "grad_norm": 0.9249401688575745, | |
| "learning_rate": 3.35e-05, | |
| "loss": 0.0729, | |
| "step": 3498 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.72992700729927, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6944444444444444, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8782051282051282, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.845679012345679, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7936507936507937, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7945205479452054, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7435897435897436, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.13697849214076996, | |
| "eval_overall_accuracy": 0.9606202313561408, | |
| "eval_overall_f1": 0.8243243243243243, | |
| "eval_overall_precision": 0.7840616966580977, | |
| "eval_overall_recall": 0.8689458689458689, | |
| "eval_runtime": 0.3343, | |
| "eval_samples_per_second": 559.37, | |
| "eval_steps_per_second": 8.974, | |
| "step": 3498 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "grad_norm": 3.431596040725708, | |
| "learning_rate": 3.3e-05, | |
| "loss": 0.0719, | |
| "step": 3604 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "eval_LOCATION_f1": 0.8311688311688312, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7901234567901234, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.6814814814814816, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6571428571428571, | |
| "eval_ORGANIZATION_recall": 0.7076923076923077, | |
| "eval_PERSON_f1": 0.8838709677419355, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.85625, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7812500000000001, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1357881724834442, | |
| "eval_overall_accuracy": 0.9616047255722373, | |
| "eval_overall_f1": 0.819047619047619, | |
| "eval_overall_precision": 0.7838541666666666, | |
| "eval_overall_recall": 0.8575498575498576, | |
| "eval_runtime": 0.3327, | |
| "eval_samples_per_second": 562.136, | |
| "eval_steps_per_second": 9.018, | |
| "step": 3604 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "grad_norm": 0.9399017691612244, | |
| "learning_rate": 3.2500000000000004e-05, | |
| "loss": 0.0746, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "eval_LOCATION_f1": 0.8050314465408805, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7441860465116279, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7432432432432433, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6626506024096386, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6410256410256411, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7733333333333334, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7073170731707317, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14653536677360535, | |
| "eval_overall_accuracy": 0.9574206251538272, | |
| "eval_overall_f1": 0.8141361256544503, | |
| "eval_overall_precision": 0.7530266343825666, | |
| "eval_overall_recall": 0.886039886039886, | |
| "eval_runtime": 0.3328, | |
| "eval_samples_per_second": 561.886, | |
| "eval_steps_per_second": 9.014, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "grad_norm": 0.6335604190826416, | |
| "learning_rate": 3.2000000000000005e-05, | |
| "loss": 0.0676, | |
| "step": 3816 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7464788732394366, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6883116883116883, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7837837837837837, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.725, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.13876868784427643, | |
| "eval_overall_accuracy": 0.9603741078021166, | |
| "eval_overall_f1": 0.8251001335113485, | |
| "eval_overall_precision": 0.7763819095477387, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.3328, | |
| "eval_samples_per_second": 561.873, | |
| "eval_steps_per_second": 9.014, | |
| "step": 3816 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "grad_norm": 1.0286895036697388, | |
| "learning_rate": 3.15e-05, | |
| "loss": 0.0674, | |
| "step": 3922 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "eval_LOCATION_f1": 0.8076923076923077, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7590361445783133, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7432432432432433, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6626506024096386, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8761904761904761, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8363636363636363, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.7837837837837837, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.725, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14836791157722473, | |
| "eval_overall_accuracy": 0.9586512429239479, | |
| "eval_overall_f1": 0.8131578947368421, | |
| "eval_overall_precision": 0.7555012224938875, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.3338, | |
| "eval_samples_per_second": 560.202, | |
| "eval_steps_per_second": 8.987, | |
| "step": 3922 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "grad_norm": 0.754433274269104, | |
| "learning_rate": 3.1e-05, | |
| "loss": 0.0653, | |
| "step": 4028 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.6911764705882353, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6619718309859155, | |
| "eval_ORGANIZATION_recall": 0.7230769230769231, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.7837837837837837, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.725, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1401306837797165, | |
| "eval_overall_accuracy": 0.9593896135860202, | |
| "eval_overall_f1": 0.8096514745308312, | |
| "eval_overall_precision": 0.7645569620253164, | |
| "eval_overall_recall": 0.8603988603988604, | |
| "eval_runtime": 0.3326, | |
| "eval_samples_per_second": 562.239, | |
| "eval_steps_per_second": 9.02, | |
| "step": 4028 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "grad_norm": 1.2110971212387085, | |
| "learning_rate": 3.05e-05, | |
| "loss": 0.0638, | |
| "step": 4134 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.775, | |
| "eval_LOCATION_recall": 0.8493150684931506, | |
| "eval_ORGANIZATION_f1": 0.7534246575342466, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6790123456790124, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7575757575757576, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6756756756756757, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7945205479452054, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7435897435897436, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1372911036014557, | |
| "eval_overall_accuracy": 0.9608663549101649, | |
| "eval_overall_f1": 0.8229027962716379, | |
| "eval_overall_precision": 0.7725, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.332, | |
| "eval_samples_per_second": 563.249, | |
| "eval_steps_per_second": 9.036, | |
| "step": 4134 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "grad_norm": 0.7484323382377625, | |
| "learning_rate": 3e-05, | |
| "loss": 0.0641, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "eval_LOCATION_f1": 0.7875, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7241379310344828, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7567567567567568, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6746987951807228, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.879746835443038, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8373493975903614, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.6857142857142856, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.5853658536585366, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.7837837837837837, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.725, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15354810655117035, | |
| "eval_overall_accuracy": 0.9566822544917548, | |
| "eval_overall_f1": 0.8098958333333335, | |
| "eval_overall_precision": 0.7458033573141487, | |
| "eval_overall_recall": 0.886039886039886, | |
| "eval_runtime": 0.3264, | |
| "eval_samples_per_second": 572.882, | |
| "eval_steps_per_second": 9.191, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 41.0, | |
| "grad_norm": 0.8354088068008423, | |
| "learning_rate": 2.95e-05, | |
| "loss": 0.0632, | |
| "step": 4346 | |
| }, | |
| { | |
| "epoch": 41.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7801418439716312, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.7236842105263158, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7575757575757576, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6756756756756757, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.13777735829353333, | |
| "eval_overall_accuracy": 0.9613586020182131, | |
| "eval_overall_f1": 0.8326639892904953, | |
| "eval_overall_precision": 0.7853535353535354, | |
| "eval_overall_recall": 0.886039886039886, | |
| "eval_runtime": 0.333, | |
| "eval_samples_per_second": 561.553, | |
| "eval_steps_per_second": 9.009, | |
| "step": 4346 | |
| }, | |
| { | |
| "epoch": 42.0, | |
| "grad_norm": 0.5027186274528503, | |
| "learning_rate": 2.9e-05, | |
| "loss": 0.0607, | |
| "step": 4452 | |
| }, | |
| { | |
| "epoch": 42.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.775, | |
| "eval_LOCATION_recall": 0.8493150684931506, | |
| "eval_ORGANIZATION_f1": 0.7464788732394366, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6883116883116883, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8782051282051282, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.845679012345679, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7945205479452054, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7435897435897436, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1403217911720276, | |
| "eval_overall_accuracy": 0.9606202313561408, | |
| "eval_overall_f1": 0.8192771084337349, | |
| "eval_overall_precision": 0.7727272727272727, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.3336, | |
| "eval_samples_per_second": 560.597, | |
| "eval_steps_per_second": 8.994, | |
| "step": 4452 | |
| }, | |
| { | |
| "epoch": 43.0, | |
| "grad_norm": 0.9568884968757629, | |
| "learning_rate": 2.8499999999999998e-05, | |
| "loss": 0.0596, | |
| "step": 4558 | |
| }, | |
| { | |
| "epoch": 43.0, | |
| "eval_LOCATION_f1": 0.8311688311688312, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7901234567901234, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7323943661971831, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6753246753246753, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8838709677419355, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.85625, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7945205479452054, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7435897435897436, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1430799663066864, | |
| "eval_overall_accuracy": 0.9616047255722373, | |
| "eval_overall_f1": 0.8230563002680965, | |
| "eval_overall_precision": 0.7772151898734178, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.3331, | |
| "eval_samples_per_second": 561.433, | |
| "eval_steps_per_second": 9.007, | |
| "step": 4558 | |
| }, | |
| { | |
| "epoch": 44.0, | |
| "grad_norm": 5.6017351150512695, | |
| "learning_rate": 2.8000000000000003e-05, | |
| "loss": 0.0582, | |
| "step": 4664 | |
| }, | |
| { | |
| "epoch": 44.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7375886524822695, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6842105263157895, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8853503184713376, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8475609756097561, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.7837837837837837, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.725, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14417453110218048, | |
| "eval_overall_accuracy": 0.961112478464189, | |
| "eval_overall_f1": 0.8229027962716379, | |
| "eval_overall_precision": 0.7725, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.3257, | |
| "eval_samples_per_second": 574.07, | |
| "eval_steps_per_second": 9.21, | |
| "step": 4664 | |
| }, | |
| { | |
| "epoch": 45.0, | |
| "grad_norm": 2.356386184692383, | |
| "learning_rate": 2.7500000000000004e-05, | |
| "loss": 0.0606, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 45.0, | |
| "eval_LOCATION_f1": 0.8152866242038217, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7619047619047619, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.763888888888889, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6962025316455697, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.879746835443038, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8373493975903614, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.7246376811594203, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.625, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14679183065891266, | |
| "eval_overall_accuracy": 0.9596357371400444, | |
| "eval_overall_f1": 0.8232189973614775, | |
| "eval_overall_precision": 0.7665847665847666, | |
| "eval_overall_recall": 0.8888888888888888, | |
| "eval_runtime": 0.3259, | |
| "eval_samples_per_second": 573.862, | |
| "eval_steps_per_second": 9.206, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 46.0, | |
| "grad_norm": 0.9929021000862122, | |
| "learning_rate": 2.7000000000000002e-05, | |
| "loss": 0.0563, | |
| "step": 4876 | |
| }, | |
| { | |
| "epoch": 46.0, | |
| "eval_LOCATION_f1": 0.8311688311688312, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7901234567901234, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7285714285714285, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.68, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14097212255001068, | |
| "eval_overall_accuracy": 0.9608663549101649, | |
| "eval_overall_f1": 0.8219544846050869, | |
| "eval_overall_precision": 0.7752525252525253, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.333, | |
| "eval_samples_per_second": 561.632, | |
| "eval_steps_per_second": 9.01, | |
| "step": 4876 | |
| }, | |
| { | |
| "epoch": 47.0, | |
| "grad_norm": 0.8276335597038269, | |
| "learning_rate": 2.6500000000000004e-05, | |
| "loss": 0.0556, | |
| "step": 4982 | |
| }, | |
| { | |
| "epoch": 47.0, | |
| "eval_LOCATION_f1": 0.7974683544303799, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7411764705882353, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7724137931034483, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.7, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.879746835443038, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8373493975903614, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.6857142857142856, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.5853658536585366, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15497690439224243, | |
| "eval_overall_accuracy": 0.9579128722618755, | |
| "eval_overall_f1": 0.8173455978975033, | |
| "eval_overall_precision": 0.7585365853658537, | |
| "eval_overall_recall": 0.886039886039886, | |
| "eval_runtime": 0.3319, | |
| "eval_samples_per_second": 563.4, | |
| "eval_steps_per_second": 9.039, | |
| "step": 4982 | |
| }, | |
| { | |
| "epoch": 48.0, | |
| "grad_norm": 2.3347344398498535, | |
| "learning_rate": 2.6000000000000002e-05, | |
| "loss": 0.0578, | |
| "step": 5088 | |
| }, | |
| { | |
| "epoch": 48.0, | |
| "eval_LOCATION_f1": 0.8152866242038217, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7619047619047619, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7534246575342466, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6790123456790124, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8825396825396825, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8424242424242424, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.6956521739130435, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.7945205479452054, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7435897435897436, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1532071828842163, | |
| "eval_overall_accuracy": 0.9576667487078513, | |
| "eval_overall_f1": 0.8184210526315789, | |
| "eval_overall_precision": 0.7603911980440098, | |
| "eval_overall_recall": 0.886039886039886, | |
| "eval_runtime": 0.332, | |
| "eval_samples_per_second": 563.241, | |
| "eval_steps_per_second": 9.036, | |
| "step": 5088 | |
| }, | |
| { | |
| "epoch": 49.0, | |
| "grad_norm": 0.38269466161727905, | |
| "learning_rate": 2.5500000000000003e-05, | |
| "loss": 0.0559, | |
| "step": 5194 | |
| }, | |
| { | |
| "epoch": 49.0, | |
| "eval_LOCATION_f1": 0.8311688311688312, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7901234567901234, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7428571428571429, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6933333333333334, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8825396825396825, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8424242424242424, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14444759488105774, | |
| "eval_overall_accuracy": 0.9618508491262614, | |
| "eval_overall_f1": 0.8262032085561498, | |
| "eval_overall_precision": 0.7783375314861462, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.332, | |
| "eval_samples_per_second": 563.256, | |
| "eval_steps_per_second": 9.036, | |
| "step": 5194 | |
| }, | |
| { | |
| "epoch": 50.0, | |
| "grad_norm": 1.5551215410232544, | |
| "learning_rate": 2.5e-05, | |
| "loss": 0.0544, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 50.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.757142857142857, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.7066666666666667, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8853503184713376, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8475609756097561, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6410256410256411, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1467483639717102, | |
| "eval_overall_accuracy": 0.9608663549101649, | |
| "eval_overall_f1": 0.8266666666666667, | |
| "eval_overall_precision": 0.7769423558897243, | |
| "eval_overall_recall": 0.8831908831908832, | |
| "eval_runtime": 0.3328, | |
| "eval_samples_per_second": 561.888, | |
| "eval_steps_per_second": 9.014, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 51.0, | |
| "grad_norm": 1.1728203296661377, | |
| "learning_rate": 2.45e-05, | |
| "loss": 0.0511, | |
| "step": 5406 | |
| }, | |
| { | |
| "epoch": 51.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7246376811594203, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.684931506849315, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8853503184713376, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8475609756097561, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14386440813541412, | |
| "eval_overall_accuracy": 0.9608663549101649, | |
| "eval_overall_f1": 0.8219544846050869, | |
| "eval_overall_precision": 0.7752525252525253, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.3262, | |
| "eval_samples_per_second": 573.233, | |
| "eval_steps_per_second": 9.196, | |
| "step": 5406 | |
| }, | |
| { | |
| "epoch": 52.0, | |
| "grad_norm": 1.3139925003051758, | |
| "learning_rate": 2.4e-05, | |
| "loss": 0.0516, | |
| "step": 5512 | |
| }, | |
| { | |
| "epoch": 52.0, | |
| "eval_LOCATION_f1": 0.8152866242038217, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7619047619047619, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7567567567567568, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6746987951807228, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8734177215189873, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8313253012048193, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7575757575757576, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6756756756756757, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15267647802829742, | |
| "eval_overall_accuracy": 0.9596357371400444, | |
| "eval_overall_f1": 0.8221343873517786, | |
| "eval_overall_precision": 0.7647058823529411, | |
| "eval_overall_recall": 0.8888888888888888, | |
| "eval_runtime": 0.3328, | |
| "eval_samples_per_second": 561.953, | |
| "eval_steps_per_second": 9.015, | |
| "step": 5512 | |
| }, | |
| { | |
| "epoch": 53.0, | |
| "grad_norm": 1.7045568227767944, | |
| "learning_rate": 2.35e-05, | |
| "loss": 0.0524, | |
| "step": 5618 | |
| }, | |
| { | |
| "epoch": 53.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.75, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6835443037974683, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8742138364779874, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8273809523809523, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.7246376811594203, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.625, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15286701917648315, | |
| "eval_overall_accuracy": 0.9598818606940684, | |
| "eval_overall_f1": 0.8194993412384717, | |
| "eval_overall_precision": 0.7622549019607843, | |
| "eval_overall_recall": 0.886039886039886, | |
| "eval_runtime": 0.3345, | |
| "eval_samples_per_second": 559.086, | |
| "eval_steps_per_second": 8.969, | |
| "step": 5618 | |
| }, | |
| { | |
| "epoch": 54.0, | |
| "grad_norm": 2.6849210262298584, | |
| "learning_rate": 2.3000000000000003e-05, | |
| "loss": 0.0513, | |
| "step": 5724 | |
| }, | |
| { | |
| "epoch": 54.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7450980392156863, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6477272727272727, | |
| "eval_ORGANIZATION_recall": 0.8769230769230769, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6153846153846154, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15772588551044464, | |
| "eval_overall_accuracy": 0.9576667487078513, | |
| "eval_overall_f1": 0.817824377457405, | |
| "eval_overall_precision": 0.7572815533980582, | |
| "eval_overall_recall": 0.8888888888888888, | |
| "eval_runtime": 0.3319, | |
| "eval_samples_per_second": 563.4, | |
| "eval_steps_per_second": 9.039, | |
| "step": 5724 | |
| }, | |
| { | |
| "epoch": 55.0, | |
| "grad_norm": 0.8173909783363342, | |
| "learning_rate": 2.25e-05, | |
| "loss": 0.0506, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 55.0, | |
| "eval_LOCATION_f1": 0.8235294117647058, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7875, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7428571428571429, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6933333333333334, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8825396825396825, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8424242424242424, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15098540484905243, | |
| "eval_overall_accuracy": 0.9603741078021166, | |
| "eval_overall_f1": 0.8219544846050869, | |
| "eval_overall_precision": 0.7752525252525253, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.3334, | |
| "eval_samples_per_second": 560.961, | |
| "eval_steps_per_second": 8.999, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 56.0, | |
| "grad_norm": 1.8647905588150024, | |
| "learning_rate": 2.2000000000000003e-05, | |
| "loss": 0.0511, | |
| "step": 5936 | |
| }, | |
| { | |
| "epoch": 56.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7517730496453899, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6973684210526315, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8825396825396825, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8424242424242424, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14845135807991028, | |
| "eval_overall_accuracy": 0.9606202313561408, | |
| "eval_overall_f1": 0.8255659121171771, | |
| "eval_overall_precision": 0.775, | |
| "eval_overall_recall": 0.8831908831908832, | |
| "eval_runtime": 0.3279, | |
| "eval_samples_per_second": 570.365, | |
| "eval_steps_per_second": 9.15, | |
| "step": 5936 | |
| }, | |
| { | |
| "epoch": 57.0, | |
| "grad_norm": 0.22929580509662628, | |
| "learning_rate": 2.15e-05, | |
| "loss": 0.0494, | |
| "step": 6042 | |
| }, | |
| { | |
| "epoch": 57.0, | |
| "eval_LOCATION_f1": 0.8181818181818182, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7777777777777778, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7285714285714285, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.68, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8853503184713376, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8475609756097561, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8169014084507041, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7837837837837838, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14559510350227356, | |
| "eval_overall_accuracy": 0.9618508491262614, | |
| "eval_overall_f1": 0.8230563002680965, | |
| "eval_overall_precision": 0.7772151898734178, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.3268, | |
| "eval_samples_per_second": 572.194, | |
| "eval_steps_per_second": 9.18, | |
| "step": 6042 | |
| }, | |
| { | |
| "epoch": 58.0, | |
| "grad_norm": 0.6386439800262451, | |
| "learning_rate": 2.1e-05, | |
| "loss": 0.0494, | |
| "step": 6148 | |
| }, | |
| { | |
| "epoch": 58.0, | |
| "eval_LOCATION_f1": 0.8101265822784809, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7529411764705882, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7391304347826088, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6986301369863014, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15255826711654663, | |
| "eval_overall_accuracy": 0.9603741078021166, | |
| "eval_overall_f1": 0.8181818181818181, | |
| "eval_overall_precision": 0.7707808564231738, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.3324, | |
| "eval_samples_per_second": 562.613, | |
| "eval_steps_per_second": 9.026, | |
| "step": 6148 | |
| }, | |
| { | |
| "epoch": 59.0, | |
| "grad_norm": 19.432247161865234, | |
| "learning_rate": 2.05e-05, | |
| "loss": 0.0478, | |
| "step": 6254 | |
| }, | |
| { | |
| "epoch": 59.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7432432432432433, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6626506024096386, | |
| "eval_ORGANIZATION_recall": 0.8461538461538461, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.6956521739130435, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1611391305923462, | |
| "eval_overall_accuracy": 0.9586512429239479, | |
| "eval_overall_f1": 0.8190224570673711, | |
| "eval_overall_precision": 0.7635467980295566, | |
| "eval_overall_recall": 0.8831908831908832, | |
| "eval_runtime": 0.3315, | |
| "eval_samples_per_second": 564.041, | |
| "eval_steps_per_second": 9.049, | |
| "step": 6254 | |
| }, | |
| { | |
| "epoch": 60.0, | |
| "grad_norm": 2.1011621952056885, | |
| "learning_rate": 2e-05, | |
| "loss": 0.0471, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 60.0, | |
| "eval_LOCATION_f1": 0.8311688311688312, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7901234567901234, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7092198581560285, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6578947368421053, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8169014084507041, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7837837837837838, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14900296926498413, | |
| "eval_overall_accuracy": 0.9613586020182131, | |
| "eval_overall_f1": 0.8214765100671142, | |
| "eval_overall_precision": 0.7766497461928934, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.3328, | |
| "eval_samples_per_second": 561.901, | |
| "eval_steps_per_second": 9.014, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 61.0, | |
| "grad_norm": 1.5730093717575073, | |
| "learning_rate": 1.9500000000000003e-05, | |
| "loss": 0.0457, | |
| "step": 6466 | |
| }, | |
| { | |
| "epoch": 61.0, | |
| "eval_LOCATION_f1": 0.8366013071895425, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.75, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6835443037974683, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7301587301587301, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6764705882352942, | |
| "eval_QUANTITY_recall": 0.7931034482758621, | |
| "eval_TIME_f1": 0.8285714285714286, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.8055555555555556, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14521339535713196, | |
| "eval_overall_accuracy": 0.9623430962343096, | |
| "eval_overall_f1": 0.82907133243607, | |
| "eval_overall_precision": 0.7857142857142857, | |
| "eval_overall_recall": 0.8774928774928775, | |
| "eval_runtime": 0.3329, | |
| "eval_samples_per_second": 561.784, | |
| "eval_steps_per_second": 9.013, | |
| "step": 6466 | |
| }, | |
| { | |
| "epoch": 62.0, | |
| "grad_norm": 0.7596818208694458, | |
| "learning_rate": 1.9e-05, | |
| "loss": 0.0453, | |
| "step": 6572 | |
| }, | |
| { | |
| "epoch": 62.0, | |
| "eval_LOCATION_f1": 0.8129032258064516, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7682926829268293, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7234042553191491, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6710526315789473, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7575757575757576, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6756756756756757, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1535465270280838, | |
| "eval_overall_accuracy": 0.9608663549101649, | |
| "eval_overall_f1": 0.8203753351206434, | |
| "eval_overall_precision": 0.7746835443037975, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.3263, | |
| "eval_samples_per_second": 573.007, | |
| "eval_steps_per_second": 9.193, | |
| "step": 6572 | |
| }, | |
| { | |
| "epoch": 63.0, | |
| "grad_norm": 3.6123743057250977, | |
| "learning_rate": 1.85e-05, | |
| "loss": 0.0439, | |
| "step": 6678 | |
| }, | |
| { | |
| "epoch": 63.0, | |
| "eval_LOCATION_f1": 0.8129032258064516, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7682926829268293, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7297297297297298, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6506024096385542, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15502122044563293, | |
| "eval_overall_accuracy": 0.9596357371400444, | |
| "eval_overall_f1": 0.8218085106382977, | |
| "eval_overall_precision": 0.770573566084788, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.3317, | |
| "eval_samples_per_second": 563.702, | |
| "eval_steps_per_second": 9.043, | |
| "step": 6678 | |
| }, | |
| { | |
| "epoch": 64.0, | |
| "grad_norm": 0.6118897199630737, | |
| "learning_rate": 1.8e-05, | |
| "loss": 0.0467, | |
| "step": 6784 | |
| }, | |
| { | |
| "epoch": 64.0, | |
| "eval_LOCATION_f1": 0.8289473684210525, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7974683544303798, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.6814814814814816, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6571428571428571, | |
| "eval_ORGANIZATION_recall": 0.7076923076923077, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7419354838709677, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.696969696969697, | |
| "eval_QUANTITY_recall": 0.7931034482758621, | |
| "eval_TIME_f1": 0.8169014084507041, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7837837837837838, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.14392048120498657, | |
| "eval_overall_accuracy": 0.9613586020182131, | |
| "eval_overall_f1": 0.8169398907103825, | |
| "eval_overall_precision": 0.7847769028871391, | |
| "eval_overall_recall": 0.8518518518518519, | |
| "eval_runtime": 0.3318, | |
| "eval_samples_per_second": 563.555, | |
| "eval_steps_per_second": 9.041, | |
| "step": 6784 | |
| }, | |
| { | |
| "epoch": 65.0, | |
| "grad_norm": 1.4808624982833862, | |
| "learning_rate": 1.75e-05, | |
| "loss": 0.0422, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 65.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7448275862068966, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.675, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.6956521739130435, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.160318523645401, | |
| "eval_overall_accuracy": 0.9591434900319961, | |
| "eval_overall_f1": 0.8185430463576159, | |
| "eval_overall_precision": 0.7648514851485149, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.332, | |
| "eval_samples_per_second": 563.291, | |
| "eval_steps_per_second": 9.037, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 66.0, | |
| "grad_norm": 1.028084397315979, | |
| "learning_rate": 1.7000000000000003e-05, | |
| "loss": 0.0423, | |
| "step": 6996 | |
| }, | |
| { | |
| "epoch": 66.0, | |
| "eval_LOCATION_f1": 0.8152866242038217, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7619047619047619, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.75, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6835443037974683, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7575757575757576, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6756756756756757, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1588248461484909, | |
| "eval_overall_accuracy": 0.9593896135860202, | |
| "eval_overall_f1": 0.824468085106383, | |
| "eval_overall_precision": 0.773067331670823, | |
| "eval_overall_recall": 0.8831908831908832, | |
| "eval_runtime": 0.3263, | |
| "eval_samples_per_second": 573.167, | |
| "eval_steps_per_second": 9.195, | |
| "step": 6996 | |
| }, | |
| { | |
| "epoch": 67.0, | |
| "grad_norm": 1.2602914571762085, | |
| "learning_rate": 1.65e-05, | |
| "loss": 0.0422, | |
| "step": 7102 | |
| }, | |
| { | |
| "epoch": 67.0, | |
| "eval_LOCATION_f1": 0.8441558441558442, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.8024691358024691, | |
| "eval_LOCATION_recall": 0.8904109589041096, | |
| "eval_ORGANIZATION_f1": 0.7346938775510204, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6585365853658537, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8169014084507041, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7837837837837838, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15185856819152832, | |
| "eval_overall_accuracy": 0.9623430962343096, | |
| "eval_overall_f1": 0.8282290279627165, | |
| "eval_overall_precision": 0.7775, | |
| "eval_overall_recall": 0.886039886039886, | |
| "eval_runtime": 0.3269, | |
| "eval_samples_per_second": 572.038, | |
| "eval_steps_per_second": 9.177, | |
| "step": 7102 | |
| }, | |
| { | |
| "epoch": 68.0, | |
| "grad_norm": 0.7608669996261597, | |
| "learning_rate": 1.6000000000000003e-05, | |
| "loss": 0.0416, | |
| "step": 7208 | |
| }, | |
| { | |
| "epoch": 68.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7448275862068966, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.675, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6410256410256411, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15464389324188232, | |
| "eval_overall_accuracy": 0.9616047255722373, | |
| "eval_overall_f1": 0.824468085106383, | |
| "eval_overall_precision": 0.773067331670823, | |
| "eval_overall_recall": 0.8831908831908832, | |
| "eval_runtime": 0.332, | |
| "eval_samples_per_second": 563.246, | |
| "eval_steps_per_second": 9.036, | |
| "step": 7208 | |
| }, | |
| { | |
| "epoch": 69.0, | |
| "grad_norm": 1.0217771530151367, | |
| "learning_rate": 1.55e-05, | |
| "loss": 0.0403, | |
| "step": 7314 | |
| }, | |
| { | |
| "epoch": 69.0, | |
| "eval_LOCATION_f1": 0.8235294117647058, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7875, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7448275862068966, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.675, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.75, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6857142857142857, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1511322259902954, | |
| "eval_overall_accuracy": 0.9618508491262614, | |
| "eval_overall_f1": 0.824631860776439, | |
| "eval_overall_precision": 0.7777777777777778, | |
| "eval_overall_recall": 0.8774928774928775, | |
| "eval_runtime": 0.3329, | |
| "eval_samples_per_second": 561.81, | |
| "eval_steps_per_second": 9.013, | |
| "step": 7314 | |
| }, | |
| { | |
| "epoch": 70.0, | |
| "grad_norm": 1.7045354843139648, | |
| "learning_rate": 1.5e-05, | |
| "loss": 0.0411, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 70.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7346938775510204, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6585365853658537, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15936115384101868, | |
| "eval_overall_accuracy": 0.9598818606940684, | |
| "eval_overall_f1": 0.8222811671087533, | |
| "eval_overall_precision": 0.7692307692307693, | |
| "eval_overall_recall": 0.8831908831908832, | |
| "eval_runtime": 0.3338, | |
| "eval_samples_per_second": 560.176, | |
| "eval_steps_per_second": 8.987, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 71.0, | |
| "grad_norm": 1.8637417554855347, | |
| "learning_rate": 1.45e-05, | |
| "loss": 0.0391, | |
| "step": 7526 | |
| }, | |
| { | |
| "epoch": 71.0, | |
| "eval_LOCATION_f1": 0.8152866242038217, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7619047619047619, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7225806451612903, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6222222222222222, | |
| "eval_ORGANIZATION_recall": 0.8615384615384616, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6410256410256411, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.17168858647346497, | |
| "eval_overall_accuracy": 0.9561900073837066, | |
| "eval_overall_f1": 0.8156862745098039, | |
| "eval_overall_precision": 0.7536231884057971, | |
| "eval_overall_recall": 0.8888888888888888, | |
| "eval_runtime": 0.332, | |
| "eval_samples_per_second": 563.182, | |
| "eval_steps_per_second": 9.035, | |
| "step": 7526 | |
| }, | |
| { | |
| "epoch": 72.0, | |
| "grad_norm": 1.0552111864089966, | |
| "learning_rate": 1.4000000000000001e-05, | |
| "loss": 0.0393, | |
| "step": 7632 | |
| }, | |
| { | |
| "epoch": 72.0, | |
| "eval_LOCATION_f1": 0.8101265822784809, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7529411764705882, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7397260273972603, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8789808917197452, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8414634146341463, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16536851227283478, | |
| "eval_overall_accuracy": 0.9584051193699237, | |
| "eval_overall_f1": 0.8190224570673711, | |
| "eval_overall_precision": 0.7635467980295566, | |
| "eval_overall_recall": 0.8831908831908832, | |
| "eval_runtime": 0.3264, | |
| "eval_samples_per_second": 572.834, | |
| "eval_steps_per_second": 9.19, | |
| "step": 7632 | |
| }, | |
| { | |
| "epoch": 73.0, | |
| "grad_norm": 0.6572228670120239, | |
| "learning_rate": 1.3500000000000001e-05, | |
| "loss": 0.0411, | |
| "step": 7738 | |
| }, | |
| { | |
| "epoch": 73.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7323943661971831, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6753246753246753, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15696407854557037, | |
| "eval_overall_accuracy": 0.9608663549101649, | |
| "eval_overall_f1": 0.822429906542056, | |
| "eval_overall_precision": 0.7738693467336684, | |
| "eval_overall_recall": 0.8774928774928775, | |
| "eval_runtime": 0.3332, | |
| "eval_samples_per_second": 561.214, | |
| "eval_steps_per_second": 9.003, | |
| "step": 7738 | |
| }, | |
| { | |
| "epoch": 74.0, | |
| "grad_norm": 0.9044064283370972, | |
| "learning_rate": 1.3000000000000001e-05, | |
| "loss": 0.0408, | |
| "step": 7844 | |
| }, | |
| { | |
| "epoch": 74.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7323943661971831, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6753246753246753, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8853503184713376, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8475609756097561, | |
| "eval_PERSON_recall": 0.9266666666666666, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8169014084507041, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7837837837837838, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1582627296447754, | |
| "eval_overall_accuracy": 0.9613586020182131, | |
| "eval_overall_f1": 0.824, | |
| "eval_overall_precision": 0.7744360902255639, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.3319, | |
| "eval_samples_per_second": 563.385, | |
| "eval_steps_per_second": 9.038, | |
| "step": 7844 | |
| }, | |
| { | |
| "epoch": 75.0, | |
| "grad_norm": 0.5799534916877747, | |
| "learning_rate": 1.25e-05, | |
| "loss": 0.0389, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 75.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7310344827586207, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6625, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6153846153846154, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16305667161941528, | |
| "eval_overall_accuracy": 0.9591434900319961, | |
| "eval_overall_f1": 0.8180610889774236, | |
| "eval_overall_precision": 0.7661691542288557, | |
| "eval_overall_recall": 0.8774928774928775, | |
| "eval_runtime": 0.3349, | |
| "eval_samples_per_second": 558.344, | |
| "eval_steps_per_second": 8.957, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 76.0, | |
| "grad_norm": 1.983021855354309, | |
| "learning_rate": 1.2e-05, | |
| "loss": 0.0377, | |
| "step": 8056 | |
| }, | |
| { | |
| "epoch": 76.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7346938775510204, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6585365853658537, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.15857818722724915, | |
| "eval_overall_accuracy": 0.9613586020182131, | |
| "eval_overall_f1": 0.8207171314741036, | |
| "eval_overall_precision": 0.7686567164179104, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.3261, | |
| "eval_samples_per_second": 573.446, | |
| "eval_steps_per_second": 9.2, | |
| "step": 8056 | |
| }, | |
| { | |
| "epoch": 77.0, | |
| "grad_norm": 1.1891909837722778, | |
| "learning_rate": 1.1500000000000002e-05, | |
| "loss": 0.0404, | |
| "step": 8162 | |
| }, | |
| { | |
| "epoch": 77.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7346938775510204, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6585365853658537, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7272727272727273, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6486486486486487, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16166049242019653, | |
| "eval_overall_accuracy": 0.9601279842480925, | |
| "eval_overall_f1": 0.8207171314741036, | |
| "eval_overall_precision": 0.7686567164179104, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.3315, | |
| "eval_samples_per_second": 564.102, | |
| "eval_steps_per_second": 9.05, | |
| "step": 8162 | |
| }, | |
| { | |
| "epoch": 78.0, | |
| "grad_norm": 0.46722444891929626, | |
| "learning_rate": 1.1000000000000001e-05, | |
| "loss": 0.0388, | |
| "step": 8268 | |
| }, | |
| { | |
| "epoch": 78.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7310344827586207, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6625, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8169014084507041, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7837837837837838, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16035309433937073, | |
| "eval_overall_accuracy": 0.9618508491262614, | |
| "eval_overall_f1": 0.823529411764706, | |
| "eval_overall_precision": 0.7758186397984886, | |
| "eval_overall_recall": 0.8774928774928775, | |
| "eval_runtime": 0.3324, | |
| "eval_samples_per_second": 562.645, | |
| "eval_steps_per_second": 9.026, | |
| "step": 8268 | |
| }, | |
| { | |
| "epoch": 79.0, | |
| "grad_norm": 0.8686147332191467, | |
| "learning_rate": 1.05e-05, | |
| "loss": 0.0383, | |
| "step": 8374 | |
| }, | |
| { | |
| "epoch": 79.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7183098591549296, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6623376623376623, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16000543534755707, | |
| "eval_overall_accuracy": 0.961112478464189, | |
| "eval_overall_f1": 0.8192771084337349, | |
| "eval_overall_precision": 0.7727272727272727, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.3327, | |
| "eval_samples_per_second": 561.998, | |
| "eval_steps_per_second": 9.016, | |
| "step": 8374 | |
| }, | |
| { | |
| "epoch": 80.0, | |
| "grad_norm": 0.674788773059845, | |
| "learning_rate": 1e-05, | |
| "loss": 0.0382, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 80.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7297297297297298, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6506024096385542, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.696969696969697, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6216216216216216, | |
| "eval_QUANTITY_recall": 0.7931034482758621, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16522908210754395, | |
| "eval_overall_accuracy": 0.9596357371400444, | |
| "eval_overall_f1": 0.8169761273209548, | |
| "eval_overall_precision": 0.7642679900744417, | |
| "eval_overall_recall": 0.8774928774928775, | |
| "eval_runtime": 0.3342, | |
| "eval_samples_per_second": 559.61, | |
| "eval_steps_per_second": 8.978, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 81.0, | |
| "grad_norm": 1.6788341999053955, | |
| "learning_rate": 9.5e-06, | |
| "loss": 0.0378, | |
| "step": 8586 | |
| }, | |
| { | |
| "epoch": 81.0, | |
| "eval_LOCATION_f1": 0.8101265822784809, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7529411764705882, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7297297297297298, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6506024096385542, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8846153846153846, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6153846153846154, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.17060095071792603, | |
| "eval_overall_accuracy": 0.9591434900319961, | |
| "eval_overall_f1": 0.8153034300791556, | |
| "eval_overall_precision": 0.7592137592137592, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.3359, | |
| "eval_samples_per_second": 556.794, | |
| "eval_steps_per_second": 8.933, | |
| "step": 8586 | |
| }, | |
| { | |
| "epoch": 82.0, | |
| "grad_norm": 0.7395833730697632, | |
| "learning_rate": 9e-06, | |
| "loss": 0.039, | |
| "step": 8692 | |
| }, | |
| { | |
| "epoch": 82.0, | |
| "eval_LOCATION_f1": 0.8101265822784809, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7529411764705882, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7448275862068966, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.675, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7272727272727273, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6486486486486487, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16823621094226837, | |
| "eval_overall_accuracy": 0.9598818606940684, | |
| "eval_overall_f1": 0.8196286472148541, | |
| "eval_overall_precision": 0.7667493796526055, | |
| "eval_overall_recall": 0.8803418803418803, | |
| "eval_runtime": 0.3356, | |
| "eval_samples_per_second": 557.222, | |
| "eval_steps_per_second": 8.939, | |
| "step": 8692 | |
| }, | |
| { | |
| "epoch": 83.0, | |
| "grad_norm": 0.7045236229896545, | |
| "learning_rate": 8.500000000000002e-06, | |
| "loss": 0.0372, | |
| "step": 8798 | |
| }, | |
| { | |
| "epoch": 83.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.6944444444444444, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6329113924050633, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8726114649681529, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9133333333333333, | |
| "eval_QUANTITY_f1": 0.7272727272727273, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6486486486486487, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16675511002540588, | |
| "eval_overall_accuracy": 0.958897366477972, | |
| "eval_overall_f1": 0.8095872170439414, | |
| "eval_overall_precision": 0.76, | |
| "eval_overall_recall": 0.8660968660968661, | |
| "eval_runtime": 0.3326, | |
| "eval_samples_per_second": 562.306, | |
| "eval_steps_per_second": 9.021, | |
| "step": 8798 | |
| }, | |
| { | |
| "epoch": 84.0, | |
| "grad_norm": 2.7517426013946533, | |
| "learning_rate": 8.000000000000001e-06, | |
| "loss": 0.0368, | |
| "step": 8904 | |
| }, | |
| { | |
| "epoch": 84.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7346938775510204, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6585365853658537, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1667993813753128, | |
| "eval_overall_accuracy": 0.9598818606940684, | |
| "eval_overall_f1": 0.8211920529801325, | |
| "eval_overall_precision": 0.7673267326732673, | |
| "eval_overall_recall": 0.8831908831908832, | |
| "eval_runtime": 0.3328, | |
| "eval_samples_per_second": 561.958, | |
| "eval_steps_per_second": 9.015, | |
| "step": 8904 | |
| }, | |
| { | |
| "epoch": 85.0, | |
| "grad_norm": 2.215299606323242, | |
| "learning_rate": 7.5e-06, | |
| "loss": 0.0374, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 85.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7194244604316546, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6756756756756757, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16433657705783844, | |
| "eval_overall_accuracy": 0.9606202313561408, | |
| "eval_overall_f1": 0.8176943699731903, | |
| "eval_overall_precision": 0.7721518987341772, | |
| "eval_overall_recall": 0.8689458689458689, | |
| "eval_runtime": 0.3273, | |
| "eval_samples_per_second": 571.286, | |
| "eval_steps_per_second": 9.165, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 86.0, | |
| "grad_norm": 0.40606042742729187, | |
| "learning_rate": 7.000000000000001e-06, | |
| "loss": 0.0369, | |
| "step": 9116 | |
| }, | |
| { | |
| "epoch": 86.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7083333333333334, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6455696202531646, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6410256410256411, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1689991056919098, | |
| "eval_overall_accuracy": 0.9584051193699237, | |
| "eval_overall_f1": 0.8154050464807436, | |
| "eval_overall_precision": 0.763681592039801, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.3328, | |
| "eval_samples_per_second": 561.979, | |
| "eval_steps_per_second": 9.016, | |
| "step": 9116 | |
| }, | |
| { | |
| "epoch": 87.0, | |
| "grad_norm": 1.3081475496292114, | |
| "learning_rate": 6.5000000000000004e-06, | |
| "loss": 0.036, | |
| "step": 9222 | |
| }, | |
| { | |
| "epoch": 87.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7132867132867133, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6538461538461539, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7272727272727273, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6486486486486487, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16559894382953644, | |
| "eval_overall_accuracy": 0.9596357371400444, | |
| "eval_overall_f1": 0.8170894526034712, | |
| "eval_overall_precision": 0.7688442211055276, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.3315, | |
| "eval_samples_per_second": 564.057, | |
| "eval_steps_per_second": 9.049, | |
| "step": 9222 | |
| }, | |
| { | |
| "epoch": 88.0, | |
| "grad_norm": 0.7401718497276306, | |
| "learning_rate": 6e-06, | |
| "loss": 0.037, | |
| "step": 9328 | |
| }, | |
| { | |
| "epoch": 88.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7132867132867133, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6538461538461539, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7272727272727273, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6486486486486487, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16509054601192474, | |
| "eval_overall_accuracy": 0.9603741078021166, | |
| "eval_overall_f1": 0.8170894526034712, | |
| "eval_overall_precision": 0.7688442211055276, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.3322, | |
| "eval_samples_per_second": 562.977, | |
| "eval_steps_per_second": 9.032, | |
| "step": 9328 | |
| }, | |
| { | |
| "epoch": 89.0, | |
| "grad_norm": 0.570732057094574, | |
| "learning_rate": 5.500000000000001e-06, | |
| "loss": 0.0373, | |
| "step": 9434 | |
| }, | |
| { | |
| "epoch": 89.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7172413793103448, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.65, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16918015480041504, | |
| "eval_overall_accuracy": 0.9593896135860202, | |
| "eval_overall_f1": 0.8164893617021275, | |
| "eval_overall_precision": 0.7655860349127181, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.3273, | |
| "eval_samples_per_second": 571.287, | |
| "eval_steps_per_second": 9.165, | |
| "step": 9434 | |
| }, | |
| { | |
| "epoch": 90.0, | |
| "grad_norm": 1.0674538612365723, | |
| "learning_rate": 5e-06, | |
| "loss": 0.0357, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 90.0, | |
| "eval_LOCATION_f1": 0.8258064516129032, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7092198581560285, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6578947368421053, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16437728703022003, | |
| "eval_overall_accuracy": 0.9603741078021166, | |
| "eval_overall_f1": 0.8155080213903743, | |
| "eval_overall_precision": 0.7682619647355163, | |
| "eval_overall_recall": 0.8689458689458689, | |
| "eval_runtime": 0.327, | |
| "eval_samples_per_second": 571.778, | |
| "eval_steps_per_second": 9.173, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 91.0, | |
| "grad_norm": 0.779975414276123, | |
| "learning_rate": 4.5e-06, | |
| "loss": 0.0365, | |
| "step": 9646 | |
| }, | |
| { | |
| "epoch": 91.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7346938775510204, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6585365853658537, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1706375926733017, | |
| "eval_overall_accuracy": 0.9596357371400444, | |
| "eval_overall_f1": 0.8211920529801325, | |
| "eval_overall_precision": 0.7673267326732673, | |
| "eval_overall_recall": 0.8831908831908832, | |
| "eval_runtime": 0.3328, | |
| "eval_samples_per_second": 561.858, | |
| "eval_steps_per_second": 9.014, | |
| "step": 9646 | |
| }, | |
| { | |
| "epoch": 92.0, | |
| "grad_norm": 1.6607707738876343, | |
| "learning_rate": 4.000000000000001e-06, | |
| "loss": 0.0358, | |
| "step": 9752 | |
| }, | |
| { | |
| "epoch": 92.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7210884353741497, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6463414634146342, | |
| "eval_ORGANIZATION_recall": 0.8153846153846154, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16552191972732544, | |
| "eval_overall_accuracy": 0.9606202313561408, | |
| "eval_overall_f1": 0.8158940397350993, | |
| "eval_overall_precision": 0.7623762376237624, | |
| "eval_overall_recall": 0.8774928774928775, | |
| "eval_runtime": 0.3345, | |
| "eval_samples_per_second": 559.095, | |
| "eval_steps_per_second": 8.969, | |
| "step": 9752 | |
| }, | |
| { | |
| "epoch": 93.0, | |
| "grad_norm": 0.364473819732666, | |
| "learning_rate": 3.5000000000000004e-06, | |
| "loss": 0.0367, | |
| "step": 9858 | |
| }, | |
| { | |
| "epoch": 93.0, | |
| "eval_LOCATION_f1": 0.8152866242038217, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7619047619047619, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7272727272727272, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16641728579998016, | |
| "eval_overall_accuracy": 0.9593896135860202, | |
| "eval_overall_f1": 0.8164893617021275, | |
| "eval_overall_precision": 0.7655860349127181, | |
| "eval_overall_recall": 0.8746438746438746, | |
| "eval_runtime": 0.3264, | |
| "eval_samples_per_second": 572.903, | |
| "eval_steps_per_second": 9.191, | |
| "step": 9858 | |
| }, | |
| { | |
| "epoch": 94.0, | |
| "grad_norm": 1.1335537433624268, | |
| "learning_rate": 3e-06, | |
| "loss": 0.0367, | |
| "step": 9964 | |
| }, | |
| { | |
| "epoch": 94.0, | |
| "eval_LOCATION_f1": 0.8076923076923077, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7590361445783133, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7123287671232877, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6419753086419753, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16745708882808685, | |
| "eval_overall_accuracy": 0.958897366477972, | |
| "eval_overall_f1": 0.8116710875331565, | |
| "eval_overall_precision": 0.7593052109181141, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.3331, | |
| "eval_samples_per_second": 561.459, | |
| "eval_steps_per_second": 9.007, | |
| "step": 9964 | |
| }, | |
| { | |
| "epoch": 95.0, | |
| "grad_norm": 2.660787582397461, | |
| "learning_rate": 2.5e-06, | |
| "loss": 0.0358, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 95.0, | |
| "eval_LOCATION_f1": 0.8076923076923077, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7590361445783133, | |
| "eval_LOCATION_recall": 0.863013698630137, | |
| "eval_ORGANIZATION_f1": 0.7346938775510204, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6585365853658537, | |
| "eval_ORGANIZATION_recall": 0.8307692307692308, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6153846153846154, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.17253383994102478, | |
| "eval_overall_accuracy": 0.9591434900319961, | |
| "eval_overall_f1": 0.8148148148148149, | |
| "eval_overall_precision": 0.7604938271604939, | |
| "eval_overall_recall": 0.8774928774928775, | |
| "eval_runtime": 0.3324, | |
| "eval_samples_per_second": 562.55, | |
| "eval_steps_per_second": 9.025, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 96.0, | |
| "grad_norm": 1.2606465816497803, | |
| "learning_rate": 2.0000000000000003e-06, | |
| "loss": 0.0374, | |
| "step": 10176 | |
| }, | |
| { | |
| "epoch": 96.0, | |
| "eval_LOCATION_f1": 0.8152866242038217, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7619047619047619, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7123287671232877, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6419753086419753, | |
| "eval_ORGANIZATION_recall": 0.8, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8620689655172413, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1706884801387787, | |
| "eval_overall_accuracy": 0.9593896135860202, | |
| "eval_overall_f1": 0.8158940397350993, | |
| "eval_overall_precision": 0.7623762376237624, | |
| "eval_overall_recall": 0.8774928774928775, | |
| "eval_runtime": 0.3336, | |
| "eval_samples_per_second": 560.539, | |
| "eval_steps_per_second": 8.993, | |
| "step": 10176 | |
| }, | |
| { | |
| "epoch": 97.0, | |
| "grad_norm": 2.224013090133667, | |
| "learning_rate": 1.5e-06, | |
| "loss": 0.0342, | |
| "step": 10282 | |
| }, | |
| { | |
| "epoch": 97.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7132867132867133, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6538461538461539, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16819004714488983, | |
| "eval_overall_accuracy": 0.9593896135860202, | |
| "eval_overall_f1": 0.8149134487350199, | |
| "eval_overall_precision": 0.765, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.3327, | |
| "eval_samples_per_second": 562.071, | |
| "eval_steps_per_second": 9.017, | |
| "step": 10282 | |
| }, | |
| { | |
| "epoch": 98.0, | |
| "grad_norm": 1.7407749891281128, | |
| "learning_rate": 1.0000000000000002e-06, | |
| "loss": 0.0351, | |
| "step": 10388 | |
| }, | |
| { | |
| "epoch": 98.0, | |
| "eval_LOCATION_f1": 0.8205128205128205, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7710843373493976, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.7234042553191491, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6710526315789473, | |
| "eval_ORGANIZATION_recall": 0.7846153846153846, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16785794496536255, | |
| "eval_overall_accuracy": 0.9593896135860202, | |
| "eval_overall_f1": 0.8170894526034712, | |
| "eval_overall_precision": 0.7688442211055276, | |
| "eval_overall_recall": 0.8717948717948718, | |
| "eval_runtime": 0.333, | |
| "eval_samples_per_second": 561.612, | |
| "eval_steps_per_second": 9.01, | |
| "step": 10388 | |
| }, | |
| { | |
| "epoch": 99.0, | |
| "grad_norm": 0.9356883764266968, | |
| "learning_rate": 5.000000000000001e-07, | |
| "loss": 0.036, | |
| "step": 10494 | |
| }, | |
| { | |
| "epoch": 99.0, | |
| "eval_LOCATION_f1": 0.8152866242038217, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7619047619047619, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.6993006993006994, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6410256410256411, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.1689637303352356, | |
| "eval_overall_accuracy": 0.9586512429239479, | |
| "eval_overall_f1": 0.8111702127659575, | |
| "eval_overall_precision": 0.7605985037406484, | |
| "eval_overall_recall": 0.8689458689458689, | |
| "eval_runtime": 0.3253, | |
| "eval_samples_per_second": 574.83, | |
| "eval_steps_per_second": 9.222, | |
| "step": 10494 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "grad_norm": 0.6478390693664551, | |
| "learning_rate": 0.0, | |
| "loss": 0.0368, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "eval_LOCATION_f1": 0.8152866242038217, | |
| "eval_LOCATION_number": 73, | |
| "eval_LOCATION_precision": 0.7619047619047619, | |
| "eval_LOCATION_recall": 0.8767123287671232, | |
| "eval_ORGANIZATION_f1": 0.6993006993006994, | |
| "eval_ORGANIZATION_number": 65, | |
| "eval_ORGANIZATION_precision": 0.6410256410256411, | |
| "eval_ORGANIZATION_recall": 0.7692307692307693, | |
| "eval_PERSON_f1": 0.8817891373801918, | |
| "eval_PERSON_number": 150, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.92, | |
| "eval_QUANTITY_f1": 0.716417910447761, | |
| "eval_QUANTITY_number": 29, | |
| "eval_QUANTITY_precision": 0.631578947368421, | |
| "eval_QUANTITY_recall": 0.8275862068965517, | |
| "eval_TIME_f1": 0.8055555555555555, | |
| "eval_TIME_number": 34, | |
| "eval_TIME_precision": 0.7631578947368421, | |
| "eval_TIME_recall": 0.8529411764705882, | |
| "eval_loss": 0.16865810751914978, | |
| "eval_overall_accuracy": 0.9586512429239479, | |
| "eval_overall_f1": 0.8111702127659575, | |
| "eval_overall_precision": 0.7605985037406484, | |
| "eval_overall_recall": 0.8689458689458689, | |
| "eval_runtime": 0.3331, | |
| "eval_samples_per_second": 561.343, | |
| "eval_steps_per_second": 9.006, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "step": 10600, | |
| "total_flos": 4567780799240064.0, | |
| "train_loss": 0.08414012978661735, | |
| "train_runtime": 604.7606, | |
| "train_samples_per_second": 279.119, | |
| "train_steps_per_second": 17.528 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 10600, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 100, | |
| "save_steps": 500, | |
| "total_flos": 4567780799240064.0, | |
| "train_batch_size": 16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |