| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 100.0, | |
| "eval_steps": 500, | |
| "global_step": 10600, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "grad_norm": 1.1115612983703613, | |
| "learning_rate": 4.9500000000000004e-05, | |
| "loss": 0.9255, | |
| "step": 106 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_LOCATION_f1": 0.0, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.0, | |
| "eval_LOCATION_recall": 0.0, | |
| "eval_ORGANIZATION_f1": 0.0, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.0, | |
| "eval_ORGANIZATION_recall": 0.0, | |
| "eval_PERSON_f1": 0.012820512820512818, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.25, | |
| "eval_PERSON_recall": 0.006578947368421052, | |
| "eval_QUANTITY_f1": 0.0, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.0, | |
| "eval_QUANTITY_recall": 0.0, | |
| "eval_TIME_f1": 0.0, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.0, | |
| "eval_TIME_recall": 0.0, | |
| "eval_loss": 0.6139789819717407, | |
| "eval_overall_accuracy": 0.8402048655569783, | |
| "eval_overall_f1": 0.005847953216374269, | |
| "eval_overall_precision": 0.25, | |
| "eval_overall_recall": 0.0029585798816568047, | |
| "eval_runtime": 0.288, | |
| "eval_samples_per_second": 649.255, | |
| "eval_steps_per_second": 10.416, | |
| "step": 106 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "grad_norm": 1.1083379983901978, | |
| "learning_rate": 4.9e-05, | |
| "loss": 0.5503, | |
| "step": 212 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_LOCATION_f1": 0.09523809523809525, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.26666666666666666, | |
| "eval_LOCATION_recall": 0.057971014492753624, | |
| "eval_ORGANIZATION_f1": 0.0, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.0, | |
| "eval_ORGANIZATION_recall": 0.0, | |
| "eval_PERSON_f1": 0.5272727272727272, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.4887640449438202, | |
| "eval_PERSON_recall": 0.5723684210526315, | |
| "eval_QUANTITY_f1": 0.0, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.0, | |
| "eval_QUANTITY_recall": 0.0, | |
| "eval_TIME_f1": 0.4, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.5625, | |
| "eval_TIME_recall": 0.3103448275862069, | |
| "eval_loss": 0.3994744122028351, | |
| "eval_overall_accuracy": 0.8855313700384123, | |
| "eval_overall_f1": 0.35714285714285715, | |
| "eval_overall_precision": 0.45045045045045046, | |
| "eval_overall_recall": 0.2958579881656805, | |
| "eval_runtime": 0.2908, | |
| "eval_samples_per_second": 642.974, | |
| "eval_steps_per_second": 10.315, | |
| "step": 212 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "grad_norm": 1.8157479763031006, | |
| "learning_rate": 4.85e-05, | |
| "loss": 0.3808, | |
| "step": 318 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_LOCATION_f1": 0.5454545454545455, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.49411764705882355, | |
| "eval_LOCATION_recall": 0.6086956521739131, | |
| "eval_ORGANIZATION_f1": 0.2978723404255319, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.3888888888888889, | |
| "eval_ORGANIZATION_recall": 0.2413793103448276, | |
| "eval_PERSON_f1": 0.735632183908046, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.6530612244897959, | |
| "eval_PERSON_recall": 0.8421052631578947, | |
| "eval_QUANTITY_f1": 0.28571428571428564, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.2727272727272727, | |
| "eval_QUANTITY_recall": 0.3, | |
| "eval_TIME_f1": 0.6785714285714286, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7037037037037037, | |
| "eval_TIME_recall": 0.6551724137931034, | |
| "eval_loss": 0.28895071148872375, | |
| "eval_overall_accuracy": 0.9267605633802817, | |
| "eval_overall_f1": 0.5930069930069929, | |
| "eval_overall_precision": 0.5623342175066313, | |
| "eval_overall_recall": 0.6272189349112426, | |
| "eval_runtime": 0.2887, | |
| "eval_samples_per_second": 647.772, | |
| "eval_steps_per_second": 10.392, | |
| "step": 318 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "grad_norm": 1.4652637243270874, | |
| "learning_rate": 4.8e-05, | |
| "loss": 0.2833, | |
| "step": 424 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_LOCATION_f1": 0.6455696202531644, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.5730337078651685, | |
| "eval_LOCATION_recall": 0.7391304347826086, | |
| "eval_ORGANIZATION_f1": 0.4642857142857143, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.48148148148148145, | |
| "eval_ORGANIZATION_recall": 0.4482758620689655, | |
| "eval_PERSON_f1": 0.7904191616766467, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.7252747252747253, | |
| "eval_PERSON_recall": 0.868421052631579, | |
| "eval_QUANTITY_f1": 0.47058823529411764, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.42105263157894735, | |
| "eval_QUANTITY_recall": 0.5333333333333333, | |
| "eval_TIME_f1": 0.8275862068965517, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8275862068965517, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.21562312543392181, | |
| "eval_overall_accuracy": 0.9405889884763124, | |
| "eval_overall_f1": 0.6821917808219178, | |
| "eval_overall_precision": 0.6352040816326531, | |
| "eval_overall_recall": 0.7366863905325444, | |
| "eval_runtime": 0.2884, | |
| "eval_samples_per_second": 648.345, | |
| "eval_steps_per_second": 10.401, | |
| "step": 424 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "grad_norm": 1.5371237993240356, | |
| "learning_rate": 4.75e-05, | |
| "loss": 0.2213, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_LOCATION_f1": 0.725, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.6373626373626373, | |
| "eval_LOCATION_recall": 0.8405797101449275, | |
| "eval_ORGANIZATION_f1": 0.5263157894736843, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.5357142857142857, | |
| "eval_ORGANIZATION_recall": 0.5172413793103449, | |
| "eval_PERSON_f1": 0.8012048192771084, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.7388888888888889, | |
| "eval_PERSON_recall": 0.875, | |
| "eval_QUANTITY_f1": 0.5333333333333333, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.4444444444444444, | |
| "eval_QUANTITY_recall": 0.6666666666666666, | |
| "eval_TIME_f1": 0.8275862068965517, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8275862068965517, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.18281985819339752, | |
| "eval_overall_accuracy": 0.9434058898847631, | |
| "eval_overall_f1": 0.7171853856562923, | |
| "eval_overall_precision": 0.6608478802992519, | |
| "eval_overall_recall": 0.7840236686390533, | |
| "eval_runtime": 0.2945, | |
| "eval_samples_per_second": 634.984, | |
| "eval_steps_per_second": 10.187, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "grad_norm": 1.388359546661377, | |
| "learning_rate": 4.7e-05, | |
| "loss": 0.1845, | |
| "step": 636 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_LOCATION_f1": 0.7721518987341773, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.6853932584269663, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.5757575757575758, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.5135135135135135, | |
| "eval_ORGANIZATION_recall": 0.6551724137931034, | |
| "eval_PERSON_f1": 0.8192771084337349, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.7555555555555555, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.5714285714285715, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.5, | |
| "eval_QUANTITY_recall": 0.6666666666666666, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1697721779346466, | |
| "eval_overall_accuracy": 0.9467349551856594, | |
| "eval_overall_f1": 0.7446808510638298, | |
| "eval_overall_precision": 0.6763285024154589, | |
| "eval_overall_recall": 0.8284023668639053, | |
| "eval_runtime": 0.2919, | |
| "eval_samples_per_second": 640.647, | |
| "eval_steps_per_second": 10.278, | |
| "step": 636 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "grad_norm": 0.574262261390686, | |
| "learning_rate": 4.6500000000000005e-05, | |
| "loss": 0.17, | |
| "step": 742 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_LOCATION_f1": 0.8026315789473685, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7349397590361446, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.6016260162601627, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.5692307692307692, | |
| "eval_ORGANIZATION_recall": 0.6379310344827587, | |
| "eval_PERSON_f1": 0.8246153846153845, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.7745664739884393, | |
| "eval_PERSON_recall": 0.881578947368421, | |
| "eval_QUANTITY_f1": 0.7164179104477612, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6486486486486487, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.847457627118644, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1523420363664627, | |
| "eval_overall_accuracy": 0.9510883482714468, | |
| "eval_overall_f1": 0.7741046831955923, | |
| "eval_overall_precision": 0.7242268041237113, | |
| "eval_overall_recall": 0.8313609467455622, | |
| "eval_runtime": 0.292, | |
| "eval_samples_per_second": 640.421, | |
| "eval_steps_per_second": 10.274, | |
| "step": 742 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "grad_norm": 0.5678428411483765, | |
| "learning_rate": 4.600000000000001e-05, | |
| "loss": 0.1552, | |
| "step": 848 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_LOCATION_f1": 0.8266666666666668, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7654320987654321, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.5891472868217055, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.5352112676056338, | |
| "eval_ORGANIZATION_recall": 0.6551724137931034, | |
| "eval_PERSON_f1": 0.8307692307692307, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.7803468208092486, | |
| "eval_PERSON_recall": 0.8881578947368421, | |
| "eval_QUANTITY_f1": 0.7272727272727272, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8064516129032258, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7575757575757576, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.14812210202217102, | |
| "eval_overall_accuracy": 0.9518565941101153, | |
| "eval_overall_f1": 0.7759562841530055, | |
| "eval_overall_precision": 0.7208121827411168, | |
| "eval_overall_recall": 0.8402366863905325, | |
| "eval_runtime": 0.2864, | |
| "eval_samples_per_second": 652.864, | |
| "eval_steps_per_second": 10.474, | |
| "step": 848 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "grad_norm": 1.5933927297592163, | |
| "learning_rate": 4.55e-05, | |
| "loss": 0.1486, | |
| "step": 954 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_LOCATION_f1": 0.8299319727891156, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.782051282051282, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.5853658536585366, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.5538461538461539, | |
| "eval_ORGANIZATION_recall": 0.6206896551724138, | |
| "eval_PERSON_f1": 0.8427672955974843, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8072289156626506, | |
| "eval_PERSON_recall": 0.881578947368421, | |
| "eval_QUANTITY_f1": 0.7575757575757577, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8196721311475409, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.78125, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1388072818517685, | |
| "eval_overall_accuracy": 0.9544174135723431, | |
| "eval_overall_f1": 0.7860139860139861, | |
| "eval_overall_precision": 0.7453580901856764, | |
| "eval_overall_recall": 0.8313609467455622, | |
| "eval_runtime": 0.2922, | |
| "eval_samples_per_second": 640.03, | |
| "eval_steps_per_second": 10.268, | |
| "step": 954 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "grad_norm": 1.51088547706604, | |
| "learning_rate": 4.5e-05, | |
| "loss": 0.1369, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_LOCATION_f1": 0.8243243243243245, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7721518987341772, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.6141732283464567, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.5652173913043478, | |
| "eval_ORGANIZATION_recall": 0.6724137931034483, | |
| "eval_PERSON_f1": 0.8348909657320872, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.7928994082840237, | |
| "eval_PERSON_recall": 0.881578947368421, | |
| "eval_QUANTITY_f1": 0.6956521739130435, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6153846153846154, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8253968253968255, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7647058823529411, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.13908080756664276, | |
| "eval_overall_accuracy": 0.9549295774647887, | |
| "eval_overall_f1": 0.7802197802197802, | |
| "eval_overall_precision": 0.7282051282051282, | |
| "eval_overall_recall": 0.8402366863905325, | |
| "eval_runtime": 0.2918, | |
| "eval_samples_per_second": 640.865, | |
| "eval_steps_per_second": 10.281, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "grad_norm": 1.4912283420562744, | |
| "learning_rate": 4.4500000000000004e-05, | |
| "loss": 0.132, | |
| "step": 1166 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_LOCATION_f1": 0.8456375838926175, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7875, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.6299212598425198, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.5797101449275363, | |
| "eval_ORGANIZATION_recall": 0.6896551724137931, | |
| "eval_PERSON_f1": 0.8473520249221184, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8047337278106509, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7812500000000001, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7142857142857143, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.14170250296592712, | |
| "eval_overall_accuracy": 0.953393085787452, | |
| "eval_overall_f1": 0.7928669410150891, | |
| "eval_overall_precision": 0.7391304347826086, | |
| "eval_overall_recall": 0.8550295857988166, | |
| "eval_runtime": 0.2921, | |
| "eval_samples_per_second": 640.286, | |
| "eval_steps_per_second": 10.272, | |
| "step": 1166 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "grad_norm": 2.726284980773926, | |
| "learning_rate": 4.4000000000000006e-05, | |
| "loss": 0.1268, | |
| "step": 1272 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_LOCATION_f1": 0.8378378378378378, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7848101265822784, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.6140350877192983, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.625, | |
| "eval_ORGANIZATION_recall": 0.603448275862069, | |
| "eval_PERSON_f1": 0.8517350157728707, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8181818181818182, | |
| "eval_PERSON_recall": 0.8881578947368421, | |
| "eval_QUANTITY_f1": 0.7878787878787877, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7222222222222222, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8196721311475409, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.78125, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.13159815967082977, | |
| "eval_overall_accuracy": 0.9577464788732394, | |
| "eval_overall_f1": 0.8016997167138811, | |
| "eval_overall_precision": 0.7690217391304348, | |
| "eval_overall_recall": 0.8372781065088757, | |
| "eval_runtime": 0.2918, | |
| "eval_samples_per_second": 640.768, | |
| "eval_steps_per_second": 10.28, | |
| "step": 1272 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "grad_norm": 0.7623488903045654, | |
| "learning_rate": 4.35e-05, | |
| "loss": 0.1206, | |
| "step": 1378 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_LOCATION_f1": 0.8571428571428572, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8076923076923077, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.6115702479338844, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.5873015873015873, | |
| "eval_ORGANIZATION_recall": 0.6379310344827587, | |
| "eval_PERSON_f1": 0.8526645768025078, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8143712574850299, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6756756756756757, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.13245752453804016, | |
| "eval_overall_accuracy": 0.9574903969270167, | |
| "eval_overall_f1": 0.8011204481792716, | |
| "eval_overall_precision": 0.7606382978723404, | |
| "eval_overall_recall": 0.8461538461538461, | |
| "eval_runtime": 0.2913, | |
| "eval_samples_per_second": 641.931, | |
| "eval_steps_per_second": 10.298, | |
| "step": 1378 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "grad_norm": 3.348172664642334, | |
| "learning_rate": 4.3e-05, | |
| "loss": 0.1186, | |
| "step": 1484 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_LOCATION_f1": 0.8551724137931034, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8157894736842105, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.7299270072992702, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6329113924050633, | |
| "eval_ORGANIZATION_recall": 0.8620689655172413, | |
| "eval_PERSON_f1": 0.8500000000000001, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8095238095238095, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8253968253968255, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7647058823529411, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.13963258266448975, | |
| "eval_overall_accuracy": 0.9577464788732394, | |
| "eval_overall_f1": 0.8158253751705321, | |
| "eval_overall_precision": 0.7569620253164557, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2864, | |
| "eval_samples_per_second": 652.876, | |
| "eval_steps_per_second": 10.474, | |
| "step": 1484 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "grad_norm": 1.2007865905761719, | |
| "learning_rate": 4.25e-05, | |
| "loss": 0.1141, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_LOCATION_f1": 0.8611111111111112, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8266666666666667, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.6333333333333333, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6129032258064516, | |
| "eval_ORGANIZATION_recall": 0.6551724137931034, | |
| "eval_PERSON_f1": 0.8481012658227848, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8170731707317073, | |
| "eval_PERSON_recall": 0.881578947368421, | |
| "eval_QUANTITY_f1": 0.7575757575757577, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8064516129032258, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7575757575757576, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1281883716583252, | |
| "eval_overall_accuracy": 0.9582586427656851, | |
| "eval_overall_f1": 0.8022598870056498, | |
| "eval_overall_precision": 0.7675675675675676, | |
| "eval_overall_recall": 0.8402366863905325, | |
| "eval_runtime": 0.2866, | |
| "eval_samples_per_second": 652.52, | |
| "eval_steps_per_second": 10.468, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "grad_norm": 0.8597108721733093, | |
| "learning_rate": 4.2e-05, | |
| "loss": 0.1083, | |
| "step": 1696 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_LOCATION_f1": 0.8571428571428572, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8076923076923077, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.7131782945736435, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.647887323943662, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8526645768025078, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8143712574850299, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7272727272727272, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8253968253968255, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7647058823529411, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1355670541524887, | |
| "eval_overall_accuracy": 0.9577464788732394, | |
| "eval_overall_f1": 0.8149171270718233, | |
| "eval_overall_precision": 0.7642487046632125, | |
| "eval_overall_recall": 0.8727810650887574, | |
| "eval_runtime": 0.2918, | |
| "eval_samples_per_second": 640.866, | |
| "eval_steps_per_second": 10.281, | |
| "step": 1696 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "grad_norm": 0.9207751154899597, | |
| "learning_rate": 4.15e-05, | |
| "loss": 0.1106, | |
| "step": 1802 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.6612903225806452, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6212121212121212, | |
| "eval_ORGANIZATION_recall": 0.7068965517241379, | |
| "eval_PERSON_f1": 0.8517350157728707, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8181818181818182, | |
| "eval_PERSON_recall": 0.8881578947368421, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8064516129032258, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7575757575757576, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1327420026063919, | |
| "eval_overall_accuracy": 0.9585147247119078, | |
| "eval_overall_f1": 0.8089260808926082, | |
| "eval_overall_precision": 0.7651715039577837, | |
| "eval_overall_recall": 0.8579881656804734, | |
| "eval_runtime": 0.2911, | |
| "eval_samples_per_second": 642.326, | |
| "eval_steps_per_second": 10.305, | |
| "step": 1802 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "grad_norm": 2.323946952819824, | |
| "learning_rate": 4.1e-05, | |
| "loss": 0.1053, | |
| "step": 1908 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_LOCATION_f1": 0.8648648648648648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.810126582278481, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.6611570247933884, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6349206349206349, | |
| "eval_ORGANIZATION_recall": 0.6896551724137931, | |
| "eval_PERSON_f1": 0.8500000000000001, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8095238095238095, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7246376811594204, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6410256410256411, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7936507936507937, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7352941176470589, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1359253227710724, | |
| "eval_overall_accuracy": 0.9580025608194622, | |
| "eval_overall_f1": 0.8044382801664354, | |
| "eval_overall_precision": 0.7571801566579635, | |
| "eval_overall_recall": 0.8579881656804734, | |
| "eval_runtime": 0.2865, | |
| "eval_samples_per_second": 652.807, | |
| "eval_steps_per_second": 10.473, | |
| "step": 1908 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "grad_norm": 24.915828704833984, | |
| "learning_rate": 4.05e-05, | |
| "loss": 0.1089, | |
| "step": 2014 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "eval_LOCATION_f1": 0.8450704225352113, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.821917808219178, | |
| "eval_LOCATION_recall": 0.8695652173913043, | |
| "eval_ORGANIZATION_f1": 0.584070796460177, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6, | |
| "eval_ORGANIZATION_recall": 0.5689655172413793, | |
| "eval_PERSON_f1": 0.8471337579617835, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8209876543209876, | |
| "eval_PERSON_recall": 0.875, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7428571428571429, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8813559322033899, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8666666666666667, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.12435611337423325, | |
| "eval_overall_accuracy": 0.9595390524967989, | |
| "eval_overall_f1": 0.8023088023088024, | |
| "eval_overall_precision": 0.7830985915492957, | |
| "eval_overall_recall": 0.8224852071005917, | |
| "eval_runtime": 0.2922, | |
| "eval_samples_per_second": 640.081, | |
| "eval_steps_per_second": 10.269, | |
| "step": 2014 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "grad_norm": 0.8912884593009949, | |
| "learning_rate": 4e-05, | |
| "loss": 0.1046, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_LOCATION_f1": 0.863013698630137, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8181818181818182, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.6779661016949153, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.6896551724137931, | |
| "eval_PERSON_f1": 0.85625, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8154761904761905, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7575757575757577, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7741935483870968, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7272727272727273, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.12911909818649292, | |
| "eval_overall_accuracy": 0.9600512163892445, | |
| "eval_overall_f1": 0.8117977528089887, | |
| "eval_overall_precision": 0.7727272727272727, | |
| "eval_overall_recall": 0.8550295857988166, | |
| "eval_runtime": 0.2932, | |
| "eval_samples_per_second": 637.792, | |
| "eval_steps_per_second": 10.232, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "grad_norm": 0.48920294642448425, | |
| "learning_rate": 3.9500000000000005e-05, | |
| "loss": 0.0965, | |
| "step": 2226 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "eval_LOCATION_f1": 0.84, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7777777777777778, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.7424242424242424, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6621621621621622, | |
| "eval_ORGANIZATION_recall": 0.8448275862068966, | |
| "eval_PERSON_f1": 0.875, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8333333333333334, | |
| "eval_PERSON_recall": 0.9210526315789473, | |
| "eval_QUANTITY_f1": 0.7575757575757577, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7741935483870968, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7272727272727273, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.1389300525188446, | |
| "eval_overall_accuracy": 0.9572343149807938, | |
| "eval_overall_f1": 0.8246575342465754, | |
| "eval_overall_precision": 0.7678571428571429, | |
| "eval_overall_recall": 0.8905325443786982, | |
| "eval_runtime": 0.2936, | |
| "eval_samples_per_second": 637.017, | |
| "eval_steps_per_second": 10.22, | |
| "step": 2226 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "grad_norm": 1.2225427627563477, | |
| "learning_rate": 3.9000000000000006e-05, | |
| "loss": 0.0958, | |
| "step": 2332 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7633587786259542, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.684931506849315, | |
| "eval_ORGANIZATION_recall": 0.8620689655172413, | |
| "eval_PERSON_f1": 0.8544303797468354, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.823170731707317, | |
| "eval_PERSON_recall": 0.8881578947368421, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1278899759054184, | |
| "eval_overall_accuracy": 0.9618437900128041, | |
| "eval_overall_f1": 0.8328690807799444, | |
| "eval_overall_precision": 0.7868421052631579, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2942, | |
| "eval_samples_per_second": 635.574, | |
| "eval_steps_per_second": 10.196, | |
| "step": 2332 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "grad_norm": 0.5433982014656067, | |
| "learning_rate": 3.85e-05, | |
| "loss": 0.0929, | |
| "step": 2438 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "eval_LOCATION_f1": 0.8591549295774648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8356164383561644, | |
| "eval_LOCATION_recall": 0.8840579710144928, | |
| "eval_ORGANIZATION_f1": 0.6499999999999999, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6290322580645161, | |
| "eval_ORGANIZATION_recall": 0.6724137931034483, | |
| "eval_PERSON_f1": 0.8616352201257862, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8253012048192772, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.847457627118644, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.12278664112091064, | |
| "eval_overall_accuracy": 0.9628681177976952, | |
| "eval_overall_f1": 0.8176638176638177, | |
| "eval_overall_precision": 0.7884615384615384, | |
| "eval_overall_recall": 0.849112426035503, | |
| "eval_runtime": 0.2929, | |
| "eval_samples_per_second": 638.552, | |
| "eval_steps_per_second": 10.244, | |
| "step": 2438 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "grad_norm": 1.4073636531829834, | |
| "learning_rate": 3.8e-05, | |
| "loss": 0.0934, | |
| "step": 2544 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "eval_LOCATION_f1": 0.8648648648648648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.810126582278481, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.746268656716418, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6578947368421053, | |
| "eval_ORGANIZATION_recall": 0.8620689655172413, | |
| "eval_PERSON_f1": 0.8509316770186336, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8058823529411765, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8196721311475409, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.78125, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.13569365441799164, | |
| "eval_overall_accuracy": 0.9595390524967989, | |
| "eval_overall_f1": 0.8285322359396433, | |
| "eval_overall_precision": 0.7723785166240409, | |
| "eval_overall_recall": 0.893491124260355, | |
| "eval_runtime": 0.2923, | |
| "eval_samples_per_second": 639.683, | |
| "eval_steps_per_second": 10.262, | |
| "step": 2544 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "grad_norm": 2.3010127544403076, | |
| "learning_rate": 3.7500000000000003e-05, | |
| "loss": 0.0887, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "eval_LOCATION_f1": 0.8435374149659864, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7948717948717948, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.7166666666666668, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6935483870967742, | |
| "eval_ORGANIZATION_recall": 0.7413793103448276, | |
| "eval_PERSON_f1": 0.8535031847133758, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8271604938271605, | |
| "eval_PERSON_recall": 0.881578947368421, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7741935483870968, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.12316982448101044, | |
| "eval_overall_accuracy": 0.9615877080665813, | |
| "eval_overall_f1": 0.8198581560283689, | |
| "eval_overall_precision": 0.7874659400544959, | |
| "eval_overall_recall": 0.8550295857988166, | |
| "eval_runtime": 0.2928, | |
| "eval_samples_per_second": 638.601, | |
| "eval_steps_per_second": 10.245, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "grad_norm": 1.5638922452926636, | |
| "learning_rate": 3.7e-05, | |
| "loss": 0.1025, | |
| "step": 2756 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7716535433070866, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.7101449275362319, | |
| "eval_ORGANIZATION_recall": 0.8448275862068966, | |
| "eval_PERSON_f1": 0.8616352201257862, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8253012048192772, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6857142857142857, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7741935483870968, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.1349707692861557, | |
| "eval_overall_accuracy": 0.9618437900128041, | |
| "eval_overall_f1": 0.8312412831241283, | |
| "eval_overall_precision": 0.7862796833773087, | |
| "eval_overall_recall": 0.8816568047337278, | |
| "eval_runtime": 0.2929, | |
| "eval_samples_per_second": 638.525, | |
| "eval_steps_per_second": 10.244, | |
| "step": 2756 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "grad_norm": 1.3527199029922485, | |
| "learning_rate": 3.65e-05, | |
| "loss": 0.0868, | |
| "step": 2862 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "eval_LOCATION_f1": 0.8648648648648648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.810126582278481, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7777777777777778, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.7205882352941176, | |
| "eval_ORGANIZATION_recall": 0.8448275862068966, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7761194029850748, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7027027027027027, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.7868852459016394, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.75, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.1333594173192978, | |
| "eval_overall_accuracy": 0.9613316261203585, | |
| "eval_overall_f1": 0.8328690807799444, | |
| "eval_overall_precision": 0.7868421052631579, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2923, | |
| "eval_samples_per_second": 639.845, | |
| "eval_steps_per_second": 10.265, | |
| "step": 2862 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "grad_norm": 2.2402167320251465, | |
| "learning_rate": 3.6e-05, | |
| "loss": 0.0836, | |
| "step": 2968 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7258064516129032, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6818181818181818, | |
| "eval_ORGANIZATION_recall": 0.7758620689655172, | |
| "eval_PERSON_f1": 0.8616352201257862, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8253012048192772, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7575757575757577, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7419354838709677, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.696969696969697, | |
| "eval_TIME_recall": 0.7931034482758621, | |
| "eval_loss": 0.1318032443523407, | |
| "eval_overall_accuracy": 0.9620998719590269, | |
| "eval_overall_f1": 0.8212290502793296, | |
| "eval_overall_precision": 0.7777777777777778, | |
| "eval_overall_recall": 0.8698224852071006, | |
| "eval_runtime": 0.2923, | |
| "eval_samples_per_second": 639.756, | |
| "eval_steps_per_second": 10.263, | |
| "step": 2968 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "grad_norm": 1.1857041120529175, | |
| "learning_rate": 3.55e-05, | |
| "loss": 0.0791, | |
| "step": 3074 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "eval_LOCATION_f1": 0.8513513513513514, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7974683544303798, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.746031746031746, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6911764705882353, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.85625, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8154761904761905, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7741935483870968, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.13442517817020416, | |
| "eval_overall_accuracy": 0.9618437900128041, | |
| "eval_overall_f1": 0.8256624825662484, | |
| "eval_overall_precision": 0.7810026385224275, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.2926, | |
| "eval_samples_per_second": 639.174, | |
| "eval_steps_per_second": 10.254, | |
| "step": 3074 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "grad_norm": 0.6588788032531738, | |
| "learning_rate": 3.5e-05, | |
| "loss": 0.0792, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7058823529411765, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6885245901639344, | |
| "eval_ORGANIZATION_recall": 0.7241379310344828, | |
| "eval_PERSON_f1": 0.8643533123028391, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8303030303030303, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.847457627118644, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.12328661233186722, | |
| "eval_overall_accuracy": 0.9651728553137003, | |
| "eval_overall_f1": 0.8312056737588652, | |
| "eval_overall_precision": 0.7983651226158038, | |
| "eval_overall_recall": 0.8668639053254438, | |
| "eval_runtime": 0.287, | |
| "eval_samples_per_second": 651.586, | |
| "eval_steps_per_second": 10.453, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "grad_norm": 0.4727123975753784, | |
| "learning_rate": 3.45e-05, | |
| "loss": 0.0772, | |
| "step": 3286 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7317073170731708, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6923076923076923, | |
| "eval_ORGANIZATION_recall": 0.7758620689655172, | |
| "eval_PERSON_f1": 0.8652037617554859, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8263473053892215, | |
| "eval_PERSON_recall": 0.9078947368421053, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8135593220338982, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.1277562379837036, | |
| "eval_overall_accuracy": 0.9646606914212548, | |
| "eval_overall_f1": 0.8326300984528833, | |
| "eval_overall_precision": 0.7935656836461126, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.2916, | |
| "eval_samples_per_second": 641.192, | |
| "eval_steps_per_second": 10.287, | |
| "step": 3286 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "grad_norm": 0.8663144111633301, | |
| "learning_rate": 3.4000000000000007e-05, | |
| "loss": 0.0766, | |
| "step": 3392 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7244094488188977, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8544303797468354, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.823170731707317, | |
| "eval_PERSON_recall": 0.8881578947368421, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8135593220338982, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.12748569250106812, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8258426966292135, | |
| "eval_overall_precision": 0.786096256684492, | |
| "eval_overall_recall": 0.8698224852071006, | |
| "eval_runtime": 0.287, | |
| "eval_samples_per_second": 651.573, | |
| "eval_steps_per_second": 10.453, | |
| "step": 3392 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "grad_norm": 0.6088622808456421, | |
| "learning_rate": 3.35e-05, | |
| "loss": 0.0746, | |
| "step": 3498 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "eval_LOCATION_f1": 0.8648648648648648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.810126582278481, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7401574803149606, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6811594202898551, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8507936507936509, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8220858895705522, | |
| "eval_PERSON_recall": 0.881578947368421, | |
| "eval_QUANTITY_f1": 0.8253968253968254, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8135593220338982, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.13140520453453064, | |
| "eval_overall_accuracy": 0.9636363636363636, | |
| "eval_overall_f1": 0.8286516853932584, | |
| "eval_overall_precision": 0.7887700534759359, | |
| "eval_overall_recall": 0.8727810650887574, | |
| "eval_runtime": 0.293, | |
| "eval_samples_per_second": 638.168, | |
| "eval_steps_per_second": 10.238, | |
| "step": 3498 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "grad_norm": 1.8929836750030518, | |
| "learning_rate": 3.3e-05, | |
| "loss": 0.072, | |
| "step": 3604 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "eval_LOCATION_f1": 0.8648648648648648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.810126582278481, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7559055118110236, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6956521739130435, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.8626198083067094, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8385093167701864, | |
| "eval_PERSON_recall": 0.8881578947368421, | |
| "eval_QUANTITY_f1": 0.8253968253968254, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8135593220338982, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.13353487849235535, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8366197183098592, | |
| "eval_overall_precision": 0.7983870967741935, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.293, | |
| "eval_samples_per_second": 638.242, | |
| "eval_steps_per_second": 10.239, | |
| "step": 3604 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "grad_norm": 1.197149634361267, | |
| "learning_rate": 3.2500000000000004e-05, | |
| "loss": 0.0712, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "eval_LOCATION_f1": 0.8648648648648648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.810126582278481, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7377049180327868, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.703125, | |
| "eval_ORGANIZATION_recall": 0.7758620689655172, | |
| "eval_PERSON_f1": 0.8625, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8214285714285714, | |
| "eval_PERSON_recall": 0.9078947368421053, | |
| "eval_QUANTITY_f1": 0.8, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7428571428571429, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.847457627118644, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.13137878477573395, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8347338935574229, | |
| "eval_overall_precision": 0.7925531914893617, | |
| "eval_overall_recall": 0.8816568047337278, | |
| "eval_runtime": 0.2864, | |
| "eval_samples_per_second": 652.975, | |
| "eval_steps_per_second": 10.476, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "grad_norm": 0.49242687225341797, | |
| "learning_rate": 3.2000000000000005e-05, | |
| "loss": 0.0702, | |
| "step": 3816 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "eval_LOCATION_f1": 0.8611111111111112, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8266666666666667, | |
| "eval_LOCATION_recall": 0.8985507246376812, | |
| "eval_ORGANIZATION_f1": 0.7230769230769231, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6527777777777778, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8626198083067094, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8385093167701864, | |
| "eval_PERSON_recall": 0.8881578947368421, | |
| "eval_QUANTITY_f1": 0.8253968253968254, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7878787878787878, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8135593220338982, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.13032355904579163, | |
| "eval_overall_accuracy": 0.9641485275288092, | |
| "eval_overall_f1": 0.8293370944992947, | |
| "eval_overall_precision": 0.7924528301886793, | |
| "eval_overall_recall": 0.8698224852071006, | |
| "eval_runtime": 0.2939, | |
| "eval_samples_per_second": 636.252, | |
| "eval_steps_per_second": 10.207, | |
| "step": 3816 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "grad_norm": 2.0146589279174805, | |
| "learning_rate": 3.15e-05, | |
| "loss": 0.0695, | |
| "step": 3922 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "eval_LOCATION_f1": 0.882758620689655, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8421052631578947, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7580645161290323, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.7121212121212122, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8616352201257862, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8253012048192772, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.847457627118644, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.12965013086795807, | |
| "eval_overall_accuracy": 0.9649167733674776, | |
| "eval_overall_f1": 0.840620592383639, | |
| "eval_overall_precision": 0.8032345013477089, | |
| "eval_overall_recall": 0.8816568047337278, | |
| "eval_runtime": 0.2929, | |
| "eval_samples_per_second": 638.49, | |
| "eval_steps_per_second": 10.243, | |
| "step": 3922 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "grad_norm": 0.8112408518791199, | |
| "learning_rate": 3.1e-05, | |
| "loss": 0.0674, | |
| "step": 4028 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7419354838709677, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.696969696969697, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8706624605678233, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8363636363636363, | |
| "eval_PERSON_recall": 0.9078947368421053, | |
| "eval_QUANTITY_f1": 0.7536231884057971, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.847457627118644, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1362360268831253, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8363636363636363, | |
| "eval_overall_precision": 0.7931034482758621, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2929, | |
| "eval_samples_per_second": 638.407, | |
| "eval_steps_per_second": 10.242, | |
| "step": 4028 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "grad_norm": 0.4772998094558716, | |
| "learning_rate": 3.05e-05, | |
| "loss": 0.0653, | |
| "step": 4134 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.6942148760330579, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.7241379310344828, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.847457627118644, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.12953267991542816, | |
| "eval_overall_accuracy": 0.964404609475032, | |
| "eval_overall_f1": 0.8271954674220963, | |
| "eval_overall_precision": 0.7934782608695652, | |
| "eval_overall_recall": 0.863905325443787, | |
| "eval_runtime": 0.2928, | |
| "eval_samples_per_second": 638.701, | |
| "eval_steps_per_second": 10.247, | |
| "step": 4134 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "grad_norm": 1.1962645053863525, | |
| "learning_rate": 3e-05, | |
| "loss": 0.0637, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "eval_LOCATION_f1": 0.8533333333333333, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7901234567901234, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7258064516129032, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6818181818181818, | |
| "eval_ORGANIZATION_recall": 0.7758620689655172, | |
| "eval_PERSON_f1": 0.8761904761904762, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8466257668711656, | |
| "eval_PERSON_recall": 0.9078947368421053, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7741935483870968, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.13492895662784576, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8330995792426368, | |
| "eval_overall_precision": 0.792, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2867, | |
| "eval_samples_per_second": 652.21, | |
| "eval_steps_per_second": 10.463, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 41.0, | |
| "grad_norm": 0.6804232597351074, | |
| "learning_rate": 2.95e-05, | |
| "loss": 0.0634, | |
| "step": 4346 | |
| }, | |
| { | |
| "epoch": 41.0, | |
| "eval_LOCATION_f1": 0.8749999999999999, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.84, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.7619047619047619, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.7058823529411765, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.8742138364779874, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8373493975903614, | |
| "eval_PERSON_recall": 0.9144736842105263, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7741935483870968, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.1353294402360916, | |
| "eval_overall_accuracy": 0.9651728553137003, | |
| "eval_overall_f1": 0.8410689170182841, | |
| "eval_overall_precision": 0.8016085790884718, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2941, | |
| "eval_samples_per_second": 635.842, | |
| "eval_steps_per_second": 10.201, | |
| "step": 4346 | |
| }, | |
| { | |
| "epoch": 42.0, | |
| "grad_norm": 1.3958626985549927, | |
| "learning_rate": 2.9e-05, | |
| "loss": 0.0622, | |
| "step": 4452 | |
| }, | |
| { | |
| "epoch": 42.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7154471544715447, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.676923076923077, | |
| "eval_ORGANIZATION_recall": 0.7586206896551724, | |
| "eval_PERSON_f1": 0.8769716088328074, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8424242424242424, | |
| "eval_PERSON_recall": 0.9144736842105263, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.847457627118644, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.13502123951911926, | |
| "eval_overall_accuracy": 0.9649167733674776, | |
| "eval_overall_f1": 0.8377997179125528, | |
| "eval_overall_precision": 0.8005390835579514, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2888, | |
| "eval_samples_per_second": 647.481, | |
| "eval_steps_per_second": 10.387, | |
| "step": 4452 | |
| }, | |
| { | |
| "epoch": 43.0, | |
| "grad_norm": 1.7736326456069946, | |
| "learning_rate": 2.8499999999999998e-05, | |
| "loss": 0.0616, | |
| "step": 4558 | |
| }, | |
| { | |
| "epoch": 43.0, | |
| "eval_LOCATION_f1": 0.882758620689655, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8421052631578947, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.752, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.7014925373134329, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8742138364779874, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8373493975903614, | |
| "eval_PERSON_recall": 0.9144736842105263, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1341027021408081, | |
| "eval_overall_accuracy": 0.9654289372599232, | |
| "eval_overall_f1": 0.8455056179775281, | |
| "eval_overall_precision": 0.8048128342245989, | |
| "eval_overall_recall": 0.8905325443786982, | |
| "eval_runtime": 0.2927, | |
| "eval_samples_per_second": 638.914, | |
| "eval_steps_per_second": 10.25, | |
| "step": 4558 | |
| }, | |
| { | |
| "epoch": 44.0, | |
| "grad_norm": 4.0435028076171875, | |
| "learning_rate": 2.8000000000000003e-05, | |
| "loss": 0.0603, | |
| "step": 4664 | |
| }, | |
| { | |
| "epoch": 44.0, | |
| "eval_LOCATION_f1": 0.8476821192052981, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.7804878048780488, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7286821705426356, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6619718309859155, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8714733542319749, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8323353293413174, | |
| "eval_PERSON_recall": 0.9144736842105263, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.847457627118644, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.14106552302837372, | |
| "eval_overall_accuracy": 0.9628681177976952, | |
| "eval_overall_f1": 0.8310249307479224, | |
| "eval_overall_precision": 0.78125, | |
| "eval_overall_recall": 0.8875739644970414, | |
| "eval_runtime": 0.2883, | |
| "eval_samples_per_second": 648.632, | |
| "eval_steps_per_second": 10.406, | |
| "step": 4664 | |
| }, | |
| { | |
| "epoch": 45.0, | |
| "grad_norm": 1.2470722198486328, | |
| "learning_rate": 2.7500000000000004e-05, | |
| "loss": 0.0597, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 45.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7286821705426356, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6619718309859155, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8652037617554859, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8263473053892215, | |
| "eval_PERSON_recall": 0.9078947368421053, | |
| "eval_QUANTITY_f1": 0.7352941176470588, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6578947368421053, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7741935483870968, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.14016938209533691, | |
| "eval_overall_accuracy": 0.9620998719590269, | |
| "eval_overall_f1": 0.8243430152143846, | |
| "eval_overall_precision": 0.7740259740259741, | |
| "eval_overall_recall": 0.8816568047337278, | |
| "eval_runtime": 0.2928, | |
| "eval_samples_per_second": 638.618, | |
| "eval_steps_per_second": 10.245, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 46.0, | |
| "grad_norm": 0.7653511762619019, | |
| "learning_rate": 2.7000000000000002e-05, | |
| "loss": 0.059, | |
| "step": 4876 | |
| }, | |
| { | |
| "epoch": 46.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.736, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6865671641791045, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8670886075949367, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7741935483870968, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.13417667150497437, | |
| "eval_overall_accuracy": 0.9649167733674776, | |
| "eval_overall_f1": 0.8326300984528833, | |
| "eval_overall_precision": 0.7935656836461126, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.2925, | |
| "eval_samples_per_second": 639.217, | |
| "eval_steps_per_second": 10.255, | |
| "step": 4876 | |
| }, | |
| { | |
| "epoch": 47.0, | |
| "grad_norm": 1.0474615097045898, | |
| "learning_rate": 2.6500000000000004e-05, | |
| "loss": 0.0574, | |
| "step": 4982 | |
| }, | |
| { | |
| "epoch": 47.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.736, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6865671641791045, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7575757575757577, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7796610169491527, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7666666666666667, | |
| "eval_TIME_recall": 0.7931034482758621, | |
| "eval_loss": 0.13553491234779358, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8258426966292135, | |
| "eval_overall_precision": 0.786096256684492, | |
| "eval_overall_recall": 0.8698224852071006, | |
| "eval_runtime": 0.2928, | |
| "eval_samples_per_second": 638.657, | |
| "eval_steps_per_second": 10.246, | |
| "step": 4982 | |
| }, | |
| { | |
| "epoch": 48.0, | |
| "grad_norm": 1.1858253479003906, | |
| "learning_rate": 2.6000000000000002e-05, | |
| "loss": 0.0581, | |
| "step": 5088 | |
| }, | |
| { | |
| "epoch": 48.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7377049180327868, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.703125, | |
| "eval_ORGANIZATION_recall": 0.7758620689655172, | |
| "eval_PERSON_f1": 0.8670886075949367, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.13520203530788422, | |
| "eval_overall_accuracy": 0.9659411011523688, | |
| "eval_overall_f1": 0.8389830508474576, | |
| "eval_overall_precision": 0.8027027027027027, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2932, | |
| "eval_samples_per_second": 637.868, | |
| "eval_steps_per_second": 10.233, | |
| "step": 5088 | |
| }, | |
| { | |
| "epoch": 49.0, | |
| "grad_norm": 0.4307897090911865, | |
| "learning_rate": 2.5500000000000003e-05, | |
| "loss": 0.0561, | |
| "step": 5194 | |
| }, | |
| { | |
| "epoch": 49.0, | |
| "eval_LOCATION_f1": 0.882758620689655, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8421052631578947, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7301587301587301, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6764705882352942, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8679245283018868, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8313253012048193, | |
| "eval_PERSON_recall": 0.9078947368421053, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8813559322033899, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8666666666666667, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.13861991465091705, | |
| "eval_overall_accuracy": 0.9649167733674776, | |
| "eval_overall_f1": 0.8398876404494382, | |
| "eval_overall_precision": 0.7994652406417112, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2889, | |
| "eval_samples_per_second": 647.316, | |
| "eval_steps_per_second": 10.385, | |
| "step": 5194 | |
| }, | |
| { | |
| "epoch": 50.0, | |
| "grad_norm": 0.8664003014564514, | |
| "learning_rate": 2.5e-05, | |
| "loss": 0.0544, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 50.0, | |
| "eval_LOCATION_f1": 0.8749999999999999, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.84, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.736, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6865671641791045, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8471337579617835, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8209876543209876, | |
| "eval_PERSON_recall": 0.875, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8813559322033899, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8666666666666667, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.13451269268989563, | |
| "eval_overall_accuracy": 0.9651728553137003, | |
| "eval_overall_f1": 0.8312056737588652, | |
| "eval_overall_precision": 0.7983651226158038, | |
| "eval_overall_recall": 0.8668639053254438, | |
| "eval_runtime": 0.2869, | |
| "eval_samples_per_second": 651.752, | |
| "eval_steps_per_second": 10.456, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 51.0, | |
| "grad_norm": 3.4700815677642822, | |
| "learning_rate": 2.45e-05, | |
| "loss": 0.0534, | |
| "step": 5406 | |
| }, | |
| { | |
| "epoch": 51.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7692307692307692, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6944444444444444, | |
| "eval_ORGANIZATION_recall": 0.8620689655172413, | |
| "eval_PERSON_f1": 0.8634920634920634, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.847457627118644, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8333333333333334, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.13688045740127563, | |
| "eval_overall_accuracy": 0.9651728553137003, | |
| "eval_overall_f1": 0.841514726507714, | |
| "eval_overall_precision": 0.8, | |
| "eval_overall_recall": 0.8875739644970414, | |
| "eval_runtime": 0.2922, | |
| "eval_samples_per_second": 640.064, | |
| "eval_steps_per_second": 10.268, | |
| "step": 5406 | |
| }, | |
| { | |
| "epoch": 52.0, | |
| "grad_norm": 1.2102717161178589, | |
| "learning_rate": 2.4e-05, | |
| "loss": 0.0521, | |
| "step": 5512 | |
| }, | |
| { | |
| "epoch": 52.0, | |
| "eval_LOCATION_f1": 0.8648648648648648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.810126582278481, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7669172932330827, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.68, | |
| "eval_ORGANIZATION_recall": 0.8793103448275862, | |
| "eval_PERSON_f1": 0.8643533123028391, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8303030303030303, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7741935483870968, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.14608342945575714, | |
| "eval_overall_accuracy": 0.9628681177976952, | |
| "eval_overall_f1": 0.8337950138504154, | |
| "eval_overall_precision": 0.7838541666666666, | |
| "eval_overall_recall": 0.8905325443786982, | |
| "eval_runtime": 0.2926, | |
| "eval_samples_per_second": 639.189, | |
| "eval_steps_per_second": 10.254, | |
| "step": 5512 | |
| }, | |
| { | |
| "epoch": 53.0, | |
| "grad_norm": 1.385406732559204, | |
| "learning_rate": 2.35e-05, | |
| "loss": 0.0524, | |
| "step": 5618 | |
| }, | |
| { | |
| "epoch": 53.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.768, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.7164179104477612, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.8670886075949367, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1376073956489563, | |
| "eval_overall_accuracy": 0.9656850192061459, | |
| "eval_overall_f1": 0.8410689170182841, | |
| "eval_overall_precision": 0.8016085790884718, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2926, | |
| "eval_samples_per_second": 639.014, | |
| "eval_steps_per_second": 10.252, | |
| "step": 5618 | |
| }, | |
| { | |
| "epoch": 54.0, | |
| "grad_norm": 0.37542441487312317, | |
| "learning_rate": 2.3000000000000003e-05, | |
| "loss": 0.0494, | |
| "step": 5724 | |
| }, | |
| { | |
| "epoch": 54.0, | |
| "eval_LOCATION_f1": 0.882758620689655, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8421052631578947, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7401574803149606, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6811594202898551, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8670886075949367, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.14096996188163757, | |
| "eval_overall_accuracy": 0.9659411011523688, | |
| "eval_overall_f1": 0.8398876404494382, | |
| "eval_overall_precision": 0.7994652406417112, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2945, | |
| "eval_samples_per_second": 635.027, | |
| "eval_steps_per_second": 10.188, | |
| "step": 5724 | |
| }, | |
| { | |
| "epoch": 55.0, | |
| "grad_norm": 2.3441622257232666, | |
| "learning_rate": 2.25e-05, | |
| "loss": 0.0516, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 55.0, | |
| "eval_LOCATION_f1": 0.882758620689655, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8421052631578947, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7559055118110236, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6956521739130435, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.8670886075949367, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8353658536585366, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.13822495937347412, | |
| "eval_overall_accuracy": 0.9659411011523688, | |
| "eval_overall_f1": 0.8455056179775281, | |
| "eval_overall_precision": 0.8048128342245989, | |
| "eval_overall_recall": 0.8905325443786982, | |
| "eval_runtime": 0.2928, | |
| "eval_samples_per_second": 638.657, | |
| "eval_steps_per_second": 10.246, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 56.0, | |
| "grad_norm": 0.9206390976905823, | |
| "learning_rate": 2.2000000000000003e-05, | |
| "loss": 0.0497, | |
| "step": 5936 | |
| }, | |
| { | |
| "epoch": 56.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7200000000000001, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6716417910447762, | |
| "eval_ORGANIZATION_recall": 0.7758620689655172, | |
| "eval_PERSON_f1": 0.8571428571428571, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8282208588957055, | |
| "eval_PERSON_recall": 0.8881578947368421, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.13933928310871124, | |
| "eval_overall_accuracy": 0.9654289372599232, | |
| "eval_overall_f1": 0.8338028169014083, | |
| "eval_overall_precision": 0.7956989247311828, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.293, | |
| "eval_samples_per_second": 638.123, | |
| "eval_steps_per_second": 10.237, | |
| "step": 5936 | |
| }, | |
| { | |
| "epoch": 57.0, | |
| "grad_norm": 0.8336784839630127, | |
| "learning_rate": 2.15e-05, | |
| "loss": 0.048, | |
| "step": 6042 | |
| }, | |
| { | |
| "epoch": 57.0, | |
| "eval_LOCATION_f1": 0.8648648648648648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.810126582278481, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.752, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.7014925373134329, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.14417044818401337, | |
| "eval_overall_accuracy": 0.9649167733674776, | |
| "eval_overall_f1": 0.8347338935574229, | |
| "eval_overall_precision": 0.7925531914893617, | |
| "eval_overall_recall": 0.8816568047337278, | |
| "eval_runtime": 0.2919, | |
| "eval_samples_per_second": 640.597, | |
| "eval_steps_per_second": 10.277, | |
| "step": 6042 | |
| }, | |
| { | |
| "epoch": 58.0, | |
| "grad_norm": 1.4807782173156738, | |
| "learning_rate": 2.1e-05, | |
| "loss": 0.0474, | |
| "step": 6148 | |
| }, | |
| { | |
| "epoch": 58.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7480916030534351, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6712328767123288, | |
| "eval_ORGANIZATION_recall": 0.8448275862068966, | |
| "eval_PERSON_f1": 0.8589341692789968, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8203592814371258, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.14203424751758575, | |
| "eval_overall_accuracy": 0.9646606914212548, | |
| "eval_overall_f1": 0.8372739916550764, | |
| "eval_overall_precision": 0.7900262467191601, | |
| "eval_overall_recall": 0.8905325443786982, | |
| "eval_runtime": 0.2926, | |
| "eval_samples_per_second": 639.123, | |
| "eval_steps_per_second": 10.253, | |
| "step": 6148 | |
| }, | |
| { | |
| "epoch": 59.0, | |
| "grad_norm": 1.1692790985107422, | |
| "learning_rate": 2.05e-05, | |
| "loss": 0.0447, | |
| "step": 6254 | |
| }, | |
| { | |
| "epoch": 59.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.75, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6857142857142857, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.8643533123028391, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8303030303030303, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1469813734292984, | |
| "eval_overall_accuracy": 0.9646606914212548, | |
| "eval_overall_f1": 0.8363636363636363, | |
| "eval_overall_precision": 0.7931034482758621, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.293, | |
| "eval_samples_per_second": 638.282, | |
| "eval_steps_per_second": 10.24, | |
| "step": 6254 | |
| }, | |
| { | |
| "epoch": 60.0, | |
| "grad_norm": 0.8121991157531738, | |
| "learning_rate": 2e-05, | |
| "loss": 0.045, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 60.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7301587301587301, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6764705882352942, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.8125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7647058823529411, | |
| "eval_QUANTITY_recall": 0.8666666666666667, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.14526785910129547, | |
| "eval_overall_accuracy": 0.9649167733674776, | |
| "eval_overall_f1": 0.8330995792426368, | |
| "eval_overall_precision": 0.792, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2933, | |
| "eval_samples_per_second": 637.529, | |
| "eval_steps_per_second": 10.228, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 61.0, | |
| "grad_norm": 0.9558350443840027, | |
| "learning_rate": 1.9500000000000003e-05, | |
| "loss": 0.0441, | |
| "step": 6466 | |
| }, | |
| { | |
| "epoch": 61.0, | |
| "eval_LOCATION_f1": 0.8749999999999999, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.84, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.7244094488188977, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8634920634920634, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1430891752243042, | |
| "eval_overall_accuracy": 0.9649167733674776, | |
| "eval_overall_f1": 0.8349788434414668, | |
| "eval_overall_precision": 0.7978436657681941, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.286, | |
| "eval_samples_per_second": 653.776, | |
| "eval_steps_per_second": 10.488, | |
| "step": 6466 | |
| }, | |
| { | |
| "epoch": 62.0, | |
| "grad_norm": 1.2547602653503418, | |
| "learning_rate": 1.9e-05, | |
| "loss": 0.0474, | |
| "step": 6572 | |
| }, | |
| { | |
| "epoch": 62.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.71875, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6571428571428571, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8616352201257862, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8253012048192772, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1453644037246704, | |
| "eval_overall_accuracy": 0.9646606914212548, | |
| "eval_overall_f1": 0.8307692307692308, | |
| "eval_overall_precision": 0.7877984084880637, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.286, | |
| "eval_samples_per_second": 653.787, | |
| "eval_steps_per_second": 10.489, | |
| "step": 6572 | |
| }, | |
| { | |
| "epoch": 63.0, | |
| "grad_norm": 0.2882705628871918, | |
| "learning_rate": 1.85e-05, | |
| "loss": 0.0441, | |
| "step": 6678 | |
| }, | |
| { | |
| "epoch": 63.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7258064516129032, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6818181818181818, | |
| "eval_ORGANIZATION_recall": 0.7758620689655172, | |
| "eval_PERSON_f1": 0.8706624605678233, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8363636363636363, | |
| "eval_PERSON_recall": 0.9078947368421053, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.14318965375423431, | |
| "eval_overall_accuracy": 0.9651728553137003, | |
| "eval_overall_f1": 0.8382559774964837, | |
| "eval_overall_precision": 0.7989276139410187, | |
| "eval_overall_recall": 0.8816568047337278, | |
| "eval_runtime": 0.2869, | |
| "eval_samples_per_second": 651.819, | |
| "eval_steps_per_second": 10.457, | |
| "step": 6678 | |
| }, | |
| { | |
| "epoch": 64.0, | |
| "grad_norm": 1.046625018119812, | |
| "learning_rate": 1.8e-05, | |
| "loss": 0.0449, | |
| "step": 6784 | |
| }, | |
| { | |
| "epoch": 64.0, | |
| "eval_LOCATION_f1": 0.8590604026845639, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7034482758620689, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.5862068965517241, | |
| "eval_ORGANIZATION_recall": 0.8793103448275862, | |
| "eval_PERSON_f1": 0.8598130841121495, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8165680473372781, | |
| "eval_PERSON_recall": 0.9078947368421053, | |
| "eval_QUANTITY_f1": 0.7575757575757577, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6944444444444444, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.16219820082187653, | |
| "eval_overall_accuracy": 0.9590268886043534, | |
| "eval_overall_f1": 0.8178137651821863, | |
| "eval_overall_precision": 0.7518610421836228, | |
| "eval_overall_recall": 0.8964497041420119, | |
| "eval_runtime": 0.2859, | |
| "eval_samples_per_second": 654.058, | |
| "eval_steps_per_second": 10.493, | |
| "step": 6784 | |
| }, | |
| { | |
| "epoch": 65.0, | |
| "grad_norm": 1.8243094682693481, | |
| "learning_rate": 1.75e-05, | |
| "loss": 0.0452, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 65.0, | |
| "eval_LOCATION_f1": 0.882758620689655, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8421052631578947, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7424242424242424, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6621621621621622, | |
| "eval_ORGANIZATION_recall": 0.8448275862068966, | |
| "eval_PERSON_f1": 0.85625, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8154761904761905, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.14889490604400635, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8349514563106797, | |
| "eval_overall_precision": 0.7859007832898173, | |
| "eval_overall_recall": 0.8905325443786982, | |
| "eval_runtime": 0.2885, | |
| "eval_samples_per_second": 648.163, | |
| "eval_steps_per_second": 10.398, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 66.0, | |
| "grad_norm": 0.7773322463035583, | |
| "learning_rate": 1.7000000000000003e-05, | |
| "loss": 0.0418, | |
| "step": 6996 | |
| }, | |
| { | |
| "epoch": 66.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7480916030534351, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6712328767123288, | |
| "eval_ORGANIZATION_recall": 0.8448275862068966, | |
| "eval_PERSON_f1": 0.8625, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8214285714285714, | |
| "eval_PERSON_recall": 0.9078947368421053, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.15430662035942078, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8349514563106797, | |
| "eval_overall_precision": 0.7859007832898173, | |
| "eval_overall_recall": 0.8905325443786982, | |
| "eval_runtime": 0.2923, | |
| "eval_samples_per_second": 639.682, | |
| "eval_steps_per_second": 10.262, | |
| "step": 6996 | |
| }, | |
| { | |
| "epoch": 67.0, | |
| "grad_norm": 0.9151946306228638, | |
| "learning_rate": 1.65e-05, | |
| "loss": 0.0421, | |
| "step": 7102 | |
| }, | |
| { | |
| "epoch": 67.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7538461538461538, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6805555555555556, | |
| "eval_ORGANIZATION_recall": 0.8448275862068966, | |
| "eval_PERSON_f1": 0.8589341692789968, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8203592814371258, | |
| "eval_PERSON_recall": 0.9013157894736842, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.15378881990909576, | |
| "eval_overall_accuracy": 0.963124199743918, | |
| "eval_overall_f1": 0.8321775312066575, | |
| "eval_overall_precision": 0.783289817232376, | |
| "eval_overall_recall": 0.8875739644970414, | |
| "eval_runtime": 0.2921, | |
| "eval_samples_per_second": 640.251, | |
| "eval_steps_per_second": 10.271, | |
| "step": 7102 | |
| }, | |
| { | |
| "epoch": 68.0, | |
| "grad_norm": 0.4768742322921753, | |
| "learning_rate": 1.6000000000000003e-05, | |
| "loss": 0.041, | |
| "step": 7208 | |
| }, | |
| { | |
| "epoch": 68.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7518796992481203, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.8620689655172413, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6857142857142857, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.15490765869617462, | |
| "eval_overall_accuracy": 0.9626120358514725, | |
| "eval_overall_f1": 0.8294036061026352, | |
| "eval_overall_precision": 0.7806788511749347, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2858, | |
| "eval_samples_per_second": 654.293, | |
| "eval_steps_per_second": 10.497, | |
| "step": 7208 | |
| }, | |
| { | |
| "epoch": 69.0, | |
| "grad_norm": 1.6758042573928833, | |
| "learning_rate": 1.55e-05, | |
| "loss": 0.0411, | |
| "step": 7314 | |
| }, | |
| { | |
| "epoch": 69.0, | |
| "eval_LOCATION_f1": 0.882758620689655, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8421052631578947, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7401574803149606, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6811594202898551, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8553459119496855, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8192771084337349, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15107131004333496, | |
| "eval_overall_accuracy": 0.9651728553137003, | |
| "eval_overall_f1": 0.8347338935574229, | |
| "eval_overall_precision": 0.7925531914893617, | |
| "eval_overall_recall": 0.8816568047337278, | |
| "eval_runtime": 0.2937, | |
| "eval_samples_per_second": 636.611, | |
| "eval_steps_per_second": 10.213, | |
| "step": 7314 | |
| }, | |
| { | |
| "epoch": 70.0, | |
| "grad_norm": 1.7515956163406372, | |
| "learning_rate": 1.5e-05, | |
| "loss": 0.0414, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 70.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7301587301587301, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6764705882352942, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8625, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8214285714285714, | |
| "eval_PERSON_recall": 0.9078947368421053, | |
| "eval_QUANTITY_f1": 0.746268656716418, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6756756756756757, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.7999999999999999, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.7741935483870968, | |
| "eval_TIME_recall": 0.8275862068965517, | |
| "eval_loss": 0.15384884178638458, | |
| "eval_overall_accuracy": 0.963124199743918, | |
| "eval_overall_f1": 0.8250000000000001, | |
| "eval_overall_precision": 0.7774869109947644, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2872, | |
| "eval_samples_per_second": 651.192, | |
| "eval_steps_per_second": 10.447, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 71.0, | |
| "grad_norm": 1.0327603816986084, | |
| "learning_rate": 1.45e-05, | |
| "loss": 0.0407, | |
| "step": 7526 | |
| }, | |
| { | |
| "epoch": 71.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7384615384615385, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.8634920634920634, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1484140008687973, | |
| "eval_overall_accuracy": 0.9649167733674776, | |
| "eval_overall_f1": 0.8375350140056023, | |
| "eval_overall_precision": 0.7952127659574468, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2923, | |
| "eval_samples_per_second": 639.759, | |
| "eval_steps_per_second": 10.264, | |
| "step": 7526 | |
| }, | |
| { | |
| "epoch": 72.0, | |
| "grad_norm": 1.021155595779419, | |
| "learning_rate": 1.4000000000000001e-05, | |
| "loss": 0.0395, | |
| "step": 7632 | |
| }, | |
| { | |
| "epoch": 72.0, | |
| "eval_LOCATION_f1": 0.8749999999999999, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.84, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.7419354838709677, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.696969696969697, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8634920634920634, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.14668720960617065, | |
| "eval_overall_accuracy": 0.9649167733674776, | |
| "eval_overall_f1": 0.8385269121813032, | |
| "eval_overall_precision": 0.8043478260869565, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.2936, | |
| "eval_samples_per_second": 636.931, | |
| "eval_steps_per_second": 10.218, | |
| "step": 7632 | |
| }, | |
| { | |
| "epoch": 73.0, | |
| "grad_norm": 0.8261666893959045, | |
| "learning_rate": 1.3500000000000001e-05, | |
| "loss": 0.0388, | |
| "step": 7738 | |
| }, | |
| { | |
| "epoch": 73.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7441860465116279, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.676056338028169, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.8634920634920634, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7936507936507938, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7575757575757576, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.14678049087524414, | |
| "eval_overall_accuracy": 0.9651728553137003, | |
| "eval_overall_f1": 0.8387096774193548, | |
| "eval_overall_precision": 0.7973333333333333, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2943, | |
| "eval_samples_per_second": 635.507, | |
| "eval_steps_per_second": 10.195, | |
| "step": 7738 | |
| }, | |
| { | |
| "epoch": 74.0, | |
| "grad_norm": 1.6623172760009766, | |
| "learning_rate": 1.3000000000000001e-05, | |
| "loss": 0.0401, | |
| "step": 7844 | |
| }, | |
| { | |
| "epoch": 74.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7441860465116279, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.676056338028169, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.8634920634920634, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15321803092956543, | |
| "eval_overall_accuracy": 0.9646606914212548, | |
| "eval_overall_f1": 0.8363636363636363, | |
| "eval_overall_precision": 0.7931034482758621, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2923, | |
| "eval_samples_per_second": 639.734, | |
| "eval_steps_per_second": 10.263, | |
| "step": 7844 | |
| }, | |
| { | |
| "epoch": 75.0, | |
| "grad_norm": 0.745629608631134, | |
| "learning_rate": 1.25e-05, | |
| "loss": 0.0376, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 75.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.71875, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6571428571428571, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15535052120685577, | |
| "eval_overall_accuracy": 0.9636363636363636, | |
| "eval_overall_f1": 0.829608938547486, | |
| "eval_overall_precision": 0.7857142857142857, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2924, | |
| "eval_samples_per_second": 639.471, | |
| "eval_steps_per_second": 10.259, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 76.0, | |
| "grad_norm": 1.3148008584976196, | |
| "learning_rate": 1.2e-05, | |
| "loss": 0.0389, | |
| "step": 8056 | |
| }, | |
| { | |
| "epoch": 76.0, | |
| "eval_LOCATION_f1": 0.8648648648648648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.810126582278481, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7480916030534351, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6712328767123288, | |
| "eval_ORGANIZATION_recall": 0.8448275862068966, | |
| "eval_PERSON_f1": 0.8634920634920634, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7500000000000001, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7058823529411765, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15534979104995728, | |
| "eval_overall_accuracy": 0.963124199743918, | |
| "eval_overall_f1": 0.8328690807799444, | |
| "eval_overall_precision": 0.7868421052631579, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2928, | |
| "eval_samples_per_second": 638.704, | |
| "eval_steps_per_second": 10.247, | |
| "step": 8056 | |
| }, | |
| { | |
| "epoch": 77.0, | |
| "grad_norm": 0.5751745104789734, | |
| "learning_rate": 1.1500000000000002e-05, | |
| "loss": 0.0385, | |
| "step": 8162 | |
| }, | |
| { | |
| "epoch": 77.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7538461538461538, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6805555555555556, | |
| "eval_ORGANIZATION_recall": 0.8448275862068966, | |
| "eval_PERSON_f1": 0.8634920634920634, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6857142857142857, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1525815725326538, | |
| "eval_overall_accuracy": 0.964404609475032, | |
| "eval_overall_f1": 0.835195530726257, | |
| "eval_overall_precision": 0.791005291005291, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2918, | |
| "eval_samples_per_second": 640.799, | |
| "eval_steps_per_second": 10.28, | |
| "step": 8162 | |
| }, | |
| { | |
| "epoch": 78.0, | |
| "grad_norm": 1.434624195098877, | |
| "learning_rate": 1.1000000000000001e-05, | |
| "loss": 0.0375, | |
| "step": 8268 | |
| }, | |
| { | |
| "epoch": 78.0, | |
| "eval_LOCATION_f1": 0.882758620689655, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8421052631578947, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7286821705426356, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6619718309859155, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6857142857142857, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15279057621955872, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.829608938547486, | |
| "eval_overall_precision": 0.7857142857142857, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2926, | |
| "eval_samples_per_second": 639.034, | |
| "eval_steps_per_second": 10.252, | |
| "step": 8268 | |
| }, | |
| { | |
| "epoch": 79.0, | |
| "grad_norm": 0.7510130405426025, | |
| "learning_rate": 1.05e-05, | |
| "loss": 0.0373, | |
| "step": 8374 | |
| }, | |
| { | |
| "epoch": 79.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7244094488188977, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1517334133386612, | |
| "eval_overall_accuracy": 0.964404609475032, | |
| "eval_overall_f1": 0.8330995792426368, | |
| "eval_overall_precision": 0.792, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2862, | |
| "eval_samples_per_second": 653.312, | |
| "eval_steps_per_second": 10.481, | |
| "step": 8374 | |
| }, | |
| { | |
| "epoch": 80.0, | |
| "grad_norm": 0.686745822429657, | |
| "learning_rate": 1e-05, | |
| "loss": 0.0375, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 80.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7401574803149606, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6811594202898551, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8553459119496855, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8192771084337349, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7500000000000001, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7058823529411765, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15770980715751648, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.829608938547486, | |
| "eval_overall_precision": 0.7857142857142857, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2918, | |
| "eval_samples_per_second": 640.906, | |
| "eval_steps_per_second": 10.282, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 81.0, | |
| "grad_norm": 2.2296547889709473, | |
| "learning_rate": 9.5e-06, | |
| "loss": 0.0371, | |
| "step": 8586 | |
| }, | |
| { | |
| "epoch": 81.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7384615384615385, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1602996438741684, | |
| "eval_overall_accuracy": 0.963124199743918, | |
| "eval_overall_f1": 0.8317107093184978, | |
| "eval_overall_precision": 0.7847769028871391, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2862, | |
| "eval_samples_per_second": 653.41, | |
| "eval_steps_per_second": 10.483, | |
| "step": 8586 | |
| }, | |
| { | |
| "epoch": 82.0, | |
| "grad_norm": 1.0859251022338867, | |
| "learning_rate": 9e-06, | |
| "loss": 0.0364, | |
| "step": 8692 | |
| }, | |
| { | |
| "epoch": 82.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7441860465116279, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.676056338028169, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15970273315906525, | |
| "eval_overall_accuracy": 0.9633802816901409, | |
| "eval_overall_f1": 0.8328690807799444, | |
| "eval_overall_precision": 0.7868421052631579, | |
| "eval_overall_recall": 0.8846153846153846, | |
| "eval_runtime": 0.2856, | |
| "eval_samples_per_second": 654.808, | |
| "eval_steps_per_second": 10.505, | |
| "step": 8692 | |
| }, | |
| { | |
| "epoch": 83.0, | |
| "grad_norm": 0.759631872177124, | |
| "learning_rate": 8.500000000000002e-06, | |
| "loss": 0.0355, | |
| "step": 8798 | |
| }, | |
| { | |
| "epoch": 83.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.71875, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6571428571428571, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15819035470485687, | |
| "eval_overall_accuracy": 0.963124199743918, | |
| "eval_overall_f1": 0.8284518828451882, | |
| "eval_overall_precision": 0.783641160949868, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2921, | |
| "eval_samples_per_second": 640.257, | |
| "eval_steps_per_second": 10.271, | |
| "step": 8798 | |
| }, | |
| { | |
| "epoch": 84.0, | |
| "grad_norm": 3.2821595668792725, | |
| "learning_rate": 8.000000000000001e-06, | |
| "loss": 0.0352, | |
| "step": 8904 | |
| }, | |
| { | |
| "epoch": 84.0, | |
| "eval_LOCATION_f1": 0.8648648648648648, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.810126582278481, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7175572519083969, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6438356164383562, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6857142857142857, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8333333333333334, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8064516129032258, | |
| "eval_TIME_recall": 0.8620689655172413, | |
| "eval_loss": 0.1597450226545334, | |
| "eval_overall_accuracy": 0.9620998719590269, | |
| "eval_overall_f1": 0.8210818307905687, | |
| "eval_overall_precision": 0.7728459530026109, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.2916, | |
| "eval_samples_per_second": 641.288, | |
| "eval_steps_per_second": 10.288, | |
| "step": 8904 | |
| }, | |
| { | |
| "epoch": 85.0, | |
| "grad_norm": 1.4578148126602173, | |
| "learning_rate": 7.5e-06, | |
| "loss": 0.0351, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 85.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.71875, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6571428571428571, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8634920634920634, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15464067459106445, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8319327731092437, | |
| "eval_overall_precision": 0.7898936170212766, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.291, | |
| "eval_samples_per_second": 642.532, | |
| "eval_steps_per_second": 10.308, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 86.0, | |
| "grad_norm": 3.6410322189331055, | |
| "learning_rate": 7.000000000000001e-06, | |
| "loss": 0.0358, | |
| "step": 9116 | |
| }, | |
| { | |
| "epoch": 86.0, | |
| "eval_LOCATION_f1": 0.882758620689655, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8421052631578947, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7131782945736435, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.647887323943662, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8634920634920634, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15458884835243225, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8319327731092437, | |
| "eval_overall_precision": 0.7898936170212766, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2879, | |
| "eval_samples_per_second": 649.619, | |
| "eval_steps_per_second": 10.422, | |
| "step": 9116 | |
| }, | |
| { | |
| "epoch": 87.0, | |
| "grad_norm": 0.8341395854949951, | |
| "learning_rate": 6.5000000000000004e-06, | |
| "loss": 0.0359, | |
| "step": 9222 | |
| }, | |
| { | |
| "epoch": 87.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7175572519083969, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6438356164383562, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15657885372638702, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8312412831241283, | |
| "eval_overall_precision": 0.7862796833773087, | |
| "eval_overall_recall": 0.8816568047337278, | |
| "eval_runtime": 0.2923, | |
| "eval_samples_per_second": 639.721, | |
| "eval_steps_per_second": 10.263, | |
| "step": 9222 | |
| }, | |
| { | |
| "epoch": 88.0, | |
| "grad_norm": 2.221242904663086, | |
| "learning_rate": 6e-06, | |
| "loss": 0.0338, | |
| "step": 9328 | |
| }, | |
| { | |
| "epoch": 88.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7086614173228347, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6521739130434783, | |
| "eval_ORGANIZATION_recall": 0.7758620689655172, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15500542521476746, | |
| "eval_overall_accuracy": 0.9641485275288092, | |
| "eval_overall_f1": 0.8302945301542777, | |
| "eval_overall_precision": 0.7893333333333333, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.2854, | |
| "eval_samples_per_second": 655.275, | |
| "eval_steps_per_second": 10.512, | |
| "step": 9328 | |
| }, | |
| { | |
| "epoch": 89.0, | |
| "grad_norm": 0.7178964018821716, | |
| "learning_rate": 5.500000000000001e-06, | |
| "loss": 0.0324, | |
| "step": 9434 | |
| }, | |
| { | |
| "epoch": 89.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.703125, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6428571428571429, | |
| "eval_ORGANIZATION_recall": 0.7758620689655172, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15786349773406982, | |
| "eval_overall_accuracy": 0.9633802816901409, | |
| "eval_overall_f1": 0.8256624825662484, | |
| "eval_overall_precision": 0.7810026385224275, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.2857, | |
| "eval_samples_per_second": 654.47, | |
| "eval_steps_per_second": 10.5, | |
| "step": 9434 | |
| }, | |
| { | |
| "epoch": 90.0, | |
| "grad_norm": 1.6527904272079468, | |
| "learning_rate": 5e-06, | |
| "loss": 0.034, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 90.0, | |
| "eval_LOCATION_f1": 0.8571428571428572, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8076923076923077, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.71875, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6571428571428571, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15783792734146118, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8268156424581006, | |
| "eval_overall_precision": 0.783068783068783, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.2925, | |
| "eval_samples_per_second": 639.316, | |
| "eval_steps_per_second": 10.256, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 91.0, | |
| "grad_norm": 1.0714702606201172, | |
| "learning_rate": 4.5e-06, | |
| "loss": 0.0353, | |
| "step": 9646 | |
| }, | |
| { | |
| "epoch": 91.0, | |
| "eval_LOCATION_f1": 0.8571428571428572, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8076923076923077, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.7343749999999999, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6714285714285714, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15797153115272522, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.829608938547486, | |
| "eval_overall_precision": 0.7857142857142857, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.286, | |
| "eval_samples_per_second": 653.836, | |
| "eval_steps_per_second": 10.489, | |
| "step": 9646 | |
| }, | |
| { | |
| "epoch": 92.0, | |
| "grad_norm": 1.2929750680923462, | |
| "learning_rate": 4.000000000000001e-06, | |
| "loss": 0.0325, | |
| "step": 9752 | |
| }, | |
| { | |
| "epoch": 92.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.71875, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6571428571428571, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.78125, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7352941176470589, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15651264786720276, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8307692307692308, | |
| "eval_overall_precision": 0.7877984084880637, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2929, | |
| "eval_samples_per_second": 638.474, | |
| "eval_steps_per_second": 10.243, | |
| "step": 9752 | |
| }, | |
| { | |
| "epoch": 93.0, | |
| "grad_norm": 0.8345323801040649, | |
| "learning_rate": 3.5000000000000004e-06, | |
| "loss": 0.0344, | |
| "step": 9858 | |
| }, | |
| { | |
| "epoch": 93.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7343749999999999, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6714285714285714, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6857142857142857, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1590217500925064, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8284518828451882, | |
| "eval_overall_precision": 0.783641160949868, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2919, | |
| "eval_samples_per_second": 640.648, | |
| "eval_steps_per_second": 10.278, | |
| "step": 9858 | |
| }, | |
| { | |
| "epoch": 94.0, | |
| "grad_norm": 0.6701174974441528, | |
| "learning_rate": 3e-06, | |
| "loss": 0.0336, | |
| "step": 9964 | |
| }, | |
| { | |
| "epoch": 94.0, | |
| "eval_LOCATION_f1": 0.8571428571428572, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8076923076923077, | |
| "eval_LOCATION_recall": 0.9130434782608695, | |
| "eval_ORGANIZATION_f1": 0.7286821705426356, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6619718309859155, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7500000000000001, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7058823529411765, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1604832261800766, | |
| "eval_overall_accuracy": 0.9633802816901409, | |
| "eval_overall_f1": 0.8256624825662484, | |
| "eval_overall_precision": 0.7810026385224275, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.2864, | |
| "eval_samples_per_second": 652.822, | |
| "eval_steps_per_second": 10.473, | |
| "step": 9964 | |
| }, | |
| { | |
| "epoch": 95.0, | |
| "grad_norm": 0.5713714361190796, | |
| "learning_rate": 2.5e-06, | |
| "loss": 0.0337, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 95.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7244094488188977, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.16034719347953796, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.829608938547486, | |
| "eval_overall_precision": 0.7857142857142857, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2857, | |
| "eval_samples_per_second": 654.607, | |
| "eval_steps_per_second": 10.502, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 96.0, | |
| "grad_norm": 1.4332071542739868, | |
| "learning_rate": 2.0000000000000003e-06, | |
| "loss": 0.0326, | |
| "step": 10176 | |
| }, | |
| { | |
| "epoch": 96.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.703125, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6428571428571429, | |
| "eval_ORGANIZATION_recall": 0.7758620689655172, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1593874990940094, | |
| "eval_overall_accuracy": 0.9633802816901409, | |
| "eval_overall_f1": 0.8256624825662484, | |
| "eval_overall_precision": 0.7810026385224275, | |
| "eval_overall_recall": 0.8757396449704142, | |
| "eval_runtime": 0.2921, | |
| "eval_samples_per_second": 640.143, | |
| "eval_steps_per_second": 10.27, | |
| "step": 10176 | |
| }, | |
| { | |
| "epoch": 97.0, | |
| "grad_norm": 1.3420923948287964, | |
| "learning_rate": 1.5e-06, | |
| "loss": 0.0352, | |
| "step": 10282 | |
| }, | |
| { | |
| "epoch": 97.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7244094488188977, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6666666666666666, | |
| "eval_ORGANIZATION_recall": 0.7931034482758621, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7692307692307692, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.7142857142857143, | |
| "eval_QUANTITY_recall": 0.8333333333333334, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15942679345607758, | |
| "eval_overall_accuracy": 0.9641485275288092, | |
| "eval_overall_f1": 0.8307692307692308, | |
| "eval_overall_precision": 0.7877984084880637, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2927, | |
| "eval_samples_per_second": 638.801, | |
| "eval_steps_per_second": 10.248, | |
| "step": 10282 | |
| }, | |
| { | |
| "epoch": 98.0, | |
| "grad_norm": 2.652052402496338, | |
| "learning_rate": 1.0000000000000002e-06, | |
| "loss": 0.0329, | |
| "step": 10388 | |
| }, | |
| { | |
| "epoch": 98.0, | |
| "eval_LOCATION_f1": 0.8767123287671235, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8311688311688312, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7343749999999999, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6714285714285714, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6857142857142857, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1578895002603531, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8307692307692308, | |
| "eval_overall_precision": 0.7877984084880637, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2858, | |
| "eval_samples_per_second": 654.385, | |
| "eval_steps_per_second": 10.498, | |
| "step": 10388 | |
| }, | |
| { | |
| "epoch": 99.0, | |
| "grad_norm": 1.3167122602462769, | |
| "learning_rate": 5.000000000000001e-07, | |
| "loss": 0.0321, | |
| "step": 10494 | |
| }, | |
| { | |
| "epoch": 99.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.75, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6857142857142857, | |
| "eval_ORGANIZATION_recall": 0.8275862068965517, | |
| "eval_PERSON_f1": 0.860759493670886, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8292682926829268, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6857142857142857, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.15904921293258667, | |
| "eval_overall_accuracy": 0.9641485275288092, | |
| "eval_overall_f1": 0.8324022346368716, | |
| "eval_overall_precision": 0.7883597883597884, | |
| "eval_overall_recall": 0.8816568047337278, | |
| "eval_runtime": 0.293, | |
| "eval_samples_per_second": 638.168, | |
| "eval_steps_per_second": 10.238, | |
| "step": 10494 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "grad_norm": 0.26482483744621277, | |
| "learning_rate": 0.0, | |
| "loss": 0.0322, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "eval_LOCATION_f1": 0.870748299319728, | |
| "eval_LOCATION_number": 69, | |
| "eval_LOCATION_precision": 0.8205128205128205, | |
| "eval_LOCATION_recall": 0.927536231884058, | |
| "eval_ORGANIZATION_f1": 0.7343749999999999, | |
| "eval_ORGANIZATION_number": 58, | |
| "eval_ORGANIZATION_precision": 0.6714285714285714, | |
| "eval_ORGANIZATION_recall": 0.8103448275862069, | |
| "eval_PERSON_f1": 0.8580441640378549, | |
| "eval_PERSON_number": 152, | |
| "eval_PERSON_precision": 0.8242424242424242, | |
| "eval_PERSON_recall": 0.8947368421052632, | |
| "eval_QUANTITY_f1": 0.7384615384615385, | |
| "eval_QUANTITY_number": 30, | |
| "eval_QUANTITY_precision": 0.6857142857142857, | |
| "eval_QUANTITY_recall": 0.8, | |
| "eval_TIME_f1": 0.8666666666666666, | |
| "eval_TIME_number": 29, | |
| "eval_TIME_precision": 0.8387096774193549, | |
| "eval_TIME_recall": 0.896551724137931, | |
| "eval_loss": 0.1596968173980713, | |
| "eval_overall_accuracy": 0.9638924455825865, | |
| "eval_overall_f1": 0.8284518828451882, | |
| "eval_overall_precision": 0.783641160949868, | |
| "eval_overall_recall": 0.878698224852071, | |
| "eval_runtime": 0.2913, | |
| "eval_samples_per_second": 641.846, | |
| "eval_steps_per_second": 10.297, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "step": 10600, | |
| "total_flos": 4535639530574946.0, | |
| "train_loss": 0.08503569045156803, | |
| "train_runtime": 606.7172, | |
| "train_samples_per_second": 278.054, | |
| "train_steps_per_second": 17.471 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 10600, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 100, | |
| "save_steps": 500, | |
| "total_flos": 4535639530574946.0, | |
| "train_batch_size": 16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |