| { |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 100.0, |
| "eval_steps": 500, |
| "global_step": 9600, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "grad_norm": 1.4548790454864502, |
| "learning_rate": 4.9500000000000004e-05, |
| "loss": 1.1704, |
| "step": 96 |
| }, |
| { |
| "epoch": 1.0, |
| "eval_LOCATION_f1": 0.0, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.0, |
| "eval_LOCATION_recall": 0.0, |
| "eval_ORGANIZATION_f1": 0.0, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.0, |
| "eval_ORGANIZATION_recall": 0.0, |
| "eval_PERSON_f1": 0.0, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.0, |
| "eval_PERSON_recall": 0.0, |
| "eval_loss": 0.708549976348877, |
| "eval_overall_accuracy": 0.8342935528120713, |
| "eval_overall_f1": 0.0, |
| "eval_overall_precision": 0.0, |
| "eval_overall_recall": 0.0, |
| "eval_runtime": 0.2796, |
| "eval_samples_per_second": 608.047, |
| "eval_steps_per_second": 10.73, |
| "step": 96 |
| }, |
| { |
| "epoch": 2.0, |
| "grad_norm": 1.531407117843628, |
| "learning_rate": 4.9e-05, |
| "loss": 0.668, |
| "step": 192 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_LOCATION_f1": 0.0, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.0, |
| "eval_LOCATION_recall": 0.0, |
| "eval_ORGANIZATION_f1": 0.011904761904761906, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.5, |
| "eval_ORGANIZATION_recall": 0.006024096385542169, |
| "eval_PERSON_f1": 0.0, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.0, |
| "eval_PERSON_recall": 0.0, |
| "eval_loss": 0.5722576975822449, |
| "eval_overall_accuracy": 0.8348422496570644, |
| "eval_overall_f1": 0.00495049504950495, |
| "eval_overall_precision": 0.3333333333333333, |
| "eval_overall_recall": 0.0024937655860349127, |
| "eval_runtime": 0.2814, |
| "eval_samples_per_second": 604.079, |
| "eval_steps_per_second": 10.66, |
| "step": 192 |
| }, |
| { |
| "epoch": 3.0, |
| "grad_norm": 0.9092353582382202, |
| "learning_rate": 4.85e-05, |
| "loss": 0.5537, |
| "step": 288 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_LOCATION_f1": 0.0, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.0, |
| "eval_LOCATION_recall": 0.0, |
| "eval_ORGANIZATION_f1": 0.10526315789473684, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.4166666666666667, |
| "eval_ORGANIZATION_recall": 0.060240963855421686, |
| "eval_PERSON_f1": 0.09090909090909091, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.23529411764705882, |
| "eval_PERSON_recall": 0.056338028169014086, |
| "eval_loss": 0.44938454031944275, |
| "eval_overall_accuracy": 0.8455418381344307, |
| "eval_overall_f1": 0.07809110629067245, |
| "eval_overall_precision": 0.3, |
| "eval_overall_recall": 0.04488778054862843, |
| "eval_runtime": 0.2836, |
| "eval_samples_per_second": 599.368, |
| "eval_steps_per_second": 10.577, |
| "step": 288 |
| }, |
| { |
| "epoch": 4.0, |
| "grad_norm": 1.0577952861785889, |
| "learning_rate": 4.8e-05, |
| "loss": 0.4382, |
| "step": 384 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_LOCATION_f1": 0.10434782608695652, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.2727272727272727, |
| "eval_LOCATION_recall": 0.06451612903225806, |
| "eval_ORGANIZATION_f1": 0.31724137931034485, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.3709677419354839, |
| "eval_ORGANIZATION_recall": 0.27710843373493976, |
| "eval_PERSON_f1": 0.4230769230769231, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.38823529411764707, |
| "eval_PERSON_recall": 0.4647887323943662, |
| "eval_loss": 0.3280525207519531, |
| "eval_overall_accuracy": 0.8883401920438957, |
| "eval_overall_f1": 0.32914923291492326, |
| "eval_overall_precision": 0.37341772151898733, |
| "eval_overall_recall": 0.2942643391521197, |
| "eval_runtime": 0.2879, |
| "eval_samples_per_second": 590.4, |
| "eval_steps_per_second": 10.419, |
| "step": 384 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.9427235126495361, |
| "learning_rate": 4.75e-05, |
| "loss": 0.32, |
| "step": 480 |
| }, |
| { |
| "epoch": 5.0, |
| "eval_LOCATION_f1": 0.3312883435582822, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.38571428571428573, |
| "eval_LOCATION_recall": 0.2903225806451613, |
| "eval_ORGANIZATION_f1": 0.5650969529085873, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.5230769230769231, |
| "eval_ORGANIZATION_recall": 0.6144578313253012, |
| "eval_PERSON_f1": 0.6498422712933754, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.5885714285714285, |
| "eval_PERSON_recall": 0.7253521126760564, |
| "eval_loss": 0.2350081503391266, |
| "eval_overall_accuracy": 0.9292181069958848, |
| "eval_overall_f1": 0.5517241379310345, |
| "eval_overall_precision": 0.5272727272727272, |
| "eval_overall_recall": 0.5785536159600998, |
| "eval_runtime": 0.2889, |
| "eval_samples_per_second": 588.423, |
| "eval_steps_per_second": 10.384, |
| "step": 480 |
| }, |
| { |
| "epoch": 6.0, |
| "grad_norm": 1.7494196891784668, |
| "learning_rate": 4.7e-05, |
| "loss": 0.2426, |
| "step": 576 |
| }, |
| { |
| "epoch": 6.0, |
| "eval_LOCATION_f1": 0.5775401069518716, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.574468085106383, |
| "eval_LOCATION_recall": 0.5806451612903226, |
| "eval_ORGANIZATION_f1": 0.6775067750677507, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.6157635467980296, |
| "eval_ORGANIZATION_recall": 0.7530120481927711, |
| "eval_PERSON_f1": 0.8208469055374593, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.7636363636363637, |
| "eval_PERSON_recall": 0.8873239436619719, |
| "eval_loss": 0.18390628695487976, |
| "eval_overall_accuracy": 0.9511659807956104, |
| "eval_overall_f1": 0.7068366164542296, |
| "eval_overall_precision": 0.6601731601731602, |
| "eval_overall_recall": 0.7605985037406484, |
| "eval_runtime": 0.2856, |
| "eval_samples_per_second": 595.176, |
| "eval_steps_per_second": 10.503, |
| "step": 576 |
| }, |
| { |
| "epoch": 7.0, |
| "grad_norm": 0.9670518040657043, |
| "learning_rate": 4.6500000000000005e-05, |
| "loss": 0.1962, |
| "step": 672 |
| }, |
| { |
| "epoch": 7.0, |
| "eval_LOCATION_f1": 0.7301587301587302, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.71875, |
| "eval_LOCATION_recall": 0.7419354838709677, |
| "eval_ORGANIZATION_f1": 0.7333333333333334, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.6804123711340206, |
| "eval_ORGANIZATION_recall": 0.7951807228915663, |
| "eval_PERSON_f1": 0.9292929292929293, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.8903225806451613, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.1462562382221222, |
| "eval_overall_accuracy": 0.9618655692729767, |
| "eval_overall_f1": 0.8014184397163121, |
| "eval_overall_precision": 0.7617977528089888, |
| "eval_overall_recall": 0.8453865336658354, |
| "eval_runtime": 0.2846, |
| "eval_samples_per_second": 597.237, |
| "eval_steps_per_second": 10.539, |
| "step": 672 |
| }, |
| { |
| "epoch": 8.0, |
| "grad_norm": 0.7352226376533508, |
| "learning_rate": 4.600000000000001e-05, |
| "loss": 0.1696, |
| "step": 768 |
| }, |
| { |
| "epoch": 8.0, |
| "eval_LOCATION_f1": 0.7894736842105262, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.7731958762886598, |
| "eval_LOCATION_recall": 0.8064516129032258, |
| "eval_ORGANIZATION_f1": 0.7727272727272727, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.7311827956989247, |
| "eval_ORGANIZATION_recall": 0.8192771084337349, |
| "eval_PERSON_f1": 0.9383561643835617, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9133333333333333, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.11997510492801666, |
| "eval_overall_accuracy": 0.9681755829903979, |
| "eval_overall_f1": 0.8345323741007196, |
| "eval_overall_precision": 0.8036951501154734, |
| "eval_overall_recall": 0.8678304239401496, |
| "eval_runtime": 0.2879, |
| "eval_samples_per_second": 590.554, |
| "eval_steps_per_second": 10.422, |
| "step": 768 |
| }, |
| { |
| "epoch": 9.0, |
| "grad_norm": 0.8205360174179077, |
| "learning_rate": 4.55e-05, |
| "loss": 0.1508, |
| "step": 864 |
| }, |
| { |
| "epoch": 9.0, |
| "eval_LOCATION_f1": 0.8290155440414508, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8, |
| "eval_LOCATION_recall": 0.8602150537634409, |
| "eval_ORGANIZATION_f1": 0.7897727272727273, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.7473118279569892, |
| "eval_ORGANIZATION_recall": 0.8373493975903614, |
| "eval_PERSON_f1": 0.9387755102040817, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9078947368421053, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.10688301175832748, |
| "eval_overall_accuracy": 0.9695473251028807, |
| "eval_overall_f1": 0.8510131108462454, |
| "eval_overall_precision": 0.815068493150685, |
| "eval_overall_recall": 0.8902743142144638, |
| "eval_runtime": 0.2939, |
| "eval_samples_per_second": 578.353, |
| "eval_steps_per_second": 10.206, |
| "step": 864 |
| }, |
| { |
| "epoch": 10.0, |
| "grad_norm": 1.3305693864822388, |
| "learning_rate": 4.5e-05, |
| "loss": 0.1359, |
| "step": 960 |
| }, |
| { |
| "epoch": 10.0, |
| "eval_LOCATION_f1": 0.8229166666666666, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.797979797979798, |
| "eval_LOCATION_recall": 0.8494623655913979, |
| "eval_ORGANIZATION_f1": 0.8011363636363636, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.7580645161290323, |
| "eval_ORGANIZATION_recall": 0.8493975903614458, |
| "eval_PERSON_f1": 0.9415807560137458, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9194630872483222, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.09369462728500366, |
| "eval_overall_accuracy": 0.9711934156378601, |
| "eval_overall_f1": 0.8550898203592814, |
| "eval_overall_precision": 0.8225806451612904, |
| "eval_overall_recall": 0.8902743142144638, |
| "eval_runtime": 0.2851, |
| "eval_samples_per_second": 596.337, |
| "eval_steps_per_second": 10.524, |
| "step": 960 |
| }, |
| { |
| "epoch": 11.0, |
| "grad_norm": 0.8002439141273499, |
| "learning_rate": 4.4500000000000004e-05, |
| "loss": 0.126, |
| "step": 1056 |
| }, |
| { |
| "epoch": 11.0, |
| "eval_LOCATION_f1": 0.8205128205128205, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.7843137254901961, |
| "eval_LOCATION_recall": 0.8602150537634409, |
| "eval_ORGANIZATION_f1": 0.8171428571428571, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.7771739130434783, |
| "eval_ORGANIZATION_recall": 0.8614457831325302, |
| "eval_PERSON_f1": 0.9383561643835617, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9133333333333333, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.08726800233125687, |
| "eval_overall_accuracy": 0.9725651577503429, |
| "eval_overall_f1": 0.860215053763441, |
| "eval_overall_precision": 0.8256880733944955, |
| "eval_overall_recall": 0.8977556109725686, |
| "eval_runtime": 0.2848, |
| "eval_samples_per_second": 596.875, |
| "eval_steps_per_second": 10.533, |
| "step": 1056 |
| }, |
| { |
| "epoch": 12.0, |
| "grad_norm": 5.6661248207092285, |
| "learning_rate": 4.4000000000000006e-05, |
| "loss": 0.1191, |
| "step": 1152 |
| }, |
| { |
| "epoch": 12.0, |
| "eval_LOCATION_f1": 0.83248730964467, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.7884615384615384, |
| "eval_LOCATION_recall": 0.8817204301075269, |
| "eval_ORGANIZATION_f1": 0.8328611898016998, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.786096256684492, |
| "eval_ORGANIZATION_recall": 0.8855421686746988, |
| "eval_PERSON_f1": 0.9415807560137458, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9194630872483222, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.08264537155628204, |
| "eval_overall_accuracy": 0.9739368998628258, |
| "eval_overall_f1": 0.8703923900118906, |
| "eval_overall_precision": 0.8318181818181818, |
| "eval_overall_recall": 0.912718204488778, |
| "eval_runtime": 0.2805, |
| "eval_samples_per_second": 605.976, |
| "eval_steps_per_second": 10.694, |
| "step": 1152 |
| }, |
| { |
| "epoch": 13.0, |
| "grad_norm": 1.2274419069290161, |
| "learning_rate": 4.35e-05, |
| "loss": 0.1126, |
| "step": 1248 |
| }, |
| { |
| "epoch": 13.0, |
| "eval_LOCATION_f1": 0.8615384615384616, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8235294117647058, |
| "eval_LOCATION_recall": 0.9032258064516129, |
| "eval_ORGANIZATION_f1": 0.8497109826589595, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8166666666666667, |
| "eval_ORGANIZATION_recall": 0.8855421686746988, |
| "eval_PERSON_f1": 0.9480968858131488, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9319727891156463, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.07422925531864166, |
| "eval_overall_accuracy": 0.9769547325102881, |
| "eval_overall_f1": 0.8867469879518073, |
| "eval_overall_precision": 0.8578088578088578, |
| "eval_overall_recall": 0.9177057356608479, |
| "eval_runtime": 0.2855, |
| "eval_samples_per_second": 595.43, |
| "eval_steps_per_second": 10.508, |
| "step": 1248 |
| }, |
| { |
| "epoch": 14.0, |
| "grad_norm": 1.3920135498046875, |
| "learning_rate": 4.3e-05, |
| "loss": 0.1061, |
| "step": 1344 |
| }, |
| { |
| "epoch": 14.0, |
| "eval_LOCATION_f1": 0.8808290155440415, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.85, |
| "eval_LOCATION_recall": 0.9139784946236559, |
| "eval_ORGANIZATION_f1": 0.8613569321533923, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8439306358381503, |
| "eval_ORGANIZATION_recall": 0.8795180722891566, |
| "eval_PERSON_f1": 0.9480968858131488, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9319727891156463, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.07068616151809692, |
| "eval_overall_accuracy": 0.978875171467764, |
| "eval_overall_f1": 0.8964677222898904, |
| "eval_overall_precision": 0.8761904761904762, |
| "eval_overall_recall": 0.9177057356608479, |
| "eval_runtime": 0.2797, |
| "eval_samples_per_second": 607.712, |
| "eval_steps_per_second": 10.724, |
| "step": 1344 |
| }, |
| { |
| "epoch": 15.0, |
| "grad_norm": 0.7759754061698914, |
| "learning_rate": 4.25e-05, |
| "loss": 0.1003, |
| "step": 1440 |
| }, |
| { |
| "epoch": 15.0, |
| "eval_LOCATION_f1": 0.8911917098445595, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.86, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8612716763005781, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8277777777777777, |
| "eval_ORGANIZATION_recall": 0.8975903614457831, |
| "eval_PERSON_f1": 0.9547038327526133, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9448275862068966, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.0703127458691597, |
| "eval_overall_accuracy": 0.9783264746227709, |
| "eval_overall_f1": 0.9007263922518159, |
| "eval_overall_precision": 0.8752941176470588, |
| "eval_overall_recall": 0.9276807980049875, |
| "eval_runtime": 0.2858, |
| "eval_samples_per_second": 594.799, |
| "eval_steps_per_second": 10.496, |
| "step": 1440 |
| }, |
| { |
| "epoch": 16.0, |
| "grad_norm": 1.396679401397705, |
| "learning_rate": 4.2e-05, |
| "loss": 0.1008, |
| "step": 1536 |
| }, |
| { |
| "epoch": 16.0, |
| "eval_LOCATION_f1": 0.8923076923076922, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8529411764705882, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.8645533141210374, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8287292817679558, |
| "eval_ORGANIZATION_recall": 0.9036144578313253, |
| "eval_PERSON_f1": 0.9480968858131488, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9319727891156463, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.06862790882587433, |
| "eval_overall_accuracy": 0.9777777777777777, |
| "eval_overall_f1": 0.9001203369434417, |
| "eval_overall_precision": 0.8697674418604651, |
| "eval_overall_recall": 0.9326683291770573, |
| "eval_runtime": 0.2841, |
| "eval_samples_per_second": 598.386, |
| "eval_steps_per_second": 10.56, |
| "step": 1536 |
| }, |
| { |
| "epoch": 17.0, |
| "grad_norm": 0.9365902543067932, |
| "learning_rate": 4.15e-05, |
| "loss": 0.0957, |
| "step": 1632 |
| }, |
| { |
| "epoch": 17.0, |
| "eval_LOCATION_f1": 0.8911917098445595, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.86, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8790560471976401, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.861271676300578, |
| "eval_ORGANIZATION_recall": 0.8975903614457831, |
| "eval_PERSON_f1": 0.9580419580419581, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9513888888888888, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.061672553420066833, |
| "eval_overall_accuracy": 0.980246913580247, |
| "eval_overall_f1": 0.9095354523227384, |
| "eval_overall_precision": 0.8920863309352518, |
| "eval_overall_recall": 0.9276807980049875, |
| "eval_runtime": 0.2841, |
| "eval_samples_per_second": 598.364, |
| "eval_steps_per_second": 10.559, |
| "step": 1632 |
| }, |
| { |
| "epoch": 18.0, |
| "grad_norm": 0.5375998616218567, |
| "learning_rate": 4.1e-05, |
| "loss": 0.0923, |
| "step": 1728 |
| }, |
| { |
| "epoch": 18.0, |
| "eval_LOCATION_f1": 0.8958333333333334, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8686868686868687, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8842729970326408, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8713450292397661, |
| "eval_ORGANIZATION_recall": 0.8975903614457831, |
| "eval_PERSON_f1": 0.9614035087719298, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.958041958041958, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.05938532203435898, |
| "eval_overall_accuracy": 0.9818930041152263, |
| "eval_overall_f1": 0.9140049140049139, |
| "eval_overall_precision": 0.9007263922518159, |
| "eval_overall_recall": 0.9276807980049875, |
| "eval_runtime": 0.2789, |
| "eval_samples_per_second": 609.62, |
| "eval_steps_per_second": 10.758, |
| "step": 1728 |
| }, |
| { |
| "epoch": 19.0, |
| "grad_norm": 0.978545069694519, |
| "learning_rate": 4.05e-05, |
| "loss": 0.0894, |
| "step": 1824 |
| }, |
| { |
| "epoch": 19.0, |
| "eval_LOCATION_f1": 0.8923076923076922, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8529411764705882, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.8672566371681416, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8497109826589595, |
| "eval_ORGANIZATION_recall": 0.8855421686746988, |
| "eval_PERSON_f1": 0.9547038327526133, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9448275862068966, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.05911582335829735, |
| "eval_overall_accuracy": 0.9799725651577503, |
| "eval_overall_f1": 0.9037758830694275, |
| "eval_overall_precision": 0.8833333333333333, |
| "eval_overall_recall": 0.9251870324189526, |
| "eval_runtime": 0.2842, |
| "eval_samples_per_second": 598.194, |
| "eval_steps_per_second": 10.556, |
| "step": 1824 |
| }, |
| { |
| "epoch": 20.0, |
| "grad_norm": 1.320235252380371, |
| "learning_rate": 4e-05, |
| "loss": 0.0852, |
| "step": 1920 |
| }, |
| { |
| "epoch": 20.0, |
| "eval_LOCATION_f1": 0.883248730964467, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8365384615384616, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.8742514970059881, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8690476190476191, |
| "eval_ORGANIZATION_recall": 0.8795180722891566, |
| "eval_PERSON_f1": 0.9547038327526133, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9448275862068966, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.05648750439286232, |
| "eval_overall_accuracy": 0.9813443072702333, |
| "eval_overall_f1": 0.9046454767726162, |
| "eval_overall_precision": 0.8872901678657075, |
| "eval_overall_recall": 0.9226932668329177, |
| "eval_runtime": 0.2816, |
| "eval_samples_per_second": 603.678, |
| "eval_steps_per_second": 10.653, |
| "step": 1920 |
| }, |
| { |
| "epoch": 21.0, |
| "grad_norm": 1.0660918951034546, |
| "learning_rate": 3.9500000000000005e-05, |
| "loss": 0.0857, |
| "step": 2016 |
| }, |
| { |
| "epoch": 21.0, |
| "eval_LOCATION_f1": 0.8787878787878788, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8285714285714286, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.8739002932551319, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8514285714285714, |
| "eval_ORGANIZATION_recall": 0.8975903614457831, |
| "eval_PERSON_f1": 0.9614035087719298, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.958041958041958, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.059097353368997574, |
| "eval_overall_accuracy": 0.9816186556927298, |
| "eval_overall_f1": 0.9053398058252428, |
| "eval_overall_precision": 0.8817966903073287, |
| "eval_overall_recall": 0.9301745635910225, |
| "eval_runtime": 0.2823, |
| "eval_samples_per_second": 602.231, |
| "eval_steps_per_second": 10.628, |
| "step": 2016 |
| }, |
| { |
| "epoch": 22.0, |
| "grad_norm": 1.226671576499939, |
| "learning_rate": 3.9000000000000006e-05, |
| "loss": 0.0817, |
| "step": 2112 |
| }, |
| { |
| "epoch": 22.0, |
| "eval_LOCATION_f1": 0.8787878787878788, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8285714285714286, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.8705882352941176, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8505747126436781, |
| "eval_ORGANIZATION_recall": 0.891566265060241, |
| "eval_PERSON_f1": 0.9547038327526133, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9448275862068966, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.05854226276278496, |
| "eval_overall_accuracy": 0.9807956104252401, |
| "eval_overall_f1": 0.9018181818181819, |
| "eval_overall_precision": 0.8773584905660378, |
| "eval_overall_recall": 0.9276807980049875, |
| "eval_runtime": 0.2824, |
| "eval_samples_per_second": 601.972, |
| "eval_steps_per_second": 10.623, |
| "step": 2112 |
| }, |
| { |
| "epoch": 23.0, |
| "grad_norm": 1.1954342126846313, |
| "learning_rate": 3.85e-05, |
| "loss": 0.0792, |
| "step": 2208 |
| }, |
| { |
| "epoch": 23.0, |
| "eval_LOCATION_f1": 0.882051282051282, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8431372549019608, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8674698795180723, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8674698795180723, |
| "eval_ORGANIZATION_recall": 0.8674698795180723, |
| "eval_PERSON_f1": 0.9614035087719298, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.958041958041958, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.05442183464765549, |
| "eval_overall_accuracy": 0.9810699588477366, |
| "eval_overall_f1": 0.9039408866995073, |
| "eval_overall_precision": 0.8929440389294404, |
| "eval_overall_recall": 0.9152119700748129, |
| "eval_runtime": 0.2813, |
| "eval_samples_per_second": 604.426, |
| "eval_steps_per_second": 10.666, |
| "step": 2208 |
| }, |
| { |
| "epoch": 24.0, |
| "grad_norm": 1.1046844720840454, |
| "learning_rate": 3.8e-05, |
| "loss": 0.0788, |
| "step": 2304 |
| }, |
| { |
| "epoch": 24.0, |
| "eval_LOCATION_f1": 0.8730964467005077, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8269230769230769, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8674698795180723, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8674698795180723, |
| "eval_ORGANIZATION_recall": 0.8674698795180723, |
| "eval_PERSON_f1": 0.9614035087719298, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.958041958041958, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.05480505898594856, |
| "eval_overall_accuracy": 0.9810699588477366, |
| "eval_overall_f1": 0.9017199017199016, |
| "eval_overall_precision": 0.8886198547215496, |
| "eval_overall_recall": 0.9152119700748129, |
| "eval_runtime": 0.2815, |
| "eval_samples_per_second": 603.885, |
| "eval_steps_per_second": 10.657, |
| "step": 2304 |
| }, |
| { |
| "epoch": 25.0, |
| "grad_norm": 1.003726840019226, |
| "learning_rate": 3.7500000000000003e-05, |
| "loss": 0.0772, |
| "step": 2400 |
| }, |
| { |
| "epoch": 25.0, |
| "eval_LOCATION_f1": 0.883248730964467, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8365384615384616, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.8802395209580839, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.875, |
| "eval_ORGANIZATION_recall": 0.8855421686746988, |
| "eval_PERSON_f1": 0.9580419580419581, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9513888888888888, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.05413680523633957, |
| "eval_overall_accuracy": 0.9816186556927298, |
| "eval_overall_f1": 0.9082007343941249, |
| "eval_overall_precision": 0.8918269230769231, |
| "eval_overall_recall": 0.9251870324189526, |
| "eval_runtime": 0.285, |
| "eval_samples_per_second": 596.532, |
| "eval_steps_per_second": 10.527, |
| "step": 2400 |
| }, |
| { |
| "epoch": 26.0, |
| "grad_norm": 0.39463770389556885, |
| "learning_rate": 3.7e-05, |
| "loss": 0.0755, |
| "step": 2496 |
| }, |
| { |
| "epoch": 26.0, |
| "eval_LOCATION_f1": 0.900523560209424, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8775510204081632, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.890207715133531, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8771929824561403, |
| "eval_ORGANIZATION_recall": 0.9036144578313253, |
| "eval_PERSON_f1": 0.9580419580419581, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.9513888888888888, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.05070779472589493, |
| "eval_overall_accuracy": 0.9835390946502057, |
| "eval_overall_f1": 0.9164619164619164, |
| "eval_overall_precision": 0.9031476997578692, |
| "eval_overall_recall": 0.9301745635910225, |
| "eval_runtime": 0.2828, |
| "eval_samples_per_second": 601.218, |
| "eval_steps_per_second": 10.61, |
| "step": 2496 |
| }, |
| { |
| "epoch": 27.0, |
| "grad_norm": 2.091871500015259, |
| "learning_rate": 3.65e-05, |
| "loss": 0.0717, |
| "step": 2592 |
| }, |
| { |
| "epoch": 27.0, |
| "eval_LOCATION_f1": 0.8958333333333334, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8686868686868687, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8882352941176471, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.867816091954023, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.9614035087719298, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.958041958041958, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.05057214945554733, |
| "eval_overall_accuracy": 0.9840877914951989, |
| "eval_overall_f1": 0.9155446756425949, |
| "eval_overall_precision": 0.8990384615384616, |
| "eval_overall_recall": 0.9326683291770573, |
| "eval_runtime": 0.2821, |
| "eval_samples_per_second": 602.66, |
| "eval_steps_per_second": 10.635, |
| "step": 2592 |
| }, |
| { |
| "epoch": 28.0, |
| "grad_norm": 1.2802491188049316, |
| "learning_rate": 3.6e-05, |
| "loss": 0.0725, |
| "step": 2688 |
| }, |
| { |
| "epoch": 28.0, |
| "eval_LOCATION_f1": 0.8775510204081631, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8349514563106796, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8869047619047619, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8764705882352941, |
| "eval_ORGANIZATION_recall": 0.8975903614457831, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.05177851393818855, |
| "eval_overall_accuracy": 0.9832647462277092, |
| "eval_overall_f1": 0.9142156862745099, |
| "eval_overall_precision": 0.8987951807228916, |
| "eval_overall_recall": 0.9301745635910225, |
| "eval_runtime": 0.284, |
| "eval_samples_per_second": 598.592, |
| "eval_steps_per_second": 10.563, |
| "step": 2688 |
| }, |
| { |
| "epoch": 29.0, |
| "grad_norm": 0.523560643196106, |
| "learning_rate": 3.55e-05, |
| "loss": 0.0713, |
| "step": 2784 |
| }, |
| { |
| "epoch": 29.0, |
| "eval_LOCATION_f1": 0.882051282051282, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8431372549019608, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.88955223880597, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8816568047337278, |
| "eval_ORGANIZATION_recall": 0.8975903614457831, |
| "eval_PERSON_f1": 0.9614035087719298, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.958041958041958, |
| "eval_PERSON_recall": 0.9647887323943662, |
| "eval_loss": 0.050521016120910645, |
| "eval_overall_accuracy": 0.9832647462277092, |
| "eval_overall_f1": 0.9128834355828221, |
| "eval_overall_precision": 0.8985507246376812, |
| "eval_overall_recall": 0.9276807980049875, |
| "eval_runtime": 0.2811, |
| "eval_samples_per_second": 604.758, |
| "eval_steps_per_second": 10.672, |
| "step": 2784 |
| }, |
| { |
| "epoch": 30.0, |
| "grad_norm": 1.3990178108215332, |
| "learning_rate": 3.5e-05, |
| "loss": 0.0671, |
| "step": 2880 |
| }, |
| { |
| "epoch": 30.0, |
| "eval_LOCATION_f1": 0.8958333333333334, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8686868686868687, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.9020771513353115, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8888888888888888, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.047653622925281525, |
| "eval_overall_accuracy": 0.984636488340192, |
| "eval_overall_f1": 0.9249692496924969, |
| "eval_overall_precision": 0.912621359223301, |
| "eval_overall_recall": 0.9376558603491272, |
| "eval_runtime": 0.2809, |
| "eval_samples_per_second": 605.116, |
| "eval_steps_per_second": 10.679, |
| "step": 2880 |
| }, |
| { |
| "epoch": 31.0, |
| "grad_norm": 0.28008055686950684, |
| "learning_rate": 3.45e-05, |
| "loss": 0.0666, |
| "step": 2976 |
| }, |
| { |
| "epoch": 31.0, |
| "eval_LOCATION_f1": 0.8775510204081631, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8349514563106796, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8855421686746989, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8855421686746988, |
| "eval_ORGANIZATION_recall": 0.8855421686746988, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04800420626997948, |
| "eval_overall_accuracy": 0.9838134430727024, |
| "eval_overall_f1": 0.9137931034482758, |
| "eval_overall_precision": 0.902676399026764, |
| "eval_overall_recall": 0.9251870324189526, |
| "eval_runtime": 0.2841, |
| "eval_samples_per_second": 598.335, |
| "eval_steps_per_second": 10.559, |
| "step": 2976 |
| }, |
| { |
| "epoch": 32.0, |
| "grad_norm": 4.019622325897217, |
| "learning_rate": 3.4000000000000007e-05, |
| "loss": 0.0638, |
| "step": 3072 |
| }, |
| { |
| "epoch": 32.0, |
| "eval_LOCATION_f1": 0.8865979381443299, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8514851485148515, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8948948948948949, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8922155688622755, |
| "eval_ORGANIZATION_recall": 0.8975903614457831, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.048197515308856964, |
| "eval_overall_accuracy": 0.9843621399176955, |
| "eval_overall_f1": 0.9198520345252775, |
| "eval_overall_precision": 0.9097560975609756, |
| "eval_overall_recall": 0.9301745635910225, |
| "eval_runtime": 0.2816, |
| "eval_samples_per_second": 603.772, |
| "eval_steps_per_second": 10.655, |
| "step": 3072 |
| }, |
| { |
| "epoch": 33.0, |
| "grad_norm": 0.4553819000720978, |
| "learning_rate": 3.35e-05, |
| "loss": 0.0647, |
| "step": 3168 |
| }, |
| { |
| "epoch": 33.0, |
| "eval_LOCATION_f1": 0.8775510204081631, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8349514563106796, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.888888888888889, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8862275449101796, |
| "eval_ORGANIZATION_recall": 0.891566265060241, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.048246119171381, |
| "eval_overall_accuracy": 0.9835390946502057, |
| "eval_overall_f1": 0.915129151291513, |
| "eval_overall_precision": 0.9029126213592233, |
| "eval_overall_recall": 0.9276807980049875, |
| "eval_runtime": 0.2812, |
| "eval_samples_per_second": 604.507, |
| "eval_steps_per_second": 10.668, |
| "step": 3168 |
| }, |
| { |
| "epoch": 34.0, |
| "grad_norm": 0.8945901393890381, |
| "learning_rate": 3.3e-05, |
| "loss": 0.0642, |
| "step": 3264 |
| }, |
| { |
| "epoch": 34.0, |
| "eval_LOCATION_f1": 0.882051282051282, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8431372549019608, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8934911242603549, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.877906976744186, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.968421052631579, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.965034965034965, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.048569679260253906, |
| "eval_overall_accuracy": 0.9832647462277092, |
| "eval_overall_f1": 0.9168704156479217, |
| "eval_overall_precision": 0.8992805755395683, |
| "eval_overall_recall": 0.9351620947630923, |
| "eval_runtime": 0.2909, |
| "eval_samples_per_second": 584.352, |
| "eval_steps_per_second": 10.312, |
| "step": 3264 |
| }, |
| { |
| "epoch": 35.0, |
| "grad_norm": 1.6167196035385132, |
| "learning_rate": 3.2500000000000004e-05, |
| "loss": 0.0603, |
| "step": 3360 |
| }, |
| { |
| "epoch": 35.0, |
| "eval_LOCATION_f1": 0.8865979381443299, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8514851485148515, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8982035928143712, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8928571428571429, |
| "eval_ORGANIZATION_recall": 0.9036144578313253, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04634106531739235, |
| "eval_overall_accuracy": 0.9851851851851852, |
| "eval_overall_f1": 0.9211822660098522, |
| "eval_overall_precision": 0.9099756690997567, |
| "eval_overall_recall": 0.9326683291770573, |
| "eval_runtime": 0.2828, |
| "eval_samples_per_second": 601.2, |
| "eval_steps_per_second": 10.609, |
| "step": 3360 |
| }, |
| { |
| "epoch": 36.0, |
| "grad_norm": 0.5620716214179993, |
| "learning_rate": 3.2000000000000005e-05, |
| "loss": 0.0627, |
| "step": 3456 |
| }, |
| { |
| "epoch": 36.0, |
| "eval_LOCATION_f1": 0.8775510204081631, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8349514563106796, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.8955223880597014, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8875739644970414, |
| "eval_ORGANIZATION_recall": 0.9036144578313253, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04827764630317688, |
| "eval_overall_accuracy": 0.984636488340192, |
| "eval_overall_f1": 0.9177914110429448, |
| "eval_overall_precision": 0.9033816425120773, |
| "eval_overall_recall": 0.9326683291770573, |
| "eval_runtime": 0.2836, |
| "eval_samples_per_second": 599.34, |
| "eval_steps_per_second": 10.577, |
| "step": 3456 |
| }, |
| { |
| "epoch": 37.0, |
| "grad_norm": 2.3784847259521484, |
| "learning_rate": 3.15e-05, |
| "loss": 0.0606, |
| "step": 3552 |
| }, |
| { |
| "epoch": 37.0, |
| "eval_LOCATION_f1": 0.900523560209424, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8775510204081632, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.9085545722713864, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8901734104046243, |
| "eval_ORGANIZATION_recall": 0.927710843373494, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04605403542518616, |
| "eval_overall_accuracy": 0.9854595336076818, |
| "eval_overall_f1": 0.9287469287469288, |
| "eval_overall_precision": 0.9152542372881356, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.287, |
| "eval_samples_per_second": 592.388, |
| "eval_steps_per_second": 10.454, |
| "step": 3552 |
| }, |
| { |
| "epoch": 38.0, |
| "grad_norm": 0.48580947518348694, |
| "learning_rate": 3.1e-05, |
| "loss": 0.0602, |
| "step": 3648 |
| }, |
| { |
| "epoch": 38.0, |
| "eval_LOCATION_f1": 0.9100529100529101, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8958333333333334, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.9112426035502958, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8953488372093024, |
| "eval_ORGANIZATION_recall": 0.927710843373494, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04565339908003807, |
| "eval_overall_accuracy": 0.9857338820301783, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2829, |
| "eval_samples_per_second": 601.012, |
| "eval_steps_per_second": 10.606, |
| "step": 3648 |
| }, |
| { |
| "epoch": 39.0, |
| "grad_norm": 1.0675240755081177, |
| "learning_rate": 3.05e-05, |
| "loss": 0.058, |
| "step": 3744 |
| }, |
| { |
| "epoch": 39.0, |
| "eval_LOCATION_f1": 0.9052631578947367, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8865979381443299, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.9085545722713864, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8901734104046243, |
| "eval_ORGANIZATION_recall": 0.927710843373494, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04524984955787659, |
| "eval_overall_accuracy": 0.9860082304526749, |
| "eval_overall_f1": 0.929889298892989, |
| "eval_overall_precision": 0.9174757281553398, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2837, |
| "eval_samples_per_second": 599.125, |
| "eval_steps_per_second": 10.573, |
| "step": 3744 |
| }, |
| { |
| "epoch": 40.0, |
| "grad_norm": 1.1679747104644775, |
| "learning_rate": 3e-05, |
| "loss": 0.0579, |
| "step": 3840 |
| }, |
| { |
| "epoch": 40.0, |
| "eval_LOCATION_f1": 0.9100529100529101, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8958333333333334, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.9107142857142857, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.044337525963783264, |
| "eval_overall_accuracy": 0.9862825788751715, |
| "eval_overall_f1": 0.9320148331273177, |
| "eval_overall_precision": 0.9240196078431373, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2853, |
| "eval_samples_per_second": 595.872, |
| "eval_steps_per_second": 10.515, |
| "step": 3840 |
| }, |
| { |
| "epoch": 41.0, |
| "grad_norm": 0.8956630229949951, |
| "learning_rate": 2.95e-05, |
| "loss": 0.0551, |
| "step": 3936 |
| }, |
| { |
| "epoch": 41.0, |
| "eval_LOCATION_f1": 0.9100529100529101, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8958333333333334, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.9144542772861357, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8959537572254336, |
| "eval_ORGANIZATION_recall": 0.9337349397590361, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04385361447930336, |
| "eval_overall_accuracy": 0.9868312757201646, |
| "eval_overall_f1": 0.9334975369458128, |
| "eval_overall_precision": 0.9221411192214112, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2844, |
| "eval_samples_per_second": 597.724, |
| "eval_steps_per_second": 10.548, |
| "step": 3936 |
| }, |
| { |
| "epoch": 42.0, |
| "grad_norm": 1.3600409030914307, |
| "learning_rate": 2.9e-05, |
| "loss": 0.0568, |
| "step": 4032 |
| }, |
| { |
| "epoch": 42.0, |
| "eval_LOCATION_f1": 0.90625, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8787878787878788, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9047619047619048, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8941176470588236, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.043516892939805984, |
| "eval_overall_accuracy": 0.9865569272976681, |
| "eval_overall_f1": 0.9285714285714285, |
| "eval_overall_precision": 0.9172749391727494, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2806, |
| "eval_samples_per_second": 605.74, |
| "eval_steps_per_second": 10.69, |
| "step": 4032 |
| }, |
| { |
| "epoch": 43.0, |
| "grad_norm": 0.8620499968528748, |
| "learning_rate": 2.8499999999999998e-05, |
| "loss": 0.0557, |
| "step": 4128 |
| }, |
| { |
| "epoch": 43.0, |
| "eval_LOCATION_f1": 0.9157894736842105, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8969072164948454, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.906906906906907, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9041916167664671, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04396757110953331, |
| "eval_overall_accuracy": 0.9860082304526749, |
| "eval_overall_f1": 0.9318463444857497, |
| "eval_overall_precision": 0.9261083743842364, |
| "eval_overall_recall": 0.9376558603491272, |
| "eval_runtime": 0.2853, |
| "eval_samples_per_second": 595.869, |
| "eval_steps_per_second": 10.515, |
| "step": 4128 |
| }, |
| { |
| "epoch": 44.0, |
| "grad_norm": 0.3250766396522522, |
| "learning_rate": 2.8000000000000003e-05, |
| "loss": 0.0582, |
| "step": 4224 |
| }, |
| { |
| "epoch": 44.0, |
| "eval_LOCATION_f1": 0.8923076923076922, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8529411764705882, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.896969696969697, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9024390243902439, |
| "eval_ORGANIZATION_recall": 0.891566265060241, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04460552707314491, |
| "eval_overall_accuracy": 0.9843621399176955, |
| "eval_overall_f1": 0.9221260815822002, |
| "eval_overall_precision": 0.9142156862745098, |
| "eval_overall_recall": 0.9301745635910225, |
| "eval_runtime": 0.2824, |
| "eval_samples_per_second": 601.921, |
| "eval_steps_per_second": 10.622, |
| "step": 4224 |
| }, |
| { |
| "epoch": 45.0, |
| "grad_norm": 1.508424997329712, |
| "learning_rate": 2.7500000000000004e-05, |
| "loss": 0.0548, |
| "step": 4320 |
| }, |
| { |
| "epoch": 45.0, |
| "eval_LOCATION_f1": 0.9109947643979057, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8877551020408163, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9161676646706587, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9107142857142857, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.042420320212841034, |
| "eval_overall_accuracy": 0.9865569272976681, |
| "eval_overall_f1": 0.9344870210135972, |
| "eval_overall_precision": 0.9264705882352942, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2838, |
| "eval_samples_per_second": 598.985, |
| "eval_steps_per_second": 10.57, |
| "step": 4320 |
| }, |
| { |
| "epoch": 46.0, |
| "grad_norm": 0.7623454928398132, |
| "learning_rate": 2.7000000000000002e-05, |
| "loss": 0.0533, |
| "step": 4416 |
| }, |
| { |
| "epoch": 46.0, |
| "eval_LOCATION_f1": 0.90625, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8787878787878788, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9041916167664671, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8988095238095238, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.0423850379884243, |
| "eval_overall_accuracy": 0.9865569272976681, |
| "eval_overall_f1": 0.928395061728395, |
| "eval_overall_precision": 0.9193154034229829, |
| "eval_overall_recall": 0.9376558603491272, |
| "eval_runtime": 0.2812, |
| "eval_samples_per_second": 604.565, |
| "eval_steps_per_second": 10.669, |
| "step": 4416 |
| }, |
| { |
| "epoch": 47.0, |
| "grad_norm": 0.9061383008956909, |
| "learning_rate": 2.6500000000000004e-05, |
| "loss": 0.0516, |
| "step": 4512 |
| }, |
| { |
| "epoch": 47.0, |
| "eval_LOCATION_f1": 0.8958333333333334, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8686868686868687, |
| "eval_LOCATION_recall": 0.9247311827956989, |
| "eval_ORGANIZATION_f1": 0.912280701754386, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8863636363636364, |
| "eval_ORGANIZATION_recall": 0.9397590361445783, |
| "eval_PERSON_f1": 0.968421052631579, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.965034965034965, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.0428488552570343, |
| "eval_overall_accuracy": 0.9860082304526749, |
| "eval_overall_f1": 0.9279609279609279, |
| "eval_overall_precision": 0.9090909090909091, |
| "eval_overall_recall": 0.9476309226932669, |
| "eval_runtime": 0.283, |
| "eval_samples_per_second": 600.703, |
| "eval_steps_per_second": 10.601, |
| "step": 4512 |
| }, |
| { |
| "epoch": 48.0, |
| "grad_norm": 0.753669798374176, |
| "learning_rate": 2.6000000000000002e-05, |
| "loss": 0.0501, |
| "step": 4608 |
| }, |
| { |
| "epoch": 48.0, |
| "eval_LOCATION_f1": 0.90625, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8787878787878788, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.906906906906907, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9041916167664671, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04297007992863655, |
| "eval_overall_accuracy": 0.9862825788751715, |
| "eval_overall_f1": 0.9295426452410381, |
| "eval_overall_precision": 0.9215686274509803, |
| "eval_overall_recall": 0.9376558603491272, |
| "eval_runtime": 0.2827, |
| "eval_samples_per_second": 601.339, |
| "eval_steps_per_second": 10.612, |
| "step": 4608 |
| }, |
| { |
| "epoch": 49.0, |
| "grad_norm": 1.0571324825286865, |
| "learning_rate": 2.5500000000000003e-05, |
| "loss": 0.053, |
| "step": 4704 |
| }, |
| { |
| "epoch": 49.0, |
| "eval_LOCATION_f1": 0.90625, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8787878787878788, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9134328358208955, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9053254437869822, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04329885542392731, |
| "eval_overall_accuracy": 0.9865569272976681, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2818, |
| "eval_samples_per_second": 603.355, |
| "eval_steps_per_second": 10.647, |
| "step": 4704 |
| }, |
| { |
| "epoch": 50.0, |
| "grad_norm": 0.5389184355735779, |
| "learning_rate": 2.5e-05, |
| "loss": 0.0483, |
| "step": 4800 |
| }, |
| { |
| "epoch": 50.0, |
| "eval_LOCATION_f1": 0.9206349206349206, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.90625, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04164545238018036, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9343246592317225, |
| "eval_overall_precision": 0.9285714285714286, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2839, |
| "eval_samples_per_second": 598.843, |
| "eval_steps_per_second": 10.568, |
| "step": 4800 |
| }, |
| { |
| "epoch": 51.0, |
| "grad_norm": 0.6280408501625061, |
| "learning_rate": 2.45e-05, |
| "loss": 0.0505, |
| "step": 4896 |
| }, |
| { |
| "epoch": 51.0, |
| "eval_LOCATION_f1": 0.9214659685863874, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8979591836734694, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9096385542168675, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9096385542168675, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04181710258126259, |
| "eval_overall_accuracy": 0.9865569272976681, |
| "eval_overall_f1": 0.9343246592317225, |
| "eval_overall_precision": 0.9285714285714286, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2821, |
| "eval_samples_per_second": 602.699, |
| "eval_steps_per_second": 10.636, |
| "step": 4896 |
| }, |
| { |
| "epoch": 52.0, |
| "grad_norm": 0.9616138935089111, |
| "learning_rate": 2.4e-05, |
| "loss": 0.05, |
| "step": 4992 |
| }, |
| { |
| "epoch": 52.0, |
| "eval_LOCATION_f1": 0.9304812834224598, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.925531914893617, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9053254437869822, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8895348837209303, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04034818708896637, |
| "eval_overall_accuracy": 0.9879286694101509, |
| "eval_overall_f1": 0.9344870210135972, |
| "eval_overall_precision": 0.9264705882352942, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2816, |
| "eval_samples_per_second": 603.695, |
| "eval_steps_per_second": 10.653, |
| "step": 4992 |
| }, |
| { |
| "epoch": 53.0, |
| "grad_norm": 0.9302768111228943, |
| "learning_rate": 2.35e-05, |
| "loss": 0.0493, |
| "step": 5088 |
| }, |
| { |
| "epoch": 53.0, |
| "eval_LOCATION_f1": 0.9157894736842105, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8969072164948454, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04219473525881767, |
| "eval_overall_accuracy": 0.9860082304526749, |
| "eval_overall_f1": 0.9331683168316831, |
| "eval_overall_precision": 0.9262899262899262, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2812, |
| "eval_samples_per_second": 604.63, |
| "eval_steps_per_second": 10.67, |
| "step": 5088 |
| }, |
| { |
| "epoch": 54.0, |
| "grad_norm": 0.40551334619522095, |
| "learning_rate": 2.3000000000000003e-05, |
| "loss": 0.0487, |
| "step": 5184 |
| }, |
| { |
| "epoch": 54.0, |
| "eval_LOCATION_f1": 0.925531914893617, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.9157894736842105, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9134328358208955, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9053254437869822, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04084800183773041, |
| "eval_overall_accuracy": 0.9876543209876543, |
| "eval_overall_f1": 0.9368029739776952, |
| "eval_overall_precision": 0.9310344827586207, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2813, |
| "eval_samples_per_second": 604.233, |
| "eval_steps_per_second": 10.663, |
| "step": 5184 |
| }, |
| { |
| "epoch": 55.0, |
| "grad_norm": 1.221318244934082, |
| "learning_rate": 2.25e-05, |
| "loss": 0.0485, |
| "step": 5280 |
| }, |
| { |
| "epoch": 55.0, |
| "eval_LOCATION_f1": 0.925531914893617, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.9157894736842105, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9194029850746269, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9112426035502958, |
| "eval_ORGANIZATION_recall": 0.927710843373494, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04019373282790184, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9392812887236679, |
| "eval_overall_precision": 0.9334975369458128, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2806, |
| "eval_samples_per_second": 605.767, |
| "eval_steps_per_second": 10.69, |
| "step": 5280 |
| }, |
| { |
| "epoch": 56.0, |
| "grad_norm": 2.138538360595703, |
| "learning_rate": 2.2000000000000003e-05, |
| "loss": 0.0491, |
| "step": 5376 |
| }, |
| { |
| "epoch": 56.0, |
| "eval_LOCATION_f1": 0.9109947643979057, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8877551020408163, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9144542772861357, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8959537572254336, |
| "eval_ORGANIZATION_recall": 0.9337349397590361, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.043160635977983475, |
| "eval_overall_accuracy": 0.9862825788751715, |
| "eval_overall_f1": 0.9336609336609337, |
| "eval_overall_precision": 0.9200968523002422, |
| "eval_overall_recall": 0.9476309226932669, |
| "eval_runtime": 0.2797, |
| "eval_samples_per_second": 607.881, |
| "eval_steps_per_second": 10.727, |
| "step": 5376 |
| }, |
| { |
| "epoch": 57.0, |
| "grad_norm": 0.7274695038795471, |
| "learning_rate": 2.15e-05, |
| "loss": 0.0495, |
| "step": 5472 |
| }, |
| { |
| "epoch": 57.0, |
| "eval_LOCATION_f1": 0.9214659685863874, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8979591836734694, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04091630131006241, |
| "eval_overall_accuracy": 0.9865569272976681, |
| "eval_overall_f1": 0.9344870210135972, |
| "eval_overall_precision": 0.9264705882352942, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2809, |
| "eval_samples_per_second": 605.197, |
| "eval_steps_per_second": 10.68, |
| "step": 5472 |
| }, |
| { |
| "epoch": 58.0, |
| "grad_norm": 0.6043224334716797, |
| "learning_rate": 2.1e-05, |
| "loss": 0.0495, |
| "step": 5568 |
| }, |
| { |
| "epoch": 58.0, |
| "eval_LOCATION_f1": 0.9214659685863874, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8979591836734694, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04245884343981743, |
| "eval_overall_accuracy": 0.9865569272976681, |
| "eval_overall_f1": 0.9344870210135972, |
| "eval_overall_precision": 0.9264705882352942, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2821, |
| "eval_samples_per_second": 602.589, |
| "eval_steps_per_second": 10.634, |
| "step": 5568 |
| }, |
| { |
| "epoch": 59.0, |
| "grad_norm": 0.7443007826805115, |
| "learning_rate": 2.05e-05, |
| "loss": 0.0462, |
| "step": 5664 |
| }, |
| { |
| "epoch": 59.0, |
| "eval_LOCATION_f1": 0.9214659685863874, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8979591836734694, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9129129129129129, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9101796407185628, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04124193638563156, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9356435643564357, |
| "eval_overall_precision": 0.9287469287469288, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2806, |
| "eval_samples_per_second": 605.911, |
| "eval_steps_per_second": 10.693, |
| "step": 5664 |
| }, |
| { |
| "epoch": 60.0, |
| "grad_norm": 1.2478013038635254, |
| "learning_rate": 2e-05, |
| "loss": 0.048, |
| "step": 5760 |
| }, |
| { |
| "epoch": 60.0, |
| "eval_LOCATION_f1": 0.9263157894736843, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.9072164948453608, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9156626506024096, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9156626506024096, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.040921688079833984, |
| "eval_overall_accuracy": 0.9868312757201646, |
| "eval_overall_f1": 0.9379652605459058, |
| "eval_overall_precision": 0.9333333333333333, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2812, |
| "eval_samples_per_second": 604.536, |
| "eval_steps_per_second": 10.668, |
| "step": 5760 |
| }, |
| { |
| "epoch": 61.0, |
| "grad_norm": 0.783888578414917, |
| "learning_rate": 1.9500000000000003e-05, |
| "loss": 0.048, |
| "step": 5856 |
| }, |
| { |
| "epoch": 61.0, |
| "eval_LOCATION_f1": 0.9214659685863874, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8979591836734694, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9129129129129129, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9101796407185628, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03963721916079521, |
| "eval_overall_accuracy": 0.9879286694101509, |
| "eval_overall_f1": 0.9356435643564357, |
| "eval_overall_precision": 0.9287469287469288, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2837, |
| "eval_samples_per_second": 599.237, |
| "eval_steps_per_second": 10.575, |
| "step": 5856 |
| }, |
| { |
| "epoch": 62.0, |
| "grad_norm": 1.2428171634674072, |
| "learning_rate": 1.9e-05, |
| "loss": 0.0461, |
| "step": 5952 |
| }, |
| { |
| "epoch": 62.0, |
| "eval_LOCATION_f1": 0.9157894736842105, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8969072164948454, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9014925373134328, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.893491124260355, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.040256600826978683, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9295426452410381, |
| "eval_overall_precision": 0.9215686274509803, |
| "eval_overall_recall": 0.9376558603491272, |
| "eval_runtime": 0.2805, |
| "eval_samples_per_second": 606.008, |
| "eval_steps_per_second": 10.694, |
| "step": 5952 |
| }, |
| { |
| "epoch": 63.0, |
| "grad_norm": 3.580406427383423, |
| "learning_rate": 1.85e-05, |
| "loss": 0.0459, |
| "step": 6048 |
| }, |
| { |
| "epoch": 63.0, |
| "eval_LOCATION_f1": 0.9166666666666667, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8888888888888888, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9189189189189191, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9161676646706587, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04053889960050583, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9369592088998765, |
| "eval_overall_precision": 0.928921568627451, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2795, |
| "eval_samples_per_second": 608.325, |
| "eval_steps_per_second": 10.735, |
| "step": 6048 |
| }, |
| { |
| "epoch": 64.0, |
| "grad_norm": 0.41149088740348816, |
| "learning_rate": 1.8e-05, |
| "loss": 0.0461, |
| "step": 6144 |
| }, |
| { |
| "epoch": 64.0, |
| "eval_LOCATION_f1": 0.9157894736842105, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8969072164948454, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.8988095238095238, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.888235294117647, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03941579535603523, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.928395061728395, |
| "eval_overall_precision": 0.9193154034229829, |
| "eval_overall_recall": 0.9376558603491272, |
| "eval_runtime": 0.2836, |
| "eval_samples_per_second": 599.391, |
| "eval_steps_per_second": 10.577, |
| "step": 6144 |
| }, |
| { |
| "epoch": 65.0, |
| "grad_norm": 0.4289607107639313, |
| "learning_rate": 1.75e-05, |
| "loss": 0.0431, |
| "step": 6240 |
| }, |
| { |
| "epoch": 65.0, |
| "eval_LOCATION_f1": 0.9214659685863874, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8979591836734694, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9063444108761329, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9090909090909091, |
| "eval_ORGANIZATION_recall": 0.9036144578313253, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.040837135165929794, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9330024813895781, |
| "eval_overall_precision": 0.928395061728395, |
| "eval_overall_recall": 0.9376558603491272, |
| "eval_runtime": 0.282, |
| "eval_samples_per_second": 602.839, |
| "eval_steps_per_second": 10.638, |
| "step": 6240 |
| }, |
| { |
| "epoch": 66.0, |
| "grad_norm": 0.7041921615600586, |
| "learning_rate": 1.7000000000000003e-05, |
| "loss": 0.0448, |
| "step": 6336 |
| }, |
| { |
| "epoch": 66.0, |
| "eval_LOCATION_f1": 0.9263157894736843, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.9072164948453608, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9134328358208955, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9053254437869822, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03957487642765045, |
| "eval_overall_accuracy": 0.9876543209876543, |
| "eval_overall_f1": 0.9369592088998765, |
| "eval_overall_precision": 0.928921568627451, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2803, |
| "eval_samples_per_second": 606.538, |
| "eval_steps_per_second": 10.704, |
| "step": 6336 |
| }, |
| { |
| "epoch": 67.0, |
| "grad_norm": 0.8772794008255005, |
| "learning_rate": 1.65e-05, |
| "loss": 0.044, |
| "step": 6432 |
| }, |
| { |
| "epoch": 67.0, |
| "eval_LOCATION_f1": 0.9214659685863874, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8979591836734694, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9063444108761329, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9090909090909091, |
| "eval_ORGANIZATION_recall": 0.9036144578313253, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04030785709619522, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9330024813895781, |
| "eval_overall_precision": 0.928395061728395, |
| "eval_overall_recall": 0.9376558603491272, |
| "eval_runtime": 0.2815, |
| "eval_samples_per_second": 603.992, |
| "eval_steps_per_second": 10.659, |
| "step": 6432 |
| }, |
| { |
| "epoch": 68.0, |
| "grad_norm": 0.5797802209854126, |
| "learning_rate": 1.6000000000000003e-05, |
| "loss": 0.0439, |
| "step": 6528 |
| }, |
| { |
| "epoch": 68.0, |
| "eval_LOCATION_f1": 0.9166666666666667, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8888888888888888, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9151515151515153, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9207317073170732, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04043779894709587, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9354838709677419, |
| "eval_overall_precision": 0.9308641975308642, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2801, |
| "eval_samples_per_second": 607.009, |
| "eval_steps_per_second": 10.712, |
| "step": 6528 |
| }, |
| { |
| "epoch": 69.0, |
| "grad_norm": 1.7521965503692627, |
| "learning_rate": 1.55e-05, |
| "loss": 0.0451, |
| "step": 6624 |
| }, |
| { |
| "epoch": 69.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9151515151515153, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9207317073170732, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.0415940061211586, |
| "eval_overall_accuracy": 0.9868312757201646, |
| "eval_overall_f1": 0.9343246592317225, |
| "eval_overall_precision": 0.9285714285714286, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2807, |
| "eval_samples_per_second": 605.718, |
| "eval_steps_per_second": 10.689, |
| "step": 6624 |
| }, |
| { |
| "epoch": 70.0, |
| "grad_norm": 1.2547327280044556, |
| "learning_rate": 1.5e-05, |
| "loss": 0.0429, |
| "step": 6720 |
| }, |
| { |
| "epoch": 70.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9134328358208955, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9053254437869822, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04034920409321785, |
| "eval_overall_accuracy": 0.9876543209876543, |
| "eval_overall_f1": 0.9334975369458128, |
| "eval_overall_precision": 0.9221411192214112, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2822, |
| "eval_samples_per_second": 602.384, |
| "eval_steps_per_second": 10.63, |
| "step": 6720 |
| }, |
| { |
| "epoch": 71.0, |
| "grad_norm": 0.7320692539215088, |
| "learning_rate": 1.45e-05, |
| "loss": 0.0447, |
| "step": 6816 |
| }, |
| { |
| "epoch": 71.0, |
| "eval_LOCATION_f1": 0.9214659685863874, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8979591836734694, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9221556886227544, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9166666666666666, |
| "eval_ORGANIZATION_recall": 0.927710843373494, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04022010415792465, |
| "eval_overall_accuracy": 0.9876543209876543, |
| "eval_overall_f1": 0.9394313967861558, |
| "eval_overall_precision": 0.9313725490196079, |
| "eval_overall_recall": 0.9476309226932669, |
| "eval_runtime": 0.2802, |
| "eval_samples_per_second": 606.723, |
| "eval_steps_per_second": 10.707, |
| "step": 6816 |
| }, |
| { |
| "epoch": 72.0, |
| "grad_norm": 0.819017231464386, |
| "learning_rate": 1.4000000000000001e-05, |
| "loss": 0.0437, |
| "step": 6912 |
| }, |
| { |
| "epoch": 72.0, |
| "eval_LOCATION_f1": 0.9166666666666667, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8888888888888888, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9123867069486404, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9151515151515152, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03983786702156067, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9343246592317225, |
| "eval_overall_precision": 0.9285714285714286, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2814, |
| "eval_samples_per_second": 604.215, |
| "eval_steps_per_second": 10.663, |
| "step": 6912 |
| }, |
| { |
| "epoch": 73.0, |
| "grad_norm": 1.5767393112182617, |
| "learning_rate": 1.3500000000000001e-05, |
| "loss": 0.041, |
| "step": 7008 |
| }, |
| { |
| "epoch": 73.0, |
| "eval_LOCATION_f1": 0.9109947643979057, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8877551020408163, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9161676646706587, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9107142857142857, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03988140448927879, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9344870210135972, |
| "eval_overall_precision": 0.9264705882352942, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2828, |
| "eval_samples_per_second": 601.131, |
| "eval_steps_per_second": 10.608, |
| "step": 7008 |
| }, |
| { |
| "epoch": 74.0, |
| "grad_norm": 0.34249478578567505, |
| "learning_rate": 1.3000000000000001e-05, |
| "loss": 0.0425, |
| "step": 7104 |
| }, |
| { |
| "epoch": 74.0, |
| "eval_LOCATION_f1": 0.9157894736842105, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8969072164948454, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9194029850746269, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9112426035502958, |
| "eval_ORGANIZATION_recall": 0.927710843373494, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04064317047595978, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9369592088998765, |
| "eval_overall_precision": 0.928921568627451, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2816, |
| "eval_samples_per_second": 603.647, |
| "eval_steps_per_second": 10.653, |
| "step": 7104 |
| }, |
| { |
| "epoch": 75.0, |
| "grad_norm": 0.588118851184845, |
| "learning_rate": 1.25e-05, |
| "loss": 0.0426, |
| "step": 7200 |
| }, |
| { |
| "epoch": 75.0, |
| "eval_LOCATION_f1": 0.9109947643979057, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8877551020408163, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9107142857142857, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03951849043369293, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2807, |
| "eval_samples_per_second": 605.599, |
| "eval_steps_per_second": 10.687, |
| "step": 7200 |
| }, |
| { |
| "epoch": 76.0, |
| "grad_norm": 0.5939780473709106, |
| "learning_rate": 1.2e-05, |
| "loss": 0.0398, |
| "step": 7296 |
| }, |
| { |
| "epoch": 76.0, |
| "eval_LOCATION_f1": 0.9166666666666667, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8888888888888888, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.918429003021148, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9212121212121213, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.040211234241724014, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9368029739776952, |
| "eval_overall_precision": 0.9310344827586207, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2831, |
| "eval_samples_per_second": 600.543, |
| "eval_steps_per_second": 10.598, |
| "step": 7296 |
| }, |
| { |
| "epoch": 77.0, |
| "grad_norm": 0.6372460126876831, |
| "learning_rate": 1.1500000000000002e-05, |
| "loss": 0.0407, |
| "step": 7392 |
| }, |
| { |
| "epoch": 77.0, |
| "eval_LOCATION_f1": 0.90625, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8787878787878788, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9096385542168675, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9096385542168675, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.039185136556625366, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9306930693069307, |
| "eval_overall_precision": 0.9238329238329238, |
| "eval_overall_recall": 0.9376558603491272, |
| "eval_runtime": 0.2816, |
| "eval_samples_per_second": 603.751, |
| "eval_steps_per_second": 10.654, |
| "step": 7392 |
| }, |
| { |
| "epoch": 78.0, |
| "grad_norm": 0.7889866828918457, |
| "learning_rate": 1.1000000000000001e-05, |
| "loss": 0.0411, |
| "step": 7488 |
| }, |
| { |
| "epoch": 78.0, |
| "eval_LOCATION_f1": 0.90625, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8787878787878788, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9041916167664671, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8988095238095238, |
| "eval_ORGANIZATION_recall": 0.9096385542168675, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03939792886376381, |
| "eval_overall_accuracy": 0.9868312757201646, |
| "eval_overall_f1": 0.928395061728395, |
| "eval_overall_precision": 0.9193154034229829, |
| "eval_overall_recall": 0.9376558603491272, |
| "eval_runtime": 0.2813, |
| "eval_samples_per_second": 604.429, |
| "eval_steps_per_second": 10.666, |
| "step": 7488 |
| }, |
| { |
| "epoch": 79.0, |
| "grad_norm": 0.8031059503555298, |
| "learning_rate": 1.05e-05, |
| "loss": 0.0417, |
| "step": 7584 |
| }, |
| { |
| "epoch": 79.0, |
| "eval_LOCATION_f1": 0.90625, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8787878787878788, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9134328358208955, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9053254437869822, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.039482057094573975, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2824, |
| "eval_samples_per_second": 601.902, |
| "eval_steps_per_second": 10.622, |
| "step": 7584 |
| }, |
| { |
| "epoch": 80.0, |
| "grad_norm": 2.120938777923584, |
| "learning_rate": 1e-05, |
| "loss": 0.0412, |
| "step": 7680 |
| }, |
| { |
| "epoch": 80.0, |
| "eval_LOCATION_f1": 0.90625, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8787878787878788, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9053254437869822, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8895348837209303, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03960248827934265, |
| "eval_overall_accuracy": 0.9876543209876543, |
| "eval_overall_f1": 0.9287469287469288, |
| "eval_overall_precision": 0.9152542372881356, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2823, |
| "eval_samples_per_second": 602.136, |
| "eval_steps_per_second": 10.626, |
| "step": 7680 |
| }, |
| { |
| "epoch": 81.0, |
| "grad_norm": 0.5607914924621582, |
| "learning_rate": 9.5e-06, |
| "loss": 0.0431, |
| "step": 7776 |
| }, |
| { |
| "epoch": 81.0, |
| "eval_LOCATION_f1": 0.9015544041450777, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.87, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9047619047619048, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8941176470588236, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03992500156164169, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9274292742927428, |
| "eval_overall_precision": 0.9150485436893204, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2802, |
| "eval_samples_per_second": 606.677, |
| "eval_steps_per_second": 10.706, |
| "step": 7776 |
| }, |
| { |
| "epoch": 82.0, |
| "grad_norm": 1.140172004699707, |
| "learning_rate": 9e-06, |
| "loss": 0.042, |
| "step": 7872 |
| }, |
| { |
| "epoch": 82.0, |
| "eval_LOCATION_f1": 0.9166666666666667, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8888888888888888, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9189189189189191, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9161676646706587, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04006196931004524, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9369592088998765, |
| "eval_overall_precision": 0.928921568627451, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2823, |
| "eval_samples_per_second": 602.241, |
| "eval_steps_per_second": 10.628, |
| "step": 7872 |
| }, |
| { |
| "epoch": 83.0, |
| "grad_norm": 0.7160885334014893, |
| "learning_rate": 8.500000000000002e-06, |
| "loss": 0.0412, |
| "step": 7968 |
| }, |
| { |
| "epoch": 83.0, |
| "eval_LOCATION_f1": 0.9166666666666667, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8888888888888888, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9189189189189191, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9161676646706587, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.040310610085725784, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9369592088998765, |
| "eval_overall_precision": 0.928921568627451, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2826, |
| "eval_samples_per_second": 601.646, |
| "eval_steps_per_second": 10.617, |
| "step": 7968 |
| }, |
| { |
| "epoch": 84.0, |
| "grad_norm": 0.9255092144012451, |
| "learning_rate": 8.000000000000001e-06, |
| "loss": 0.0413, |
| "step": 8064 |
| }, |
| { |
| "epoch": 84.0, |
| "eval_LOCATION_f1": 0.9166666666666667, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8888888888888888, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9129129129129129, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9101796407185628, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.04085477441549301, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9344870210135972, |
| "eval_overall_precision": 0.9264705882352942, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2809, |
| "eval_samples_per_second": 605.295, |
| "eval_steps_per_second": 10.682, |
| "step": 8064 |
| }, |
| { |
| "epoch": 85.0, |
| "grad_norm": 0.6887927651405334, |
| "learning_rate": 7.5e-06, |
| "loss": 0.0405, |
| "step": 8160 |
| }, |
| { |
| "epoch": 85.0, |
| "eval_LOCATION_f1": 0.9072164948453608, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8712871287128713, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9161676646706587, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9107142857142857, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03969047591090202, |
| "eval_overall_accuracy": 0.9879286694101509, |
| "eval_overall_f1": 0.9334975369458128, |
| "eval_overall_precision": 0.9221411192214112, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2815, |
| "eval_samples_per_second": 603.924, |
| "eval_steps_per_second": 10.657, |
| "step": 8160 |
| }, |
| { |
| "epoch": 86.0, |
| "grad_norm": 1.2184239625930786, |
| "learning_rate": 7.000000000000001e-06, |
| "loss": 0.0405, |
| "step": 8256 |
| }, |
| { |
| "epoch": 86.0, |
| "eval_LOCATION_f1": 0.9072164948453608, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8712871287128713, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9161676646706587, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9107142857142857, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03970079496502876, |
| "eval_overall_accuracy": 0.9879286694101509, |
| "eval_overall_f1": 0.9334975369458128, |
| "eval_overall_precision": 0.9221411192214112, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2832, |
| "eval_samples_per_second": 600.222, |
| "eval_steps_per_second": 10.592, |
| "step": 8256 |
| }, |
| { |
| "epoch": 87.0, |
| "grad_norm": 1.5015846490859985, |
| "learning_rate": 6.5000000000000004e-06, |
| "loss": 0.0401, |
| "step": 8352 |
| }, |
| { |
| "epoch": 87.0, |
| "eval_LOCATION_f1": 0.9072164948453608, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8712871287128713, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03983263671398163, |
| "eval_overall_accuracy": 0.9876543209876543, |
| "eval_overall_f1": 0.9310344827586207, |
| "eval_overall_precision": 0.9197080291970803, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2817, |
| "eval_samples_per_second": 603.464, |
| "eval_steps_per_second": 10.649, |
| "step": 8352 |
| }, |
| { |
| "epoch": 88.0, |
| "grad_norm": 0.568331241607666, |
| "learning_rate": 6e-06, |
| "loss": 0.041, |
| "step": 8448 |
| }, |
| { |
| "epoch": 88.0, |
| "eval_LOCATION_f1": 0.9072164948453608, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8712871287128713, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9161676646706587, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9107142857142857, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.039770666509866714, |
| "eval_overall_accuracy": 0.9879286694101509, |
| "eval_overall_f1": 0.9334975369458128, |
| "eval_overall_precision": 0.9221411192214112, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.2825, |
| "eval_samples_per_second": 601.794, |
| "eval_steps_per_second": 10.62, |
| "step": 8448 |
| }, |
| { |
| "epoch": 89.0, |
| "grad_norm": 1.1911604404449463, |
| "learning_rate": 5.500000000000001e-06, |
| "loss": 0.0397, |
| "step": 8544 |
| }, |
| { |
| "epoch": 89.0, |
| "eval_LOCATION_f1": 0.9015544041450777, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.87, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.039621464908123016, |
| "eval_overall_accuracy": 0.9876543209876543, |
| "eval_overall_f1": 0.9297163995067818, |
| "eval_overall_precision": 0.9195121951219513, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2798, |
| "eval_samples_per_second": 607.512, |
| "eval_steps_per_second": 10.721, |
| "step": 8544 |
| }, |
| { |
| "epoch": 90.0, |
| "grad_norm": 2.4099748134613037, |
| "learning_rate": 5e-06, |
| "loss": 0.0398, |
| "step": 8640 |
| }, |
| { |
| "epoch": 90.0, |
| "eval_LOCATION_f1": 0.9015544041450777, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.87, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9134328358208955, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9053254437869822, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03956400975584984, |
| "eval_overall_accuracy": 0.9879286694101509, |
| "eval_overall_f1": 0.9310344827586207, |
| "eval_overall_precision": 0.9197080291970803, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2819, |
| "eval_samples_per_second": 603.1, |
| "eval_steps_per_second": 10.643, |
| "step": 8640 |
| }, |
| { |
| "epoch": 91.0, |
| "grad_norm": 0.42839816212654114, |
| "learning_rate": 4.5e-06, |
| "loss": 0.039, |
| "step": 8736 |
| }, |
| { |
| "epoch": 91.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9189189189189191, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9161676646706587, |
| "eval_ORGANIZATION_recall": 0.9216867469879518, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03948313742876053, |
| "eval_overall_accuracy": 0.9876543209876543, |
| "eval_overall_f1": 0.9358024691358026, |
| "eval_overall_precision": 0.9266503667481663, |
| "eval_overall_recall": 0.9451371571072319, |
| "eval_runtime": 0.285, |
| "eval_samples_per_second": 596.519, |
| "eval_steps_per_second": 10.527, |
| "step": 8736 |
| }, |
| { |
| "epoch": 92.0, |
| "grad_norm": 0.5673728585243225, |
| "learning_rate": 4.000000000000001e-06, |
| "loss": 0.0385, |
| "step": 8832 |
| }, |
| { |
| "epoch": 92.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03977023437619209, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2816, |
| "eval_samples_per_second": 603.659, |
| "eval_steps_per_second": 10.653, |
| "step": 8832 |
| }, |
| { |
| "epoch": 93.0, |
| "grad_norm": 0.6550965309143066, |
| "learning_rate": 3.5000000000000004e-06, |
| "loss": 0.0385, |
| "step": 8928 |
| }, |
| { |
| "epoch": 93.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.0398373156785965, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2844, |
| "eval_samples_per_second": 597.851, |
| "eval_steps_per_second": 10.55, |
| "step": 8928 |
| }, |
| { |
| "epoch": 94.0, |
| "grad_norm": 0.17871248722076416, |
| "learning_rate": 3e-06, |
| "loss": 0.0398, |
| "step": 9024 |
| }, |
| { |
| "epoch": 94.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03970322385430336, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2828, |
| "eval_samples_per_second": 601.056, |
| "eval_steps_per_second": 10.607, |
| "step": 9024 |
| }, |
| { |
| "epoch": 95.0, |
| "grad_norm": 0.2635639011859894, |
| "learning_rate": 2.5e-06, |
| "loss": 0.0382, |
| "step": 9120 |
| }, |
| { |
| "epoch": 95.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03960025683045387, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2838, |
| "eval_samples_per_second": 599.017, |
| "eval_steps_per_second": 10.571, |
| "step": 9120 |
| }, |
| { |
| "epoch": 96.0, |
| "grad_norm": 0.5545527935028076, |
| "learning_rate": 2.0000000000000003e-06, |
| "loss": 0.0408, |
| "step": 9216 |
| }, |
| { |
| "epoch": 96.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.039429329335689545, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2843, |
| "eval_samples_per_second": 597.868, |
| "eval_steps_per_second": 10.551, |
| "step": 9216 |
| }, |
| { |
| "epoch": 97.0, |
| "grad_norm": 0.20971649885177612, |
| "learning_rate": 1.5e-06, |
| "loss": 0.0372, |
| "step": 9312 |
| }, |
| { |
| "epoch": 97.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03945162892341614, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2901, |
| "eval_samples_per_second": 586.028, |
| "eval_steps_per_second": 10.342, |
| "step": 9312 |
| }, |
| { |
| "epoch": 98.0, |
| "grad_norm": 0.9901926517486572, |
| "learning_rate": 1.0000000000000002e-06, |
| "loss": 0.0392, |
| "step": 9408 |
| }, |
| { |
| "epoch": 98.0, |
| "eval_LOCATION_f1": 0.90625, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.8787878787878788, |
| "eval_LOCATION_recall": 0.9354838709677419, |
| "eval_ORGANIZATION_f1": 0.9074626865671641, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.8994082840236687, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.039484377950429916, |
| "eval_overall_accuracy": 0.9871056241426612, |
| "eval_overall_f1": 0.9297163995067818, |
| "eval_overall_precision": 0.9195121951219513, |
| "eval_overall_recall": 0.940149625935162, |
| "eval_runtime": 0.2824, |
| "eval_samples_per_second": 602.087, |
| "eval_steps_per_second": 10.625, |
| "step": 9408 |
| }, |
| { |
| "epoch": 99.0, |
| "grad_norm": 0.7696068286895752, |
| "learning_rate": 5.000000000000001e-07, |
| "loss": 0.0393, |
| "step": 9504 |
| }, |
| { |
| "epoch": 99.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03950231894850731, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2816, |
| "eval_samples_per_second": 603.609, |
| "eval_steps_per_second": 10.652, |
| "step": 9504 |
| }, |
| { |
| "epoch": 100.0, |
| "grad_norm": 0.9257699251174927, |
| "learning_rate": 0.0, |
| "loss": 0.0399, |
| "step": 9600 |
| }, |
| { |
| "epoch": 100.0, |
| "eval_LOCATION_f1": 0.911917098445596, |
| "eval_LOCATION_number": 93, |
| "eval_LOCATION_precision": 0.88, |
| "eval_LOCATION_recall": 0.946236559139785, |
| "eval_ORGANIZATION_f1": 0.9101796407185628, |
| "eval_ORGANIZATION_number": 166, |
| "eval_ORGANIZATION_precision": 0.9047619047619048, |
| "eval_ORGANIZATION_recall": 0.9156626506024096, |
| "eval_PERSON_f1": 0.971830985915493, |
| "eval_PERSON_number": 142, |
| "eval_PERSON_precision": 0.971830985915493, |
| "eval_PERSON_recall": 0.971830985915493, |
| "eval_loss": 0.03953361511230469, |
| "eval_overall_accuracy": 0.9873799725651577, |
| "eval_overall_f1": 0.9321824907521579, |
| "eval_overall_precision": 0.9219512195121952, |
| "eval_overall_recall": 0.942643391521197, |
| "eval_runtime": 0.2824, |
| "eval_samples_per_second": 601.932, |
| "eval_steps_per_second": 10.622, |
| "step": 9600 |
| }, |
| { |
| "epoch": 100.0, |
| "step": 9600, |
| "total_flos": 3784810278471630.0, |
| "train_loss": 0.09147172088424364, |
| "train_runtime": 505.6149, |
| "train_samples_per_second": 302.8, |
| "train_steps_per_second": 18.987 |
| } |
| ], |
| "logging_steps": 500, |
| "max_steps": 9600, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 100, |
| "save_steps": 500, |
| "total_flos": 3784810278471630.0, |
| "train_batch_size": 16, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|