| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 100.0, | |
| "eval_steps": 500, | |
| "global_step": 10600, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "grad_norm": 2.7315826416015625, | |
| "learning_rate": 4.9500000000000004e-05, | |
| "loss": 0.3629, | |
| "step": 106 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7692307692307693, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.6941176470588235, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.6210526315789474, | |
| "eval_ORGANIZATION_recall": 0.7866666666666666, | |
| "eval_PERSON_f1": 0.8888888888888888, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8343558282208589, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.5396825396825397, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.425, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.721311475409836, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.6285714285714286, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.1598740667104721, | |
| "eval_overall_accuracy": 0.9482111583687766, | |
| "eval_overall_f1": 0.7839999999999999, | |
| "eval_overall_precision": 0.7153284671532847, | |
| "eval_overall_recall": 0.8672566371681416, | |
| "eval_runtime": 0.3626, | |
| "eval_samples_per_second": 515.737, | |
| "eval_steps_per_second": 8.274, | |
| "step": 106 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "grad_norm": 1.3484944105148315, | |
| "learning_rate": 4.9e-05, | |
| "loss": 0.128, | |
| "step": 212 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_LOCATION_f1": 0.7922077922077924, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7439024390243902, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.782122905027933, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.6730769230769231, | |
| "eval_ORGANIZATION_recall": 0.9333333333333333, | |
| "eval_PERSON_f1": 0.8993288590604027, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.864516129032258, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.6545454545454547, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5625, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8076923076923077, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8076923076923077, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.13682067394256592, | |
| "eval_overall_accuracy": 0.9567175381536153, | |
| "eval_overall_f1": 0.8238482384823848, | |
| "eval_overall_precision": 0.7619047619047619, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3665, | |
| "eval_samples_per_second": 510.258, | |
| "eval_steps_per_second": 8.186, | |
| "step": 212 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "grad_norm": 2.2102744579315186, | |
| "learning_rate": 4.85e-05, | |
| "loss": 0.0841, | |
| "step": 318 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_LOCATION_f1": 0.8028169014084506, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8142857142857143, | |
| "eval_LOCATION_recall": 0.7916666666666666, | |
| "eval_ORGANIZATION_f1": 0.7810650887573964, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7021276595744681, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8918032786885245, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8395061728395061, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.6415094339622641, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5666666666666667, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8333333333333333, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.9090909090909091, | |
| "eval_TIME_recall": 0.7692307692307693, | |
| "eval_loss": 0.1551402360200882, | |
| "eval_overall_accuracy": 0.9547160370277709, | |
| "eval_overall_f1": 0.8256624825662482, | |
| "eval_overall_precision": 0.783068783068783, | |
| "eval_overall_recall": 0.8731563421828908, | |
| "eval_runtime": 0.3569, | |
| "eval_samples_per_second": 523.957, | |
| "eval_steps_per_second": 8.406, | |
| "step": 318 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "grad_norm": 8.499090194702148, | |
| "learning_rate": 4.8e-05, | |
| "loss": 0.0533, | |
| "step": 424 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_LOCATION_f1": 0.8053691275167787, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7792207792207793, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.7719298245614036, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.6875, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8778877887788779, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.83125, | |
| "eval_PERSON_recall": 0.9300699300699301, | |
| "eval_QUANTITY_f1": 0.6666666666666667, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5806451612903226, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.7540983606557377, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.6571428571428571, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.17204634845256805, | |
| "eval_overall_accuracy": 0.9552164123092319, | |
| "eval_overall_f1": 0.8130081300813008, | |
| "eval_overall_precision": 0.7518796992481203, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.3715, | |
| "eval_samples_per_second": 503.365, | |
| "eval_steps_per_second": 8.075, | |
| "step": 424 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "grad_norm": 10.976715087890625, | |
| "learning_rate": 4.75e-05, | |
| "loss": 0.0359, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_LOCATION_f1": 0.8079470198675496, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7721518987341772, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.7784431137724551, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7065217391304348, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.9049180327868852, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8518518518518519, | |
| "eval_PERSON_recall": 0.965034965034965, | |
| "eval_QUANTITY_f1": 0.6785714285714286, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5757575757575758, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7586206896551724, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.20843125879764557, | |
| "eval_overall_accuracy": 0.9564673505128847, | |
| "eval_overall_f1": 0.8310626702997276, | |
| "eval_overall_precision": 0.7721518987341772, | |
| "eval_overall_recall": 0.8997050147492626, | |
| "eval_runtime": 0.3572, | |
| "eval_samples_per_second": 523.556, | |
| "eval_steps_per_second": 8.399, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "grad_norm": 0.3230496346950531, | |
| "learning_rate": 4.7e-05, | |
| "loss": 0.0256, | |
| "step": 636 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_LOCATION_f1": 0.816326530612245, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.7597765363128492, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.6538461538461539, | |
| "eval_ORGANIZATION_recall": 0.9066666666666666, | |
| "eval_PERSON_f1": 0.9006622516556291, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8553459119496856, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.6666666666666667, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5588235294117647, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.7368421052631579, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.6774193548387096, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.2402852177619934, | |
| "eval_overall_accuracy": 0.9539654741055792, | |
| "eval_overall_f1": 0.8194070080862534, | |
| "eval_overall_precision": 0.7543424317617866, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3663, | |
| "eval_samples_per_second": 510.497, | |
| "eval_steps_per_second": 8.19, | |
| "step": 636 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "grad_norm": 0.021450912579894066, | |
| "learning_rate": 4.6500000000000005e-05, | |
| "loss": 0.0188, | |
| "step": 742 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_LOCATION_f1": 0.8133333333333332, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.782051282051282, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.7624309392265193, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.6509433962264151, | |
| "eval_ORGANIZATION_recall": 0.92, | |
| "eval_PERSON_f1": 0.8926174496644295, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8580645161290322, | |
| "eval_PERSON_recall": 0.9300699300699301, | |
| "eval_QUANTITY_f1": 0.6923076923076923, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6206896551724138, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.7118644067796609, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.6363636363636364, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.22656874358654022, | |
| "eval_overall_accuracy": 0.9569677257943457, | |
| "eval_overall_f1": 0.8162162162162162, | |
| "eval_overall_precision": 0.7531172069825436, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.356, | |
| "eval_samples_per_second": 525.333, | |
| "eval_steps_per_second": 8.428, | |
| "step": 742 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "grad_norm": 0.026271946728229523, | |
| "learning_rate": 4.600000000000001e-05, | |
| "loss": 0.0134, | |
| "step": 848 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_LOCATION_f1": 0.7891156462585034, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7733333333333333, | |
| "eval_LOCATION_recall": 0.8055555555555556, | |
| "eval_ORGANIZATION_f1": 0.7530864197530864, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7011494252873564, | |
| "eval_ORGANIZATION_recall": 0.8133333333333334, | |
| "eval_PERSON_f1": 0.9066666666666667, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8662420382165605, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.6415094339622641, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5666666666666667, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.7719298245614036, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7096774193548387, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.24617096781730652, | |
| "eval_overall_accuracy": 0.9572179134350763, | |
| "eval_overall_f1": 0.8178025034770514, | |
| "eval_overall_precision": 0.7736842105263158, | |
| "eval_overall_recall": 0.8672566371681416, | |
| "eval_runtime": 0.3558, | |
| "eval_samples_per_second": 525.577, | |
| "eval_steps_per_second": 8.432, | |
| "step": 848 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "grad_norm": 0.6316163539886475, | |
| "learning_rate": 4.55e-05, | |
| "loss": 0.0135, | |
| "step": 954 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_LOCATION_f1": 0.7972027972027971, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8028169014084507, | |
| "eval_LOCATION_recall": 0.7916666666666666, | |
| "eval_ORGANIZATION_f1": 0.8098159509202455, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.75, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8829431438127091, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8461538461538461, | |
| "eval_PERSON_recall": 0.9230769230769231, | |
| "eval_QUANTITY_f1": 0.6923076923076923, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6206896551724138, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.2374754250049591, | |
| "eval_overall_accuracy": 0.9592194145609206, | |
| "eval_overall_f1": 0.829817158931083, | |
| "eval_overall_precision": 0.793010752688172, | |
| "eval_overall_recall": 0.8702064896755162, | |
| "eval_runtime": 0.3585, | |
| "eval_samples_per_second": 521.613, | |
| "eval_steps_per_second": 8.368, | |
| "step": 954 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "grad_norm": 0.20594312250614166, | |
| "learning_rate": 4.5e-05, | |
| "loss": 0.0082, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_LOCATION_f1": 0.7973856209150327, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7530864197530864, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.7904191616766466, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.717391304347826, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8933333333333333, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8535031847133758, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.6415094339622641, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5666666666666667, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.27111825346946716, | |
| "eval_overall_accuracy": 0.9574681010758068, | |
| "eval_overall_f1": 0.8269230769230769, | |
| "eval_overall_precision": 0.7737789203084833, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.3597, | |
| "eval_samples_per_second": 519.941, | |
| "eval_steps_per_second": 8.341, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "grad_norm": 0.010851857252418995, | |
| "learning_rate": 4.4500000000000004e-05, | |
| "loss": 0.0079, | |
| "step": 1166 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_LOCATION_f1": 0.7837837837837838, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7631578947368421, | |
| "eval_LOCATION_recall": 0.8055555555555556, | |
| "eval_ORGANIZATION_f1": 0.7878787878787877, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7222222222222222, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.903010033444816, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8653846153846154, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.6792452830188679, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.7636363636363636, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7241379310344828, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.27776339650154114, | |
| "eval_overall_accuracy": 0.9574681010758068, | |
| "eval_overall_f1": 0.825, | |
| "eval_overall_precision": 0.7795275590551181, | |
| "eval_overall_recall": 0.8761061946902655, | |
| "eval_runtime": 0.3586, | |
| "eval_samples_per_second": 521.408, | |
| "eval_steps_per_second": 8.365, | |
| "step": 1166 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "grad_norm": 4.9953837394714355, | |
| "learning_rate": 4.4000000000000006e-05, | |
| "loss": 0.0105, | |
| "step": 1272 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_LOCATION_f1": 0.7916666666666666, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7916666666666666, | |
| "eval_LOCATION_recall": 0.7916666666666666, | |
| "eval_ORGANIZATION_f1": 0.8101265822784811, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7710843373493976, | |
| "eval_ORGANIZATION_recall": 0.8533333333333334, | |
| "eval_PERSON_f1": 0.903010033444816, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8653846153846154, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.7857142857142856, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7333333333333333, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.28447094559669495, | |
| "eval_overall_accuracy": 0.961220915686765, | |
| "eval_overall_f1": 0.8373408769448375, | |
| "eval_overall_precision": 0.8043478260869565, | |
| "eval_overall_recall": 0.8731563421828908, | |
| "eval_runtime": 0.3599, | |
| "eval_samples_per_second": 519.532, | |
| "eval_steps_per_second": 8.335, | |
| "step": 1272 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "grad_norm": 0.2857362926006317, | |
| "learning_rate": 4.35e-05, | |
| "loss": 0.0103, | |
| "step": 1378 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_LOCATION_f1": 0.7891156462585034, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7733333333333333, | |
| "eval_LOCATION_recall": 0.8055555555555556, | |
| "eval_ORGANIZATION_f1": 0.8170731707317072, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7528089887640449, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.8926174496644295, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8580645161290322, | |
| "eval_PERSON_recall": 0.9300699300699301, | |
| "eval_QUANTITY_f1": 0.7037037037037037, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6129032258064516, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.9019607843137256, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.92, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.2690028250217438, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8403361344537816, | |
| "eval_overall_precision": 0.8, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.3608, | |
| "eval_samples_per_second": 518.338, | |
| "eval_steps_per_second": 8.316, | |
| "step": 1378 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "grad_norm": 0.11683321744203568, | |
| "learning_rate": 4.3e-05, | |
| "loss": 0.0045, | |
| "step": 1484 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_LOCATION_f1": 0.7887323943661971, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.7777777777777778, | |
| "eval_ORGANIZATION_f1": 0.809248554913295, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7142857142857143, | |
| "eval_ORGANIZATION_recall": 0.9333333333333333, | |
| "eval_PERSON_f1": 0.8933333333333333, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8535031847133758, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.6545454545454547, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5625, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.7636363636363636, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7241379310344828, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.304815411567688, | |
| "eval_overall_accuracy": 0.957968476357268, | |
| "eval_overall_f1": 0.8248275862068966, | |
| "eval_overall_precision": 0.7746113989637305, | |
| "eval_overall_recall": 0.8820058997050148, | |
| "eval_runtime": 0.3586, | |
| "eval_samples_per_second": 521.439, | |
| "eval_steps_per_second": 8.365, | |
| "step": 1484 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "grad_norm": 0.15561413764953613, | |
| "learning_rate": 4.25e-05, | |
| "loss": 0.005, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_LOCATION_f1": 0.816326530612245, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.8000000000000002, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.775, | |
| "eval_ORGANIZATION_recall": 0.8266666666666667, | |
| "eval_PERSON_f1": 0.9054054054054055, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8758169934640523, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.6792452830188679, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.27857497334480286, | |
| "eval_overall_accuracy": 0.9597197898423818, | |
| "eval_overall_f1": 0.8397163120567377, | |
| "eval_overall_precision": 0.8087431693989071, | |
| "eval_overall_recall": 0.8731563421828908, | |
| "eval_runtime": 0.3743, | |
| "eval_samples_per_second": 499.656, | |
| "eval_steps_per_second": 8.016, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "grad_norm": 0.24679070711135864, | |
| "learning_rate": 4.2e-05, | |
| "loss": 0.0041, | |
| "step": 1696 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_LOCATION_f1": 0.7866666666666666, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7564102564102564, | |
| "eval_LOCATION_recall": 0.8194444444444444, | |
| "eval_ORGANIZATION_f1": 0.8170731707317072, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7528089887640449, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.8903654485049833, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8481012658227848, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.7169811320754716, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6333333333333333, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.30642324686050415, | |
| "eval_overall_accuracy": 0.9572179134350763, | |
| "eval_overall_f1": 0.8349514563106795, | |
| "eval_overall_precision": 0.7879581151832461, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.3572, | |
| "eval_samples_per_second": 523.51, | |
| "eval_steps_per_second": 8.399, | |
| "step": 1696 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "grad_norm": 0.17553383111953735, | |
| "learning_rate": 4.15e-05, | |
| "loss": 0.0061, | |
| "step": 1802 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "eval_LOCATION_f1": 0.7733333333333334, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7435897435897436, | |
| "eval_LOCATION_recall": 0.8055555555555556, | |
| "eval_ORGANIZATION_f1": 0.7701863354037267, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7209302325581395, | |
| "eval_ORGANIZATION_recall": 0.8266666666666667, | |
| "eval_PERSON_f1": 0.8910891089108911, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.84375, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.300820916891098, | |
| "eval_overall_accuracy": 0.9574681010758068, | |
| "eval_overall_f1": 0.8205841446453408, | |
| "eval_overall_precision": 0.7763157894736842, | |
| "eval_overall_recall": 0.8702064896755162, | |
| "eval_runtime": 0.3595, | |
| "eval_samples_per_second": 520.18, | |
| "eval_steps_per_second": 8.345, | |
| "step": 1802 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "grad_norm": 0.004105593077838421, | |
| "learning_rate": 4.1e-05, | |
| "loss": 0.0036, | |
| "step": 1908 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_LOCATION_f1": 0.8133333333333332, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.782051282051282, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8129032258064516, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7875, | |
| "eval_ORGANIZATION_recall": 0.84, | |
| "eval_PERSON_f1": 0.8993288590604027, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.864516129032258, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.7307692307692308, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6551724137931034, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.29750457406044006, | |
| "eval_overall_accuracy": 0.9627220415311484, | |
| "eval_overall_f1": 0.8434414668547249, | |
| "eval_overall_precision": 0.8081081081081081, | |
| "eval_overall_recall": 0.8820058997050148, | |
| "eval_runtime": 0.3588, | |
| "eval_samples_per_second": 521.143, | |
| "eval_steps_per_second": 8.361, | |
| "step": 1908 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "grad_norm": 0.007032826077193022, | |
| "learning_rate": 4.05e-05, | |
| "loss": 0.0025, | |
| "step": 2014 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "eval_LOCATION_f1": 0.8513513513513513, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8289473684210527, | |
| "eval_LOCATION_recall": 0.875, | |
| "eval_ORGANIZATION_f1": 0.834355828220859, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7727272727272727, | |
| "eval_ORGANIZATION_recall": 0.9066666666666666, | |
| "eval_PERSON_f1": 0.8970099667774087, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8544303797468354, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.76, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.7037037037037037, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8461538461538461, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8461538461538461, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3171651363372803, | |
| "eval_overall_accuracy": 0.9622216662496873, | |
| "eval_overall_f1": 0.8599439775910364, | |
| "eval_overall_precision": 0.8186666666666667, | |
| "eval_overall_recall": 0.9056047197640118, | |
| "eval_runtime": 0.3602, | |
| "eval_samples_per_second": 519.212, | |
| "eval_steps_per_second": 8.33, | |
| "step": 2014 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "grad_norm": 1.055253505706787, | |
| "learning_rate": 4e-05, | |
| "loss": 0.0039, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_LOCATION_f1": 0.8187919463087249, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8098159509202455, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.75, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8970099667774087, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8544303797468354, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.76, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.7037037037037037, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8461538461538461, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8461538461538461, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3097495436668396, | |
| "eval_overall_accuracy": 0.9622216662496873, | |
| "eval_overall_f1": 0.8475524475524475, | |
| "eval_overall_precision": 0.8058510638297872, | |
| "eval_overall_recall": 0.8938053097345132, | |
| "eval_runtime": 0.3569, | |
| "eval_samples_per_second": 524.015, | |
| "eval_steps_per_second": 8.407, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "grad_norm": 0.4885401129722595, | |
| "learning_rate": 3.9500000000000005e-05, | |
| "loss": 0.0031, | |
| "step": 2226 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "eval_LOCATION_f1": 0.781456953642384, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7468354430379747, | |
| "eval_LOCATION_recall": 0.8194444444444444, | |
| "eval_ORGANIZATION_f1": 0.7974683544303797, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7590361445783133, | |
| "eval_ORGANIZATION_recall": 0.84, | |
| "eval_PERSON_f1": 0.8940397350993377, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8490566037735849, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.7307692307692308, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6551724137931034, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7586206896551724, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.32485198974609375, | |
| "eval_overall_accuracy": 0.9597197898423818, | |
| "eval_overall_f1": 0.83008356545961, | |
| "eval_overall_precision": 0.7862796833773087, | |
| "eval_overall_recall": 0.8790560471976401, | |
| "eval_runtime": 0.3689, | |
| "eval_samples_per_second": 506.94, | |
| "eval_steps_per_second": 8.133, | |
| "step": 2226 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "grad_norm": 0.03123115934431553, | |
| "learning_rate": 3.9000000000000006e-05, | |
| "loss": 0.0037, | |
| "step": 2332 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "eval_LOCATION_f1": 0.7972972972972973, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7763157894736842, | |
| "eval_LOCATION_recall": 0.8194444444444444, | |
| "eval_ORGANIZATION_f1": 0.8263473053892216, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.75, | |
| "eval_ORGANIZATION_recall": 0.92, | |
| "eval_PERSON_f1": 0.8910891089108911, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.84375, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.7307692307692308, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6551724137931034, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7586206896551724, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3308863937854767, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8386206896551724, | |
| "eval_overall_precision": 0.7875647668393783, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3591, | |
| "eval_samples_per_second": 520.739, | |
| "eval_steps_per_second": 8.354, | |
| "step": 2332 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "grad_norm": 0.8348985314369202, | |
| "learning_rate": 3.85e-05, | |
| "loss": 0.0015, | |
| "step": 2438 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "eval_LOCATION_f1": 0.8079470198675496, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7721518987341772, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8176100628930819, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7738095238095238, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.8933333333333333, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8535031847133758, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.7692307692307693, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6896551724137931, | |
| "eval_QUANTITY_recall": 0.8695652173913043, | |
| "eval_TIME_f1": 0.8, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7586206896551724, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.32765087485313416, | |
| "eval_overall_accuracy": 0.9609707280460346, | |
| "eval_overall_f1": 0.8423988842398884, | |
| "eval_overall_precision": 0.798941798941799, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.3569, | |
| "eval_samples_per_second": 523.957, | |
| "eval_steps_per_second": 8.406, | |
| "step": 2438 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "grad_norm": 0.006436940282583237, | |
| "learning_rate": 3.8e-05, | |
| "loss": 0.0027, | |
| "step": 2544 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "eval_LOCATION_f1": 0.7837837837837838, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7631578947368421, | |
| "eval_LOCATION_recall": 0.8055555555555556, | |
| "eval_ORGANIZATION_f1": 0.8076923076923077, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7777777777777778, | |
| "eval_ORGANIZATION_recall": 0.84, | |
| "eval_PERSON_f1": 0.8933333333333333, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8535031847133758, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3232249617576599, | |
| "eval_overall_accuracy": 0.9609707280460346, | |
| "eval_overall_f1": 0.8345120226308345, | |
| "eval_overall_precision": 0.8016304347826086, | |
| "eval_overall_recall": 0.8702064896755162, | |
| "eval_runtime": 0.3705, | |
| "eval_samples_per_second": 504.719, | |
| "eval_steps_per_second": 8.097, | |
| "step": 2544 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "grad_norm": 0.9054812788963318, | |
| "learning_rate": 3.7500000000000003e-05, | |
| "loss": 0.0035, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "eval_LOCATION_f1": 0.8129032258064516, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7590361445783133, | |
| "eval_LOCATION_recall": 0.875, | |
| "eval_ORGANIZATION_f1": 0.8227848101265823, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7831325301204819, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.8926174496644295, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8580645161290322, | |
| "eval_PERSON_recall": 0.9300699300699301, | |
| "eval_QUANTITY_f1": 0.6428571428571429, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5454545454545454, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7586206896551724, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.35135143995285034, | |
| "eval_overall_accuracy": 0.957968476357268, | |
| "eval_overall_f1": 0.8337950138504155, | |
| "eval_overall_precision": 0.7859007832898173, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.3594, | |
| "eval_samples_per_second": 520.314, | |
| "eval_steps_per_second": 8.347, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "grad_norm": 0.010295592248439789, | |
| "learning_rate": 3.7e-05, | |
| "loss": 0.0028, | |
| "step": 2756 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "eval_LOCATION_f1": 0.8129032258064516, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7590361445783133, | |
| "eval_LOCATION_recall": 0.875, | |
| "eval_ORGANIZATION_f1": 0.7831325301204819, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7142857142857143, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.8979591836734694, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8741721854304636, | |
| "eval_PERSON_recall": 0.9230769230769231, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3200477361679077, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8344923504867873, | |
| "eval_overall_precision": 0.7894736842105263, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.3624, | |
| "eval_samples_per_second": 516.068, | |
| "eval_steps_per_second": 8.279, | |
| "step": 2756 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "grad_norm": 0.0034800188150256872, | |
| "learning_rate": 3.65e-05, | |
| "loss": 0.0023, | |
| "step": 2862 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "eval_LOCATION_f1": 0.8108108108108109, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7894736842105263, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.7831325301204819, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7142857142857143, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.8837209302325583, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8417721518987342, | |
| "eval_PERSON_recall": 0.9300699300699301, | |
| "eval_QUANTITY_f1": 0.6538461538461539, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5862068965517241, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3428550064563751, | |
| "eval_overall_accuracy": 0.9569677257943457, | |
| "eval_overall_f1": 0.8238557558945908, | |
| "eval_overall_precision": 0.7774869109947644, | |
| "eval_overall_recall": 0.8761061946902655, | |
| "eval_runtime": 0.3592, | |
| "eval_samples_per_second": 520.564, | |
| "eval_steps_per_second": 8.351, | |
| "step": 2862 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "grad_norm": 0.001987306633964181, | |
| "learning_rate": 3.6e-05, | |
| "loss": 0.0031, | |
| "step": 2968 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "eval_LOCATION_f1": 0.8026315789473685, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7625, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.7777777777777777, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7241379310344828, | |
| "eval_ORGANIZATION_recall": 0.84, | |
| "eval_PERSON_f1": 0.8983606557377047, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.845679012345679, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8070175438596492, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7419354838709677, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.3218757212162018, | |
| "eval_overall_accuracy": 0.9599699774831123, | |
| "eval_overall_f1": 0.828060522696011, | |
| "eval_overall_precision": 0.7757731958762887, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.3703, | |
| "eval_samples_per_second": 504.962, | |
| "eval_steps_per_second": 8.101, | |
| "step": 2968 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "grad_norm": 0.021353095769882202, | |
| "learning_rate": 3.55e-05, | |
| "loss": 0.0028, | |
| "step": 3074 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "eval_LOCATION_f1": 0.8057553956834532, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.835820895522388, | |
| "eval_LOCATION_recall": 0.7777777777777778, | |
| "eval_ORGANIZATION_f1": 0.8076923076923077, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7777777777777778, | |
| "eval_ORGANIZATION_recall": 0.84, | |
| "eval_PERSON_f1": 0.8800000000000001, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8407643312101911, | |
| "eval_PERSON_recall": 0.9230769230769231, | |
| "eval_QUANTITY_f1": 0.6415094339622641, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5666666666666667, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.35811248421669006, | |
| "eval_overall_accuracy": 0.9562171628721541, | |
| "eval_overall_f1": 0.8273894436519258, | |
| "eval_overall_precision": 0.8011049723756906, | |
| "eval_overall_recall": 0.855457227138643, | |
| "eval_runtime": 0.3735, | |
| "eval_samples_per_second": 500.719, | |
| "eval_steps_per_second": 8.033, | |
| "step": 3074 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "grad_norm": 0.0009840091224759817, | |
| "learning_rate": 3.5e-05, | |
| "loss": 0.0031, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7692307692307693, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.830188679245283, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7857142857142857, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.9163879598662208, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8782051282051282, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.7307692307692308, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6551724137931034, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7586206896551724, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3134097754955292, | |
| "eval_overall_accuracy": 0.9619714786089567, | |
| "eval_overall_f1": 0.8503496503496504, | |
| "eval_overall_precision": 0.8085106382978723, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3742, | |
| "eval_samples_per_second": 499.673, | |
| "eval_steps_per_second": 8.016, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "grad_norm": 1.1641939878463745, | |
| "learning_rate": 3.45e-05, | |
| "loss": 0.0035, | |
| "step": 3286 | |
| }, | |
| { | |
| "epoch": 31.0, | |
| "eval_LOCATION_f1": 0.751592356687898, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.6941176470588235, | |
| "eval_LOCATION_recall": 0.8194444444444444, | |
| "eval_ORGANIZATION_f1": 0.8387096774193549, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.8125, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.9133333333333333, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8726114649681529, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.6792452830188679, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.31325557827949524, | |
| "eval_overall_accuracy": 0.9614711033274956, | |
| "eval_overall_f1": 0.8372739916550764, | |
| "eval_overall_precision": 0.7921052631578948, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.3607, | |
| "eval_samples_per_second": 518.406, | |
| "eval_steps_per_second": 8.317, | |
| "step": 3286 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "grad_norm": 0.0497661791741848, | |
| "learning_rate": 3.4000000000000007e-05, | |
| "loss": 0.0028, | |
| "step": 3392 | |
| }, | |
| { | |
| "epoch": 32.0, | |
| "eval_LOCATION_f1": 0.802721088435374, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7866666666666666, | |
| "eval_LOCATION_recall": 0.8194444444444444, | |
| "eval_ORGANIZATION_f1": 0.8214285714285714, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7419354838709677, | |
| "eval_ORGANIZATION_recall": 0.92, | |
| "eval_PERSON_f1": 0.9, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8598726114649682, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.7755102040816326, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.7307692307692307, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8461538461538461, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8461538461538461, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.32023829221725464, | |
| "eval_overall_accuracy": 0.961220915686765, | |
| "eval_overall_f1": 0.8491620111731844, | |
| "eval_overall_precision": 0.8063660477453581, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3634, | |
| "eval_samples_per_second": 514.539, | |
| "eval_steps_per_second": 8.255, | |
| "step": 3392 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "grad_norm": 0.0015366391744464636, | |
| "learning_rate": 3.35e-05, | |
| "loss": 0.0013, | |
| "step": 3498 | |
| }, | |
| { | |
| "epoch": 33.0, | |
| "eval_LOCATION_f1": 0.8219178082191781, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8108108108108109, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.7898089171974522, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7560975609756098, | |
| "eval_ORGANIZATION_recall": 0.8266666666666667, | |
| "eval_PERSON_f1": 0.8926174496644295, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8580645161290322, | |
| "eval_PERSON_recall": 0.9300699300699301, | |
| "eval_QUANTITY_f1": 0.6923076923076923, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6206896551724138, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8461538461538461, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8461538461538461, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3315739035606384, | |
| "eval_overall_accuracy": 0.961220915686765, | |
| "eval_overall_f1": 0.8368794326241135, | |
| "eval_overall_precision": 0.8060109289617486, | |
| "eval_overall_recall": 0.8702064896755162, | |
| "eval_runtime": 0.3575, | |
| "eval_samples_per_second": 523.126, | |
| "eval_steps_per_second": 8.392, | |
| "step": 3498 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "grad_norm": 0.05237346515059471, | |
| "learning_rate": 3.3e-05, | |
| "loss": 0.0018, | |
| "step": 3604 | |
| }, | |
| { | |
| "epoch": 34.0, | |
| "eval_LOCATION_f1": 0.8571428571428572, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.84, | |
| "eval_LOCATION_recall": 0.875, | |
| "eval_ORGANIZATION_f1": 0.8048780487804879, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7415730337078652, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8970099667774087, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8544303797468354, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.7169811320754716, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6333333333333333, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.36692577600479126, | |
| "eval_overall_accuracy": 0.9622216662496873, | |
| "eval_overall_f1": 0.8495821727019498, | |
| "eval_overall_precision": 0.8047493403693932, | |
| "eval_overall_recall": 0.8997050147492626, | |
| "eval_runtime": 0.3644, | |
| "eval_samples_per_second": 513.118, | |
| "eval_steps_per_second": 8.232, | |
| "step": 3604 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "grad_norm": 0.002315772697329521, | |
| "learning_rate": 3.2500000000000004e-05, | |
| "loss": 0.0022, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 35.0, | |
| "eval_LOCATION_f1": 0.8378378378378377, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8157894736842105, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8198757763975156, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7674418604651163, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.91156462585034, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8874172185430463, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.7307692307692308, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6551724137931034, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.9230769230769231, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.9230769230769231, | |
| "eval_loss": 0.3101156949996948, | |
| "eval_overall_accuracy": 0.9649737302977233, | |
| "eval_overall_f1": 0.8628005657708627, | |
| "eval_overall_precision": 0.8288043478260869, | |
| "eval_overall_recall": 0.8997050147492626, | |
| "eval_runtime": 0.3638, | |
| "eval_samples_per_second": 514.005, | |
| "eval_steps_per_second": 8.246, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "grad_norm": 0.0013785570627078414, | |
| "learning_rate": 3.2000000000000005e-05, | |
| "loss": 0.002, | |
| "step": 3816 | |
| }, | |
| { | |
| "epoch": 36.0, | |
| "eval_LOCATION_f1": 0.8266666666666667, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7948717948717948, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8198757763975156, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7674418604651163, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8933333333333333, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8535031847133758, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.6923076923076923, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6206896551724138, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3521296977996826, | |
| "eval_overall_accuracy": 0.9592194145609206, | |
| "eval_overall_f1": 0.8435754189944135, | |
| "eval_overall_precision": 0.8010610079575596, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.3743, | |
| "eval_samples_per_second": 499.566, | |
| "eval_steps_per_second": 8.014, | |
| "step": 3816 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "grad_norm": 0.002585264155641198, | |
| "learning_rate": 3.15e-05, | |
| "loss": 0.0019, | |
| "step": 3922 | |
| }, | |
| { | |
| "epoch": 37.0, | |
| "eval_LOCATION_f1": 0.8211920529801324, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7848101265822784, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8148148148148148, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7586206896551724, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8956228956228957, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8636363636363636, | |
| "eval_PERSON_recall": 0.9300699300699301, | |
| "eval_QUANTITY_f1": 0.7307692307692308, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6551724137931034, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.34240958094596863, | |
| "eval_overall_accuracy": 0.9587190392794596, | |
| "eval_overall_f1": 0.8435754189944135, | |
| "eval_overall_precision": 0.8010610079575596, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.3616, | |
| "eval_samples_per_second": 517.085, | |
| "eval_steps_per_second": 8.295, | |
| "step": 3922 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "grad_norm": 4.613161563873291, | |
| "learning_rate": 3.1e-05, | |
| "loss": 0.0012, | |
| "step": 4028 | |
| }, | |
| { | |
| "epoch": 38.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7654320987654321, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.825, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7764705882352941, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8926174496644295, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8580645161290322, | |
| "eval_PERSON_recall": 0.9300699300699301, | |
| "eval_QUANTITY_f1": 0.6923076923076923, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6206896551724138, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3519201874732971, | |
| "eval_overall_accuracy": 0.957968476357268, | |
| "eval_overall_f1": 0.8396094839609484, | |
| "eval_overall_precision": 0.7962962962962963, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.3618, | |
| "eval_samples_per_second": 516.793, | |
| "eval_steps_per_second": 8.291, | |
| "step": 4028 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "grad_norm": 0.0017957445234060287, | |
| "learning_rate": 3.05e-05, | |
| "loss": 0.0012, | |
| "step": 4134 | |
| }, | |
| { | |
| "epoch": 39.0, | |
| "eval_LOCATION_f1": 0.8266666666666667, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7948717948717948, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.825, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7764705882352941, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8926174496644295, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8580645161290322, | |
| "eval_PERSON_recall": 0.9300699300699301, | |
| "eval_QUANTITY_f1": 0.7169811320754716, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6333333333333333, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.7777777777777779, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.75, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.3654736876487732, | |
| "eval_overall_accuracy": 0.9587190392794596, | |
| "eval_overall_f1": 0.8419580419580419, | |
| "eval_overall_precision": 0.800531914893617, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.3617, | |
| "eval_samples_per_second": 517.022, | |
| "eval_steps_per_second": 8.294, | |
| "step": 4134 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "grad_norm": 0.001596860121935606, | |
| "learning_rate": 3e-05, | |
| "loss": 0.001, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 40.0, | |
| "eval_LOCATION_f1": 0.8, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7945205479452054, | |
| "eval_LOCATION_recall": 0.8055555555555556, | |
| "eval_ORGANIZATION_f1": 0.7948717948717949, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7654320987654321, | |
| "eval_ORGANIZATION_recall": 0.8266666666666667, | |
| "eval_PERSON_f1": 0.9090909090909092, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8766233766233766, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.7755102040816326, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.7307692307692307, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.34077638387680054, | |
| "eval_overall_accuracy": 0.961220915686765, | |
| "eval_overall_f1": 0.8457142857142858, | |
| "eval_overall_precision": 0.8199445983379502, | |
| "eval_overall_recall": 0.8731563421828908, | |
| "eval_runtime": 0.3642, | |
| "eval_samples_per_second": 513.453, | |
| "eval_steps_per_second": 8.237, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 41.0, | |
| "grad_norm": 0.0034711004700511694, | |
| "learning_rate": 2.95e-05, | |
| "loss": 0.0025, | |
| "step": 4346 | |
| }, | |
| { | |
| "epoch": 41.0, | |
| "eval_LOCATION_f1": 0.8157894736842106, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.775, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.7898089171974522, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7560975609756098, | |
| "eval_ORGANIZATION_recall": 0.8266666666666667, | |
| "eval_PERSON_f1": 0.912751677852349, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8774193548387097, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7586206896551724, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.340951144695282, | |
| "eval_overall_accuracy": 0.9614711033274956, | |
| "eval_overall_f1": 0.8415147265077138, | |
| "eval_overall_precision": 0.8021390374331551, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.361, | |
| "eval_samples_per_second": 518.055, | |
| "eval_steps_per_second": 8.311, | |
| "step": 4346 | |
| }, | |
| { | |
| "epoch": 42.0, | |
| "grad_norm": 0.02040654979646206, | |
| "learning_rate": 2.9e-05, | |
| "loss": 0.0012, | |
| "step": 4452 | |
| }, | |
| { | |
| "epoch": 42.0, | |
| "eval_LOCATION_f1": 0.8322147651006712, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8051948051948052, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8025477707006369, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7682926829268293, | |
| "eval_ORGANIZATION_recall": 0.84, | |
| "eval_PERSON_f1": 0.903010033444816, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8653846153846154, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.76, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.7037037037037037, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8076923076923077, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8076923076923077, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.3626217842102051, | |
| "eval_overall_accuracy": 0.9614711033274956, | |
| "eval_overall_f1": 0.8486562942008488, | |
| "eval_overall_precision": 0.8152173913043478, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.3631, | |
| "eval_samples_per_second": 515.064, | |
| "eval_steps_per_second": 8.263, | |
| "step": 4452 | |
| }, | |
| { | |
| "epoch": 43.0, | |
| "grad_norm": 0.001348801888525486, | |
| "learning_rate": 2.8499999999999998e-05, | |
| "loss": 0.003, | |
| "step": 4558 | |
| }, | |
| { | |
| "epoch": 43.0, | |
| "eval_LOCATION_f1": 0.816326530612245, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.7951807228915663, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7252747252747253, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.9060402684563759, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8709677419354839, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.7924528301886792, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.3544086813926697, | |
| "eval_overall_accuracy": 0.9587190392794596, | |
| "eval_overall_f1": 0.8391608391608392, | |
| "eval_overall_precision": 0.7978723404255319, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.3593, | |
| "eval_samples_per_second": 520.389, | |
| "eval_steps_per_second": 8.348, | |
| "step": 4558 | |
| }, | |
| { | |
| "epoch": 44.0, | |
| "grad_norm": 4.9029974937438965, | |
| "learning_rate": 2.8000000000000003e-05, | |
| "loss": 0.0027, | |
| "step": 4664 | |
| }, | |
| { | |
| "epoch": 44.0, | |
| "eval_LOCATION_f1": 0.8026315789473685, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7625, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.7999999999999999, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7157894736842105, | |
| "eval_ORGANIZATION_recall": 0.9066666666666666, | |
| "eval_PERSON_f1": 0.8940397350993377, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8490566037735849, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.7307692307692308, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6551724137931034, | |
| "eval_QUANTITY_recall": 0.8260869565217391, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3703295886516571, | |
| "eval_overall_accuracy": 0.9587190392794596, | |
| "eval_overall_f1": 0.8356164383561644, | |
| "eval_overall_precision": 0.7800511508951407, | |
| "eval_overall_recall": 0.8997050147492626, | |
| "eval_runtime": 0.3623, | |
| "eval_samples_per_second": 516.147, | |
| "eval_steps_per_second": 8.28, | |
| "step": 4664 | |
| }, | |
| { | |
| "epoch": 45.0, | |
| "grad_norm": 0.2568044662475586, | |
| "learning_rate": 2.7500000000000004e-05, | |
| "loss": 0.0015, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 45.0, | |
| "eval_LOCATION_f1": 0.8108108108108109, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7894736842105263, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.8354430379746836, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7951807228915663, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8910891089108911, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.84375, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8076923076923077, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8076923076923077, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.34526732563972473, | |
| "eval_overall_accuracy": 0.9604703527645734, | |
| "eval_overall_f1": 0.8438818565400844, | |
| "eval_overall_precision": 0.8064516129032258, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.3579, | |
| "eval_samples_per_second": 522.551, | |
| "eval_steps_per_second": 8.383, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 46.0, | |
| "grad_norm": 0.0012396867386996746, | |
| "learning_rate": 2.7000000000000002e-05, | |
| "loss": 0.0018, | |
| "step": 4876 | |
| }, | |
| { | |
| "epoch": 46.0, | |
| "eval_LOCATION_f1": 0.816326530612245, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.8170731707317072, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7528089887640449, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9060402684563759, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8709677419354839, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.693877551020408, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6538461538461539, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8235294117647058, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.84, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.3448871970176697, | |
| "eval_overall_accuracy": 0.961220915686765, | |
| "eval_overall_f1": 0.846262341325811, | |
| "eval_overall_precision": 0.8108108108108109, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.3635, | |
| "eval_samples_per_second": 514.485, | |
| "eval_steps_per_second": 8.254, | |
| "step": 4876 | |
| }, | |
| { | |
| "epoch": 47.0, | |
| "grad_norm": 1.6906110048294067, | |
| "learning_rate": 2.6500000000000004e-05, | |
| "loss": 0.0028, | |
| "step": 4982 | |
| }, | |
| { | |
| "epoch": 47.0, | |
| "eval_LOCATION_f1": 0.8137931034482759, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8082191780821918, | |
| "eval_LOCATION_recall": 0.8194444444444444, | |
| "eval_ORGANIZATION_f1": 0.8148148148148148, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7586206896551724, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.9060402684563759, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8709677419354839, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.37111541628837585, | |
| "eval_overall_accuracy": 0.9597197898423818, | |
| "eval_overall_f1": 0.8474576271186441, | |
| "eval_overall_precision": 0.8130081300813008, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.3591, | |
| "eval_samples_per_second": 520.775, | |
| "eval_steps_per_second": 8.355, | |
| "step": 4982 | |
| }, | |
| { | |
| "epoch": 48.0, | |
| "grad_norm": 0.029315035790205002, | |
| "learning_rate": 2.6000000000000002e-05, | |
| "loss": 0.0014, | |
| "step": 5088 | |
| }, | |
| { | |
| "epoch": 48.0, | |
| "eval_LOCATION_f1": 0.8251748251748252, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8309859154929577, | |
| "eval_LOCATION_recall": 0.8194444444444444, | |
| "eval_ORGANIZATION_f1": 0.8198757763975156, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7674418604651163, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.9090909090909092, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8766233766233766, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3521229922771454, | |
| "eval_overall_accuracy": 0.9632224168126094, | |
| "eval_overall_f1": 0.8522727272727273, | |
| "eval_overall_precision": 0.821917808219178, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.3694, | |
| "eval_samples_per_second": 506.192, | |
| "eval_steps_per_second": 8.121, | |
| "step": 5088 | |
| }, | |
| { | |
| "epoch": 49.0, | |
| "grad_norm": 0.02477916330099106, | |
| "learning_rate": 2.5500000000000003e-05, | |
| "loss": 0.0023, | |
| "step": 5194 | |
| }, | |
| { | |
| "epoch": 49.0, | |
| "eval_LOCATION_f1": 0.8187919463087249, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8129032258064516, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7875, | |
| "eval_ORGANIZATION_recall": 0.84, | |
| "eval_PERSON_f1": 0.8874172185430464, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8427672955974843, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.36508724093437195, | |
| "eval_overall_accuracy": 0.9592194145609206, | |
| "eval_overall_f1": 0.8394366197183099, | |
| "eval_overall_precision": 0.8032345013477089, | |
| "eval_overall_recall": 0.8790560471976401, | |
| "eval_runtime": 0.3605, | |
| "eval_samples_per_second": 518.761, | |
| "eval_steps_per_second": 8.322, | |
| "step": 5194 | |
| }, | |
| { | |
| "epoch": 50.0, | |
| "grad_norm": 0.017422163859009743, | |
| "learning_rate": 2.5e-05, | |
| "loss": 0.0027, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 50.0, | |
| "eval_LOCATION_f1": 0.8187919463087249, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9096989966555185, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8717948717948718, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.9230769230769231, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.9230769230769231, | |
| "eval_loss": 0.3326910436153412, | |
| "eval_overall_accuracy": 0.9614711033274956, | |
| "eval_overall_f1": 0.8607594936708861, | |
| "eval_overall_precision": 0.8225806451612904, | |
| "eval_overall_recall": 0.9026548672566371, | |
| "eval_runtime": 0.3722, | |
| "eval_samples_per_second": 502.368, | |
| "eval_steps_per_second": 8.059, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 51.0, | |
| "grad_norm": 0.00688315462321043, | |
| "learning_rate": 2.45e-05, | |
| "loss": 0.0009, | |
| "step": 5406 | |
| }, | |
| { | |
| "epoch": 51.0, | |
| "eval_LOCATION_f1": 0.8137931034482759, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8082191780821918, | |
| "eval_LOCATION_recall": 0.8194444444444444, | |
| "eval_ORGANIZATION_f1": 0.8387096774193549, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.8125, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.912751677852349, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8774193548387097, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.7083333333333334, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.68, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.9230769230769231, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.9230769230769231, | |
| "eval_TIME_recall": 0.9230769230769231, | |
| "eval_loss": 0.33154383301734924, | |
| "eval_overall_accuracy": 0.9659744808606455, | |
| "eval_overall_f1": 0.8624641833810888, | |
| "eval_overall_precision": 0.8384401114206128, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.358, | |
| "eval_samples_per_second": 522.281, | |
| "eval_steps_per_second": 8.379, | |
| "step": 5406 | |
| }, | |
| { | |
| "epoch": 52.0, | |
| "grad_norm": 0.0005034964415244758, | |
| "learning_rate": 2.4e-05, | |
| "loss": 0.001, | |
| "step": 5512 | |
| }, | |
| { | |
| "epoch": 52.0, | |
| "eval_LOCATION_f1": 0.7945205479452055, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7837837837837838, | |
| "eval_LOCATION_recall": 0.8055555555555556, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.912751677852349, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8774193548387097, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.9056603773584906, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8888888888888888, | |
| "eval_TIME_recall": 0.9230769230769231, | |
| "eval_loss": 0.3466086983680725, | |
| "eval_overall_accuracy": 0.960720540405304, | |
| "eval_overall_f1": 0.8531073446327683, | |
| "eval_overall_precision": 0.8184281842818428, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.3715, | |
| "eval_samples_per_second": 503.309, | |
| "eval_steps_per_second": 8.074, | |
| "step": 5512 | |
| }, | |
| { | |
| "epoch": 53.0, | |
| "grad_norm": 0.021436743438243866, | |
| "learning_rate": 2.35e-05, | |
| "loss": 0.0014, | |
| "step": 5618 | |
| }, | |
| { | |
| "epoch": 53.0, | |
| "eval_LOCATION_f1": 0.8108108108108109, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7894736842105263, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.8271604938271604, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7701149425287356, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9133333333333333, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8726114649681529, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8518518518518519, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8214285714285714, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.32782742381095886, | |
| "eval_overall_accuracy": 0.9609707280460346, | |
| "eval_overall_f1": 0.8515406162464986, | |
| "eval_overall_precision": 0.8106666666666666, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3599, | |
| "eval_samples_per_second": 519.612, | |
| "eval_steps_per_second": 8.336, | |
| "step": 5618 | |
| }, | |
| { | |
| "epoch": 54.0, | |
| "grad_norm": 0.0009922637837007642, | |
| "learning_rate": 2.3000000000000003e-05, | |
| "loss": 0.0007, | |
| "step": 5724 | |
| }, | |
| { | |
| "epoch": 54.0, | |
| "eval_LOCATION_f1": 0.8289473684210527, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7875, | |
| "eval_LOCATION_recall": 0.875, | |
| "eval_ORGANIZATION_f1": 0.7976190476190477, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7204301075268817, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.8910891089108911, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.84375, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.36466336250305176, | |
| "eval_overall_accuracy": 0.9589692269201902, | |
| "eval_overall_f1": 0.8406593406593406, | |
| "eval_overall_precision": 0.7866323907455013, | |
| "eval_overall_recall": 0.9026548672566371, | |
| "eval_runtime": 0.36, | |
| "eval_samples_per_second": 519.408, | |
| "eval_steps_per_second": 8.333, | |
| "step": 5724 | |
| }, | |
| { | |
| "epoch": 55.0, | |
| "grad_norm": 0.003993849270045757, | |
| "learning_rate": 2.25e-05, | |
| "loss": 0.0017, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 55.0, | |
| "eval_LOCATION_f1": 0.7947019867549668, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.759493670886076, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.7948717948717949, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7654320987654321, | |
| "eval_ORGANIZATION_recall": 0.8266666666666667, | |
| "eval_PERSON_f1": 0.9072847682119206, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8616352201257862, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.6274509803921569, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5714285714285714, | |
| "eval_QUANTITY_recall": 0.6956521739130435, | |
| "eval_TIME_f1": 0.7857142857142856, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7333333333333333, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3635990619659424, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8296089385474861, | |
| "eval_overall_precision": 0.7877984084880637, | |
| "eval_overall_recall": 0.8761061946902655, | |
| "eval_runtime": 0.3593, | |
| "eval_samples_per_second": 520.494, | |
| "eval_steps_per_second": 8.35, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 56.0, | |
| "grad_norm": 0.0005980022251605988, | |
| "learning_rate": 2.2000000000000003e-05, | |
| "loss": 0.0004, | |
| "step": 5936 | |
| }, | |
| { | |
| "epoch": 56.0, | |
| "eval_LOCATION_f1": 0.778523489932886, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7532467532467533, | |
| "eval_LOCATION_recall": 0.8055555555555556, | |
| "eval_ORGANIZATION_f1": 0.8516129032258064, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.825, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.9042904290429041, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.85625, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.6792452830188679, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8235294117647058, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.84, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.3733396530151367, | |
| "eval_overall_accuracy": 0.9597197898423818, | |
| "eval_overall_f1": 0.8438818565400844, | |
| "eval_overall_precision": 0.8064516129032258, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.3652, | |
| "eval_samples_per_second": 512.007, | |
| "eval_steps_per_second": 8.214, | |
| "step": 5936 | |
| }, | |
| { | |
| "epoch": 57.0, | |
| "grad_norm": 0.0007011191919445992, | |
| "learning_rate": 2.15e-05, | |
| "loss": 0.0009, | |
| "step": 6042 | |
| }, | |
| { | |
| "epoch": 57.0, | |
| "eval_LOCATION_f1": 0.8079470198675496, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7721518987341772, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.858974358974359, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.8271604938271605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.8970099667774087, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8544303797468354, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3640208840370178, | |
| "eval_overall_accuracy": 0.961220915686765, | |
| "eval_overall_f1": 0.849929873772791, | |
| "eval_overall_precision": 0.8101604278074866, | |
| "eval_overall_recall": 0.8938053097345132, | |
| "eval_runtime": 0.3606, | |
| "eval_samples_per_second": 518.592, | |
| "eval_steps_per_second": 8.32, | |
| "step": 6042 | |
| }, | |
| { | |
| "epoch": 58.0, | |
| "grad_norm": 0.0015956854913383722, | |
| "learning_rate": 2.1e-05, | |
| "loss": 0.0003, | |
| "step": 6148 | |
| }, | |
| { | |
| "epoch": 58.0, | |
| "eval_LOCATION_f1": 0.7973856209150327, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7530864197530864, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8220858895705522, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7613636363636364, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9023569023569024, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8701298701298701, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8518518518518519, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8214285714285714, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.3814009130001068, | |
| "eval_overall_accuracy": 0.9582186639979985, | |
| "eval_overall_f1": 0.8440111420612812, | |
| "eval_overall_precision": 0.7994722955145118, | |
| "eval_overall_recall": 0.8938053097345132, | |
| "eval_runtime": 0.3599, | |
| "eval_samples_per_second": 519.642, | |
| "eval_steps_per_second": 8.337, | |
| "step": 6148 | |
| }, | |
| { | |
| "epoch": 59.0, | |
| "grad_norm": 0.0003817932156380266, | |
| "learning_rate": 2.05e-05, | |
| "loss": 0.0005, | |
| "step": 6254 | |
| }, | |
| { | |
| "epoch": 59.0, | |
| "eval_LOCATION_f1": 0.802721088435374, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7866666666666666, | |
| "eval_LOCATION_recall": 0.8194444444444444, | |
| "eval_ORGANIZATION_f1": 0.8441558441558442, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.8227848101265823, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.9096989966555185, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8717948717948718, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.888888888888889, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8571428571428571, | |
| "eval_TIME_recall": 0.9230769230769231, | |
| "eval_loss": 0.3739457130432129, | |
| "eval_overall_accuracy": 0.9619714786089567, | |
| "eval_overall_f1": 0.8567375886524823, | |
| "eval_overall_precision": 0.825136612021858, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.3596, | |
| "eval_samples_per_second": 520.068, | |
| "eval_steps_per_second": 8.343, | |
| "step": 6254 | |
| }, | |
| { | |
| "epoch": 60.0, | |
| "grad_norm": 0.00037515757139772177, | |
| "learning_rate": 2e-05, | |
| "loss": 0.0005, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 60.0, | |
| "eval_LOCATION_f1": 0.8219178082191781, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8108108108108109, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.8354430379746836, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7951807228915663, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.9006622516556291, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8553459119496856, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8679245283018868, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8518518518518519, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.3766981363296509, | |
| "eval_overall_accuracy": 0.9604703527645734, | |
| "eval_overall_f1": 0.8547249647390691, | |
| "eval_overall_precision": 0.8189189189189189, | |
| "eval_overall_recall": 0.8938053097345132, | |
| "eval_runtime": 0.3687, | |
| "eval_samples_per_second": 507.159, | |
| "eval_steps_per_second": 8.136, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 61.0, | |
| "grad_norm": 0.00191974185872823, | |
| "learning_rate": 1.9500000000000003e-05, | |
| "loss": 0.0008, | |
| "step": 6466 | |
| }, | |
| { | |
| "epoch": 61.0, | |
| "eval_LOCATION_f1": 0.816326530612245, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.8333333333333334, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.8024691358024691, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.903654485049834, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8607594936708861, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8214285714285715, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7666666666666667, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.36986875534057617, | |
| "eval_overall_accuracy": 0.9622216662496873, | |
| "eval_overall_f1": 0.849507735583685, | |
| "eval_overall_precision": 0.8118279569892473, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.3616, | |
| "eval_samples_per_second": 517.178, | |
| "eval_steps_per_second": 8.297, | |
| "step": 6466 | |
| }, | |
| { | |
| "epoch": 62.0, | |
| "grad_norm": 1.7503353357315063, | |
| "learning_rate": 1.9e-05, | |
| "loss": 0.0016, | |
| "step": 6572 | |
| }, | |
| { | |
| "epoch": 62.0, | |
| "eval_LOCATION_f1": 0.8187919463087249, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.825, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7764705882352941, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8838709677419354, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8203592814371258, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8679245283018868, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8518518518518519, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.34973686933517456, | |
| "eval_overall_accuracy": 0.961220915686765, | |
| "eval_overall_f1": 0.8437067773167358, | |
| "eval_overall_precision": 0.7942708333333334, | |
| "eval_overall_recall": 0.8997050147492626, | |
| "eval_runtime": 0.364, | |
| "eval_samples_per_second": 513.749, | |
| "eval_steps_per_second": 8.242, | |
| "step": 6572 | |
| }, | |
| { | |
| "epoch": 63.0, | |
| "grad_norm": 0.0005617731949314475, | |
| "learning_rate": 1.85e-05, | |
| "loss": 0.0004, | |
| "step": 6678 | |
| }, | |
| { | |
| "epoch": 63.0, | |
| "eval_LOCATION_f1": 0.8299319727891157, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8133333333333334, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.834355828220859, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7727272727272727, | |
| "eval_ORGANIZATION_recall": 0.9066666666666666, | |
| "eval_PERSON_f1": 0.9210526315789473, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8695652173913043, | |
| "eval_PERSON_recall": 0.9790209790209791, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.7796610169491526, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.696969696969697, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.3623858094215393, | |
| "eval_overall_accuracy": 0.9617212909682261, | |
| "eval_overall_f1": 0.856353591160221, | |
| "eval_overall_precision": 0.8051948051948052, | |
| "eval_overall_recall": 0.9144542772861357, | |
| "eval_runtime": 0.3601, | |
| "eval_samples_per_second": 519.319, | |
| "eval_steps_per_second": 8.331, | |
| "step": 6678 | |
| }, | |
| { | |
| "epoch": 64.0, | |
| "grad_norm": 0.04498714208602905, | |
| "learning_rate": 1.8e-05, | |
| "loss": 0.0009, | |
| "step": 6784 | |
| }, | |
| { | |
| "epoch": 64.0, | |
| "eval_LOCATION_f1": 0.8435374149659863, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8266666666666667, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8374999999999999, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.788235294117647, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9006622516556291, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8553459119496856, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8518518518518519, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8214285714285714, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.37043052911758423, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8583450210378682, | |
| "eval_overall_precision": 0.8181818181818182, | |
| "eval_overall_recall": 0.9026548672566371, | |
| "eval_runtime": 0.36, | |
| "eval_samples_per_second": 519.423, | |
| "eval_steps_per_second": 8.333, | |
| "step": 6784 | |
| }, | |
| { | |
| "epoch": 65.0, | |
| "grad_norm": 0.0003102279151789844, | |
| "learning_rate": 1.75e-05, | |
| "loss": 0.001, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 65.0, | |
| "eval_LOCATION_f1": 0.8266666666666667, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7948717948717948, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8220858895705522, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7613636363636364, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9144736842105262, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8633540372670807, | |
| "eval_PERSON_recall": 0.972027972027972, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8679245283018868, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8518518518518519, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.3582930862903595, | |
| "eval_overall_accuracy": 0.96347260445334, | |
| "eval_overall_f1": 0.8583333333333333, | |
| "eval_overall_precision": 0.8110236220472441, | |
| "eval_overall_recall": 0.911504424778761, | |
| "eval_runtime": 0.3574, | |
| "eval_samples_per_second": 523.156, | |
| "eval_steps_per_second": 8.393, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 66.0, | |
| "grad_norm": 0.023364154621958733, | |
| "learning_rate": 1.7000000000000003e-05, | |
| "loss": 0.0001, | |
| "step": 6996 | |
| }, | |
| { | |
| "epoch": 66.0, | |
| "eval_LOCATION_f1": 0.7894736842105262, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.75, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.8387096774193549, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.8125, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.9139072847682119, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8679245283018868, | |
| "eval_PERSON_recall": 0.965034965034965, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8461538461538461, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8461538461538461, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.35251596570014954, | |
| "eval_overall_accuracy": 0.9627220415311484, | |
| "eval_overall_f1": 0.8523206751054851, | |
| "eval_overall_precision": 0.8145161290322581, | |
| "eval_overall_recall": 0.8938053097345132, | |
| "eval_runtime": 0.3673, | |
| "eval_samples_per_second": 509.16, | |
| "eval_steps_per_second": 8.168, | |
| "step": 6996 | |
| }, | |
| { | |
| "epoch": 67.0, | |
| "grad_norm": 0.0011218636063858867, | |
| "learning_rate": 1.65e-05, | |
| "loss": 0.0015, | |
| "step": 7102 | |
| }, | |
| { | |
| "epoch": 67.0, | |
| "eval_LOCATION_f1": 0.823529411764706, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7777777777777778, | |
| "eval_LOCATION_recall": 0.875, | |
| "eval_ORGANIZATION_f1": 0.8121212121212122, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7444444444444445, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9078947368421052, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8571428571428571, | |
| "eval_PERSON_recall": 0.965034965034965, | |
| "eval_QUANTITY_f1": 0.72, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6666666666666666, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.8679245283018868, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8518518518518519, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.37641996145248413, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8524137931034482, | |
| "eval_overall_precision": 0.8005181347150259, | |
| "eval_overall_recall": 0.911504424778761, | |
| "eval_runtime": 0.3613, | |
| "eval_samples_per_second": 517.565, | |
| "eval_steps_per_second": 8.303, | |
| "step": 7102 | |
| }, | |
| { | |
| "epoch": 68.0, | |
| "grad_norm": 0.0007424333016388118, | |
| "learning_rate": 1.6000000000000003e-05, | |
| "loss": 0.0006, | |
| "step": 7208 | |
| }, | |
| { | |
| "epoch": 68.0, | |
| "eval_LOCATION_f1": 0.8356164383561645, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8243243243243243, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.7878787878787877, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7222222222222222, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.9133333333333333, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8726114649681529, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.7058823529411765, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6428571428571429, | |
| "eval_QUANTITY_recall": 0.782608695652174, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3496319651603699, | |
| "eval_overall_accuracy": 0.9594696022016512, | |
| "eval_overall_f1": 0.8475524475524475, | |
| "eval_overall_precision": 0.8058510638297872, | |
| "eval_overall_recall": 0.8938053097345132, | |
| "eval_runtime": 0.3711, | |
| "eval_samples_per_second": 503.904, | |
| "eval_steps_per_second": 8.084, | |
| "step": 7208 | |
| }, | |
| { | |
| "epoch": 69.0, | |
| "grad_norm": 0.008528614416718483, | |
| "learning_rate": 1.55e-05, | |
| "loss": 0.0008, | |
| "step": 7314 | |
| }, | |
| { | |
| "epoch": 69.0, | |
| "eval_LOCATION_f1": 0.8187919463087249, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8000000000000002, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.775, | |
| "eval_ORGANIZATION_recall": 0.8266666666666667, | |
| "eval_PERSON_f1": 0.8970099667774087, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8544303797468354, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.693877551020408, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6538461538461539, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.34753233194351196, | |
| "eval_overall_accuracy": 0.9594696022016512, | |
| "eval_overall_f1": 0.8401697312588402, | |
| "eval_overall_precision": 0.8070652173913043, | |
| "eval_overall_recall": 0.8761061946902655, | |
| "eval_runtime": 0.3588, | |
| "eval_samples_per_second": 521.137, | |
| "eval_steps_per_second": 8.36, | |
| "step": 7314 | |
| }, | |
| { | |
| "epoch": 70.0, | |
| "grad_norm": 0.014132479205727577, | |
| "learning_rate": 1.5e-05, | |
| "loss": 0.0, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 70.0, | |
| "eval_LOCATION_f1": 0.8356164383561645, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8243243243243243, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8121212121212122, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7444444444444445, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.8844884488448846, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8375, | |
| "eval_PERSON_recall": 0.9370629370629371, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8214285714285715, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7666666666666667, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.3662912845611572, | |
| "eval_overall_accuracy": 0.9592194145609206, | |
| "eval_overall_f1": 0.8388888888888889, | |
| "eval_overall_precision": 0.7926509186351706, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.4097, | |
| "eval_samples_per_second": 456.444, | |
| "eval_steps_per_second": 7.323, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 71.0, | |
| "grad_norm": 0.0005066086887381971, | |
| "learning_rate": 1.45e-05, | |
| "loss": 0.0002, | |
| "step": 7526 | |
| }, | |
| { | |
| "epoch": 71.0, | |
| "eval_LOCATION_f1": 0.8055555555555556, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8055555555555556, | |
| "eval_LOCATION_recall": 0.8055555555555556, | |
| "eval_ORGANIZATION_f1": 0.8170731707317072, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7528089887640449, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9194630872483223, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8838709677419355, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.3715399205684662, | |
| "eval_overall_accuracy": 0.9597197898423818, | |
| "eval_overall_f1": 0.849507735583685, | |
| "eval_overall_precision": 0.8118279569892473, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.3561, | |
| "eval_samples_per_second": 525.071, | |
| "eval_steps_per_second": 8.424, | |
| "step": 7526 | |
| }, | |
| { | |
| "epoch": 72.0, | |
| "grad_norm": 0.00028915383154526353, | |
| "learning_rate": 1.4000000000000001e-05, | |
| "loss": 0.0001, | |
| "step": 7632 | |
| }, | |
| { | |
| "epoch": 72.0, | |
| "eval_LOCATION_f1": 0.8435374149659863, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8266666666666667, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8072289156626506, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7362637362637363, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9163879598662208, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8782051282051282, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8214285714285715, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7666666666666667, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.3853207230567932, | |
| "eval_overall_accuracy": 0.9587190392794596, | |
| "eval_overall_f1": 0.8523676880222841, | |
| "eval_overall_precision": 0.8073878627968337, | |
| "eval_overall_recall": 0.9026548672566371, | |
| "eval_runtime": 0.362, | |
| "eval_samples_per_second": 516.586, | |
| "eval_steps_per_second": 8.287, | |
| "step": 7632 | |
| }, | |
| { | |
| "epoch": 73.0, | |
| "grad_norm": 0.0008943734574131668, | |
| "learning_rate": 1.3500000000000001e-05, | |
| "loss": 0.0007, | |
| "step": 7738 | |
| }, | |
| { | |
| "epoch": 73.0, | |
| "eval_LOCATION_f1": 0.8275862068965517, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.821917808219178, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.8198757763975156, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7674418604651163, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.9060402684563759, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8709677419354839, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8461538461538461, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8461538461538461, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.35061854124069214, | |
| "eval_overall_accuracy": 0.9599699774831123, | |
| "eval_overall_f1": 0.8498583569405098, | |
| "eval_overall_precision": 0.8174386920980926, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.357, | |
| "eval_samples_per_second": 523.747, | |
| "eval_steps_per_second": 8.402, | |
| "step": 7738 | |
| }, | |
| { | |
| "epoch": 74.0, | |
| "grad_norm": 0.0004187956510577351, | |
| "learning_rate": 1.3000000000000001e-05, | |
| "loss": 0.0002, | |
| "step": 7844 | |
| }, | |
| { | |
| "epoch": 74.0, | |
| "eval_LOCATION_f1": 0.8322147651006712, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8051948051948052, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8095238095238095, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7311827956989247, | |
| "eval_ORGANIZATION_recall": 0.9066666666666666, | |
| "eval_PERSON_f1": 0.9163879598662208, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8782051282051282, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.6538461538461539, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5862068965517241, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8148148148148148, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7857142857142857, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.4027647078037262, | |
| "eval_overall_accuracy": 0.9584688516387291, | |
| "eval_overall_f1": 0.847645429362881, | |
| "eval_overall_precision": 0.7989556135770235, | |
| "eval_overall_recall": 0.9026548672566371, | |
| "eval_runtime": 0.3573, | |
| "eval_samples_per_second": 523.424, | |
| "eval_steps_per_second": 8.397, | |
| "step": 7844 | |
| }, | |
| { | |
| "epoch": 75.0, | |
| "grad_norm": 0.0005983862793073058, | |
| "learning_rate": 1.25e-05, | |
| "loss": 0.0, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 75.0, | |
| "eval_LOCATION_f1": 0.816326530612245, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8, | |
| "eval_LOCATION_recall": 0.8333333333333334, | |
| "eval_ORGANIZATION_f1": 0.825, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7764705882352941, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.9096989966555185, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8717948717948718, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3929165005683899, | |
| "eval_overall_accuracy": 0.960720540405304, | |
| "eval_overall_f1": 0.8478873239436621, | |
| "eval_overall_precision": 0.8113207547169812, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.3576, | |
| "eval_samples_per_second": 522.919, | |
| "eval_steps_per_second": 8.389, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 76.0, | |
| "grad_norm": 0.00021465642203111202, | |
| "learning_rate": 1.2e-05, | |
| "loss": 0.0002, | |
| "step": 8056 | |
| }, | |
| { | |
| "epoch": 76.0, | |
| "eval_LOCATION_f1": 0.8181818181818181, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7682926829268293, | |
| "eval_LOCATION_recall": 0.875, | |
| "eval_ORGANIZATION_f1": 0.8271604938271604, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7701149425287356, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9194630872483223, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8838709677419355, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.4091399908065796, | |
| "eval_overall_accuracy": 0.960720540405304, | |
| "eval_overall_f1": 0.8527777777777777, | |
| "eval_overall_precision": 0.8057742782152231, | |
| "eval_overall_recall": 0.9056047197640118, | |
| "eval_runtime": 0.3609, | |
| "eval_samples_per_second": 518.107, | |
| "eval_steps_per_second": 8.312, | |
| "step": 8056 | |
| }, | |
| { | |
| "epoch": 77.0, | |
| "grad_norm": 0.00041957717621698976, | |
| "learning_rate": 1.1500000000000002e-05, | |
| "loss": 0.0, | |
| "step": 8162 | |
| }, | |
| { | |
| "epoch": 77.0, | |
| "eval_LOCATION_f1": 0.8344370860927153, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7974683544303798, | |
| "eval_LOCATION_recall": 0.875, | |
| "eval_ORGANIZATION_f1": 0.8271604938271604, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7701149425287356, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.903010033444816, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8653846153846154, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3996489346027374, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8491620111731844, | |
| "eval_overall_precision": 0.8063660477453581, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3555, | |
| "eval_samples_per_second": 526.025, | |
| "eval_steps_per_second": 8.439, | |
| "step": 8162 | |
| }, | |
| { | |
| "epoch": 78.0, | |
| "grad_norm": 0.0018605925142765045, | |
| "learning_rate": 1.1000000000000001e-05, | |
| "loss": 0.0, | |
| "step": 8268 | |
| }, | |
| { | |
| "epoch": 78.0, | |
| "eval_LOCATION_f1": 0.8266666666666667, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7948717948717948, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8198757763975156, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7674418604651163, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.9, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8598726114649682, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3973155617713928, | |
| "eval_overall_accuracy": 0.9597197898423818, | |
| "eval_overall_f1": 0.8447552447552448, | |
| "eval_overall_precision": 0.8031914893617021, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.3588, | |
| "eval_samples_per_second": 521.17, | |
| "eval_steps_per_second": 8.361, | |
| "step": 8268 | |
| }, | |
| { | |
| "epoch": 79.0, | |
| "grad_norm": 0.0009037918644025922, | |
| "learning_rate": 1.05e-05, | |
| "loss": 0.0, | |
| "step": 8374 | |
| }, | |
| { | |
| "epoch": 79.0, | |
| "eval_LOCATION_f1": 0.8211920529801324, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7848101265822784, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.825, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7764705882352941, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.903010033444816, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8653846153846154, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3981226086616516, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.84593837535014, | |
| "eval_overall_precision": 0.8053333333333333, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.3579, | |
| "eval_samples_per_second": 522.564, | |
| "eval_steps_per_second": 8.383, | |
| "step": 8374 | |
| }, | |
| { | |
| "epoch": 80.0, | |
| "grad_norm": 0.0010246345773339272, | |
| "learning_rate": 1e-05, | |
| "loss": 0.0, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 80.0, | |
| "eval_LOCATION_f1": 0.8344370860927153, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7974683544303798, | |
| "eval_LOCATION_recall": 0.875, | |
| "eval_ORGANIZATION_f1": 0.8198757763975156, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7674418604651163, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.903010033444816, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8653846153846154, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.4011876583099365, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8475524475524475, | |
| "eval_overall_precision": 0.8058510638297872, | |
| "eval_overall_recall": 0.8938053097345132, | |
| "eval_runtime": 0.38, | |
| "eval_samples_per_second": 492.061, | |
| "eval_steps_per_second": 7.894, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 81.0, | |
| "grad_norm": 0.00019219562818761915, | |
| "learning_rate": 9.5e-06, | |
| "loss": 0.0006, | |
| "step": 8586 | |
| }, | |
| { | |
| "epoch": 81.0, | |
| "eval_LOCATION_f1": 0.8266666666666667, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7948717948717948, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8271604938271604, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7701149425287356, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8598726114649682, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.6538461538461539, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.5862068965517241, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8518518518518519, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8214285714285714, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.4144229590892792, | |
| "eval_overall_accuracy": 0.9597197898423818, | |
| "eval_overall_f1": 0.8467966573816156, | |
| "eval_overall_precision": 0.8021108179419525, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3556, | |
| "eval_samples_per_second": 525.889, | |
| "eval_steps_per_second": 8.437, | |
| "step": 8586 | |
| }, | |
| { | |
| "epoch": 82.0, | |
| "grad_norm": 0.000247513729846105, | |
| "learning_rate": 9e-06, | |
| "loss": 0.0, | |
| "step": 8692 | |
| }, | |
| { | |
| "epoch": 82.0, | |
| "eval_LOCATION_f1": 0.8211920529801324, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7848101265822784, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8227848101265823, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7831325301204819, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.9, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8598726114649682, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.40510478615760803, | |
| "eval_overall_accuracy": 0.9594696022016512, | |
| "eval_overall_f1": 0.8455056179775281, | |
| "eval_overall_precision": 0.806970509383378, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.3705, | |
| "eval_samples_per_second": 504.754, | |
| "eval_steps_per_second": 8.098, | |
| "step": 8692 | |
| }, | |
| { | |
| "epoch": 83.0, | |
| "grad_norm": 0.0001593719352968037, | |
| "learning_rate": 8.500000000000002e-06, | |
| "loss": 0.0006, | |
| "step": 8798 | |
| }, | |
| { | |
| "epoch": 83.0, | |
| "eval_LOCATION_f1": 0.8104575163398693, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7654320987654321, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8048780487804879, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7415730337078652, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.8970099667774087, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8544303797468354, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8518518518518519, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8214285714285714, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.4076941907405853, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8381742738589212, | |
| "eval_overall_precision": 0.7890625, | |
| "eval_overall_recall": 0.8938053097345132, | |
| "eval_runtime": 0.3564, | |
| "eval_samples_per_second": 524.736, | |
| "eval_steps_per_second": 8.418, | |
| "step": 8798 | |
| }, | |
| { | |
| "epoch": 84.0, | |
| "grad_norm": 0.0038378555327653885, | |
| "learning_rate": 8.000000000000001e-06, | |
| "loss": 0.0004, | |
| "step": 8904 | |
| }, | |
| { | |
| "epoch": 84.0, | |
| "eval_LOCATION_f1": 0.8187919463087249, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8280254777070064, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7926829268292683, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.903010033444816, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8653846153846154, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.39616209268569946, | |
| "eval_overall_accuracy": 0.960720540405304, | |
| "eval_overall_f1": 0.8474576271186441, | |
| "eval_overall_precision": 0.8130081300813008, | |
| "eval_overall_recall": 0.8849557522123894, | |
| "eval_runtime": 0.359, | |
| "eval_samples_per_second": 520.922, | |
| "eval_steps_per_second": 8.357, | |
| "step": 8904 | |
| }, | |
| { | |
| "epoch": 85.0, | |
| "grad_norm": 0.0006832346552982926, | |
| "learning_rate": 7.5e-06, | |
| "loss": 0.0005, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 85.0, | |
| "eval_LOCATION_f1": 0.8243243243243243, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8026315789473685, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8235294117647058, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.8076923076923077, | |
| "eval_ORGANIZATION_recall": 0.84, | |
| "eval_PERSON_f1": 0.9158249158249158, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8831168831168831, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8461538461538461, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8461538461538461, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.38612908124923706, | |
| "eval_overall_accuracy": 0.9617212909682261, | |
| "eval_overall_f1": 0.8542857142857142, | |
| "eval_overall_precision": 0.8282548476454293, | |
| "eval_overall_recall": 0.8820058997050148, | |
| "eval_runtime": 0.3569, | |
| "eval_samples_per_second": 523.906, | |
| "eval_steps_per_second": 8.405, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 86.0, | |
| "grad_norm": 0.0012918419670313597, | |
| "learning_rate": 7.000000000000001e-06, | |
| "loss": 0.0, | |
| "step": 9116 | |
| }, | |
| { | |
| "epoch": 86.0, | |
| "eval_LOCATION_f1": 0.8187919463087249, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7922077922077922, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8176100628930819, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7738095238095238, | |
| "eval_ORGANIZATION_recall": 0.8666666666666667, | |
| "eval_PERSON_f1": 0.9096989966555185, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8717948717948718, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.693877551020408, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6538461538461539, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.39533165097236633, | |
| "eval_overall_accuracy": 0.9609707280460346, | |
| "eval_overall_f1": 0.8490832157968972, | |
| "eval_overall_precision": 0.8135135135135135, | |
| "eval_overall_recall": 0.887905604719764, | |
| "eval_runtime": 0.3669, | |
| "eval_samples_per_second": 509.639, | |
| "eval_steps_per_second": 8.176, | |
| "step": 9116 | |
| }, | |
| { | |
| "epoch": 87.0, | |
| "grad_norm": 0.00013653105997946113, | |
| "learning_rate": 6.5000000000000004e-06, | |
| "loss": 0.0003, | |
| "step": 9222 | |
| }, | |
| { | |
| "epoch": 87.0, | |
| "eval_LOCATION_f1": 0.8211920529801324, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7848101265822784, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8220858895705522, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7613636363636364, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9042904290429041, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.85625, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.7924528301886792, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.41302046179771423, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8432732316227461, | |
| "eval_overall_precision": 0.7958115183246073, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3613, | |
| "eval_samples_per_second": 517.561, | |
| "eval_steps_per_second": 8.303, | |
| "step": 9222 | |
| }, | |
| { | |
| "epoch": 88.0, | |
| "grad_norm": 0.0001936595799634233, | |
| "learning_rate": 6e-06, | |
| "loss": 0.0004, | |
| "step": 9328 | |
| }, | |
| { | |
| "epoch": 88.0, | |
| "eval_LOCATION_f1": 0.8211920529801324, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7848101265822784, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8220858895705522, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7613636363636364, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9006622516556291, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8553459119496856, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.7924528301886792, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.41551852226257324, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8416666666666667, | |
| "eval_overall_precision": 0.7952755905511811, | |
| "eval_overall_recall": 0.8938053097345132, | |
| "eval_runtime": 0.3626, | |
| "eval_samples_per_second": 515.716, | |
| "eval_steps_per_second": 8.274, | |
| "step": 9328 | |
| }, | |
| { | |
| "epoch": 89.0, | |
| "grad_norm": 0.000983737176284194, | |
| "learning_rate": 5.500000000000001e-06, | |
| "loss": 0.0, | |
| "step": 9434 | |
| }, | |
| { | |
| "epoch": 89.0, | |
| "eval_LOCATION_f1": 0.8211920529801324, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7848101265822784, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8220858895705522, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7613636363636364, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9006622516556291, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8553459119496856, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.7924528301886792, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7777777777777778, | |
| "eval_TIME_recall": 0.8076923076923077, | |
| "eval_loss": 0.4156357944011688, | |
| "eval_overall_accuracy": 0.9602201651238429, | |
| "eval_overall_f1": 0.8416666666666667, | |
| "eval_overall_precision": 0.7952755905511811, | |
| "eval_overall_recall": 0.8938053097345132, | |
| "eval_runtime": 0.3581, | |
| "eval_samples_per_second": 522.251, | |
| "eval_steps_per_second": 8.378, | |
| "step": 9434 | |
| }, | |
| { | |
| "epoch": 90.0, | |
| "grad_norm": 0.001763033214956522, | |
| "learning_rate": 5e-06, | |
| "loss": 0.0002, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 90.0, | |
| "eval_LOCATION_f1": 0.8266666666666667, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7948717948717948, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8198757763975156, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7674418604651163, | |
| "eval_ORGANIZATION_recall": 0.88, | |
| "eval_PERSON_f1": 0.9090909090909092, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8766233766233766, | |
| "eval_PERSON_recall": 0.9440559440559441, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.404066801071167, | |
| "eval_overall_accuracy": 0.9614711033274956, | |
| "eval_overall_f1": 0.849507735583685, | |
| "eval_overall_precision": 0.8118279569892473, | |
| "eval_overall_recall": 0.8908554572271387, | |
| "eval_runtime": 0.3736, | |
| "eval_samples_per_second": 500.522, | |
| "eval_steps_per_second": 8.03, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 91.0, | |
| "grad_norm": 0.0002766927646007389, | |
| "learning_rate": 4.5e-06, | |
| "loss": 0.0002, | |
| "step": 9646 | |
| }, | |
| { | |
| "epoch": 91.0, | |
| "eval_LOCATION_f1": 0.8322147651006712, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8051948051948052, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9158249158249158, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8831168831168831, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3980797231197357, | |
| "eval_overall_accuracy": 0.9617212909682261, | |
| "eval_overall_f1": 0.8551336146272857, | |
| "eval_overall_precision": 0.8172043010752689, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3573, | |
| "eval_samples_per_second": 523.342, | |
| "eval_steps_per_second": 8.396, | |
| "step": 9646 | |
| }, | |
| { | |
| "epoch": 92.0, | |
| "grad_norm": 0.0008579469285905361, | |
| "learning_rate": 4.000000000000001e-06, | |
| "loss": 0.0, | |
| "step": 9752 | |
| }, | |
| { | |
| "epoch": 92.0, | |
| "eval_LOCATION_f1": 0.8322147651006712, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8051948051948052, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9158249158249158, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8831168831168831, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.693877551020408, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6538461538461539, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.830188679245283, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.8148148148148148, | |
| "eval_TIME_recall": 0.8461538461538461, | |
| "eval_loss": 0.3970873951911926, | |
| "eval_overall_accuracy": 0.9617212909682261, | |
| "eval_overall_f1": 0.8575458392101551, | |
| "eval_overall_precision": 0.8216216216216217, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3615, | |
| "eval_samples_per_second": 517.255, | |
| "eval_steps_per_second": 8.298, | |
| "step": 9752 | |
| }, | |
| { | |
| "epoch": 93.0, | |
| "grad_norm": 0.00014306257071439177, | |
| "learning_rate": 3.5000000000000004e-06, | |
| "loss": 0.0, | |
| "step": 9858 | |
| }, | |
| { | |
| "epoch": 93.0, | |
| "eval_LOCATION_f1": 0.8266666666666667, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.7948717948717948, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9194630872483223, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8838709677419355, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.4024323523044586, | |
| "eval_overall_accuracy": 0.9614711033274956, | |
| "eval_overall_f1": 0.8559440559440559, | |
| "eval_overall_precision": 0.8138297872340425, | |
| "eval_overall_recall": 0.9026548672566371, | |
| "eval_runtime": 0.3607, | |
| "eval_samples_per_second": 518.421, | |
| "eval_steps_per_second": 8.317, | |
| "step": 9858 | |
| }, | |
| { | |
| "epoch": 94.0, | |
| "grad_norm": 0.00042846077121794224, | |
| "learning_rate": 3e-06, | |
| "loss": 0.0, | |
| "step": 9964 | |
| }, | |
| { | |
| "epoch": 94.0, | |
| "eval_LOCATION_f1": 0.8322147651006712, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8051948051948052, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9194630872483223, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8838709677419355, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.3985014855861664, | |
| "eval_overall_accuracy": 0.9619714786089567, | |
| "eval_overall_f1": 0.8583450210378682, | |
| "eval_overall_precision": 0.8181818181818182, | |
| "eval_overall_recall": 0.9026548672566371, | |
| "eval_runtime": 0.3651, | |
| "eval_samples_per_second": 512.194, | |
| "eval_steps_per_second": 8.217, | |
| "step": 9964 | |
| }, | |
| { | |
| "epoch": 95.0, | |
| "grad_norm": 0.000827198673505336, | |
| "learning_rate": 2.5e-06, | |
| "loss": 0.0, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 95.0, | |
| "eval_LOCATION_f1": 0.8322147651006712, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8051948051948052, | |
| "eval_LOCATION_recall": 0.8611111111111112, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9194630872483223, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8838709677419355, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.6666666666666666, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6071428571428571, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.39939987659454346, | |
| "eval_overall_accuracy": 0.9617212909682261, | |
| "eval_overall_f1": 0.8571428571428571, | |
| "eval_overall_precision": 0.816, | |
| "eval_overall_recall": 0.9026548672566371, | |
| "eval_runtime": 0.358, | |
| "eval_samples_per_second": 522.401, | |
| "eval_steps_per_second": 8.381, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 96.0, | |
| "grad_norm": 0.0002911574556492269, | |
| "learning_rate": 2.0000000000000003e-06, | |
| "loss": 0.0003, | |
| "step": 10176 | |
| }, | |
| { | |
| "epoch": 96.0, | |
| "eval_LOCATION_f1": 0.8243243243243243, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8026315789473685, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.912751677852349, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8774193548387097, | |
| "eval_PERSON_recall": 0.951048951048951, | |
| "eval_QUANTITY_f1": 0.693877551020408, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6538461538461539, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.39506107568740845, | |
| "eval_overall_accuracy": 0.961220915686765, | |
| "eval_overall_f1": 0.8551336146272857, | |
| "eval_overall_precision": 0.8172043010752689, | |
| "eval_overall_recall": 0.8967551622418879, | |
| "eval_runtime": 0.3613, | |
| "eval_samples_per_second": 517.554, | |
| "eval_steps_per_second": 8.303, | |
| "step": 10176 | |
| }, | |
| { | |
| "epoch": 97.0, | |
| "grad_norm": 0.0003046900383196771, | |
| "learning_rate": 1.5e-06, | |
| "loss": 0.0005, | |
| "step": 10282 | |
| }, | |
| { | |
| "epoch": 97.0, | |
| "eval_LOCATION_f1": 0.8243243243243243, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8026315789473685, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9133333333333333, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8726114649681529, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.4083447754383087, | |
| "eval_overall_accuracy": 0.9609707280460346, | |
| "eval_overall_f1": 0.854341736694678, | |
| "eval_overall_precision": 0.8133333333333334, | |
| "eval_overall_recall": 0.8997050147492626, | |
| "eval_runtime": 0.3599, | |
| "eval_samples_per_second": 519.582, | |
| "eval_steps_per_second": 8.336, | |
| "step": 10282 | |
| }, | |
| { | |
| "epoch": 98.0, | |
| "grad_norm": 0.00015339584206230938, | |
| "learning_rate": 1.0000000000000002e-06, | |
| "loss": 0.0, | |
| "step": 10388 | |
| }, | |
| { | |
| "epoch": 98.0, | |
| "eval_LOCATION_f1": 0.8243243243243243, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8026315789473685, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9194630872483223, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8838709677419355, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.407378226518631, | |
| "eval_overall_accuracy": 0.9614711033274956, | |
| "eval_overall_f1": 0.8567415730337079, | |
| "eval_overall_precision": 0.8176943699731903, | |
| "eval_overall_recall": 0.8997050147492626, | |
| "eval_runtime": 0.3669, | |
| "eval_samples_per_second": 509.703, | |
| "eval_steps_per_second": 8.177, | |
| "step": 10388 | |
| }, | |
| { | |
| "epoch": 99.0, | |
| "grad_norm": 0.0002479134127497673, | |
| "learning_rate": 5.000000000000001e-07, | |
| "loss": 0.0, | |
| "step": 10494 | |
| }, | |
| { | |
| "epoch": 99.0, | |
| "eval_LOCATION_f1": 0.8243243243243243, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8026315789473685, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9194630872483223, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8838709677419355, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.4076772630214691, | |
| "eval_overall_accuracy": 0.9614711033274956, | |
| "eval_overall_f1": 0.8567415730337079, | |
| "eval_overall_precision": 0.8176943699731903, | |
| "eval_overall_recall": 0.8997050147492626, | |
| "eval_runtime": 0.3589, | |
| "eval_samples_per_second": 521.056, | |
| "eval_steps_per_second": 8.359, | |
| "step": 10494 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "grad_norm": 0.00025577095220796764, | |
| "learning_rate": 0.0, | |
| "loss": 0.0001, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "eval_LOCATION_f1": 0.8243243243243243, | |
| "eval_LOCATION_number": 72, | |
| "eval_LOCATION_precision": 0.8026315789473685, | |
| "eval_LOCATION_recall": 0.8472222222222222, | |
| "eval_ORGANIZATION_f1": 0.8322981366459627, | |
| "eval_ORGANIZATION_number": 75, | |
| "eval_ORGANIZATION_precision": 0.7790697674418605, | |
| "eval_ORGANIZATION_recall": 0.8933333333333333, | |
| "eval_PERSON_f1": 0.9194630872483223, | |
| "eval_PERSON_number": 143, | |
| "eval_PERSON_precision": 0.8838709677419355, | |
| "eval_PERSON_recall": 0.958041958041958, | |
| "eval_QUANTITY_f1": 0.68, | |
| "eval_QUANTITY_number": 23, | |
| "eval_QUANTITY_precision": 0.6296296296296297, | |
| "eval_QUANTITY_recall": 0.7391304347826086, | |
| "eval_TIME_f1": 0.8363636363636363, | |
| "eval_TIME_number": 26, | |
| "eval_TIME_precision": 0.7931034482758621, | |
| "eval_TIME_recall": 0.8846153846153846, | |
| "eval_loss": 0.40795865654945374, | |
| "eval_overall_accuracy": 0.9614711033274956, | |
| "eval_overall_f1": 0.8567415730337079, | |
| "eval_overall_precision": 0.8176943699731903, | |
| "eval_overall_recall": 0.8997050147492626, | |
| "eval_runtime": 0.3623, | |
| "eval_samples_per_second": 516.187, | |
| "eval_steps_per_second": 8.281, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 100.0, | |
| "step": 10600, | |
| "total_flos": 4502314993613766.0, | |
| "train_loss": 0.008934246277599155, | |
| "train_runtime": 970.249, | |
| "train_samples_per_second": 173.873, | |
| "train_steps_per_second": 10.925 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 10600, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 100, | |
| "save_steps": 500, | |
| "total_flos": 4502314993613766.0, | |
| "train_batch_size": 16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |