{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 0.8466603951081844, "eval_steps": 500, "global_step": 900, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0, "eval/E1/acc_on_CONSISTENT": 0.16435185185185186, "eval/E1/acc_on_INCONSISTENT": 0.9875, "eval/E1/accuracy": 0.29296875, "eval/E1/f1_INC": 0.3038461538461539, "eval/E1/precision_INC": 0.17954545454545454, "eval/E1/recall_INC": 0.9875, "eval/E2/acc_on_CONSISTENT": 0.6785714285714286, "eval/E2/acc_on_INCONSISTENT": 0.9594594594594594, "eval/E2/accuracy": 0.759765625, "eval/E2/f1_INC": 0.6977886977886979, "eval/E2/precision_INC": 0.5482625482625483, "eval/E2/recall_INC": 0.9594594594594594, "eval/E3/acc_on_CONSISTENT": 0.07098765432098765, "eval/E3/acc_on_INCONSISTENT": 0.9680851063829787, "eval/E3/accuracy": 0.400390625, "eval/E3/f1_INC": 0.5424739195230999, "eval/E3/precision_INC": 0.37681159420289856, "eval/E3/recall_INC": 0.9680851063829787, "eval/E4/acc_on_CONSISTENT": 0.0529595015576324, "eval/E4/acc_on_INCONSISTENT": 0.9476439790575916, "eval/E4/accuracy": 0.38671875, "eval/E4/f1_INC": 0.5355029585798816, "eval/E4/precision_INC": 0.3731958762886598, "eval/E4/recall_INC": 0.9476439790575916, "eval/edge_macro_accuracy": 0.4599609375, "eval/malformed_rate": 0.0, "eval/n_eval": 512.0, "eval/overall/acc_on_CONSISTENT": 0.08133971291866028, "eval/overall/acc_on_INCONSISTENT": 0.966996699669967, "eval/overall/accuracy": 0.60546875, "eval/overall/f1_INC": 0.7436548223350254, "eval/overall/precision_INC": 0.6041237113402061, "eval/overall/recall_INC": 0.966996699669967, "eval/overall_exact_match": 0.064453125, "eval_label": "start", "step": 0 }, { "epoch": 0.01881467544684854, "grad_norm": 0.13588111102581024, "learning_rate": 5.9375e-05, "loss": 0.0936, "step": 20 }, { "epoch": 0.03762935089369708, "grad_norm": 0.15987196564674377, "learning_rate": 9.932104752667314e-05, "loss": 0.0348, "step": 40 }, { "epoch": 0.05644402634054563, "grad_norm": 0.14962074160575867, "learning_rate": 9.73811833171678e-05, "loss": 0.0273, "step": 60 }, { "epoch": 0.07525870178739416, "grad_norm": 0.1912640929222107, "learning_rate": 9.544131910766246e-05, "loss": 0.0248, "step": 80 }, { "epoch": 0.09407337723424271, "eval/E1/acc_on_CONSISTENT": 0.8819444444444444, "eval/E1/acc_on_INCONSISTENT": 0.4625, "eval/E1/accuracy": 0.81640625, "eval/E1/f1_INC": 0.44047619047619047, "eval/E1/precision_INC": 0.42045454545454547, "eval/E1/recall_INC": 0.4625, "eval/E2/acc_on_CONSISTENT": 0.9752747252747253, "eval/E2/acc_on_INCONSISTENT": 0.8243243243243243, "eval/E2/accuracy": 0.931640625, "eval/E2/f1_INC": 0.8745519713261649, "eval/E2/precision_INC": 0.9312977099236641, "eval/E2/recall_INC": 0.8243243243243243, "eval/E3/acc_on_CONSISTENT": 0.8179012345679012, "eval/E3/acc_on_INCONSISTENT": 0.6968085106382979, "eval/E3/accuracy": 0.7734375, "eval/E3/f1_INC": 0.6931216931216931, "eval/E3/precision_INC": 0.6894736842105263, "eval/E3/recall_INC": 0.6968085106382979, "eval/E4/acc_on_CONSISTENT": 0.8629283489096573, "eval/E4/acc_on_INCONSISTENT": 0.7068062827225131, "eval/E4/accuracy": 0.8046875, "eval/E4/f1_INC": 0.7297297297297297, "eval/E4/precision_INC": 0.7541899441340782, "eval/E4/recall_INC": 0.7068062827225131, "eval/edge_macro_accuracy": 0.83154296875, "eval/malformed_rate": 0.0, "eval/n_eval": 512.0, "eval/overall/acc_on_CONSISTENT": 0.8325358851674641, "eval/overall/acc_on_INCONSISTENT": 0.7887788778877888, "eval/overall/accuracy": 0.806640625, "eval/overall/f1_INC": 0.82842287694974, "eval/overall/precision_INC": 0.8722627737226277, "eval/overall/recall_INC": 0.7887788778877888, "eval/overall_exact_match": 0.576171875, "eval_label": "step_100", "step": 100 }, { "epoch": 0.09407337723424271, "grad_norm": 0.10156096518039703, "learning_rate": 9.350145489815713e-05, "loss": 0.0248, "step": 100 }, { "epoch": 0.11288805268109126, "grad_norm": 0.15984299778938293, "learning_rate": 9.15615906886518e-05, "loss": 0.0241, "step": 120 }, { "epoch": 0.1317027281279398, "grad_norm": 0.14268864691257477, "learning_rate": 8.962172647914647e-05, "loss": 0.0222, "step": 140 }, { "epoch": 0.15051740357478832, "grad_norm": 0.09480800479650497, "learning_rate": 8.768186226964112e-05, "loss": 0.022, "step": 160 }, { "epoch": 0.16933207902163688, "grad_norm": 0.09908359497785568, "learning_rate": 8.57419980601358e-05, "loss": 0.0205, "step": 180 }, { "epoch": 0.18814675446848542, "eval/E1/acc_on_CONSISTENT": 0.9236111111111112, "eval/E1/acc_on_INCONSISTENT": 0.4125, "eval/E1/accuracy": 0.84375, "eval/E1/f1_INC": 0.4520547945205479, "eval/E1/precision_INC": 0.5, "eval/E1/recall_INC": 0.4125, "eval/E2/acc_on_CONSISTENT": 0.945054945054945, "eval/E2/acc_on_INCONSISTENT": 0.9391891891891891, "eval/E2/accuracy": 0.943359375, "eval/E2/f1_INC": 0.9055374592833876, "eval/E2/precision_INC": 0.8742138364779874, "eval/E2/recall_INC": 0.9391891891891891, "eval/E3/acc_on_CONSISTENT": 0.8703703703703703, "eval/E3/acc_on_INCONSISTENT": 0.8191489361702128, "eval/E3/accuracy": 0.8515625, "eval/E3/f1_INC": 0.8020833333333333, "eval/E3/precision_INC": 0.7857142857142857, "eval/E3/recall_INC": 0.8191489361702128, "eval/E4/acc_on_CONSISTENT": 0.8411214953271028, "eval/E4/acc_on_INCONSISTENT": 0.7905759162303665, "eval/E4/accuracy": 0.822265625, "eval/E4/f1_INC": 0.7684478371501273, "eval/E4/precision_INC": 0.7475247524752475, "eval/E4/recall_INC": 0.7905759162303665, "eval/edge_macro_accuracy": 0.865234375, "eval/malformed_rate": 0.0, "eval/n_eval": 512.0, "eval/overall/acc_on_CONSISTENT": 0.7559808612440191, "eval/overall/acc_on_INCONSISTENT": 0.8712871287128713, "eval/overall/accuracy": 0.82421875, "eval/overall/f1_INC": 0.854368932038835, "eval/overall/precision_INC": 0.8380952380952381, "eval/overall/recall_INC": 0.8712871287128713, "eval/overall_exact_match": 0.63671875, "eval_label": "step_200", "step": 200 }, { "epoch": 0.18814675446848542, "grad_norm": 0.1302443891763687, "learning_rate": 8.380213385063046e-05, "loss": 0.0211, "step": 200 }, { "epoch": 0.20696142991533395, "grad_norm": 0.14304408431053162, "learning_rate": 8.186226964112513e-05, "loss": 0.0187, "step": 220 }, { "epoch": 0.2257761053621825, "grad_norm": 0.20394913852214813, "learning_rate": 7.99224054316198e-05, "loss": 0.0208, "step": 240 }, { "epoch": 0.24459078080903104, "grad_norm": 0.11161988973617554, "learning_rate": 7.798254122211446e-05, "loss": 0.019, "step": 260 }, { "epoch": 0.2634054562558796, "grad_norm": 0.11904545873403549, "learning_rate": 7.604267701260912e-05, "loss": 0.0204, "step": 280 }, { "epoch": 0.28222013170272814, "eval/E1/acc_on_CONSISTENT": 0.9652777777777778, "eval/E1/acc_on_INCONSISTENT": 0.3375, "eval/E1/accuracy": 0.8671875, "eval/E1/f1_INC": 0.4426229508196722, "eval/E1/precision_INC": 0.6428571428571429, "eval/E1/recall_INC": 0.3375, "eval/E2/acc_on_CONSISTENT": 0.967032967032967, "eval/E2/acc_on_INCONSISTENT": 0.9324324324324325, "eval/E2/accuracy": 0.95703125, "eval/E2/f1_INC": 0.9261744966442953, "eval/E2/precision_INC": 0.92, "eval/E2/recall_INC": 0.9324324324324325, "eval/E3/acc_on_CONSISTENT": 0.9382716049382716, "eval/E3/acc_on_INCONSISTENT": 0.8138297872340425, "eval/E3/accuracy": 0.892578125, "eval/E3/f1_INC": 0.8476454293628809, "eval/E3/precision_INC": 0.884393063583815, "eval/E3/recall_INC": 0.8138297872340425, "eval/E4/acc_on_CONSISTENT": 0.8940809968847352, "eval/E4/acc_on_INCONSISTENT": 0.8010471204188482, "eval/E4/accuracy": 0.859375, "eval/E4/f1_INC": 0.8095238095238095, "eval/E4/precision_INC": 0.8181818181818182, "eval/E4/recall_INC": 0.8010471204188482, "eval/edge_macro_accuracy": 0.89404296875, "eval/malformed_rate": 0.0, "eval/n_eval": 512.0, "eval/overall/acc_on_CONSISTENT": 0.8851674641148325, "eval/overall/acc_on_INCONSISTENT": 0.8448844884488449, "eval/overall/accuracy": 0.861328125, "eval/overall/f1_INC": 0.8782161234991424, "eval/overall/precision_INC": 0.9142857142857143, "eval/overall/recall_INC": 0.8448844884488449, "eval/overall_exact_match": 0.697265625, "eval_label": "step_300", "step": 300 }, { "epoch": 0.28222013170272814, "grad_norm": 0.1075235903263092, "learning_rate": 7.410281280310378e-05, "loss": 0.0212, "step": 300 }, { "epoch": 0.30103480714957664, "grad_norm": 0.08106118440628052, "learning_rate": 7.216294859359845e-05, "loss": 0.0177, "step": 320 }, { "epoch": 0.3198494825964252, "grad_norm": 0.07731106132268906, "learning_rate": 7.022308438409312e-05, "loss": 0.0182, "step": 340 }, { "epoch": 0.33866415804327377, "grad_norm": 0.1482355296611786, "learning_rate": 6.828322017458779e-05, "loss": 0.0178, "step": 360 }, { "epoch": 0.35747883349012227, "grad_norm": 0.07897721230983734, "learning_rate": 6.634335596508244e-05, "loss": 0.018, "step": 380 }, { "epoch": 0.37629350893697083, "eval/E1/acc_on_CONSISTENT": 0.9722222222222222, "eval/E1/acc_on_INCONSISTENT": 0.45, "eval/E1/accuracy": 0.890625, "eval/E1/f1_INC": 0.5625000000000001, "eval/E1/precision_INC": 0.75, "eval/E1/recall_INC": 0.45, "eval/E2/acc_on_CONSISTENT": 0.9697802197802198, "eval/E2/acc_on_INCONSISTENT": 0.9324324324324325, "eval/E2/accuracy": 0.958984375, "eval/E2/f1_INC": 0.9292929292929293, "eval/E2/precision_INC": 0.9261744966442953, "eval/E2/recall_INC": 0.9324324324324325, "eval/E3/acc_on_CONSISTENT": 0.9598765432098766, "eval/E3/acc_on_INCONSISTENT": 0.8138297872340425, "eval/E3/accuracy": 0.90625, "eval/E3/f1_INC": 0.8644067796610171, "eval/E3/precision_INC": 0.9216867469879518, "eval/E3/recall_INC": 0.8138297872340425, "eval/E4/acc_on_CONSISTENT": 0.9096573208722741, "eval/E4/acc_on_INCONSISTENT": 0.806282722513089, "eval/E4/accuracy": 0.87109375, "eval/E4/f1_INC": 0.823529411764706, "eval/E4/precision_INC": 0.8415300546448088, "eval/E4/recall_INC": 0.806282722513089, "eval/edge_macro_accuracy": 0.90673828125, "eval/malformed_rate": 0.0, "eval/n_eval": 512.0, "eval/overall/acc_on_CONSISTENT": 0.9282296650717703, "eval/overall/acc_on_INCONSISTENT": 0.8481848184818482, "eval/overall/accuracy": 0.880859375, "eval/overall/f1_INC": 0.8939130434782608, "eval/overall/precision_INC": 0.9448529411764706, "eval/overall/recall_INC": 0.8481848184818482, "eval/overall_exact_match": 0.728515625, "eval_label": "step_400", "step": 400 }, { "epoch": 0.37629350893697083, "grad_norm": 0.1120094284415245, "learning_rate": 6.440349175557712e-05, "loss": 0.0168, "step": 400 }, { "epoch": 0.3951081843838194, "grad_norm": 0.16071178019046783, "learning_rate": 6.246362754607178e-05, "loss": 0.016, "step": 420 }, { "epoch": 0.4139228598306679, "grad_norm": 0.10165177285671234, "learning_rate": 6.0523763336566445e-05, "loss": 0.0159, "step": 440 }, { "epoch": 0.43273753527751646, "grad_norm": 0.08946932107210159, "learning_rate": 5.8583899127061106e-05, "loss": 0.0167, "step": 460 }, { "epoch": 0.451552210724365, "grad_norm": 0.07830841839313507, "learning_rate": 5.664403491755578e-05, "loss": 0.016, "step": 480 }, { "epoch": 0.4703668861712135, "eval/E1/acc_on_CONSISTENT": 0.9444444444444444, "eval/E1/acc_on_INCONSISTENT": 0.575, "eval/E1/accuracy": 0.88671875, "eval/E1/f1_INC": 0.6133333333333333, "eval/E1/precision_INC": 0.6571428571428571, "eval/E1/recall_INC": 0.575, "eval/E2/acc_on_CONSISTENT": 0.9285714285714286, "eval/E2/acc_on_INCONSISTENT": 0.9594594594594594, "eval/E2/accuracy": 0.9375, "eval/E2/f1_INC": 0.8987341772151899, "eval/E2/precision_INC": 0.8452380952380952, "eval/E2/recall_INC": 0.9594594594594594, "eval/E3/acc_on_CONSISTENT": 0.8919753086419753, "eval/E3/acc_on_INCONSISTENT": 0.8882978723404256, "eval/E3/accuracy": 0.890625, "eval/E3/f1_INC": 0.8564102564102564, "eval/E3/precision_INC": 0.8267326732673267, "eval/E3/recall_INC": 0.8882978723404256, "eval/E4/acc_on_CONSISTENT": 0.8847352024922118, "eval/E4/acc_on_INCONSISTENT": 0.8638743455497382, "eval/E4/accuracy": 0.876953125, "eval/E4/f1_INC": 0.8396946564885497, "eval/E4/precision_INC": 0.8168316831683168, "eval/E4/recall_INC": 0.8638743455497382, "eval/edge_macro_accuracy": 0.89794921875, "eval/malformed_rate": 0.0, "eval/n_eval": 512.0, "eval/overall/acc_on_CONSISTENT": 0.8325358851674641, "eval/overall/acc_on_INCONSISTENT": 0.8976897689768977, "eval/overall/accuracy": 0.87109375, "eval/overall/f1_INC": 0.8918032786885246, "eval/overall/precision_INC": 0.8859934853420195, "eval/overall/recall_INC": 0.8976897689768977, "eval/overall_exact_match": 0.71484375, "eval_label": "step_500", "step": 500 }, { "epoch": 0.4703668861712135, "grad_norm": 0.23986610770225525, "learning_rate": 5.470417070805044e-05, "loss": 0.0168, "step": 500 }, { "epoch": 0.4891815616180621, "grad_norm": 0.07184334099292755, "learning_rate": 5.27643064985451e-05, "loss": 0.0169, "step": 520 }, { "epoch": 0.5079962370649106, "grad_norm": 0.0486169196665287, "learning_rate": 5.0824442289039763e-05, "loss": 0.0148, "step": 540 }, { "epoch": 0.5268109125117592, "grad_norm": 0.11095824092626572, "learning_rate": 4.888457807953444e-05, "loss": 0.0173, "step": 560 }, { "epoch": 0.5456255879586077, "grad_norm": 0.11410392075777054, "learning_rate": 4.69447138700291e-05, "loss": 0.0149, "step": 580 }, { "epoch": 0.5644402634054563, "eval/E1/acc_on_CONSISTENT": 0.9722222222222222, "eval/E1/acc_on_INCONSISTENT": 0.4375, "eval/E1/accuracy": 0.888671875, "eval/E1/f1_INC": 0.5511811023622046, "eval/E1/precision_INC": 0.7446808510638298, "eval/E1/recall_INC": 0.4375, "eval/E2/acc_on_CONSISTENT": 0.978021978021978, "eval/E2/acc_on_INCONSISTENT": 0.9391891891891891, "eval/E2/accuracy": 0.966796875, "eval/E2/f1_INC": 0.9423728813559321, "eval/E2/precision_INC": 0.9455782312925171, "eval/E2/recall_INC": 0.9391891891891891, "eval/E3/acc_on_CONSISTENT": 0.9691358024691358, "eval/E3/acc_on_INCONSISTENT": 0.75, "eval/E3/accuracy": 0.888671875, "eval/E3/f1_INC": 0.831858407079646, "eval/E3/precision_INC": 0.9337748344370861, "eval/E3/recall_INC": 0.75, "eval/E4/acc_on_CONSISTENT": 0.956386292834891, "eval/E4/acc_on_INCONSISTENT": 0.7801047120418848, "eval/E4/accuracy": 0.890625, "eval/E4/f1_INC": 0.8418079096045198, "eval/E4/precision_INC": 0.9141104294478528, "eval/E4/recall_INC": 0.7801047120418848, "eval/edge_macro_accuracy": 0.90869140625, "eval/malformed_rate": 0.0, "eval/n_eval": 512.0, "eval/overall/acc_on_CONSISTENT": 0.9473684210526315, "eval/overall/acc_on_INCONSISTENT": 0.8118811881188119, "eval/overall/accuracy": 0.8671875, "eval/overall/f1_INC": 0.8785714285714287, "eval/overall/precision_INC": 0.9571984435797666, "eval/overall/recall_INC": 0.8118811881188119, "eval/overall_exact_match": 0.728515625, "eval_label": "step_600", "step": 600 }, { "epoch": 0.5644402634054563, "grad_norm": 0.13476960361003876, "learning_rate": 4.500484966052377e-05, "loss": 0.0159, "step": 600 }, { "epoch": 0.5832549388523048, "grad_norm": 0.22448623180389404, "learning_rate": 4.306498545101843e-05, "loss": 0.0158, "step": 620 }, { "epoch": 0.6020696142991533, "grad_norm": 0.3091525435447693, "learning_rate": 4.1125121241513096e-05, "loss": 0.0163, "step": 640 }, { "epoch": 0.6208842897460018, "grad_norm": 0.06753229349851608, "learning_rate": 3.9185257032007764e-05, "loss": 0.0153, "step": 660 }, { "epoch": 0.6396989651928504, "grad_norm": 0.16454404592514038, "learning_rate": 3.724539282250243e-05, "loss": 0.0137, "step": 680 }, { "epoch": 0.658513640639699, "eval/E1/acc_on_CONSISTENT": 0.8958333333333334, "eval/E1/acc_on_INCONSISTENT": 0.7, "eval/E1/accuracy": 0.865234375, "eval/E1/f1_INC": 0.6187845303867403, "eval/E1/precision_INC": 0.5544554455445545, "eval/E1/recall_INC": 0.7, "eval/E2/acc_on_CONSISTENT": 0.9835164835164835, "eval/E2/acc_on_INCONSISTENT": 0.9391891891891891, "eval/E2/accuracy": 0.970703125, "eval/E2/f1_INC": 0.9488054607508533, "eval/E2/precision_INC": 0.9586206896551724, "eval/E2/recall_INC": 0.9391891891891891, "eval/E3/acc_on_CONSISTENT": 0.9444444444444444, "eval/E3/acc_on_INCONSISTENT": 0.8563829787234043, "eval/E3/accuracy": 0.912109375, "eval/E3/f1_INC": 0.8773841961852861, "eval/E3/precision_INC": 0.8994413407821229, "eval/E3/recall_INC": 0.8563829787234043, "eval/E4/acc_on_CONSISTENT": 0.9034267912772586, "eval/E4/acc_on_INCONSISTENT": 0.8691099476439791, "eval/E4/accuracy": 0.890625, "eval/E4/f1_INC": 0.8556701030927836, "eval/E4/precision_INC": 0.8426395939086294, "eval/E4/recall_INC": 0.8691099476439791, "eval/edge_macro_accuracy": 0.90966796875, "eval/malformed_rate": 0.0, "eval/n_eval": 512.0, "eval/overall/acc_on_CONSISTENT": 0.8851674641148325, "eval/overall/acc_on_INCONSISTENT": 0.8943894389438944, "eval/overall/accuracy": 0.890625, "eval/overall/f1_INC": 0.9063545150501673, "eval/overall/precision_INC": 0.9186440677966101, "eval/overall/recall_INC": 0.8943894389438944, "eval/overall_exact_match": 0.736328125, "eval_label": "step_700", "step": 700 }, { "epoch": 0.658513640639699, "grad_norm": 0.10377257317304611, "learning_rate": 3.530552861299709e-05, "loss": 0.0159, "step": 700 }, { "epoch": 0.6773283160865475, "grad_norm": 0.08269070833921432, "learning_rate": 3.336566440349176e-05, "loss": 0.0154, "step": 720 }, { "epoch": 0.6961429915333961, "grad_norm": 0.13774652779102325, "learning_rate": 3.142580019398642e-05, "loss": 0.0164, "step": 740 }, { "epoch": 0.7149576669802445, "grad_norm": 0.0529085136950016, "learning_rate": 2.948593598448109e-05, "loss": 0.0289, "step": 760 }, { "epoch": 0.7337723424270931, "grad_norm": 0.07344073057174683, "learning_rate": 2.754607177497575e-05, "loss": 0.015, "step": 780 }, { "epoch": 0.7525870178739417, "eval/E1/acc_on_CONSISTENT": 0.9722222222222222, "eval/E1/acc_on_INCONSISTENT": 0.45, "eval/E1/accuracy": 0.890625, "eval/E1/f1_INC": 0.5625000000000001, "eval/E1/precision_INC": 0.75, "eval/E1/recall_INC": 0.45, "eval/E2/acc_on_CONSISTENT": 0.9587912087912088, "eval/E2/acc_on_INCONSISTENT": 0.9459459459459459, "eval/E2/accuracy": 0.955078125, "eval/E2/f1_INC": 0.9240924092409241, "eval/E2/precision_INC": 0.9032258064516129, "eval/E2/recall_INC": 0.9459459459459459, "eval/E3/acc_on_CONSISTENT": 0.9598765432098766, "eval/E3/acc_on_INCONSISTENT": 0.8404255319148937, "eval/E3/accuracy": 0.916015625, "eval/E3/f1_INC": 0.8802228412256267, "eval/E3/precision_INC": 0.9239766081871345, "eval/E3/recall_INC": 0.8404255319148937, "eval/E4/acc_on_CONSISTENT": 0.9345794392523364, "eval/E4/acc_on_INCONSISTENT": 0.837696335078534, "eval/E4/accuracy": 0.8984375, "eval/E4/f1_INC": 0.8602150537634408, "eval/E4/precision_INC": 0.8839779005524862, "eval/E4/recall_INC": 0.837696335078534, "eval/edge_macro_accuracy": 0.9150390625, "eval/malformed_rate": 0.0, "eval/n_eval": 512.0, "eval/overall/acc_on_CONSISTENT": 0.9282296650717703, "eval/overall/acc_on_INCONSISTENT": 0.8547854785478548, "eval/overall/accuracy": 0.884765625, "eval/overall/f1_INC": 0.8977469670710573, "eval/overall/precision_INC": 0.9452554744525548, "eval/overall/recall_INC": 0.8547854785478548, "eval/overall_exact_match": 0.751953125, "eval_label": "step_800", "step": 800 }, { "epoch": 0.7525870178739417, "grad_norm": 0.07503994554281235, "learning_rate": 2.560620756547042e-05, "loss": 0.0146, "step": 800 }, { "epoch": 0.7714016933207902, "grad_norm": 0.05603089556097984, "learning_rate": 2.3666343355965083e-05, "loss": 0.0142, "step": 820 }, { "epoch": 0.7902163687676388, "grad_norm": 0.09725795686244965, "learning_rate": 2.172647914645975e-05, "loss": 0.0151, "step": 840 }, { "epoch": 0.8090310442144873, "grad_norm": 0.13120990991592407, "learning_rate": 1.9786614936954415e-05, "loss": 0.0136, "step": 860 }, { "epoch": 0.8278457196613358, "grad_norm": 0.09627928584814072, "learning_rate": 1.784675072744908e-05, "loss": 0.0121, "step": 880 }, { "epoch": 0.8466603951081844, "eval/E1/acc_on_CONSISTENT": 0.9467592592592593, "eval/E1/acc_on_INCONSISTENT": 0.575, "eval/E1/accuracy": 0.888671875, "eval/E1/f1_INC": 0.6174496644295301, "eval/E1/precision_INC": 0.6666666666666666, "eval/E1/recall_INC": 0.575, "eval/E2/acc_on_CONSISTENT": 0.9752747252747253, "eval/E2/acc_on_INCONSISTENT": 0.9391891891891891, "eval/E2/accuracy": 0.96484375, "eval/E2/f1_INC": 0.9391891891891891, "eval/E2/precision_INC": 0.9391891891891891, "eval/E2/recall_INC": 0.9391891891891891, "eval/E3/acc_on_CONSISTENT": 0.941358024691358, "eval/E3/acc_on_INCONSISTENT": 0.8297872340425532, "eval/E3/accuracy": 0.900390625, "eval/E3/f1_INC": 0.859504132231405, "eval/E3/precision_INC": 0.8914285714285715, "eval/E3/recall_INC": 0.8297872340425532, "eval/E4/acc_on_CONSISTENT": 0.9127725856697819, "eval/E4/acc_on_INCONSISTENT": 0.8638743455497382, "eval/E4/accuracy": 0.89453125, "eval/E4/f1_INC": 0.859375, "eval/E4/precision_INC": 0.8549222797927462, "eval/E4/recall_INC": 0.8638743455497382, "eval/edge_macro_accuracy": 0.912109375, "eval/malformed_rate": 0.0, "eval/n_eval": 512.0, "eval/overall/acc_on_CONSISTENT": 0.8899521531100478, "eval/overall/acc_on_INCONSISTENT": 0.8877887788778878, "eval/overall/accuracy": 0.888671875, "eval/overall/f1_INC": 0.9042016806722689, "eval/overall/precision_INC": 0.9212328767123288, "eval/overall/recall_INC": 0.8877887788778878, "eval/overall_exact_match": 0.748046875, "eval_label": "step_900", "step": 900 }, { "epoch": 0.8466603951081844, "grad_norm": 0.07019995152950287, "learning_rate": 1.5906886517943744e-05, "loss": 0.0151, "step": 900 } ], "logging_steps": 20, "max_steps": 1063, "num_input_tokens_seen": 0, "num_train_epochs": 1, "save_steps": 300, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 1.3109687011550167e+18, "train_batch_size": 4, "trial_name": null, "trial_params": null }