New-Edge-Critic / trainer_state.json
mjf-su's picture
Upload trainer_state.json with huggingface_hub
77d98d6 verified
Raw
History Blame Contribute Delete
122 kB
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.9998117824204781,
"eval_steps": 531,
"global_step": 5312,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0,
"eval_E1/acc_on_CONSISTENT": 0.7284768211920529,
"eval_E1/acc_on_INCONSISTENT": 0.6122448979591837,
"eval_E1/accuracy": 0.7,
"eval_E1/balanced_accuracy": 0.6703608595756183,
"eval_E1/f1_INC": 0.4999999999999999,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.4225352112676056,
"eval_E1/recall_INC": 0.6122448979591837,
"eval_E2/acc_on_CONSISTENT": 0.9507042253521126,
"eval_E2/acc_on_INCONSISTENT": 0.6724137931034483,
"eval_E2/accuracy": 0.87,
"eval_E2/balanced_accuracy": 0.8115590092277805,
"eval_E2/f1_INC": 0.75,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.8478260869565217,
"eval_E2/recall_INC": 0.6724137931034483,
"eval_E3/acc_on_CONSISTENT": 1.0,
"eval_E3/acc_on_INCONSISTENT": 0.11428571428571428,
"eval_E3/accuracy": 0.69,
"eval_E3/balanced_accuracy": 0.5571428571428572,
"eval_E3/f1_INC": 0.20512820512820512,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 1.0,
"eval_E3/recall_INC": 0.11428571428571428,
"eval_E4/acc_on_CONSISTENT": 1.0,
"eval_E4/acc_on_INCONSISTENT": 0.09411764705882353,
"eval_E4/accuracy": 0.615,
"eval_E4/balanced_accuracy": 0.5470588235294118,
"eval_E4/f1_INC": 0.17204301075268816,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 1.0,
"eval_E4/recall_INC": 0.09411764705882353,
"eval_edge_macro_accuracy": 0.721,
"eval_edge_macro_balanced_accuracy": 0.6421245947954184,
"eval_edge_macro_f1_INC": 0.41293424317617866,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.8372093023255814,
"eval_overall/acc_on_INCONSISTENT": 0.6624203821656051,
"eval_overall/accuracy": 0.7,
"eval_overall/balanced_accuracy": 0.7498148422455932,
"eval_overall/f1_INC": 0.7761194029850745,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.9369369369369369,
"eval_overall/recall_INC": 0.6624203821656051,
"eval_overall_exact_match": 0.275,
"eval_scene/acc_on_CONSISTENT": 0.9259259259259259,
"eval_scene/acc_on_INCONSISTENT": 0.3230769230769231,
"eval_scene/accuracy": 0.73,
"eval_scene/balanced_accuracy": 0.6245014245014245,
"eval_scene/f1_INC": 0.4375,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.6774193548387096,
"eval_scene/recall_INC": 0.3230769230769231,
"step": 0
},
{
"epoch": 0.0018821757952192735,
"grad_norm": 2.9527316093444824,
"learning_rate": 2.821316614420063e-06,
"loss": 0.2619,
"step": 10
},
{
"epoch": 0.003764351590438547,
"grad_norm": 2.514927625656128,
"learning_rate": 5.956112852664577e-06,
"loss": 0.1351,
"step": 20
},
{
"epoch": 0.00564652738565782,
"grad_norm": 0.3812353312969208,
"learning_rate": 9.090909090909091e-06,
"loss": 0.0615,
"step": 30
},
{
"epoch": 0.007528703180877094,
"grad_norm": 0.41659271717071533,
"learning_rate": 1.2225705329153606e-05,
"loss": 0.0457,
"step": 40
},
{
"epoch": 0.009410878976096368,
"grad_norm": 0.35191452503204346,
"learning_rate": 1.536050156739812e-05,
"loss": 0.047,
"step": 50
},
{
"epoch": 0.01129305477131564,
"grad_norm": 0.37843215465545654,
"learning_rate": 1.8495297805642632e-05,
"loss": 0.0463,
"step": 60
},
{
"epoch": 0.013175230566534914,
"grad_norm": 0.4428830146789551,
"learning_rate": 2.1630094043887147e-05,
"loss": 0.0455,
"step": 70
},
{
"epoch": 0.015057406361754188,
"grad_norm": 0.3365268111228943,
"learning_rate": 2.4764890282131662e-05,
"loss": 0.0476,
"step": 80
},
{
"epoch": 0.01693958215697346,
"grad_norm": 0.231501042842865,
"learning_rate": 2.7899686520376177e-05,
"loss": 0.0432,
"step": 90
},
{
"epoch": 0.018821757952192736,
"grad_norm": 0.1805897206068039,
"learning_rate": 3.103448275862069e-05,
"loss": 0.0435,
"step": 100
},
{
"epoch": 0.020703933747412008,
"grad_norm": 0.18661439418792725,
"learning_rate": 3.4169278996865206e-05,
"loss": 0.0444,
"step": 110
},
{
"epoch": 0.02258610954263128,
"grad_norm": 0.3476637005805969,
"learning_rate": 3.730407523510972e-05,
"loss": 0.0453,
"step": 120
},
{
"epoch": 0.024468285337850556,
"grad_norm": 0.1493861973285675,
"learning_rate": 4.0438871473354236e-05,
"loss": 0.0453,
"step": 130
},
{
"epoch": 0.026350461133069828,
"grad_norm": 0.22454732656478882,
"learning_rate": 4.357366771159875e-05,
"loss": 0.0399,
"step": 140
},
{
"epoch": 0.028232636928289104,
"grad_norm": 0.13001784682273865,
"learning_rate": 4.670846394984326e-05,
"loss": 0.04,
"step": 150
},
{
"epoch": 0.030114812723508376,
"grad_norm": 0.18267126381397247,
"learning_rate": 4.9843260188087774e-05,
"loss": 0.04,
"step": 160
},
{
"epoch": 0.03199698851872765,
"grad_norm": 0.18140390515327454,
"learning_rate": 5.297805642633229e-05,
"loss": 0.0434,
"step": 170
},
{
"epoch": 0.03387916431394692,
"grad_norm": 0.21444028615951538,
"learning_rate": 5.611285266457681e-05,
"loss": 0.0365,
"step": 180
},
{
"epoch": 0.0357613401091662,
"grad_norm": 0.16569875180721283,
"learning_rate": 5.924764890282132e-05,
"loss": 0.0447,
"step": 190
},
{
"epoch": 0.03764351590438547,
"grad_norm": 0.3612789511680603,
"learning_rate": 6.238244514106584e-05,
"loss": 0.0403,
"step": 200
},
{
"epoch": 0.039525691699604744,
"grad_norm": 0.170634463429451,
"learning_rate": 6.551724137931034e-05,
"loss": 0.0402,
"step": 210
},
{
"epoch": 0.041407867494824016,
"grad_norm": 0.155662402510643,
"learning_rate": 6.865203761755487e-05,
"loss": 0.0422,
"step": 220
},
{
"epoch": 0.04329004329004329,
"grad_norm": 0.1258857697248459,
"learning_rate": 7.178683385579937e-05,
"loss": 0.0426,
"step": 230
},
{
"epoch": 0.04517221908526256,
"grad_norm": 0.16679541766643524,
"learning_rate": 7.49216300940439e-05,
"loss": 0.0396,
"step": 240
},
{
"epoch": 0.04705439488048184,
"grad_norm": 0.13958600163459778,
"learning_rate": 7.80564263322884e-05,
"loss": 0.0381,
"step": 250
},
{
"epoch": 0.04893657067570111,
"grad_norm": 0.2316679060459137,
"learning_rate": 8.119122257053292e-05,
"loss": 0.042,
"step": 260
},
{
"epoch": 0.050818746470920384,
"grad_norm": 0.16344308853149414,
"learning_rate": 8.432601880877743e-05,
"loss": 0.0392,
"step": 270
},
{
"epoch": 0.052700922266139656,
"grad_norm": 0.18365642428398132,
"learning_rate": 8.746081504702195e-05,
"loss": 0.0391,
"step": 280
},
{
"epoch": 0.05458309806135893,
"grad_norm": 0.24187475442886353,
"learning_rate": 9.059561128526646e-05,
"loss": 0.0384,
"step": 290
},
{
"epoch": 0.05646527385657821,
"grad_norm": 0.10886389017105103,
"learning_rate": 9.373040752351098e-05,
"loss": 0.0448,
"step": 300
},
{
"epoch": 0.05834744965179748,
"grad_norm": 0.24063026905059814,
"learning_rate": 9.686520376175549e-05,
"loss": 0.0403,
"step": 310
},
{
"epoch": 0.06022962544701675,
"grad_norm": 0.11817719042301178,
"learning_rate": 0.0001,
"loss": 0.0439,
"step": 320
},
{
"epoch": 0.062111801242236024,
"grad_norm": 0.10869932174682617,
"learning_rate": 9.990297855826138e-05,
"loss": 0.0405,
"step": 330
},
{
"epoch": 0.0639939770374553,
"grad_norm": 0.12196257710456848,
"learning_rate": 9.980595711652275e-05,
"loss": 0.0418,
"step": 340
},
{
"epoch": 0.06587615283267458,
"grad_norm": 0.14207176864147186,
"learning_rate": 9.970893567478413e-05,
"loss": 0.0421,
"step": 350
},
{
"epoch": 0.06775832862789384,
"grad_norm": 0.1136246919631958,
"learning_rate": 9.961191423304552e-05,
"loss": 0.037,
"step": 360
},
{
"epoch": 0.06964050442311312,
"grad_norm": 0.17720963060855865,
"learning_rate": 9.951489279130688e-05,
"loss": 0.0354,
"step": 370
},
{
"epoch": 0.0715226802183324,
"grad_norm": 0.11347354203462601,
"learning_rate": 9.941787134956826e-05,
"loss": 0.0397,
"step": 380
},
{
"epoch": 0.07340485601355166,
"grad_norm": 0.13800372183322906,
"learning_rate": 9.932084990782964e-05,
"loss": 0.0356,
"step": 390
},
{
"epoch": 0.07528703180877094,
"grad_norm": 0.11324790865182877,
"learning_rate": 9.922382846609101e-05,
"loss": 0.0351,
"step": 400
},
{
"epoch": 0.07716920760399021,
"grad_norm": 0.09300073236227036,
"learning_rate": 9.912680702435239e-05,
"loss": 0.0369,
"step": 410
},
{
"epoch": 0.07905138339920949,
"grad_norm": 0.17908748984336853,
"learning_rate": 9.902978558261376e-05,
"loss": 0.0434,
"step": 420
},
{
"epoch": 0.08093355919442875,
"grad_norm": 0.152435764670372,
"learning_rate": 9.893276414087514e-05,
"loss": 0.0342,
"step": 430
},
{
"epoch": 0.08281573498964803,
"grad_norm": 0.12728841602802277,
"learning_rate": 9.883574269913651e-05,
"loss": 0.0396,
"step": 440
},
{
"epoch": 0.08469791078486731,
"grad_norm": 0.12795382738113403,
"learning_rate": 9.87387212573979e-05,
"loss": 0.0388,
"step": 450
},
{
"epoch": 0.08658008658008658,
"grad_norm": 0.2675169110298157,
"learning_rate": 9.864169981565926e-05,
"loss": 0.037,
"step": 460
},
{
"epoch": 0.08846226237530586,
"grad_norm": 0.07247938960790634,
"learning_rate": 9.854467837392065e-05,
"loss": 0.0442,
"step": 470
},
{
"epoch": 0.09034443817052512,
"grad_norm": 0.2071535289287567,
"learning_rate": 9.844765693218202e-05,
"loss": 0.0364,
"step": 480
},
{
"epoch": 0.0922266139657444,
"grad_norm": 0.12736307084560394,
"learning_rate": 9.835063549044338e-05,
"loss": 0.0356,
"step": 490
},
{
"epoch": 0.09410878976096368,
"grad_norm": 0.15026968717575073,
"learning_rate": 9.825361404870477e-05,
"loss": 0.0368,
"step": 500
},
{
"epoch": 0.09599096555618294,
"grad_norm": 0.11605150252580643,
"learning_rate": 9.815659260696614e-05,
"loss": 0.0341,
"step": 510
},
{
"epoch": 0.09787314135140222,
"grad_norm": 0.09585551172494888,
"learning_rate": 9.805957116522752e-05,
"loss": 0.0386,
"step": 520
},
{
"epoch": 0.09975531714662149,
"grad_norm": 0.07335048168897629,
"learning_rate": 9.796254972348889e-05,
"loss": 0.038,
"step": 530
},
{
"epoch": 0.09994353472614342,
"eval_E1/acc_on_CONSISTENT": 0.7152317880794702,
"eval_E1/acc_on_INCONSISTENT": 0.673469387755102,
"eval_E1/accuracy": 0.705,
"eval_E1/balanced_accuracy": 0.6943505879172861,
"eval_E1/f1_INC": 0.528,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.4342105263157895,
"eval_E1/recall_INC": 0.673469387755102,
"eval_E2/acc_on_CONSISTENT": 0.9577464788732394,
"eval_E2/acc_on_INCONSISTENT": 0.9482758620689655,
"eval_E2/accuracy": 0.955,
"eval_E2/balanced_accuracy": 0.9530111704711024,
"eval_E2/f1_INC": 0.9243697478991596,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.9016393442622951,
"eval_E2/recall_INC": 0.9482758620689655,
"eval_E3/acc_on_CONSISTENT": 0.9538461538461539,
"eval_E3/acc_on_INCONSISTENT": 0.5857142857142857,
"eval_E3/accuracy": 0.825,
"eval_E3/balanced_accuracy": 0.7697802197802198,
"eval_E3/f1_INC": 0.7008547008547009,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 0.8723404255319149,
"eval_E3/recall_INC": 0.5857142857142857,
"eval_E4/acc_on_CONSISTENT": 0.9652173913043478,
"eval_E4/acc_on_INCONSISTENT": 0.7411764705882353,
"eval_E4/accuracy": 0.87,
"eval_E4/balanced_accuracy": 0.8531969309462916,
"eval_E4/f1_INC": 0.8289473684210527,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 0.9402985074626866,
"eval_E4/recall_INC": 0.7411764705882353,
"eval_edge_macro_accuracy": 0.796,
"eval_edge_macro_balanced_accuracy": 0.7945236222788205,
"eval_edge_macro_f1_INC": 0.7195112865119058,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.32558139534883723,
"eval_overall/acc_on_INCONSISTENT": 0.9681528662420382,
"eval_overall/accuracy": 0.83,
"eval_overall/balanced_accuracy": 0.6468671307954377,
"eval_overall/f1_INC": 0.8994082840236687,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.8397790055248618,
"eval_overall/recall_INC": 0.9681528662420382,
"eval_overall_exact_match": 0.325,
"eval_scene/acc_on_CONSISTENT": 0.48148148148148145,
"eval_scene/acc_on_INCONSISTENT": 0.9230769230769231,
"eval_scene/accuracy": 0.625,
"eval_scene/balanced_accuracy": 0.7022792022792023,
"eval_scene/f1_INC": 0.6153846153846155,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.46153846153846156,
"eval_scene/recall_INC": 0.9230769230769231,
"step": 531
},
{
"epoch": 0.10163749294184077,
"grad_norm": 0.08944286406040192,
"learning_rate": 9.786552828175028e-05,
"loss": 0.0385,
"step": 540
},
{
"epoch": 0.10351966873706005,
"grad_norm": 0.17637431621551514,
"learning_rate": 9.776850684001164e-05,
"loss": 0.0373,
"step": 550
},
{
"epoch": 0.10540184453227931,
"grad_norm": 0.16188663244247437,
"learning_rate": 9.767148539827302e-05,
"loss": 0.037,
"step": 560
},
{
"epoch": 0.10728402032749859,
"grad_norm": 0.107484832406044,
"learning_rate": 9.75744639565344e-05,
"loss": 0.0392,
"step": 570
},
{
"epoch": 0.10916619612271786,
"grad_norm": 0.10150787979364395,
"learning_rate": 9.747744251479576e-05,
"loss": 0.0326,
"step": 580
},
{
"epoch": 0.11104837191793714,
"grad_norm": 0.12644043564796448,
"learning_rate": 9.738042107305715e-05,
"loss": 0.0364,
"step": 590
},
{
"epoch": 0.11293054771315642,
"grad_norm": 0.17111940681934357,
"learning_rate": 9.728339963131853e-05,
"loss": 0.0338,
"step": 600
},
{
"epoch": 0.11481272350837568,
"grad_norm": 0.10448424518108368,
"learning_rate": 9.71863781895799e-05,
"loss": 0.0355,
"step": 610
},
{
"epoch": 0.11669489930359496,
"grad_norm": 0.11952169984579086,
"learning_rate": 9.708935674784127e-05,
"loss": 0.0296,
"step": 620
},
{
"epoch": 0.11857707509881422,
"grad_norm": 0.13310925662517548,
"learning_rate": 9.699233530610265e-05,
"loss": 0.0359,
"step": 630
},
{
"epoch": 0.1204592508940335,
"grad_norm": 0.10829820483922958,
"learning_rate": 9.689531386436404e-05,
"loss": 0.0355,
"step": 640
},
{
"epoch": 0.12234142668925278,
"grad_norm": 0.2412945181131363,
"learning_rate": 9.67982924226254e-05,
"loss": 0.0321,
"step": 650
},
{
"epoch": 0.12422360248447205,
"grad_norm": 0.22749365866184235,
"learning_rate": 9.670127098088679e-05,
"loss": 0.0311,
"step": 660
},
{
"epoch": 0.12610577827969133,
"grad_norm": 0.11110606044530869,
"learning_rate": 9.660424953914816e-05,
"loss": 0.039,
"step": 670
},
{
"epoch": 0.1279879540749106,
"grad_norm": 0.1248956024646759,
"learning_rate": 9.650722809740953e-05,
"loss": 0.0342,
"step": 680
},
{
"epoch": 0.12987012987012986,
"grad_norm": 0.09956880658864975,
"learning_rate": 9.641020665567091e-05,
"loss": 0.0406,
"step": 690
},
{
"epoch": 0.13175230566534915,
"grad_norm": 0.1490594893693924,
"learning_rate": 9.631318521393228e-05,
"loss": 0.0323,
"step": 700
},
{
"epoch": 0.13363448146056842,
"grad_norm": 0.13403694331645966,
"learning_rate": 9.621616377219366e-05,
"loss": 0.0339,
"step": 710
},
{
"epoch": 0.13551665725578768,
"grad_norm": 0.16613461077213287,
"learning_rate": 9.611914233045503e-05,
"loss": 0.0333,
"step": 720
},
{
"epoch": 0.13739883305100697,
"grad_norm": 0.15149520337581635,
"learning_rate": 9.602212088871642e-05,
"loss": 0.0331,
"step": 730
},
{
"epoch": 0.13928100884622624,
"grad_norm": 0.1589352935552597,
"learning_rate": 9.592509944697778e-05,
"loss": 0.0342,
"step": 740
},
{
"epoch": 0.1411631846414455,
"grad_norm": 0.10555554926395416,
"learning_rate": 9.582807800523917e-05,
"loss": 0.0357,
"step": 750
},
{
"epoch": 0.1430453604366648,
"grad_norm": 0.09868290275335312,
"learning_rate": 9.573105656350054e-05,
"loss": 0.0303,
"step": 760
},
{
"epoch": 0.14492753623188406,
"grad_norm": 0.2058541476726532,
"learning_rate": 9.563403512176192e-05,
"loss": 0.0326,
"step": 770
},
{
"epoch": 0.14680971202710333,
"grad_norm": 0.08362213522195816,
"learning_rate": 9.553701368002329e-05,
"loss": 0.0321,
"step": 780
},
{
"epoch": 0.1486918878223226,
"grad_norm": 0.08654452115297318,
"learning_rate": 9.543999223828467e-05,
"loss": 0.0388,
"step": 790
},
{
"epoch": 0.1505740636175419,
"grad_norm": 0.14298202097415924,
"learning_rate": 9.534297079654604e-05,
"loss": 0.036,
"step": 800
},
{
"epoch": 0.15245623941276115,
"grad_norm": 0.09087004512548447,
"learning_rate": 9.524594935480741e-05,
"loss": 0.0335,
"step": 810
},
{
"epoch": 0.15433841520798042,
"grad_norm": 0.17010165750980377,
"learning_rate": 9.51489279130688e-05,
"loss": 0.0332,
"step": 820
},
{
"epoch": 0.1562205910031997,
"grad_norm": 0.3323134183883667,
"learning_rate": 9.505190647133016e-05,
"loss": 0.0332,
"step": 830
},
{
"epoch": 0.15810276679841898,
"grad_norm": 0.1222422793507576,
"learning_rate": 9.495488502959155e-05,
"loss": 0.0275,
"step": 840
},
{
"epoch": 0.15998494259363824,
"grad_norm": 0.0881538912653923,
"learning_rate": 9.485786358785292e-05,
"loss": 0.0399,
"step": 850
},
{
"epoch": 0.1618671183888575,
"grad_norm": 0.14195188879966736,
"learning_rate": 9.47608421461143e-05,
"loss": 0.0383,
"step": 860
},
{
"epoch": 0.1637492941840768,
"grad_norm": 0.10698339343070984,
"learning_rate": 9.466382070437567e-05,
"loss": 0.0319,
"step": 870
},
{
"epoch": 0.16563146997929606,
"grad_norm": 0.12031501531600952,
"learning_rate": 9.456679926263705e-05,
"loss": 0.034,
"step": 880
},
{
"epoch": 0.16751364577451533,
"grad_norm": 0.08794030547142029,
"learning_rate": 9.446977782089842e-05,
"loss": 0.0326,
"step": 890
},
{
"epoch": 0.16939582156973462,
"grad_norm": 0.09387672692537308,
"learning_rate": 9.43727563791598e-05,
"loss": 0.033,
"step": 900
},
{
"epoch": 0.1712779973649539,
"grad_norm": 0.10707499086856842,
"learning_rate": 9.427573493742118e-05,
"loss": 0.0364,
"step": 910
},
{
"epoch": 0.17316017316017315,
"grad_norm": 0.09533264487981796,
"learning_rate": 9.417871349568254e-05,
"loss": 0.0331,
"step": 920
},
{
"epoch": 0.17504234895539245,
"grad_norm": 0.09901942312717438,
"learning_rate": 9.408169205394393e-05,
"loss": 0.0384,
"step": 930
},
{
"epoch": 0.1769245247506117,
"grad_norm": 0.09254682064056396,
"learning_rate": 9.398467061220531e-05,
"loss": 0.0317,
"step": 940
},
{
"epoch": 0.17880670054583098,
"grad_norm": 0.16224852204322815,
"learning_rate": 9.388764917046667e-05,
"loss": 0.0321,
"step": 950
},
{
"epoch": 0.18068887634105024,
"grad_norm": 0.11423856765031815,
"learning_rate": 9.379062772872806e-05,
"loss": 0.0367,
"step": 960
},
{
"epoch": 0.18257105213626953,
"grad_norm": 0.08567370474338531,
"learning_rate": 9.369360628698943e-05,
"loss": 0.0375,
"step": 970
},
{
"epoch": 0.1844532279314888,
"grad_norm": 0.15707381069660187,
"learning_rate": 9.35965848452508e-05,
"loss": 0.0275,
"step": 980
},
{
"epoch": 0.18633540372670807,
"grad_norm": 0.121824711561203,
"learning_rate": 9.349956340351218e-05,
"loss": 0.0346,
"step": 990
},
{
"epoch": 0.18821757952192736,
"grad_norm": 0.09984467923641205,
"learning_rate": 9.340254196177357e-05,
"loss": 0.0296,
"step": 1000
},
{
"epoch": 0.19009975531714662,
"grad_norm": 0.1463792771100998,
"learning_rate": 9.330552052003493e-05,
"loss": 0.0315,
"step": 1010
},
{
"epoch": 0.1919819311123659,
"grad_norm": 0.0836787298321724,
"learning_rate": 9.32084990782963e-05,
"loss": 0.0342,
"step": 1020
},
{
"epoch": 0.19386410690758518,
"grad_norm": 0.08766288310289383,
"learning_rate": 9.311147763655769e-05,
"loss": 0.0371,
"step": 1030
},
{
"epoch": 0.19574628270280445,
"grad_norm": 0.12990380823612213,
"learning_rate": 9.301445619481905e-05,
"loss": 0.032,
"step": 1040
},
{
"epoch": 0.1976284584980237,
"grad_norm": 0.07059783488512039,
"learning_rate": 9.291743475308044e-05,
"loss": 0.0291,
"step": 1050
},
{
"epoch": 0.19951063429324298,
"grad_norm": 0.10190416872501373,
"learning_rate": 9.282041331134181e-05,
"loss": 0.0307,
"step": 1060
},
{
"epoch": 0.19988706945228685,
"eval_E1/acc_on_CONSISTENT": 0.7549668874172185,
"eval_E1/acc_on_INCONSISTENT": 0.7551020408163265,
"eval_E1/accuracy": 0.755,
"eval_E1/balanced_accuracy": 0.7550344641167726,
"eval_E1/f1_INC": 0.6016260162601625,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.5,
"eval_E1/recall_INC": 0.7551020408163265,
"eval_E2/acc_on_CONSISTENT": 0.9507042253521126,
"eval_E2/acc_on_INCONSISTENT": 0.9310344827586207,
"eval_E2/accuracy": 0.945,
"eval_E2/balanced_accuracy": 0.9408693540553666,
"eval_E2/f1_INC": 0.9075630252100839,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.8852459016393442,
"eval_E2/recall_INC": 0.9310344827586207,
"eval_E3/acc_on_CONSISTENT": 0.9076923076923077,
"eval_E3/acc_on_INCONSISTENT": 0.8,
"eval_E3/accuracy": 0.87,
"eval_E3/balanced_accuracy": 0.8538461538461539,
"eval_E3/f1_INC": 0.8115942028985507,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 0.8235294117647058,
"eval_E3/recall_INC": 0.8,
"eval_E4/acc_on_CONSISTENT": 0.8434782608695652,
"eval_E4/acc_on_INCONSISTENT": 0.8588235294117647,
"eval_E4/accuracy": 0.85,
"eval_E4/balanced_accuracy": 0.851150895140665,
"eval_E4/f1_INC": 0.8295454545454546,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 0.8021978021978022,
"eval_E4/recall_INC": 0.8588235294117647,
"eval_edge_macro_accuracy": 0.836,
"eval_edge_macro_balanced_accuracy": 0.8326588059104241,
"eval_edge_macro_f1_INC": 0.7652008749179855,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.5581395348837209,
"eval_overall/acc_on_INCONSISTENT": 0.9426751592356688,
"eval_overall/accuracy": 0.86,
"eval_overall/balanced_accuracy": 0.7504073470596948,
"eval_overall/f1_INC": 0.9135802469135802,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.8862275449101796,
"eval_overall/recall_INC": 0.9426751592356688,
"eval_overall_exact_match": 0.44,
"eval_scene/acc_on_CONSISTENT": 0.7555555555555555,
"eval_scene/acc_on_INCONSISTENT": 0.7692307692307693,
"eval_scene/accuracy": 0.76,
"eval_scene/balanced_accuracy": 0.7623931623931623,
"eval_scene/f1_INC": 0.6756756756756758,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.6024096385542169,
"eval_scene/recall_INC": 0.7692307692307693,
"step": 1062
},
{
"epoch": 0.20139281008846227,
"grad_norm": 0.12929263710975647,
"learning_rate": 9.272339186960319e-05,
"loss": 0.0265,
"step": 1070
},
{
"epoch": 0.20327498588368154,
"grad_norm": 0.11602164059877396,
"learning_rate": 9.262637042786456e-05,
"loss": 0.0313,
"step": 1080
},
{
"epoch": 0.2051571616789008,
"grad_norm": 0.07657571136951447,
"learning_rate": 9.252934898612594e-05,
"loss": 0.0343,
"step": 1090
},
{
"epoch": 0.2070393374741201,
"grad_norm": 0.10203532129526138,
"learning_rate": 9.243232754438731e-05,
"loss": 0.0307,
"step": 1100
},
{
"epoch": 0.20892151326933936,
"grad_norm": 0.10417009890079498,
"learning_rate": 9.233530610264868e-05,
"loss": 0.0261,
"step": 1110
},
{
"epoch": 0.21080368906455862,
"grad_norm": 0.2223087102174759,
"learning_rate": 9.223828466091007e-05,
"loss": 0.0339,
"step": 1120
},
{
"epoch": 0.2126858648597779,
"grad_norm": 0.07738861441612244,
"learning_rate": 9.214126321917143e-05,
"loss": 0.0357,
"step": 1130
},
{
"epoch": 0.21456804065499718,
"grad_norm": 0.0794491246342659,
"learning_rate": 9.204424177743282e-05,
"loss": 0.0298,
"step": 1140
},
{
"epoch": 0.21645021645021645,
"grad_norm": 0.1376914381980896,
"learning_rate": 9.19472203356942e-05,
"loss": 0.0364,
"step": 1150
},
{
"epoch": 0.2183323922454357,
"grad_norm": 0.14536234736442566,
"learning_rate": 9.185019889395557e-05,
"loss": 0.0334,
"step": 1160
},
{
"epoch": 0.220214568040655,
"grad_norm": 0.07669340819120407,
"learning_rate": 9.175317745221694e-05,
"loss": 0.0318,
"step": 1170
},
{
"epoch": 0.22209674383587427,
"grad_norm": 0.06761075556278229,
"learning_rate": 9.165615601047832e-05,
"loss": 0.0278,
"step": 1180
},
{
"epoch": 0.22397891963109354,
"grad_norm": 0.1162271574139595,
"learning_rate": 9.155913456873969e-05,
"loss": 0.0261,
"step": 1190
},
{
"epoch": 0.22586109542631283,
"grad_norm": 0.08550535887479782,
"learning_rate": 9.146211312700107e-05,
"loss": 0.0276,
"step": 1200
},
{
"epoch": 0.2277432712215321,
"grad_norm": 0.13457736372947693,
"learning_rate": 9.136509168526245e-05,
"loss": 0.0319,
"step": 1210
},
{
"epoch": 0.22962544701675136,
"grad_norm": 0.119078628718853,
"learning_rate": 9.126807024352381e-05,
"loss": 0.0325,
"step": 1220
},
{
"epoch": 0.23150762281197063,
"grad_norm": 0.16809587180614471,
"learning_rate": 9.11710488017852e-05,
"loss": 0.0293,
"step": 1230
},
{
"epoch": 0.23338979860718992,
"grad_norm": 0.09518276900053024,
"learning_rate": 9.107402736004658e-05,
"loss": 0.0338,
"step": 1240
},
{
"epoch": 0.23527197440240918,
"grad_norm": 0.08279918879270554,
"learning_rate": 9.097700591830795e-05,
"loss": 0.0344,
"step": 1250
},
{
"epoch": 0.23715415019762845,
"grad_norm": 0.1353113055229187,
"learning_rate": 9.087998447656933e-05,
"loss": 0.0319,
"step": 1260
},
{
"epoch": 0.23903632599284774,
"grad_norm": 0.09605402499437332,
"learning_rate": 9.07829630348307e-05,
"loss": 0.029,
"step": 1270
},
{
"epoch": 0.240918501788067,
"grad_norm": 0.09455064684152603,
"learning_rate": 9.068594159309209e-05,
"loss": 0.033,
"step": 1280
},
{
"epoch": 0.24280067758328627,
"grad_norm": 0.10571754723787308,
"learning_rate": 9.058892015135345e-05,
"loss": 0.033,
"step": 1290
},
{
"epoch": 0.24468285337850557,
"grad_norm": 0.2133651077747345,
"learning_rate": 9.049189870961484e-05,
"loss": 0.0332,
"step": 1300
},
{
"epoch": 0.24656502917372483,
"grad_norm": 0.087664894759655,
"learning_rate": 9.039487726787621e-05,
"loss": 0.0356,
"step": 1310
},
{
"epoch": 0.2484472049689441,
"grad_norm": 0.16927213966846466,
"learning_rate": 9.029785582613758e-05,
"loss": 0.036,
"step": 1320
},
{
"epoch": 0.2503293807641634,
"grad_norm": 0.15412355959415436,
"learning_rate": 9.020083438439896e-05,
"loss": 0.0311,
"step": 1330
},
{
"epoch": 0.25221155655938265,
"grad_norm": 0.14744532108306885,
"learning_rate": 9.010381294266033e-05,
"loss": 0.0302,
"step": 1340
},
{
"epoch": 0.2540937323546019,
"grad_norm": 0.05497835949063301,
"learning_rate": 9.000679150092171e-05,
"loss": 0.0317,
"step": 1350
},
{
"epoch": 0.2559759081498212,
"grad_norm": 0.09722839295864105,
"learning_rate": 8.990977005918308e-05,
"loss": 0.0287,
"step": 1360
},
{
"epoch": 0.25785808394504045,
"grad_norm": 0.09889890998601913,
"learning_rate": 8.981274861744447e-05,
"loss": 0.0269,
"step": 1370
},
{
"epoch": 0.2597402597402597,
"grad_norm": 0.09397543966770172,
"learning_rate": 8.971572717570583e-05,
"loss": 0.0275,
"step": 1380
},
{
"epoch": 0.26162243553547904,
"grad_norm": 0.08513490110635757,
"learning_rate": 8.961870573396722e-05,
"loss": 0.0323,
"step": 1390
},
{
"epoch": 0.2635046113306983,
"grad_norm": 0.08179810643196106,
"learning_rate": 8.952168429222859e-05,
"loss": 0.0295,
"step": 1400
},
{
"epoch": 0.26538678712591757,
"grad_norm": 0.11643363535404205,
"learning_rate": 8.942466285048995e-05,
"loss": 0.0308,
"step": 1410
},
{
"epoch": 0.26726896292113683,
"grad_norm": 0.08557505905628204,
"learning_rate": 8.932764140875134e-05,
"loss": 0.0285,
"step": 1420
},
{
"epoch": 0.2691511387163561,
"grad_norm": 0.14439290761947632,
"learning_rate": 8.923061996701272e-05,
"loss": 0.0357,
"step": 1430
},
{
"epoch": 0.27103331451157536,
"grad_norm": 0.06755843758583069,
"learning_rate": 8.913359852527409e-05,
"loss": 0.0327,
"step": 1440
},
{
"epoch": 0.27291549030679463,
"grad_norm": 0.05954171344637871,
"learning_rate": 8.903657708353546e-05,
"loss": 0.03,
"step": 1450
},
{
"epoch": 0.27479766610201395,
"grad_norm": 0.13399435579776764,
"learning_rate": 8.893955564179685e-05,
"loss": 0.029,
"step": 1460
},
{
"epoch": 0.2766798418972332,
"grad_norm": 0.09965696185827255,
"learning_rate": 8.884253420005821e-05,
"loss": 0.0301,
"step": 1470
},
{
"epoch": 0.2785620176924525,
"grad_norm": 0.11371038854122162,
"learning_rate": 8.874551275831959e-05,
"loss": 0.0319,
"step": 1480
},
{
"epoch": 0.28044419348767174,
"grad_norm": 0.1467040777206421,
"learning_rate": 8.864849131658098e-05,
"loss": 0.0343,
"step": 1490
},
{
"epoch": 0.282326369282891,
"grad_norm": 0.08408571034669876,
"learning_rate": 8.855146987484234e-05,
"loss": 0.0339,
"step": 1500
},
{
"epoch": 0.2842085450781103,
"grad_norm": 0.07174082100391388,
"learning_rate": 8.845444843310372e-05,
"loss": 0.0336,
"step": 1510
},
{
"epoch": 0.2860907208733296,
"grad_norm": 0.1409539431333542,
"learning_rate": 8.83574269913651e-05,
"loss": 0.0265,
"step": 1520
},
{
"epoch": 0.28797289666854886,
"grad_norm": 0.06694231927394867,
"learning_rate": 8.826040554962647e-05,
"loss": 0.0321,
"step": 1530
},
{
"epoch": 0.2898550724637681,
"grad_norm": 0.12007555365562439,
"learning_rate": 8.816338410788785e-05,
"loss": 0.0269,
"step": 1540
},
{
"epoch": 0.2917372482589874,
"grad_norm": 0.10798055678606033,
"learning_rate": 8.806636266614922e-05,
"loss": 0.0258,
"step": 1550
},
{
"epoch": 0.29361942405420666,
"grad_norm": 0.20466643571853638,
"learning_rate": 8.79693412244106e-05,
"loss": 0.026,
"step": 1560
},
{
"epoch": 0.2955015998494259,
"grad_norm": 0.11347216367721558,
"learning_rate": 8.787231978267197e-05,
"loss": 0.0336,
"step": 1570
},
{
"epoch": 0.2973837756446452,
"grad_norm": 0.1293070763349533,
"learning_rate": 8.777529834093336e-05,
"loss": 0.0323,
"step": 1580
},
{
"epoch": 0.2992659514398645,
"grad_norm": 0.16921190917491913,
"learning_rate": 8.767827689919472e-05,
"loss": 0.0315,
"step": 1590
},
{
"epoch": 0.29983060417843027,
"eval_E1/acc_on_CONSISTENT": 0.6821192052980133,
"eval_E1/acc_on_INCONSISTENT": 0.8367346938775511,
"eval_E1/accuracy": 0.72,
"eval_E1/balanced_accuracy": 0.7594269495877821,
"eval_E1/f1_INC": 0.5942028985507247,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.4606741573033708,
"eval_E1/recall_INC": 0.8367346938775511,
"eval_E2/acc_on_CONSISTENT": 0.9859154929577465,
"eval_E2/acc_on_INCONSISTENT": 0.8793103448275862,
"eval_E2/accuracy": 0.955,
"eval_E2/balanced_accuracy": 0.9326129188926664,
"eval_E2/f1_INC": 0.9189189189189189,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.9622641509433962,
"eval_E2/recall_INC": 0.8793103448275862,
"eval_E3/acc_on_CONSISTENT": 0.9307692307692308,
"eval_E3/acc_on_INCONSISTENT": 0.8,
"eval_E3/accuracy": 0.885,
"eval_E3/balanced_accuracy": 0.8653846153846154,
"eval_E3/f1_INC": 0.8296296296296297,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 0.8615384615384616,
"eval_E3/recall_INC": 0.8,
"eval_E4/acc_on_CONSISTENT": 0.8608695652173913,
"eval_E4/acc_on_INCONSISTENT": 0.8705882352941177,
"eval_E4/accuracy": 0.865,
"eval_E4/balanced_accuracy": 0.8657289002557544,
"eval_E4/f1_INC": 0.8457142857142856,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 0.8222222222222222,
"eval_E4/recall_INC": 0.8705882352941177,
"eval_edge_macro_accuracy": 0.845,
"eval_edge_macro_balanced_accuracy": 0.8438329560264428,
"eval_edge_macro_f1_INC": 0.7813551183936978,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.5116279069767442,
"eval_overall/acc_on_INCONSISTENT": 0.9617834394904459,
"eval_overall/accuracy": 0.865,
"eval_overall/balanced_accuracy": 0.736705673233595,
"eval_overall/f1_INC": 0.9179331306990881,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.877906976744186,
"eval_overall/recall_INC": 0.9617834394904459,
"eval_overall_exact_match": 0.44,
"eval_scene/acc_on_CONSISTENT": 0.8074074074074075,
"eval_scene/acc_on_INCONSISTENT": 0.7846153846153846,
"eval_scene/accuracy": 0.8,
"eval_scene/balanced_accuracy": 0.796011396011396,
"eval_scene/f1_INC": 0.7183098591549296,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.6623376623376623,
"eval_scene/recall_INC": 0.7846153846153846,
"step": 1593
},
{
"epoch": 0.3011481272350838,
"grad_norm": 0.13088257610797882,
"learning_rate": 8.75812554574561e-05,
"loss": 0.0357,
"step": 1600
},
{
"epoch": 0.30303030303030304,
"grad_norm": 0.12424547970294952,
"learning_rate": 8.748423401571748e-05,
"loss": 0.0351,
"step": 1610
},
{
"epoch": 0.3049124788255223,
"grad_norm": 0.13020102679729462,
"learning_rate": 8.738721257397885e-05,
"loss": 0.0285,
"step": 1620
},
{
"epoch": 0.30679465462074157,
"grad_norm": 0.0963355079293251,
"learning_rate": 8.729019113224023e-05,
"loss": 0.0321,
"step": 1630
},
{
"epoch": 0.30867683041596083,
"grad_norm": 0.10007308423519135,
"learning_rate": 8.71931696905016e-05,
"loss": 0.035,
"step": 1640
},
{
"epoch": 0.3105590062111801,
"grad_norm": 0.09309057146310806,
"learning_rate": 8.709614824876298e-05,
"loss": 0.0332,
"step": 1650
},
{
"epoch": 0.3124411820063994,
"grad_norm": 0.13886569440364838,
"learning_rate": 8.699912680702435e-05,
"loss": 0.0312,
"step": 1660
},
{
"epoch": 0.3143233578016187,
"grad_norm": 0.10759452730417252,
"learning_rate": 8.690210536528574e-05,
"loss": 0.0334,
"step": 1670
},
{
"epoch": 0.31620553359683795,
"grad_norm": 0.11499182879924774,
"learning_rate": 8.68050839235471e-05,
"loss": 0.0301,
"step": 1680
},
{
"epoch": 0.3180877093920572,
"grad_norm": 0.1072067990899086,
"learning_rate": 8.670806248180849e-05,
"loss": 0.0336,
"step": 1690
},
{
"epoch": 0.3199698851872765,
"grad_norm": 0.10061544179916382,
"learning_rate": 8.661104104006986e-05,
"loss": 0.0331,
"step": 1700
},
{
"epoch": 0.32185206098249575,
"grad_norm": 0.12949976325035095,
"learning_rate": 8.651401959833124e-05,
"loss": 0.0291,
"step": 1710
},
{
"epoch": 0.323734236777715,
"grad_norm": 0.14409397542476654,
"learning_rate": 8.641699815659261e-05,
"loss": 0.0266,
"step": 1720
},
{
"epoch": 0.32561641257293433,
"grad_norm": 0.10314024984836578,
"learning_rate": 8.631997671485399e-05,
"loss": 0.0313,
"step": 1730
},
{
"epoch": 0.3274985883681536,
"grad_norm": 0.15678931772708893,
"learning_rate": 8.622295527311536e-05,
"loss": 0.0351,
"step": 1740
},
{
"epoch": 0.32938076416337286,
"grad_norm": 0.09819275140762329,
"learning_rate": 8.612593383137673e-05,
"loss": 0.0337,
"step": 1750
},
{
"epoch": 0.33126293995859213,
"grad_norm": 0.13852599263191223,
"learning_rate": 8.602891238963812e-05,
"loss": 0.0312,
"step": 1760
},
{
"epoch": 0.3331451157538114,
"grad_norm": 0.11017139256000519,
"learning_rate": 8.593189094789948e-05,
"loss": 0.0305,
"step": 1770
},
{
"epoch": 0.33502729154903066,
"grad_norm": 0.07422087341547012,
"learning_rate": 8.583486950616087e-05,
"loss": 0.0263,
"step": 1780
},
{
"epoch": 0.33690946734425,
"grad_norm": 0.1125585064291954,
"learning_rate": 8.573784806442225e-05,
"loss": 0.0315,
"step": 1790
},
{
"epoch": 0.33879164313946925,
"grad_norm": 0.08203578740358353,
"learning_rate": 8.56408266226836e-05,
"loss": 0.0307,
"step": 1800
},
{
"epoch": 0.3406738189346885,
"grad_norm": 0.10316994786262512,
"learning_rate": 8.5543805180945e-05,
"loss": 0.0249,
"step": 1810
},
{
"epoch": 0.3425559947299078,
"grad_norm": 0.18619760870933533,
"learning_rate": 8.544678373920637e-05,
"loss": 0.0264,
"step": 1820
},
{
"epoch": 0.34443817052512704,
"grad_norm": 0.08711568266153336,
"learning_rate": 8.534976229746774e-05,
"loss": 0.0342,
"step": 1830
},
{
"epoch": 0.3463203463203463,
"grad_norm": 0.11246860027313232,
"learning_rate": 8.525274085572912e-05,
"loss": 0.03,
"step": 1840
},
{
"epoch": 0.34820252211556557,
"grad_norm": 0.05884129926562309,
"learning_rate": 8.51557194139905e-05,
"loss": 0.0299,
"step": 1850
},
{
"epoch": 0.3500846979107849,
"grad_norm": 0.12434038519859314,
"learning_rate": 8.505869797225187e-05,
"loss": 0.0263,
"step": 1860
},
{
"epoch": 0.35196687370600416,
"grad_norm": 0.0966510996222496,
"learning_rate": 8.496167653051324e-05,
"loss": 0.029,
"step": 1870
},
{
"epoch": 0.3538490495012234,
"grad_norm": 0.12718771398067474,
"learning_rate": 8.486465508877463e-05,
"loss": 0.0346,
"step": 1880
},
{
"epoch": 0.3557312252964427,
"grad_norm": 0.04632233828306198,
"learning_rate": 8.4767633647036e-05,
"loss": 0.029,
"step": 1890
},
{
"epoch": 0.35761340109166195,
"grad_norm": 0.1020045280456543,
"learning_rate": 8.467061220529738e-05,
"loss": 0.0283,
"step": 1900
},
{
"epoch": 0.3594955768868812,
"grad_norm": 0.14108321070671082,
"learning_rate": 8.457359076355875e-05,
"loss": 0.0298,
"step": 1910
},
{
"epoch": 0.3613777526821005,
"grad_norm": 0.12967492640018463,
"learning_rate": 8.447656932182014e-05,
"loss": 0.0298,
"step": 1920
},
{
"epoch": 0.3632599284773198,
"grad_norm": 0.07042180001735687,
"learning_rate": 8.43795478800815e-05,
"loss": 0.0284,
"step": 1930
},
{
"epoch": 0.36514210427253907,
"grad_norm": 0.14567403495311737,
"learning_rate": 8.428252643834287e-05,
"loss": 0.028,
"step": 1940
},
{
"epoch": 0.36702428006775834,
"grad_norm": 0.10920072346925735,
"learning_rate": 8.418550499660426e-05,
"loss": 0.0319,
"step": 1950
},
{
"epoch": 0.3689064558629776,
"grad_norm": 0.0970524400472641,
"learning_rate": 8.408848355486562e-05,
"loss": 0.0263,
"step": 1960
},
{
"epoch": 0.37078863165819687,
"grad_norm": 0.13133934140205383,
"learning_rate": 8.399146211312701e-05,
"loss": 0.0333,
"step": 1970
},
{
"epoch": 0.37267080745341613,
"grad_norm": 0.12621761858463287,
"learning_rate": 8.389444067138838e-05,
"loss": 0.0302,
"step": 1980
},
{
"epoch": 0.3745529832486354,
"grad_norm": 0.08393672108650208,
"learning_rate": 8.379741922964976e-05,
"loss": 0.0296,
"step": 1990
},
{
"epoch": 0.3764351590438547,
"grad_norm": 0.11379829049110413,
"learning_rate": 8.370039778791113e-05,
"loss": 0.0255,
"step": 2000
},
{
"epoch": 0.378317334839074,
"grad_norm": 0.07760214060544968,
"learning_rate": 8.360337634617251e-05,
"loss": 0.0244,
"step": 2010
},
{
"epoch": 0.38019951063429325,
"grad_norm": 0.07392806559801102,
"learning_rate": 8.350635490443388e-05,
"loss": 0.0315,
"step": 2020
},
{
"epoch": 0.3820816864295125,
"grad_norm": 0.12959477305412292,
"learning_rate": 8.340933346269526e-05,
"loss": 0.0302,
"step": 2030
},
{
"epoch": 0.3839638622247318,
"grad_norm": 0.09377480298280716,
"learning_rate": 8.331231202095664e-05,
"loss": 0.0302,
"step": 2040
},
{
"epoch": 0.38584603801995104,
"grad_norm": 0.06865111738443375,
"learning_rate": 8.3215290579218e-05,
"loss": 0.0314,
"step": 2050
},
{
"epoch": 0.38772821381517036,
"grad_norm": 0.11195676028728485,
"learning_rate": 8.311826913747939e-05,
"loss": 0.0273,
"step": 2060
},
{
"epoch": 0.38961038961038963,
"grad_norm": 0.1206878051161766,
"learning_rate": 8.302124769574077e-05,
"loss": 0.034,
"step": 2070
},
{
"epoch": 0.3914925654056089,
"grad_norm": 0.09009220451116562,
"learning_rate": 8.292422625400214e-05,
"loss": 0.0296,
"step": 2080
},
{
"epoch": 0.39337474120082816,
"grad_norm": 0.1171526163816452,
"learning_rate": 8.282720481226351e-05,
"loss": 0.031,
"step": 2090
},
{
"epoch": 0.3952569169960474,
"grad_norm": 0.0794205442070961,
"learning_rate": 8.273018337052489e-05,
"loss": 0.0255,
"step": 2100
},
{
"epoch": 0.3971390927912667,
"grad_norm": 0.07322624325752258,
"learning_rate": 8.263316192878626e-05,
"loss": 0.0287,
"step": 2110
},
{
"epoch": 0.39902126858648596,
"grad_norm": 0.09714718908071518,
"learning_rate": 8.253614048704764e-05,
"loss": 0.0261,
"step": 2120
},
{
"epoch": 0.3997741389045737,
"eval_E1/acc_on_CONSISTENT": 0.8807947019867549,
"eval_E1/acc_on_INCONSISTENT": 0.6530612244897959,
"eval_E1/accuracy": 0.825,
"eval_E1/balanced_accuracy": 0.7669279632382754,
"eval_E1/f1_INC": 0.6464646464646464,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.64,
"eval_E1/recall_INC": 0.6530612244897959,
"eval_E2/acc_on_CONSISTENT": 0.9929577464788732,
"eval_E2/acc_on_INCONSISTENT": 0.9137931034482759,
"eval_E2/accuracy": 0.97,
"eval_E2/balanced_accuracy": 0.9533754249635746,
"eval_E2/f1_INC": 0.9464285714285714,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.9814814814814815,
"eval_E2/recall_INC": 0.9137931034482759,
"eval_E3/acc_on_CONSISTENT": 0.9615384615384616,
"eval_E3/acc_on_INCONSISTENT": 0.7857142857142857,
"eval_E3/accuracy": 0.9,
"eval_E3/balanced_accuracy": 0.8736263736263736,
"eval_E3/f1_INC": 0.8461538461538461,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 0.9166666666666666,
"eval_E3/recall_INC": 0.7857142857142857,
"eval_E4/acc_on_CONSISTENT": 0.9478260869565217,
"eval_E4/acc_on_INCONSISTENT": 0.8117647058823529,
"eval_E4/accuracy": 0.89,
"eval_E4/balanced_accuracy": 0.8797953964194374,
"eval_E4/f1_INC": 0.8625,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 0.92,
"eval_E4/recall_INC": 0.8117647058823529,
"eval_edge_macro_accuracy": 0.877,
"eval_edge_macro_balanced_accuracy": 0.8403860572905579,
"eval_edge_macro_f1_INC": 0.7862353387353387,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.8604651162790697,
"eval_overall/acc_on_INCONSISTENT": 0.8789808917197452,
"eval_overall/accuracy": 0.875,
"eval_overall/balanced_accuracy": 0.8697230039994075,
"eval_overall/f1_INC": 0.9169435215946845,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.9583333333333334,
"eval_overall/recall_INC": 0.8789808917197452,
"eval_overall_exact_match": 0.56,
"eval_scene/acc_on_CONSISTENT": 0.9333333333333333,
"eval_scene/acc_on_INCONSISTENT": 0.5230769230769231,
"eval_scene/accuracy": 0.8,
"eval_scene/balanced_accuracy": 0.7282051282051283,
"eval_scene/f1_INC": 0.6296296296296297,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.7906976744186046,
"eval_scene/recall_INC": 0.5230769230769231,
"step": 2124
},
{
"epoch": 0.4009034443817053,
"grad_norm": 0.15719006955623627,
"learning_rate": 8.243911904530903e-05,
"loss": 0.0269,
"step": 2130
},
{
"epoch": 0.40278562017692454,
"grad_norm": 0.06503473967313766,
"learning_rate": 8.234209760357039e-05,
"loss": 0.0283,
"step": 2140
},
{
"epoch": 0.4046677959721438,
"grad_norm": 0.09964703023433685,
"learning_rate": 8.224507616183177e-05,
"loss": 0.0232,
"step": 2150
},
{
"epoch": 0.40654997176736307,
"grad_norm": 0.13143323361873627,
"learning_rate": 8.214805472009315e-05,
"loss": 0.0267,
"step": 2160
},
{
"epoch": 0.40843214756258234,
"grad_norm": 0.12974168360233307,
"learning_rate": 8.205103327835452e-05,
"loss": 0.0256,
"step": 2170
},
{
"epoch": 0.4103143233578016,
"grad_norm": 0.09947684407234192,
"learning_rate": 8.19540118366159e-05,
"loss": 0.0307,
"step": 2180
},
{
"epoch": 0.41219649915302087,
"grad_norm": 0.10723303258419037,
"learning_rate": 8.185699039487727e-05,
"loss": 0.0283,
"step": 2190
},
{
"epoch": 0.4140786749482402,
"grad_norm": 0.07822173833847046,
"learning_rate": 8.175996895313865e-05,
"loss": 0.0269,
"step": 2200
},
{
"epoch": 0.41596085074345945,
"grad_norm": 0.10570277273654938,
"learning_rate": 8.166294751140002e-05,
"loss": 0.0295,
"step": 2210
},
{
"epoch": 0.4178430265386787,
"grad_norm": 0.09187448024749756,
"learning_rate": 8.156592606966141e-05,
"loss": 0.0308,
"step": 2220
},
{
"epoch": 0.419725202333898,
"grad_norm": 0.10860244184732437,
"learning_rate": 8.146890462792277e-05,
"loss": 0.0312,
"step": 2230
},
{
"epoch": 0.42160737812911725,
"grad_norm": 0.07823146134614944,
"learning_rate": 8.137188318618416e-05,
"loss": 0.0302,
"step": 2240
},
{
"epoch": 0.4234895539243365,
"grad_norm": 0.05982290208339691,
"learning_rate": 8.127486174444553e-05,
"loss": 0.0261,
"step": 2250
},
{
"epoch": 0.4253717297195558,
"grad_norm": 0.13135980069637299,
"learning_rate": 8.117784030270689e-05,
"loss": 0.0357,
"step": 2260
},
{
"epoch": 0.4272539055147751,
"grad_norm": 0.08659800887107849,
"learning_rate": 8.108081886096828e-05,
"loss": 0.0331,
"step": 2270
},
{
"epoch": 0.42913608130999437,
"grad_norm": 0.07572152465581894,
"learning_rate": 8.098379741922965e-05,
"loss": 0.0284,
"step": 2280
},
{
"epoch": 0.43101825710521363,
"grad_norm": 0.11546391248703003,
"learning_rate": 8.088677597749103e-05,
"loss": 0.034,
"step": 2290
},
{
"epoch": 0.4329004329004329,
"grad_norm": 0.09705963730812073,
"learning_rate": 8.07897545357524e-05,
"loss": 0.0277,
"step": 2300
},
{
"epoch": 0.43478260869565216,
"grad_norm": 0.1337226778268814,
"learning_rate": 8.069273309401379e-05,
"loss": 0.0275,
"step": 2310
},
{
"epoch": 0.4366647844908714,
"grad_norm": 0.10398007929325104,
"learning_rate": 8.059571165227515e-05,
"loss": 0.0269,
"step": 2320
},
{
"epoch": 0.43854696028609075,
"grad_norm": 0.059763580560684204,
"learning_rate": 8.049869021053653e-05,
"loss": 0.03,
"step": 2330
},
{
"epoch": 0.44042913608131,
"grad_norm": 0.1391168087720871,
"learning_rate": 8.040166876879791e-05,
"loss": 0.0259,
"step": 2340
},
{
"epoch": 0.4423113118765293,
"grad_norm": 0.12780527770519257,
"learning_rate": 8.030464732705927e-05,
"loss": 0.0306,
"step": 2350
},
{
"epoch": 0.44419348767174854,
"grad_norm": 0.09013444930315018,
"learning_rate": 8.020762588532066e-05,
"loss": 0.0238,
"step": 2360
},
{
"epoch": 0.4460756634669678,
"grad_norm": 0.08515927940607071,
"learning_rate": 8.011060444358204e-05,
"loss": 0.0315,
"step": 2370
},
{
"epoch": 0.4479578392621871,
"grad_norm": 0.07814784348011017,
"learning_rate": 8.001358300184341e-05,
"loss": 0.0284,
"step": 2380
},
{
"epoch": 0.44984001505740634,
"grad_norm": 0.10175956785678864,
"learning_rate": 7.991656156010478e-05,
"loss": 0.03,
"step": 2390
},
{
"epoch": 0.45172219085262566,
"grad_norm": 0.0597836934030056,
"learning_rate": 7.981954011836616e-05,
"loss": 0.0266,
"step": 2400
},
{
"epoch": 0.4536043666478449,
"grad_norm": 0.07506367564201355,
"learning_rate": 7.972251867662753e-05,
"loss": 0.0319,
"step": 2410
},
{
"epoch": 0.4554865424430642,
"grad_norm": 0.08653825521469116,
"learning_rate": 7.962549723488891e-05,
"loss": 0.0264,
"step": 2420
},
{
"epoch": 0.45736871823828346,
"grad_norm": 0.14505213499069214,
"learning_rate": 7.95284757931503e-05,
"loss": 0.0252,
"step": 2430
},
{
"epoch": 0.4592508940335027,
"grad_norm": 0.13145671784877777,
"learning_rate": 7.943145435141166e-05,
"loss": 0.0295,
"step": 2440
},
{
"epoch": 0.461133069828722,
"grad_norm": 0.07361818104982376,
"learning_rate": 7.933443290967304e-05,
"loss": 0.0269,
"step": 2450
},
{
"epoch": 0.46301524562394125,
"grad_norm": 0.1015157401561737,
"learning_rate": 7.923741146793442e-05,
"loss": 0.0279,
"step": 2460
},
{
"epoch": 0.4648974214191606,
"grad_norm": 0.09409838169813156,
"learning_rate": 7.914039002619579e-05,
"loss": 0.0294,
"step": 2470
},
{
"epoch": 0.46677959721437984,
"grad_norm": 0.0932067483663559,
"learning_rate": 7.904336858445717e-05,
"loss": 0.0265,
"step": 2480
},
{
"epoch": 0.4686617730095991,
"grad_norm": 0.15952104330062866,
"learning_rate": 7.894634714271854e-05,
"loss": 0.0255,
"step": 2490
},
{
"epoch": 0.47054394880481837,
"grad_norm": 0.09479888528585434,
"learning_rate": 7.884932570097993e-05,
"loss": 0.0279,
"step": 2500
},
{
"epoch": 0.47242612460003763,
"grad_norm": 0.1220136433839798,
"learning_rate": 7.875230425924129e-05,
"loss": 0.0294,
"step": 2510
},
{
"epoch": 0.4743083003952569,
"grad_norm": 0.08821658045053482,
"learning_rate": 7.865528281750268e-05,
"loss": 0.0305,
"step": 2520
},
{
"epoch": 0.47619047619047616,
"grad_norm": 0.23937903344631195,
"learning_rate": 7.855826137576405e-05,
"loss": 0.0269,
"step": 2530
},
{
"epoch": 0.4780726519856955,
"grad_norm": 0.09873885661363602,
"learning_rate": 7.846123993402543e-05,
"loss": 0.0324,
"step": 2540
},
{
"epoch": 0.47995482778091475,
"grad_norm": 0.08553300052881241,
"learning_rate": 7.83642184922868e-05,
"loss": 0.0328,
"step": 2550
},
{
"epoch": 0.481837003576134,
"grad_norm": 0.1176324337720871,
"learning_rate": 7.826719705054818e-05,
"loss": 0.0353,
"step": 2560
},
{
"epoch": 0.4837191793713533,
"grad_norm": 0.09982674568891525,
"learning_rate": 7.817017560880955e-05,
"loss": 0.0301,
"step": 2570
},
{
"epoch": 0.48560135516657255,
"grad_norm": 0.08941078931093216,
"learning_rate": 7.807315416707092e-05,
"loss": 0.0286,
"step": 2580
},
{
"epoch": 0.4874835309617918,
"grad_norm": 0.15026530623435974,
"learning_rate": 7.797613272533231e-05,
"loss": 0.0266,
"step": 2590
},
{
"epoch": 0.48936570675701113,
"grad_norm": 0.10724597424268723,
"learning_rate": 7.787911128359367e-05,
"loss": 0.0284,
"step": 2600
},
{
"epoch": 0.4912478825522304,
"grad_norm": 0.08620548248291016,
"learning_rate": 7.778208984185506e-05,
"loss": 0.0296,
"step": 2610
},
{
"epoch": 0.49313005834744966,
"grad_norm": 0.08863481879234314,
"learning_rate": 7.768506840011643e-05,
"loss": 0.0241,
"step": 2620
},
{
"epoch": 0.4950122341426689,
"grad_norm": 0.08469167351722717,
"learning_rate": 7.758804695837781e-05,
"loss": 0.0273,
"step": 2630
},
{
"epoch": 0.4968944099378882,
"grad_norm": 0.133014976978302,
"learning_rate": 7.749102551663918e-05,
"loss": 0.0295,
"step": 2640
},
{
"epoch": 0.49877658573310746,
"grad_norm": 0.09178700298070908,
"learning_rate": 7.739400407490056e-05,
"loss": 0.0293,
"step": 2650
},
{
"epoch": 0.4997176736307171,
"eval_E1/acc_on_CONSISTENT": 0.8211920529801324,
"eval_E1/acc_on_INCONSISTENT": 0.7346938775510204,
"eval_E1/accuracy": 0.8,
"eval_E1/balanced_accuracy": 0.7779429652655765,
"eval_E1/f1_INC": 0.6428571428571428,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.5714285714285714,
"eval_E1/recall_INC": 0.7346938775510204,
"eval_E2/acc_on_CONSISTENT": 0.9929577464788732,
"eval_E2/acc_on_INCONSISTENT": 0.8793103448275862,
"eval_E2/accuracy": 0.96,
"eval_E2/balanced_accuracy": 0.9361340456532297,
"eval_E2/f1_INC": 0.9272727272727272,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.9807692307692307,
"eval_E2/recall_INC": 0.8793103448275862,
"eval_E3/acc_on_CONSISTENT": 0.9692307692307692,
"eval_E3/acc_on_INCONSISTENT": 0.7857142857142857,
"eval_E3/accuracy": 0.905,
"eval_E3/balanced_accuracy": 0.8774725274725275,
"eval_E3/f1_INC": 0.8527131782945736,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 0.9322033898305084,
"eval_E3/recall_INC": 0.7857142857142857,
"eval_E4/acc_on_CONSISTENT": 0.9565217391304348,
"eval_E4/acc_on_INCONSISTENT": 0.8352941176470589,
"eval_E4/accuracy": 0.905,
"eval_E4/balanced_accuracy": 0.8959079283887468,
"eval_E4/f1_INC": 0.8819875776397516,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 0.9342105263157895,
"eval_E4/recall_INC": 0.8352941176470589,
"eval_edge_macro_accuracy": 0.881,
"eval_edge_macro_balanced_accuracy": 0.8602835161480389,
"eval_edge_macro_f1_INC": 0.8105844458235261,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.813953488372093,
"eval_overall/acc_on_INCONSISTENT": 0.9235668789808917,
"eval_overall/accuracy": 0.9,
"eval_overall/balanced_accuracy": 0.8687601836764924,
"eval_overall/f1_INC": 0.935483870967742,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.9477124183006536,
"eval_overall/recall_INC": 0.9235668789808917,
"eval_overall_exact_match": 0.575,
"eval_scene/acc_on_CONSISTENT": 0.8740740740740741,
"eval_scene/acc_on_INCONSISTENT": 0.7538461538461538,
"eval_scene/accuracy": 0.835,
"eval_scene/balanced_accuracy": 0.813960113960114,
"eval_scene/f1_INC": 0.7480916030534351,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.7424242424242424,
"eval_scene/recall_INC": 0.7538461538461538,
"step": 2655
},
{
"epoch": 0.5006587615283268,
"grad_norm": 0.11279813200235367,
"learning_rate": 7.729698263316193e-05,
"loss": 0.0309,
"step": 2660
},
{
"epoch": 0.502540937323546,
"grad_norm": 0.08533964306116104,
"learning_rate": 7.71999611914233e-05,
"loss": 0.0256,
"step": 2670
},
{
"epoch": 0.5044231131187653,
"grad_norm": 0.14148874580860138,
"learning_rate": 7.71029397496847e-05,
"loss": 0.0236,
"step": 2680
},
{
"epoch": 0.5063052889139845,
"grad_norm": 0.11055805534124374,
"learning_rate": 7.700591830794605e-05,
"loss": 0.0305,
"step": 2690
},
{
"epoch": 0.5081874647092038,
"grad_norm": 0.0990087240934372,
"learning_rate": 7.690889686620744e-05,
"loss": 0.0294,
"step": 2700
},
{
"epoch": 0.5100696405044232,
"grad_norm": 0.12202861160039902,
"learning_rate": 7.681187542446882e-05,
"loss": 0.025,
"step": 2710
},
{
"epoch": 0.5119518162996424,
"grad_norm": 0.10385531932115555,
"learning_rate": 7.671485398273018e-05,
"loss": 0.0314,
"step": 2720
},
{
"epoch": 0.5138339920948617,
"grad_norm": 0.07932283729314804,
"learning_rate": 7.661783254099157e-05,
"loss": 0.0248,
"step": 2730
},
{
"epoch": 0.5157161678900809,
"grad_norm": 0.10993891954421997,
"learning_rate": 7.652081109925294e-05,
"loss": 0.0242,
"step": 2740
},
{
"epoch": 0.5175983436853002,
"grad_norm": 0.16471970081329346,
"learning_rate": 7.642378965751431e-05,
"loss": 0.0303,
"step": 2750
},
{
"epoch": 0.5194805194805194,
"grad_norm": 0.10347539931535721,
"learning_rate": 7.632676821577569e-05,
"loss": 0.0274,
"step": 2760
},
{
"epoch": 0.5213626952757388,
"grad_norm": 0.11677437275648117,
"learning_rate": 7.622974677403706e-05,
"loss": 0.0288,
"step": 2770
},
{
"epoch": 0.5232448710709581,
"grad_norm": 0.09840503334999084,
"learning_rate": 7.613272533229844e-05,
"loss": 0.0269,
"step": 2780
},
{
"epoch": 0.5251270468661773,
"grad_norm": 0.06443244963884354,
"learning_rate": 7.603570389055981e-05,
"loss": 0.0337,
"step": 2790
},
{
"epoch": 0.5270092226613966,
"grad_norm": 0.11365149915218353,
"learning_rate": 7.59386824488212e-05,
"loss": 0.0269,
"step": 2800
},
{
"epoch": 0.5288913984566158,
"grad_norm": 0.09044452011585236,
"learning_rate": 7.584166100708256e-05,
"loss": 0.0299,
"step": 2810
},
{
"epoch": 0.5307735742518351,
"grad_norm": 0.10111326724290848,
"learning_rate": 7.574463956534395e-05,
"loss": 0.0262,
"step": 2820
},
{
"epoch": 0.5326557500470543,
"grad_norm": 0.1057933047413826,
"learning_rate": 7.564761812360532e-05,
"loss": 0.0232,
"step": 2830
},
{
"epoch": 0.5345379258422737,
"grad_norm": 0.11712583154439926,
"learning_rate": 7.55505966818667e-05,
"loss": 0.0282,
"step": 2840
},
{
"epoch": 0.536420101637493,
"grad_norm": 0.09643035382032394,
"learning_rate": 7.545357524012807e-05,
"loss": 0.0269,
"step": 2850
},
{
"epoch": 0.5383022774327122,
"grad_norm": 0.10376808047294617,
"learning_rate": 7.535655379838945e-05,
"loss": 0.024,
"step": 2860
},
{
"epoch": 0.5401844532279315,
"grad_norm": 0.24281369149684906,
"learning_rate": 7.525953235665082e-05,
"loss": 0.0283,
"step": 2870
},
{
"epoch": 0.5420666290231507,
"grad_norm": 0.10237613320350647,
"learning_rate": 7.51625109149122e-05,
"loss": 0.0316,
"step": 2880
},
{
"epoch": 0.54394880481837,
"grad_norm": 0.12895576655864716,
"learning_rate": 7.506548947317358e-05,
"loss": 0.0294,
"step": 2890
},
{
"epoch": 0.5458309806135893,
"grad_norm": 0.11355803906917572,
"learning_rate": 7.496846803143494e-05,
"loss": 0.0277,
"step": 2900
},
{
"epoch": 0.5477131564088086,
"grad_norm": 0.16196122765541077,
"learning_rate": 7.487144658969633e-05,
"loss": 0.0305,
"step": 2910
},
{
"epoch": 0.5495953322040279,
"grad_norm": 0.08025684952735901,
"learning_rate": 7.47744251479577e-05,
"loss": 0.0291,
"step": 2920
},
{
"epoch": 0.5514775079992471,
"grad_norm": 0.10405171662569046,
"learning_rate": 7.467740370621908e-05,
"loss": 0.0266,
"step": 2930
},
{
"epoch": 0.5533596837944664,
"grad_norm": 0.17075183987617493,
"learning_rate": 7.458038226448045e-05,
"loss": 0.0261,
"step": 2940
},
{
"epoch": 0.5552418595896856,
"grad_norm": 0.13905194401741028,
"learning_rate": 7.448336082274183e-05,
"loss": 0.0234,
"step": 2950
},
{
"epoch": 0.557124035384905,
"grad_norm": 0.08814238011837006,
"learning_rate": 7.43863393810032e-05,
"loss": 0.0342,
"step": 2960
},
{
"epoch": 0.5590062111801242,
"grad_norm": 0.08515793830156326,
"learning_rate": 7.428931793926458e-05,
"loss": 0.0293,
"step": 2970
},
{
"epoch": 0.5608883869753435,
"grad_norm": 0.0772959515452385,
"learning_rate": 7.419229649752596e-05,
"loss": 0.026,
"step": 2980
},
{
"epoch": 0.5627705627705628,
"grad_norm": 0.12232999503612518,
"learning_rate": 7.409527505578732e-05,
"loss": 0.0315,
"step": 2990
},
{
"epoch": 0.564652738565782,
"grad_norm": 0.062099162489175797,
"learning_rate": 7.399825361404871e-05,
"loss": 0.0261,
"step": 3000
},
{
"epoch": 0.5665349143610013,
"grad_norm": 0.08616367727518082,
"learning_rate": 7.390123217231009e-05,
"loss": 0.0221,
"step": 3010
},
{
"epoch": 0.5684170901562206,
"grad_norm": 0.1390579491853714,
"learning_rate": 7.380421073057146e-05,
"loss": 0.0289,
"step": 3020
},
{
"epoch": 0.5702992659514399,
"grad_norm": 0.0917593464255333,
"learning_rate": 7.370718928883284e-05,
"loss": 0.0249,
"step": 3030
},
{
"epoch": 0.5721814417466592,
"grad_norm": 0.12263333052396774,
"learning_rate": 7.361016784709421e-05,
"loss": 0.0284,
"step": 3040
},
{
"epoch": 0.5740636175418784,
"grad_norm": 0.08040110766887665,
"learning_rate": 7.351314640535558e-05,
"loss": 0.0231,
"step": 3050
},
{
"epoch": 0.5759457933370977,
"grad_norm": 0.11405957490205765,
"learning_rate": 7.341612496361696e-05,
"loss": 0.0238,
"step": 3060
},
{
"epoch": 0.5778279691323169,
"grad_norm": 0.05968109518289566,
"learning_rate": 7.331910352187835e-05,
"loss": 0.0282,
"step": 3070
},
{
"epoch": 0.5797101449275363,
"grad_norm": 0.10681314766407013,
"learning_rate": 7.322208208013971e-05,
"loss": 0.027,
"step": 3080
},
{
"epoch": 0.5815923207227555,
"grad_norm": 0.0905841812491417,
"learning_rate": 7.31250606384011e-05,
"loss": 0.0258,
"step": 3090
},
{
"epoch": 0.5834744965179748,
"grad_norm": 0.07992485910654068,
"learning_rate": 7.302803919666247e-05,
"loss": 0.021,
"step": 3100
},
{
"epoch": 0.5853566723131941,
"grad_norm": 0.09587814658880234,
"learning_rate": 7.293101775492384e-05,
"loss": 0.0338,
"step": 3110
},
{
"epoch": 0.5872388481084133,
"grad_norm": 0.07799631357192993,
"learning_rate": 7.283399631318522e-05,
"loss": 0.0284,
"step": 3120
},
{
"epoch": 0.5891210239036326,
"grad_norm": 0.1305895447731018,
"learning_rate": 7.273697487144659e-05,
"loss": 0.0271,
"step": 3130
},
{
"epoch": 0.5910031996988518,
"grad_norm": 0.13612420856952667,
"learning_rate": 7.263995342970798e-05,
"loss": 0.0241,
"step": 3140
},
{
"epoch": 0.5928853754940712,
"grad_norm": 0.10845185816287994,
"learning_rate": 7.254293198796934e-05,
"loss": 0.0281,
"step": 3150
},
{
"epoch": 0.5947675512892904,
"grad_norm": 0.10513018816709518,
"learning_rate": 7.244591054623073e-05,
"loss": 0.0264,
"step": 3160
},
{
"epoch": 0.5966497270845097,
"grad_norm": 0.17080609500408173,
"learning_rate": 7.23488891044921e-05,
"loss": 0.0273,
"step": 3170
},
{
"epoch": 0.598531902879729,
"grad_norm": 0.08871451020240784,
"learning_rate": 7.225186766275346e-05,
"loss": 0.0309,
"step": 3180
},
{
"epoch": 0.5996612083568605,
"eval_E1/acc_on_CONSISTENT": 0.8211920529801324,
"eval_E1/acc_on_INCONSISTENT": 0.7346938775510204,
"eval_E1/accuracy": 0.8,
"eval_E1/balanced_accuracy": 0.7779429652655765,
"eval_E1/f1_INC": 0.6428571428571428,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.5714285714285714,
"eval_E1/recall_INC": 0.7346938775510204,
"eval_E2/acc_on_CONSISTENT": 0.9929577464788732,
"eval_E2/acc_on_INCONSISTENT": 0.9655172413793104,
"eval_E2/accuracy": 0.985,
"eval_E2/balanced_accuracy": 0.9792374939290918,
"eval_E2/f1_INC": 0.9739130434782608,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.9824561403508771,
"eval_E2/recall_INC": 0.9655172413793104,
"eval_E3/acc_on_CONSISTENT": 0.9384615384615385,
"eval_E3/acc_on_INCONSISTENT": 0.7714285714285715,
"eval_E3/accuracy": 0.88,
"eval_E3/balanced_accuracy": 0.854945054945055,
"eval_E3/f1_INC": 0.8181818181818182,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 0.8709677419354839,
"eval_E3/recall_INC": 0.7714285714285715,
"eval_E4/acc_on_CONSISTENT": 0.9478260869565217,
"eval_E4/acc_on_INCONSISTENT": 0.7764705882352941,
"eval_E4/accuracy": 0.875,
"eval_E4/balanced_accuracy": 0.8621483375959079,
"eval_E4/f1_INC": 0.8407643312101911,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 0.9166666666666666,
"eval_E4/recall_INC": 0.7764705882352941,
"eval_edge_macro_accuracy": 0.853,
"eval_edge_macro_balanced_accuracy": 0.8437436592360152,
"eval_edge_macro_f1_INC": 0.7859608772083757,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.5348837209302325,
"eval_overall/acc_on_INCONSISTENT": 0.9171974522292994,
"eval_overall/accuracy": 0.835,
"eval_overall/balanced_accuracy": 0.7260405865797659,
"eval_overall/f1_INC": 0.897196261682243,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.8780487804878049,
"eval_overall/recall_INC": 0.9171974522292994,
"eval_overall_exact_match": 0.47,
"eval_scene/acc_on_CONSISTENT": 0.6888888888888889,
"eval_scene/acc_on_INCONSISTENT": 0.8,
"eval_scene/accuracy": 0.725,
"eval_scene/balanced_accuracy": 0.7444444444444445,
"eval_scene/f1_INC": 0.6540880503144655,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.5531914893617021,
"eval_scene/recall_INC": 0.8,
"step": 3186
},
{
"epoch": 0.6004140786749482,
"grad_norm": 0.12375885248184204,
"learning_rate": 7.215484622101485e-05,
"loss": 0.0275,
"step": 3190
},
{
"epoch": 0.6022962544701675,
"grad_norm": 0.10502137243747711,
"learning_rate": 7.205782477927623e-05,
"loss": 0.0279,
"step": 3200
},
{
"epoch": 0.6041784302653868,
"grad_norm": 0.1351398080587387,
"learning_rate": 7.19608033375376e-05,
"loss": 0.0234,
"step": 3210
},
{
"epoch": 0.6060606060606061,
"grad_norm": 0.14613057672977448,
"learning_rate": 7.186378189579897e-05,
"loss": 0.0235,
"step": 3220
},
{
"epoch": 0.6079427818558253,
"grad_norm": 0.09466767311096191,
"learning_rate": 7.176676045406035e-05,
"loss": 0.0322,
"step": 3230
},
{
"epoch": 0.6098249576510446,
"grad_norm": 0.11353032290935516,
"learning_rate": 7.166973901232172e-05,
"loss": 0.0277,
"step": 3240
},
{
"epoch": 0.6117071334462639,
"grad_norm": 0.0853382870554924,
"learning_rate": 7.15727175705831e-05,
"loss": 0.0311,
"step": 3250
},
{
"epoch": 0.6135893092414831,
"grad_norm": 0.055036455392837524,
"learning_rate": 7.147569612884449e-05,
"loss": 0.0278,
"step": 3260
},
{
"epoch": 0.6154714850367025,
"grad_norm": 0.06104744225740433,
"learning_rate": 7.137867468710585e-05,
"loss": 0.0286,
"step": 3270
},
{
"epoch": 0.6173536608319217,
"grad_norm": 0.08071596175432205,
"learning_rate": 7.128165324536723e-05,
"loss": 0.0257,
"step": 3280
},
{
"epoch": 0.619235836627141,
"grad_norm": 0.14282366633415222,
"learning_rate": 7.118463180362861e-05,
"loss": 0.0276,
"step": 3290
},
{
"epoch": 0.6211180124223602,
"grad_norm": 0.15172088146209717,
"learning_rate": 7.108761036188998e-05,
"loss": 0.0245,
"step": 3300
},
{
"epoch": 0.6230001882175795,
"grad_norm": 0.0917058140039444,
"learning_rate": 7.099058892015136e-05,
"loss": 0.0293,
"step": 3310
},
{
"epoch": 0.6248823640127988,
"grad_norm": 0.11406487971544266,
"learning_rate": 7.089356747841273e-05,
"loss": 0.0276,
"step": 3320
},
{
"epoch": 0.626764539808018,
"grad_norm": 0.11802924424409866,
"learning_rate": 7.07965460366741e-05,
"loss": 0.0263,
"step": 3330
},
{
"epoch": 0.6286467156032374,
"grad_norm": 0.11947114020586014,
"learning_rate": 7.069952459493548e-05,
"loss": 0.0285,
"step": 3340
},
{
"epoch": 0.6305288913984566,
"grad_norm": 0.10451506078243256,
"learning_rate": 7.060250315319687e-05,
"loss": 0.0275,
"step": 3350
},
{
"epoch": 0.6324110671936759,
"grad_norm": 0.10557418316602707,
"learning_rate": 7.050548171145823e-05,
"loss": 0.0265,
"step": 3360
},
{
"epoch": 0.6342932429888951,
"grad_norm": 0.12705279886722565,
"learning_rate": 7.040846026971962e-05,
"loss": 0.0246,
"step": 3370
},
{
"epoch": 0.6361754187841144,
"grad_norm": 0.18986289203166962,
"learning_rate": 7.031143882798099e-05,
"loss": 0.0285,
"step": 3380
},
{
"epoch": 0.6380575945793338,
"grad_norm": 0.09949778020381927,
"learning_rate": 7.021441738624236e-05,
"loss": 0.0265,
"step": 3390
},
{
"epoch": 0.639939770374553,
"grad_norm": 0.07037244737148285,
"learning_rate": 7.011739594450374e-05,
"loss": 0.0249,
"step": 3400
},
{
"epoch": 0.6418219461697723,
"grad_norm": 0.10179682075977325,
"learning_rate": 7.002037450276511e-05,
"loss": 0.0303,
"step": 3410
},
{
"epoch": 0.6437041219649915,
"grad_norm": 0.08202063292264938,
"learning_rate": 6.992335306102649e-05,
"loss": 0.0262,
"step": 3420
},
{
"epoch": 0.6455862977602108,
"grad_norm": 0.1346074640750885,
"learning_rate": 6.982633161928786e-05,
"loss": 0.0218,
"step": 3430
},
{
"epoch": 0.64746847355543,
"grad_norm": 0.11997853219509125,
"learning_rate": 6.972931017754925e-05,
"loss": 0.0291,
"step": 3440
},
{
"epoch": 0.6493506493506493,
"grad_norm": 0.05166507139801979,
"learning_rate": 6.963228873581061e-05,
"loss": 0.0267,
"step": 3450
},
{
"epoch": 0.6512328251458687,
"grad_norm": 0.08481217920780182,
"learning_rate": 6.9535267294072e-05,
"loss": 0.0275,
"step": 3460
},
{
"epoch": 0.6531150009410879,
"grad_norm": 0.19386963546276093,
"learning_rate": 6.943824585233337e-05,
"loss": 0.0255,
"step": 3470
},
{
"epoch": 0.6549971767363072,
"grad_norm": 0.19028638303279877,
"learning_rate": 6.934122441059475e-05,
"loss": 0.0275,
"step": 3480
},
{
"epoch": 0.6568793525315264,
"grad_norm": 0.07005799561738968,
"learning_rate": 6.924420296885612e-05,
"loss": 0.0265,
"step": 3490
},
{
"epoch": 0.6587615283267457,
"grad_norm": 0.08579978346824646,
"learning_rate": 6.91471815271175e-05,
"loss": 0.023,
"step": 3500
},
{
"epoch": 0.6606437041219649,
"grad_norm": 0.12526081502437592,
"learning_rate": 6.905016008537887e-05,
"loss": 0.0306,
"step": 3510
},
{
"epoch": 0.6625258799171843,
"grad_norm": 0.10663193464279175,
"learning_rate": 6.895313864364024e-05,
"loss": 0.0305,
"step": 3520
},
{
"epoch": 0.6644080557124036,
"grad_norm": 0.0989537239074707,
"learning_rate": 6.885611720190163e-05,
"loss": 0.0263,
"step": 3530
},
{
"epoch": 0.6662902315076228,
"grad_norm": 0.13903282582759857,
"learning_rate": 6.875909576016299e-05,
"loss": 0.0283,
"step": 3540
},
{
"epoch": 0.6681724073028421,
"grad_norm": 0.07183618098497391,
"learning_rate": 6.866207431842438e-05,
"loss": 0.0282,
"step": 3550
},
{
"epoch": 0.6700545830980613,
"grad_norm": 0.06900515407323837,
"learning_rate": 6.856505287668576e-05,
"loss": 0.0198,
"step": 3560
},
{
"epoch": 0.6719367588932806,
"grad_norm": 0.16435284912586212,
"learning_rate": 6.846803143494712e-05,
"loss": 0.0291,
"step": 3570
},
{
"epoch": 0.6738189346885,
"grad_norm": 0.12341795861721039,
"learning_rate": 6.83710099932085e-05,
"loss": 0.0279,
"step": 3580
},
{
"epoch": 0.6757011104837192,
"grad_norm": 0.15621671080589294,
"learning_rate": 6.827398855146988e-05,
"loss": 0.0258,
"step": 3590
},
{
"epoch": 0.6775832862789385,
"grad_norm": 0.11459346860647202,
"learning_rate": 6.817696710973125e-05,
"loss": 0.0324,
"step": 3600
},
{
"epoch": 0.6794654620741577,
"grad_norm": 0.10974545776844025,
"learning_rate": 6.807994566799263e-05,
"loss": 0.0284,
"step": 3610
},
{
"epoch": 0.681347637869377,
"grad_norm": 0.07209113240242004,
"learning_rate": 6.7982924226254e-05,
"loss": 0.0263,
"step": 3620
},
{
"epoch": 0.6832298136645962,
"grad_norm": 0.12532223761081696,
"learning_rate": 6.788590278451538e-05,
"loss": 0.0298,
"step": 3630
},
{
"epoch": 0.6851119894598156,
"grad_norm": 0.14268836379051208,
"learning_rate": 6.778888134277675e-05,
"loss": 0.027,
"step": 3640
},
{
"epoch": 0.6869941652550349,
"grad_norm": 0.20249424874782562,
"learning_rate": 6.769185990103814e-05,
"loss": 0.0275,
"step": 3650
},
{
"epoch": 0.6888763410502541,
"grad_norm": 0.1736336499452591,
"learning_rate": 6.75948384592995e-05,
"loss": 0.0258,
"step": 3660
},
{
"epoch": 0.6907585168454734,
"grad_norm": 0.042560216039419174,
"learning_rate": 6.749781701756089e-05,
"loss": 0.0239,
"step": 3670
},
{
"epoch": 0.6926406926406926,
"grad_norm": 0.042638007551431656,
"learning_rate": 6.740079557582226e-05,
"loss": 0.029,
"step": 3680
},
{
"epoch": 0.6945228684359119,
"grad_norm": 0.1276584416627884,
"learning_rate": 6.730377413408363e-05,
"loss": 0.0288,
"step": 3690
},
{
"epoch": 0.6964050442311311,
"grad_norm": 0.07026208192110062,
"learning_rate": 6.720675269234501e-05,
"loss": 0.0225,
"step": 3700
},
{
"epoch": 0.6982872200263505,
"grad_norm": 0.14463388919830322,
"learning_rate": 6.710973125060638e-05,
"loss": 0.025,
"step": 3710
},
{
"epoch": 0.6996047430830039,
"eval_E1/acc_on_CONSISTENT": 0.9337748344370861,
"eval_E1/acc_on_INCONSISTENT": 0.6122448979591837,
"eval_E1/accuracy": 0.855,
"eval_E1/balanced_accuracy": 0.7730098661981348,
"eval_E1/f1_INC": 0.6741573033707865,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.75,
"eval_E1/recall_INC": 0.6122448979591837,
"eval_E2/acc_on_CONSISTENT": 0.9788732394366197,
"eval_E2/acc_on_INCONSISTENT": 0.9310344827586207,
"eval_E2/accuracy": 0.965,
"eval_E2/balanced_accuracy": 0.9549538610976203,
"eval_E2/f1_INC": 0.9391304347826087,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.9473684210526315,
"eval_E2/recall_INC": 0.9310344827586207,
"eval_E3/acc_on_CONSISTENT": 0.9769230769230769,
"eval_E3/acc_on_INCONSISTENT": 0.7857142857142857,
"eval_E3/accuracy": 0.91,
"eval_E3/balanced_accuracy": 0.8813186813186813,
"eval_E3/f1_INC": 0.859375,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 0.9482758620689655,
"eval_E3/recall_INC": 0.7857142857142857,
"eval_E4/acc_on_CONSISTENT": 0.9826086956521739,
"eval_E4/acc_on_INCONSISTENT": 0.7294117647058823,
"eval_E4/accuracy": 0.875,
"eval_E4/balanced_accuracy": 0.8560102301790281,
"eval_E4/f1_INC": 0.832214765100671,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 0.96875,
"eval_E4/recall_INC": 0.7294117647058823,
"eval_edge_macro_accuracy": 0.889,
"eval_edge_macro_balanced_accuracy": 0.8526026873028524,
"eval_edge_macro_f1_INC": 0.80764216731748,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.8837209302325582,
"eval_overall/acc_on_INCONSISTENT": 0.8598726114649682,
"eval_overall/accuracy": 0.865,
"eval_overall/balanced_accuracy": 0.8717967708487632,
"eval_overall/f1_INC": 0.9090909090909091,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.9642857142857143,
"eval_overall/recall_INC": 0.8598726114649682,
"eval_overall_exact_match": 0.61,
"eval_scene/acc_on_CONSISTENT": 0.9185185185185185,
"eval_scene/acc_on_INCONSISTENT": 0.676923076923077,
"eval_scene/accuracy": 0.84,
"eval_scene/balanced_accuracy": 0.7977207977207977,
"eval_scene/f1_INC": 0.7333333333333334,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.8,
"eval_scene/recall_INC": 0.676923076923077,
"step": 3717
},
{
"epoch": 0.7001693958215698,
"grad_norm": 0.06821384280920029,
"learning_rate": 6.701270980886777e-05,
"loss": 0.0281,
"step": 3720
},
{
"epoch": 0.702051571616789,
"grad_norm": 0.0533619187772274,
"learning_rate": 6.691568836712913e-05,
"loss": 0.0296,
"step": 3730
},
{
"epoch": 0.7039337474120083,
"grad_norm": 0.09107464551925659,
"learning_rate": 6.681866692539052e-05,
"loss": 0.0268,
"step": 3740
},
{
"epoch": 0.7058159232072275,
"grad_norm": 0.08339343965053558,
"learning_rate": 6.67216454836519e-05,
"loss": 0.0295,
"step": 3750
},
{
"epoch": 0.7076980990024468,
"grad_norm": 0.09445764124393463,
"learning_rate": 6.662462404191327e-05,
"loss": 0.026,
"step": 3760
},
{
"epoch": 0.709580274797666,
"grad_norm": 0.1917838305234909,
"learning_rate": 6.652760260017464e-05,
"loss": 0.0288,
"step": 3770
},
{
"epoch": 0.7114624505928854,
"grad_norm": 0.13823284208774567,
"learning_rate": 6.643058115843602e-05,
"loss": 0.0243,
"step": 3780
},
{
"epoch": 0.7133446263881047,
"grad_norm": 0.09427863359451294,
"learning_rate": 6.633355971669739e-05,
"loss": 0.0224,
"step": 3790
},
{
"epoch": 0.7152268021833239,
"grad_norm": 0.15948054194450378,
"learning_rate": 6.623653827495877e-05,
"loss": 0.0196,
"step": 3800
},
{
"epoch": 0.7171089779785432,
"grad_norm": 0.20518970489501953,
"learning_rate": 6.613951683322015e-05,
"loss": 0.026,
"step": 3810
},
{
"epoch": 0.7189911537737624,
"grad_norm": 0.15291956067085266,
"learning_rate": 6.604249539148151e-05,
"loss": 0.028,
"step": 3820
},
{
"epoch": 0.7208733295689818,
"grad_norm": 0.12342661619186401,
"learning_rate": 6.59454739497429e-05,
"loss": 0.0283,
"step": 3830
},
{
"epoch": 0.722755505364201,
"grad_norm": 0.07337340712547302,
"learning_rate": 6.584845250800428e-05,
"loss": 0.023,
"step": 3840
},
{
"epoch": 0.7246376811594203,
"grad_norm": 0.12145810574293137,
"learning_rate": 6.575143106626565e-05,
"loss": 0.0302,
"step": 3850
},
{
"epoch": 0.7265198569546396,
"grad_norm": 0.10396488010883331,
"learning_rate": 6.565440962452703e-05,
"loss": 0.026,
"step": 3860
},
{
"epoch": 0.7284020327498588,
"grad_norm": 0.08993718773126602,
"learning_rate": 6.55573881827884e-05,
"loss": 0.0281,
"step": 3870
},
{
"epoch": 0.7302842085450781,
"grad_norm": 0.09292326867580414,
"learning_rate": 6.546036674104977e-05,
"loss": 0.0281,
"step": 3880
},
{
"epoch": 0.7321663843402973,
"grad_norm": 0.1312495619058609,
"learning_rate": 6.536334529931115e-05,
"loss": 0.0248,
"step": 3890
},
{
"epoch": 0.7340485601355167,
"grad_norm": 0.09885958582162857,
"learning_rate": 6.526632385757254e-05,
"loss": 0.0227,
"step": 3900
},
{
"epoch": 0.7359307359307359,
"grad_norm": 0.05759183689951897,
"learning_rate": 6.51693024158339e-05,
"loss": 0.0316,
"step": 3910
},
{
"epoch": 0.7378129117259552,
"grad_norm": 0.1465388834476471,
"learning_rate": 6.507228097409528e-05,
"loss": 0.0239,
"step": 3920
},
{
"epoch": 0.7396950875211745,
"grad_norm": 0.13463398814201355,
"learning_rate": 6.497525953235666e-05,
"loss": 0.0243,
"step": 3930
},
{
"epoch": 0.7415772633163937,
"grad_norm": 0.10613127052783966,
"learning_rate": 6.487823809061803e-05,
"loss": 0.0225,
"step": 3940
},
{
"epoch": 0.743459439111613,
"grad_norm": 0.07204587757587433,
"learning_rate": 6.478121664887941e-05,
"loss": 0.0284,
"step": 3950
},
{
"epoch": 0.7453416149068323,
"grad_norm": 0.09663920104503632,
"learning_rate": 6.468419520714078e-05,
"loss": 0.0241,
"step": 3960
},
{
"epoch": 0.7472237907020516,
"grad_norm": 0.13608111441135406,
"learning_rate": 6.458717376540216e-05,
"loss": 0.0237,
"step": 3970
},
{
"epoch": 0.7491059664972708,
"grad_norm": 0.07337552309036255,
"learning_rate": 6.449015232366353e-05,
"loss": 0.0222,
"step": 3980
},
{
"epoch": 0.7509881422924901,
"grad_norm": 0.14900878071784973,
"learning_rate": 6.439313088192492e-05,
"loss": 0.0286,
"step": 3990
},
{
"epoch": 0.7528703180877094,
"grad_norm": 0.07007355242967606,
"learning_rate": 6.429610944018628e-05,
"loss": 0.028,
"step": 4000
},
{
"epoch": 0.7547524938829286,
"grad_norm": 0.15586300194263458,
"learning_rate": 6.419908799844765e-05,
"loss": 0.0267,
"step": 4010
},
{
"epoch": 0.756634669678148,
"grad_norm": 0.1284913569688797,
"learning_rate": 6.410206655670904e-05,
"loss": 0.0228,
"step": 4020
},
{
"epoch": 0.7585168454733672,
"grad_norm": 0.1646757572889328,
"learning_rate": 6.40050451149704e-05,
"loss": 0.0262,
"step": 4030
},
{
"epoch": 0.7603990212685865,
"grad_norm": 0.09742174297571182,
"learning_rate": 6.390802367323179e-05,
"loss": 0.029,
"step": 4040
},
{
"epoch": 0.7622811970638057,
"grad_norm": 0.07278095930814743,
"learning_rate": 6.381100223149316e-05,
"loss": 0.0263,
"step": 4050
},
{
"epoch": 0.764163372859025,
"grad_norm": 0.10488718748092651,
"learning_rate": 6.371398078975454e-05,
"loss": 0.0217,
"step": 4060
},
{
"epoch": 0.7660455486542443,
"grad_norm": 0.21971240639686584,
"learning_rate": 6.361695934801591e-05,
"loss": 0.0286,
"step": 4070
},
{
"epoch": 0.7679277244494636,
"grad_norm": 0.08719635754823685,
"learning_rate": 6.351993790627729e-05,
"loss": 0.0265,
"step": 4080
},
{
"epoch": 0.7698099002446829,
"grad_norm": 0.09772541373968124,
"learning_rate": 6.342291646453866e-05,
"loss": 0.0197,
"step": 4090
},
{
"epoch": 0.7716920760399021,
"grad_norm": 0.07383599132299423,
"learning_rate": 6.332589502280004e-05,
"loss": 0.0287,
"step": 4100
},
{
"epoch": 0.7735742518351214,
"grad_norm": 0.09341705590486526,
"learning_rate": 6.322887358106142e-05,
"loss": 0.0203,
"step": 4110
},
{
"epoch": 0.7754564276303407,
"grad_norm": 0.19727744162082672,
"learning_rate": 6.313185213932278e-05,
"loss": 0.0233,
"step": 4120
},
{
"epoch": 0.7773386034255599,
"grad_norm": 0.11619048565626144,
"learning_rate": 6.303483069758417e-05,
"loss": 0.0218,
"step": 4130
},
{
"epoch": 0.7792207792207793,
"grad_norm": 0.25396350026130676,
"learning_rate": 6.293780925584555e-05,
"loss": 0.022,
"step": 4140
},
{
"epoch": 0.7811029550159985,
"grad_norm": 0.14137905836105347,
"learning_rate": 6.284078781410692e-05,
"loss": 0.0215,
"step": 4150
},
{
"epoch": 0.7829851308112178,
"grad_norm": 0.053330399096012115,
"learning_rate": 6.27437663723683e-05,
"loss": 0.0236,
"step": 4160
},
{
"epoch": 0.784867306606437,
"grad_norm": 0.08605629950761795,
"learning_rate": 6.264674493062967e-05,
"loss": 0.0235,
"step": 4170
},
{
"epoch": 0.7867494824016563,
"grad_norm": 0.16659440100193024,
"learning_rate": 6.254972348889104e-05,
"loss": 0.0253,
"step": 4180
},
{
"epoch": 0.7886316581968756,
"grad_norm": 0.09707406908273697,
"learning_rate": 6.245270204715242e-05,
"loss": 0.0259,
"step": 4190
},
{
"epoch": 0.7905138339920948,
"grad_norm": 0.07335163652896881,
"learning_rate": 6.23556806054138e-05,
"loss": 0.0254,
"step": 4200
},
{
"epoch": 0.7923960097873142,
"grad_norm": 0.07250624150037766,
"learning_rate": 6.225865916367517e-05,
"loss": 0.0297,
"step": 4210
},
{
"epoch": 0.7942781855825334,
"grad_norm": 0.13132064044475555,
"learning_rate": 6.216163772193655e-05,
"loss": 0.0284,
"step": 4220
},
{
"epoch": 0.7961603613777527,
"grad_norm": 0.16921114921569824,
"learning_rate": 6.206461628019793e-05,
"loss": 0.0303,
"step": 4230
},
{
"epoch": 0.7980425371729719,
"grad_norm": 0.09276404231786728,
"learning_rate": 6.19675948384593e-05,
"loss": 0.0234,
"step": 4240
},
{
"epoch": 0.7995482778091474,
"eval_E1/acc_on_CONSISTENT": 0.7880794701986755,
"eval_E1/acc_on_INCONSISTENT": 0.6938775510204082,
"eval_E1/accuracy": 0.765,
"eval_E1/balanced_accuracy": 0.7409785106095419,
"eval_E1/f1_INC": 0.5913043478260871,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.5151515151515151,
"eval_E1/recall_INC": 0.6938775510204082,
"eval_E2/acc_on_CONSISTENT": 0.9859154929577465,
"eval_E2/acc_on_INCONSISTENT": 0.9655172413793104,
"eval_E2/accuracy": 0.98,
"eval_E2/balanced_accuracy": 0.9757163671685285,
"eval_E2/f1_INC": 0.9655172413793104,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.9655172413793104,
"eval_E2/recall_INC": 0.9655172413793104,
"eval_E3/acc_on_CONSISTENT": 0.9461538461538461,
"eval_E3/acc_on_INCONSISTENT": 0.8,
"eval_E3/accuracy": 0.895,
"eval_E3/balanced_accuracy": 0.8730769230769231,
"eval_E3/f1_INC": 0.8421052631578948,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 0.8888888888888888,
"eval_E3/recall_INC": 0.8,
"eval_E4/acc_on_CONSISTENT": 0.9304347826086956,
"eval_E4/acc_on_INCONSISTENT": 0.8117647058823529,
"eval_E4/accuracy": 0.88,
"eval_E4/balanced_accuracy": 0.8710997442455243,
"eval_E4/f1_INC": 0.8518518518518517,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 0.8961038961038961,
"eval_E4/recall_INC": 0.8117647058823529,
"eval_edge_macro_accuracy": 0.866,
"eval_edge_macro_balanced_accuracy": 0.8560489528947475,
"eval_edge_macro_f1_INC": 0.7988043894916774,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.6511627906976745,
"eval_overall/acc_on_INCONSISTENT": 0.9426751592356688,
"eval_overall/accuracy": 0.88,
"eval_overall/balanced_accuracy": 0.7969189749666716,
"eval_overall/f1_INC": 0.925,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.9079754601226994,
"eval_overall/recall_INC": 0.9426751592356688,
"eval_overall_exact_match": 0.515,
"eval_scene/acc_on_CONSISTENT": 0.7925925925925926,
"eval_scene/acc_on_INCONSISTENT": 0.8461538461538461,
"eval_scene/accuracy": 0.81,
"eval_scene/balanced_accuracy": 0.8193732193732194,
"eval_scene/f1_INC": 0.7432432432432433,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.6626506024096386,
"eval_scene/recall_INC": 0.8461538461538461,
"step": 4248
},
{
"epoch": 0.7999247129681912,
"grad_norm": 0.07519380003213882,
"learning_rate": 6.187057339672068e-05,
"loss": 0.0227,
"step": 4250
},
{
"epoch": 0.8018068887634106,
"grad_norm": 0.15206333994865417,
"learning_rate": 6.177355195498205e-05,
"loss": 0.0263,
"step": 4260
},
{
"epoch": 0.8036890645586298,
"grad_norm": 0.09467748552560806,
"learning_rate": 6.167653051324343e-05,
"loss": 0.0215,
"step": 4270
},
{
"epoch": 0.8055712403538491,
"grad_norm": 0.09524611383676529,
"learning_rate": 6.15795090715048e-05,
"loss": 0.0253,
"step": 4280
},
{
"epoch": 0.8074534161490683,
"grad_norm": 0.09639701247215271,
"learning_rate": 6.148248762976619e-05,
"loss": 0.0273,
"step": 4290
},
{
"epoch": 0.8093355919442876,
"grad_norm": 0.14750158786773682,
"learning_rate": 6.138546618802755e-05,
"loss": 0.0247,
"step": 4300
},
{
"epoch": 0.8112177677395068,
"grad_norm": 0.15283837914466858,
"learning_rate": 6.128844474628894e-05,
"loss": 0.0255,
"step": 4310
},
{
"epoch": 0.8130999435347261,
"grad_norm": 0.1801212579011917,
"learning_rate": 6.119142330455031e-05,
"loss": 0.0236,
"step": 4320
},
{
"epoch": 0.8149821193299455,
"grad_norm": 0.18473784625530243,
"learning_rate": 6.109440186281169e-05,
"loss": 0.0321,
"step": 4330
},
{
"epoch": 0.8168642951251647,
"grad_norm": 0.13694533705711365,
"learning_rate": 6.099738042107306e-05,
"loss": 0.0231,
"step": 4340
},
{
"epoch": 0.818746470920384,
"grad_norm": 0.08112656325101852,
"learning_rate": 6.090035897933444e-05,
"loss": 0.0259,
"step": 4350
},
{
"epoch": 0.8206286467156032,
"grad_norm": 0.07673269510269165,
"learning_rate": 6.0803337537595815e-05,
"loss": 0.027,
"step": 4360
},
{
"epoch": 0.8225108225108225,
"grad_norm": 0.13535504043102264,
"learning_rate": 6.070631609585718e-05,
"loss": 0.0285,
"step": 4370
},
{
"epoch": 0.8243929983060417,
"grad_norm": 0.08035381883382797,
"learning_rate": 6.0609294654118564e-05,
"loss": 0.0263,
"step": 4380
},
{
"epoch": 0.8262751741012611,
"grad_norm": 0.142923042178154,
"learning_rate": 6.0512273212379945e-05,
"loss": 0.0228,
"step": 4390
},
{
"epoch": 0.8281573498964804,
"grad_norm": 0.19256168603897095,
"learning_rate": 6.041525177064131e-05,
"loss": 0.0215,
"step": 4400
},
{
"epoch": 0.8300395256916996,
"grad_norm": 0.08662780374288559,
"learning_rate": 6.0318230328902694e-05,
"loss": 0.0281,
"step": 4410
},
{
"epoch": 0.8319217014869189,
"grad_norm": 0.11855155229568481,
"learning_rate": 6.022120888716407e-05,
"loss": 0.0238,
"step": 4420
},
{
"epoch": 0.8338038772821381,
"grad_norm": 0.0649333968758583,
"learning_rate": 6.012418744542544e-05,
"loss": 0.0308,
"step": 4430
},
{
"epoch": 0.8356860530773574,
"grad_norm": 0.13388758897781372,
"learning_rate": 6.0027166003686816e-05,
"loss": 0.0285,
"step": 4440
},
{
"epoch": 0.8375682288725766,
"grad_norm": 0.1069571003317833,
"learning_rate": 5.99301445619482e-05,
"loss": 0.0215,
"step": 4450
},
{
"epoch": 0.839450404667796,
"grad_norm": 0.07490979135036469,
"learning_rate": 5.9833123120209565e-05,
"loss": 0.0266,
"step": 4460
},
{
"epoch": 0.8413325804630153,
"grad_norm": 0.11468319594860077,
"learning_rate": 5.9736101678470946e-05,
"loss": 0.0284,
"step": 4470
},
{
"epoch": 0.8432147562582345,
"grad_norm": 0.1102227121591568,
"learning_rate": 5.963908023673233e-05,
"loss": 0.0273,
"step": 4480
},
{
"epoch": 0.8450969320534538,
"grad_norm": 0.08790767937898636,
"learning_rate": 5.9542058794993695e-05,
"loss": 0.0226,
"step": 4490
},
{
"epoch": 0.846979107848673,
"grad_norm": 0.07965442538261414,
"learning_rate": 5.9445037353255076e-05,
"loss": 0.0164,
"step": 4500
},
{
"epoch": 0.8488612836438924,
"grad_norm": 0.12062489241361618,
"learning_rate": 5.934801591151645e-05,
"loss": 0.0271,
"step": 4510
},
{
"epoch": 0.8507434594391116,
"grad_norm": 0.12974771857261658,
"learning_rate": 5.925099446977782e-05,
"loss": 0.0253,
"step": 4520
},
{
"epoch": 0.8526256352343309,
"grad_norm": 0.15159684419631958,
"learning_rate": 5.91539730280392e-05,
"loss": 0.0277,
"step": 4530
},
{
"epoch": 0.8545078110295502,
"grad_norm": 0.10359372198581696,
"learning_rate": 5.905695158630058e-05,
"loss": 0.0278,
"step": 4540
},
{
"epoch": 0.8563899868247694,
"grad_norm": 0.11358320713043213,
"learning_rate": 5.895993014456195e-05,
"loss": 0.0232,
"step": 4550
},
{
"epoch": 0.8582721626199887,
"grad_norm": 0.0856373980641365,
"learning_rate": 5.886290870282333e-05,
"loss": 0.0305,
"step": 4560
},
{
"epoch": 0.8601543384152079,
"grad_norm": 0.08378347009420395,
"learning_rate": 5.876588726108471e-05,
"loss": 0.0199,
"step": 4570
},
{
"epoch": 0.8620365142104273,
"grad_norm": 0.13333091139793396,
"learning_rate": 5.866886581934608e-05,
"loss": 0.0247,
"step": 4580
},
{
"epoch": 0.8639186900056465,
"grad_norm": 0.15513169765472412,
"learning_rate": 5.857184437760745e-05,
"loss": 0.0206,
"step": 4590
},
{
"epoch": 0.8658008658008658,
"grad_norm": 0.12354400008916855,
"learning_rate": 5.847482293586883e-05,
"loss": 0.0222,
"step": 4600
},
{
"epoch": 0.8676830415960851,
"grad_norm": 0.1295776218175888,
"learning_rate": 5.83778014941302e-05,
"loss": 0.0239,
"step": 4610
},
{
"epoch": 0.8695652173913043,
"grad_norm": 0.15621507167816162,
"learning_rate": 5.828078005239158e-05,
"loss": 0.0277,
"step": 4620
},
{
"epoch": 0.8714473931865236,
"grad_norm": 0.17905867099761963,
"learning_rate": 5.818375861065296e-05,
"loss": 0.0225,
"step": 4630
},
{
"epoch": 0.8733295689817429,
"grad_norm": 0.1387549340724945,
"learning_rate": 5.808673716891433e-05,
"loss": 0.0258,
"step": 4640
},
{
"epoch": 0.8752117447769622,
"grad_norm": 0.12285871803760529,
"learning_rate": 5.798971572717571e-05,
"loss": 0.0249,
"step": 4650
},
{
"epoch": 0.8770939205721815,
"grad_norm": 0.119094617664814,
"learning_rate": 5.7892694285437085e-05,
"loss": 0.0302,
"step": 4660
},
{
"epoch": 0.8789760963674007,
"grad_norm": 0.08970344066619873,
"learning_rate": 5.779567284369846e-05,
"loss": 0.0205,
"step": 4670
},
{
"epoch": 0.88085827216262,
"grad_norm": 0.1598692238330841,
"learning_rate": 5.7698651401959834e-05,
"loss": 0.0218,
"step": 4680
},
{
"epoch": 0.8827404479578392,
"grad_norm": 0.24901559948921204,
"learning_rate": 5.7601629960221215e-05,
"loss": 0.0214,
"step": 4690
},
{
"epoch": 0.8846226237530586,
"grad_norm": 0.22025392949581146,
"learning_rate": 5.750460851848258e-05,
"loss": 0.0207,
"step": 4700
},
{
"epoch": 0.8865047995482778,
"grad_norm": 0.11392150819301605,
"learning_rate": 5.7407587076743963e-05,
"loss": 0.0235,
"step": 4710
},
{
"epoch": 0.8883869753434971,
"grad_norm": 0.07520972937345505,
"learning_rate": 5.7310565635005345e-05,
"loss": 0.0212,
"step": 4720
},
{
"epoch": 0.8902691511387164,
"grad_norm": 0.13182830810546875,
"learning_rate": 5.721354419326671e-05,
"loss": 0.02,
"step": 4730
},
{
"epoch": 0.8921513269339356,
"grad_norm": 0.1381557583808899,
"learning_rate": 5.711652275152809e-05,
"loss": 0.0277,
"step": 4740
},
{
"epoch": 0.8940335027291549,
"grad_norm": 0.12975607812404633,
"learning_rate": 5.701950130978947e-05,
"loss": 0.0256,
"step": 4750
},
{
"epoch": 0.8959156785243741,
"grad_norm": 0.17318369448184967,
"learning_rate": 5.6922479868050835e-05,
"loss": 0.0247,
"step": 4760
},
{
"epoch": 0.8977978543195935,
"grad_norm": 0.126237154006958,
"learning_rate": 5.6825458426312216e-05,
"loss": 0.0234,
"step": 4770
},
{
"epoch": 0.8994918125352908,
"eval_E1/acc_on_CONSISTENT": 0.8675496688741722,
"eval_E1/acc_on_INCONSISTENT": 0.5714285714285714,
"eval_E1/accuracy": 0.795,
"eval_E1/balanced_accuracy": 0.7194891201513718,
"eval_E1/f1_INC": 0.577319587628866,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.5833333333333334,
"eval_E1/recall_INC": 0.5714285714285714,
"eval_E2/acc_on_CONSISTENT": 0.9929577464788732,
"eval_E2/acc_on_INCONSISTENT": 0.9482758620689655,
"eval_E2/accuracy": 0.98,
"eval_E2/balanced_accuracy": 0.9706168042739194,
"eval_E2/f1_INC": 0.9649122807017544,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.9821428571428571,
"eval_E2/recall_INC": 0.9482758620689655,
"eval_E3/acc_on_CONSISTENT": 0.9846153846153847,
"eval_E3/acc_on_INCONSISTENT": 0.7857142857142857,
"eval_E3/accuracy": 0.915,
"eval_E3/balanced_accuracy": 0.8851648351648351,
"eval_E3/f1_INC": 0.8661417322834646,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 0.9649122807017544,
"eval_E3/recall_INC": 0.7857142857142857,
"eval_E4/acc_on_CONSISTENT": 0.9652173913043478,
"eval_E4/acc_on_INCONSISTENT": 0.7647058823529411,
"eval_E4/accuracy": 0.88,
"eval_E4/balanced_accuracy": 0.8649616368286445,
"eval_E4/f1_INC": 0.8441558441558441,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 0.9420289855072463,
"eval_E4/recall_INC": 0.7647058823529411,
"eval_edge_macro_accuracy": 0.881,
"eval_edge_macro_balanced_accuracy": 0.8508385020757769,
"eval_edge_macro_f1_INC": 0.8001242095646729,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.813953488372093,
"eval_overall/acc_on_INCONSISTENT": 0.9044585987261147,
"eval_overall/accuracy": 0.885,
"eval_overall/balanced_accuracy": 0.8592060435491038,
"eval_overall/f1_INC": 0.9250814332247558,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.9466666666666667,
"eval_overall/recall_INC": 0.9044585987261147,
"eval_overall_exact_match": 0.58,
"eval_scene/acc_on_CONSISTENT": 0.8740740740740741,
"eval_scene/acc_on_INCONSISTENT": 0.7538461538461538,
"eval_scene/accuracy": 0.835,
"eval_scene/balanced_accuracy": 0.813960113960114,
"eval_scene/f1_INC": 0.7480916030534351,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.7424242424242424,
"eval_scene/recall_INC": 0.7538461538461538,
"step": 4779
},
{
"epoch": 0.8996800301148127,
"grad_norm": 0.1269172877073288,
"learning_rate": 5.67284369845736e-05,
"loss": 0.0252,
"step": 4780
},
{
"epoch": 0.901562205910032,
"grad_norm": 0.10349240154027939,
"learning_rate": 5.6631415542834965e-05,
"loss": 0.022,
"step": 4790
},
{
"epoch": 0.9034443817052513,
"grad_norm": 0.24686415493488312,
"learning_rate": 5.6534394101096346e-05,
"loss": 0.0265,
"step": 4800
},
{
"epoch": 0.9053265575004705,
"grad_norm": 0.11216803640127182,
"learning_rate": 5.643737265935772e-05,
"loss": 0.0216,
"step": 4810
},
{
"epoch": 0.9072087332956899,
"grad_norm": 0.14201720058918,
"learning_rate": 5.6340351217619094e-05,
"loss": 0.0283,
"step": 4820
},
{
"epoch": 0.9090909090909091,
"grad_norm": 0.07003463804721832,
"learning_rate": 5.624332977588047e-05,
"loss": 0.0254,
"step": 4830
},
{
"epoch": 0.9109730848861284,
"grad_norm": 0.10892708599567413,
"learning_rate": 5.614630833414185e-05,
"loss": 0.0273,
"step": 4840
},
{
"epoch": 0.9128552606813476,
"grad_norm": 0.06218297407031059,
"learning_rate": 5.604928689240322e-05,
"loss": 0.0258,
"step": 4850
},
{
"epoch": 0.9147374364765669,
"grad_norm": 0.10862410068511963,
"learning_rate": 5.59522654506646e-05,
"loss": 0.0206,
"step": 4860
},
{
"epoch": 0.9166196122717862,
"grad_norm": 0.07507742196321487,
"learning_rate": 5.585524400892598e-05,
"loss": 0.0262,
"step": 4870
},
{
"epoch": 0.9185017880670054,
"grad_norm": 0.10350686311721802,
"learning_rate": 5.575822256718735e-05,
"loss": 0.025,
"step": 4880
},
{
"epoch": 0.9203839638622248,
"grad_norm": 0.16628728806972504,
"learning_rate": 5.566120112544873e-05,
"loss": 0.0284,
"step": 4890
},
{
"epoch": 0.922266139657444,
"grad_norm": 0.045880332589149475,
"learning_rate": 5.55641796837101e-05,
"loss": 0.0235,
"step": 4900
},
{
"epoch": 0.9241483154526633,
"grad_norm": 0.17356722056865692,
"learning_rate": 5.546715824197147e-05,
"loss": 0.026,
"step": 4910
},
{
"epoch": 0.9260304912478825,
"grad_norm": 0.11924988031387329,
"learning_rate": 5.537013680023285e-05,
"loss": 0.0217,
"step": 4920
},
{
"epoch": 0.9279126670431018,
"grad_norm": 0.08413538336753845,
"learning_rate": 5.527311535849423e-05,
"loss": 0.0249,
"step": 4930
},
{
"epoch": 0.9297948428383211,
"grad_norm": 0.09474111348390579,
"learning_rate": 5.51760939167556e-05,
"loss": 0.0229,
"step": 4940
},
{
"epoch": 0.9316770186335404,
"grad_norm": 0.07419522106647491,
"learning_rate": 5.507907247501698e-05,
"loss": 0.022,
"step": 4950
},
{
"epoch": 0.9335591944287597,
"grad_norm": 0.09347780793905258,
"learning_rate": 5.498205103327836e-05,
"loss": 0.0252,
"step": 4960
},
{
"epoch": 0.9354413702239789,
"grad_norm": 0.053250234574079514,
"learning_rate": 5.4885029591539736e-05,
"loss": 0.0249,
"step": 4970
},
{
"epoch": 0.9373235460191982,
"grad_norm": 0.09263543039560318,
"learning_rate": 5.4788008149801104e-05,
"loss": 0.0189,
"step": 4980
},
{
"epoch": 0.9392057218144174,
"grad_norm": 0.12147948890924454,
"learning_rate": 5.4690986708062485e-05,
"loss": 0.0218,
"step": 4990
},
{
"epoch": 0.9410878976096367,
"grad_norm": 0.12498101592063904,
"learning_rate": 5.4593965266323866e-05,
"loss": 0.0206,
"step": 5000
},
{
"epoch": 0.9429700734048561,
"grad_norm": 0.1211477741599083,
"learning_rate": 5.449694382458523e-05,
"loss": 0.0262,
"step": 5010
},
{
"epoch": 0.9448522492000753,
"grad_norm": 0.10046116262674332,
"learning_rate": 5.4399922382846614e-05,
"loss": 0.0167,
"step": 5020
},
{
"epoch": 0.9467344249952946,
"grad_norm": 0.10313168913125992,
"learning_rate": 5.4302900941107996e-05,
"loss": 0.0263,
"step": 5030
},
{
"epoch": 0.9486166007905138,
"grad_norm": 0.07489953190088272,
"learning_rate": 5.420587949936936e-05,
"loss": 0.0233,
"step": 5040
},
{
"epoch": 0.9504987765857331,
"grad_norm": 0.09977987408638,
"learning_rate": 5.410885805763074e-05,
"loss": 0.0229,
"step": 5050
},
{
"epoch": 0.9523809523809523,
"grad_norm": 0.09566326439380646,
"learning_rate": 5.401183661589212e-05,
"loss": 0.0249,
"step": 5060
},
{
"epoch": 0.9542631281761716,
"grad_norm": 0.11907912790775299,
"learning_rate": 5.3914815174153486e-05,
"loss": 0.0256,
"step": 5070
},
{
"epoch": 0.956145303971391,
"grad_norm": 0.10536547005176544,
"learning_rate": 5.381779373241487e-05,
"loss": 0.0236,
"step": 5080
},
{
"epoch": 0.9580274797666102,
"grad_norm": 0.07869280129671097,
"learning_rate": 5.372077229067625e-05,
"loss": 0.0194,
"step": 5090
},
{
"epoch": 0.9599096555618295,
"grad_norm": 0.12649060785770416,
"learning_rate": 5.3623750848937616e-05,
"loss": 0.0248,
"step": 5100
},
{
"epoch": 0.9617918313570487,
"grad_norm": 0.07347354292869568,
"learning_rate": 5.3526729407199e-05,
"loss": 0.0276,
"step": 5110
},
{
"epoch": 0.963674007152268,
"grad_norm": 0.1066274419426918,
"learning_rate": 5.342970796546037e-05,
"loss": 0.0224,
"step": 5120
},
{
"epoch": 0.9655561829474872,
"grad_norm": 0.10295616090297699,
"learning_rate": 5.3332686523721745e-05,
"loss": 0.0293,
"step": 5130
},
{
"epoch": 0.9674383587427066,
"grad_norm": 0.07118721306324005,
"learning_rate": 5.323566508198312e-05,
"loss": 0.0278,
"step": 5140
},
{
"epoch": 0.9693205345379259,
"grad_norm": 0.11095461249351501,
"learning_rate": 5.31386436402445e-05,
"loss": 0.0259,
"step": 5150
},
{
"epoch": 0.9712027103331451,
"grad_norm": 0.11480211466550827,
"learning_rate": 5.304162219850587e-05,
"loss": 0.0213,
"step": 5160
},
{
"epoch": 0.9730848861283644,
"grad_norm": 0.13368651270866394,
"learning_rate": 5.294460075676725e-05,
"loss": 0.0219,
"step": 5170
},
{
"epoch": 0.9749670619235836,
"grad_norm": 0.10452937334775925,
"learning_rate": 5.284757931502863e-05,
"loss": 0.024,
"step": 5180
},
{
"epoch": 0.9768492377188029,
"grad_norm": 0.0894588828086853,
"learning_rate": 5.275055787329e-05,
"loss": 0.026,
"step": 5190
},
{
"epoch": 0.9787314135140223,
"grad_norm": 0.0918290838599205,
"learning_rate": 5.265353643155137e-05,
"loss": 0.0205,
"step": 5200
},
{
"epoch": 0.9806135893092415,
"grad_norm": 0.15705926716327667,
"learning_rate": 5.2556514989812753e-05,
"loss": 0.0279,
"step": 5210
},
{
"epoch": 0.9824957651044608,
"grad_norm": 0.07733868807554245,
"learning_rate": 5.245949354807412e-05,
"loss": 0.0258,
"step": 5220
},
{
"epoch": 0.98437794089968,
"grad_norm": 0.11112848669290543,
"learning_rate": 5.23624721063355e-05,
"loss": 0.0228,
"step": 5230
},
{
"epoch": 0.9862601166948993,
"grad_norm": 0.12285085022449493,
"learning_rate": 5.226545066459688e-05,
"loss": 0.025,
"step": 5240
},
{
"epoch": 0.9881422924901185,
"grad_norm": 0.13352616131305695,
"learning_rate": 5.216842922285825e-05,
"loss": 0.0248,
"step": 5250
},
{
"epoch": 0.9900244682853379,
"grad_norm": 0.09676120430231094,
"learning_rate": 5.207140778111963e-05,
"loss": 0.0227,
"step": 5260
},
{
"epoch": 0.9919066440805572,
"grad_norm": 0.08933494240045547,
"learning_rate": 5.1974386339381006e-05,
"loss": 0.0216,
"step": 5270
},
{
"epoch": 0.9937888198757764,
"grad_norm": 0.15473978221416473,
"learning_rate": 5.187736489764238e-05,
"loss": 0.0187,
"step": 5280
},
{
"epoch": 0.9956709956709957,
"grad_norm": 0.13211970031261444,
"learning_rate": 5.1780343455903755e-05,
"loss": 0.0203,
"step": 5290
},
{
"epoch": 0.9975531714662149,
"grad_norm": 0.14397864043712616,
"learning_rate": 5.1683322014165136e-05,
"loss": 0.0209,
"step": 5300
},
{
"epoch": 0.9994353472614342,
"grad_norm": 0.08155430108308792,
"learning_rate": 5.15863005724265e-05,
"loss": 0.0247,
"step": 5310
},
{
"epoch": 0.9994353472614342,
"eval_E1/acc_on_CONSISTENT": 0.7682119205298014,
"eval_E1/acc_on_INCONSISTENT": 0.7551020408163265,
"eval_E1/accuracy": 0.765,
"eval_E1/balanced_accuracy": 0.761656980673064,
"eval_E1/f1_INC": 0.6115702479338843,
"eval_E1/n": 200.0,
"eval_E1/precision_INC": 0.5138888888888888,
"eval_E1/recall_INC": 0.7551020408163265,
"eval_E2/acc_on_CONSISTENT": 0.9859154929577465,
"eval_E2/acc_on_INCONSISTENT": 0.9482758620689655,
"eval_E2/accuracy": 0.975,
"eval_E2/balanced_accuracy": 0.967095677513356,
"eval_E2/f1_INC": 0.9565217391304347,
"eval_E2/n": 200.0,
"eval_E2/precision_INC": 0.9649122807017544,
"eval_E2/recall_INC": 0.9482758620689655,
"eval_E3/acc_on_CONSISTENT": 0.9769230769230769,
"eval_E3/acc_on_INCONSISTENT": 0.7857142857142857,
"eval_E3/accuracy": 0.91,
"eval_E3/balanced_accuracy": 0.8813186813186813,
"eval_E3/f1_INC": 0.859375,
"eval_E3/n": 200.0,
"eval_E3/precision_INC": 0.9482758620689655,
"eval_E3/recall_INC": 0.7857142857142857,
"eval_E4/acc_on_CONSISTENT": 0.9478260869565217,
"eval_E4/acc_on_INCONSISTENT": 0.8117647058823529,
"eval_E4/accuracy": 0.89,
"eval_E4/balanced_accuracy": 0.8797953964194374,
"eval_E4/f1_INC": 0.8625,
"eval_E4/n": 200.0,
"eval_E4/precision_INC": 0.92,
"eval_E4/recall_INC": 0.8117647058823529,
"eval_edge_macro_accuracy": 0.865,
"eval_edge_macro_balanced_accuracy": 0.8541556833672439,
"eval_edge_macro_f1_INC": 0.7978535372730037,
"eval_malformed_rate": 0.0,
"eval_n_eval": 1000.0,
"eval_overall/acc_on_CONSISTENT": 0.6744186046511628,
"eval_overall/acc_on_INCONSISTENT": 0.9426751592356688,
"eval_overall/accuracy": 0.885,
"eval_overall/balanced_accuracy": 0.8085468819434158,
"eval_overall/f1_INC": 0.9278996865203761,
"eval_overall/n": 200.0,
"eval_overall/n_complete_groups": 200.0,
"eval_overall/precision_INC": 0.9135802469135802,
"eval_overall/recall_INC": 0.9426751592356688,
"eval_overall_exact_match": 0.53,
"eval_scene/acc_on_CONSISTENT": 0.7925925925925926,
"eval_scene/acc_on_INCONSISTENT": 0.7692307692307693,
"eval_scene/accuracy": 0.785,
"eval_scene/balanced_accuracy": 0.780911680911681,
"eval_scene/f1_INC": 0.6993006993006994,
"eval_scene/n": 200.0,
"eval_scene/precision_INC": 0.6410256410256411,
"eval_scene/recall_INC": 0.7692307692307693,
"step": 5310
}
],
"logging_steps": 10,
"max_steps": 10626,
"num_input_tokens_seen": 0,
"num_train_epochs": 2,
"save_steps": 2656,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 5.316422271085052e+18,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}