{ "best_metric": 0.9899, "best_model_checkpoint": "./checkpoints/unconditional/bartforcausallm-geom-aug5-angles-0306/checkpoint-165000", "epoch": 3.11661818593933, "eval_steps": 2500, "global_step": 165000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.888859506629897e-05, "grad_norm": 7.574718952178955, "learning_rate": 9.444297533149486e-10, "loss": 6.3416, "step": 1 }, { "epoch": 0.0009444297533149484, "grad_norm": 7.561321258544922, "learning_rate": 4.7221487665747425e-08, "loss": 6.3395, "step": 50 }, { "epoch": 0.0018888595066298968, "grad_norm": 7.6944804191589355, "learning_rate": 9.444297533149485e-08, "loss": 6.3324, "step": 100 }, { "epoch": 0.0028332892599448453, "grad_norm": 7.842940807342529, "learning_rate": 1.4166446299724227e-07, "loss": 6.3169, "step": 150 }, { "epoch": 0.0037777190132597936, "grad_norm": 8.135217666625977, "learning_rate": 1.888859506629897e-07, "loss": 6.2933, "step": 200 }, { "epoch": 0.004722148766574742, "grad_norm": 8.708903312683105, "learning_rate": 2.361074383287371e-07, "loss": 6.2595, "step": 250 }, { "epoch": 0.0056665785198896906, "grad_norm": 9.507205963134766, "learning_rate": 2.8332892599448455e-07, "loss": 6.2152, "step": 300 }, { "epoch": 0.006611008273204639, "grad_norm": 10.765588760375977, "learning_rate": 3.30550413660232e-07, "loss": 6.1584, "step": 350 }, { "epoch": 0.007555438026519587, "grad_norm": 12.292579650878906, "learning_rate": 3.777719013259794e-07, "loss": 6.0875, "step": 400 }, { "epoch": 0.008499867779834537, "grad_norm": 14.01995849609375, "learning_rate": 4.249933889917269e-07, "loss": 6.0028, "step": 450 }, { "epoch": 0.009444297533149484, "grad_norm": 15.684309959411621, "learning_rate": 4.722148766574742e-07, "loss": 5.9076, "step": 500 }, { "epoch": 0.010388727286464432, "grad_norm": 17.238126754760742, "learning_rate": 5.194363643232217e-07, "loss": 5.8083, "step": 550 }, { "epoch": 0.011333157039779381, "grad_norm": 18.432180404663086, "learning_rate": 5.666578519889691e-07, "loss": 5.7095, "step": 600 }, { "epoch": 0.01227758679309433, "grad_norm": 19.452835083007812, "learning_rate": 6.138793396547165e-07, "loss": 5.615, "step": 650 }, { "epoch": 0.013222016546409279, "grad_norm": 20.362192153930664, "learning_rate": 6.61100827320464e-07, "loss": 5.5239, "step": 700 }, { "epoch": 0.014166446299724227, "grad_norm": 20.807966232299805, "learning_rate": 7.083223149862114e-07, "loss": 5.4369, "step": 750 }, { "epoch": 0.015110876053039174, "grad_norm": 21.352497100830078, "learning_rate": 7.555438026519588e-07, "loss": 5.3531, "step": 800 }, { "epoch": 0.016055305806354125, "grad_norm": 21.627809524536133, "learning_rate": 8.027652903177062e-07, "loss": 5.2731, "step": 850 }, { "epoch": 0.016999735559669073, "grad_norm": 21.9608154296875, "learning_rate": 8.499867779834538e-07, "loss": 5.1951, "step": 900 }, { "epoch": 0.01794416531298402, "grad_norm": 22.01567840576172, "learning_rate": 8.97208265649201e-07, "loss": 5.1191, "step": 950 }, { "epoch": 0.018888595066298967, "grad_norm": 22.29902458190918, "learning_rate": 9.444297533149484e-07, "loss": 5.0444, "step": 1000 }, { "epoch": 0.019833024819613916, "grad_norm": 22.450542449951172, "learning_rate": 9.91651240980696e-07, "loss": 4.9694, "step": 1050 }, { "epoch": 0.020777454572928865, "grad_norm": 22.53548240661621, "learning_rate": 1.0388727286464433e-06, "loss": 4.8944, "step": 1100 }, { "epoch": 0.021721884326243814, "grad_norm": 22.63127899169922, "learning_rate": 1.0860942163121908e-06, "loss": 4.818, "step": 1150 }, { "epoch": 0.022666314079558762, "grad_norm": 22.73966407775879, "learning_rate": 1.1333157039779382e-06, "loss": 4.7395, "step": 1200 }, { "epoch": 0.02361074383287371, "grad_norm": 22.6774959564209, "learning_rate": 1.1805371916436856e-06, "loss": 4.659, "step": 1250 }, { "epoch": 0.02455517358618866, "grad_norm": 22.687959671020508, "learning_rate": 1.227758679309433e-06, "loss": 4.5745, "step": 1300 }, { "epoch": 0.02549960333950361, "grad_norm": 22.775596618652344, "learning_rate": 1.2749801669751805e-06, "loss": 4.4865, "step": 1350 }, { "epoch": 0.026444033092818557, "grad_norm": 22.703218460083008, "learning_rate": 1.322201654640928e-06, "loss": 4.3957, "step": 1400 }, { "epoch": 0.027388462846133506, "grad_norm": 22.817502975463867, "learning_rate": 1.3694231423066753e-06, "loss": 4.3003, "step": 1450 }, { "epoch": 0.028332892599448455, "grad_norm": 22.821916580200195, "learning_rate": 1.4166446299724227e-06, "loss": 4.1998, "step": 1500 }, { "epoch": 0.0292773223527634, "grad_norm": 22.714452743530273, "learning_rate": 1.46386611763817e-06, "loss": 4.0961, "step": 1550 }, { "epoch": 0.03022175210607835, "grad_norm": 22.816932678222656, "learning_rate": 1.5110876053039176e-06, "loss": 3.987, "step": 1600 }, { "epoch": 0.031166181859393297, "grad_norm": 22.72612953186035, "learning_rate": 1.558309092969665e-06, "loss": 3.8747, "step": 1650 }, { "epoch": 0.03211061161270825, "grad_norm": 22.67470932006836, "learning_rate": 1.6055305806354124e-06, "loss": 3.7601, "step": 1700 }, { "epoch": 0.0330550413660232, "grad_norm": 22.76194190979004, "learning_rate": 1.65275206830116e-06, "loss": 3.6435, "step": 1750 }, { "epoch": 0.03399947111933815, "grad_norm": 22.748592376708984, "learning_rate": 1.6999735559669075e-06, "loss": 3.5259, "step": 1800 }, { "epoch": 0.03494390087265309, "grad_norm": 22.67568588256836, "learning_rate": 1.7471950436326545e-06, "loss": 3.4075, "step": 1850 }, { "epoch": 0.03588833062596804, "grad_norm": 22.607223510742188, "learning_rate": 1.794416531298402e-06, "loss": 3.2877, "step": 1900 }, { "epoch": 0.036832760379282986, "grad_norm": 22.4986515045166, "learning_rate": 1.8416380189641494e-06, "loss": 3.1647, "step": 1950 }, { "epoch": 0.037777190132597935, "grad_norm": 22.303756713867188, "learning_rate": 1.8888595066298968e-06, "loss": 3.0417, "step": 2000 }, { "epoch": 0.038721619885912884, "grad_norm": 22.189130783081055, "learning_rate": 1.9360809942956444e-06, "loss": 2.9154, "step": 2050 }, { "epoch": 0.03966604963922783, "grad_norm": 21.89154052734375, "learning_rate": 1.983302481961392e-06, "loss": 2.7882, "step": 2100 }, { "epoch": 0.04061047939254278, "grad_norm": 21.769222259521484, "learning_rate": 2.0305239696271393e-06, "loss": 2.6586, "step": 2150 }, { "epoch": 0.04155490914585773, "grad_norm": 21.427040100097656, "learning_rate": 2.0777454572928867e-06, "loss": 2.5271, "step": 2200 }, { "epoch": 0.04249933889917268, "grad_norm": 21.123355865478516, "learning_rate": 2.124966944958634e-06, "loss": 2.3943, "step": 2250 }, { "epoch": 0.04344376865248763, "grad_norm": 20.638526916503906, "learning_rate": 2.1721884326243815e-06, "loss": 2.2612, "step": 2300 }, { "epoch": 0.044388198405802576, "grad_norm": 20.222171783447266, "learning_rate": 2.219409920290129e-06, "loss": 2.1283, "step": 2350 }, { "epoch": 0.045332628159117525, "grad_norm": 19.679176330566406, "learning_rate": 2.2666314079558764e-06, "loss": 1.9959, "step": 2400 }, { "epoch": 0.04627705791243247, "grad_norm": 19.067304611206055, "learning_rate": 2.313852895621624e-06, "loss": 1.8645, "step": 2450 }, { "epoch": 0.04722148766574742, "grad_norm": 18.46661376953125, "learning_rate": 2.3610743832873712e-06, "loss": 1.7351, "step": 2500 }, { "epoch": 0.04722148766574742, "eval_IntDiv": 0.5088811844215041, "eval_NumCircles": 12, "eval_SumBottleneck": 0.0, "eval_Uniqueness": 0.41333333333333333, "eval_Validity": 0.0075, "eval_Validity * Uniqueness": 0.0031, "eval_loss": 1.615347981452942, "eval_runtime": 169.1456, "eval_samples_per_second": 59.121, "eval_steps_per_second": 0.467, "step": 2500 }, { "epoch": 0.04816591741906237, "grad_norm": 17.706602096557617, "learning_rate": 2.4082958709531187e-06, "loss": 1.6105, "step": 2550 }, { "epoch": 0.04911034717237732, "grad_norm": 16.764541625976562, "learning_rate": 2.455517358618866e-06, "loss": 1.4878, "step": 2600 }, { "epoch": 0.05005477692569227, "grad_norm": 15.7522554397583, "learning_rate": 2.5027388462846135e-06, "loss": 1.3691, "step": 2650 }, { "epoch": 0.05099920667900722, "grad_norm": 14.707948684692383, "learning_rate": 2.549960333950361e-06, "loss": 1.2547, "step": 2700 }, { "epoch": 0.051943636432322166, "grad_norm": 13.541821479797363, "learning_rate": 2.5971818216161084e-06, "loss": 1.1475, "step": 2750 }, { "epoch": 0.052888066185637114, "grad_norm": 12.442481994628906, "learning_rate": 2.644403309281856e-06, "loss": 1.0452, "step": 2800 }, { "epoch": 0.05383249593895206, "grad_norm": 11.176552772521973, "learning_rate": 2.6916247969476032e-06, "loss": 0.9502, "step": 2850 }, { "epoch": 0.05477692569226701, "grad_norm": 9.865756034851074, "learning_rate": 2.7388462846133506e-06, "loss": 0.8649, "step": 2900 }, { "epoch": 0.05572135544558196, "grad_norm": 8.70965576171875, "learning_rate": 2.786067772279098e-06, "loss": 0.7851, "step": 2950 }, { "epoch": 0.05666578519889691, "grad_norm": 7.527464389801025, "learning_rate": 2.8332892599448455e-06, "loss": 0.716, "step": 3000 }, { "epoch": 0.05761021495221186, "grad_norm": 6.452827453613281, "learning_rate": 2.880510747610593e-06, "loss": 0.6517, "step": 3050 }, { "epoch": 0.0585546447055268, "grad_norm": 5.4376115798950195, "learning_rate": 2.92773223527634e-06, "loss": 0.5964, "step": 3100 }, { "epoch": 0.05949907445884175, "grad_norm": 4.537758827209473, "learning_rate": 2.9749537229420874e-06, "loss": 0.5486, "step": 3150 }, { "epoch": 0.0604435042121567, "grad_norm": 3.7361209392547607, "learning_rate": 3.022175210607835e-06, "loss": 0.5082, "step": 3200 }, { "epoch": 0.061387933965471646, "grad_norm": 3.0581328868865967, "learning_rate": 3.0693966982735826e-06, "loss": 0.4737, "step": 3250 }, { "epoch": 0.062332363718786594, "grad_norm": 2.4870424270629883, "learning_rate": 3.11661818593933e-06, "loss": 0.4435, "step": 3300 }, { "epoch": 0.06327679347210155, "grad_norm": 1.99289870262146, "learning_rate": 3.1638396736050775e-06, "loss": 0.4179, "step": 3350 }, { "epoch": 0.0642212232254165, "grad_norm": 1.5753567218780518, "learning_rate": 3.211061161270825e-06, "loss": 0.3944, "step": 3400 }, { "epoch": 0.06516565297873145, "grad_norm": 1.2454828023910522, "learning_rate": 3.2582826489365723e-06, "loss": 0.3751, "step": 3450 }, { "epoch": 0.0661100827320464, "grad_norm": 0.9801281690597534, "learning_rate": 3.30550413660232e-06, "loss": 0.3571, "step": 3500 }, { "epoch": 0.06705451248536135, "grad_norm": 0.7866788506507874, "learning_rate": 3.3527256242680676e-06, "loss": 0.3423, "step": 3550 }, { "epoch": 0.0679989422386763, "grad_norm": 0.6498755812644958, "learning_rate": 3.399947111933815e-06, "loss": 0.3293, "step": 3600 }, { "epoch": 0.06894337199199124, "grad_norm": 0.5582278966903687, "learning_rate": 3.4471685995995624e-06, "loss": 0.3196, "step": 3650 }, { "epoch": 0.06988780174530618, "grad_norm": 0.4853467047214508, "learning_rate": 3.494390087265309e-06, "loss": 0.3103, "step": 3700 }, { "epoch": 0.07083223149862113, "grad_norm": 0.4393543004989624, "learning_rate": 3.5416115749310565e-06, "loss": 0.3042, "step": 3750 }, { "epoch": 0.07177666125193607, "grad_norm": 0.38884973526000977, "learning_rate": 3.588833062596804e-06, "loss": 0.2992, "step": 3800 }, { "epoch": 0.07272109100525102, "grad_norm": 0.34861019253730774, "learning_rate": 3.6360545502625513e-06, "loss": 0.294, "step": 3850 }, { "epoch": 0.07366552075856597, "grad_norm": 0.31519466638565063, "learning_rate": 3.6832760379282987e-06, "loss": 0.2884, "step": 3900 }, { "epoch": 0.07460995051188092, "grad_norm": 0.2926502227783203, "learning_rate": 3.730497525594046e-06, "loss": 0.2863, "step": 3950 }, { "epoch": 0.07555438026519587, "grad_norm": 0.2618136405944824, "learning_rate": 3.7777190132597936e-06, "loss": 0.2817, "step": 4000 }, { "epoch": 0.07649881001851082, "grad_norm": 0.24470534920692444, "learning_rate": 3.8249405009255414e-06, "loss": 0.2779, "step": 4050 }, { "epoch": 0.07744323977182577, "grad_norm": 0.22638235986232758, "learning_rate": 3.872161988591289e-06, "loss": 0.2744, "step": 4100 }, { "epoch": 0.07838766952514072, "grad_norm": 0.21364189684391022, "learning_rate": 3.919383476257036e-06, "loss": 0.2728, "step": 4150 }, { "epoch": 0.07933209927845566, "grad_norm": 0.1984063982963562, "learning_rate": 3.966604963922784e-06, "loss": 0.2694, "step": 4200 }, { "epoch": 0.08027652903177061, "grad_norm": 0.18730804324150085, "learning_rate": 4.013826451588531e-06, "loss": 0.2669, "step": 4250 }, { "epoch": 0.08122095878508556, "grad_norm": 0.17376117408275604, "learning_rate": 4.0610479392542785e-06, "loss": 0.2647, "step": 4300 }, { "epoch": 0.08216538853840051, "grad_norm": 0.16496503353118896, "learning_rate": 4.108269426920026e-06, "loss": 0.2631, "step": 4350 }, { "epoch": 0.08310981829171546, "grad_norm": 0.1612619012594223, "learning_rate": 4.155490914585773e-06, "loss": 0.2614, "step": 4400 }, { "epoch": 0.08405424804503041, "grad_norm": 0.1521696299314499, "learning_rate": 4.202712402251521e-06, "loss": 0.2595, "step": 4450 }, { "epoch": 0.08499867779834536, "grad_norm": 0.13942956924438477, "learning_rate": 4.249933889917268e-06, "loss": 0.2568, "step": 4500 }, { "epoch": 0.0859431075516603, "grad_norm": 0.13571928441524506, "learning_rate": 4.297155377583016e-06, "loss": 0.2552, "step": 4550 }, { "epoch": 0.08688753730497525, "grad_norm": 0.13110731542110443, "learning_rate": 4.344376865248763e-06, "loss": 0.2537, "step": 4600 }, { "epoch": 0.0878319670582902, "grad_norm": 0.13350360095500946, "learning_rate": 4.3915983529145105e-06, "loss": 0.2526, "step": 4650 }, { "epoch": 0.08877639681160515, "grad_norm": 0.1257132589817047, "learning_rate": 4.438819840580258e-06, "loss": 0.252, "step": 4700 }, { "epoch": 0.0897208265649201, "grad_norm": 0.11655037105083466, "learning_rate": 4.486041328246005e-06, "loss": 0.2491, "step": 4750 }, { "epoch": 0.09066525631823505, "grad_norm": 0.1067115068435669, "learning_rate": 4.533262815911753e-06, "loss": 0.2492, "step": 4800 }, { "epoch": 0.09160968607155, "grad_norm": 0.10981940478086472, "learning_rate": 4.5804843035775e-06, "loss": 0.2469, "step": 4850 }, { "epoch": 0.09255411582486495, "grad_norm": 0.10173261910676956, "learning_rate": 4.627705791243248e-06, "loss": 0.2462, "step": 4900 }, { "epoch": 0.0934985455781799, "grad_norm": 0.09772108495235443, "learning_rate": 4.674927278908995e-06, "loss": 0.2452, "step": 4950 }, { "epoch": 0.09444297533149484, "grad_norm": 0.09387890994548798, "learning_rate": 4.7221487665747425e-06, "loss": 0.2435, "step": 5000 }, { "epoch": 0.09444297533149484, "eval_IntDiv": 0.658091988050375, "eval_NumCircles": 228, "eval_SumBottleneck": 0.0, "eval_Uniqueness": 0.9740663900414938, "eval_Validity": 0.0964, "eval_Validity * Uniqueness": 0.0939, "eval_loss": 0.24655571579933167, "eval_runtime": 257.2627, "eval_samples_per_second": 38.871, "eval_steps_per_second": 0.307, "step": 5000 }, { "epoch": 0.09538740508480979, "grad_norm": 0.09783821552991867, "learning_rate": 4.76937025424049e-06, "loss": 0.2429, "step": 5050 }, { "epoch": 0.09633183483812474, "grad_norm": 0.10056648403406143, "learning_rate": 4.816591741906237e-06, "loss": 0.2418, "step": 5100 }, { "epoch": 0.09727626459143969, "grad_norm": 0.09489645808935165, "learning_rate": 4.863813229571985e-06, "loss": 0.2403, "step": 5150 }, { "epoch": 0.09822069434475464, "grad_norm": 0.10906486213207245, "learning_rate": 4.911034717237732e-06, "loss": 0.2395, "step": 5200 }, { "epoch": 0.09916512409806959, "grad_norm": 0.08509868383407593, "learning_rate": 4.95825620490348e-06, "loss": 0.2375, "step": 5250 }, { "epoch": 0.10010955385138454, "grad_norm": 0.07894144207239151, "learning_rate": 5.005477692569227e-06, "loss": 0.2375, "step": 5300 }, { "epoch": 0.10105398360469948, "grad_norm": 0.08291951566934586, "learning_rate": 5.0526991802349745e-06, "loss": 0.2359, "step": 5350 }, { "epoch": 0.10199841335801443, "grad_norm": 0.0862336978316307, "learning_rate": 5.099920667900722e-06, "loss": 0.2354, "step": 5400 }, { "epoch": 0.10294284311132938, "grad_norm": 0.07523290812969208, "learning_rate": 5.147142155566469e-06, "loss": 0.2354, "step": 5450 }, { "epoch": 0.10388727286464433, "grad_norm": 0.08622250705957413, "learning_rate": 5.194363643232217e-06, "loss": 0.2339, "step": 5500 }, { "epoch": 0.10483170261795928, "grad_norm": 0.08163613826036453, "learning_rate": 5.241585130897964e-06, "loss": 0.2331, "step": 5550 }, { "epoch": 0.10577613237127423, "grad_norm": 0.08916472643613815, "learning_rate": 5.288806618563712e-06, "loss": 0.2327, "step": 5600 }, { "epoch": 0.10672056212458918, "grad_norm": 0.0924314633011818, "learning_rate": 5.336028106229459e-06, "loss": 0.2316, "step": 5650 }, { "epoch": 0.10766499187790413, "grad_norm": 0.06782221049070358, "learning_rate": 5.3832495938952064e-06, "loss": 0.2312, "step": 5700 }, { "epoch": 0.10860942163121907, "grad_norm": 0.07695573568344116, "learning_rate": 5.430471081560954e-06, "loss": 0.23, "step": 5750 }, { "epoch": 0.10955385138453402, "grad_norm": 0.07421786338090897, "learning_rate": 5.477692569226701e-06, "loss": 0.2289, "step": 5800 }, { "epoch": 0.11049828113784897, "grad_norm": 0.08338936418294907, "learning_rate": 5.524914056892449e-06, "loss": 0.2287, "step": 5850 }, { "epoch": 0.11144271089116392, "grad_norm": 0.07026118785142899, "learning_rate": 5.572135544558196e-06, "loss": 0.2277, "step": 5900 }, { "epoch": 0.11238714064447887, "grad_norm": 0.08924909681081772, "learning_rate": 5.6193570322239436e-06, "loss": 0.2277, "step": 5950 }, { "epoch": 0.11333157039779382, "grad_norm": 0.08202508091926575, "learning_rate": 5.666578519889691e-06, "loss": 0.2254, "step": 6000 }, { "epoch": 0.11427600015110877, "grad_norm": 0.06947985291481018, "learning_rate": 5.7138000075554384e-06, "loss": 0.2256, "step": 6050 }, { "epoch": 0.11522042990442372, "grad_norm": 0.07062337547540665, "learning_rate": 5.761021495221186e-06, "loss": 0.2248, "step": 6100 }, { "epoch": 0.11616485965773865, "grad_norm": 0.06354617327451706, "learning_rate": 5.8082429828869324e-06, "loss": 0.2234, "step": 6150 }, { "epoch": 0.1171092894110536, "grad_norm": 0.08576296269893646, "learning_rate": 5.85546447055268e-06, "loss": 0.2243, "step": 6200 }, { "epoch": 0.11805371916436855, "grad_norm": 0.06948589533567429, "learning_rate": 5.902685958218427e-06, "loss": 0.2233, "step": 6250 }, { "epoch": 0.1189981489176835, "grad_norm": 0.06646331399679184, "learning_rate": 5.949907445884175e-06, "loss": 0.2223, "step": 6300 }, { "epoch": 0.11994257867099845, "grad_norm": 0.07253573089838028, "learning_rate": 5.997128933549923e-06, "loss": 0.2212, "step": 6350 }, { "epoch": 0.1208870084243134, "grad_norm": 0.06802347302436829, "learning_rate": 6.04435042121567e-06, "loss": 0.2215, "step": 6400 }, { "epoch": 0.12183143817762834, "grad_norm": 0.07604142278432846, "learning_rate": 6.091571908881418e-06, "loss": 0.2203, "step": 6450 }, { "epoch": 0.12277586793094329, "grad_norm": 0.06039990857243538, "learning_rate": 6.138793396547165e-06, "loss": 0.2194, "step": 6500 }, { "epoch": 0.12372029768425824, "grad_norm": 0.06276606023311615, "learning_rate": 6.186014884212913e-06, "loss": 0.2187, "step": 6550 }, { "epoch": 0.12466472743757319, "grad_norm": 0.07089051604270935, "learning_rate": 6.23323637187866e-06, "loss": 0.218, "step": 6600 }, { "epoch": 0.12560915719088814, "grad_norm": 0.07489097863435745, "learning_rate": 6.2804578595444075e-06, "loss": 0.2176, "step": 6650 }, { "epoch": 0.1265535869442031, "grad_norm": 0.09530392289161682, "learning_rate": 6.327679347210155e-06, "loss": 0.2177, "step": 6700 }, { "epoch": 0.12749801669751804, "grad_norm": 0.08673632889986038, "learning_rate": 6.374900834875902e-06, "loss": 0.218, "step": 6750 }, { "epoch": 0.128442446450833, "grad_norm": 0.05699313431978226, "learning_rate": 6.42212232254165e-06, "loss": 0.2166, "step": 6800 }, { "epoch": 0.12938687620414793, "grad_norm": 0.06185412034392357, "learning_rate": 6.469343810207397e-06, "loss": 0.2159, "step": 6850 }, { "epoch": 0.1303313059574629, "grad_norm": 0.08904264867305756, "learning_rate": 6.516565297873145e-06, "loss": 0.2149, "step": 6900 }, { "epoch": 0.13127573571077783, "grad_norm": 0.07556107640266418, "learning_rate": 6.563786785538892e-06, "loss": 0.214, "step": 6950 }, { "epoch": 0.1322201654640928, "grad_norm": 0.05487874522805214, "learning_rate": 6.61100827320464e-06, "loss": 0.2149, "step": 7000 }, { "epoch": 0.13316459521740773, "grad_norm": 0.06657563894987106, "learning_rate": 6.658229760870387e-06, "loss": 0.2131, "step": 7050 }, { "epoch": 0.1341090249707227, "grad_norm": 0.08139476925134659, "learning_rate": 6.705451248536135e-06, "loss": 0.2133, "step": 7100 }, { "epoch": 0.13505345472403762, "grad_norm": 0.08273161947727203, "learning_rate": 6.752672736201882e-06, "loss": 0.2122, "step": 7150 }, { "epoch": 0.1359978844773526, "grad_norm": 0.06287536770105362, "learning_rate": 6.79989422386763e-06, "loss": 0.2123, "step": 7200 }, { "epoch": 0.13694231423066752, "grad_norm": 0.07065015286207199, "learning_rate": 6.847115711533377e-06, "loss": 0.2111, "step": 7250 }, { "epoch": 0.13788674398398248, "grad_norm": 0.06288257986307144, "learning_rate": 6.894337199199125e-06, "loss": 0.2112, "step": 7300 }, { "epoch": 0.13883117373729742, "grad_norm": 0.05428687855601311, "learning_rate": 6.9415586868648715e-06, "loss": 0.2107, "step": 7350 }, { "epoch": 0.13977560349061235, "grad_norm": 0.06647636741399765, "learning_rate": 6.988780174530618e-06, "loss": 0.2095, "step": 7400 }, { "epoch": 0.14072003324392732, "grad_norm": 0.08538660407066345, "learning_rate": 7.036001662196366e-06, "loss": 0.2096, "step": 7450 }, { "epoch": 0.14166446299724225, "grad_norm": 0.054214347153902054, "learning_rate": 7.083223149862113e-06, "loss": 0.2094, "step": 7500 }, { "epoch": 0.14166446299724225, "eval_IntDiv": 0.6649108233729664, "eval_NumCircles": 1021, "eval_SumBottleneck": 0.06573619216803897, "eval_Uniqueness": 0.9888438133874239, "eval_Validity": 0.3944, "eval_Validity * Uniqueness": 0.38999999999999996, "eval_loss": 0.23216083645820618, "eval_runtime": 205.3939, "eval_samples_per_second": 48.687, "eval_steps_per_second": 0.385, "step": 7500 }, { "epoch": 0.14260889275055721, "grad_norm": 0.07123802602291107, "learning_rate": 7.130444637527861e-06, "loss": 0.208, "step": 7550 }, { "epoch": 0.14355332250387215, "grad_norm": 0.08690359443426132, "learning_rate": 7.177666125193608e-06, "loss": 0.208, "step": 7600 }, { "epoch": 0.1444977522571871, "grad_norm": 0.059672556817531586, "learning_rate": 7.224887612859356e-06, "loss": 0.2076, "step": 7650 }, { "epoch": 0.14544218201050205, "grad_norm": 0.08448991179466248, "learning_rate": 7.272109100525103e-06, "loss": 0.2073, "step": 7700 }, { "epoch": 0.146386611763817, "grad_norm": 0.08471570163965225, "learning_rate": 7.319330588190851e-06, "loss": 0.2068, "step": 7750 }, { "epoch": 0.14733104151713194, "grad_norm": 0.06284050643444061, "learning_rate": 7.3665520758565975e-06, "loss": 0.206, "step": 7800 }, { "epoch": 0.1482754712704469, "grad_norm": 0.07133319973945618, "learning_rate": 7.413773563522346e-06, "loss": 0.2062, "step": 7850 }, { "epoch": 0.14921990102376184, "grad_norm": 0.05895814672112465, "learning_rate": 7.460995051188092e-06, "loss": 0.2059, "step": 7900 }, { "epoch": 0.1501643307770768, "grad_norm": 0.06890573352575302, "learning_rate": 7.5082165388538406e-06, "loss": 0.2052, "step": 7950 }, { "epoch": 0.15110876053039174, "grad_norm": 0.06390209496021271, "learning_rate": 7.555438026519587e-06, "loss": 0.2048, "step": 8000 }, { "epoch": 0.1520531902837067, "grad_norm": 0.056838810443878174, "learning_rate": 7.6026595141853354e-06, "loss": 0.205, "step": 8050 }, { "epoch": 0.15299762003702164, "grad_norm": 0.06041209027171135, "learning_rate": 7.649881001851083e-06, "loss": 0.2048, "step": 8100 }, { "epoch": 0.1539420497903366, "grad_norm": 0.061773158609867096, "learning_rate": 7.69710248951683e-06, "loss": 0.2037, "step": 8150 }, { "epoch": 0.15488647954365153, "grad_norm": 0.11010323464870453, "learning_rate": 7.744323977182578e-06, "loss": 0.2036, "step": 8200 }, { "epoch": 0.1558309092969665, "grad_norm": 0.06360630691051483, "learning_rate": 7.791545464848325e-06, "loss": 0.203, "step": 8250 }, { "epoch": 0.15677533905028143, "grad_norm": 0.06862206757068634, "learning_rate": 7.838766952514073e-06, "loss": 0.2025, "step": 8300 }, { "epoch": 0.1577197688035964, "grad_norm": 0.06639589369297028, "learning_rate": 7.88598844017982e-06, "loss": 0.2025, "step": 8350 }, { "epoch": 0.15866419855691133, "grad_norm": 0.06470789015293121, "learning_rate": 7.933209927845567e-06, "loss": 0.2021, "step": 8400 }, { "epoch": 0.1596086283102263, "grad_norm": 0.08671747893095016, "learning_rate": 7.980431415511315e-06, "loss": 0.2017, "step": 8450 }, { "epoch": 0.16055305806354123, "grad_norm": 0.06237388402223587, "learning_rate": 8.027652903177062e-06, "loss": 0.2013, "step": 8500 }, { "epoch": 0.1614974878168562, "grad_norm": 0.06949514895677567, "learning_rate": 8.07487439084281e-06, "loss": 0.2011, "step": 8550 }, { "epoch": 0.16244191757017112, "grad_norm": 0.056812018156051636, "learning_rate": 8.122095878508557e-06, "loss": 0.2006, "step": 8600 }, { "epoch": 0.1633863473234861, "grad_norm": 0.10049230605363846, "learning_rate": 8.169317366174305e-06, "loss": 0.2004, "step": 8650 }, { "epoch": 0.16433077707680102, "grad_norm": 0.06241702660918236, "learning_rate": 8.216538853840052e-06, "loss": 0.2005, "step": 8700 }, { "epoch": 0.16527520683011598, "grad_norm": 0.06494967639446259, "learning_rate": 8.2637603415058e-06, "loss": 0.1996, "step": 8750 }, { "epoch": 0.16621963658343092, "grad_norm": 0.052385032176971436, "learning_rate": 8.310981829171547e-06, "loss": 0.2001, "step": 8800 }, { "epoch": 0.16716406633674588, "grad_norm": 0.06349585950374603, "learning_rate": 8.358203316837294e-06, "loss": 0.1996, "step": 8850 }, { "epoch": 0.16810849609006082, "grad_norm": 0.05965185537934303, "learning_rate": 8.405424804503042e-06, "loss": 0.1991, "step": 8900 }, { "epoch": 0.16905292584337578, "grad_norm": 0.07849177718162537, "learning_rate": 8.452646292168789e-06, "loss": 0.1987, "step": 8950 }, { "epoch": 0.1699973555966907, "grad_norm": 0.06136157736182213, "learning_rate": 8.499867779834536e-06, "loss": 0.1988, "step": 9000 }, { "epoch": 0.17094178535000568, "grad_norm": 0.0692000463604927, "learning_rate": 8.547089267500284e-06, "loss": 0.1975, "step": 9050 }, { "epoch": 0.1718862151033206, "grad_norm": 0.07976619154214859, "learning_rate": 8.594310755166031e-06, "loss": 0.1967, "step": 9100 }, { "epoch": 0.17283064485663557, "grad_norm": 0.06603018939495087, "learning_rate": 8.641532242831779e-06, "loss": 0.1971, "step": 9150 }, { "epoch": 0.1737750746099505, "grad_norm": 0.07323586940765381, "learning_rate": 8.688753730497526e-06, "loss": 0.1975, "step": 9200 }, { "epoch": 0.17471950436326547, "grad_norm": 0.06465490162372589, "learning_rate": 8.735975218163274e-06, "loss": 0.1964, "step": 9250 }, { "epoch": 0.1756639341165804, "grad_norm": 0.07078143209218979, "learning_rate": 8.783196705829021e-06, "loss": 0.1963, "step": 9300 }, { "epoch": 0.17660836386989537, "grad_norm": 0.0694068893790245, "learning_rate": 8.830418193494768e-06, "loss": 0.1968, "step": 9350 }, { "epoch": 0.1775527936232103, "grad_norm": 0.06257413327693939, "learning_rate": 8.877639681160516e-06, "loss": 0.1959, "step": 9400 }, { "epoch": 0.17849722337652527, "grad_norm": 0.07000501453876495, "learning_rate": 8.924861168826263e-06, "loss": 0.1962, "step": 9450 }, { "epoch": 0.1794416531298402, "grad_norm": 0.06759538501501083, "learning_rate": 8.97208265649201e-06, "loss": 0.1952, "step": 9500 }, { "epoch": 0.18038608288315516, "grad_norm": 0.060186028480529785, "learning_rate": 9.019304144157758e-06, "loss": 0.1953, "step": 9550 }, { "epoch": 0.1813305126364701, "grad_norm": 0.06311298906803131, "learning_rate": 9.066525631823506e-06, "loss": 0.1952, "step": 9600 }, { "epoch": 0.18227494238978506, "grad_norm": 0.07063036412000656, "learning_rate": 9.113747119489253e-06, "loss": 0.1947, "step": 9650 }, { "epoch": 0.1832193721431, "grad_norm": 0.0659281387925148, "learning_rate": 9.160968607155e-06, "loss": 0.1947, "step": 9700 }, { "epoch": 0.18416380189641496, "grad_norm": 0.06546540558338165, "learning_rate": 9.208190094820748e-06, "loss": 0.1934, "step": 9750 }, { "epoch": 0.1851082316497299, "grad_norm": 0.07381387799978256, "learning_rate": 9.255411582486495e-06, "loss": 0.1946, "step": 9800 }, { "epoch": 0.18605266140304483, "grad_norm": 0.06649228930473328, "learning_rate": 9.302633070152241e-06, "loss": 0.1942, "step": 9850 }, { "epoch": 0.1869970911563598, "grad_norm": 0.05805610120296478, "learning_rate": 9.34985455781799e-06, "loss": 0.193, "step": 9900 }, { "epoch": 0.18794152090967473, "grad_norm": 0.07164664566516876, "learning_rate": 9.397076045483736e-06, "loss": 0.1929, "step": 9950 }, { "epoch": 0.1888859506629897, "grad_norm": 0.08711664378643036, "learning_rate": 9.444297533149485e-06, "loss": 0.1922, "step": 10000 }, { "epoch": 0.1888859506629897, "eval_IntDiv": 0.6716559012644133, "eval_NumCircles": 1463, "eval_SumBottleneck": 18.858898870396448, "eval_Uniqueness": 0.9836397368864901, "eval_Validity": 0.5929, "eval_Validity * Uniqueness": 0.5831999999999999, "eval_loss": 0.23170879483222961, "eval_runtime": 200.6166, "eval_samples_per_second": 49.846, "eval_steps_per_second": 0.394, "step": 10000 }, { "epoch": 0.18983038041630462, "grad_norm": 0.06512924283742905, "learning_rate": 9.491519020815232e-06, "loss": 0.1929, "step": 10050 }, { "epoch": 0.19077481016961959, "grad_norm": 0.052336838096380234, "learning_rate": 9.53874050848098e-06, "loss": 0.1919, "step": 10100 }, { "epoch": 0.19171923992293452, "grad_norm": 0.06273242831230164, "learning_rate": 9.585961996146727e-06, "loss": 0.1927, "step": 10150 }, { "epoch": 0.19266366967624948, "grad_norm": 0.05981794744729996, "learning_rate": 9.633183483812475e-06, "loss": 0.192, "step": 10200 }, { "epoch": 0.19360809942956442, "grad_norm": 0.05599646270275116, "learning_rate": 9.680404971478222e-06, "loss": 0.1913, "step": 10250 }, { "epoch": 0.19455252918287938, "grad_norm": 0.08935434371232986, "learning_rate": 9.72762645914397e-06, "loss": 0.1912, "step": 10300 }, { "epoch": 0.19549695893619431, "grad_norm": 0.06084713339805603, "learning_rate": 9.774847946809717e-06, "loss": 0.1911, "step": 10350 }, { "epoch": 0.19644138868950928, "grad_norm": 0.06149431690573692, "learning_rate": 9.822069434475464e-06, "loss": 0.191, "step": 10400 }, { "epoch": 0.1973858184428242, "grad_norm": 0.07272642105817795, "learning_rate": 9.869290922141212e-06, "loss": 0.1905, "step": 10450 }, { "epoch": 0.19833024819613917, "grad_norm": 0.07201600074768066, "learning_rate": 9.91651240980696e-06, "loss": 0.191, "step": 10500 }, { "epoch": 0.1992746779494541, "grad_norm": 0.11556652188301086, "learning_rate": 9.963733897472707e-06, "loss": 0.1907, "step": 10550 }, { "epoch": 0.20021910770276907, "grad_norm": 0.05119675397872925, "learning_rate": 1.0010955385138454e-05, "loss": 0.1902, "step": 10600 }, { "epoch": 0.201163537456084, "grad_norm": 0.09953638911247253, "learning_rate": 1.0058176872804202e-05, "loss": 0.1906, "step": 10650 }, { "epoch": 0.20210796720939897, "grad_norm": 0.06960253417491913, "learning_rate": 1.0105398360469949e-05, "loss": 0.1899, "step": 10700 }, { "epoch": 0.2030523969627139, "grad_norm": 0.0760783925652504, "learning_rate": 1.0152619848135696e-05, "loss": 0.19, "step": 10750 }, { "epoch": 0.20399682671602887, "grad_norm": 0.06543612480163574, "learning_rate": 1.0199841335801444e-05, "loss": 0.1891, "step": 10800 }, { "epoch": 0.2049412564693438, "grad_norm": 0.09574942290782928, "learning_rate": 1.0247062823467191e-05, "loss": 0.1888, "step": 10850 }, { "epoch": 0.20588568622265876, "grad_norm": 0.05036062374711037, "learning_rate": 1.0294284311132939e-05, "loss": 0.1888, "step": 10900 }, { "epoch": 0.2068301159759737, "grad_norm": 0.06448153406381607, "learning_rate": 1.0341505798798686e-05, "loss": 0.1891, "step": 10950 }, { "epoch": 0.20777454572928866, "grad_norm": 0.04905528947710991, "learning_rate": 1.0388727286464433e-05, "loss": 0.1886, "step": 11000 }, { "epoch": 0.2087189754826036, "grad_norm": 0.06905793398618698, "learning_rate": 1.0435948774130181e-05, "loss": 0.1883, "step": 11050 }, { "epoch": 0.20966340523591856, "grad_norm": 0.06637682020664215, "learning_rate": 1.0483170261795928e-05, "loss": 0.1878, "step": 11100 }, { "epoch": 0.2106078349892335, "grad_norm": 0.07833191752433777, "learning_rate": 1.0530391749461676e-05, "loss": 0.1881, "step": 11150 }, { "epoch": 0.21155226474254846, "grad_norm": 0.06527496874332428, "learning_rate": 1.0577613237127423e-05, "loss": 0.1883, "step": 11200 }, { "epoch": 0.2124966944958634, "grad_norm": 0.0647418349981308, "learning_rate": 1.062483472479317e-05, "loss": 0.1884, "step": 11250 }, { "epoch": 0.21344112424917835, "grad_norm": 0.06609103083610535, "learning_rate": 1.0672056212458918e-05, "loss": 0.187, "step": 11300 }, { "epoch": 0.2143855540024933, "grad_norm": 0.07147999107837677, "learning_rate": 1.0719277700124665e-05, "loss": 0.1876, "step": 11350 }, { "epoch": 0.21532998375580825, "grad_norm": 0.06188651919364929, "learning_rate": 1.0766499187790413e-05, "loss": 0.1871, "step": 11400 }, { "epoch": 0.2162744135091232, "grad_norm": 0.06207416206598282, "learning_rate": 1.081372067545616e-05, "loss": 0.1867, "step": 11450 }, { "epoch": 0.21721884326243815, "grad_norm": 0.058900002390146255, "learning_rate": 1.0860942163121908e-05, "loss": 0.187, "step": 11500 }, { "epoch": 0.21816327301575308, "grad_norm": 0.05081435665488243, "learning_rate": 1.0908163650787655e-05, "loss": 0.1871, "step": 11550 }, { "epoch": 0.21910770276906805, "grad_norm": 0.12407368421554565, "learning_rate": 1.0955385138453403e-05, "loss": 0.1866, "step": 11600 }, { "epoch": 0.22005213252238298, "grad_norm": 0.06678406894207001, "learning_rate": 1.100260662611915e-05, "loss": 0.1858, "step": 11650 }, { "epoch": 0.22099656227569794, "grad_norm": 0.09623323380947113, "learning_rate": 1.1049828113784897e-05, "loss": 0.1858, "step": 11700 }, { "epoch": 0.22194099202901288, "grad_norm": 0.06452932208776474, "learning_rate": 1.1097049601450645e-05, "loss": 0.185, "step": 11750 }, { "epoch": 0.22288542178232784, "grad_norm": 0.06891700625419617, "learning_rate": 1.1144271089116392e-05, "loss": 0.1853, "step": 11800 }, { "epoch": 0.22382985153564278, "grad_norm": 0.062022414058446884, "learning_rate": 1.119149257678214e-05, "loss": 0.1854, "step": 11850 }, { "epoch": 0.22477428128895774, "grad_norm": 0.06087144836783409, "learning_rate": 1.1238714064447887e-05, "loss": 0.1855, "step": 11900 }, { "epoch": 0.22571871104227267, "grad_norm": 0.05184387415647507, "learning_rate": 1.1285935552113635e-05, "loss": 0.1852, "step": 11950 }, { "epoch": 0.22666314079558764, "grad_norm": 0.057062018662691116, "learning_rate": 1.1333157039779382e-05, "loss": 0.1849, "step": 12000 }, { "epoch": 0.22760757054890257, "grad_norm": 0.047895029187202454, "learning_rate": 1.138037852744513e-05, "loss": 0.1838, "step": 12050 }, { "epoch": 0.22855200030221753, "grad_norm": 0.07605674117803574, "learning_rate": 1.1427600015110877e-05, "loss": 0.1844, "step": 12100 }, { "epoch": 0.22949643005553247, "grad_norm": 0.06877435743808746, "learning_rate": 1.1474821502776624e-05, "loss": 0.1841, "step": 12150 }, { "epoch": 0.23044085980884743, "grad_norm": 0.06217192858457565, "learning_rate": 1.1522042990442372e-05, "loss": 0.1848, "step": 12200 }, { "epoch": 0.23138528956216237, "grad_norm": 0.0755753219127655, "learning_rate": 1.1569264478108119e-05, "loss": 0.1838, "step": 12250 }, { "epoch": 0.2323297193154773, "grad_norm": 0.06125275418162346, "learning_rate": 1.1616485965773865e-05, "loss": 0.1839, "step": 12300 }, { "epoch": 0.23327414906879226, "grad_norm": 0.06085652858018875, "learning_rate": 1.1663707453439614e-05, "loss": 0.1836, "step": 12350 }, { "epoch": 0.2342185788221072, "grad_norm": 0.059611476957798004, "learning_rate": 1.171092894110536e-05, "loss": 0.184, "step": 12400 }, { "epoch": 0.23516300857542216, "grad_norm": 0.057628531008958817, "learning_rate": 1.1758150428771109e-05, "loss": 0.1836, "step": 12450 }, { "epoch": 0.2361074383287371, "grad_norm": 0.051481351256370544, "learning_rate": 1.1805371916436855e-05, "loss": 0.1826, "step": 12500 }, { "epoch": 0.2361074383287371, "eval_IntDiv": 0.6723225978479517, "eval_NumCircles": 1709, "eval_SumBottleneck": 33.4834356271834, "eval_Uniqueness": 0.9889148191365228, "eval_Validity": 0.6856, "eval_Validity * Uniqueness": 0.678, "eval_loss": 0.230007141828537, "eval_runtime": 226.2231, "eval_samples_per_second": 44.204, "eval_steps_per_second": 0.349, "step": 12500 }, { "epoch": 0.23705186808205206, "grad_norm": 0.05776699259877205, "learning_rate": 1.1852593404102604e-05, "loss": 0.1831, "step": 12550 }, { "epoch": 0.237996297835367, "grad_norm": 0.05494995415210724, "learning_rate": 1.189981489176835e-05, "loss": 0.1828, "step": 12600 }, { "epoch": 0.23894072758868196, "grad_norm": 0.069297656416893, "learning_rate": 1.1947036379434099e-05, "loss": 0.1826, "step": 12650 }, { "epoch": 0.2398851573419969, "grad_norm": 0.06274934858083725, "learning_rate": 1.1994257867099846e-05, "loss": 0.1828, "step": 12700 }, { "epoch": 0.24082958709531185, "grad_norm": 0.06455455720424652, "learning_rate": 1.2041479354765593e-05, "loss": 0.1822, "step": 12750 }, { "epoch": 0.2417740168486268, "grad_norm": 0.05143721401691437, "learning_rate": 1.208870084243134e-05, "loss": 0.1817, "step": 12800 }, { "epoch": 0.24271844660194175, "grad_norm": 0.06492584198713303, "learning_rate": 1.2135922330097088e-05, "loss": 0.1821, "step": 12850 }, { "epoch": 0.24366287635525669, "grad_norm": 0.05809108912944794, "learning_rate": 1.2183143817762836e-05, "loss": 0.182, "step": 12900 }, { "epoch": 0.24460730610857165, "grad_norm": 0.05554930120706558, "learning_rate": 1.2230365305428583e-05, "loss": 0.1817, "step": 12950 }, { "epoch": 0.24555173586188658, "grad_norm": 0.07007747888565063, "learning_rate": 1.227758679309433e-05, "loss": 0.1817, "step": 13000 }, { "epoch": 0.24649616561520155, "grad_norm": 0.046531952917575836, "learning_rate": 1.2324808280760078e-05, "loss": 0.1816, "step": 13050 }, { "epoch": 0.24744059536851648, "grad_norm": 0.05619041249155998, "learning_rate": 1.2372029768425825e-05, "loss": 0.1815, "step": 13100 }, { "epoch": 0.24838502512183144, "grad_norm": 0.056863684207201004, "learning_rate": 1.2419251256091573e-05, "loss": 0.1806, "step": 13150 }, { "epoch": 0.24932945487514638, "grad_norm": 0.055139560252428055, "learning_rate": 1.246647274375732e-05, "loss": 0.1812, "step": 13200 }, { "epoch": 0.25027388462846134, "grad_norm": 0.062468819320201874, "learning_rate": 1.2513694231423068e-05, "loss": 0.1809, "step": 13250 }, { "epoch": 0.2512183143817763, "grad_norm": 0.05228376016020775, "learning_rate": 1.2560915719088815e-05, "loss": 0.1816, "step": 13300 }, { "epoch": 0.2521627441350912, "grad_norm": 0.0677313357591629, "learning_rate": 1.260813720675456e-05, "loss": 0.1809, "step": 13350 }, { "epoch": 0.2531071738884062, "grad_norm": 0.06423202157020569, "learning_rate": 1.265535869442031e-05, "loss": 0.1805, "step": 13400 }, { "epoch": 0.25405160364172114, "grad_norm": 0.04973309114575386, "learning_rate": 1.2702580182086057e-05, "loss": 0.1807, "step": 13450 }, { "epoch": 0.25499603339503607, "grad_norm": 0.05538882687687874, "learning_rate": 1.2749801669751805e-05, "loss": 0.18, "step": 13500 }, { "epoch": 0.255940463148351, "grad_norm": 0.050686050206422806, "learning_rate": 1.279702315741755e-05, "loss": 0.1802, "step": 13550 }, { "epoch": 0.256884892901666, "grad_norm": 0.05636146292090416, "learning_rate": 1.28442446450833e-05, "loss": 0.1809, "step": 13600 }, { "epoch": 0.25782932265498093, "grad_norm": 0.09451480954885483, "learning_rate": 1.2891466132749047e-05, "loss": 0.1807, "step": 13650 }, { "epoch": 0.25877375240829587, "grad_norm": 0.0692017525434494, "learning_rate": 1.2938687620414794e-05, "loss": 0.1799, "step": 13700 }, { "epoch": 0.2597181821616108, "grad_norm": 0.05535691976547241, "learning_rate": 1.298590910808054e-05, "loss": 0.1797, "step": 13750 }, { "epoch": 0.2606626119149258, "grad_norm": 0.07851831614971161, "learning_rate": 1.303313059574629e-05, "loss": 0.1802, "step": 13800 }, { "epoch": 0.2616070416682407, "grad_norm": 0.05567861720919609, "learning_rate": 1.3080352083412037e-05, "loss": 0.1793, "step": 13850 }, { "epoch": 0.26255147142155566, "grad_norm": 0.05351938679814339, "learning_rate": 1.3127573571077784e-05, "loss": 0.1793, "step": 13900 }, { "epoch": 0.2634959011748706, "grad_norm": 0.0653354674577713, "learning_rate": 1.317479505874353e-05, "loss": 0.1789, "step": 13950 }, { "epoch": 0.2644403309281856, "grad_norm": 0.05891212075948715, "learning_rate": 1.322201654640928e-05, "loss": 0.1794, "step": 14000 }, { "epoch": 0.2653847606815005, "grad_norm": 0.06268806755542755, "learning_rate": 1.3269238034075026e-05, "loss": 0.1789, "step": 14050 }, { "epoch": 0.26632919043481545, "grad_norm": 0.05581704527139664, "learning_rate": 1.3316459521740774e-05, "loss": 0.1783, "step": 14100 }, { "epoch": 0.2672736201881304, "grad_norm": 0.05218515917658806, "learning_rate": 1.336368100940652e-05, "loss": 0.1787, "step": 14150 }, { "epoch": 0.2682180499414454, "grad_norm": 0.06501922011375427, "learning_rate": 1.341090249707227e-05, "loss": 0.1787, "step": 14200 }, { "epoch": 0.2691624796947603, "grad_norm": 0.06624319404363632, "learning_rate": 1.3458123984738016e-05, "loss": 0.1784, "step": 14250 }, { "epoch": 0.27010690944807525, "grad_norm": 0.057063791900873184, "learning_rate": 1.3505345472403764e-05, "loss": 0.1782, "step": 14300 }, { "epoch": 0.2710513392013902, "grad_norm": 0.0523834303021431, "learning_rate": 1.355256696006951e-05, "loss": 0.177, "step": 14350 }, { "epoch": 0.2719957689547052, "grad_norm": 0.06262258440256119, "learning_rate": 1.359978844773526e-05, "loss": 0.1776, "step": 14400 }, { "epoch": 0.2729401987080201, "grad_norm": 0.11803051829338074, "learning_rate": 1.3647009935401006e-05, "loss": 0.1788, "step": 14450 }, { "epoch": 0.27388462846133504, "grad_norm": 0.04776685684919357, "learning_rate": 1.3694231423066753e-05, "loss": 0.1771, "step": 14500 }, { "epoch": 0.27482905821465, "grad_norm": 0.055566057562828064, "learning_rate": 1.3741452910732499e-05, "loss": 0.1774, "step": 14550 }, { "epoch": 0.27577348796796497, "grad_norm": 0.052779823541641235, "learning_rate": 1.378867439839825e-05, "loss": 0.1768, "step": 14600 }, { "epoch": 0.2767179177212799, "grad_norm": 0.047762028872966766, "learning_rate": 1.3835895886063996e-05, "loss": 0.1774, "step": 14650 }, { "epoch": 0.27766234747459484, "grad_norm": 0.05478201434016228, "learning_rate": 1.3883117373729743e-05, "loss": 0.1767, "step": 14700 }, { "epoch": 0.2786067772279098, "grad_norm": 0.04895180091261864, "learning_rate": 1.3930338861395489e-05, "loss": 0.1774, "step": 14750 }, { "epoch": 0.2795512069812247, "grad_norm": 0.060355860739946365, "learning_rate": 1.3977560349061236e-05, "loss": 0.1767, "step": 14800 }, { "epoch": 0.2804956367345397, "grad_norm": 0.04826197400689125, "learning_rate": 1.4024781836726985e-05, "loss": 0.1765, "step": 14850 }, { "epoch": 0.28144006648785463, "grad_norm": 0.05118125304579735, "learning_rate": 1.4072003324392733e-05, "loss": 0.1769, "step": 14900 }, { "epoch": 0.28238449624116957, "grad_norm": 0.04951278492808342, "learning_rate": 1.4119224812058478e-05, "loss": 0.1766, "step": 14950 }, { "epoch": 0.2833289259944845, "grad_norm": 0.045592255890369415, "learning_rate": 1.4166446299724226e-05, "loss": 0.176, "step": 15000 }, { "epoch": 0.2833289259944845, "eval_IntDiv": 0.6754740353883415, "eval_NumCircles": 1896, "eval_SumBottleneck": 24.88157254104964, "eval_Uniqueness": 0.9935856318152662, "eval_Validity": 0.7795, "eval_Validity * Uniqueness": 0.7745, "eval_loss": 0.22851407527923584, "eval_runtime": 190.4593, "eval_samples_per_second": 52.505, "eval_steps_per_second": 0.415, "step": 15000 }, { "epoch": 0.2842733557477995, "grad_norm": 0.05508740246295929, "learning_rate": 1.4213667787389975e-05, "loss": 0.1759, "step": 15050 }, { "epoch": 0.28521778550111443, "grad_norm": 0.05503286048769951, "learning_rate": 1.4260889275055722e-05, "loss": 0.1763, "step": 15100 }, { "epoch": 0.28616221525442936, "grad_norm": 0.06549620628356934, "learning_rate": 1.4308110762721468e-05, "loss": 0.1757, "step": 15150 }, { "epoch": 0.2871066450077443, "grad_norm": 0.05942118540406227, "learning_rate": 1.4355332250387216e-05, "loss": 0.1758, "step": 15200 }, { "epoch": 0.2880510747610593, "grad_norm": 0.05008010193705559, "learning_rate": 1.4402553738052965e-05, "loss": 0.1759, "step": 15250 }, { "epoch": 0.2889955045143742, "grad_norm": 0.060427166521549225, "learning_rate": 1.4449775225718712e-05, "loss": 0.1755, "step": 15300 }, { "epoch": 0.28993993426768916, "grad_norm": 0.055758509784936905, "learning_rate": 1.449699671338446e-05, "loss": 0.1755, "step": 15350 }, { "epoch": 0.2908843640210041, "grad_norm": 0.05282703414559364, "learning_rate": 1.4544218201050205e-05, "loss": 0.1756, "step": 15400 }, { "epoch": 0.2918287937743191, "grad_norm": 0.05114014074206352, "learning_rate": 1.4591439688715954e-05, "loss": 0.1763, "step": 15450 }, { "epoch": 0.292773223527634, "grad_norm": 0.0755448266863823, "learning_rate": 1.4638661176381702e-05, "loss": 0.1756, "step": 15500 }, { "epoch": 0.29371765328094895, "grad_norm": 0.060348138213157654, "learning_rate": 1.468588266404745e-05, "loss": 0.1755, "step": 15550 }, { "epoch": 0.2946620830342639, "grad_norm": 0.0602448433637619, "learning_rate": 1.4733104151713195e-05, "loss": 0.1747, "step": 15600 }, { "epoch": 0.2956065127875789, "grad_norm": 0.05090785771608353, "learning_rate": 1.4780325639378944e-05, "loss": 0.1744, "step": 15650 }, { "epoch": 0.2965509425408938, "grad_norm": 0.056346822530031204, "learning_rate": 1.4827547127044691e-05, "loss": 0.1746, "step": 15700 }, { "epoch": 0.29749537229420875, "grad_norm": 0.05905643850564957, "learning_rate": 1.4874768614710439e-05, "loss": 0.1737, "step": 15750 }, { "epoch": 0.2984398020475237, "grad_norm": 0.04916936904191971, "learning_rate": 1.4921990102376185e-05, "loss": 0.1745, "step": 15800 }, { "epoch": 0.2993842318008387, "grad_norm": 0.061164479702711105, "learning_rate": 1.4969211590041934e-05, "loss": 0.1744, "step": 15850 }, { "epoch": 0.3003286615541536, "grad_norm": 0.05178654566407204, "learning_rate": 1.5016433077707681e-05, "loss": 0.1744, "step": 15900 }, { "epoch": 0.30127309130746854, "grad_norm": 0.0585685633122921, "learning_rate": 1.5063654565373429e-05, "loss": 0.1748, "step": 15950 }, { "epoch": 0.3022175210607835, "grad_norm": 0.05501897260546684, "learning_rate": 1.5110876053039174e-05, "loss": 0.1743, "step": 16000 }, { "epoch": 0.30316195081409847, "grad_norm": 0.052088260650634766, "learning_rate": 1.5158097540704923e-05, "loss": 0.1745, "step": 16050 }, { "epoch": 0.3041063805674134, "grad_norm": 0.04821436107158661, "learning_rate": 1.5205319028370671e-05, "loss": 0.1742, "step": 16100 }, { "epoch": 0.30505081032072834, "grad_norm": 0.05680272355675697, "learning_rate": 1.5252540516036418e-05, "loss": 0.1739, "step": 16150 }, { "epoch": 0.3059952400740433, "grad_norm": 0.05313114821910858, "learning_rate": 1.5299762003702166e-05, "loss": 0.1738, "step": 16200 }, { "epoch": 0.30693966982735826, "grad_norm": 0.06261331588029861, "learning_rate": 1.5346983491367913e-05, "loss": 0.1732, "step": 16250 }, { "epoch": 0.3078840995806732, "grad_norm": 0.0462849922478199, "learning_rate": 1.539420497903366e-05, "loss": 0.1729, "step": 16300 }, { "epoch": 0.30882852933398813, "grad_norm": 0.05679631978273392, "learning_rate": 1.5441426466699408e-05, "loss": 0.1731, "step": 16350 }, { "epoch": 0.30977295908730307, "grad_norm": 0.06842539459466934, "learning_rate": 1.5488647954365155e-05, "loss": 0.1734, "step": 16400 }, { "epoch": 0.31071738884061806, "grad_norm": 0.05262358486652374, "learning_rate": 1.5535869442030903e-05, "loss": 0.1728, "step": 16450 }, { "epoch": 0.311661818593933, "grad_norm": 0.05603114143013954, "learning_rate": 1.558309092969665e-05, "loss": 0.1726, "step": 16500 }, { "epoch": 0.31260624834724793, "grad_norm": 0.0576874203979969, "learning_rate": 1.5630312417362398e-05, "loss": 0.1737, "step": 16550 }, { "epoch": 0.31355067810056286, "grad_norm": 0.05990442633628845, "learning_rate": 1.5677533905028145e-05, "loss": 0.1731, "step": 16600 }, { "epoch": 0.31449510785387785, "grad_norm": 0.05039701610803604, "learning_rate": 1.5724755392693893e-05, "loss": 0.1726, "step": 16650 }, { "epoch": 0.3154395376071928, "grad_norm": 0.05477456375956535, "learning_rate": 1.577197688035964e-05, "loss": 0.1721, "step": 16700 }, { "epoch": 0.3163839673605077, "grad_norm": 0.05294732004404068, "learning_rate": 1.5819198368025387e-05, "loss": 0.1713, "step": 16750 }, { "epoch": 0.31732839711382266, "grad_norm": 0.05493660271167755, "learning_rate": 1.5866419855691135e-05, "loss": 0.1727, "step": 16800 }, { "epoch": 0.31827282686713765, "grad_norm": 0.0493696965277195, "learning_rate": 1.5913641343356882e-05, "loss": 0.1722, "step": 16850 }, { "epoch": 0.3192172566204526, "grad_norm": 0.061418116092681885, "learning_rate": 1.596086283102263e-05, "loss": 0.1718, "step": 16900 }, { "epoch": 0.3201616863737675, "grad_norm": 0.057717353105545044, "learning_rate": 1.6008084318688377e-05, "loss": 0.1714, "step": 16950 }, { "epoch": 0.32110611612708245, "grad_norm": 0.05513238534331322, "learning_rate": 1.6055305806354124e-05, "loss": 0.1718, "step": 17000 }, { "epoch": 0.32205054588039744, "grad_norm": 0.051071859896183014, "learning_rate": 1.6102527294019872e-05, "loss": 0.172, "step": 17050 }, { "epoch": 0.3229949756337124, "grad_norm": 0.0526854507625103, "learning_rate": 1.614974878168562e-05, "loss": 0.1713, "step": 17100 }, { "epoch": 0.3239394053870273, "grad_norm": 0.07438076287508011, "learning_rate": 1.6196970269351367e-05, "loss": 0.1715, "step": 17150 }, { "epoch": 0.32488383514034225, "grad_norm": 0.0649711862206459, "learning_rate": 1.6244191757017114e-05, "loss": 0.1715, "step": 17200 }, { "epoch": 0.3258282648936572, "grad_norm": 0.06108267977833748, "learning_rate": 1.6291413244682858e-05, "loss": 0.1718, "step": 17250 }, { "epoch": 0.3267726946469722, "grad_norm": 0.055628255009651184, "learning_rate": 1.633863473234861e-05, "loss": 0.1709, "step": 17300 }, { "epoch": 0.3277171244002871, "grad_norm": 0.051399242132902145, "learning_rate": 1.6385856220014356e-05, "loss": 0.1715, "step": 17350 }, { "epoch": 0.32866155415360204, "grad_norm": 0.05644528195261955, "learning_rate": 1.6433077707680104e-05, "loss": 0.1708, "step": 17400 }, { "epoch": 0.329605983906917, "grad_norm": 0.05368797481060028, "learning_rate": 1.648029919534585e-05, "loss": 0.1711, "step": 17450 }, { "epoch": 0.33055041366023197, "grad_norm": 0.05304599180817604, "learning_rate": 1.65275206830116e-05, "loss": 0.1709, "step": 17500 }, { "epoch": 0.33055041366023197, "eval_IntDiv": 0.6746703656240511, "eval_NumCircles": 2022, "eval_SumBottleneck": 27.596141872578055, "eval_Uniqueness": 0.9917216556688663, "eval_Validity": 0.8335, "eval_Validity * Uniqueness": 0.8266000000000001, "eval_loss": 0.22388486564159393, "eval_runtime": 191.8779, "eval_samples_per_second": 52.116, "eval_steps_per_second": 0.412, "step": 17500 }, { "epoch": 0.3314948434135469, "grad_norm": 0.07943501323461533, "learning_rate": 1.6574742170677346e-05, "loss": 0.1705, "step": 17550 }, { "epoch": 0.33243927316686184, "grad_norm": 0.05228978022933006, "learning_rate": 1.6621963658343094e-05, "loss": 0.1703, "step": 17600 }, { "epoch": 0.33338370292017677, "grad_norm": 0.050549883395433426, "learning_rate": 1.666918514600884e-05, "loss": 0.1701, "step": 17650 }, { "epoch": 0.33432813267349176, "grad_norm": 0.05755181238055229, "learning_rate": 1.671640663367459e-05, "loss": 0.1704, "step": 17700 }, { "epoch": 0.3352725624268067, "grad_norm": 0.05055411532521248, "learning_rate": 1.6763628121340336e-05, "loss": 0.1701, "step": 17750 }, { "epoch": 0.33621699218012163, "grad_norm": 0.05053755268454552, "learning_rate": 1.6810849609006083e-05, "loss": 0.17, "step": 17800 }, { "epoch": 0.33716142193343657, "grad_norm": 0.04863362014293671, "learning_rate": 1.685807109667183e-05, "loss": 0.1696, "step": 17850 }, { "epoch": 0.33810585168675156, "grad_norm": 0.04624275863170624, "learning_rate": 1.6905292584337578e-05, "loss": 0.17, "step": 17900 }, { "epoch": 0.3390502814400665, "grad_norm": 0.05891531705856323, "learning_rate": 1.6952514072003326e-05, "loss": 0.1702, "step": 17950 }, { "epoch": 0.3399947111933814, "grad_norm": 0.06249431148171425, "learning_rate": 1.6999735559669073e-05, "loss": 0.1699, "step": 18000 }, { "epoch": 0.34093914094669636, "grad_norm": 0.05025313422083855, "learning_rate": 1.704695704733482e-05, "loss": 0.1698, "step": 18050 }, { "epoch": 0.34188357070001135, "grad_norm": 0.051701273769140244, "learning_rate": 1.7094178535000568e-05, "loss": 0.1691, "step": 18100 }, { "epoch": 0.3428280004533263, "grad_norm": 0.05871399864554405, "learning_rate": 1.7141400022666315e-05, "loss": 0.1688, "step": 18150 }, { "epoch": 0.3437724302066412, "grad_norm": 0.06386410444974899, "learning_rate": 1.7188621510332063e-05, "loss": 0.1692, "step": 18200 }, { "epoch": 0.34471685995995616, "grad_norm": 0.06289192289113998, "learning_rate": 1.723584299799781e-05, "loss": 0.1689, "step": 18250 }, { "epoch": 0.34566128971327115, "grad_norm": 0.059846922755241394, "learning_rate": 1.7283064485663558e-05, "loss": 0.1688, "step": 18300 }, { "epoch": 0.3466057194665861, "grad_norm": 0.04965565726161003, "learning_rate": 1.7330285973329305e-05, "loss": 0.1683, "step": 18350 }, { "epoch": 0.347550149219901, "grad_norm": 0.05802846699953079, "learning_rate": 1.7377507460995052e-05, "loss": 0.1685, "step": 18400 }, { "epoch": 0.34849457897321595, "grad_norm": 0.05590154230594635, "learning_rate": 1.74247289486608e-05, "loss": 0.1683, "step": 18450 }, { "epoch": 0.34943900872653094, "grad_norm": 0.05660117790102959, "learning_rate": 1.7471950436326547e-05, "loss": 0.1678, "step": 18500 }, { "epoch": 0.3503834384798459, "grad_norm": 0.0665990486741066, "learning_rate": 1.7519171923992295e-05, "loss": 0.1685, "step": 18550 }, { "epoch": 0.3513278682331608, "grad_norm": 0.055347442626953125, "learning_rate": 1.7566393411658042e-05, "loss": 0.1683, "step": 18600 }, { "epoch": 0.35227229798647575, "grad_norm": 0.057999320328235626, "learning_rate": 1.761361489932379e-05, "loss": 0.1678, "step": 18650 }, { "epoch": 0.35321672773979074, "grad_norm": 0.05214443430304527, "learning_rate": 1.7660836386989537e-05, "loss": 0.1683, "step": 18700 }, { "epoch": 0.35416115749310567, "grad_norm": 0.04853496700525284, "learning_rate": 1.7708057874655284e-05, "loss": 0.1677, "step": 18750 }, { "epoch": 0.3551055872464206, "grad_norm": 0.04998196288943291, "learning_rate": 1.7755279362321032e-05, "loss": 0.1679, "step": 18800 }, { "epoch": 0.35605001699973554, "grad_norm": 0.04556301608681679, "learning_rate": 1.780250084998678e-05, "loss": 0.1679, "step": 18850 }, { "epoch": 0.35699444675305053, "grad_norm": 0.050546929240226746, "learning_rate": 1.7849722337652527e-05, "loss": 0.1677, "step": 18900 }, { "epoch": 0.35793887650636547, "grad_norm": 0.06045430526137352, "learning_rate": 1.7896943825318274e-05, "loss": 0.1674, "step": 18950 }, { "epoch": 0.3588833062596804, "grad_norm": 0.049684733152389526, "learning_rate": 1.794416531298402e-05, "loss": 0.167, "step": 19000 }, { "epoch": 0.35982773601299534, "grad_norm": 0.04686257243156433, "learning_rate": 1.799138680064977e-05, "loss": 0.1667, "step": 19050 }, { "epoch": 0.3607721657663103, "grad_norm": 0.06523380428552628, "learning_rate": 1.8038608288315516e-05, "loss": 0.1673, "step": 19100 }, { "epoch": 0.36171659551962526, "grad_norm": 0.05615226924419403, "learning_rate": 1.8085829775981264e-05, "loss": 0.1668, "step": 19150 }, { "epoch": 0.3626610252729402, "grad_norm": 0.04951716214418411, "learning_rate": 1.813305126364701e-05, "loss": 0.1667, "step": 19200 }, { "epoch": 0.36360545502625513, "grad_norm": 0.049394894391298294, "learning_rate": 1.818027275131276e-05, "loss": 0.1672, "step": 19250 }, { "epoch": 0.3645498847795701, "grad_norm": 0.06478346139192581, "learning_rate": 1.8227494238978506e-05, "loss": 0.1676, "step": 19300 }, { "epoch": 0.36549431453288506, "grad_norm": 0.05037521943449974, "learning_rate": 1.8274715726644253e-05, "loss": 0.1666, "step": 19350 }, { "epoch": 0.3664387442862, "grad_norm": 0.05799749493598938, "learning_rate": 1.832193721431e-05, "loss": 0.1671, "step": 19400 }, { "epoch": 0.3673831740395149, "grad_norm": 0.048989277333021164, "learning_rate": 1.836915870197575e-05, "loss": 0.1669, "step": 19450 }, { "epoch": 0.3683276037928299, "grad_norm": 0.05258223041892052, "learning_rate": 1.8416380189641496e-05, "loss": 0.1667, "step": 19500 }, { "epoch": 0.36927203354614485, "grad_norm": 0.07389132678508759, "learning_rate": 1.8463601677307243e-05, "loss": 0.1666, "step": 19550 }, { "epoch": 0.3702164632994598, "grad_norm": 0.05384159833192825, "learning_rate": 1.851082316497299e-05, "loss": 0.1661, "step": 19600 }, { "epoch": 0.3711608930527747, "grad_norm": 0.059844113886356354, "learning_rate": 1.8558044652638738e-05, "loss": 0.1661, "step": 19650 }, { "epoch": 0.37210532280608966, "grad_norm": 0.04890231043100357, "learning_rate": 1.8605266140304482e-05, "loss": 0.1665, "step": 19700 }, { "epoch": 0.37304975255940465, "grad_norm": 0.04909643530845642, "learning_rate": 1.8652487627970233e-05, "loss": 0.1665, "step": 19750 }, { "epoch": 0.3739941823127196, "grad_norm": 0.04791337996721268, "learning_rate": 1.869970911563598e-05, "loss": 0.1665, "step": 19800 }, { "epoch": 0.3749386120660345, "grad_norm": 0.05450041592121124, "learning_rate": 1.8746930603301728e-05, "loss": 0.166, "step": 19850 }, { "epoch": 0.37588304181934945, "grad_norm": 0.044679611921310425, "learning_rate": 1.8794152090967472e-05, "loss": 0.1653, "step": 19900 }, { "epoch": 0.37682747157266444, "grad_norm": 0.04662957042455673, "learning_rate": 1.8841373578633223e-05, "loss": 0.1663, "step": 19950 }, { "epoch": 0.3777719013259794, "grad_norm": 0.0513615645468235, "learning_rate": 1.888859506629897e-05, "loss": 0.1653, "step": 20000 }, { "epoch": 0.3777719013259794, "eval_IntDiv": 0.673756060968147, "eval_NumCircles": 2090, "eval_SumBottleneck": 79.7968680933827, "eval_Uniqueness": 0.9938685793614067, "eval_Validity": 0.8644, "eval_Validity * Uniqueness": 0.8590999999999999, "eval_loss": 0.2250804454088211, "eval_runtime": 167.7788, "eval_samples_per_second": 59.602, "eval_steps_per_second": 0.471, "step": 20000 }, { "epoch": 0.3787163310792943, "grad_norm": 0.04979109764099121, "learning_rate": 1.8935816553964717e-05, "loss": 0.1656, "step": 20050 }, { "epoch": 0.37966076083260925, "grad_norm": 0.05147046968340874, "learning_rate": 1.8983038041630465e-05, "loss": 0.1657, "step": 20100 }, { "epoch": 0.38060519058592424, "grad_norm": 0.060992199927568436, "learning_rate": 1.9030259529296212e-05, "loss": 0.1649, "step": 20150 }, { "epoch": 0.38154962033923917, "grad_norm": 0.0829363763332367, "learning_rate": 1.907748101696196e-05, "loss": 0.1651, "step": 20200 }, { "epoch": 0.3824940500925541, "grad_norm": 0.055334676057100296, "learning_rate": 1.9124702504627707e-05, "loss": 0.1654, "step": 20250 }, { "epoch": 0.38343847984586904, "grad_norm": 0.04878419637680054, "learning_rate": 1.9171923992293455e-05, "loss": 0.1643, "step": 20300 }, { "epoch": 0.38438290959918403, "grad_norm": 0.048638418316841125, "learning_rate": 1.9219145479959202e-05, "loss": 0.165, "step": 20350 }, { "epoch": 0.38532733935249897, "grad_norm": 0.059463996440172195, "learning_rate": 1.926636696762495e-05, "loss": 0.1652, "step": 20400 }, { "epoch": 0.3862717691058139, "grad_norm": 0.052719417959451675, "learning_rate": 1.9313588455290697e-05, "loss": 0.1645, "step": 20450 }, { "epoch": 0.38721619885912884, "grad_norm": 0.06053197756409645, "learning_rate": 1.9360809942956444e-05, "loss": 0.1652, "step": 20500 }, { "epoch": 0.3881606286124438, "grad_norm": 0.05033697932958603, "learning_rate": 1.940803143062219e-05, "loss": 0.1648, "step": 20550 }, { "epoch": 0.38910505836575876, "grad_norm": 0.04812562093138695, "learning_rate": 1.945525291828794e-05, "loss": 0.1649, "step": 20600 }, { "epoch": 0.3900494881190737, "grad_norm": 0.062223102897405624, "learning_rate": 1.9502474405953687e-05, "loss": 0.1639, "step": 20650 }, { "epoch": 0.39099391787238863, "grad_norm": 0.05222366377711296, "learning_rate": 1.9549695893619434e-05, "loss": 0.1642, "step": 20700 }, { "epoch": 0.3919383476257036, "grad_norm": 0.04900024086236954, "learning_rate": 1.959691738128518e-05, "loss": 0.1644, "step": 20750 }, { "epoch": 0.39288277737901856, "grad_norm": 0.046815238893032074, "learning_rate": 1.964413886895093e-05, "loss": 0.1646, "step": 20800 }, { "epoch": 0.3938272071323335, "grad_norm": 0.06252169609069824, "learning_rate": 1.9691360356616676e-05, "loss": 0.1649, "step": 20850 }, { "epoch": 0.3947716368856484, "grad_norm": 0.04834866523742676, "learning_rate": 1.9738581844282424e-05, "loss": 0.164, "step": 20900 }, { "epoch": 0.3957160666389634, "grad_norm": 0.048358265310525894, "learning_rate": 1.978580333194817e-05, "loss": 0.1637, "step": 20950 }, { "epoch": 0.39666049639227835, "grad_norm": 0.05006176978349686, "learning_rate": 1.983302481961392e-05, "loss": 0.1632, "step": 21000 }, { "epoch": 0.3976049261455933, "grad_norm": 0.047954704612493515, "learning_rate": 1.9880246307279666e-05, "loss": 0.1639, "step": 21050 }, { "epoch": 0.3985493558989082, "grad_norm": 0.05419699847698212, "learning_rate": 1.9927467794945413e-05, "loss": 0.1638, "step": 21100 }, { "epoch": 0.3994937856522232, "grad_norm": 0.04519990086555481, "learning_rate": 1.997468928261116e-05, "loss": 0.1643, "step": 21150 }, { "epoch": 0.40043821540553814, "grad_norm": 0.046618908643722534, "learning_rate": 2.0021910770276908e-05, "loss": 0.1637, "step": 21200 }, { "epoch": 0.4013826451588531, "grad_norm": 0.047772835940122604, "learning_rate": 2.0069132257942656e-05, "loss": 0.1636, "step": 21250 }, { "epoch": 0.402327074912168, "grad_norm": 0.052032891660928726, "learning_rate": 2.0116353745608403e-05, "loss": 0.1631, "step": 21300 }, { "epoch": 0.403271504665483, "grad_norm": 0.06592214107513428, "learning_rate": 2.016357523327415e-05, "loss": 0.1632, "step": 21350 }, { "epoch": 0.40421593441879794, "grad_norm": 0.052119940519332886, "learning_rate": 2.0210796720939898e-05, "loss": 0.1634, "step": 21400 }, { "epoch": 0.4051603641721129, "grad_norm": 0.04970613121986389, "learning_rate": 2.0258018208605645e-05, "loss": 0.1628, "step": 21450 }, { "epoch": 0.4061047939254278, "grad_norm": 0.04774336889386177, "learning_rate": 2.0305239696271393e-05, "loss": 0.1625, "step": 21500 }, { "epoch": 0.4070492236787428, "grad_norm": 0.0445546954870224, "learning_rate": 2.035246118393714e-05, "loss": 0.1631, "step": 21550 }, { "epoch": 0.40799365343205773, "grad_norm": 0.04618678241968155, "learning_rate": 2.0399682671602888e-05, "loss": 0.163, "step": 21600 }, { "epoch": 0.40893808318537267, "grad_norm": 0.050049684941768646, "learning_rate": 2.0446904159268635e-05, "loss": 0.1634, "step": 21650 }, { "epoch": 0.4098825129386876, "grad_norm": 0.04552027955651283, "learning_rate": 2.0494125646934382e-05, "loss": 0.1627, "step": 21700 }, { "epoch": 0.4108269426920026, "grad_norm": 0.050030846148729324, "learning_rate": 2.054134713460013e-05, "loss": 0.1628, "step": 21750 }, { "epoch": 0.41177137244531753, "grad_norm": 0.049408745020627975, "learning_rate": 2.0588568622265877e-05, "loss": 0.1621, "step": 21800 }, { "epoch": 0.41271580219863246, "grad_norm": 0.05092242732644081, "learning_rate": 2.0635790109931625e-05, "loss": 0.1631, "step": 21850 }, { "epoch": 0.4136602319519474, "grad_norm": 0.06667157262563705, "learning_rate": 2.0683011597597372e-05, "loss": 0.1624, "step": 21900 }, { "epoch": 0.4146046617052624, "grad_norm": 0.04680335521697998, "learning_rate": 2.073023308526312e-05, "loss": 0.1622, "step": 21950 }, { "epoch": 0.4155490914585773, "grad_norm": 0.056472811847925186, "learning_rate": 2.0777454572928867e-05, "loss": 0.1625, "step": 22000 }, { "epoch": 0.41649352121189226, "grad_norm": 0.05260661616921425, "learning_rate": 2.0824676060594614e-05, "loss": 0.1622, "step": 22050 }, { "epoch": 0.4174379509652072, "grad_norm": 0.051530856639146805, "learning_rate": 2.0871897548260362e-05, "loss": 0.1614, "step": 22100 }, { "epoch": 0.41838238071852213, "grad_norm": 0.043712228536605835, "learning_rate": 2.0919119035926106e-05, "loss": 0.1624, "step": 22150 }, { "epoch": 0.4193268104718371, "grad_norm": 0.0485212467610836, "learning_rate": 2.0966340523591857e-05, "loss": 0.1615, "step": 22200 }, { "epoch": 0.42027124022515205, "grad_norm": 0.04686351493000984, "learning_rate": 2.1013562011257604e-05, "loss": 0.1619, "step": 22250 }, { "epoch": 0.421215669978467, "grad_norm": 0.044877611100673676, "learning_rate": 2.106078349892335e-05, "loss": 0.1619, "step": 22300 }, { "epoch": 0.4221600997317819, "grad_norm": 0.05475960299372673, "learning_rate": 2.1108004986589096e-05, "loss": 0.162, "step": 22350 }, { "epoch": 0.4231045294850969, "grad_norm": 0.05157415196299553, "learning_rate": 2.1155226474254846e-05, "loss": 0.1613, "step": 22400 }, { "epoch": 0.42404895923841185, "grad_norm": 0.049894120544195175, "learning_rate": 2.1202447961920594e-05, "loss": 0.162, "step": 22450 }, { "epoch": 0.4249933889917268, "grad_norm": 0.04776232689619064, "learning_rate": 2.124966944958634e-05, "loss": 0.1615, "step": 22500 }, { "epoch": 0.4249933889917268, "eval_IntDiv": 0.6741982840942409, "eval_NumCircles": 2066, "eval_SumBottleneck": 40.66673864157336, "eval_Uniqueness": 0.9961385576377059, "eval_Validity": 0.8805, "eval_Validity * Uniqueness": 0.8771, "eval_loss": 0.22009611129760742, "eval_runtime": 178.3779, "eval_samples_per_second": 56.061, "eval_steps_per_second": 0.443, "step": 22500 }, { "epoch": 0.4259378187450417, "grad_norm": 0.053049568086862564, "learning_rate": 2.1296890937252085e-05, "loss": 0.1614, "step": 22550 }, { "epoch": 0.4268822484983567, "grad_norm": 0.056743137538433075, "learning_rate": 2.1344112424917836e-05, "loss": 0.1614, "step": 22600 }, { "epoch": 0.42782667825167164, "grad_norm": 0.04726259037852287, "learning_rate": 2.1391333912583584e-05, "loss": 0.1612, "step": 22650 }, { "epoch": 0.4287711080049866, "grad_norm": 0.05192072317004204, "learning_rate": 2.143855540024933e-05, "loss": 0.1609, "step": 22700 }, { "epoch": 0.4297155377583015, "grad_norm": 0.0483238659799099, "learning_rate": 2.148577688791508e-05, "loss": 0.1619, "step": 22750 }, { "epoch": 0.4306599675116165, "grad_norm": 0.04824618995189667, "learning_rate": 2.1532998375580826e-05, "loss": 0.1614, "step": 22800 }, { "epoch": 0.43160439726493144, "grad_norm": 0.055754538625478745, "learning_rate": 2.1580219863246573e-05, "loss": 0.1608, "step": 22850 }, { "epoch": 0.4325488270182464, "grad_norm": 0.049463506788015366, "learning_rate": 2.162744135091232e-05, "loss": 0.1606, "step": 22900 }, { "epoch": 0.4334932567715613, "grad_norm": 0.05329675227403641, "learning_rate": 2.1674662838578068e-05, "loss": 0.1609, "step": 22950 }, { "epoch": 0.4344376865248763, "grad_norm": 0.051349151879549026, "learning_rate": 2.1721884326243815e-05, "loss": 0.1613, "step": 23000 }, { "epoch": 0.43538211627819123, "grad_norm": 0.052568044513463974, "learning_rate": 2.1769105813909563e-05, "loss": 0.1605, "step": 23050 }, { "epoch": 0.43632654603150617, "grad_norm": 0.049984127283096313, "learning_rate": 2.181632730157531e-05, "loss": 0.1603, "step": 23100 }, { "epoch": 0.4372709757848211, "grad_norm": 0.05216143652796745, "learning_rate": 2.1863548789241058e-05, "loss": 0.1605, "step": 23150 }, { "epoch": 0.4382154055381361, "grad_norm": 0.04375084489583969, "learning_rate": 2.1910770276906805e-05, "loss": 0.1607, "step": 23200 }, { "epoch": 0.43915983529145103, "grad_norm": 0.04641221463680267, "learning_rate": 2.1957991764572553e-05, "loss": 0.1611, "step": 23250 }, { "epoch": 0.44010426504476596, "grad_norm": 0.05413924530148506, "learning_rate": 2.20052132522383e-05, "loss": 0.1601, "step": 23300 }, { "epoch": 0.4410486947980809, "grad_norm": 0.04659859836101532, "learning_rate": 2.2052434739904047e-05, "loss": 0.1597, "step": 23350 }, { "epoch": 0.4419931245513959, "grad_norm": 0.049303844571113586, "learning_rate": 2.2099656227569795e-05, "loss": 0.1608, "step": 23400 }, { "epoch": 0.4429375543047108, "grad_norm": 0.05150899663567543, "learning_rate": 2.2146877715235542e-05, "loss": 0.1604, "step": 23450 }, { "epoch": 0.44388198405802576, "grad_norm": 0.04486404359340668, "learning_rate": 2.219409920290129e-05, "loss": 0.1605, "step": 23500 }, { "epoch": 0.4448264138113407, "grad_norm": 0.046809643507003784, "learning_rate": 2.2241320690567037e-05, "loss": 0.1597, "step": 23550 }, { "epoch": 0.4457708435646557, "grad_norm": 0.05550043657422066, "learning_rate": 2.2288542178232785e-05, "loss": 0.1601, "step": 23600 }, { "epoch": 0.4467152733179706, "grad_norm": 0.048695486038923264, "learning_rate": 2.2335763665898532e-05, "loss": 0.1599, "step": 23650 }, { "epoch": 0.44765970307128555, "grad_norm": 0.0473329983651638, "learning_rate": 2.238298515356428e-05, "loss": 0.1593, "step": 23700 }, { "epoch": 0.4486041328246005, "grad_norm": 0.045891255140304565, "learning_rate": 2.2430206641230027e-05, "loss": 0.1597, "step": 23750 }, { "epoch": 0.4495485625779155, "grad_norm": 0.056684643030166626, "learning_rate": 2.2477428128895774e-05, "loss": 0.1596, "step": 23800 }, { "epoch": 0.4504929923312304, "grad_norm": 0.052081961184740067, "learning_rate": 2.2524649616561522e-05, "loss": 0.159, "step": 23850 }, { "epoch": 0.45143742208454535, "grad_norm": 0.04807828739285469, "learning_rate": 2.257187110422727e-05, "loss": 0.16, "step": 23900 }, { "epoch": 0.4523818518378603, "grad_norm": 0.04826336354017258, "learning_rate": 2.2619092591893017e-05, "loss": 0.1591, "step": 23950 }, { "epoch": 0.4533262815911753, "grad_norm": 0.047341976314783096, "learning_rate": 2.2666314079558764e-05, "loss": 0.1592, "step": 24000 }, { "epoch": 0.4542707113444902, "grad_norm": 0.05517047643661499, "learning_rate": 2.271353556722451e-05, "loss": 0.1594, "step": 24050 }, { "epoch": 0.45521514109780514, "grad_norm": 0.04903708025813103, "learning_rate": 2.276075705489026e-05, "loss": 0.1592, "step": 24100 }, { "epoch": 0.4561595708511201, "grad_norm": 0.04570724442601204, "learning_rate": 2.2807978542556006e-05, "loss": 0.1595, "step": 24150 }, { "epoch": 0.45710400060443507, "grad_norm": 0.052628882229328156, "learning_rate": 2.2855200030221754e-05, "loss": 0.1597, "step": 24200 }, { "epoch": 0.45804843035775, "grad_norm": 0.04528496041893959, "learning_rate": 2.29024215178875e-05, "loss": 0.1589, "step": 24250 }, { "epoch": 0.45899286011106494, "grad_norm": 0.052243687212467194, "learning_rate": 2.294964300555325e-05, "loss": 0.1595, "step": 24300 }, { "epoch": 0.4599372898643799, "grad_norm": 0.051040031015872955, "learning_rate": 2.2996864493218996e-05, "loss": 0.1594, "step": 24350 }, { "epoch": 0.46088171961769486, "grad_norm": 0.0495796725153923, "learning_rate": 2.3044085980884743e-05, "loss": 0.1588, "step": 24400 }, { "epoch": 0.4618261493710098, "grad_norm": 0.044973067939281464, "learning_rate": 2.309130746855049e-05, "loss": 0.1592, "step": 24450 }, { "epoch": 0.46277057912432473, "grad_norm": 0.04926302656531334, "learning_rate": 2.3138528956216238e-05, "loss": 0.1591, "step": 24500 }, { "epoch": 0.46371500887763967, "grad_norm": 0.05289784073829651, "learning_rate": 2.3185750443881986e-05, "loss": 0.1587, "step": 24550 }, { "epoch": 0.4646594386309546, "grad_norm": 0.04602381959557533, "learning_rate": 2.323297193154773e-05, "loss": 0.1587, "step": 24600 }, { "epoch": 0.4656038683842696, "grad_norm": 0.04793664813041687, "learning_rate": 2.328019341921348e-05, "loss": 0.1584, "step": 24650 }, { "epoch": 0.4665482981375845, "grad_norm": 0.0472899004817009, "learning_rate": 2.3327414906879228e-05, "loss": 0.159, "step": 24700 }, { "epoch": 0.46749272789089946, "grad_norm": 0.05157702416181564, "learning_rate": 2.3374636394544975e-05, "loss": 0.1586, "step": 24750 }, { "epoch": 0.4684371576442144, "grad_norm": 0.05022266134619713, "learning_rate": 2.342185788221072e-05, "loss": 0.1581, "step": 24800 }, { "epoch": 0.4693815873975294, "grad_norm": 0.045308325439691544, "learning_rate": 2.346907936987647e-05, "loss": 0.1582, "step": 24850 }, { "epoch": 0.4703260171508443, "grad_norm": 0.04587983712553978, "learning_rate": 2.3516300857542218e-05, "loss": 0.1581, "step": 24900 }, { "epoch": 0.47127044690415926, "grad_norm": 0.05331459268927574, "learning_rate": 2.3563522345207965e-05, "loss": 0.1589, "step": 24950 }, { "epoch": 0.4722148766574742, "grad_norm": 0.04572860524058342, "learning_rate": 2.361074383287371e-05, "loss": 0.1581, "step": 25000 }, { "epoch": 0.4722148766574742, "eval_IntDiv": 0.6749035325926918, "eval_NumCircles": 2090, "eval_SumBottleneck": 6.851700690576545, "eval_Uniqueness": 0.9958998226950354, "eval_Validity": 0.9024, "eval_Validity * Uniqueness": 0.8986999999999999, "eval_loss": 0.21742303669452667, "eval_runtime": 182.3984, "eval_samples_per_second": 54.825, "eval_steps_per_second": 0.433, "step": 25000 }, { "epoch": 0.4731593064107892, "grad_norm": 0.04581652209162712, "learning_rate": 2.365796532053946e-05, "loss": 0.1585, "step": 25050 }, { "epoch": 0.4741037361641041, "grad_norm": 0.05741024389863014, "learning_rate": 2.3705186808205207e-05, "loss": 0.158, "step": 25100 }, { "epoch": 0.47504816591741905, "grad_norm": 0.04329367354512215, "learning_rate": 2.3752408295870955e-05, "loss": 0.158, "step": 25150 }, { "epoch": 0.475992595670734, "grad_norm": 0.06485868245363235, "learning_rate": 2.37996297835367e-05, "loss": 0.158, "step": 25200 }, { "epoch": 0.476937025424049, "grad_norm": 0.047800544649362564, "learning_rate": 2.384685127120245e-05, "loss": 0.1576, "step": 25250 }, { "epoch": 0.4778814551773639, "grad_norm": 0.04749397933483124, "learning_rate": 2.3894072758868197e-05, "loss": 0.1579, "step": 25300 }, { "epoch": 0.47882588493067885, "grad_norm": 0.04395749047398567, "learning_rate": 2.3941294246533944e-05, "loss": 0.1577, "step": 25350 }, { "epoch": 0.4797703146839938, "grad_norm": 0.05013731122016907, "learning_rate": 2.3988515734199692e-05, "loss": 0.1575, "step": 25400 }, { "epoch": 0.48071474443730877, "grad_norm": 0.051896460354328156, "learning_rate": 2.403573722186544e-05, "loss": 0.1576, "step": 25450 }, { "epoch": 0.4816591741906237, "grad_norm": 0.04924899339675903, "learning_rate": 2.4082958709531187e-05, "loss": 0.1579, "step": 25500 }, { "epoch": 0.48260360394393864, "grad_norm": 0.04659641906619072, "learning_rate": 2.4130180197196934e-05, "loss": 0.1576, "step": 25550 }, { "epoch": 0.4835480336972536, "grad_norm": 0.04758733510971069, "learning_rate": 2.417740168486268e-05, "loss": 0.1575, "step": 25600 }, { "epoch": 0.48449246345056857, "grad_norm": 0.05001719668507576, "learning_rate": 2.422462317252843e-05, "loss": 0.1573, "step": 25650 }, { "epoch": 0.4854368932038835, "grad_norm": 0.04748954251408577, "learning_rate": 2.4271844660194176e-05, "loss": 0.1574, "step": 25700 }, { "epoch": 0.48638132295719844, "grad_norm": 0.044687461107969284, "learning_rate": 2.4319066147859924e-05, "loss": 0.1573, "step": 25750 }, { "epoch": 0.48732575271051337, "grad_norm": 0.043375976383686066, "learning_rate": 2.436628763552567e-05, "loss": 0.1576, "step": 25800 }, { "epoch": 0.48827018246382836, "grad_norm": 0.05321745574474335, "learning_rate": 2.441350912319142e-05, "loss": 0.1572, "step": 25850 }, { "epoch": 0.4892146122171433, "grad_norm": 0.052148446440696716, "learning_rate": 2.4460730610857166e-05, "loss": 0.1568, "step": 25900 }, { "epoch": 0.49015904197045823, "grad_norm": 0.04462754726409912, "learning_rate": 2.4507952098522914e-05, "loss": 0.1567, "step": 25950 }, { "epoch": 0.49110347172377317, "grad_norm": 0.04695236310362816, "learning_rate": 2.455517358618866e-05, "loss": 0.157, "step": 26000 }, { "epoch": 0.49204790147708816, "grad_norm": 0.05179441347718239, "learning_rate": 2.460239507385441e-05, "loss": 0.157, "step": 26050 }, { "epoch": 0.4929923312304031, "grad_norm": 0.043727729469537735, "learning_rate": 2.4649616561520156e-05, "loss": 0.1563, "step": 26100 }, { "epoch": 0.493936760983718, "grad_norm": 0.049075886607170105, "learning_rate": 2.4696838049185903e-05, "loss": 0.1571, "step": 26150 }, { "epoch": 0.49488119073703296, "grad_norm": 0.047818735241889954, "learning_rate": 2.474405953685165e-05, "loss": 0.1566, "step": 26200 }, { "epoch": 0.49582562049034795, "grad_norm": 0.0488211065530777, "learning_rate": 2.4791281024517398e-05, "loss": 0.1567, "step": 26250 }, { "epoch": 0.4967700502436629, "grad_norm": 0.04699009656906128, "learning_rate": 2.4838502512183146e-05, "loss": 0.1568, "step": 26300 }, { "epoch": 0.4977144799969778, "grad_norm": 0.05092700198292732, "learning_rate": 2.4885723999848893e-05, "loss": 0.157, "step": 26350 }, { "epoch": 0.49865890975029276, "grad_norm": 0.04320160672068596, "learning_rate": 2.493294548751464e-05, "loss": 0.1565, "step": 26400 }, { "epoch": 0.49960333950360775, "grad_norm": 0.05727711319923401, "learning_rate": 2.4980166975180388e-05, "loss": 0.1567, "step": 26450 }, { "epoch": 0.5005477692569227, "grad_norm": 0.04930399730801582, "learning_rate": 2.5027388462846135e-05, "loss": 0.1568, "step": 26500 }, { "epoch": 0.5014921990102377, "grad_norm": 0.05059923604130745, "learning_rate": 2.5074609950511886e-05, "loss": 0.1569, "step": 26550 }, { "epoch": 0.5024366287635526, "grad_norm": 0.04332175478339195, "learning_rate": 2.512183143817763e-05, "loss": 0.1566, "step": 26600 }, { "epoch": 0.5033810585168675, "grad_norm": 0.053408633917570114, "learning_rate": 2.5169052925843378e-05, "loss": 0.1562, "step": 26650 }, { "epoch": 0.5043254882701824, "grad_norm": 0.04940927028656006, "learning_rate": 2.521627441350912e-05, "loss": 0.1565, "step": 26700 }, { "epoch": 0.5052699180234974, "grad_norm": 0.0534246489405632, "learning_rate": 2.5263495901174872e-05, "loss": 0.1563, "step": 26750 }, { "epoch": 0.5062143477768124, "grad_norm": 0.045244380831718445, "learning_rate": 2.531071738884062e-05, "loss": 0.1562, "step": 26800 }, { "epoch": 0.5071587775301273, "grad_norm": 0.04426327720284462, "learning_rate": 2.5357938876506364e-05, "loss": 0.1562, "step": 26850 }, { "epoch": 0.5081032072834423, "grad_norm": 0.045144565403461456, "learning_rate": 2.5405160364172115e-05, "loss": 0.1555, "step": 26900 }, { "epoch": 0.5090476370367573, "grad_norm": 0.0495845302939415, "learning_rate": 2.5452381851837865e-05, "loss": 0.1556, "step": 26950 }, { "epoch": 0.5099920667900721, "grad_norm": 0.05211186036467552, "learning_rate": 2.549960333950361e-05, "loss": 0.1559, "step": 27000 }, { "epoch": 0.5109364965433871, "grad_norm": 0.04264421761035919, "learning_rate": 2.5546824827169357e-05, "loss": 0.1554, "step": 27050 }, { "epoch": 0.511880926296702, "grad_norm": 0.05559466406702995, "learning_rate": 2.55940463148351e-05, "loss": 0.1555, "step": 27100 }, { "epoch": 0.512825356050017, "grad_norm": 0.0480094738304615, "learning_rate": 2.5641267802500852e-05, "loss": 0.1556, "step": 27150 }, { "epoch": 0.513769785803332, "grad_norm": 0.04755575209856033, "learning_rate": 2.56884892901666e-05, "loss": 0.1558, "step": 27200 }, { "epoch": 0.5147142155566469, "grad_norm": 0.04603414237499237, "learning_rate": 2.5735710777832343e-05, "loss": 0.1556, "step": 27250 }, { "epoch": 0.5156586453099619, "grad_norm": 0.047985028475522995, "learning_rate": 2.5782932265498094e-05, "loss": 0.1557, "step": 27300 }, { "epoch": 0.5166030750632767, "grad_norm": 0.04816871136426926, "learning_rate": 2.5830153753163838e-05, "loss": 0.1553, "step": 27350 }, { "epoch": 0.5175475048165917, "grad_norm": 0.045150693506002426, "learning_rate": 2.587737524082959e-05, "loss": 0.1554, "step": 27400 }, { "epoch": 0.5184919345699067, "grad_norm": 0.06711737811565399, "learning_rate": 2.5924596728495336e-05, "loss": 0.155, "step": 27450 }, { "epoch": 0.5194363643232216, "grad_norm": 0.05005151778459549, "learning_rate": 2.597181821616108e-05, "loss": 0.1553, "step": 27500 }, { "epoch": 0.5194363643232216, "eval_IntDiv": 0.6759081241684225, "eval_NumCircles": 2043, "eval_SumBottleneck": 15.431755526387365, "eval_Uniqueness": 0.9953942318236648, "eval_Validity": 0.9119, "eval_Validity * Uniqueness": 0.9077, "eval_loss": 0.22005124390125275, "eval_runtime": 124.0571, "eval_samples_per_second": 80.608, "eval_steps_per_second": 0.637, "step": 27500 }, { "epoch": 0.5203807940765366, "grad_norm": 0.04579911381006241, "learning_rate": 2.601903970382683e-05, "loss": 0.1549, "step": 27550 }, { "epoch": 0.5213252238298516, "grad_norm": 0.04828266054391861, "learning_rate": 2.606626119149258e-05, "loss": 0.1553, "step": 27600 }, { "epoch": 0.5222696535831665, "grad_norm": 0.04638790711760521, "learning_rate": 2.6113482679158323e-05, "loss": 0.155, "step": 27650 }, { "epoch": 0.5232140833364815, "grad_norm": 0.05341976135969162, "learning_rate": 2.6160704166824073e-05, "loss": 0.1556, "step": 27700 }, { "epoch": 0.5241585130897963, "grad_norm": 0.046980440616607666, "learning_rate": 2.6207925654489817e-05, "loss": 0.1545, "step": 27750 }, { "epoch": 0.5251029428431113, "grad_norm": 0.05067123845219612, "learning_rate": 2.6255147142155568e-05, "loss": 0.1547, "step": 27800 }, { "epoch": 0.5260473725964263, "grad_norm": 0.052519671618938446, "learning_rate": 2.6302368629821316e-05, "loss": 0.155, "step": 27850 }, { "epoch": 0.5269918023497412, "grad_norm": 0.0610831044614315, "learning_rate": 2.634959011748706e-05, "loss": 0.1545, "step": 27900 }, { "epoch": 0.5279362321030562, "grad_norm": 0.05216547101736069, "learning_rate": 2.639681160515281e-05, "loss": 0.1548, "step": 27950 }, { "epoch": 0.5288806618563712, "grad_norm": 0.04268569126725197, "learning_rate": 2.644403309281856e-05, "loss": 0.1552, "step": 28000 }, { "epoch": 0.529825091609686, "grad_norm": 0.043124664574861526, "learning_rate": 2.6491254580484305e-05, "loss": 0.1545, "step": 28050 }, { "epoch": 0.530769521363001, "grad_norm": 0.04558455944061279, "learning_rate": 2.6538476068150053e-05, "loss": 0.1551, "step": 28100 }, { "epoch": 0.5317139511163159, "grad_norm": 0.044200774282217026, "learning_rate": 2.6585697555815797e-05, "loss": 0.1543, "step": 28150 }, { "epoch": 0.5326583808696309, "grad_norm": 0.05584769695997238, "learning_rate": 2.6632919043481548e-05, "loss": 0.1542, "step": 28200 }, { "epoch": 0.5336028106229459, "grad_norm": 0.04479102045297623, "learning_rate": 2.6680140531147295e-05, "loss": 0.1548, "step": 28250 }, { "epoch": 0.5345472403762608, "grad_norm": 0.04345661401748657, "learning_rate": 2.672736201881304e-05, "loss": 0.1544, "step": 28300 }, { "epoch": 0.5354916701295758, "grad_norm": 0.04374394193291664, "learning_rate": 2.677458350647879e-05, "loss": 0.1542, "step": 28350 }, { "epoch": 0.5364360998828908, "grad_norm": 0.04467054829001427, "learning_rate": 2.682180499414454e-05, "loss": 0.155, "step": 28400 }, { "epoch": 0.5373805296362056, "grad_norm": 0.04466468468308449, "learning_rate": 2.6869026481810285e-05, "loss": 0.1545, "step": 28450 }, { "epoch": 0.5383249593895206, "grad_norm": 0.04459542781114578, "learning_rate": 2.6916247969476032e-05, "loss": 0.1542, "step": 28500 }, { "epoch": 0.5392693891428355, "grad_norm": 0.042323678731918335, "learning_rate": 2.6963469457141776e-05, "loss": 0.1541, "step": 28550 }, { "epoch": 0.5402138188961505, "grad_norm": 0.048397697508335114, "learning_rate": 2.7010690944807527e-05, "loss": 0.1543, "step": 28600 }, { "epoch": 0.5411582486494655, "grad_norm": 0.04209814965724945, "learning_rate": 2.7057912432473275e-05, "loss": 0.154, "step": 28650 }, { "epoch": 0.5421026784027804, "grad_norm": 0.044207844883203506, "learning_rate": 2.710513392013902e-05, "loss": 0.1535, "step": 28700 }, { "epoch": 0.5430471081560954, "grad_norm": 0.04861968010663986, "learning_rate": 2.715235540780477e-05, "loss": 0.154, "step": 28750 }, { "epoch": 0.5439915379094103, "grad_norm": 0.044259048998355865, "learning_rate": 2.719957689547052e-05, "loss": 0.1541, "step": 28800 }, { "epoch": 0.5449359676627252, "grad_norm": 0.04490683227777481, "learning_rate": 2.7246798383136264e-05, "loss": 0.1539, "step": 28850 }, { "epoch": 0.5458803974160402, "grad_norm": 0.043924104422330856, "learning_rate": 2.729401987080201e-05, "loss": 0.1536, "step": 28900 }, { "epoch": 0.5468248271693551, "grad_norm": 0.0450325682759285, "learning_rate": 2.7341241358467756e-05, "loss": 0.1541, "step": 28950 }, { "epoch": 0.5477692569226701, "grad_norm": 0.045916877686977386, "learning_rate": 2.7388462846133506e-05, "loss": 0.1537, "step": 29000 }, { "epoch": 0.5487136866759851, "grad_norm": 0.04375700652599335, "learning_rate": 2.7435684333799254e-05, "loss": 0.1535, "step": 29050 }, { "epoch": 0.5496581164293, "grad_norm": 0.04615338146686554, "learning_rate": 2.7482905821464998e-05, "loss": 0.1534, "step": 29100 }, { "epoch": 0.550602546182615, "grad_norm": 0.04711620509624481, "learning_rate": 2.753012730913075e-05, "loss": 0.1539, "step": 29150 }, { "epoch": 0.5515469759359299, "grad_norm": 0.044599030166864395, "learning_rate": 2.75773487967965e-05, "loss": 0.1539, "step": 29200 }, { "epoch": 0.5524914056892448, "grad_norm": 0.04440312460064888, "learning_rate": 2.7624570284462244e-05, "loss": 0.1533, "step": 29250 }, { "epoch": 0.5534358354425598, "grad_norm": 0.04638102650642395, "learning_rate": 2.767179177212799e-05, "loss": 0.1533, "step": 29300 }, { "epoch": 0.5543802651958747, "grad_norm": 0.053348176181316376, "learning_rate": 2.7719013259793735e-05, "loss": 0.1538, "step": 29350 }, { "epoch": 0.5553246949491897, "grad_norm": 0.050860531628131866, "learning_rate": 2.7766234747459486e-05, "loss": 0.1533, "step": 29400 }, { "epoch": 0.5562691247025047, "grad_norm": 0.04356103390455246, "learning_rate": 2.7813456235125233e-05, "loss": 0.1527, "step": 29450 }, { "epoch": 0.5572135544558195, "grad_norm": 0.042640671133995056, "learning_rate": 2.7860677722790977e-05, "loss": 0.1532, "step": 29500 }, { "epoch": 0.5581579842091345, "grad_norm": 0.04304592311382294, "learning_rate": 2.7907899210456728e-05, "loss": 0.153, "step": 29550 }, { "epoch": 0.5591024139624494, "grad_norm": 0.04316912591457367, "learning_rate": 2.7955120698122472e-05, "loss": 0.1533, "step": 29600 }, { "epoch": 0.5600468437157644, "grad_norm": 0.04900282993912697, "learning_rate": 2.8002342185788223e-05, "loss": 0.1531, "step": 29650 }, { "epoch": 0.5609912734690794, "grad_norm": 0.04648090526461601, "learning_rate": 2.804956367345397e-05, "loss": 0.1537, "step": 29700 }, { "epoch": 0.5619357032223943, "grad_norm": 0.04537497088313103, "learning_rate": 2.8096785161119714e-05, "loss": 0.1531, "step": 29750 }, { "epoch": 0.5628801329757093, "grad_norm": 0.0440855398774147, "learning_rate": 2.8144006648785465e-05, "loss": 0.1532, "step": 29800 }, { "epoch": 0.5638245627290243, "grad_norm": 0.04407341778278351, "learning_rate": 2.8191228136451213e-05, "loss": 0.1526, "step": 29850 }, { "epoch": 0.5647689924823391, "grad_norm": 0.044014111161231995, "learning_rate": 2.8238449624116957e-05, "loss": 0.153, "step": 29900 }, { "epoch": 0.5657134222356541, "grad_norm": 0.04828241467475891, "learning_rate": 2.8285671111782708e-05, "loss": 0.1529, "step": 29950 }, { "epoch": 0.566657851988969, "grad_norm": 0.057511258870363235, "learning_rate": 2.833289259944845e-05, "loss": 0.1526, "step": 30000 }, { "epoch": 0.566657851988969, "eval_IntDiv": 0.6733873312690326, "eval_NumCircles": 2029, "eval_SumBottleneck": 94.85636791770321, "eval_Uniqueness": 0.9959974037213327, "eval_Validity": 0.9244, "eval_Validity * Uniqueness": 0.9207, "eval_loss": 0.22100494801998138, "eval_runtime": 132.8129, "eval_samples_per_second": 75.294, "eval_steps_per_second": 0.595, "step": 30000 }, { "epoch": 0.567602281742284, "grad_norm": 0.043798502534627914, "learning_rate": 2.8380114087114202e-05, "loss": 0.1525, "step": 30050 }, { "epoch": 0.568546711495599, "grad_norm": 0.04901360720396042, "learning_rate": 2.842733557477995e-05, "loss": 0.152, "step": 30100 }, { "epoch": 0.5694911412489139, "grad_norm": 0.045699212700128555, "learning_rate": 2.8474557062445694e-05, "loss": 0.1525, "step": 30150 }, { "epoch": 0.5704355710022289, "grad_norm": 0.04512882977724075, "learning_rate": 2.8521778550111445e-05, "loss": 0.1524, "step": 30200 }, { "epoch": 0.5713800007555438, "grad_norm": 0.050868455320596695, "learning_rate": 2.8569000037777192e-05, "loss": 0.1522, "step": 30250 }, { "epoch": 0.5723244305088587, "grad_norm": 0.0531810037791729, "learning_rate": 2.8616221525442936e-05, "loss": 0.1527, "step": 30300 }, { "epoch": 0.5732688602621737, "grad_norm": 0.0464874766767025, "learning_rate": 2.8663443013108687e-05, "loss": 0.1529, "step": 30350 }, { "epoch": 0.5742132900154886, "grad_norm": 0.04772254452109337, "learning_rate": 2.871066450077443e-05, "loss": 0.1531, "step": 30400 }, { "epoch": 0.5751577197688036, "grad_norm": 0.05246063694357872, "learning_rate": 2.8757885988440182e-05, "loss": 0.1521, "step": 30450 }, { "epoch": 0.5761021495221186, "grad_norm": 0.05110354721546173, "learning_rate": 2.880510747610593e-05, "loss": 0.1523, "step": 30500 }, { "epoch": 0.5770465792754335, "grad_norm": 0.041170086711645126, "learning_rate": 2.8852328963771673e-05, "loss": 0.1518, "step": 30550 }, { "epoch": 0.5779910090287484, "grad_norm": 0.049853697419166565, "learning_rate": 2.8899550451437424e-05, "loss": 0.152, "step": 30600 }, { "epoch": 0.5789354387820634, "grad_norm": 0.044876206666231155, "learning_rate": 2.8946771939103175e-05, "loss": 0.1524, "step": 30650 }, { "epoch": 0.5798798685353783, "grad_norm": 0.04139046370983124, "learning_rate": 2.899399342676892e-05, "loss": 0.1521, "step": 30700 }, { "epoch": 0.5808242982886933, "grad_norm": 0.04761512205004692, "learning_rate": 2.9041214914434666e-05, "loss": 0.1521, "step": 30750 }, { "epoch": 0.5817687280420082, "grad_norm": 0.04319838061928749, "learning_rate": 2.908843640210041e-05, "loss": 0.1519, "step": 30800 }, { "epoch": 0.5827131577953232, "grad_norm": 0.04349119961261749, "learning_rate": 2.913565788976616e-05, "loss": 0.1518, "step": 30850 }, { "epoch": 0.5836575875486382, "grad_norm": 0.03965750336647034, "learning_rate": 2.918287937743191e-05, "loss": 0.1522, "step": 30900 }, { "epoch": 0.584602017301953, "grad_norm": 0.05037494748830795, "learning_rate": 2.9230100865097653e-05, "loss": 0.1517, "step": 30950 }, { "epoch": 0.585546447055268, "grad_norm": 0.04333679750561714, "learning_rate": 2.9277322352763403e-05, "loss": 0.1517, "step": 31000 }, { "epoch": 0.586490876808583, "grad_norm": 0.0419125109910965, "learning_rate": 2.9324543840429154e-05, "loss": 0.152, "step": 31050 }, { "epoch": 0.5874353065618979, "grad_norm": 0.04751225933432579, "learning_rate": 2.93717653280949e-05, "loss": 0.1516, "step": 31100 }, { "epoch": 0.5883797363152129, "grad_norm": 0.043536752462387085, "learning_rate": 2.9418986815760646e-05, "loss": 0.1514, "step": 31150 }, { "epoch": 0.5893241660685278, "grad_norm": 0.04816202074289322, "learning_rate": 2.946620830342639e-05, "loss": 0.1513, "step": 31200 }, { "epoch": 0.5902685958218428, "grad_norm": 0.04625553637742996, "learning_rate": 2.951342979109214e-05, "loss": 0.1516, "step": 31250 }, { "epoch": 0.5912130255751578, "grad_norm": 0.047176361083984375, "learning_rate": 2.9560651278757888e-05, "loss": 0.1517, "step": 31300 }, { "epoch": 0.5921574553284726, "grad_norm": 0.04586511850357056, "learning_rate": 2.9607872766423632e-05, "loss": 0.1516, "step": 31350 }, { "epoch": 0.5931018850817876, "grad_norm": 0.04349669814109802, "learning_rate": 2.9655094254089383e-05, "loss": 0.1516, "step": 31400 }, { "epoch": 0.5940463148351026, "grad_norm": 0.04172945022583008, "learning_rate": 2.9702315741755134e-05, "loss": 0.1515, "step": 31450 }, { "epoch": 0.5949907445884175, "grad_norm": 0.04460207372903824, "learning_rate": 2.9749537229420878e-05, "loss": 0.1509, "step": 31500 }, { "epoch": 0.5959351743417325, "grad_norm": 0.04792268946766853, "learning_rate": 2.9796758717086625e-05, "loss": 0.1513, "step": 31550 }, { "epoch": 0.5968796040950474, "grad_norm": 0.042499180883169174, "learning_rate": 2.984398020475237e-05, "loss": 0.1522, "step": 31600 }, { "epoch": 0.5978240338483624, "grad_norm": 0.046458616852760315, "learning_rate": 2.989120169241812e-05, "loss": 0.1506, "step": 31650 }, { "epoch": 0.5987684636016773, "grad_norm": 0.042233433574438095, "learning_rate": 2.9938423180083867e-05, "loss": 0.1506, "step": 31700 }, { "epoch": 0.5997128933549922, "grad_norm": 0.04203198105096817, "learning_rate": 2.998564466774961e-05, "loss": 0.1511, "step": 31750 }, { "epoch": 0.6006573231083072, "grad_norm": 0.043934185057878494, "learning_rate": 3.0032866155415362e-05, "loss": 0.1511, "step": 31800 }, { "epoch": 0.6016017528616222, "grad_norm": 0.048820290714502335, "learning_rate": 3.0080087643081113e-05, "loss": 0.151, "step": 31850 }, { "epoch": 0.6025461826149371, "grad_norm": 0.04007445648312569, "learning_rate": 3.0127309130746857e-05, "loss": 0.1508, "step": 31900 }, { "epoch": 0.6034906123682521, "grad_norm": 0.046698328107595444, "learning_rate": 3.0174530618412605e-05, "loss": 0.1511, "step": 31950 }, { "epoch": 0.604435042121567, "grad_norm": 0.044066209346055984, "learning_rate": 3.022175210607835e-05, "loss": 0.1509, "step": 32000 }, { "epoch": 0.605379471874882, "grad_norm": 0.04355258867144585, "learning_rate": 3.02689735937441e-05, "loss": 0.1508, "step": 32050 }, { "epoch": 0.6063239016281969, "grad_norm": 0.04353592172265053, "learning_rate": 3.0316195081409847e-05, "loss": 0.1506, "step": 32100 }, { "epoch": 0.6072683313815118, "grad_norm": 0.043385494500398636, "learning_rate": 3.036341656907559e-05, "loss": 0.1512, "step": 32150 }, { "epoch": 0.6082127611348268, "grad_norm": 0.04625597223639488, "learning_rate": 3.0410638056741342e-05, "loss": 0.1503, "step": 32200 }, { "epoch": 0.6091571908881417, "grad_norm": 0.04363720118999481, "learning_rate": 3.0457859544407086e-05, "loss": 0.1507, "step": 32250 }, { "epoch": 0.6101016206414567, "grad_norm": 0.045969411730766296, "learning_rate": 3.0505081032072837e-05, "loss": 0.1506, "step": 32300 }, { "epoch": 0.6110460503947717, "grad_norm": 0.04395844787359238, "learning_rate": 3.0552302519738584e-05, "loss": 0.1503, "step": 32350 }, { "epoch": 0.6119904801480865, "grad_norm": 0.04256156459450722, "learning_rate": 3.059952400740433e-05, "loss": 0.1506, "step": 32400 }, { "epoch": 0.6129349099014015, "grad_norm": 0.04682016372680664, "learning_rate": 3.064674549507008e-05, "loss": 0.1502, "step": 32450 }, { "epoch": 0.6138793396547165, "grad_norm": 0.04435824975371361, "learning_rate": 3.0693966982735826e-05, "loss": 0.1504, "step": 32500 }, { "epoch": 0.6138793396547165, "eval_IntDiv": 0.6721615290451819, "eval_NumCircles": 2035, "eval_SumBottleneck": 66.73841546496317, "eval_Uniqueness": 0.9964736054712545, "eval_Validity": 0.9358, "eval_Validity * Uniqueness": 0.9325, "eval_loss": 0.21875813603401184, "eval_runtime": 137.5845, "eval_samples_per_second": 72.683, "eval_steps_per_second": 0.574, "step": 32500 }, { "epoch": 0.6148237694080314, "grad_norm": 0.04001381993293762, "learning_rate": 3.0741188470401574e-05, "loss": 0.1501, "step": 32550 }, { "epoch": 0.6157681991613464, "grad_norm": 0.04838736355304718, "learning_rate": 3.078840995806732e-05, "loss": 0.1505, "step": 32600 }, { "epoch": 0.6167126289146613, "grad_norm": 0.04443756118416786, "learning_rate": 3.083563144573307e-05, "loss": 0.1508, "step": 32650 }, { "epoch": 0.6176570586679763, "grad_norm": 0.04403910040855408, "learning_rate": 3.0882852933398816e-05, "loss": 0.1503, "step": 32700 }, { "epoch": 0.6186014884212913, "grad_norm": 0.04639765992760658, "learning_rate": 3.093007442106456e-05, "loss": 0.1504, "step": 32750 }, { "epoch": 0.6195459181746061, "grad_norm": 0.046807777136564255, "learning_rate": 3.097729590873031e-05, "loss": 0.1497, "step": 32800 }, { "epoch": 0.6204903479279211, "grad_norm": 0.042669061571359634, "learning_rate": 3.102451739639606e-05, "loss": 0.1507, "step": 32850 }, { "epoch": 0.6214347776812361, "grad_norm": 0.04330708086490631, "learning_rate": 3.1071738884061806e-05, "loss": 0.1503, "step": 32900 }, { "epoch": 0.622379207434551, "grad_norm": 0.04079671576619148, "learning_rate": 3.111896037172755e-05, "loss": 0.1497, "step": 32950 }, { "epoch": 0.623323637187866, "grad_norm": 0.041497327387332916, "learning_rate": 3.11661818593933e-05, "loss": 0.15, "step": 33000 }, { "epoch": 0.6242680669411809, "grad_norm": 0.043404724448919296, "learning_rate": 3.121340334705905e-05, "loss": 0.15, "step": 33050 }, { "epoch": 0.6252124966944959, "grad_norm": 0.04196419566869736, "learning_rate": 3.1260624834724795e-05, "loss": 0.1499, "step": 33100 }, { "epoch": 0.6261569264478108, "grad_norm": 0.0513342022895813, "learning_rate": 3.130784632239054e-05, "loss": 0.1494, "step": 33150 }, { "epoch": 0.6271013562011257, "grad_norm": 0.04405048117041588, "learning_rate": 3.135506781005629e-05, "loss": 0.15, "step": 33200 }, { "epoch": 0.6280457859544407, "grad_norm": 0.0435125008225441, "learning_rate": 3.140228929772204e-05, "loss": 0.15, "step": 33250 }, { "epoch": 0.6289902157077557, "grad_norm": 0.04210624098777771, "learning_rate": 3.1449510785387785e-05, "loss": 0.1495, "step": 33300 }, { "epoch": 0.6299346454610706, "grad_norm": 0.044044654816389084, "learning_rate": 3.149673227305353e-05, "loss": 0.1503, "step": 33350 }, { "epoch": 0.6308790752143856, "grad_norm": 0.046324584633111954, "learning_rate": 3.154395376071928e-05, "loss": 0.1499, "step": 33400 }, { "epoch": 0.6318235049677005, "grad_norm": 0.04510977491736412, "learning_rate": 3.159117524838503e-05, "loss": 0.1503, "step": 33450 }, { "epoch": 0.6327679347210154, "grad_norm": 0.04453182965517044, "learning_rate": 3.1638396736050775e-05, "loss": 0.1496, "step": 33500 }, { "epoch": 0.6337123644743304, "grad_norm": 0.04619555547833443, "learning_rate": 3.168561822371652e-05, "loss": 0.15, "step": 33550 }, { "epoch": 0.6346567942276453, "grad_norm": 0.046492885798215866, "learning_rate": 3.173283971138227e-05, "loss": 0.1494, "step": 33600 }, { "epoch": 0.6356012239809603, "grad_norm": 0.044635359197854996, "learning_rate": 3.178006119904802e-05, "loss": 0.1501, "step": 33650 }, { "epoch": 0.6365456537342753, "grad_norm": 0.043232157826423645, "learning_rate": 3.1827282686713764e-05, "loss": 0.1499, "step": 33700 }, { "epoch": 0.6374900834875902, "grad_norm": 0.04921558126807213, "learning_rate": 3.187450417437951e-05, "loss": 0.1502, "step": 33750 }, { "epoch": 0.6384345132409052, "grad_norm": 0.045477837324142456, "learning_rate": 3.192172566204526e-05, "loss": 0.1496, "step": 33800 }, { "epoch": 0.63937894299422, "grad_norm": 0.03983936831355095, "learning_rate": 3.196894714971101e-05, "loss": 0.1492, "step": 33850 }, { "epoch": 0.640323372747535, "grad_norm": 0.052483588457107544, "learning_rate": 3.2016168637376754e-05, "loss": 0.1497, "step": 33900 }, { "epoch": 0.64126780250085, "grad_norm": 0.04190405458211899, "learning_rate": 3.20633901250425e-05, "loss": 0.1495, "step": 33950 }, { "epoch": 0.6422122322541649, "grad_norm": 0.04555065557360649, "learning_rate": 3.211061161270825e-05, "loss": 0.149, "step": 34000 }, { "epoch": 0.6431566620074799, "grad_norm": 0.045656684786081314, "learning_rate": 3.2157833100373996e-05, "loss": 0.1491, "step": 34050 }, { "epoch": 0.6441010917607949, "grad_norm": 0.04785612225532532, "learning_rate": 3.2205054588039744e-05, "loss": 0.1494, "step": 34100 }, { "epoch": 0.6450455215141098, "grad_norm": 0.049298759549856186, "learning_rate": 3.225227607570549e-05, "loss": 0.1495, "step": 34150 }, { "epoch": 0.6459899512674248, "grad_norm": 0.04267873242497444, "learning_rate": 3.229949756337124e-05, "loss": 0.1494, "step": 34200 }, { "epoch": 0.6469343810207396, "grad_norm": 0.04413650929927826, "learning_rate": 3.2346719051036986e-05, "loss": 0.1492, "step": 34250 }, { "epoch": 0.6478788107740546, "grad_norm": 0.04392082244157791, "learning_rate": 3.2393940538702734e-05, "loss": 0.1489, "step": 34300 }, { "epoch": 0.6488232405273696, "grad_norm": 0.0455198809504509, "learning_rate": 3.244116202636848e-05, "loss": 0.1487, "step": 34350 }, { "epoch": 0.6497676702806845, "grad_norm": 0.041449300944805145, "learning_rate": 3.248838351403423e-05, "loss": 0.149, "step": 34400 }, { "epoch": 0.6507121000339995, "grad_norm": 0.04707035422325134, "learning_rate": 3.2535605001699976e-05, "loss": 0.1491, "step": 34450 }, { "epoch": 0.6516565297873144, "grad_norm": 0.041911277920007706, "learning_rate": 3.2582826489365716e-05, "loss": 0.1491, "step": 34500 }, { "epoch": 0.6526009595406294, "grad_norm": 0.04151961952447891, "learning_rate": 3.263004797703147e-05, "loss": 0.1487, "step": 34550 }, { "epoch": 0.6535453892939443, "grad_norm": 0.044632069766521454, "learning_rate": 3.267726946469722e-05, "loss": 0.149, "step": 34600 }, { "epoch": 0.6544898190472592, "grad_norm": 0.042126793414354324, "learning_rate": 3.2724490952362966e-05, "loss": 0.1486, "step": 34650 }, { "epoch": 0.6554342488005742, "grad_norm": 0.04214045777916908, "learning_rate": 3.277171244002871e-05, "loss": 0.1479, "step": 34700 }, { "epoch": 0.6563786785538892, "grad_norm": 0.04234960675239563, "learning_rate": 3.281893392769446e-05, "loss": 0.1487, "step": 34750 }, { "epoch": 0.6573231083072041, "grad_norm": 0.039977334439754486, "learning_rate": 3.286615541536021e-05, "loss": 0.1492, "step": 34800 }, { "epoch": 0.6582675380605191, "grad_norm": 0.04243616387248039, "learning_rate": 3.2913376903025955e-05, "loss": 0.1484, "step": 34850 }, { "epoch": 0.659211967813834, "grad_norm": 0.05773103982210159, "learning_rate": 3.29605983906917e-05, "loss": 0.1483, "step": 34900 }, { "epoch": 0.660156397567149, "grad_norm": 0.04068661853671074, "learning_rate": 3.300781987835745e-05, "loss": 0.1494, "step": 34950 }, { "epoch": 0.6611008273204639, "grad_norm": 0.0442153736948967, "learning_rate": 3.30550413660232e-05, "loss": 0.1484, "step": 35000 }, { "epoch": 0.6611008273204639, "eval_IntDiv": 0.6770821801344873, "eval_NumCircles": 2058, "eval_SumBottleneck": 102.10826414955649, "eval_Uniqueness": 0.9962614825891903, "eval_Validity": 0.9362, "eval_Validity * Uniqueness": 0.9327, "eval_loss": 0.21551957726478577, "eval_runtime": 173.3323, "eval_samples_per_second": 57.693, "eval_steps_per_second": 0.456, "step": 35000 }, { "epoch": 0.6620452570737788, "grad_norm": 0.04658207297325134, "learning_rate": 3.3102262853688945e-05, "loss": 0.1484, "step": 35050 }, { "epoch": 0.6629896868270938, "grad_norm": 0.039961159229278564, "learning_rate": 3.314948434135469e-05, "loss": 0.1481, "step": 35100 }, { "epoch": 0.6639341165804088, "grad_norm": 0.04039971902966499, "learning_rate": 3.319670582902044e-05, "loss": 0.1488, "step": 35150 }, { "epoch": 0.6648785463337237, "grad_norm": 0.043323203921318054, "learning_rate": 3.324392731668619e-05, "loss": 0.1485, "step": 35200 }, { "epoch": 0.6658229760870387, "grad_norm": 0.03915318101644516, "learning_rate": 3.3291148804351935e-05, "loss": 0.1483, "step": 35250 }, { "epoch": 0.6667674058403535, "grad_norm": 0.04595942795276642, "learning_rate": 3.333837029201768e-05, "loss": 0.1483, "step": 35300 }, { "epoch": 0.6677118355936685, "grad_norm": 0.04103100299835205, "learning_rate": 3.338559177968343e-05, "loss": 0.1478, "step": 35350 }, { "epoch": 0.6686562653469835, "grad_norm": 0.04457545652985573, "learning_rate": 3.343281326734918e-05, "loss": 0.1481, "step": 35400 }, { "epoch": 0.6696006951002984, "grad_norm": 0.045350249856710434, "learning_rate": 3.3480034755014924e-05, "loss": 0.1482, "step": 35450 }, { "epoch": 0.6705451248536134, "grad_norm": 0.04725562036037445, "learning_rate": 3.352725624268067e-05, "loss": 0.1481, "step": 35500 }, { "epoch": 0.6714895546069284, "grad_norm": 0.040911879390478134, "learning_rate": 3.357447773034642e-05, "loss": 0.1482, "step": 35550 }, { "epoch": 0.6724339843602433, "grad_norm": 0.041172876954078674, "learning_rate": 3.3621699218012167e-05, "loss": 0.1476, "step": 35600 }, { "epoch": 0.6733784141135583, "grad_norm": 0.03957286849617958, "learning_rate": 3.3668920705677914e-05, "loss": 0.148, "step": 35650 }, { "epoch": 0.6743228438668731, "grad_norm": 0.04149788245558739, "learning_rate": 3.371614219334366e-05, "loss": 0.1479, "step": 35700 }, { "epoch": 0.6752672736201881, "grad_norm": 0.03935207799077034, "learning_rate": 3.376336368100941e-05, "loss": 0.1478, "step": 35750 }, { "epoch": 0.6762117033735031, "grad_norm": 0.04698629304766655, "learning_rate": 3.3810585168675156e-05, "loss": 0.1481, "step": 35800 }, { "epoch": 0.677156133126818, "grad_norm": 0.038831084966659546, "learning_rate": 3.3857806656340904e-05, "loss": 0.1479, "step": 35850 }, { "epoch": 0.678100562880133, "grad_norm": 0.03888256847858429, "learning_rate": 3.390502814400665e-05, "loss": 0.1478, "step": 35900 }, { "epoch": 0.679044992633448, "grad_norm": 0.04672541096806526, "learning_rate": 3.39522496316724e-05, "loss": 0.1481, "step": 35950 }, { "epoch": 0.6799894223867629, "grad_norm": 0.053017470985651016, "learning_rate": 3.3999471119338146e-05, "loss": 0.1478, "step": 36000 }, { "epoch": 0.6809338521400778, "grad_norm": 0.04514249786734581, "learning_rate": 3.4046692607003893e-05, "loss": 0.1472, "step": 36050 }, { "epoch": 0.6818782818933927, "grad_norm": 0.041875209659338, "learning_rate": 3.409391409466964e-05, "loss": 0.1479, "step": 36100 }, { "epoch": 0.6828227116467077, "grad_norm": 0.04394491761922836, "learning_rate": 3.414113558233539e-05, "loss": 0.1477, "step": 36150 }, { "epoch": 0.6837671414000227, "grad_norm": 0.04849394038319588, "learning_rate": 3.4188357070001136e-05, "loss": 0.1474, "step": 36200 }, { "epoch": 0.6847115711533376, "grad_norm": 0.04249487444758415, "learning_rate": 3.423557855766688e-05, "loss": 0.1474, "step": 36250 }, { "epoch": 0.6856560009066526, "grad_norm": 0.040962573140859604, "learning_rate": 3.428280004533263e-05, "loss": 0.1481, "step": 36300 }, { "epoch": 0.6866004306599676, "grad_norm": 0.04347304254770279, "learning_rate": 3.433002153299838e-05, "loss": 0.1479, "step": 36350 }, { "epoch": 0.6875448604132824, "grad_norm": 0.037552349269390106, "learning_rate": 3.4377243020664125e-05, "loss": 0.1478, "step": 36400 }, { "epoch": 0.6884892901665974, "grad_norm": 0.04572897404432297, "learning_rate": 3.442446450832987e-05, "loss": 0.1476, "step": 36450 }, { "epoch": 0.6894337199199123, "grad_norm": 0.0419122651219368, "learning_rate": 3.447168599599562e-05, "loss": 0.1475, "step": 36500 }, { "epoch": 0.6903781496732273, "grad_norm": 0.045845117419958115, "learning_rate": 3.451890748366137e-05, "loss": 0.1475, "step": 36550 }, { "epoch": 0.6913225794265423, "grad_norm": 0.042422957718372345, "learning_rate": 3.4566128971327115e-05, "loss": 0.1475, "step": 36600 }, { "epoch": 0.6922670091798572, "grad_norm": 0.0408136248588562, "learning_rate": 3.461335045899286e-05, "loss": 0.1475, "step": 36650 }, { "epoch": 0.6932114389331722, "grad_norm": 0.04876342788338661, "learning_rate": 3.466057194665861e-05, "loss": 0.1471, "step": 36700 }, { "epoch": 0.6941558686864872, "grad_norm": 0.03962872922420502, "learning_rate": 3.470779343432436e-05, "loss": 0.1471, "step": 36750 }, { "epoch": 0.695100298439802, "grad_norm": 0.04511722922325134, "learning_rate": 3.4755014921990105e-05, "loss": 0.1473, "step": 36800 }, { "epoch": 0.696044728193117, "grad_norm": 0.04210526868700981, "learning_rate": 3.480223640965585e-05, "loss": 0.1471, "step": 36850 }, { "epoch": 0.6969891579464319, "grad_norm": 0.04322464391589165, "learning_rate": 3.48494578973216e-05, "loss": 0.1474, "step": 36900 }, { "epoch": 0.6979335876997469, "grad_norm": 0.043449219316244125, "learning_rate": 3.489667938498735e-05, "loss": 0.147, "step": 36950 }, { "epoch": 0.6988780174530619, "grad_norm": 0.04591750726103783, "learning_rate": 3.4943900872653094e-05, "loss": 0.1472, "step": 37000 }, { "epoch": 0.6998224472063768, "grad_norm": 0.05744858458638191, "learning_rate": 3.499112236031884e-05, "loss": 0.1469, "step": 37050 }, { "epoch": 0.7007668769596918, "grad_norm": 0.04016308858990669, "learning_rate": 3.503834384798459e-05, "loss": 0.1472, "step": 37100 }, { "epoch": 0.7017113067130066, "grad_norm": 0.044145192950963974, "learning_rate": 3.508556533565033e-05, "loss": 0.1473, "step": 37150 }, { "epoch": 0.7026557364663216, "grad_norm": 0.043727025389671326, "learning_rate": 3.5132786823316084e-05, "loss": 0.1473, "step": 37200 }, { "epoch": 0.7036001662196366, "grad_norm": 0.045494649559259415, "learning_rate": 3.518000831098183e-05, "loss": 0.1468, "step": 37250 }, { "epoch": 0.7045445959729515, "grad_norm": 0.041169676929712296, "learning_rate": 3.522722979864758e-05, "loss": 0.1467, "step": 37300 }, { "epoch": 0.7054890257262665, "grad_norm": 0.04302212968468666, "learning_rate": 3.5274451286313326e-05, "loss": 0.1468, "step": 37350 }, { "epoch": 0.7064334554795815, "grad_norm": 0.0564848892390728, "learning_rate": 3.5321672773979074e-05, "loss": 0.1469, "step": 37400 }, { "epoch": 0.7073778852328964, "grad_norm": 0.0423211008310318, "learning_rate": 3.536889426164482e-05, "loss": 0.1467, "step": 37450 }, { "epoch": 0.7083223149862113, "grad_norm": 0.03968310356140137, "learning_rate": 3.541611574931057e-05, "loss": 0.1464, "step": 37500 }, { "epoch": 0.7083223149862113, "eval_IntDiv": 0.6745440047293156, "eval_NumCircles": 1977, "eval_SumBottleneck": 95.88656318846768, "eval_Uniqueness": 0.9949664429530202, "eval_Validity": 0.9536, "eval_Validity * Uniqueness": 0.9488000000000001, "eval_loss": 0.21881870925426483, "eval_runtime": 275.0232, "eval_samples_per_second": 36.361, "eval_steps_per_second": 0.287, "step": 37500 }, { "epoch": 0.7092667447395262, "grad_norm": 0.038500651717185974, "learning_rate": 3.5463337236976316e-05, "loss": 0.1459, "step": 37550 }, { "epoch": 0.7102111744928412, "grad_norm": 0.07079191505908966, "learning_rate": 3.5510558724642064e-05, "loss": 0.1521, "step": 37600 }, { "epoch": 0.7111556042461562, "grad_norm": 0.04474485665559769, "learning_rate": 3.555778021230781e-05, "loss": 0.1498, "step": 37650 }, { "epoch": 0.7121000339994711, "grad_norm": 0.039751190692186356, "learning_rate": 3.560500169997356e-05, "loss": 0.147, "step": 37700 }, { "epoch": 0.7130444637527861, "grad_norm": 0.04085596650838852, "learning_rate": 3.5652223187639306e-05, "loss": 0.1469, "step": 37750 }, { "epoch": 0.7139888935061011, "grad_norm": 0.04008062183856964, "learning_rate": 3.569944467530505e-05, "loss": 0.147, "step": 37800 }, { "epoch": 0.7149333232594159, "grad_norm": 0.043622080236673355, "learning_rate": 3.57466661629708e-05, "loss": 0.1463, "step": 37850 }, { "epoch": 0.7158777530127309, "grad_norm": 0.0386788435280323, "learning_rate": 3.579388765063655e-05, "loss": 0.1466, "step": 37900 }, { "epoch": 0.7168221827660458, "grad_norm": 0.041269659996032715, "learning_rate": 3.5841109138302296e-05, "loss": 0.1461, "step": 37950 }, { "epoch": 0.7177666125193608, "grad_norm": 0.04069847986102104, "learning_rate": 3.588833062596804e-05, "loss": 0.1463, "step": 38000 }, { "epoch": 0.7187110422726758, "grad_norm": 0.04314687103033066, "learning_rate": 3.593555211363379e-05, "loss": 0.1465, "step": 38050 }, { "epoch": 0.7196554720259907, "grad_norm": 0.04384343698620796, "learning_rate": 3.598277360129954e-05, "loss": 0.1468, "step": 38100 }, { "epoch": 0.7205999017793057, "grad_norm": 0.04022786766290665, "learning_rate": 3.6029995088965285e-05, "loss": 0.1467, "step": 38150 }, { "epoch": 0.7215443315326207, "grad_norm": 0.040209971368312836, "learning_rate": 3.607721657663103e-05, "loss": 0.146, "step": 38200 }, { "epoch": 0.7224887612859355, "grad_norm": 0.04293399676680565, "learning_rate": 3.612443806429678e-05, "loss": 0.1464, "step": 38250 }, { "epoch": 0.7234331910392505, "grad_norm": 0.03986478969454765, "learning_rate": 3.617165955196253e-05, "loss": 0.1455, "step": 38300 }, { "epoch": 0.7243776207925654, "grad_norm": 0.04174085706472397, "learning_rate": 3.6218881039628275e-05, "loss": 0.1461, "step": 38350 }, { "epoch": 0.7253220505458804, "grad_norm": 0.0384858213365078, "learning_rate": 3.626610252729402e-05, "loss": 0.1458, "step": 38400 }, { "epoch": 0.7262664802991954, "grad_norm": 0.037855248898267746, "learning_rate": 3.631332401495977e-05, "loss": 0.1458, "step": 38450 }, { "epoch": 0.7272109100525103, "grad_norm": 0.04487213119864464, "learning_rate": 3.636054550262552e-05, "loss": 0.1466, "step": 38500 }, { "epoch": 0.7281553398058253, "grad_norm": 0.03921857103705406, "learning_rate": 3.6407766990291265e-05, "loss": 0.1456, "step": 38550 }, { "epoch": 0.7290997695591402, "grad_norm": 0.039742033928632736, "learning_rate": 3.645498847795701e-05, "loss": 0.1453, "step": 38600 }, { "epoch": 0.7300441993124551, "grad_norm": 0.042734693735837936, "learning_rate": 3.650220996562276e-05, "loss": 0.1457, "step": 38650 }, { "epoch": 0.7309886290657701, "grad_norm": 0.040849748998880386, "learning_rate": 3.654943145328851e-05, "loss": 0.1458, "step": 38700 }, { "epoch": 0.731933058819085, "grad_norm": 0.04030263051390648, "learning_rate": 3.6596652940954254e-05, "loss": 0.1456, "step": 38750 }, { "epoch": 0.7328774885724, "grad_norm": 0.04032140225172043, "learning_rate": 3.664387442862e-05, "loss": 0.1458, "step": 38800 }, { "epoch": 0.733821918325715, "grad_norm": 0.03997810557484627, "learning_rate": 3.669109591628575e-05, "loss": 0.1456, "step": 38850 }, { "epoch": 0.7347663480790299, "grad_norm": 0.04056718572974205, "learning_rate": 3.67383174039515e-05, "loss": 0.1456, "step": 38900 }, { "epoch": 0.7357107778323448, "grad_norm": 0.04264628142118454, "learning_rate": 3.6785538891617244e-05, "loss": 0.1454, "step": 38950 }, { "epoch": 0.7366552075856598, "grad_norm": 0.04554244503378868, "learning_rate": 3.683276037928299e-05, "loss": 0.1459, "step": 39000 }, { "epoch": 0.7375996373389747, "grad_norm": 0.042803600430488586, "learning_rate": 3.687998186694874e-05, "loss": 0.1453, "step": 39050 }, { "epoch": 0.7385440670922897, "grad_norm": 0.042651817202568054, "learning_rate": 3.6927203354614486e-05, "loss": 0.1452, "step": 39100 }, { "epoch": 0.7394884968456046, "grad_norm": 0.03989112377166748, "learning_rate": 3.6974424842280234e-05, "loss": 0.1456, "step": 39150 }, { "epoch": 0.7404329265989196, "grad_norm": 0.04320903122425079, "learning_rate": 3.702164632994598e-05, "loss": 0.1448, "step": 39200 }, { "epoch": 0.7413773563522346, "grad_norm": 0.045476533472537994, "learning_rate": 3.706886781761173e-05, "loss": 0.1459, "step": 39250 }, { "epoch": 0.7423217861055494, "grad_norm": 0.04550711065530777, "learning_rate": 3.7116089305277476e-05, "loss": 0.1458, "step": 39300 }, { "epoch": 0.7432662158588644, "grad_norm": 0.04075130820274353, "learning_rate": 3.7163310792943223e-05, "loss": 0.1453, "step": 39350 }, { "epoch": 0.7442106456121793, "grad_norm": 0.049413204193115234, "learning_rate": 3.7210532280608964e-05, "loss": 0.1453, "step": 39400 }, { "epoch": 0.7451550753654943, "grad_norm": 0.04133716970682144, "learning_rate": 3.725775376827472e-05, "loss": 0.1459, "step": 39450 }, { "epoch": 0.7460995051188093, "grad_norm": 0.043067894876003265, "learning_rate": 3.7304975255940466e-05, "loss": 0.1453, "step": 39500 }, { "epoch": 0.7470439348721242, "grad_norm": 0.040616828948259354, "learning_rate": 3.735219674360621e-05, "loss": 0.1452, "step": 39550 }, { "epoch": 0.7479883646254392, "grad_norm": 0.03994736075401306, "learning_rate": 3.739941823127196e-05, "loss": 0.145, "step": 39600 }, { "epoch": 0.7489327943787542, "grad_norm": 0.044843677431344986, "learning_rate": 3.744663971893771e-05, "loss": 0.1457, "step": 39650 }, { "epoch": 0.749877224132069, "grad_norm": 0.04071737825870514, "learning_rate": 3.7493861206603455e-05, "loss": 0.1454, "step": 39700 }, { "epoch": 0.750821653885384, "grad_norm": 0.0433492474257946, "learning_rate": 3.75410826942692e-05, "loss": 0.1452, "step": 39750 }, { "epoch": 0.7517660836386989, "grad_norm": 0.0414339154958725, "learning_rate": 3.7588304181934944e-05, "loss": 0.145, "step": 39800 }, { "epoch": 0.7527105133920139, "grad_norm": 0.03860550746321678, "learning_rate": 3.76355256696007e-05, "loss": 0.1455, "step": 39850 }, { "epoch": 0.7536549431453289, "grad_norm": 0.0417729988694191, "learning_rate": 3.7682747157266445e-05, "loss": 0.1446, "step": 39900 }, { "epoch": 0.7545993728986438, "grad_norm": 0.04280512034893036, "learning_rate": 3.772996864493219e-05, "loss": 0.1453, "step": 39950 }, { "epoch": 0.7555438026519588, "grad_norm": 0.04160696268081665, "learning_rate": 3.777719013259794e-05, "loss": 0.1452, "step": 40000 }, { "epoch": 0.7555438026519588, "eval_IntDiv": 0.6750172317742391, "eval_NumCircles": 2005, "eval_SumBottleneck": 104.05335725347341, "eval_Uniqueness": 0.9954907718120806, "eval_Validity": 0.9536, "eval_Validity * Uniqueness": 0.9493, "eval_loss": 0.21752898395061493, "eval_runtime": 148.2083, "eval_samples_per_second": 67.473, "eval_steps_per_second": 0.533, "step": 40000 }, { "epoch": 0.7564882324052737, "grad_norm": 0.042401425540447235, "learning_rate": 3.782441162026369e-05, "loss": 0.145, "step": 40050 }, { "epoch": 0.7574326621585886, "grad_norm": 0.04049965366721153, "learning_rate": 3.7871633107929435e-05, "loss": 0.1449, "step": 40100 }, { "epoch": 0.7583770919119036, "grad_norm": 0.040597207844257355, "learning_rate": 3.791885459559518e-05, "loss": 0.145, "step": 40150 }, { "epoch": 0.7593215216652185, "grad_norm": 0.041445136070251465, "learning_rate": 3.796607608326093e-05, "loss": 0.145, "step": 40200 }, { "epoch": 0.7602659514185335, "grad_norm": 0.04004233703017235, "learning_rate": 3.801329757092668e-05, "loss": 0.1451, "step": 40250 }, { "epoch": 0.7612103811718485, "grad_norm": 0.04090188071131706, "learning_rate": 3.8060519058592425e-05, "loss": 0.1448, "step": 40300 }, { "epoch": 0.7621548109251634, "grad_norm": 0.03945997729897499, "learning_rate": 3.810774054625817e-05, "loss": 0.1446, "step": 40350 }, { "epoch": 0.7630992406784783, "grad_norm": 0.04595568776130676, "learning_rate": 3.815496203392392e-05, "loss": 0.145, "step": 40400 }, { "epoch": 0.7640436704317933, "grad_norm": 0.0433221198618412, "learning_rate": 3.820218352158967e-05, "loss": 0.1448, "step": 40450 }, { "epoch": 0.7649881001851082, "grad_norm": 0.03807784244418144, "learning_rate": 3.8249405009255414e-05, "loss": 0.145, "step": 40500 }, { "epoch": 0.7659325299384232, "grad_norm": 0.04088008031249046, "learning_rate": 3.829662649692116e-05, "loss": 0.1451, "step": 40550 }, { "epoch": 0.7668769596917381, "grad_norm": 0.04342658072710037, "learning_rate": 3.834384798458691e-05, "loss": 0.1446, "step": 40600 }, { "epoch": 0.7678213894450531, "grad_norm": 0.03956913575530052, "learning_rate": 3.8391069472252657e-05, "loss": 0.1455, "step": 40650 }, { "epoch": 0.7687658191983681, "grad_norm": 0.03968043997883797, "learning_rate": 3.8438290959918404e-05, "loss": 0.1447, "step": 40700 }, { "epoch": 0.7697102489516829, "grad_norm": 0.040151093155145645, "learning_rate": 3.848551244758415e-05, "loss": 0.1448, "step": 40750 }, { "epoch": 0.7706546787049979, "grad_norm": 0.04133196175098419, "learning_rate": 3.85327339352499e-05, "loss": 0.1449, "step": 40800 }, { "epoch": 0.7715991084583129, "grad_norm": 0.04087718948721886, "learning_rate": 3.8579955422915646e-05, "loss": 0.1443, "step": 40850 }, { "epoch": 0.7725435382116278, "grad_norm": 0.0414508581161499, "learning_rate": 3.8627176910581394e-05, "loss": 0.1446, "step": 40900 }, { "epoch": 0.7734879679649428, "grad_norm": 0.042974840849637985, "learning_rate": 3.867439839824714e-05, "loss": 0.1443, "step": 40950 }, { "epoch": 0.7744323977182577, "grad_norm": 0.044965073466300964, "learning_rate": 3.872161988591289e-05, "loss": 0.1443, "step": 41000 }, { "epoch": 0.7753768274715727, "grad_norm": 0.041429974138736725, "learning_rate": 3.8768841373578636e-05, "loss": 0.1446, "step": 41050 }, { "epoch": 0.7763212572248877, "grad_norm": 0.048906195908784866, "learning_rate": 3.881606286124438e-05, "loss": 0.1442, "step": 41100 }, { "epoch": 0.7772656869782025, "grad_norm": 0.03840850293636322, "learning_rate": 3.886328434891013e-05, "loss": 0.1448, "step": 41150 }, { "epoch": 0.7782101167315175, "grad_norm": 0.0417274609208107, "learning_rate": 3.891050583657588e-05, "loss": 0.1441, "step": 41200 }, { "epoch": 0.7791545464848325, "grad_norm": 0.04040537029504776, "learning_rate": 3.8957727324241626e-05, "loss": 0.1447, "step": 41250 }, { "epoch": 0.7800989762381474, "grad_norm": 0.03781970590353012, "learning_rate": 3.900494881190737e-05, "loss": 0.1441, "step": 41300 }, { "epoch": 0.7810434059914624, "grad_norm": 0.03896123915910721, "learning_rate": 3.905217029957312e-05, "loss": 0.1449, "step": 41350 }, { "epoch": 0.7819878357447773, "grad_norm": 0.03823167458176613, "learning_rate": 3.909939178723887e-05, "loss": 0.1439, "step": 41400 }, { "epoch": 0.7829322654980923, "grad_norm": 0.04021603986620903, "learning_rate": 3.9146613274904615e-05, "loss": 0.1444, "step": 41450 }, { "epoch": 0.7838766952514072, "grad_norm": 0.04026469960808754, "learning_rate": 3.919383476257036e-05, "loss": 0.1441, "step": 41500 }, { "epoch": 0.7848211250047221, "grad_norm": 0.03865630552172661, "learning_rate": 3.924105625023611e-05, "loss": 0.1441, "step": 41550 }, { "epoch": 0.7857655547580371, "grad_norm": 0.041600365191698074, "learning_rate": 3.928827773790186e-05, "loss": 0.1439, "step": 41600 }, { "epoch": 0.7867099845113521, "grad_norm": 0.04239555075764656, "learning_rate": 3.9335499225567605e-05, "loss": 0.1443, "step": 41650 }, { "epoch": 0.787654414264667, "grad_norm": 0.039032984524965286, "learning_rate": 3.938272071323335e-05, "loss": 0.144, "step": 41700 }, { "epoch": 0.788598844017982, "grad_norm": 0.040044937282800674, "learning_rate": 3.94299422008991e-05, "loss": 0.1439, "step": 41750 }, { "epoch": 0.7895432737712968, "grad_norm": 0.04724070802330971, "learning_rate": 3.947716368856485e-05, "loss": 0.1443, "step": 41800 }, { "epoch": 0.7904877035246118, "grad_norm": 0.04197279363870621, "learning_rate": 3.9524385176230595e-05, "loss": 0.1436, "step": 41850 }, { "epoch": 0.7914321332779268, "grad_norm": 0.038634877651929855, "learning_rate": 3.957160666389634e-05, "loss": 0.1438, "step": 41900 }, { "epoch": 0.7923765630312417, "grad_norm": 0.04183882847428322, "learning_rate": 3.961882815156209e-05, "loss": 0.144, "step": 41950 }, { "epoch": 0.7933209927845567, "grad_norm": 0.03920188918709755, "learning_rate": 3.966604963922784e-05, "loss": 0.1438, "step": 42000 }, { "epoch": 0.7942654225378716, "grad_norm": 0.03762110322713852, "learning_rate": 3.971327112689358e-05, "loss": 0.1441, "step": 42050 }, { "epoch": 0.7952098522911866, "grad_norm": 0.03884753957390785, "learning_rate": 3.976049261455933e-05, "loss": 0.1442, "step": 42100 }, { "epoch": 0.7961542820445016, "grad_norm": 0.04141641780734062, "learning_rate": 3.980771410222508e-05, "loss": 0.1446, "step": 42150 }, { "epoch": 0.7970987117978164, "grad_norm": 0.0408857986330986, "learning_rate": 3.985493558989083e-05, "loss": 0.1438, "step": 42200 }, { "epoch": 0.7980431415511314, "grad_norm": 0.04080124944448471, "learning_rate": 3.9902157077556574e-05, "loss": 0.1437, "step": 42250 }, { "epoch": 0.7989875713044464, "grad_norm": 0.03976322337985039, "learning_rate": 3.994937856522232e-05, "loss": 0.144, "step": 42300 }, { "epoch": 0.7999320010577613, "grad_norm": 0.038657255470752716, "learning_rate": 3.999660005288807e-05, "loss": 0.1437, "step": 42350 }, { "epoch": 0.8008764308110763, "grad_norm": 0.03980283439159393, "learning_rate": 4.0043821540553816e-05, "loss": 0.1434, "step": 42400 }, { "epoch": 0.8018208605643912, "grad_norm": 0.04006297141313553, "learning_rate": 4.009104302821956e-05, "loss": 0.1442, "step": 42450 }, { "epoch": 0.8027652903177062, "grad_norm": 0.038921695202589035, "learning_rate": 4.013826451588531e-05, "loss": 0.1429, "step": 42500 }, { "epoch": 0.8027652903177062, "eval_IntDiv": 0.6749806030305069, "eval_NumCircles": 1992, "eval_SumBottleneck": 69.27043771964743, "eval_Uniqueness": 0.9962515618492295, "eval_Validity": 0.9604, "eval_Validity * Uniqueness": 0.9568, "eval_loss": 0.219866082072258, "eval_runtime": 129.8566, "eval_samples_per_second": 77.008, "eval_steps_per_second": 0.608, "step": 42500 }, { "epoch": 0.8037097200710211, "grad_norm": 0.04340285807847977, "learning_rate": 4.018548600355106e-05, "loss": 0.1436, "step": 42550 }, { "epoch": 0.804654149824336, "grad_norm": 0.038621239364147186, "learning_rate": 4.0232707491216806e-05, "loss": 0.1435, "step": 42600 }, { "epoch": 0.805598579577651, "grad_norm": 0.03881506249308586, "learning_rate": 4.0279928978882554e-05, "loss": 0.1428, "step": 42650 }, { "epoch": 0.806543009330966, "grad_norm": 0.05671614408493042, "learning_rate": 4.03271504665483e-05, "loss": 0.1438, "step": 42700 }, { "epoch": 0.8074874390842809, "grad_norm": 0.04462280124425888, "learning_rate": 4.037437195421405e-05, "loss": 0.1432, "step": 42750 }, { "epoch": 0.8084318688375959, "grad_norm": 0.038953039795160294, "learning_rate": 4.0421593441879796e-05, "loss": 0.1435, "step": 42800 }, { "epoch": 0.8093762985909108, "grad_norm": 0.0383635014295578, "learning_rate": 4.046881492954554e-05, "loss": 0.1431, "step": 42850 }, { "epoch": 0.8103207283442257, "grad_norm": 0.03972693532705307, "learning_rate": 4.051603641721129e-05, "loss": 0.1431, "step": 42900 }, { "epoch": 0.8112651580975407, "grad_norm": 0.04214174672961235, "learning_rate": 4.056325790487704e-05, "loss": 0.1436, "step": 42950 }, { "epoch": 0.8122095878508556, "grad_norm": 0.039007268846035004, "learning_rate": 4.0610479392542785e-05, "loss": 0.143, "step": 43000 }, { "epoch": 0.8131540176041706, "grad_norm": 0.043960537761449814, "learning_rate": 4.065770088020853e-05, "loss": 0.1433, "step": 43050 }, { "epoch": 0.8140984473574856, "grad_norm": 0.03882475197315216, "learning_rate": 4.070492236787428e-05, "loss": 0.1431, "step": 43100 }, { "epoch": 0.8150428771108005, "grad_norm": 0.040292058140039444, "learning_rate": 4.075214385554003e-05, "loss": 0.143, "step": 43150 }, { "epoch": 0.8159873068641155, "grad_norm": 0.04591679200530052, "learning_rate": 4.0799365343205775e-05, "loss": 0.1433, "step": 43200 }, { "epoch": 0.8169317366174303, "grad_norm": 0.04002595692873001, "learning_rate": 4.084658683087152e-05, "loss": 0.1431, "step": 43250 }, { "epoch": 0.8178761663707453, "grad_norm": 0.04661698639392853, "learning_rate": 4.089380831853727e-05, "loss": 0.1429, "step": 43300 }, { "epoch": 0.8188205961240603, "grad_norm": 0.0408141203224659, "learning_rate": 4.094102980620302e-05, "loss": 0.1432, "step": 43350 }, { "epoch": 0.8197650258773752, "grad_norm": 0.03837508708238602, "learning_rate": 4.0988251293868765e-05, "loss": 0.1431, "step": 43400 }, { "epoch": 0.8207094556306902, "grad_norm": 0.03888022154569626, "learning_rate": 4.103547278153451e-05, "loss": 0.1435, "step": 43450 }, { "epoch": 0.8216538853840052, "grad_norm": 0.04054855927824974, "learning_rate": 4.108269426920026e-05, "loss": 0.1429, "step": 43500 }, { "epoch": 0.8225983151373201, "grad_norm": 0.04131406918168068, "learning_rate": 4.112991575686601e-05, "loss": 0.1436, "step": 43550 }, { "epoch": 0.8235427448906351, "grad_norm": 0.03992599993944168, "learning_rate": 4.1177137244531755e-05, "loss": 0.1435, "step": 43600 }, { "epoch": 0.8244871746439499, "grad_norm": 0.03779558092355728, "learning_rate": 4.12243587321975e-05, "loss": 0.1432, "step": 43650 }, { "epoch": 0.8254316043972649, "grad_norm": 0.04053754359483719, "learning_rate": 4.127158021986325e-05, "loss": 0.1427, "step": 43700 }, { "epoch": 0.8263760341505799, "grad_norm": 0.04236629977822304, "learning_rate": 4.1318801707529e-05, "loss": 0.1428, "step": 43750 }, { "epoch": 0.8273204639038948, "grad_norm": 0.04077012464404106, "learning_rate": 4.1366023195194744e-05, "loss": 0.1431, "step": 43800 }, { "epoch": 0.8282648936572098, "grad_norm": 0.03918084874749184, "learning_rate": 4.141324468286049e-05, "loss": 0.1425, "step": 43850 }, { "epoch": 0.8292093234105248, "grad_norm": 0.04333747178316116, "learning_rate": 4.146046617052624e-05, "loss": 0.143, "step": 43900 }, { "epoch": 0.8301537531638397, "grad_norm": 0.04010206460952759, "learning_rate": 4.1507687658191987e-05, "loss": 0.1429, "step": 43950 }, { "epoch": 0.8310981829171546, "grad_norm": 0.03939329460263252, "learning_rate": 4.1554909145857734e-05, "loss": 0.1428, "step": 44000 }, { "epoch": 0.8320426126704695, "grad_norm": 0.038825348019599915, "learning_rate": 4.160213063352348e-05, "loss": 0.1429, "step": 44050 }, { "epoch": 0.8329870424237845, "grad_norm": 0.04334433004260063, "learning_rate": 4.164935212118923e-05, "loss": 0.1424, "step": 44100 }, { "epoch": 0.8339314721770995, "grad_norm": 0.039205778390169144, "learning_rate": 4.1696573608854976e-05, "loss": 0.1424, "step": 44150 }, { "epoch": 0.8348759019304144, "grad_norm": 0.038194429129362106, "learning_rate": 4.1743795096520724e-05, "loss": 0.1426, "step": 44200 }, { "epoch": 0.8358203316837294, "grad_norm": 0.038022927939891815, "learning_rate": 4.179101658418647e-05, "loss": 0.1427, "step": 44250 }, { "epoch": 0.8367647614370443, "grad_norm": 0.037816960364580154, "learning_rate": 4.183823807185221e-05, "loss": 0.1423, "step": 44300 }, { "epoch": 0.8377091911903592, "grad_norm": 0.048594340682029724, "learning_rate": 4.1885459559517966e-05, "loss": 0.1427, "step": 44350 }, { "epoch": 0.8386536209436742, "grad_norm": 0.04131820797920227, "learning_rate": 4.1932681047183713e-05, "loss": 0.1425, "step": 44400 }, { "epoch": 0.8395980506969891, "grad_norm": 0.039254333823919296, "learning_rate": 4.197990253484946e-05, "loss": 0.1427, "step": 44450 }, { "epoch": 0.8405424804503041, "grad_norm": 0.04378412663936615, "learning_rate": 4.202712402251521e-05, "loss": 0.1425, "step": 44500 }, { "epoch": 0.8414869102036191, "grad_norm": 0.04200153425335884, "learning_rate": 4.2074345510180956e-05, "loss": 0.1427, "step": 44550 }, { "epoch": 0.842431339956934, "grad_norm": 0.042584072798490524, "learning_rate": 4.21215669978467e-05, "loss": 0.1425, "step": 44600 }, { "epoch": 0.843375769710249, "grad_norm": 0.04479373246431351, "learning_rate": 4.216878848551245e-05, "loss": 0.1423, "step": 44650 }, { "epoch": 0.8443201994635638, "grad_norm": 0.03978758677840233, "learning_rate": 4.221600997317819e-05, "loss": 0.1426, "step": 44700 }, { "epoch": 0.8452646292168788, "grad_norm": 0.04194638878107071, "learning_rate": 4.2263231460843945e-05, "loss": 0.1426, "step": 44750 }, { "epoch": 0.8462090589701938, "grad_norm": 0.04227259382605553, "learning_rate": 4.231045294850969e-05, "loss": 0.1426, "step": 44800 }, { "epoch": 0.8471534887235087, "grad_norm": 0.03966226428747177, "learning_rate": 4.235767443617544e-05, "loss": 0.1417, "step": 44850 }, { "epoch": 0.8480979184768237, "grad_norm": 0.0409407839179039, "learning_rate": 4.240489592384119e-05, "loss": 0.1423, "step": 44900 }, { "epoch": 0.8490423482301387, "grad_norm": 0.044581107795238495, "learning_rate": 4.2452117411506935e-05, "loss": 0.1428, "step": 44950 }, { "epoch": 0.8499867779834536, "grad_norm": 0.03858479857444763, "learning_rate": 4.249933889917268e-05, "loss": 0.1421, "step": 45000 }, { "epoch": 0.8499867779834536, "eval_IntDiv": 0.6753409578373859, "eval_NumCircles": 1946, "eval_SumBottleneck": 121.23274083239235, "eval_Uniqueness": 0.9973906690324601, "eval_Validity": 0.9581, "eval_Validity * Uniqueness": 0.9556, "eval_loss": 0.221343532204628, "eval_runtime": 544.1787, "eval_samples_per_second": 18.376, "eval_steps_per_second": 0.145, "step": 45000 }, { "epoch": 0.8509312077367686, "grad_norm": 0.03902658820152283, "learning_rate": 4.254656038683843e-05, "loss": 0.1423, "step": 45050 }, { "epoch": 0.8518756374900834, "grad_norm": 0.03634857013821602, "learning_rate": 4.259378187450417e-05, "loss": 0.1426, "step": 45100 }, { "epoch": 0.8528200672433984, "grad_norm": 0.03744077309966087, "learning_rate": 4.2641003362169925e-05, "loss": 0.1423, "step": 45150 }, { "epoch": 0.8537644969967134, "grad_norm": 0.042965978384017944, "learning_rate": 4.268822484983567e-05, "loss": 0.1419, "step": 45200 }, { "epoch": 0.8547089267500283, "grad_norm": 0.0433276891708374, "learning_rate": 4.273544633750142e-05, "loss": 0.1425, "step": 45250 }, { "epoch": 0.8556533565033433, "grad_norm": 0.037295494228601456, "learning_rate": 4.278266782516717e-05, "loss": 0.1422, "step": 45300 }, { "epoch": 0.8565977862566583, "grad_norm": 0.03597498685121536, "learning_rate": 4.2829889312832914e-05, "loss": 0.1425, "step": 45350 }, { "epoch": 0.8575422160099732, "grad_norm": 0.04229936748743057, "learning_rate": 4.287711080049866e-05, "loss": 0.1421, "step": 45400 }, { "epoch": 0.8584866457632881, "grad_norm": 0.039778970181941986, "learning_rate": 4.292433228816441e-05, "loss": 0.1422, "step": 45450 }, { "epoch": 0.859431075516603, "grad_norm": 0.04163440316915512, "learning_rate": 4.297155377583016e-05, "loss": 0.1422, "step": 45500 }, { "epoch": 0.860375505269918, "grad_norm": 0.03776060789823532, "learning_rate": 4.3018775263495904e-05, "loss": 0.1422, "step": 45550 }, { "epoch": 0.861319935023233, "grad_norm": 0.038698527961969376, "learning_rate": 4.306599675116165e-05, "loss": 0.1416, "step": 45600 }, { "epoch": 0.8622643647765479, "grad_norm": 0.0414905808866024, "learning_rate": 4.31132182388274e-05, "loss": 0.142, "step": 45650 }, { "epoch": 0.8632087945298629, "grad_norm": 0.03794620931148529, "learning_rate": 4.3160439726493146e-05, "loss": 0.1419, "step": 45700 }, { "epoch": 0.8641532242831779, "grad_norm": 0.03707181662321091, "learning_rate": 4.3207661214158894e-05, "loss": 0.1418, "step": 45750 }, { "epoch": 0.8650976540364927, "grad_norm": 0.042990487068891525, "learning_rate": 4.325488270182464e-05, "loss": 0.142, "step": 45800 }, { "epoch": 0.8660420837898077, "grad_norm": 0.04003818705677986, "learning_rate": 4.330210418949039e-05, "loss": 0.1418, "step": 45850 }, { "epoch": 0.8669865135431226, "grad_norm": 0.05009523406624794, "learning_rate": 4.3349325677156136e-05, "loss": 0.1417, "step": 45900 }, { "epoch": 0.8679309432964376, "grad_norm": 0.03908533975481987, "learning_rate": 4.3396547164821884e-05, "loss": 0.1422, "step": 45950 }, { "epoch": 0.8688753730497526, "grad_norm": 0.03763602674007416, "learning_rate": 4.344376865248763e-05, "loss": 0.1415, "step": 46000 }, { "epoch": 0.8698198028030675, "grad_norm": 0.040500376373529434, "learning_rate": 4.349099014015338e-05, "loss": 0.1418, "step": 46050 }, { "epoch": 0.8707642325563825, "grad_norm": 0.0376383513212204, "learning_rate": 4.3538211627819126e-05, "loss": 0.142, "step": 46100 }, { "epoch": 0.8717086623096975, "grad_norm": 0.03595249727368355, "learning_rate": 4.358543311548487e-05, "loss": 0.1417, "step": 46150 }, { "epoch": 0.8726530920630123, "grad_norm": 0.03891431912779808, "learning_rate": 4.363265460315062e-05, "loss": 0.1416, "step": 46200 }, { "epoch": 0.8735975218163273, "grad_norm": 0.038210008293390274, "learning_rate": 4.367987609081637e-05, "loss": 0.1417, "step": 46250 }, { "epoch": 0.8745419515696422, "grad_norm": 0.03932406008243561, "learning_rate": 4.3727097578482116e-05, "loss": 0.1416, "step": 46300 }, { "epoch": 0.8754863813229572, "grad_norm": 0.0428214855492115, "learning_rate": 4.377431906614786e-05, "loss": 0.1415, "step": 46350 }, { "epoch": 0.8764308110762722, "grad_norm": 0.03876851126551628, "learning_rate": 4.382154055381361e-05, "loss": 0.1416, "step": 46400 }, { "epoch": 0.8773752408295871, "grad_norm": 0.03906278684735298, "learning_rate": 4.386876204147936e-05, "loss": 0.1413, "step": 46450 }, { "epoch": 0.8783196705829021, "grad_norm": 0.03978988528251648, "learning_rate": 4.3915983529145105e-05, "loss": 0.1414, "step": 46500 }, { "epoch": 0.879264100336217, "grad_norm": 0.03740892931818962, "learning_rate": 4.396320501681085e-05, "loss": 0.1414, "step": 46550 }, { "epoch": 0.8802085300895319, "grad_norm": 0.04060372710227966, "learning_rate": 4.40104265044766e-05, "loss": 0.1417, "step": 46600 }, { "epoch": 0.8811529598428469, "grad_norm": 0.03762989863753319, "learning_rate": 4.405764799214235e-05, "loss": 0.1414, "step": 46650 }, { "epoch": 0.8820973895961618, "grad_norm": 0.03969070687890053, "learning_rate": 4.4104869479808095e-05, "loss": 0.1416, "step": 46700 }, { "epoch": 0.8830418193494768, "grad_norm": 0.051500674337148666, "learning_rate": 4.415209096747384e-05, "loss": 0.1419, "step": 46750 }, { "epoch": 0.8839862491027918, "grad_norm": 0.039065293967723846, "learning_rate": 4.419931245513959e-05, "loss": 0.1415, "step": 46800 }, { "epoch": 0.8849306788561067, "grad_norm": 0.09825267642736435, "learning_rate": 4.424653394280534e-05, "loss": 0.146, "step": 46850 }, { "epoch": 0.8858751086094216, "grad_norm": 0.03920001536607742, "learning_rate": 4.4293755430471085e-05, "loss": 0.1453, "step": 46900 }, { "epoch": 0.8868195383627365, "grad_norm": 0.039298638701438904, "learning_rate": 4.4340976918136825e-05, "loss": 0.1422, "step": 46950 }, { "epoch": 0.8877639681160515, "grad_norm": 0.037064891308546066, "learning_rate": 4.438819840580258e-05, "loss": 0.1416, "step": 47000 }, { "epoch": 0.8887083978693665, "grad_norm": 0.04007786884903908, "learning_rate": 4.443541989346833e-05, "loss": 0.1415, "step": 47050 }, { "epoch": 0.8896528276226814, "grad_norm": 0.0389833003282547, "learning_rate": 4.4482641381134074e-05, "loss": 0.1415, "step": 47100 }, { "epoch": 0.8905972573759964, "grad_norm": 0.03825139254331589, "learning_rate": 4.452986286879982e-05, "loss": 0.1412, "step": 47150 }, { "epoch": 0.8915416871293114, "grad_norm": 0.038210537284612656, "learning_rate": 4.457708435646557e-05, "loss": 0.1419, "step": 47200 }, { "epoch": 0.8924861168826262, "grad_norm": 0.03999688848853111, "learning_rate": 4.462430584413132e-05, "loss": 0.1414, "step": 47250 }, { "epoch": 0.8934305466359412, "grad_norm": 0.036940354853868484, "learning_rate": 4.4671527331797064e-05, "loss": 0.1413, "step": 47300 }, { "epoch": 0.8943749763892561, "grad_norm": 0.03728590905666351, "learning_rate": 4.4718748819462805e-05, "loss": 0.1408, "step": 47350 }, { "epoch": 0.8953194061425711, "grad_norm": 0.039748433977365494, "learning_rate": 4.476597030712856e-05, "loss": 0.1409, "step": 47400 }, { "epoch": 0.8962638358958861, "grad_norm": 0.040691960602998734, "learning_rate": 4.4813191794794306e-05, "loss": 0.1408, "step": 47450 }, { "epoch": 0.897208265649201, "grad_norm": 0.038891807198524475, "learning_rate": 4.4860413282460054e-05, "loss": 0.1409, "step": 47500 }, { "epoch": 0.897208265649201, "eval_IntDiv": 0.6736677181093291, "eval_NumCircles": 1911, "eval_SumBottleneck": 86.87727763548693, "eval_Uniqueness": 0.9959497351749922, "eval_Validity": 0.9629, "eval_Validity * Uniqueness": 0.959, "eval_loss": 0.22050149738788605, "eval_runtime": 176.708, "eval_samples_per_second": 56.591, "eval_steps_per_second": 0.447, "step": 47500 }, { "epoch": 0.898152695402516, "grad_norm": 0.03801312297582626, "learning_rate": 4.49076347701258e-05, "loss": 0.1404, "step": 47550 }, { "epoch": 0.899097125155831, "grad_norm": 0.03790495917201042, "learning_rate": 4.495485625779155e-05, "loss": 0.1411, "step": 47600 }, { "epoch": 0.9000415549091458, "grad_norm": 0.03697515279054642, "learning_rate": 4.5002077745457296e-05, "loss": 0.1408, "step": 47650 }, { "epoch": 0.9009859846624608, "grad_norm": 0.038156308233737946, "learning_rate": 4.5049299233123043e-05, "loss": 0.1412, "step": 47700 }, { "epoch": 0.9019304144157757, "grad_norm": 0.03815595805644989, "learning_rate": 4.5096520720788784e-05, "loss": 0.1412, "step": 47750 }, { "epoch": 0.9028748441690907, "grad_norm": 0.03695128485560417, "learning_rate": 4.514374220845454e-05, "loss": 0.1404, "step": 47800 }, { "epoch": 0.9038192739224057, "grad_norm": 0.041734129190444946, "learning_rate": 4.5190963696120286e-05, "loss": 0.1409, "step": 47850 }, { "epoch": 0.9047637036757206, "grad_norm": 0.037755321711301804, "learning_rate": 4.523818518378603e-05, "loss": 0.1407, "step": 47900 }, { "epoch": 0.9057081334290356, "grad_norm": 0.04106855019927025, "learning_rate": 4.528540667145178e-05, "loss": 0.1412, "step": 47950 }, { "epoch": 0.9066525631823505, "grad_norm": 0.038810379803180695, "learning_rate": 4.533262815911753e-05, "loss": 0.1405, "step": 48000 }, { "epoch": 0.9075969929356654, "grad_norm": 0.040633875876665115, "learning_rate": 4.5379849646783275e-05, "loss": 0.1408, "step": 48050 }, { "epoch": 0.9085414226889804, "grad_norm": 0.03784584999084473, "learning_rate": 4.542707113444902e-05, "loss": 0.1406, "step": 48100 }, { "epoch": 0.9094858524422953, "grad_norm": 0.03675217553973198, "learning_rate": 4.547429262211477e-05, "loss": 0.1403, "step": 48150 }, { "epoch": 0.9104302821956103, "grad_norm": 0.03736715018749237, "learning_rate": 4.552151410978052e-05, "loss": 0.1404, "step": 48200 }, { "epoch": 0.9113747119489253, "grad_norm": 0.039480339735746384, "learning_rate": 4.5568735597446265e-05, "loss": 0.1408, "step": 48250 }, { "epoch": 0.9123191417022402, "grad_norm": 0.03867863118648529, "learning_rate": 4.561595708511201e-05, "loss": 0.1409, "step": 48300 }, { "epoch": 0.9132635714555551, "grad_norm": 0.04134884476661682, "learning_rate": 4.566317857277776e-05, "loss": 0.1409, "step": 48350 }, { "epoch": 0.9142080012088701, "grad_norm": 0.03984871506690979, "learning_rate": 4.571040006044351e-05, "loss": 0.1409, "step": 48400 }, { "epoch": 0.915152430962185, "grad_norm": 0.03945016488432884, "learning_rate": 4.5757621548109255e-05, "loss": 0.1406, "step": 48450 }, { "epoch": 0.9160968607155, "grad_norm": 0.03727708011865616, "learning_rate": 4.5804843035775e-05, "loss": 0.1409, "step": 48500 }, { "epoch": 0.9170412904688149, "grad_norm": 0.037360966205596924, "learning_rate": 4.585206452344075e-05, "loss": 0.1411, "step": 48550 }, { "epoch": 0.9179857202221299, "grad_norm": 0.037867240607738495, "learning_rate": 4.58992860111065e-05, "loss": 0.1406, "step": 48600 }, { "epoch": 0.9189301499754449, "grad_norm": 0.04353228956460953, "learning_rate": 4.5946507498772245e-05, "loss": 0.141, "step": 48650 }, { "epoch": 0.9198745797287597, "grad_norm": 0.03888324648141861, "learning_rate": 4.599372898643799e-05, "loss": 0.1403, "step": 48700 }, { "epoch": 0.9208190094820747, "grad_norm": 0.0398545078933239, "learning_rate": 4.604095047410374e-05, "loss": 0.1404, "step": 48750 }, { "epoch": 0.9217634392353897, "grad_norm": 0.03800971060991287, "learning_rate": 4.608817196176949e-05, "loss": 0.1407, "step": 48800 }, { "epoch": 0.9227078689887046, "grad_norm": 0.038277026265859604, "learning_rate": 4.6135393449435234e-05, "loss": 0.1403, "step": 48850 }, { "epoch": 0.9236522987420196, "grad_norm": 0.03802540898323059, "learning_rate": 4.618261493710098e-05, "loss": 0.1411, "step": 48900 }, { "epoch": 0.9245967284953345, "grad_norm": 0.03736951947212219, "learning_rate": 4.622983642476673e-05, "loss": 0.1401, "step": 48950 }, { "epoch": 0.9255411582486495, "grad_norm": 0.03727000206708908, "learning_rate": 4.6277057912432476e-05, "loss": 0.1403, "step": 49000 }, { "epoch": 0.9264855880019645, "grad_norm": 0.04053468257188797, "learning_rate": 4.6324279400098224e-05, "loss": 0.1402, "step": 49050 }, { "epoch": 0.9274300177552793, "grad_norm": 0.039708174765110016, "learning_rate": 4.637150088776397e-05, "loss": 0.1406, "step": 49100 }, { "epoch": 0.9283744475085943, "grad_norm": 0.038230881094932556, "learning_rate": 4.641872237542972e-05, "loss": 0.1402, "step": 49150 }, { "epoch": 0.9293188772619092, "grad_norm": 0.04183787479996681, "learning_rate": 4.646594386309546e-05, "loss": 0.1403, "step": 49200 }, { "epoch": 0.9302633070152242, "grad_norm": 0.03705020248889923, "learning_rate": 4.6513165350761214e-05, "loss": 0.1403, "step": 49250 }, { "epoch": 0.9312077367685392, "grad_norm": 0.03742217272520065, "learning_rate": 4.656038683842696e-05, "loss": 0.14, "step": 49300 }, { "epoch": 0.9321521665218541, "grad_norm": 0.0366576611995697, "learning_rate": 4.660760832609271e-05, "loss": 0.1399, "step": 49350 }, { "epoch": 0.933096596275169, "grad_norm": 0.0364999957382679, "learning_rate": 4.6654829813758456e-05, "loss": 0.14, "step": 49400 }, { "epoch": 0.934041026028484, "grad_norm": 0.03935829550027847, "learning_rate": 4.67020513014242e-05, "loss": 0.1401, "step": 49450 }, { "epoch": 0.9349854557817989, "grad_norm": 0.04018522426486015, "learning_rate": 4.674927278908995e-05, "loss": 0.1405, "step": 49500 }, { "epoch": 0.9359298855351139, "grad_norm": 0.035901207476854324, "learning_rate": 4.67964942767557e-05, "loss": 0.1402, "step": 49550 }, { "epoch": 0.9368743152884288, "grad_norm": 0.038646914064884186, "learning_rate": 4.684371576442144e-05, "loss": 0.1404, "step": 49600 }, { "epoch": 0.9378187450417438, "grad_norm": 0.03870958089828491, "learning_rate": 4.689093725208719e-05, "loss": 0.1403, "step": 49650 }, { "epoch": 0.9387631747950588, "grad_norm": 0.03777585178613663, "learning_rate": 4.693815873975294e-05, "loss": 0.1402, "step": 49700 }, { "epoch": 0.9397076045483737, "grad_norm": 0.03741728886961937, "learning_rate": 4.698538022741869e-05, "loss": 0.1397, "step": 49750 }, { "epoch": 0.9406520343016886, "grad_norm": 0.04445565119385719, "learning_rate": 4.7032601715084435e-05, "loss": 0.1403, "step": 49800 }, { "epoch": 0.9415964640550036, "grad_norm": 0.03762379288673401, "learning_rate": 4.707982320275018e-05, "loss": 0.14, "step": 49850 }, { "epoch": 0.9425408938083185, "grad_norm": 0.039248645305633545, "learning_rate": 4.712704469041593e-05, "loss": 0.14, "step": 49900 }, { "epoch": 0.9434853235616335, "grad_norm": 0.03991606459021568, "learning_rate": 4.717426617808168e-05, "loss": 0.1399, "step": 49950 }, { "epoch": 0.9444297533149484, "grad_norm": 0.03635440394282341, "learning_rate": 4.722148766574742e-05, "loss": 0.14, "step": 50000 }, { "epoch": 0.9444297533149484, "eval_IntDiv": 0.6736987008928911, "eval_NumCircles": 1879, "eval_SumBottleneck": 102.71637052764447, "eval_Uniqueness": 0.9957657750697098, "eval_Validity": 0.9683, "eval_Validity * Uniqueness": 0.9642000000000001, "eval_loss": 0.22040227055549622, "eval_runtime": 147.0984, "eval_samples_per_second": 67.982, "eval_steps_per_second": 0.537, "step": 50000 }, { "epoch": 0.9453741830682634, "grad_norm": 0.038114409893751144, "learning_rate": 4.726870915341317e-05, "loss": 0.14, "step": 50050 }, { "epoch": 0.9463186128215784, "grad_norm": 0.04051026329398155, "learning_rate": 4.731593064107892e-05, "loss": 0.1399, "step": 50100 }, { "epoch": 0.9472630425748932, "grad_norm": 0.04027138277888298, "learning_rate": 4.736315212874467e-05, "loss": 0.1399, "step": 50150 }, { "epoch": 0.9482074723282082, "grad_norm": 0.038797810673713684, "learning_rate": 4.7410373616410415e-05, "loss": 0.1398, "step": 50200 }, { "epoch": 0.9491519020815232, "grad_norm": 0.03835610672831535, "learning_rate": 4.745759510407616e-05, "loss": 0.1403, "step": 50250 }, { "epoch": 0.9500963318348381, "grad_norm": 0.03854671120643616, "learning_rate": 4.750481659174191e-05, "loss": 0.1394, "step": 50300 }, { "epoch": 0.9510407615881531, "grad_norm": 0.04039423540234566, "learning_rate": 4.755203807940766e-05, "loss": 0.1397, "step": 50350 }, { "epoch": 0.951985191341468, "grad_norm": 0.0391458161175251, "learning_rate": 4.75992595670734e-05, "loss": 0.1395, "step": 50400 }, { "epoch": 0.952929621094783, "grad_norm": 0.03797979652881622, "learning_rate": 4.764648105473915e-05, "loss": 0.1396, "step": 50450 }, { "epoch": 0.953874050848098, "grad_norm": 0.03791368007659912, "learning_rate": 4.76937025424049e-05, "loss": 0.1397, "step": 50500 }, { "epoch": 0.9548184806014128, "grad_norm": 0.03915339335799217, "learning_rate": 4.774092403007065e-05, "loss": 0.1398, "step": 50550 }, { "epoch": 0.9557629103547278, "grad_norm": 0.036083366721868515, "learning_rate": 4.7788145517736394e-05, "loss": 0.1401, "step": 50600 }, { "epoch": 0.9567073401080428, "grad_norm": 0.03668561577796936, "learning_rate": 4.783536700540214e-05, "loss": 0.1397, "step": 50650 }, { "epoch": 0.9576517698613577, "grad_norm": 0.038348205387592316, "learning_rate": 4.788258849306789e-05, "loss": 0.14, "step": 50700 }, { "epoch": 0.9585961996146727, "grad_norm": 0.04170968756079674, "learning_rate": 4.7929809980733636e-05, "loss": 0.1394, "step": 50750 }, { "epoch": 0.9595406293679876, "grad_norm": 0.03881774842739105, "learning_rate": 4.7977031468399384e-05, "loss": 0.1401, "step": 50800 }, { "epoch": 0.9604850591213026, "grad_norm": 0.03728939965367317, "learning_rate": 4.802425295606513e-05, "loss": 0.1393, "step": 50850 }, { "epoch": 0.9614294888746175, "grad_norm": 0.03740441054105759, "learning_rate": 4.807147444373088e-05, "loss": 0.1399, "step": 50900 }, { "epoch": 0.9623739186279324, "grad_norm": 0.03822319209575653, "learning_rate": 4.8118695931396626e-05, "loss": 0.1398, "step": 50950 }, { "epoch": 0.9633183483812474, "grad_norm": 0.04446132108569145, "learning_rate": 4.8165917419062373e-05, "loss": 0.1396, "step": 51000 }, { "epoch": 0.9642627781345624, "grad_norm": 0.043029796332120895, "learning_rate": 4.821313890672812e-05, "loss": 0.1395, "step": 51050 }, { "epoch": 0.9652072078878773, "grad_norm": 0.03640009090304375, "learning_rate": 4.826036039439387e-05, "loss": 0.14, "step": 51100 }, { "epoch": 0.9661516376411923, "grad_norm": 0.038955431431531906, "learning_rate": 4.8307581882059616e-05, "loss": 0.1398, "step": 51150 }, { "epoch": 0.9670960673945072, "grad_norm": 0.03975076600909233, "learning_rate": 4.835480336972536e-05, "loss": 0.1394, "step": 51200 }, { "epoch": 0.9680404971478221, "grad_norm": 0.03790029510855675, "learning_rate": 4.840202485739111e-05, "loss": 0.1393, "step": 51250 }, { "epoch": 0.9689849269011371, "grad_norm": 0.036953724920749664, "learning_rate": 4.844924634505686e-05, "loss": 0.1395, "step": 51300 }, { "epoch": 0.969929356654452, "grad_norm": 0.046937648206949234, "learning_rate": 4.8496467832722605e-05, "loss": 0.1396, "step": 51350 }, { "epoch": 0.970873786407767, "grad_norm": 0.03890126571059227, "learning_rate": 4.854368932038835e-05, "loss": 0.1395, "step": 51400 }, { "epoch": 0.971818216161082, "grad_norm": 0.03689221292734146, "learning_rate": 4.85909108080541e-05, "loss": 0.1398, "step": 51450 }, { "epoch": 0.9727626459143969, "grad_norm": 0.03794040530920029, "learning_rate": 4.863813229571985e-05, "loss": 0.1402, "step": 51500 }, { "epoch": 0.9737070756677119, "grad_norm": 0.040605366230010986, "learning_rate": 4.8685353783385595e-05, "loss": 0.1397, "step": 51550 }, { "epoch": 0.9746515054210267, "grad_norm": 0.038556575775146484, "learning_rate": 4.873257527105134e-05, "loss": 0.1389, "step": 51600 }, { "epoch": 0.9755959351743417, "grad_norm": 0.039618294686079025, "learning_rate": 4.877979675871709e-05, "loss": 0.139, "step": 51650 }, { "epoch": 0.9765403649276567, "grad_norm": 0.036886271089315414, "learning_rate": 4.882701824638284e-05, "loss": 0.1388, "step": 51700 }, { "epoch": 0.9774847946809716, "grad_norm": 0.03592230752110481, "learning_rate": 4.8874239734048585e-05, "loss": 0.1392, "step": 51750 }, { "epoch": 0.9784292244342866, "grad_norm": 0.03963198512792587, "learning_rate": 4.892146122171433e-05, "loss": 0.1392, "step": 51800 }, { "epoch": 0.9793736541876015, "grad_norm": 0.03853467106819153, "learning_rate": 4.896868270938007e-05, "loss": 0.139, "step": 51850 }, { "epoch": 0.9803180839409165, "grad_norm": 0.041389644145965576, "learning_rate": 4.901590419704583e-05, "loss": 0.1391, "step": 51900 }, { "epoch": 0.9812625136942315, "grad_norm": 0.03751647099852562, "learning_rate": 4.9063125684711575e-05, "loss": 0.1393, "step": 51950 }, { "epoch": 0.9822069434475463, "grad_norm": 0.03795652836561203, "learning_rate": 4.911034717237732e-05, "loss": 0.1393, "step": 52000 }, { "epoch": 0.9831513732008613, "grad_norm": 0.03588539734482765, "learning_rate": 4.915756866004307e-05, "loss": 0.1397, "step": 52050 }, { "epoch": 0.9840958029541763, "grad_norm": 0.03862900659441948, "learning_rate": 4.920479014770882e-05, "loss": 0.1388, "step": 52100 }, { "epoch": 0.9850402327074912, "grad_norm": 0.0370744951069355, "learning_rate": 4.9252011635374564e-05, "loss": 0.1388, "step": 52150 }, { "epoch": 0.9859846624608062, "grad_norm": 0.03734629228711128, "learning_rate": 4.929923312304031e-05, "loss": 0.139, "step": 52200 }, { "epoch": 0.9869290922141211, "grad_norm": 0.04039441794157028, "learning_rate": 4.934645461070605e-05, "loss": 0.139, "step": 52250 }, { "epoch": 0.987873521967436, "grad_norm": 0.036862604320049286, "learning_rate": 4.9393676098371807e-05, "loss": 0.1393, "step": 52300 }, { "epoch": 0.988817951720751, "grad_norm": 0.036821406334638596, "learning_rate": 4.9440897586037554e-05, "loss": 0.1388, "step": 52350 }, { "epoch": 0.9897623814740659, "grad_norm": 0.03865619748830795, "learning_rate": 4.94881190737033e-05, "loss": 0.139, "step": 52400 }, { "epoch": 0.9907068112273809, "grad_norm": 0.035568736493587494, "learning_rate": 4.953534056136905e-05, "loss": 0.139, "step": 52450 }, { "epoch": 0.9916512409806959, "grad_norm": 0.037988606840372086, "learning_rate": 4.9582562049034796e-05, "loss": 0.139, "step": 52500 }, { "epoch": 0.9916512409806959, "eval_IntDiv": 0.6751390364755717, "eval_NumCircles": 1849, "eval_SumBottleneck": 89.56139173967233, "eval_Uniqueness": 0.9958634953464323, "eval_Validity": 0.967, "eval_Validity * Uniqueness": 0.963, "eval_loss": 0.21950390934944153, "eval_runtime": 141.4764, "eval_samples_per_second": 70.683, "eval_steps_per_second": 0.558, "step": 52500 }, { "epoch": 0.9925956707340108, "grad_norm": 0.03755655884742737, "learning_rate": 4.9629783536700544e-05, "loss": 0.1387, "step": 52550 }, { "epoch": 0.9935401004873258, "grad_norm": 0.038111407309770584, "learning_rate": 4.967700502436629e-05, "loss": 0.139, "step": 52600 }, { "epoch": 0.9944845302406407, "grad_norm": 0.03855624422430992, "learning_rate": 4.972422651203203e-05, "loss": 0.1389, "step": 52650 }, { "epoch": 0.9954289599939556, "grad_norm": 0.039140962064266205, "learning_rate": 4.9771447999697786e-05, "loss": 0.1384, "step": 52700 }, { "epoch": 0.9963733897472706, "grad_norm": 0.03984202444553375, "learning_rate": 4.981866948736353e-05, "loss": 0.139, "step": 52750 }, { "epoch": 0.9973178195005855, "grad_norm": 0.037741757929325104, "learning_rate": 4.986589097502928e-05, "loss": 0.1395, "step": 52800 }, { "epoch": 0.9982622492539005, "grad_norm": 0.03908297419548035, "learning_rate": 4.991311246269503e-05, "loss": 0.1386, "step": 52850 }, { "epoch": 0.9992066790072155, "grad_norm": 0.03705788403749466, "learning_rate": 4.9960333950360776e-05, "loss": 0.1391, "step": 52900 }, { "epoch": 1.0001511087605304, "grad_norm": 0.03607379272580147, "learning_rate": 5.000755543802652e-05, "loss": 0.1389, "step": 52950 }, { "epoch": 1.0010955385138454, "grad_norm": 0.03600328415632248, "learning_rate": 5.005477692569227e-05, "loss": 0.1392, "step": 53000 }, { "epoch": 1.0020399682671604, "grad_norm": 0.03626548498868942, "learning_rate": 5.010199841335802e-05, "loss": 0.1384, "step": 53050 }, { "epoch": 1.0029843980204753, "grad_norm": 0.03653347119688988, "learning_rate": 5.014921990102377e-05, "loss": 0.139, "step": 53100 }, { "epoch": 1.0039288277737901, "grad_norm": 0.03781365975737572, "learning_rate": 5.0196441388689506e-05, "loss": 0.1388, "step": 53150 }, { "epoch": 1.004873257527105, "grad_norm": 0.03820788860321045, "learning_rate": 5.024366287635526e-05, "loss": 0.1383, "step": 53200 }, { "epoch": 1.00581768728042, "grad_norm": 0.03711088374257088, "learning_rate": 5.029088436402101e-05, "loss": 0.1384, "step": 53250 }, { "epoch": 1.006762117033735, "grad_norm": 0.03887972608208656, "learning_rate": 5.0338105851686755e-05, "loss": 0.1387, "step": 53300 }, { "epoch": 1.00770654678705, "grad_norm": 0.03757783770561218, "learning_rate": 5.038532733935251e-05, "loss": 0.1381, "step": 53350 }, { "epoch": 1.0086509765403648, "grad_norm": 0.037461020052433014, "learning_rate": 5.043254882701824e-05, "loss": 0.1391, "step": 53400 }, { "epoch": 1.0095954062936798, "grad_norm": 0.03664344549179077, "learning_rate": 5.0479770314684e-05, "loss": 0.1384, "step": 53450 }, { "epoch": 1.0105398360469948, "grad_norm": 0.03857383877038956, "learning_rate": 5.0526991802349745e-05, "loss": 0.1382, "step": 53500 }, { "epoch": 1.0114842658003098, "grad_norm": 0.03930969908833504, "learning_rate": 5.057421329001549e-05, "loss": 0.1383, "step": 53550 }, { "epoch": 1.0124286955536248, "grad_norm": 0.03819705918431282, "learning_rate": 5.062143477768124e-05, "loss": 0.1385, "step": 53600 }, { "epoch": 1.0133731253069396, "grad_norm": 0.0361647792160511, "learning_rate": 5.066865626534698e-05, "loss": 0.1385, "step": 53650 }, { "epoch": 1.0143175550602546, "grad_norm": 0.037715934216976166, "learning_rate": 5.071587775301273e-05, "loss": 0.1378, "step": 53700 }, { "epoch": 1.0152619848135696, "grad_norm": 0.04112401604652405, "learning_rate": 5.076309924067848e-05, "loss": 0.1413, "step": 53750 }, { "epoch": 1.0162064145668845, "grad_norm": 0.03757304325699806, "learning_rate": 5.081032072834423e-05, "loss": 0.1388, "step": 53800 }, { "epoch": 1.0171508443201995, "grad_norm": 0.03611813858151436, "learning_rate": 5.085754221600998e-05, "loss": 0.1382, "step": 53850 }, { "epoch": 1.0180952740735143, "grad_norm": 0.0363706536591053, "learning_rate": 5.090476370367573e-05, "loss": 0.1385, "step": 53900 }, { "epoch": 1.0190397038268293, "grad_norm": 0.03625526279211044, "learning_rate": 5.0951985191341465e-05, "loss": 0.1382, "step": 53950 }, { "epoch": 1.0199841335801443, "grad_norm": 0.03582845628261566, "learning_rate": 5.099920667900722e-05, "loss": 0.1383, "step": 54000 }, { "epoch": 1.0209285633334593, "grad_norm": 0.03748594596982002, "learning_rate": 5.1046428166672966e-05, "loss": 0.1382, "step": 54050 }, { "epoch": 1.0218729930867743, "grad_norm": 0.03609038144350052, "learning_rate": 5.1093649654338714e-05, "loss": 0.1382, "step": 54100 }, { "epoch": 1.0228174228400893, "grad_norm": 0.03806302696466446, "learning_rate": 5.114087114200447e-05, "loss": 0.1381, "step": 54150 }, { "epoch": 1.023761852593404, "grad_norm": 0.036087486892938614, "learning_rate": 5.11880926296702e-05, "loss": 0.1381, "step": 54200 }, { "epoch": 1.024706282346719, "grad_norm": 0.04140198230743408, "learning_rate": 5.1235314117335956e-05, "loss": 0.1383, "step": 54250 }, { "epoch": 1.025650712100034, "grad_norm": 0.03645627945661545, "learning_rate": 5.1282535605001704e-05, "loss": 0.1383, "step": 54300 }, { "epoch": 1.026595141853349, "grad_norm": 0.03653508424758911, "learning_rate": 5.132975709266745e-05, "loss": 0.1381, "step": 54350 }, { "epoch": 1.027539571606664, "grad_norm": 0.036742862313985825, "learning_rate": 5.13769785803332e-05, "loss": 0.1378, "step": 54400 }, { "epoch": 1.0284840013599788, "grad_norm": 0.036464765667915344, "learning_rate": 5.142420006799894e-05, "loss": 0.1378, "step": 54450 }, { "epoch": 1.0294284311132937, "grad_norm": 0.037247102707624435, "learning_rate": 5.1471421555664686e-05, "loss": 0.1379, "step": 54500 }, { "epoch": 1.0303728608666087, "grad_norm": 0.03660042956471443, "learning_rate": 5.151864304333044e-05, "loss": 0.1386, "step": 54550 }, { "epoch": 1.0313172906199237, "grad_norm": 0.03715239092707634, "learning_rate": 5.156586453099619e-05, "loss": 0.1373, "step": 54600 }, { "epoch": 1.0322617203732387, "grad_norm": 0.04086459428071976, "learning_rate": 5.1613086018661936e-05, "loss": 0.1377, "step": 54650 }, { "epoch": 1.0332061501265535, "grad_norm": 0.03470790386199951, "learning_rate": 5.1660307506327676e-05, "loss": 0.1379, "step": 54700 }, { "epoch": 1.0341505798798685, "grad_norm": 0.03989797458052635, "learning_rate": 5.1707528993993424e-05, "loss": 0.1382, "step": 54750 }, { "epoch": 1.0350950096331835, "grad_norm": 0.03538241237401962, "learning_rate": 5.175475048165918e-05, "loss": 0.1377, "step": 54800 }, { "epoch": 1.0360394393864985, "grad_norm": 0.037514034658670425, "learning_rate": 5.1801971969324925e-05, "loss": 0.1379, "step": 54850 }, { "epoch": 1.0369838691398134, "grad_norm": 0.03714431822299957, "learning_rate": 5.184919345699067e-05, "loss": 0.1379, "step": 54900 }, { "epoch": 1.0379282988931284, "grad_norm": 0.03839278221130371, "learning_rate": 5.189641494465643e-05, "loss": 0.1381, "step": 54950 }, { "epoch": 1.0388727286464432, "grad_norm": 0.041552457958459854, "learning_rate": 5.194363643232216e-05, "loss": 0.1385, "step": 55000 }, { "epoch": 1.0388727286464432, "eval_IntDiv": 0.6746670353281784, "eval_NumCircles": 1919, "eval_SumBottleneck": 104.8502702324718, "eval_Uniqueness": 0.9972210786331824, "eval_Validity": 0.9716, "eval_Validity * Uniqueness": 0.9689000000000001, "eval_loss": 0.2165948450565338, "eval_runtime": 157.7332, "eval_samples_per_second": 63.398, "eval_steps_per_second": 0.501, "step": 55000 }, { "epoch": 1.0398171583997582, "grad_norm": 0.039395008236169815, "learning_rate": 5.1990857919987915e-05, "loss": 0.1377, "step": 55050 }, { "epoch": 1.0407615881530732, "grad_norm": 0.03847438097000122, "learning_rate": 5.203807940765366e-05, "loss": 0.1383, "step": 55100 }, { "epoch": 1.0417060179063882, "grad_norm": 0.036816053092479706, "learning_rate": 5.208530089531941e-05, "loss": 0.1383, "step": 55150 }, { "epoch": 1.0426504476597032, "grad_norm": 0.036829713732004166, "learning_rate": 5.213252238298516e-05, "loss": 0.1379, "step": 55200 }, { "epoch": 1.043594877413018, "grad_norm": 0.03585440292954445, "learning_rate": 5.21797438706509e-05, "loss": 0.1376, "step": 55250 }, { "epoch": 1.044539307166333, "grad_norm": 0.038517702370882034, "learning_rate": 5.2226965358316645e-05, "loss": 0.1374, "step": 55300 }, { "epoch": 1.045483736919648, "grad_norm": 0.041327983140945435, "learning_rate": 5.22741868459824e-05, "loss": 0.1378, "step": 55350 }, { "epoch": 1.046428166672963, "grad_norm": 0.04428509250283241, "learning_rate": 5.232140833364815e-05, "loss": 0.1376, "step": 55400 }, { "epoch": 1.047372596426278, "grad_norm": 0.036376770585775375, "learning_rate": 5.2368629821313894e-05, "loss": 0.1375, "step": 55450 }, { "epoch": 1.0483170261795927, "grad_norm": 0.0363369956612587, "learning_rate": 5.2415851308979635e-05, "loss": 0.1377, "step": 55500 }, { "epoch": 1.0492614559329076, "grad_norm": 0.03586459532380104, "learning_rate": 5.246307279664538e-05, "loss": 0.1377, "step": 55550 }, { "epoch": 1.0502058856862226, "grad_norm": 0.03982817754149437, "learning_rate": 5.2510294284311137e-05, "loss": 0.138, "step": 55600 }, { "epoch": 1.0511503154395376, "grad_norm": 0.03734296187758446, "learning_rate": 5.2557515771976884e-05, "loss": 0.1379, "step": 55650 }, { "epoch": 1.0520947451928526, "grad_norm": 0.03519356623291969, "learning_rate": 5.260473725964263e-05, "loss": 0.1378, "step": 55700 }, { "epoch": 1.0530391749461676, "grad_norm": 0.037280354648828506, "learning_rate": 5.2651958747308386e-05, "loss": 0.1373, "step": 55750 }, { "epoch": 1.0539836046994824, "grad_norm": 0.036873992532491684, "learning_rate": 5.269918023497412e-05, "loss": 0.1378, "step": 55800 }, { "epoch": 1.0549280344527974, "grad_norm": 0.036729902029037476, "learning_rate": 5.2746401722639874e-05, "loss": 0.1379, "step": 55850 }, { "epoch": 1.0558724642061124, "grad_norm": 0.038911670446395874, "learning_rate": 5.279362321030562e-05, "loss": 0.1373, "step": 55900 }, { "epoch": 1.0568168939594274, "grad_norm": 0.037409767508506775, "learning_rate": 5.284084469797137e-05, "loss": 0.1374, "step": 55950 }, { "epoch": 1.0577613237127423, "grad_norm": 0.037427641451358795, "learning_rate": 5.288806618563712e-05, "loss": 0.1374, "step": 56000 }, { "epoch": 1.058705753466057, "grad_norm": 0.0359816774725914, "learning_rate": 5.293528767330286e-05, "loss": 0.1374, "step": 56050 }, { "epoch": 1.059650183219372, "grad_norm": 0.04195936396718025, "learning_rate": 5.298250916096861e-05, "loss": 0.1372, "step": 56100 }, { "epoch": 1.060594612972687, "grad_norm": 0.037752218544483185, "learning_rate": 5.302973064863436e-05, "loss": 0.1375, "step": 56150 }, { "epoch": 1.061539042726002, "grad_norm": 0.03472720831632614, "learning_rate": 5.3076952136300106e-05, "loss": 0.1375, "step": 56200 }, { "epoch": 1.062483472479317, "grad_norm": 0.03415931388735771, "learning_rate": 5.312417362396585e-05, "loss": 0.1373, "step": 56250 }, { "epoch": 1.0634279022326318, "grad_norm": 0.03713837265968323, "learning_rate": 5.3171395111631594e-05, "loss": 0.1377, "step": 56300 }, { "epoch": 1.0643723319859468, "grad_norm": 0.03562706336379051, "learning_rate": 5.321861659929734e-05, "loss": 0.1378, "step": 56350 }, { "epoch": 1.0653167617392618, "grad_norm": 0.03607762232422829, "learning_rate": 5.3265838086963095e-05, "loss": 0.1376, "step": 56400 }, { "epoch": 1.0662611914925768, "grad_norm": 0.035964932292699814, "learning_rate": 5.331305957462884e-05, "loss": 0.1372, "step": 56450 }, { "epoch": 1.0672056212458918, "grad_norm": 0.03449541702866554, "learning_rate": 5.336028106229459e-05, "loss": 0.1372, "step": 56500 }, { "epoch": 1.0681500509992068, "grad_norm": 0.03636105731129646, "learning_rate": 5.340750254996033e-05, "loss": 0.1378, "step": 56550 }, { "epoch": 1.0690944807525216, "grad_norm": 0.03516547009348869, "learning_rate": 5.345472403762608e-05, "loss": 0.1375, "step": 56600 }, { "epoch": 1.0700389105058365, "grad_norm": 0.04242686927318573, "learning_rate": 5.350194552529183e-05, "loss": 0.1376, "step": 56650 }, { "epoch": 1.0709833402591515, "grad_norm": 0.03984222561120987, "learning_rate": 5.354916701295758e-05, "loss": 0.1371, "step": 56700 }, { "epoch": 1.0719277700124665, "grad_norm": 0.03659963607788086, "learning_rate": 5.359638850062333e-05, "loss": 0.138, "step": 56750 }, { "epoch": 1.0728721997657815, "grad_norm": 0.03971521556377411, "learning_rate": 5.364360998828908e-05, "loss": 0.1372, "step": 56800 }, { "epoch": 1.0738166295190963, "grad_norm": 0.038986727595329285, "learning_rate": 5.3690831475954815e-05, "loss": 0.1375, "step": 56850 }, { "epoch": 1.0747610592724113, "grad_norm": 0.03840917721390724, "learning_rate": 5.373805296362057e-05, "loss": 0.1371, "step": 56900 }, { "epoch": 1.0757054890257263, "grad_norm": 0.03663348779082298, "learning_rate": 5.378527445128632e-05, "loss": 0.1375, "step": 56950 }, { "epoch": 1.0766499187790413, "grad_norm": 0.038384273648262024, "learning_rate": 5.3832495938952064e-05, "loss": 0.1374, "step": 57000 }, { "epoch": 1.0775943485323562, "grad_norm": 0.03782375901937485, "learning_rate": 5.387971742661781e-05, "loss": 0.1376, "step": 57050 }, { "epoch": 1.078538778285671, "grad_norm": 0.03748658299446106, "learning_rate": 5.392693891428355e-05, "loss": 0.1373, "step": 57100 }, { "epoch": 1.079483208038986, "grad_norm": 0.03759084641933441, "learning_rate": 5.39741604019493e-05, "loss": 0.1371, "step": 57150 }, { "epoch": 1.080427637792301, "grad_norm": 0.03753111511468887, "learning_rate": 5.4021381889615054e-05, "loss": 0.1375, "step": 57200 }, { "epoch": 1.081372067545616, "grad_norm": 0.03788271173834801, "learning_rate": 5.40686033772808e-05, "loss": 0.1375, "step": 57250 }, { "epoch": 1.082316497298931, "grad_norm": 0.0387134812772274, "learning_rate": 5.411582486494655e-05, "loss": 0.1366, "step": 57300 }, { "epoch": 1.0832609270522457, "grad_norm": 0.03641972690820694, "learning_rate": 5.416304635261229e-05, "loss": 0.1374, "step": 57350 }, { "epoch": 1.0842053568055607, "grad_norm": 0.0381280854344368, "learning_rate": 5.421026784027804e-05, "loss": 0.1372, "step": 57400 }, { "epoch": 1.0851497865588757, "grad_norm": 0.04020897299051285, "learning_rate": 5.425748932794379e-05, "loss": 0.1373, "step": 57450 }, { "epoch": 1.0860942163121907, "grad_norm": 0.034675512462854385, "learning_rate": 5.430471081560954e-05, "loss": 0.1371, "step": 57500 }, { "epoch": 1.0860942163121907, "eval_IntDiv": 0.6742774827487583, "eval_NumCircles": 1789, "eval_SumBottleneck": 113.21185507190121, "eval_Uniqueness": 0.9967095115681234, "eval_Validity": 0.9725, "eval_Validity * Uniqueness": 0.9693, "eval_loss": 0.21944023668766022, "eval_runtime": 194.4665, "eval_samples_per_second": 51.423, "eval_steps_per_second": 0.406, "step": 57500 }, { "epoch": 1.0870386460655057, "grad_norm": 0.03668108209967613, "learning_rate": 5.4351932303275286e-05, "loss": 0.1371, "step": 57550 }, { "epoch": 1.0879830758188207, "grad_norm": 0.03607726842164993, "learning_rate": 5.439915379094104e-05, "loss": 0.1373, "step": 57600 }, { "epoch": 1.0889275055721355, "grad_norm": 0.03482838347554207, "learning_rate": 5.4446375278606774e-05, "loss": 0.137, "step": 57650 }, { "epoch": 1.0898719353254505, "grad_norm": 0.03893599286675453, "learning_rate": 5.449359676627253e-05, "loss": 0.137, "step": 57700 }, { "epoch": 1.0908163650787654, "grad_norm": 0.037262577563524246, "learning_rate": 5.4540818253938276e-05, "loss": 0.1375, "step": 57750 }, { "epoch": 1.0917607948320804, "grad_norm": 0.0471830889582634, "learning_rate": 5.458803974160402e-05, "loss": 0.1371, "step": 57800 }, { "epoch": 1.0927052245853954, "grad_norm": 0.03907244652509689, "learning_rate": 5.463526122926977e-05, "loss": 0.1367, "step": 57850 }, { "epoch": 1.0936496543387102, "grad_norm": 0.03623643517494202, "learning_rate": 5.468248271693551e-05, "loss": 0.1372, "step": 57900 }, { "epoch": 1.0945940840920252, "grad_norm": 0.039610110223293304, "learning_rate": 5.472970420460126e-05, "loss": 0.1368, "step": 57950 }, { "epoch": 1.0955385138453402, "grad_norm": 0.03613843023777008, "learning_rate": 5.477692569226701e-05, "loss": 0.1371, "step": 58000 }, { "epoch": 1.0964829435986552, "grad_norm": 0.03665653243660927, "learning_rate": 5.482414717993276e-05, "loss": 0.1373, "step": 58050 }, { "epoch": 1.0974273733519702, "grad_norm": 0.03719150274991989, "learning_rate": 5.487136866759851e-05, "loss": 0.137, "step": 58100 }, { "epoch": 1.098371803105285, "grad_norm": 0.034522347152233124, "learning_rate": 5.491859015526425e-05, "loss": 0.1369, "step": 58150 }, { "epoch": 1.0993162328586, "grad_norm": 0.03722520172595978, "learning_rate": 5.4965811642929996e-05, "loss": 0.1369, "step": 58200 }, { "epoch": 1.100260662611915, "grad_norm": 0.03598468005657196, "learning_rate": 5.501303313059575e-05, "loss": 0.1366, "step": 58250 }, { "epoch": 1.10120509236523, "grad_norm": 0.03555673360824585, "learning_rate": 5.50602546182615e-05, "loss": 0.1365, "step": 58300 }, { "epoch": 1.1021495221185449, "grad_norm": 0.03569438308477402, "learning_rate": 5.5107476105927245e-05, "loss": 0.1366, "step": 58350 }, { "epoch": 1.1030939518718599, "grad_norm": 0.03701993450522423, "learning_rate": 5.5154697593593e-05, "loss": 0.1366, "step": 58400 }, { "epoch": 1.1040383816251746, "grad_norm": 0.036263953894376755, "learning_rate": 5.520191908125873e-05, "loss": 0.137, "step": 58450 }, { "epoch": 1.1049828113784896, "grad_norm": 0.03877771273255348, "learning_rate": 5.524914056892449e-05, "loss": 0.1368, "step": 58500 }, { "epoch": 1.1059272411318046, "grad_norm": 0.040634557604789734, "learning_rate": 5.5296362056590235e-05, "loss": 0.1367, "step": 58550 }, { "epoch": 1.1068716708851196, "grad_norm": 0.03558093681931496, "learning_rate": 5.534358354425598e-05, "loss": 0.1371, "step": 58600 }, { "epoch": 1.1078161006384346, "grad_norm": 0.03728151693940163, "learning_rate": 5.5390805031921736e-05, "loss": 0.1364, "step": 58650 }, { "epoch": 1.1087605303917494, "grad_norm": 0.035506751388311386, "learning_rate": 5.543802651958747e-05, "loss": 0.1372, "step": 58700 }, { "epoch": 1.1097049601450644, "grad_norm": 0.03539331629872322, "learning_rate": 5.5485248007253224e-05, "loss": 0.1363, "step": 58750 }, { "epoch": 1.1106493898983794, "grad_norm": 0.036371100693941116, "learning_rate": 5.553246949491897e-05, "loss": 0.1364, "step": 58800 }, { "epoch": 1.1115938196516943, "grad_norm": 0.03688681870698929, "learning_rate": 5.557969098258472e-05, "loss": 0.1365, "step": 58850 }, { "epoch": 1.1125382494050093, "grad_norm": 0.03523973375558853, "learning_rate": 5.562691247025047e-05, "loss": 0.1371, "step": 58900 }, { "epoch": 1.113482679158324, "grad_norm": 0.03621154651045799, "learning_rate": 5.567413395791621e-05, "loss": 0.1367, "step": 58950 }, { "epoch": 1.114427108911639, "grad_norm": 0.036918241530656815, "learning_rate": 5.5721355445581955e-05, "loss": 0.1364, "step": 59000 }, { "epoch": 1.115371538664954, "grad_norm": 0.038820780813694, "learning_rate": 5.576857693324771e-05, "loss": 0.1368, "step": 59050 }, { "epoch": 1.116315968418269, "grad_norm": 0.03686409816145897, "learning_rate": 5.5815798420913456e-05, "loss": 0.1369, "step": 59100 }, { "epoch": 1.117260398171584, "grad_norm": 0.038500700145959854, "learning_rate": 5.5863019908579204e-05, "loss": 0.1363, "step": 59150 }, { "epoch": 1.1182048279248988, "grad_norm": 0.03491613268852234, "learning_rate": 5.5910241396244944e-05, "loss": 0.1364, "step": 59200 }, { "epoch": 1.1191492576782138, "grad_norm": 0.03521444648504257, "learning_rate": 5.595746288391069e-05, "loss": 0.1361, "step": 59250 }, { "epoch": 1.1200936874315288, "grad_norm": 0.036053046584129333, "learning_rate": 5.6004684371576446e-05, "loss": 0.1366, "step": 59300 }, { "epoch": 1.1210381171848438, "grad_norm": 0.037523869425058365, "learning_rate": 5.6051905859242193e-05, "loss": 0.1365, "step": 59350 }, { "epoch": 1.1219825469381588, "grad_norm": 0.037330202758312225, "learning_rate": 5.609912734690794e-05, "loss": 0.1369, "step": 59400 }, { "epoch": 1.1229269766914738, "grad_norm": 0.03546906262636185, "learning_rate": 5.6146348834573695e-05, "loss": 0.1363, "step": 59450 }, { "epoch": 1.1238714064447886, "grad_norm": 0.03518075868487358, "learning_rate": 5.619357032223943e-05, "loss": 0.1366, "step": 59500 }, { "epoch": 1.1248158361981035, "grad_norm": 0.035837139934301376, "learning_rate": 5.624079180990518e-05, "loss": 0.1362, "step": 59550 }, { "epoch": 1.1257602659514185, "grad_norm": 0.0387086346745491, "learning_rate": 5.628801329757093e-05, "loss": 0.1365, "step": 59600 }, { "epoch": 1.1267046957047335, "grad_norm": 0.035501640290021896, "learning_rate": 5.633523478523668e-05, "loss": 0.1369, "step": 59650 }, { "epoch": 1.1276491254580485, "grad_norm": 0.03591162711381912, "learning_rate": 5.6382456272902425e-05, "loss": 0.1363, "step": 59700 }, { "epoch": 1.1285935552113633, "grad_norm": 0.03549930453300476, "learning_rate": 5.6429677760568166e-05, "loss": 0.1364, "step": 59750 }, { "epoch": 1.1295379849646783, "grad_norm": 0.03753489628434181, "learning_rate": 5.6476899248233914e-05, "loss": 0.1358, "step": 59800 }, { "epoch": 1.1304824147179933, "grad_norm": 0.03640427440404892, "learning_rate": 5.652412073589967e-05, "loss": 0.1365, "step": 59850 }, { "epoch": 1.1314268444713083, "grad_norm": 0.03651903197169304, "learning_rate": 5.6571342223565415e-05, "loss": 0.1363, "step": 59900 }, { "epoch": 1.1323712742246232, "grad_norm": 0.035612963140010834, "learning_rate": 5.661856371123116e-05, "loss": 0.1363, "step": 59950 }, { "epoch": 1.1333157039779382, "grad_norm": 0.036024708300828934, "learning_rate": 5.66657851988969e-05, "loss": 0.1361, "step": 60000 }, { "epoch": 1.1333157039779382, "eval_IntDiv": 0.6762442299141248, "eval_NumCircles": 1886, "eval_SumBottleneck": 88.66690272945793, "eval_Uniqueness": 0.9965024174467647, "eval_Validity": 0.9721, "eval_Validity * Uniqueness": 0.9686999999999999, "eval_loss": 0.2209620624780655, "eval_runtime": 180.4783, "eval_samples_per_second": 55.408, "eval_steps_per_second": 0.438, "step": 60000 }, { "epoch": 1.134260133731253, "grad_norm": 0.03587483987212181, "learning_rate": 5.671300668656265e-05, "loss": 0.1369, "step": 60050 }, { "epoch": 1.135204563484568, "grad_norm": 0.03470418602228165, "learning_rate": 5.6760228174228405e-05, "loss": 0.1359, "step": 60100 }, { "epoch": 1.136148993237883, "grad_norm": 0.03662164509296417, "learning_rate": 5.680744966189415e-05, "loss": 0.1363, "step": 60150 }, { "epoch": 1.137093422991198, "grad_norm": 0.03663404658436775, "learning_rate": 5.68546711495599e-05, "loss": 0.137, "step": 60200 }, { "epoch": 1.138037852744513, "grad_norm": 0.036474984139204025, "learning_rate": 5.6901892637225654e-05, "loss": 0.136, "step": 60250 }, { "epoch": 1.1389822824978277, "grad_norm": 0.035823922604322433, "learning_rate": 5.694911412489139e-05, "loss": 0.136, "step": 60300 }, { "epoch": 1.1399267122511427, "grad_norm": 0.03702053427696228, "learning_rate": 5.699633561255714e-05, "loss": 0.1367, "step": 60350 }, { "epoch": 1.1408711420044577, "grad_norm": 0.040692172944545746, "learning_rate": 5.704355710022289e-05, "loss": 0.1361, "step": 60400 }, { "epoch": 1.1418155717577727, "grad_norm": 0.036827363073825836, "learning_rate": 5.709077858788864e-05, "loss": 0.1362, "step": 60450 }, { "epoch": 1.1427600015110877, "grad_norm": 0.036160483956336975, "learning_rate": 5.7138000075554384e-05, "loss": 0.1361, "step": 60500 }, { "epoch": 1.1437044312644025, "grad_norm": 0.03658226132392883, "learning_rate": 5.7185221563220125e-05, "loss": 0.1364, "step": 60550 }, { "epoch": 1.1446488610177175, "grad_norm": 0.034424107521772385, "learning_rate": 5.723244305088587e-05, "loss": 0.1364, "step": 60600 }, { "epoch": 1.1455932907710324, "grad_norm": 0.03725495934486389, "learning_rate": 5.7279664538551627e-05, "loss": 0.1359, "step": 60650 }, { "epoch": 1.1465377205243474, "grad_norm": 0.03598535805940628, "learning_rate": 5.7326886026217374e-05, "loss": 0.1363, "step": 60700 }, { "epoch": 1.1474821502776624, "grad_norm": 0.03551675006747246, "learning_rate": 5.737410751388312e-05, "loss": 0.1362, "step": 60750 }, { "epoch": 1.1484265800309772, "grad_norm": 0.036639291793107986, "learning_rate": 5.742132900154886e-05, "loss": 0.1361, "step": 60800 }, { "epoch": 1.1493710097842922, "grad_norm": 0.03737671673297882, "learning_rate": 5.746855048921461e-05, "loss": 0.1362, "step": 60850 }, { "epoch": 1.1503154395376072, "grad_norm": 0.03501415252685547, "learning_rate": 5.7515771976880364e-05, "loss": 0.1363, "step": 60900 }, { "epoch": 1.1512598692909222, "grad_norm": 0.03903467208147049, "learning_rate": 5.756299346454611e-05, "loss": 0.1362, "step": 60950 }, { "epoch": 1.1522042990442372, "grad_norm": 0.03609508275985718, "learning_rate": 5.761021495221186e-05, "loss": 0.1359, "step": 61000 }, { "epoch": 1.153148728797552, "grad_norm": 0.03569348528981209, "learning_rate": 5.765743643987761e-05, "loss": 0.1362, "step": 61050 }, { "epoch": 1.154093158550867, "grad_norm": 0.035456396639347076, "learning_rate": 5.7704657927543347e-05, "loss": 0.1362, "step": 61100 }, { "epoch": 1.155037588304182, "grad_norm": 0.035628750920295715, "learning_rate": 5.77518794152091e-05, "loss": 0.1363, "step": 61150 }, { "epoch": 1.155982018057497, "grad_norm": 0.036210838705301285, "learning_rate": 5.779910090287485e-05, "loss": 0.1362, "step": 61200 }, { "epoch": 1.1569264478108119, "grad_norm": 0.03647904843091965, "learning_rate": 5.7846322390540596e-05, "loss": 0.1361, "step": 61250 }, { "epoch": 1.1578708775641269, "grad_norm": 0.03647620603442192, "learning_rate": 5.789354387820635e-05, "loss": 0.1359, "step": 61300 }, { "epoch": 1.1588153073174416, "grad_norm": 0.038710832595825195, "learning_rate": 5.7940765365872084e-05, "loss": 0.1363, "step": 61350 }, { "epoch": 1.1597597370707566, "grad_norm": 0.036215074360370636, "learning_rate": 5.798798685353784e-05, "loss": 0.1356, "step": 61400 }, { "epoch": 1.1607041668240716, "grad_norm": 0.03546201065182686, "learning_rate": 5.8035208341203585e-05, "loss": 0.1357, "step": 61450 }, { "epoch": 1.1616485965773866, "grad_norm": 0.03394092991948128, "learning_rate": 5.808242982886933e-05, "loss": 0.1359, "step": 61500 }, { "epoch": 1.1625930263307016, "grad_norm": 0.03701433166861534, "learning_rate": 5.812965131653508e-05, "loss": 0.1356, "step": 61550 }, { "epoch": 1.1635374560840164, "grad_norm": 0.04164905101060867, "learning_rate": 5.817687280420082e-05, "loss": 0.1363, "step": 61600 }, { "epoch": 1.1644818858373314, "grad_norm": 0.03765246644616127, "learning_rate": 5.822409429186657e-05, "loss": 0.136, "step": 61650 }, { "epoch": 1.1654263155906464, "grad_norm": 0.036890242248773575, "learning_rate": 5.827131577953232e-05, "loss": 0.136, "step": 61700 }, { "epoch": 1.1663707453439613, "grad_norm": 0.051052697002887726, "learning_rate": 5.831853726719807e-05, "loss": 0.1379, "step": 61750 }, { "epoch": 1.1673151750972763, "grad_norm": 0.038583334535360336, "learning_rate": 5.836575875486382e-05, "loss": 0.1367, "step": 61800 }, { "epoch": 1.1682596048505913, "grad_norm": 0.034067314118146896, "learning_rate": 5.841298024252956e-05, "loss": 0.1361, "step": 61850 }, { "epoch": 1.169204034603906, "grad_norm": 0.03614311292767525, "learning_rate": 5.8460201730195305e-05, "loss": 0.1359, "step": 61900 }, { "epoch": 1.170148464357221, "grad_norm": 0.03772439435124397, "learning_rate": 5.850742321786106e-05, "loss": 0.1356, "step": 61950 }, { "epoch": 1.171092894110536, "grad_norm": 0.03571084141731262, "learning_rate": 5.855464470552681e-05, "loss": 0.1358, "step": 62000 }, { "epoch": 1.172037323863851, "grad_norm": 0.03504854068160057, "learning_rate": 5.8601866193192554e-05, "loss": 0.1355, "step": 62050 }, { "epoch": 1.172981753617166, "grad_norm": 0.03524783253669739, "learning_rate": 5.864908768085831e-05, "loss": 0.1361, "step": 62100 }, { "epoch": 1.1739261833704808, "grad_norm": 0.03389600291848183, "learning_rate": 5.869630916852404e-05, "loss": 0.1356, "step": 62150 }, { "epoch": 1.1748706131237958, "grad_norm": 0.035194918513298035, "learning_rate": 5.87435306561898e-05, "loss": 0.1355, "step": 62200 }, { "epoch": 1.1758150428771108, "grad_norm": 0.03430324047803879, "learning_rate": 5.8790752143855544e-05, "loss": 0.1358, "step": 62250 }, { "epoch": 1.1767594726304258, "grad_norm": 0.0352756641805172, "learning_rate": 5.883797363152129e-05, "loss": 0.1357, "step": 62300 }, { "epoch": 1.1777039023837408, "grad_norm": 0.03489551693201065, "learning_rate": 5.888519511918704e-05, "loss": 0.1358, "step": 62350 }, { "epoch": 1.1786483321370556, "grad_norm": 0.03515790402889252, "learning_rate": 5.893241660685278e-05, "loss": 0.1354, "step": 62400 }, { "epoch": 1.1795927618903705, "grad_norm": 0.03738376125693321, "learning_rate": 5.897963809451853e-05, "loss": 0.135, "step": 62450 }, { "epoch": 1.1805371916436855, "grad_norm": 0.03577751666307449, "learning_rate": 5.902685958218428e-05, "loss": 0.1352, "step": 62500 }, { "epoch": 1.1805371916436855, "eval_IntDiv": 0.6742244350015371, "eval_NumCircles": 1820, "eval_SumBottleneck": 121.79448463999132, "eval_Uniqueness": 0.9973385198075545, "eval_Validity": 0.9769, "eval_Validity * Uniqueness": 0.9742999999999999, "eval_loss": 0.21928857266902924, "eval_runtime": 166.3308, "eval_samples_per_second": 60.121, "eval_steps_per_second": 0.475, "step": 62500 }, { "epoch": 1.1814816213970005, "grad_norm": 0.03618369996547699, "learning_rate": 5.907408106985003e-05, "loss": 0.1358, "step": 62550 }, { "epoch": 1.1824260511503155, "grad_norm": 0.03671099618077278, "learning_rate": 5.9121302557515776e-05, "loss": 0.1355, "step": 62600 }, { "epoch": 1.1833704809036303, "grad_norm": 0.03520066663622856, "learning_rate": 5.916852404518152e-05, "loss": 0.1352, "step": 62650 }, { "epoch": 1.1843149106569453, "grad_norm": 0.03716987371444702, "learning_rate": 5.9215745532847264e-05, "loss": 0.1355, "step": 62700 }, { "epoch": 1.1852593404102603, "grad_norm": 0.0351952463388443, "learning_rate": 5.926296702051302e-05, "loss": 0.1354, "step": 62750 }, { "epoch": 1.1862037701635753, "grad_norm": 0.03668035939335823, "learning_rate": 5.9310188508178766e-05, "loss": 0.1353, "step": 62800 }, { "epoch": 1.1871481999168902, "grad_norm": 0.03677074983716011, "learning_rate": 5.935740999584451e-05, "loss": 0.1352, "step": 62850 }, { "epoch": 1.188092629670205, "grad_norm": 0.034637849777936935, "learning_rate": 5.940463148351027e-05, "loss": 0.1355, "step": 62900 }, { "epoch": 1.18903705942352, "grad_norm": 0.03460422530770302, "learning_rate": 5.9451852971176e-05, "loss": 0.1354, "step": 62950 }, { "epoch": 1.189981489176835, "grad_norm": 0.03800395503640175, "learning_rate": 5.9499074458841755e-05, "loss": 0.1355, "step": 63000 }, { "epoch": 1.19092591893015, "grad_norm": 0.039297718554735184, "learning_rate": 5.95462959465075e-05, "loss": 0.1355, "step": 63050 }, { "epoch": 1.191870348683465, "grad_norm": 0.03711273893713951, "learning_rate": 5.959351743417325e-05, "loss": 0.1352, "step": 63100 }, { "epoch": 1.19281477843678, "grad_norm": 0.03804107755422592, "learning_rate": 5.9640738921839e-05, "loss": 0.1355, "step": 63150 }, { "epoch": 1.1937592081900947, "grad_norm": 0.03606366738677025, "learning_rate": 5.968796040950474e-05, "loss": 0.1354, "step": 63200 }, { "epoch": 1.1947036379434097, "grad_norm": 0.033525168895721436, "learning_rate": 5.9735181897170486e-05, "loss": 0.135, "step": 63250 }, { "epoch": 1.1956480676967247, "grad_norm": 0.03761378675699234, "learning_rate": 5.978240338483624e-05, "loss": 0.1356, "step": 63300 }, { "epoch": 1.1965924974500397, "grad_norm": 0.037442829459905624, "learning_rate": 5.982962487250199e-05, "loss": 0.1354, "step": 63350 }, { "epoch": 1.1975369272033547, "grad_norm": 0.035100825130939484, "learning_rate": 5.9876846360167735e-05, "loss": 0.1356, "step": 63400 }, { "epoch": 1.1984813569566697, "grad_norm": 0.0362405925989151, "learning_rate": 5.9924067847833476e-05, "loss": 0.1352, "step": 63450 }, { "epoch": 1.1994257867099845, "grad_norm": 0.03596195578575134, "learning_rate": 5.997128933549922e-05, "loss": 0.1352, "step": 63500 }, { "epoch": 1.2003702164632994, "grad_norm": 0.03574448078870773, "learning_rate": 6.001851082316498e-05, "loss": 0.1352, "step": 63550 }, { "epoch": 1.2013146462166144, "grad_norm": 0.03387679532170296, "learning_rate": 6.0065732310830725e-05, "loss": 0.1354, "step": 63600 }, { "epoch": 1.2022590759699294, "grad_norm": 0.03756575658917427, "learning_rate": 6.011295379849647e-05, "loss": 0.1349, "step": 63650 }, { "epoch": 1.2032035057232444, "grad_norm": 0.03488316386938095, "learning_rate": 6.0160175286162226e-05, "loss": 0.1357, "step": 63700 }, { "epoch": 1.2041479354765592, "grad_norm": 0.034471701830625534, "learning_rate": 6.020739677382796e-05, "loss": 0.135, "step": 63750 }, { "epoch": 1.2050923652298742, "grad_norm": 0.03792346268892288, "learning_rate": 6.0254618261493714e-05, "loss": 0.1353, "step": 63800 }, { "epoch": 1.2060367949831892, "grad_norm": 0.03445810452103615, "learning_rate": 6.030183974915946e-05, "loss": 0.1354, "step": 63850 }, { "epoch": 1.2069812247365042, "grad_norm": 0.03608221188187599, "learning_rate": 6.034906123682521e-05, "loss": 0.1354, "step": 63900 }, { "epoch": 1.2079256544898191, "grad_norm": 0.034803472459316254, "learning_rate": 6.039628272449096e-05, "loss": 0.1355, "step": 63950 }, { "epoch": 1.208870084243134, "grad_norm": 0.036331988871097565, "learning_rate": 6.04435042121567e-05, "loss": 0.135, "step": 64000 }, { "epoch": 1.209814513996449, "grad_norm": 0.03475756198167801, "learning_rate": 6.049072569982245e-05, "loss": 0.1348, "step": 64050 }, { "epoch": 1.210758943749764, "grad_norm": 0.03701501712203026, "learning_rate": 6.05379471874882e-05, "loss": 0.1354, "step": 64100 }, { "epoch": 1.2117033735030789, "grad_norm": 0.034120555967092514, "learning_rate": 6.0585168675153946e-05, "loss": 0.1351, "step": 64150 }, { "epoch": 1.2126478032563939, "grad_norm": 0.036551229655742645, "learning_rate": 6.0632390162819694e-05, "loss": 0.135, "step": 64200 }, { "epoch": 1.2135922330097086, "grad_norm": 0.034189194440841675, "learning_rate": 6.0679611650485434e-05, "loss": 0.1353, "step": 64250 }, { "epoch": 1.2145366627630236, "grad_norm": 0.03511236980557442, "learning_rate": 6.072683313815118e-05, "loss": 0.1354, "step": 64300 }, { "epoch": 1.2154810925163386, "grad_norm": 0.03575442358851433, "learning_rate": 6.0774054625816936e-05, "loss": 0.1352, "step": 64350 }, { "epoch": 1.2164255222696536, "grad_norm": 0.03568664938211441, "learning_rate": 6.0821276113482683e-05, "loss": 0.1354, "step": 64400 }, { "epoch": 1.2173699520229686, "grad_norm": 0.036859314888715744, "learning_rate": 6.086849760114843e-05, "loss": 0.1352, "step": 64450 }, { "epoch": 1.2183143817762834, "grad_norm": 0.03856856748461723, "learning_rate": 6.091571908881417e-05, "loss": 0.1351, "step": 64500 }, { "epoch": 1.2192588115295984, "grad_norm": 0.03419310599565506, "learning_rate": 6.096294057647992e-05, "loss": 0.1348, "step": 64550 }, { "epoch": 1.2202032412829134, "grad_norm": 0.035029299557209015, "learning_rate": 6.101016206414567e-05, "loss": 0.135, "step": 64600 }, { "epoch": 1.2211476710362283, "grad_norm": 0.03383321687579155, "learning_rate": 6.105738355181141e-05, "loss": 0.1353, "step": 64650 }, { "epoch": 1.2220921007895433, "grad_norm": 0.03418998792767525, "learning_rate": 6.110460503947717e-05, "loss": 0.1351, "step": 64700 }, { "epoch": 1.223036530542858, "grad_norm": 0.03458826243877411, "learning_rate": 6.115182652714292e-05, "loss": 0.1352, "step": 64750 }, { "epoch": 1.223980960296173, "grad_norm": 0.0356961153447628, "learning_rate": 6.119904801480866e-05, "loss": 0.135, "step": 64800 }, { "epoch": 1.224925390049488, "grad_norm": 0.037634965032339096, "learning_rate": 6.12462695024744e-05, "loss": 0.1348, "step": 64850 }, { "epoch": 1.225869819802803, "grad_norm": 0.04084901511669159, "learning_rate": 6.129349099014016e-05, "loss": 0.135, "step": 64900 }, { "epoch": 1.226814249556118, "grad_norm": 0.03546953573822975, "learning_rate": 6.134071247780591e-05, "loss": 0.1352, "step": 64950 }, { "epoch": 1.227758679309433, "grad_norm": 0.034587062895298004, "learning_rate": 6.138793396547165e-05, "loss": 0.1347, "step": 65000 }, { "epoch": 1.227758679309433, "eval_IntDiv": 0.6728725581070658, "eval_NumCircles": 1778, "eval_SumBottleneck": 120.18610082384086, "eval_Uniqueness": 0.996629213483146, "eval_Validity": 0.979, "eval_Validity * Uniqueness": 0.9756999999999999, "eval_loss": 0.2206730842590332, "eval_runtime": 146.1655, "eval_samples_per_second": 68.416, "eval_steps_per_second": 0.54, "step": 65000 }, { "epoch": 1.2287031090627478, "grad_norm": 0.03470972552895546, "learning_rate": 6.143515545313739e-05, "loss": 0.1354, "step": 65050 }, { "epoch": 1.2296475388160628, "grad_norm": 0.033624790608882904, "learning_rate": 6.148237694080315e-05, "loss": 0.1352, "step": 65100 }, { "epoch": 1.2305919685693778, "grad_norm": 0.03591257706284523, "learning_rate": 6.152959842846889e-05, "loss": 0.1348, "step": 65150 }, { "epoch": 1.2315363983226928, "grad_norm": 0.034969400614500046, "learning_rate": 6.157681991613464e-05, "loss": 0.1349, "step": 65200 }, { "epoch": 1.2324808280760078, "grad_norm": 0.03489504009485245, "learning_rate": 6.16240414038004e-05, "loss": 0.1347, "step": 65250 }, { "epoch": 1.2334252578293228, "grad_norm": 0.035852398723363876, "learning_rate": 6.167126289146614e-05, "loss": 0.1348, "step": 65300 }, { "epoch": 1.2343696875826375, "grad_norm": 0.03804373741149902, "learning_rate": 6.171848437913188e-05, "loss": 0.1344, "step": 65350 }, { "epoch": 1.2353141173359525, "grad_norm": 0.03336457535624504, "learning_rate": 6.176570586679763e-05, "loss": 0.1347, "step": 65400 }, { "epoch": 1.2362585470892675, "grad_norm": 0.03647491708397865, "learning_rate": 6.181292735446337e-05, "loss": 0.1349, "step": 65450 }, { "epoch": 1.2372029768425825, "grad_norm": 0.03604920580983162, "learning_rate": 6.186014884212913e-05, "loss": 0.1348, "step": 65500 }, { "epoch": 1.2381474065958975, "grad_norm": 0.03588010370731354, "learning_rate": 6.190737032979488e-05, "loss": 0.1346, "step": 65550 }, { "epoch": 1.2390918363492123, "grad_norm": 0.03668217733502388, "learning_rate": 6.195459181746062e-05, "loss": 0.1346, "step": 65600 }, { "epoch": 1.2400362661025273, "grad_norm": 0.03587242215871811, "learning_rate": 6.200181330512636e-05, "loss": 0.1346, "step": 65650 }, { "epoch": 1.2409806958558423, "grad_norm": 0.03660496696829796, "learning_rate": 6.204903479279212e-05, "loss": 0.1344, "step": 65700 }, { "epoch": 1.2419251256091572, "grad_norm": 0.03644092008471489, "learning_rate": 6.209625628045787e-05, "loss": 0.1343, "step": 65750 }, { "epoch": 1.2428695553624722, "grad_norm": 0.03421618416905403, "learning_rate": 6.214347776812361e-05, "loss": 0.1342, "step": 65800 }, { "epoch": 1.243813985115787, "grad_norm": 0.03486258164048195, "learning_rate": 6.219069925578935e-05, "loss": 0.1349, "step": 65850 }, { "epoch": 1.244758414869102, "grad_norm": 0.038386937230825424, "learning_rate": 6.22379207434551e-05, "loss": 0.1342, "step": 65900 }, { "epoch": 1.245702844622417, "grad_norm": 0.035354457795619965, "learning_rate": 6.228514223112085e-05, "loss": 0.1348, "step": 65950 }, { "epoch": 1.246647274375732, "grad_norm": 0.03467836230993271, "learning_rate": 6.23323637187866e-05, "loss": 0.1345, "step": 66000 }, { "epoch": 1.247591704129047, "grad_norm": 0.039318446069955826, "learning_rate": 6.237958520645236e-05, "loss": 0.1351, "step": 66050 }, { "epoch": 1.2485361338823617, "grad_norm": 0.03876136615872383, "learning_rate": 6.24268066941181e-05, "loss": 0.1347, "step": 66100 }, { "epoch": 1.2494805636356767, "grad_norm": 0.034266602247953415, "learning_rate": 6.247402818178384e-05, "loss": 0.1347, "step": 66150 }, { "epoch": 1.2504249933889917, "grad_norm": 0.043572522699832916, "learning_rate": 6.252124966944959e-05, "loss": 0.1344, "step": 66200 }, { "epoch": 1.2513694231423067, "grad_norm": 0.0357801727950573, "learning_rate": 6.256847115711534e-05, "loss": 0.1348, "step": 66250 }, { "epoch": 1.2523138528956217, "grad_norm": 0.03452853485941887, "learning_rate": 6.261569264478109e-05, "loss": 0.1346, "step": 66300 }, { "epoch": 1.2532582826489365, "grad_norm": 0.035646386444568634, "learning_rate": 6.266291413244683e-05, "loss": 0.1344, "step": 66350 }, { "epoch": 1.2542027124022515, "grad_norm": 0.03581445291638374, "learning_rate": 6.271013562011258e-05, "loss": 0.1348, "step": 66400 }, { "epoch": 1.2551471421555664, "grad_norm": 0.03603629767894745, "learning_rate": 6.275735710777832e-05, "loss": 0.135, "step": 66450 }, { "epoch": 1.2560915719088814, "grad_norm": 0.035187892615795135, "learning_rate": 6.280457859544408e-05, "loss": 0.1347, "step": 66500 }, { "epoch": 1.2570360016621964, "grad_norm": 0.03584189713001251, "learning_rate": 6.285180008310983e-05, "loss": 0.1345, "step": 66550 }, { "epoch": 1.2579804314155112, "grad_norm": 0.03309622034430504, "learning_rate": 6.289902157077557e-05, "loss": 0.1346, "step": 66600 }, { "epoch": 1.2589248611688262, "grad_norm": 0.035792406648397446, "learning_rate": 6.294624305844131e-05, "loss": 0.1344, "step": 66650 }, { "epoch": 1.2598692909221412, "grad_norm": 0.037292227149009705, "learning_rate": 6.299346454610706e-05, "loss": 0.1346, "step": 66700 }, { "epoch": 1.2608137206754562, "grad_norm": 0.03449574112892151, "learning_rate": 6.30406860337728e-05, "loss": 0.1348, "step": 66750 }, { "epoch": 1.2617581504287712, "grad_norm": 0.03661799058318138, "learning_rate": 6.308790752143856e-05, "loss": 0.1348, "step": 66800 }, { "epoch": 1.262702580182086, "grad_norm": 0.03684481978416443, "learning_rate": 6.313512900910431e-05, "loss": 0.1348, "step": 66850 }, { "epoch": 1.2636470099354011, "grad_norm": 0.03740385174751282, "learning_rate": 6.318235049677005e-05, "loss": 0.1349, "step": 66900 }, { "epoch": 1.264591439688716, "grad_norm": 0.03648831322789192, "learning_rate": 6.32295719844358e-05, "loss": 0.1344, "step": 66950 }, { "epoch": 1.265535869442031, "grad_norm": 0.03447984158992767, "learning_rate": 6.327679347210155e-05, "loss": 0.1339, "step": 67000 }, { "epoch": 1.2664802991953459, "grad_norm": 0.03470230475068092, "learning_rate": 6.33240149597673e-05, "loss": 0.1343, "step": 67050 }, { "epoch": 1.2674247289486609, "grad_norm": 0.0357542559504509, "learning_rate": 6.337123644743304e-05, "loss": 0.1349, "step": 67100 }, { "epoch": 1.2683691587019759, "grad_norm": 0.03521917387843132, "learning_rate": 6.341845793509878e-05, "loss": 0.1342, "step": 67150 }, { "epoch": 1.2693135884552906, "grad_norm": 0.033940766006708145, "learning_rate": 6.346567942276454e-05, "loss": 0.1341, "step": 67200 }, { "epoch": 1.2702580182086056, "grad_norm": 0.036328062415122986, "learning_rate": 6.351290091043028e-05, "loss": 0.1351, "step": 67250 }, { "epoch": 1.2712024479619206, "grad_norm": 0.03665727749466896, "learning_rate": 6.356012239809603e-05, "loss": 0.1341, "step": 67300 }, { "epoch": 1.2721468777152356, "grad_norm": 0.03458220139145851, "learning_rate": 6.360734388576179e-05, "loss": 0.1341, "step": 67350 }, { "epoch": 1.2730913074685506, "grad_norm": 0.036429692059755325, "learning_rate": 6.365456537342753e-05, "loss": 0.1343, "step": 67400 }, { "epoch": 1.2740357372218654, "grad_norm": 0.03453110530972481, "learning_rate": 6.370178686109327e-05, "loss": 0.1344, "step": 67450 }, { "epoch": 1.2749801669751804, "grad_norm": 0.03683925047516823, "learning_rate": 6.374900834875902e-05, "loss": 0.1345, "step": 67500 }, { "epoch": 1.2749801669751804, "eval_IntDiv": 0.6744969120595521, "eval_NumCircles": 1782, "eval_SumBottleneck": 78.07843472722837, "eval_Uniqueness": 0.9960248700438283, "eval_Validity": 0.9811, "eval_Validity * Uniqueness": 0.9772, "eval_loss": 0.2195402979850769, "eval_runtime": 185.4575, "eval_samples_per_second": 53.921, "eval_steps_per_second": 0.426, "step": 67500 }, { "epoch": 1.2759245967284953, "grad_norm": 0.03668908402323723, "learning_rate": 6.379622983642476e-05, "loss": 0.1342, "step": 67550 }, { "epoch": 1.2768690264818103, "grad_norm": 0.03842446953058243, "learning_rate": 6.384345132409052e-05, "loss": 0.1342, "step": 67600 }, { "epoch": 1.2778134562351253, "grad_norm": 0.032690659165382385, "learning_rate": 6.389067281175627e-05, "loss": 0.1341, "step": 67650 }, { "epoch": 1.27875788598844, "grad_norm": 0.034665271639823914, "learning_rate": 6.393789429942201e-05, "loss": 0.1342, "step": 67700 }, { "epoch": 1.279702315741755, "grad_norm": 0.03526727482676506, "learning_rate": 6.398511578708775e-05, "loss": 0.1339, "step": 67750 }, { "epoch": 1.28064674549507, "grad_norm": 0.034531448036432266, "learning_rate": 6.403233727475351e-05, "loss": 0.1342, "step": 67800 }, { "epoch": 1.281591175248385, "grad_norm": 0.03677108883857727, "learning_rate": 6.407955876241926e-05, "loss": 0.1343, "step": 67850 }, { "epoch": 1.2825356050017, "grad_norm": 0.03512340039014816, "learning_rate": 6.4126780250085e-05, "loss": 0.1342, "step": 67900 }, { "epoch": 1.2834800347550148, "grad_norm": 0.03522859141230583, "learning_rate": 6.417400173775074e-05, "loss": 0.1338, "step": 67950 }, { "epoch": 1.2844244645083298, "grad_norm": 0.03918865695595741, "learning_rate": 6.42212232254165e-05, "loss": 0.1338, "step": 68000 }, { "epoch": 1.2853688942616448, "grad_norm": 0.03585806488990784, "learning_rate": 6.426844471308224e-05, "loss": 0.1339, "step": 68050 }, { "epoch": 1.2863133240149598, "grad_norm": 0.03681211546063423, "learning_rate": 6.431566620074799e-05, "loss": 0.1343, "step": 68100 }, { "epoch": 1.2872577537682748, "grad_norm": 0.03411278873682022, "learning_rate": 6.436288768841375e-05, "loss": 0.1339, "step": 68150 }, { "epoch": 1.2882021835215895, "grad_norm": 0.03723642975091934, "learning_rate": 6.441010917607949e-05, "loss": 0.134, "step": 68200 }, { "epoch": 1.2891466132749045, "grad_norm": 0.03572777286171913, "learning_rate": 6.445733066374523e-05, "loss": 0.1343, "step": 68250 }, { "epoch": 1.2900910430282195, "grad_norm": 0.03607626259326935, "learning_rate": 6.450455215141098e-05, "loss": 0.1339, "step": 68300 }, { "epoch": 1.2910354727815345, "grad_norm": 0.0362374372780323, "learning_rate": 6.455177363907672e-05, "loss": 0.1344, "step": 68350 }, { "epoch": 1.2919799025348495, "grad_norm": 0.03370358422398567, "learning_rate": 6.459899512674248e-05, "loss": 0.1341, "step": 68400 }, { "epoch": 1.2929243322881643, "grad_norm": 0.037957437336444855, "learning_rate": 6.464621661440823e-05, "loss": 0.1339, "step": 68450 }, { "epoch": 1.2938687620414795, "grad_norm": 0.036816105246543884, "learning_rate": 6.469343810207397e-05, "loss": 0.1342, "step": 68500 }, { "epoch": 1.2948131917947943, "grad_norm": 0.03365691378712654, "learning_rate": 6.474065958973971e-05, "loss": 0.1337, "step": 68550 }, { "epoch": 1.2957576215481093, "grad_norm": 0.03756514936685562, "learning_rate": 6.478788107740547e-05, "loss": 0.1336, "step": 68600 }, { "epoch": 1.2967020513014242, "grad_norm": 0.03764648362994194, "learning_rate": 6.483510256507122e-05, "loss": 0.1342, "step": 68650 }, { "epoch": 1.2976464810547392, "grad_norm": 0.03453851118683815, "learning_rate": 6.488232405273696e-05, "loss": 0.1339, "step": 68700 }, { "epoch": 1.2985909108080542, "grad_norm": 0.035918571054935455, "learning_rate": 6.49295455404027e-05, "loss": 0.1341, "step": 68750 }, { "epoch": 1.299535340561369, "grad_norm": 0.03509676083922386, "learning_rate": 6.497676702806846e-05, "loss": 0.1337, "step": 68800 }, { "epoch": 1.300479770314684, "grad_norm": 0.036021579056978226, "learning_rate": 6.50239885157342e-05, "loss": 0.1343, "step": 68850 }, { "epoch": 1.301424200067999, "grad_norm": 0.0366428978741169, "learning_rate": 6.507121000339995e-05, "loss": 0.1341, "step": 68900 }, { "epoch": 1.302368629821314, "grad_norm": 0.03502330183982849, "learning_rate": 6.51184314910657e-05, "loss": 0.1339, "step": 68950 }, { "epoch": 1.303313059574629, "grad_norm": 0.03603357821702957, "learning_rate": 6.516565297873143e-05, "loss": 0.134, "step": 69000 }, { "epoch": 1.3042574893279437, "grad_norm": 0.03570196405053139, "learning_rate": 6.521287446639719e-05, "loss": 0.1337, "step": 69050 }, { "epoch": 1.3052019190812587, "grad_norm": 0.035346779972314835, "learning_rate": 6.526009595406294e-05, "loss": 0.1341, "step": 69100 }, { "epoch": 1.3061463488345737, "grad_norm": 0.033303964883089066, "learning_rate": 6.530731744172868e-05, "loss": 0.134, "step": 69150 }, { "epoch": 1.3070907785878887, "grad_norm": 0.03543694689869881, "learning_rate": 6.535453892939444e-05, "loss": 0.1339, "step": 69200 }, { "epoch": 1.3080352083412037, "grad_norm": 0.03384518250823021, "learning_rate": 6.540176041706019e-05, "loss": 0.1338, "step": 69250 }, { "epoch": 1.3089796380945184, "grad_norm": 0.03803733363747597, "learning_rate": 6.544898190472593e-05, "loss": 0.134, "step": 69300 }, { "epoch": 1.3099240678478334, "grad_norm": 0.035835590213537216, "learning_rate": 6.549620339239167e-05, "loss": 0.1333, "step": 69350 }, { "epoch": 1.3108684976011484, "grad_norm": 0.03444220498204231, "learning_rate": 6.554342488005743e-05, "loss": 0.1336, "step": 69400 }, { "epoch": 1.3118129273544634, "grad_norm": 0.03497631102800369, "learning_rate": 6.559064636772318e-05, "loss": 0.1336, "step": 69450 }, { "epoch": 1.3127573571077784, "grad_norm": 0.03455602750182152, "learning_rate": 6.563786785538892e-05, "loss": 0.1338, "step": 69500 }, { "epoch": 1.3137017868610932, "grad_norm": 0.033664628863334656, "learning_rate": 6.568508934305466e-05, "loss": 0.1336, "step": 69550 }, { "epoch": 1.3146462166144082, "grad_norm": 0.03349119424819946, "learning_rate": 6.573231083072042e-05, "loss": 0.1336, "step": 69600 }, { "epoch": 1.3155906463677232, "grad_norm": 0.03598978742957115, "learning_rate": 6.577953231838616e-05, "loss": 0.1341, "step": 69650 }, { "epoch": 1.3165350761210382, "grad_norm": 0.42032289505004883, "learning_rate": 6.582675380605191e-05, "loss": 0.1344, "step": 69700 }, { "epoch": 1.3174795058743531, "grad_norm": 0.0376116968691349, "learning_rate": 6.587397529371766e-05, "loss": 0.1355, "step": 69750 }, { "epoch": 1.318423935627668, "grad_norm": 0.03604390472173691, "learning_rate": 6.59211967813834e-05, "loss": 0.1338, "step": 69800 }, { "epoch": 1.319368365380983, "grad_norm": 0.03727199137210846, "learning_rate": 6.596841826904915e-05, "loss": 0.1337, "step": 69850 }, { "epoch": 1.320312795134298, "grad_norm": 0.03215288370847702, "learning_rate": 6.60156397567149e-05, "loss": 0.1331, "step": 69900 }, { "epoch": 1.3212572248876129, "grad_norm": 0.03482881188392639, "learning_rate": 6.606286124438064e-05, "loss": 0.1337, "step": 69950 }, { "epoch": 1.3222016546409279, "grad_norm": 0.03552589192986488, "learning_rate": 6.61100827320464e-05, "loss": 0.1329, "step": 70000 }, { "epoch": 1.3222016546409279, "eval_IntDiv": 0.67519542079352, "eval_NumCircles": 1923, "eval_SumBottleneck": 142.29113465356417, "eval_Uniqueness": 0.9967246673490276, "eval_Validity": 0.977, "eval_Validity * Uniqueness": 0.9738, "eval_loss": 0.22039534151554108, "eval_runtime": 277.1656, "eval_samples_per_second": 36.08, "eval_steps_per_second": 0.285, "step": 70000 }, { "epoch": 1.3231460843942426, "grad_norm": 0.03282619267702103, "learning_rate": 6.615730421971215e-05, "loss": 0.1331, "step": 70050 }, { "epoch": 1.3240905141475576, "grad_norm": 0.03366563841700554, "learning_rate": 6.620452570737789e-05, "loss": 0.1336, "step": 70100 }, { "epoch": 1.3250349439008726, "grad_norm": 0.03516401723027229, "learning_rate": 6.625174719504363e-05, "loss": 0.1336, "step": 70150 }, { "epoch": 1.3259793736541876, "grad_norm": 0.03529908508062363, "learning_rate": 6.629896868270938e-05, "loss": 0.1331, "step": 70200 }, { "epoch": 1.3269238034075026, "grad_norm": 0.03289472311735153, "learning_rate": 6.634619017037514e-05, "loss": 0.1335, "step": 70250 }, { "epoch": 1.3278682331608174, "grad_norm": 0.03417067974805832, "learning_rate": 6.639341165804088e-05, "loss": 0.1334, "step": 70300 }, { "epoch": 1.3288126629141326, "grad_norm": 0.033571094274520874, "learning_rate": 6.644063314570662e-05, "loss": 0.1334, "step": 70350 }, { "epoch": 1.3297570926674473, "grad_norm": 0.039340294897556305, "learning_rate": 6.648785463337237e-05, "loss": 0.1337, "step": 70400 }, { "epoch": 1.3307015224207623, "grad_norm": 0.03445740044116974, "learning_rate": 6.653507612103812e-05, "loss": 0.1332, "step": 70450 }, { "epoch": 1.3316459521740773, "grad_norm": 0.03408224135637283, "learning_rate": 6.658229760870387e-05, "loss": 0.1336, "step": 70500 }, { "epoch": 1.3325903819273923, "grad_norm": 0.03327103331685066, "learning_rate": 6.662951909636962e-05, "loss": 0.1334, "step": 70550 }, { "epoch": 1.3335348116807073, "grad_norm": 0.033326584845781326, "learning_rate": 6.667674058403536e-05, "loss": 0.1331, "step": 70600 }, { "epoch": 1.334479241434022, "grad_norm": 0.034601300954818726, "learning_rate": 6.67239620717011e-05, "loss": 0.1336, "step": 70650 }, { "epoch": 1.335423671187337, "grad_norm": 0.034161221235990524, "learning_rate": 6.677118355936686e-05, "loss": 0.1334, "step": 70700 }, { "epoch": 1.336368100940652, "grad_norm": 0.034209202975034714, "learning_rate": 6.68184050470326e-05, "loss": 0.1333, "step": 70750 }, { "epoch": 1.337312530693967, "grad_norm": 0.03379014506936073, "learning_rate": 6.686562653469835e-05, "loss": 0.1337, "step": 70800 }, { "epoch": 1.338256960447282, "grad_norm": 0.03430692106485367, "learning_rate": 6.691284802236411e-05, "loss": 0.1342, "step": 70850 }, { "epoch": 1.3392013902005968, "grad_norm": 0.03594708815217018, "learning_rate": 6.696006951002985e-05, "loss": 0.1337, "step": 70900 }, { "epoch": 1.3401458199539118, "grad_norm": 0.036250047385692596, "learning_rate": 6.700729099769559e-05, "loss": 0.1335, "step": 70950 }, { "epoch": 1.3410902497072268, "grad_norm": 0.034719619899988174, "learning_rate": 6.705451248536134e-05, "loss": 0.1333, "step": 71000 }, { "epoch": 1.3420346794605418, "grad_norm": 0.035545263439416885, "learning_rate": 6.71017339730271e-05, "loss": 0.1331, "step": 71050 }, { "epoch": 1.3429791092138568, "grad_norm": 0.03359880670905113, "learning_rate": 6.714895546069284e-05, "loss": 0.1339, "step": 71100 }, { "epoch": 1.3439235389671715, "grad_norm": 0.0339946523308754, "learning_rate": 6.719617694835858e-05, "loss": 0.1332, "step": 71150 }, { "epoch": 1.3448679687204865, "grad_norm": 0.033869463950395584, "learning_rate": 6.724339843602433e-05, "loss": 0.1336, "step": 71200 }, { "epoch": 1.3458123984738015, "grad_norm": 0.033742256462574005, "learning_rate": 6.729061992369007e-05, "loss": 0.1332, "step": 71250 }, { "epoch": 1.3467568282271165, "grad_norm": 0.032783932983875275, "learning_rate": 6.733784141135583e-05, "loss": 0.1333, "step": 71300 }, { "epoch": 1.3477012579804315, "grad_norm": 0.03557303547859192, "learning_rate": 6.738506289902158e-05, "loss": 0.1334, "step": 71350 }, { "epoch": 1.3486456877337463, "grad_norm": 0.03392179310321808, "learning_rate": 6.743228438668732e-05, "loss": 0.134, "step": 71400 }, { "epoch": 1.3495901174870613, "grad_norm": 0.0351148284971714, "learning_rate": 6.747950587435306e-05, "loss": 0.1331, "step": 71450 }, { "epoch": 1.3505345472403762, "grad_norm": 0.03509382903575897, "learning_rate": 6.752672736201882e-05, "loss": 0.133, "step": 71500 }, { "epoch": 1.3514789769936912, "grad_norm": 0.035408128052949905, "learning_rate": 6.757394884968457e-05, "loss": 0.1336, "step": 71550 }, { "epoch": 1.3524234067470062, "grad_norm": 0.03401173651218414, "learning_rate": 6.762117033735031e-05, "loss": 0.1336, "step": 71600 }, { "epoch": 1.353367836500321, "grad_norm": 0.03609152510762215, "learning_rate": 6.766839182501605e-05, "loss": 0.1333, "step": 71650 }, { "epoch": 1.354312266253636, "grad_norm": 0.03514854609966278, "learning_rate": 6.771561331268181e-05, "loss": 0.1336, "step": 71700 }, { "epoch": 1.355256696006951, "grad_norm": 0.03462997078895569, "learning_rate": 6.776283480034755e-05, "loss": 0.1332, "step": 71750 }, { "epoch": 1.356201125760266, "grad_norm": 0.035922423005104065, "learning_rate": 6.78100562880133e-05, "loss": 0.1333, "step": 71800 }, { "epoch": 1.357145555513581, "grad_norm": 0.03538636118173599, "learning_rate": 6.785727777567906e-05, "loss": 0.1331, "step": 71850 }, { "epoch": 1.3580899852668957, "grad_norm": 0.03371267393231392, "learning_rate": 6.79044992633448e-05, "loss": 0.133, "step": 71900 }, { "epoch": 1.3590344150202107, "grad_norm": 0.032313913106918335, "learning_rate": 6.795172075101054e-05, "loss": 0.1333, "step": 71950 }, { "epoch": 1.3599788447735257, "grad_norm": 0.03395611420273781, "learning_rate": 6.799894223867629e-05, "loss": 0.1328, "step": 72000 }, { "epoch": 1.3609232745268407, "grad_norm": 0.03396817296743393, "learning_rate": 6.804616372634203e-05, "loss": 0.1331, "step": 72050 }, { "epoch": 1.3618677042801557, "grad_norm": 0.03426605835556984, "learning_rate": 6.809338521400779e-05, "loss": 0.133, "step": 72100 }, { "epoch": 1.3628121340334705, "grad_norm": 0.03270237520337105, "learning_rate": 6.814060670167354e-05, "loss": 0.1332, "step": 72150 }, { "epoch": 1.3637565637867857, "grad_norm": 0.032416775822639465, "learning_rate": 6.818782818933928e-05, "loss": 0.1335, "step": 72200 }, { "epoch": 1.3647009935401004, "grad_norm": 0.033386580646038055, "learning_rate": 6.823504967700502e-05, "loss": 0.1329, "step": 72250 }, { "epoch": 1.3656454232934154, "grad_norm": 0.03782765194773674, "learning_rate": 6.828227116467078e-05, "loss": 0.133, "step": 72300 }, { "epoch": 1.3665898530467304, "grad_norm": 0.03531458601355553, "learning_rate": 6.832949265233653e-05, "loss": 0.1328, "step": 72350 }, { "epoch": 1.3675342828000454, "grad_norm": 0.03450023755431175, "learning_rate": 6.837671414000227e-05, "loss": 0.1332, "step": 72400 }, { "epoch": 1.3684787125533604, "grad_norm": 0.034696612507104874, "learning_rate": 6.842393562766801e-05, "loss": 0.1327, "step": 72450 }, { "epoch": 1.3694231423066752, "grad_norm": 0.043067049235105515, "learning_rate": 6.847115711533377e-05, "loss": 0.1332, "step": 72500 }, { "epoch": 1.3694231423066752, "eval_IntDiv": 0.676494540569192, "eval_NumCircles": 1900, "eval_SumBottleneck": 142.88537552443597, "eval_Uniqueness": 0.9973368841544608, "eval_Validity": 0.9763, "eval_Validity * Uniqueness": 0.9737, "eval_loss": 0.22205394506454468, "eval_runtime": 140.0051, "eval_samples_per_second": 71.426, "eval_steps_per_second": 0.564, "step": 72500 }, { "epoch": 1.3703675720599902, "grad_norm": 0.034007906913757324, "learning_rate": 6.851837860299951e-05, "loss": 0.1335, "step": 72550 }, { "epoch": 1.3713120018133051, "grad_norm": 0.03439343720674515, "learning_rate": 6.856560009066526e-05, "loss": 0.1328, "step": 72600 }, { "epoch": 1.3722564315666201, "grad_norm": 0.033956434577703476, "learning_rate": 6.861282157833102e-05, "loss": 0.1333, "step": 72650 }, { "epoch": 1.3732008613199351, "grad_norm": 0.03357469290494919, "learning_rate": 6.866004306599676e-05, "loss": 0.133, "step": 72700 }, { "epoch": 1.37414529107325, "grad_norm": 0.039847858250141144, "learning_rate": 6.87072645536625e-05, "loss": 0.1333, "step": 72750 }, { "epoch": 1.3750897208265649, "grad_norm": 0.03332245722413063, "learning_rate": 6.875448604132825e-05, "loss": 0.1328, "step": 72800 }, { "epoch": 1.3760341505798799, "grad_norm": 0.04137296602129936, "learning_rate": 6.880170752899399e-05, "loss": 0.1331, "step": 72850 }, { "epoch": 1.3769785803331949, "grad_norm": 0.035060543566942215, "learning_rate": 6.884892901665975e-05, "loss": 0.1332, "step": 72900 }, { "epoch": 1.3779230100865099, "grad_norm": 0.0341663733124733, "learning_rate": 6.88961505043255e-05, "loss": 0.1332, "step": 72950 }, { "epoch": 1.3788674398398246, "grad_norm": 0.04012038931250572, "learning_rate": 6.894337199199124e-05, "loss": 0.1328, "step": 73000 }, { "epoch": 1.3798118695931396, "grad_norm": 0.03443482518196106, "learning_rate": 6.899059347965698e-05, "loss": 0.1328, "step": 73050 }, { "epoch": 1.3807562993464546, "grad_norm": 0.034876659512519836, "learning_rate": 6.903781496732274e-05, "loss": 0.1331, "step": 73100 }, { "epoch": 1.3817007290997696, "grad_norm": 0.032676562666893005, "learning_rate": 6.908503645498849e-05, "loss": 0.1331, "step": 73150 }, { "epoch": 1.3826451588530846, "grad_norm": 0.03612913936376572, "learning_rate": 6.913225794265423e-05, "loss": 0.1331, "step": 73200 }, { "epoch": 1.3835895886063994, "grad_norm": 0.04051138460636139, "learning_rate": 6.917947943031997e-05, "loss": 0.1329, "step": 73250 }, { "epoch": 1.3845340183597143, "grad_norm": 0.03663019463419914, "learning_rate": 6.922670091798573e-05, "loss": 0.1329, "step": 73300 }, { "epoch": 1.3854784481130293, "grad_norm": 0.03480885177850723, "learning_rate": 6.927392240565147e-05, "loss": 0.1331, "step": 73350 }, { "epoch": 1.3864228778663443, "grad_norm": 0.03280779719352722, "learning_rate": 6.932114389331722e-05, "loss": 0.1334, "step": 73400 }, { "epoch": 1.3873673076196593, "grad_norm": 0.03692568466067314, "learning_rate": 6.936836538098297e-05, "loss": 0.1329, "step": 73450 }, { "epoch": 1.388311737372974, "grad_norm": 0.03707757219672203, "learning_rate": 6.941558686864871e-05, "loss": 0.133, "step": 73500 }, { "epoch": 1.389256167126289, "grad_norm": 0.03541959449648857, "learning_rate": 6.946280835631446e-05, "loss": 0.1331, "step": 73550 }, { "epoch": 1.390200596879604, "grad_norm": 0.03464554622769356, "learning_rate": 6.951002984398021e-05, "loss": 0.133, "step": 73600 }, { "epoch": 1.391145026632919, "grad_norm": 0.03536507859826088, "learning_rate": 6.955725133164595e-05, "loss": 0.1329, "step": 73650 }, { "epoch": 1.392089456386234, "grad_norm": 0.03280951455235481, "learning_rate": 6.96044728193117e-05, "loss": 0.1331, "step": 73700 }, { "epoch": 1.3930338861395488, "grad_norm": 0.03497319668531418, "learning_rate": 6.965169430697746e-05, "loss": 0.133, "step": 73750 }, { "epoch": 1.3939783158928638, "grad_norm": 0.03440965339541435, "learning_rate": 6.96989157946432e-05, "loss": 0.1331, "step": 73800 }, { "epoch": 1.3949227456461788, "grad_norm": 0.034885652363300323, "learning_rate": 6.974613728230894e-05, "loss": 0.1329, "step": 73850 }, { "epoch": 1.3958671753994938, "grad_norm": 0.035261351615190506, "learning_rate": 6.97933587699747e-05, "loss": 0.133, "step": 73900 }, { "epoch": 1.3968116051528088, "grad_norm": 0.03425212949514389, "learning_rate": 6.984058025764045e-05, "loss": 0.1327, "step": 73950 }, { "epoch": 1.3977560349061235, "grad_norm": 0.0337461419403553, "learning_rate": 6.988780174530619e-05, "loss": 0.1331, "step": 74000 }, { "epoch": 1.3987004646594388, "grad_norm": 0.034281451255083084, "learning_rate": 6.993502323297193e-05, "loss": 0.1329, "step": 74050 }, { "epoch": 1.3996448944127535, "grad_norm": 0.03384193778038025, "learning_rate": 6.998224472063768e-05, "loss": 0.1329, "step": 74100 }, { "epoch": 1.4005893241660685, "grad_norm": 0.03631910681724548, "learning_rate": 7.002946620830342e-05, "loss": 0.1323, "step": 74150 }, { "epoch": 1.4015337539193835, "grad_norm": 0.03432370722293854, "learning_rate": 7.007668769596918e-05, "loss": 0.1325, "step": 74200 }, { "epoch": 1.4024781836726985, "grad_norm": 0.03377067670226097, "learning_rate": 7.012390918363493e-05, "loss": 0.133, "step": 74250 }, { "epoch": 1.4034226134260135, "grad_norm": 0.0356762669980526, "learning_rate": 7.017113067130066e-05, "loss": 0.1328, "step": 74300 }, { "epoch": 1.4043670431793283, "grad_norm": 0.03509431704878807, "learning_rate": 7.021835215896641e-05, "loss": 0.1332, "step": 74350 }, { "epoch": 1.4053114729326432, "grad_norm": 0.034540463238954544, "learning_rate": 7.026557364663217e-05, "loss": 0.1325, "step": 74400 }, { "epoch": 1.4062559026859582, "grad_norm": 0.034034885466098785, "learning_rate": 7.031279513429791e-05, "loss": 0.1324, "step": 74450 }, { "epoch": 1.4072003324392732, "grad_norm": 0.034395016729831696, "learning_rate": 7.036001662196366e-05, "loss": 0.133, "step": 74500 }, { "epoch": 1.4081447621925882, "grad_norm": 0.0347941629588604, "learning_rate": 7.040723810962942e-05, "loss": 0.133, "step": 74550 }, { "epoch": 1.409089191945903, "grad_norm": 0.03411555290222168, "learning_rate": 7.045445959729516e-05, "loss": 0.1327, "step": 74600 }, { "epoch": 1.410033621699218, "grad_norm": 0.03434965759515762, "learning_rate": 7.05016810849609e-05, "loss": 0.1331, "step": 74650 }, { "epoch": 1.410978051452533, "grad_norm": 0.03667130321264267, "learning_rate": 7.054890257262665e-05, "loss": 0.1329, "step": 74700 }, { "epoch": 1.411922481205848, "grad_norm": 0.033231839537620544, "learning_rate": 7.059612406029241e-05, "loss": 0.1323, "step": 74750 }, { "epoch": 1.412866910959163, "grad_norm": 0.034749679267406464, "learning_rate": 7.064334554795815e-05, "loss": 0.1322, "step": 74800 }, { "epoch": 1.4138113407124777, "grad_norm": 0.03245394304394722, "learning_rate": 7.069056703562389e-05, "loss": 0.1329, "step": 74850 }, { "epoch": 1.4147557704657927, "grad_norm": 0.03446292504668236, "learning_rate": 7.073778852328964e-05, "loss": 0.1322, "step": 74900 }, { "epoch": 1.4157002002191077, "grad_norm": 0.03431730717420578, "learning_rate": 7.078501001095538e-05, "loss": 0.1326, "step": 74950 }, { "epoch": 1.4166446299724227, "grad_norm": 0.03592977672815323, "learning_rate": 7.083223149862114e-05, "loss": 0.1326, "step": 75000 }, { "epoch": 1.4166446299724227, "eval_IntDiv": 0.6736000487936087, "eval_NumCircles": 1862, "eval_SumBottleneck": 77.61507982887105, "eval_Uniqueness": 0.9965156794425087, "eval_Validity": 0.9758, "eval_Validity * Uniqueness": 0.9724, "eval_loss": 0.22631944715976715, "eval_runtime": 147.2208, "eval_samples_per_second": 67.925, "eval_steps_per_second": 0.537, "step": 75000 }, { "epoch": 1.4175890597257377, "grad_norm": 0.03518577292561531, "learning_rate": 7.087945298628689e-05, "loss": 0.1324, "step": 75050 }, { "epoch": 1.4185334894790524, "grad_norm": 0.03463682904839516, "learning_rate": 7.092667447395263e-05, "loss": 0.1329, "step": 75100 }, { "epoch": 1.4194779192323674, "grad_norm": 0.03702183812856674, "learning_rate": 7.097389596161837e-05, "loss": 0.1323, "step": 75150 }, { "epoch": 1.4204223489856824, "grad_norm": 0.034911446273326874, "learning_rate": 7.102111744928413e-05, "loss": 0.1324, "step": 75200 }, { "epoch": 1.4213667787389974, "grad_norm": 0.03381296619772911, "learning_rate": 7.106833893694987e-05, "loss": 0.1327, "step": 75250 }, { "epoch": 1.4223112084923124, "grad_norm": 0.03386329859495163, "learning_rate": 7.111556042461562e-05, "loss": 0.1327, "step": 75300 }, { "epoch": 1.4232556382456272, "grad_norm": 0.03465632349252701, "learning_rate": 7.116278191228138e-05, "loss": 0.1324, "step": 75350 }, { "epoch": 1.4242000679989422, "grad_norm": 0.036048926413059235, "learning_rate": 7.121000339994712e-05, "loss": 0.1324, "step": 75400 }, { "epoch": 1.4251444977522572, "grad_norm": 0.035686787217855453, "learning_rate": 7.125722488761286e-05, "loss": 0.1332, "step": 75450 }, { "epoch": 1.4260889275055721, "grad_norm": 0.033613305538892746, "learning_rate": 7.130444637527861e-05, "loss": 0.1327, "step": 75500 }, { "epoch": 1.4270333572588871, "grad_norm": 0.03671993687748909, "learning_rate": 7.135166786294437e-05, "loss": 0.1323, "step": 75550 }, { "epoch": 1.427977787012202, "grad_norm": 0.03528023883700371, "learning_rate": 7.13988893506101e-05, "loss": 0.1325, "step": 75600 }, { "epoch": 1.4289222167655171, "grad_norm": 0.03428101912140846, "learning_rate": 7.144611083827585e-05, "loss": 0.1321, "step": 75650 }, { "epoch": 1.4298666465188319, "grad_norm": 0.03439638018608093, "learning_rate": 7.14933323259416e-05, "loss": 0.1325, "step": 75700 }, { "epoch": 1.4308110762721469, "grad_norm": 0.035197000950574875, "learning_rate": 7.154055381360734e-05, "loss": 0.1325, "step": 75750 }, { "epoch": 1.4317555060254619, "grad_norm": 0.03388930857181549, "learning_rate": 7.15877753012731e-05, "loss": 0.1325, "step": 75800 }, { "epoch": 1.4326999357787769, "grad_norm": 0.034449998289346695, "learning_rate": 7.163499678893885e-05, "loss": 0.1322, "step": 75850 }, { "epoch": 1.4336443655320918, "grad_norm": 0.03624069318175316, "learning_rate": 7.168221827660459e-05, "loss": 0.1326, "step": 75900 }, { "epoch": 1.4345887952854066, "grad_norm": 0.03166576847434044, "learning_rate": 7.172943976427033e-05, "loss": 0.1325, "step": 75950 }, { "epoch": 1.4355332250387216, "grad_norm": 0.035211898386478424, "learning_rate": 7.177666125193609e-05, "loss": 0.1322, "step": 76000 }, { "epoch": 1.4364776547920366, "grad_norm": 0.03359732776880264, "learning_rate": 7.182388273960183e-05, "loss": 0.132, "step": 76050 }, { "epoch": 1.4374220845453516, "grad_norm": 0.03383719176054001, "learning_rate": 7.187110422726758e-05, "loss": 0.1323, "step": 76100 }, { "epoch": 1.4383665142986666, "grad_norm": 0.03474825993180275, "learning_rate": 7.191832571493332e-05, "loss": 0.1324, "step": 76150 }, { "epoch": 1.4393109440519813, "grad_norm": 0.03253985196352005, "learning_rate": 7.196554720259908e-05, "loss": 0.1321, "step": 76200 }, { "epoch": 1.4402553738052963, "grad_norm": 0.032670989632606506, "learning_rate": 7.201276869026482e-05, "loss": 0.1326, "step": 76250 }, { "epoch": 1.4411998035586113, "grad_norm": 0.033352483063936234, "learning_rate": 7.205999017793057e-05, "loss": 0.1323, "step": 76300 }, { "epoch": 1.4421442333119263, "grad_norm": 0.03328699246048927, "learning_rate": 7.210721166559632e-05, "loss": 0.1321, "step": 76350 }, { "epoch": 1.4430886630652413, "grad_norm": 0.033805493265390396, "learning_rate": 7.215443315326207e-05, "loss": 0.1322, "step": 76400 }, { "epoch": 1.444033092818556, "grad_norm": 0.035134922713041306, "learning_rate": 7.22016546409278e-05, "loss": 0.1319, "step": 76450 }, { "epoch": 1.444977522571871, "grad_norm": 0.03315921127796173, "learning_rate": 7.224887612859356e-05, "loss": 0.1324, "step": 76500 }, { "epoch": 1.445921952325186, "grad_norm": 0.03680766001343727, "learning_rate": 7.22960976162593e-05, "loss": 0.1321, "step": 76550 }, { "epoch": 1.446866382078501, "grad_norm": 0.03309629485011101, "learning_rate": 7.234331910392506e-05, "loss": 0.1324, "step": 76600 }, { "epoch": 1.447810811831816, "grad_norm": 0.03200734779238701, "learning_rate": 7.239054059159081e-05, "loss": 0.1322, "step": 76650 }, { "epoch": 1.4487552415851308, "grad_norm": 0.03358408063650131, "learning_rate": 7.243776207925655e-05, "loss": 0.1323, "step": 76700 }, { "epoch": 1.4496996713384458, "grad_norm": 0.0359036922454834, "learning_rate": 7.248498356692229e-05, "loss": 0.1323, "step": 76750 }, { "epoch": 1.4506441010917608, "grad_norm": 0.03324960172176361, "learning_rate": 7.253220505458804e-05, "loss": 0.1322, "step": 76800 }, { "epoch": 1.4515885308450758, "grad_norm": 0.03278156742453575, "learning_rate": 7.25794265422538e-05, "loss": 0.1318, "step": 76850 }, { "epoch": 1.4525329605983908, "grad_norm": 0.03501201793551445, "learning_rate": 7.262664802991954e-05, "loss": 0.1325, "step": 76900 }, { "epoch": 1.4534773903517055, "grad_norm": 0.033691663295030594, "learning_rate": 7.267386951758528e-05, "loss": 0.1321, "step": 76950 }, { "epoch": 1.4544218201050205, "grad_norm": 0.03405901417136192, "learning_rate": 7.272109100525103e-05, "loss": 0.1321, "step": 77000 }, { "epoch": 1.4553662498583355, "grad_norm": 0.034583427011966705, "learning_rate": 7.276831249291678e-05, "loss": 0.1324, "step": 77050 }, { "epoch": 1.4563106796116505, "grad_norm": 0.03459625318646431, "learning_rate": 7.281553398058253e-05, "loss": 0.1322, "step": 77100 }, { "epoch": 1.4572551093649655, "grad_norm": 0.03232525661587715, "learning_rate": 7.286275546824828e-05, "loss": 0.1322, "step": 77150 }, { "epoch": 1.4581995391182803, "grad_norm": 0.03223764896392822, "learning_rate": 7.290997695591402e-05, "loss": 0.1322, "step": 77200 }, { "epoch": 1.4591439688715953, "grad_norm": 0.03403366729617119, "learning_rate": 7.295719844357976e-05, "loss": 0.1326, "step": 77250 }, { "epoch": 1.4600883986249102, "grad_norm": 0.036456577479839325, "learning_rate": 7.300441993124552e-05, "loss": 0.1321, "step": 77300 }, { "epoch": 1.4610328283782252, "grad_norm": 0.03237883746623993, "learning_rate": 7.305164141891126e-05, "loss": 0.1327, "step": 77350 }, { "epoch": 1.4619772581315402, "grad_norm": 0.036743853241205215, "learning_rate": 7.309886290657701e-05, "loss": 0.1325, "step": 77400 }, { "epoch": 1.462921687884855, "grad_norm": 0.03302630037069321, "learning_rate": 7.314608439424277e-05, "loss": 0.132, "step": 77450 }, { "epoch": 1.4638661176381702, "grad_norm": 0.03390515595674515, "learning_rate": 7.319330588190851e-05, "loss": 0.1324, "step": 77500 }, { "epoch": 1.4638661176381702, "eval_IntDiv": 0.6743218384576104, "eval_NumCircles": 1851, "eval_SumBottleneck": 36.877627315070505, "eval_Uniqueness": 0.996241365298659, "eval_Validity": 0.9844, "eval_Validity * Uniqueness": 0.9807, "eval_loss": 0.22141359746456146, "eval_runtime": 155.7748, "eval_samples_per_second": 64.195, "eval_steps_per_second": 0.507, "step": 77500 }, { "epoch": 1.464810547391485, "grad_norm": 0.0346698984503746, "learning_rate": 7.324052736957425e-05, "loss": 0.1321, "step": 77550 }, { "epoch": 1.4657549771448, "grad_norm": 0.03332211449742317, "learning_rate": 7.328774885724e-05, "loss": 0.1319, "step": 77600 }, { "epoch": 1.466699406898115, "grad_norm": 0.03290266916155815, "learning_rate": 7.333497034490576e-05, "loss": 0.1325, "step": 77650 }, { "epoch": 1.46764383665143, "grad_norm": 0.034149616956710815, "learning_rate": 7.33821918325715e-05, "loss": 0.1325, "step": 77700 }, { "epoch": 1.468588266404745, "grad_norm": 0.032040782272815704, "learning_rate": 7.342941332023724e-05, "loss": 0.1319, "step": 77750 }, { "epoch": 1.4695326961580597, "grad_norm": 0.03240228444337845, "learning_rate": 7.3476634807903e-05, "loss": 0.1324, "step": 77800 }, { "epoch": 1.4704771259113747, "grad_norm": 0.033992256969213486, "learning_rate": 7.352385629556873e-05, "loss": 0.1321, "step": 77850 }, { "epoch": 1.4714215556646897, "grad_norm": 0.03453810140490532, "learning_rate": 7.357107778323449e-05, "loss": 0.1321, "step": 77900 }, { "epoch": 1.4723659854180047, "grad_norm": 0.033222541213035583, "learning_rate": 7.361829927090024e-05, "loss": 0.1319, "step": 77950 }, { "epoch": 1.4733104151713197, "grad_norm": 0.03460194543004036, "learning_rate": 7.366552075856598e-05, "loss": 0.132, "step": 78000 }, { "epoch": 1.4742548449246344, "grad_norm": 0.03799467161297798, "learning_rate": 7.371274224623172e-05, "loss": 0.1318, "step": 78050 }, { "epoch": 1.4751992746779494, "grad_norm": 0.035394489765167236, "learning_rate": 7.375996373389748e-05, "loss": 0.1328, "step": 78100 }, { "epoch": 1.4761437044312644, "grad_norm": 0.033741071820259094, "learning_rate": 7.380718522156322e-05, "loss": 0.1319, "step": 78150 }, { "epoch": 1.4770881341845794, "grad_norm": 0.033882446587085724, "learning_rate": 7.385440670922897e-05, "loss": 0.132, "step": 78200 }, { "epoch": 1.4780325639378944, "grad_norm": 0.03537466377019882, "learning_rate": 7.390162819689473e-05, "loss": 0.1321, "step": 78250 }, { "epoch": 1.4789769936912092, "grad_norm": 0.0343627855181694, "learning_rate": 7.394884968456047e-05, "loss": 0.1324, "step": 78300 }, { "epoch": 1.4799214234445242, "grad_norm": 0.03351946175098419, "learning_rate": 7.399607117222621e-05, "loss": 0.1313, "step": 78350 }, { "epoch": 1.4808658531978391, "grad_norm": 0.03741621598601341, "learning_rate": 7.404329265989196e-05, "loss": 0.1317, "step": 78400 }, { "epoch": 1.4818102829511541, "grad_norm": 0.03769581764936447, "learning_rate": 7.409051414755772e-05, "loss": 0.1321, "step": 78450 }, { "epoch": 1.4827547127044691, "grad_norm": 0.03300439566373825, "learning_rate": 7.413773563522346e-05, "loss": 0.1321, "step": 78500 }, { "epoch": 1.483699142457784, "grad_norm": 0.03384901210665703, "learning_rate": 7.41849571228892e-05, "loss": 0.1315, "step": 78550 }, { "epoch": 1.4846435722110989, "grad_norm": 0.03297720476984978, "learning_rate": 7.423217861055495e-05, "loss": 0.1321, "step": 78600 }, { "epoch": 1.4855880019644139, "grad_norm": 0.03326956182718277, "learning_rate": 7.427940009822069e-05, "loss": 0.1316, "step": 78650 }, { "epoch": 1.4865324317177289, "grad_norm": 0.046929981559515, "learning_rate": 7.432662158588645e-05, "loss": 0.1315, "step": 78700 }, { "epoch": 1.4874768614710439, "grad_norm": 0.03320509195327759, "learning_rate": 7.43738430735522e-05, "loss": 0.1318, "step": 78750 }, { "epoch": 1.4884212912243586, "grad_norm": 0.03342399001121521, "learning_rate": 7.442106456121793e-05, "loss": 0.1317, "step": 78800 }, { "epoch": 1.4893657209776736, "grad_norm": 0.03403449431061745, "learning_rate": 7.446828604888368e-05, "loss": 0.1316, "step": 78850 }, { "epoch": 1.4903101507309886, "grad_norm": 0.03532489016652107, "learning_rate": 7.451550753654944e-05, "loss": 0.1318, "step": 78900 }, { "epoch": 1.4912545804843036, "grad_norm": 0.03524802625179291, "learning_rate": 7.456272902421518e-05, "loss": 0.1321, "step": 78950 }, { "epoch": 1.4921990102376186, "grad_norm": 0.033044058829545975, "learning_rate": 7.460995051188093e-05, "loss": 0.1322, "step": 79000 }, { "epoch": 1.4931434399909334, "grad_norm": 0.03615684062242508, "learning_rate": 7.465717199954669e-05, "loss": 0.1315, "step": 79050 }, { "epoch": 1.4940878697442483, "grad_norm": 0.03450670465826988, "learning_rate": 7.470439348721243e-05, "loss": 0.1318, "step": 79100 }, { "epoch": 1.4950322994975633, "grad_norm": 0.03247403725981712, "learning_rate": 7.475161497487817e-05, "loss": 0.1319, "step": 79150 }, { "epoch": 1.4959767292508783, "grad_norm": 0.03302856907248497, "learning_rate": 7.479883646254392e-05, "loss": 0.1322, "step": 79200 }, { "epoch": 1.4969211590041933, "grad_norm": 0.03398624435067177, "learning_rate": 7.484605795020968e-05, "loss": 0.1318, "step": 79250 }, { "epoch": 1.497865588757508, "grad_norm": 0.04421595111489296, "learning_rate": 7.489327943787542e-05, "loss": 0.1319, "step": 79300 }, { "epoch": 1.4988100185108233, "grad_norm": 0.033207375556230545, "learning_rate": 7.494050092554116e-05, "loss": 0.1317, "step": 79350 }, { "epoch": 1.499754448264138, "grad_norm": 0.03270217776298523, "learning_rate": 7.498772241320691e-05, "loss": 0.1316, "step": 79400 }, { "epoch": 1.500698878017453, "grad_norm": 0.03329164907336235, "learning_rate": 7.503494390087265e-05, "loss": 0.1318, "step": 79450 }, { "epoch": 1.501643307770768, "grad_norm": 0.035060182213783264, "learning_rate": 7.50821653885384e-05, "loss": 0.1321, "step": 79500 }, { "epoch": 1.5025877375240828, "grad_norm": 0.03220762684941292, "learning_rate": 7.512938687620416e-05, "loss": 0.1321, "step": 79550 }, { "epoch": 1.503532167277398, "grad_norm": 0.03359417989850044, "learning_rate": 7.517660836386989e-05, "loss": 0.1313, "step": 79600 }, { "epoch": 1.5044765970307128, "grad_norm": 0.03320552408695221, "learning_rate": 7.522382985153564e-05, "loss": 0.1317, "step": 79650 }, { "epoch": 1.5054210267840278, "grad_norm": 0.033667005598545074, "learning_rate": 7.52710513392014e-05, "loss": 0.1318, "step": 79700 }, { "epoch": 1.5063654565373428, "grad_norm": 0.03311780095100403, "learning_rate": 7.531827282686714e-05, "loss": 0.1315, "step": 79750 }, { "epoch": 1.5073098862906575, "grad_norm": 0.03523420915007591, "learning_rate": 7.536549431453289e-05, "loss": 0.1316, "step": 79800 }, { "epoch": 1.5082543160439728, "grad_norm": 0.03257552161812782, "learning_rate": 7.541271580219864e-05, "loss": 0.1321, "step": 79850 }, { "epoch": 1.5091987457972875, "grad_norm": 0.03278305381536484, "learning_rate": 7.545993728986439e-05, "loss": 0.132, "step": 79900 }, { "epoch": 1.5101431755506025, "grad_norm": 0.03307291120290756, "learning_rate": 7.550715877753013e-05, "loss": 0.1317, "step": 79950 }, { "epoch": 1.5110876053039175, "grad_norm": 0.03285872936248779, "learning_rate": 7.555438026519588e-05, "loss": 0.1316, "step": 80000 }, { "epoch": 1.5110876053039175, "eval_IntDiv": 0.67635870138015, "eval_NumCircles": 1907, "eval_SumBottleneck": 110.69378211839536, "eval_Uniqueness": 0.9977592177632919, "eval_Validity": 0.9818, "eval_Validity * Uniqueness": 0.9796, "eval_loss": 0.22132526338100433, "eval_runtime": 382.3192, "eval_samples_per_second": 26.156, "eval_steps_per_second": 0.207, "step": 80000 }, { "epoch": 1.5120320350572325, "grad_norm": 0.03208912909030914, "learning_rate": 7.560160175286163e-05, "loss": 0.1317, "step": 80050 }, { "epoch": 1.5129764648105475, "grad_norm": 0.033077530562877655, "learning_rate": 7.564882324052737e-05, "loss": 0.132, "step": 80100 }, { "epoch": 1.5139208945638623, "grad_norm": 0.033878978341817856, "learning_rate": 7.569604472819312e-05, "loss": 0.1316, "step": 80150 }, { "epoch": 1.5148653243171772, "grad_norm": 0.03354906663298607, "learning_rate": 7.574326621585887e-05, "loss": 0.1312, "step": 80200 }, { "epoch": 1.5158097540704922, "grad_norm": 0.03632081300020218, "learning_rate": 7.579048770352461e-05, "loss": 0.1318, "step": 80250 }, { "epoch": 1.5167541838238072, "grad_norm": 0.036365482956171036, "learning_rate": 7.583770919119036e-05, "loss": 0.1318, "step": 80300 }, { "epoch": 1.5176986135771222, "grad_norm": 0.03166661411523819, "learning_rate": 7.588493067885612e-05, "loss": 0.1314, "step": 80350 }, { "epoch": 1.518643043330437, "grad_norm": 0.03378362953662872, "learning_rate": 7.593215216652186e-05, "loss": 0.1317, "step": 80400 }, { "epoch": 1.5195874730837522, "grad_norm": 0.06077829748392105, "learning_rate": 7.59793736541876e-05, "loss": 0.1313, "step": 80450 }, { "epoch": 1.520531902837067, "grad_norm": 0.03321153670549393, "learning_rate": 7.602659514185335e-05, "loss": 0.1315, "step": 80500 }, { "epoch": 1.521476332590382, "grad_norm": 0.031411606818437576, "learning_rate": 7.60738166295191e-05, "loss": 0.1317, "step": 80550 }, { "epoch": 1.522420762343697, "grad_norm": 0.03172076866030693, "learning_rate": 7.612103811718485e-05, "loss": 0.1314, "step": 80600 }, { "epoch": 1.5233651920970117, "grad_norm": 0.03327244520187378, "learning_rate": 7.61682596048506e-05, "loss": 0.1319, "step": 80650 }, { "epoch": 1.524309621850327, "grad_norm": 0.032992202788591385, "learning_rate": 7.621548109251634e-05, "loss": 0.1314, "step": 80700 }, { "epoch": 1.5252540516036417, "grad_norm": 0.03182346373796463, "learning_rate": 7.626270258018208e-05, "loss": 0.1315, "step": 80750 }, { "epoch": 1.5261984813569567, "grad_norm": 0.03239559009671211, "learning_rate": 7.630992406784784e-05, "loss": 0.1312, "step": 80800 }, { "epoch": 1.5271429111102717, "grad_norm": 0.03269616514444351, "learning_rate": 7.635714555551359e-05, "loss": 0.1316, "step": 80850 }, { "epoch": 1.5280873408635864, "grad_norm": 0.03241470828652382, "learning_rate": 7.640436704317933e-05, "loss": 0.1311, "step": 80900 }, { "epoch": 1.5290317706169017, "grad_norm": 0.033959608525037766, "learning_rate": 7.645158853084507e-05, "loss": 0.1316, "step": 80950 }, { "epoch": 1.5299762003702164, "grad_norm": 0.038958996534347534, "learning_rate": 7.649881001851083e-05, "loss": 0.1313, "step": 81000 }, { "epoch": 1.5309206301235314, "grad_norm": 0.03411746025085449, "learning_rate": 7.654603150617657e-05, "loss": 0.1321, "step": 81050 }, { "epoch": 1.5318650598768464, "grad_norm": 0.03489353880286217, "learning_rate": 7.659325299384232e-05, "loss": 0.1315, "step": 81100 }, { "epoch": 1.5328094896301612, "grad_norm": 0.035584256052970886, "learning_rate": 7.664047448150808e-05, "loss": 0.1317, "step": 81150 }, { "epoch": 1.5337539193834764, "grad_norm": 0.03375415503978729, "learning_rate": 7.668769596917382e-05, "loss": 0.1311, "step": 81200 }, { "epoch": 1.5346983491367912, "grad_norm": 0.03370421752333641, "learning_rate": 7.673491745683956e-05, "loss": 0.1317, "step": 81250 }, { "epoch": 1.5356427788901061, "grad_norm": 0.03473379835486412, "learning_rate": 7.678213894450531e-05, "loss": 0.1313, "step": 81300 }, { "epoch": 1.5365872086434211, "grad_norm": 0.03384014591574669, "learning_rate": 7.682936043217105e-05, "loss": 0.131, "step": 81350 }, { "epoch": 1.537531638396736, "grad_norm": 0.033823199570178986, "learning_rate": 7.687658191983681e-05, "loss": 0.1318, "step": 81400 }, { "epoch": 1.5384760681500511, "grad_norm": 0.0359630286693573, "learning_rate": 7.692380340750255e-05, "loss": 0.1311, "step": 81450 }, { "epoch": 1.5394204979033659, "grad_norm": 0.0333484411239624, "learning_rate": 7.69710248951683e-05, "loss": 0.1312, "step": 81500 }, { "epoch": 1.5403649276566809, "grad_norm": 0.032448187470436096, "learning_rate": 7.701824638283404e-05, "loss": 0.1312, "step": 81550 }, { "epoch": 1.5413093574099959, "grad_norm": 0.032805878669023514, "learning_rate": 7.70654678704998e-05, "loss": 0.1316, "step": 81600 }, { "epoch": 1.5422537871633106, "grad_norm": 0.03641144558787346, "learning_rate": 7.711268935816555e-05, "loss": 0.1312, "step": 81650 }, { "epoch": 1.5431982169166258, "grad_norm": 0.033019449561834335, "learning_rate": 7.715991084583129e-05, "loss": 0.1313, "step": 81700 }, { "epoch": 1.5441426466699406, "grad_norm": 0.03241269290447235, "learning_rate": 7.720713233349703e-05, "loss": 0.1312, "step": 81750 }, { "epoch": 1.5450870764232556, "grad_norm": 0.03255240619182587, "learning_rate": 7.725435382116279e-05, "loss": 0.1314, "step": 81800 }, { "epoch": 1.5460315061765706, "grad_norm": 0.03456416353583336, "learning_rate": 7.730157530882853e-05, "loss": 0.1317, "step": 81850 }, { "epoch": 1.5469759359298856, "grad_norm": 0.0323290154337883, "learning_rate": 7.734879679649428e-05, "loss": 0.1315, "step": 81900 }, { "epoch": 1.5479203656832006, "grad_norm": 0.03250962495803833, "learning_rate": 7.739601828416004e-05, "loss": 0.1313, "step": 81950 }, { "epoch": 1.5488647954365153, "grad_norm": 0.03328783065080643, "learning_rate": 7.744323977182578e-05, "loss": 0.1315, "step": 82000 }, { "epoch": 1.5498092251898303, "grad_norm": 0.03249920904636383, "learning_rate": 7.749046125949152e-05, "loss": 0.1316, "step": 82050 }, { "epoch": 1.5507536549431453, "grad_norm": 0.0327029749751091, "learning_rate": 7.753768274715727e-05, "loss": 0.1313, "step": 82100 }, { "epoch": 1.5516980846964603, "grad_norm": 0.033199869096279144, "learning_rate": 7.758490423482303e-05, "loss": 0.1314, "step": 82150 }, { "epoch": 1.5526425144497753, "grad_norm": 0.03532984480261803, "learning_rate": 7.763212572248877e-05, "loss": 0.1312, "step": 82200 }, { "epoch": 1.55358694420309, "grad_norm": 0.034524690359830856, "learning_rate": 7.767934721015451e-05, "loss": 0.1313, "step": 82250 }, { "epoch": 1.5545313739564053, "grad_norm": 0.03455452620983124, "learning_rate": 7.772656869782026e-05, "loss": 0.1317, "step": 82300 }, { "epoch": 1.55547580370972, "grad_norm": 0.03256925195455551, "learning_rate": 7.7773790185486e-05, "loss": 0.1312, "step": 82350 }, { "epoch": 1.556420233463035, "grad_norm": 0.033178482204675674, "learning_rate": 7.782101167315176e-05, "loss": 0.1312, "step": 82400 }, { "epoch": 1.55736466321635, "grad_norm": 0.034179188311100006, "learning_rate": 7.786823316081751e-05, "loss": 0.1318, "step": 82450 }, { "epoch": 1.5583090929696648, "grad_norm": 0.03321341425180435, "learning_rate": 7.791545464848325e-05, "loss": 0.131, "step": 82500 }, { "epoch": 1.5583090929696648, "eval_IntDiv": 0.6759108841462417, "eval_NumCircles": 1872, "eval_SumBottleneck": 100.34454116463725, "eval_Uniqueness": 0.9973569177594795, "eval_Validity": 0.9837, "eval_Validity * Uniqueness": 0.9811000000000001, "eval_loss": 0.2254992425441742, "eval_runtime": 179.8863, "eval_samples_per_second": 55.591, "eval_steps_per_second": 0.439, "step": 82500 }, { "epoch": 1.55925352272298, "grad_norm": 0.03472723811864853, "learning_rate": 7.796267613614899e-05, "loss": 0.1315, "step": 82550 }, { "epoch": 1.5601979524762948, "grad_norm": 0.03273049369454384, "learning_rate": 7.800989762381475e-05, "loss": 0.1313, "step": 82600 }, { "epoch": 1.5611423822296098, "grad_norm": 0.033700838685035706, "learning_rate": 7.805711911148049e-05, "loss": 0.1313, "step": 82650 }, { "epoch": 1.5620868119829248, "grad_norm": 0.03421711549162865, "learning_rate": 7.810434059914624e-05, "loss": 0.1313, "step": 82700 }, { "epoch": 1.5630312417362395, "grad_norm": 0.034588832408189774, "learning_rate": 7.8151562086812e-05, "loss": 0.1312, "step": 82750 }, { "epoch": 1.5639756714895547, "grad_norm": 0.031996410340070724, "learning_rate": 7.819878357447774e-05, "loss": 0.1311, "step": 82800 }, { "epoch": 1.5649201012428695, "grad_norm": 0.03474227711558342, "learning_rate": 7.824600506214348e-05, "loss": 0.1309, "step": 82850 }, { "epoch": 1.5658645309961845, "grad_norm": 0.03325621411204338, "learning_rate": 7.829322654980923e-05, "loss": 0.1315, "step": 82900 }, { "epoch": 1.5668089607494995, "grad_norm": 0.03478478640317917, "learning_rate": 7.834044803747498e-05, "loss": 0.1315, "step": 82950 }, { "epoch": 1.5677533905028143, "grad_norm": 0.0325407013297081, "learning_rate": 7.838766952514073e-05, "loss": 0.1311, "step": 83000 }, { "epoch": 1.5686978202561295, "grad_norm": 0.03321729600429535, "learning_rate": 7.843489101280647e-05, "loss": 0.1312, "step": 83050 }, { "epoch": 1.5696422500094442, "grad_norm": 0.03430989757180214, "learning_rate": 7.848211250047222e-05, "loss": 0.131, "step": 83100 }, { "epoch": 1.5705866797627592, "grad_norm": 0.03371304273605347, "learning_rate": 7.852933398813796e-05, "loss": 0.1315, "step": 83150 }, { "epoch": 1.5715311095160742, "grad_norm": 0.03275899961590767, "learning_rate": 7.857655547580372e-05, "loss": 0.1314, "step": 83200 }, { "epoch": 1.572475539269389, "grad_norm": 0.031357262283563614, "learning_rate": 7.862377696346947e-05, "loss": 0.1313, "step": 83250 }, { "epoch": 1.5734199690227042, "grad_norm": 0.032311778515577316, "learning_rate": 7.867099845113521e-05, "loss": 0.1314, "step": 83300 }, { "epoch": 1.574364398776019, "grad_norm": 0.03254953771829605, "learning_rate": 7.871821993880095e-05, "loss": 0.1313, "step": 83350 }, { "epoch": 1.575308828529334, "grad_norm": 0.03609485551714897, "learning_rate": 7.87654414264667e-05, "loss": 0.1311, "step": 83400 }, { "epoch": 1.576253258282649, "grad_norm": 0.0334036648273468, "learning_rate": 7.881266291413245e-05, "loss": 0.131, "step": 83450 }, { "epoch": 1.5771976880359637, "grad_norm": 0.034047387540340424, "learning_rate": 7.88598844017982e-05, "loss": 0.1312, "step": 83500 }, { "epoch": 1.578142117789279, "grad_norm": 0.03655078634619713, "learning_rate": 7.890710588946395e-05, "loss": 0.1312, "step": 83550 }, { "epoch": 1.5790865475425937, "grad_norm": 0.03521301969885826, "learning_rate": 7.89543273771297e-05, "loss": 0.1307, "step": 83600 }, { "epoch": 1.5800309772959087, "grad_norm": 0.032875366508960724, "learning_rate": 7.900154886479544e-05, "loss": 0.1308, "step": 83650 }, { "epoch": 1.5809754070492237, "grad_norm": 0.03328433260321617, "learning_rate": 7.904877035246119e-05, "loss": 0.1312, "step": 83700 }, { "epoch": 1.5819198368025387, "grad_norm": 0.031327370554208755, "learning_rate": 7.909599184012694e-05, "loss": 0.1309, "step": 83750 }, { "epoch": 1.5828642665558537, "grad_norm": 0.033544138073921204, "learning_rate": 7.914321332779268e-05, "loss": 0.131, "step": 83800 }, { "epoch": 1.5838086963091684, "grad_norm": 0.03232868015766144, "learning_rate": 7.919043481545842e-05, "loss": 0.1311, "step": 83850 }, { "epoch": 1.5847531260624834, "grad_norm": 0.038089316338300705, "learning_rate": 7.923765630312418e-05, "loss": 0.1313, "step": 83900 }, { "epoch": 1.5856975558157984, "grad_norm": 0.0318075567483902, "learning_rate": 7.928487779078992e-05, "loss": 0.1313, "step": 83950 }, { "epoch": 1.5866419855691134, "grad_norm": 0.033873051404953, "learning_rate": 7.933209927845567e-05, "loss": 0.1307, "step": 84000 }, { "epoch": 1.5875864153224284, "grad_norm": 0.034211598336696625, "learning_rate": 7.937932076612143e-05, "loss": 0.1312, "step": 84050 }, { "epoch": 1.5885308450757432, "grad_norm": 0.03254133090376854, "learning_rate": 7.942654225378716e-05, "loss": 0.1312, "step": 84100 }, { "epoch": 1.5894752748290584, "grad_norm": 0.034095022827386856, "learning_rate": 7.947376374145291e-05, "loss": 0.1307, "step": 84150 }, { "epoch": 1.5904197045823731, "grad_norm": 0.03864233195781708, "learning_rate": 7.952098522911866e-05, "loss": 0.131, "step": 84200 }, { "epoch": 1.5913641343356881, "grad_norm": 0.032559242099523544, "learning_rate": 7.95682067167844e-05, "loss": 0.131, "step": 84250 }, { "epoch": 1.5923085640890031, "grad_norm": 0.03572993353009224, "learning_rate": 7.961542820445016e-05, "loss": 0.1308, "step": 84300 }, { "epoch": 1.5932529938423179, "grad_norm": 0.03364045172929764, "learning_rate": 7.966264969211591e-05, "loss": 0.1308, "step": 84350 }, { "epoch": 1.594197423595633, "grad_norm": 0.033965714275836945, "learning_rate": 7.970987117978165e-05, "loss": 0.1308, "step": 84400 }, { "epoch": 1.5951418533489479, "grad_norm": 0.031207934021949768, "learning_rate": 7.97570926674474e-05, "loss": 0.1308, "step": 84450 }, { "epoch": 1.5960862831022629, "grad_norm": 0.03407738357782364, "learning_rate": 7.980431415511315e-05, "loss": 0.1308, "step": 84500 }, { "epoch": 1.5970307128555778, "grad_norm": 0.03191528841853142, "learning_rate": 7.98515356427789e-05, "loss": 0.1308, "step": 84550 }, { "epoch": 1.5979751426088926, "grad_norm": 0.03319375962018967, "learning_rate": 7.989875713044464e-05, "loss": 0.1309, "step": 84600 }, { "epoch": 1.5989195723622078, "grad_norm": 0.036977045238018036, "learning_rate": 7.994597861811038e-05, "loss": 0.1312, "step": 84650 }, { "epoch": 1.5998640021155226, "grad_norm": 0.0330628976225853, "learning_rate": 7.999320010577614e-05, "loss": 0.131, "step": 84700 }, { "epoch": 1.6008084318688376, "grad_norm": 0.034098900854587555, "learning_rate": 8.004042159344188e-05, "loss": 0.131, "step": 84750 }, { "epoch": 1.6017528616221526, "grad_norm": 0.03371657431125641, "learning_rate": 8.008764308110763e-05, "loss": 0.1302, "step": 84800 }, { "epoch": 1.6026972913754673, "grad_norm": 0.03141997754573822, "learning_rate": 8.013486456877339e-05, "loss": 0.1306, "step": 84850 }, { "epoch": 1.6036417211287826, "grad_norm": 0.03254419192671776, "learning_rate": 8.018208605643911e-05, "loss": 0.1308, "step": 84900 }, { "epoch": 1.6045861508820973, "grad_norm": 0.03265642002224922, "learning_rate": 8.022930754410487e-05, "loss": 0.1308, "step": 84950 }, { "epoch": 1.6055305806354123, "grad_norm": 0.03289772570133209, "learning_rate": 8.027652903177062e-05, "loss": 0.1311, "step": 85000 }, { "epoch": 1.6055305806354123, "eval_IntDiv": 0.6752463156040405, "eval_NumCircles": 1832, "eval_SumBottleneck": 79.28270099440202, "eval_Uniqueness": 0.9953128184226615, "eval_Validity": 0.9814, "eval_Validity * Uniqueness": 0.9768, "eval_loss": 0.2228364795446396, "eval_runtime": 184.5958, "eval_samples_per_second": 54.172, "eval_steps_per_second": 0.428, "step": 85000 }, { "epoch": 1.6064750103887273, "grad_norm": 0.032556310296058655, "learning_rate": 8.032375051943636e-05, "loss": 0.1313, "step": 85050 }, { "epoch": 1.607419440142042, "grad_norm": 0.03210385888814926, "learning_rate": 8.037097200710212e-05, "loss": 0.1311, "step": 85100 }, { "epoch": 1.6083638698953573, "grad_norm": 0.035149507224559784, "learning_rate": 8.041819349476787e-05, "loss": 0.1304, "step": 85150 }, { "epoch": 1.609308299648672, "grad_norm": 0.03774908557534218, "learning_rate": 8.046541498243361e-05, "loss": 0.1312, "step": 85200 }, { "epoch": 1.610252729401987, "grad_norm": 0.031195536255836487, "learning_rate": 8.051263647009935e-05, "loss": 0.1308, "step": 85250 }, { "epoch": 1.611197159155302, "grad_norm": 0.03285038098692894, "learning_rate": 8.055985795776511e-05, "loss": 0.1308, "step": 85300 }, { "epoch": 1.612141588908617, "grad_norm": 0.032728906720876694, "learning_rate": 8.060707944543086e-05, "loss": 0.1309, "step": 85350 }, { "epoch": 1.613086018661932, "grad_norm": 0.03371796756982803, "learning_rate": 8.06543009330966e-05, "loss": 0.1308, "step": 85400 }, { "epoch": 1.6140304484152468, "grad_norm": 0.032543063163757324, "learning_rate": 8.070152242076234e-05, "loss": 0.1312, "step": 85450 }, { "epoch": 1.6149748781685618, "grad_norm": 0.0344734713435173, "learning_rate": 8.07487439084281e-05, "loss": 0.1302, "step": 85500 }, { "epoch": 1.6159193079218768, "grad_norm": 0.032725635915994644, "learning_rate": 8.079596539609384e-05, "loss": 0.1306, "step": 85550 }, { "epoch": 1.6168637376751918, "grad_norm": 0.03293488919734955, "learning_rate": 8.084318688375959e-05, "loss": 0.1308, "step": 85600 }, { "epoch": 1.6178081674285067, "grad_norm": 0.03451158106327057, "learning_rate": 8.089040837142535e-05, "loss": 0.1309, "step": 85650 }, { "epoch": 1.6187525971818215, "grad_norm": 0.03583483397960663, "learning_rate": 8.093762985909109e-05, "loss": 0.1305, "step": 85700 }, { "epoch": 1.6196970269351367, "grad_norm": 0.03246820345520973, "learning_rate": 8.098485134675683e-05, "loss": 0.1305, "step": 85750 }, { "epoch": 1.6206414566884515, "grad_norm": 0.03407864272594452, "learning_rate": 8.103207283442258e-05, "loss": 0.1305, "step": 85800 }, { "epoch": 1.6215858864417665, "grad_norm": 0.034830525517463684, "learning_rate": 8.107929432208832e-05, "loss": 0.1303, "step": 85850 }, { "epoch": 1.6225303161950815, "grad_norm": 0.03173186630010605, "learning_rate": 8.112651580975408e-05, "loss": 0.1307, "step": 85900 }, { "epoch": 1.6234747459483962, "grad_norm": 0.03207417204976082, "learning_rate": 8.117373729741982e-05, "loss": 0.1302, "step": 85950 }, { "epoch": 1.6244191757017115, "grad_norm": 0.03452261537313461, "learning_rate": 8.122095878508557e-05, "loss": 0.1303, "step": 86000 }, { "epoch": 1.6253636054550262, "grad_norm": 0.03754331171512604, "learning_rate": 8.126818027275131e-05, "loss": 0.1308, "step": 86050 }, { "epoch": 1.6263080352083412, "grad_norm": 0.03383311629295349, "learning_rate": 8.131540176041707e-05, "loss": 0.1307, "step": 86100 }, { "epoch": 1.6272524649616562, "grad_norm": 0.032774414867162704, "learning_rate": 8.136262324808282e-05, "loss": 0.131, "step": 86150 }, { "epoch": 1.628196894714971, "grad_norm": 0.03446482867002487, "learning_rate": 8.140984473574856e-05, "loss": 0.1307, "step": 86200 }, { "epoch": 1.6291413244682862, "grad_norm": 0.03273361176252365, "learning_rate": 8.14570662234143e-05, "loss": 0.1308, "step": 86250 }, { "epoch": 1.630085754221601, "grad_norm": 0.03464832529425621, "learning_rate": 8.150428771108006e-05, "loss": 0.1306, "step": 86300 }, { "epoch": 1.631030183974916, "grad_norm": 0.053987544029951096, "learning_rate": 8.15515091987458e-05, "loss": 0.1304, "step": 86350 }, { "epoch": 1.631974613728231, "grad_norm": 0.03320919722318649, "learning_rate": 8.159873068641155e-05, "loss": 0.1305, "step": 86400 }, { "epoch": 1.6329190434815457, "grad_norm": 0.03400113061070442, "learning_rate": 8.16459521740773e-05, "loss": 0.1307, "step": 86450 }, { "epoch": 1.633863473234861, "grad_norm": 0.033012453466653824, "learning_rate": 8.169317366174305e-05, "loss": 0.1303, "step": 86500 }, { "epoch": 1.6348079029881757, "grad_norm": 0.03289708495140076, "learning_rate": 8.174039514940879e-05, "loss": 0.1303, "step": 86550 }, { "epoch": 1.6357523327414907, "grad_norm": 0.04009835794568062, "learning_rate": 8.178761663707454e-05, "loss": 0.1307, "step": 86600 }, { "epoch": 1.6366967624948057, "grad_norm": 0.03311842679977417, "learning_rate": 8.183483812474028e-05, "loss": 0.1308, "step": 86650 }, { "epoch": 1.6376411922481204, "grad_norm": 0.03284565731883049, "learning_rate": 8.188205961240603e-05, "loss": 0.1306, "step": 86700 }, { "epoch": 1.6385856220014356, "grad_norm": 0.03489474207162857, "learning_rate": 8.192928110007178e-05, "loss": 0.1307, "step": 86750 }, { "epoch": 1.6395300517547504, "grad_norm": 0.03317221999168396, "learning_rate": 8.197650258773753e-05, "loss": 0.1303, "step": 86800 }, { "epoch": 1.6404744815080654, "grad_norm": 0.03166181221604347, "learning_rate": 8.202372407540327e-05, "loss": 0.1301, "step": 86850 }, { "epoch": 1.6414189112613804, "grad_norm": 0.03485480323433876, "learning_rate": 8.207094556306902e-05, "loss": 0.1306, "step": 86900 }, { "epoch": 1.6423633410146952, "grad_norm": 0.03391929343342781, "learning_rate": 8.211816705073478e-05, "loss": 0.1309, "step": 86950 }, { "epoch": 1.6433077707680104, "grad_norm": 0.032505277544260025, "learning_rate": 8.216538853840052e-05, "loss": 0.1304, "step": 87000 }, { "epoch": 1.6442522005213251, "grad_norm": 0.033149175345897675, "learning_rate": 8.221261002606626e-05, "loss": 0.13, "step": 87050 }, { "epoch": 1.6451966302746401, "grad_norm": 0.03202742710709572, "learning_rate": 8.225983151373201e-05, "loss": 0.1303, "step": 87100 }, { "epoch": 1.6461410600279551, "grad_norm": 0.035311050713062286, "learning_rate": 8.230705300139775e-05, "loss": 0.1305, "step": 87150 }, { "epoch": 1.6470854897812701, "grad_norm": 0.032540950924158096, "learning_rate": 8.235427448906351e-05, "loss": 0.1305, "step": 87200 }, { "epoch": 1.648029919534585, "grad_norm": 0.032569948583841324, "learning_rate": 8.240149597672926e-05, "loss": 0.1303, "step": 87250 }, { "epoch": 1.6489743492878999, "grad_norm": 0.03402874246239662, "learning_rate": 8.2448717464395e-05, "loss": 0.1304, "step": 87300 }, { "epoch": 1.6499187790412149, "grad_norm": 0.031238287687301636, "learning_rate": 8.249593895206074e-05, "loss": 0.1303, "step": 87350 }, { "epoch": 1.6508632087945299, "grad_norm": 0.03156851977109909, "learning_rate": 8.25431604397265e-05, "loss": 0.1303, "step": 87400 }, { "epoch": 1.6518076385478448, "grad_norm": 0.03367098048329353, "learning_rate": 8.259038192739225e-05, "loss": 0.1304, "step": 87450 }, { "epoch": 1.6527520683011598, "grad_norm": 0.03533583879470825, "learning_rate": 8.2637603415058e-05, "loss": 0.1306, "step": 87500 }, { "epoch": 1.6527520683011598, "eval_IntDiv": 0.675560116307528, "eval_NumCircles": 1858, "eval_SumBottleneck": 71.19473512477576, "eval_Uniqueness": 0.9971507072351684, "eval_Validity": 0.9827, "eval_Validity * Uniqueness": 0.9799, "eval_loss": 0.22135956585407257, "eval_runtime": 170.5735, "eval_samples_per_second": 58.626, "eval_steps_per_second": 0.463, "step": 87500 }, { "epoch": 1.6536964980544746, "grad_norm": 0.03185064345598221, "learning_rate": 8.268482490272373e-05, "loss": 0.1305, "step": 87550 }, { "epoch": 1.6546409278077898, "grad_norm": 0.03493405878543854, "learning_rate": 8.273204639038949e-05, "loss": 0.1306, "step": 87600 }, { "epoch": 1.6555853575611046, "grad_norm": 0.05202694237232208, "learning_rate": 8.277926787805523e-05, "loss": 0.1319, "step": 87650 }, { "epoch": 1.6565297873144196, "grad_norm": 0.035386987030506134, "learning_rate": 8.282648936572098e-05, "loss": 0.1308, "step": 87700 }, { "epoch": 1.6574742170677346, "grad_norm": 0.03221660852432251, "learning_rate": 8.287371085338674e-05, "loss": 0.1306, "step": 87750 }, { "epoch": 1.6584186468210493, "grad_norm": 0.03241260349750519, "learning_rate": 8.292093234105248e-05, "loss": 0.1298, "step": 87800 }, { "epoch": 1.6593630765743645, "grad_norm": 0.03220011293888092, "learning_rate": 8.296815382871822e-05, "loss": 0.1306, "step": 87850 }, { "epoch": 1.6603075063276793, "grad_norm": 0.03164534270763397, "learning_rate": 8.301537531638397e-05, "loss": 0.1307, "step": 87900 }, { "epoch": 1.6612519360809943, "grad_norm": 0.03339521959424019, "learning_rate": 8.306259680404971e-05, "loss": 0.1305, "step": 87950 }, { "epoch": 1.6621963658343093, "grad_norm": 0.03277956694364548, "learning_rate": 8.310981829171547e-05, "loss": 0.1303, "step": 88000 }, { "epoch": 1.663140795587624, "grad_norm": 0.03257771581411362, "learning_rate": 8.315703977938122e-05, "loss": 0.13, "step": 88050 }, { "epoch": 1.6640852253409393, "grad_norm": 0.03333691135048866, "learning_rate": 8.320426126704696e-05, "loss": 0.1303, "step": 88100 }, { "epoch": 1.665029655094254, "grad_norm": 0.032397542148828506, "learning_rate": 8.32514827547127e-05, "loss": 0.1305, "step": 88150 }, { "epoch": 1.665974084847569, "grad_norm": 0.035203032195568085, "learning_rate": 8.329870424237846e-05, "loss": 0.1304, "step": 88200 }, { "epoch": 1.666918514600884, "grad_norm": 0.0326635017991066, "learning_rate": 8.334592573004421e-05, "loss": 0.1305, "step": 88250 }, { "epoch": 1.6678629443541988, "grad_norm": 0.03197743743658066, "learning_rate": 8.339314721770995e-05, "loss": 0.1301, "step": 88300 }, { "epoch": 1.668807374107514, "grad_norm": 0.03436250984668732, "learning_rate": 8.344036870537569e-05, "loss": 0.1302, "step": 88350 }, { "epoch": 1.6697518038608288, "grad_norm": 0.0334109365940094, "learning_rate": 8.348759019304145e-05, "loss": 0.1302, "step": 88400 }, { "epoch": 1.6706962336141438, "grad_norm": 0.032548610121011734, "learning_rate": 8.353481168070719e-05, "loss": 0.1306, "step": 88450 }, { "epoch": 1.6716406633674588, "grad_norm": 0.03424903750419617, "learning_rate": 8.358203316837294e-05, "loss": 0.1302, "step": 88500 }, { "epoch": 1.6725850931207735, "grad_norm": 0.03245558962225914, "learning_rate": 8.36292546560387e-05, "loss": 0.1302, "step": 88550 }, { "epoch": 1.6735295228740887, "grad_norm": 0.033540766686201096, "learning_rate": 8.367647614370442e-05, "loss": 0.1305, "step": 88600 }, { "epoch": 1.6744739526274035, "grad_norm": 0.03311548009514809, "learning_rate": 8.372369763137018e-05, "loss": 0.1304, "step": 88650 }, { "epoch": 1.6754183823807185, "grad_norm": 0.032845038920640945, "learning_rate": 8.377091911903593e-05, "loss": 0.1301, "step": 88700 }, { "epoch": 1.6763628121340335, "grad_norm": 0.031849753111600876, "learning_rate": 8.381814060670167e-05, "loss": 0.13, "step": 88750 }, { "epoch": 1.6773072418873483, "grad_norm": 0.03208203613758087, "learning_rate": 8.386536209436743e-05, "loss": 0.1301, "step": 88800 }, { "epoch": 1.6782516716406635, "grad_norm": 0.03281673789024353, "learning_rate": 8.391258358203318e-05, "loss": 0.1303, "step": 88850 }, { "epoch": 1.6791961013939782, "grad_norm": 0.03231252357363701, "learning_rate": 8.395980506969892e-05, "loss": 0.1306, "step": 88900 }, { "epoch": 1.6801405311472932, "grad_norm": 0.031996697187423706, "learning_rate": 8.400702655736466e-05, "loss": 0.1302, "step": 88950 }, { "epoch": 1.6810849609006082, "grad_norm": 0.032829221338033676, "learning_rate": 8.405424804503042e-05, "loss": 0.13, "step": 89000 }, { "epoch": 1.6820293906539232, "grad_norm": 0.033410314470529556, "learning_rate": 8.410146953269617e-05, "loss": 0.1304, "step": 89050 }, { "epoch": 1.6829738204072382, "grad_norm": 0.03253168612718582, "learning_rate": 8.414869102036191e-05, "loss": 0.1308, "step": 89100 }, { "epoch": 1.683918250160553, "grad_norm": 0.03128289058804512, "learning_rate": 8.419591250802765e-05, "loss": 0.1303, "step": 89150 }, { "epoch": 1.684862679913868, "grad_norm": 0.03179633617401123, "learning_rate": 8.42431339956934e-05, "loss": 0.1302, "step": 89200 }, { "epoch": 1.685807109667183, "grad_norm": 0.033765312284231186, "learning_rate": 8.429035548335915e-05, "loss": 0.1304, "step": 89250 }, { "epoch": 1.686751539420498, "grad_norm": 0.03176012635231018, "learning_rate": 8.43375769710249e-05, "loss": 0.1304, "step": 89300 }, { "epoch": 1.687695969173813, "grad_norm": 0.03212093189358711, "learning_rate": 8.438479845869066e-05, "loss": 0.1306, "step": 89350 }, { "epoch": 1.6886403989271277, "grad_norm": 0.031867872923612595, "learning_rate": 8.443201994635638e-05, "loss": 0.1303, "step": 89400 }, { "epoch": 1.689584828680443, "grad_norm": 0.03292366489768028, "learning_rate": 8.447924143402214e-05, "loss": 0.1302, "step": 89450 }, { "epoch": 1.6905292584337577, "grad_norm": 0.03248576819896698, "learning_rate": 8.452646292168789e-05, "loss": 0.1301, "step": 89500 }, { "epoch": 1.6914736881870727, "grad_norm": 0.034801967442035675, "learning_rate": 8.457368440935363e-05, "loss": 0.1302, "step": 89550 }, { "epoch": 1.6924181179403877, "grad_norm": 0.03333309292793274, "learning_rate": 8.462090589701939e-05, "loss": 0.1298, "step": 89600 }, { "epoch": 1.6933625476937024, "grad_norm": 0.03292447701096535, "learning_rate": 8.466812738468514e-05, "loss": 0.1301, "step": 89650 }, { "epoch": 1.6943069774470176, "grad_norm": 0.03272983431816101, "learning_rate": 8.471534887235088e-05, "loss": 0.1298, "step": 89700 }, { "epoch": 1.6952514072003324, "grad_norm": 0.031518545001745224, "learning_rate": 8.476257036001662e-05, "loss": 0.1299, "step": 89750 }, { "epoch": 1.6961958369536474, "grad_norm": 0.033491890877485275, "learning_rate": 8.480979184768238e-05, "loss": 0.1301, "step": 89800 }, { "epoch": 1.6971402667069624, "grad_norm": 0.03437047451734543, "learning_rate": 8.485701333534813e-05, "loss": 0.1303, "step": 89850 }, { "epoch": 1.6980846964602772, "grad_norm": 0.032266441732645035, "learning_rate": 8.490423482301387e-05, "loss": 0.1299, "step": 89900 }, { "epoch": 1.6990291262135924, "grad_norm": 0.03254459425806999, "learning_rate": 8.495145631067961e-05, "loss": 0.1298, "step": 89950 }, { "epoch": 1.6999735559669071, "grad_norm": 0.0328393317759037, "learning_rate": 8.499867779834536e-05, "loss": 0.1302, "step": 90000 }, { "epoch": 1.6999735559669071, "eval_IntDiv": 0.6763735787602316, "eval_NumCircles": 1845, "eval_SumBottleneck": 118.52647713183667, "eval_Uniqueness": 0.9968518330455977, "eval_Validity": 0.9847, "eval_Validity * Uniqueness": 0.9816, "eval_loss": 0.22151616215705872, "eval_runtime": 182.907, "eval_samples_per_second": 54.673, "eval_steps_per_second": 0.432, "step": 90000 }, { "epoch": 1.7009179857202221, "grad_norm": 0.032844070345163345, "learning_rate": 8.50458992860111e-05, "loss": 0.1296, "step": 90050 }, { "epoch": 1.7018624154735371, "grad_norm": 0.033383093774318695, "learning_rate": 8.509312077367686e-05, "loss": 0.1301, "step": 90100 }, { "epoch": 1.7028068452268519, "grad_norm": 0.03271855413913727, "learning_rate": 8.514034226134261e-05, "loss": 0.1303, "step": 90150 }, { "epoch": 1.703751274980167, "grad_norm": 0.03207269683480263, "learning_rate": 8.518756374900834e-05, "loss": 0.1299, "step": 90200 }, { "epoch": 1.7046957047334819, "grad_norm": 0.03107481263577938, "learning_rate": 8.52347852366741e-05, "loss": 0.1296, "step": 90250 }, { "epoch": 1.7056401344867969, "grad_norm": 0.031586114317178726, "learning_rate": 8.528200672433985e-05, "loss": 0.13, "step": 90300 }, { "epoch": 1.7065845642401118, "grad_norm": 0.03357912227511406, "learning_rate": 8.532922821200559e-05, "loss": 0.1301, "step": 90350 }, { "epoch": 1.7075289939934266, "grad_norm": 0.03239195793867111, "learning_rate": 8.537644969967134e-05, "loss": 0.1298, "step": 90400 }, { "epoch": 1.7084734237467418, "grad_norm": 0.03342338651418686, "learning_rate": 8.54236711873371e-05, "loss": 0.1303, "step": 90450 }, { "epoch": 1.7094178535000566, "grad_norm": 0.031242061406373978, "learning_rate": 8.547089267500284e-05, "loss": 0.13, "step": 90500 }, { "epoch": 1.7103622832533716, "grad_norm": 0.031504400074481964, "learning_rate": 8.551811416266858e-05, "loss": 0.1298, "step": 90550 }, { "epoch": 1.7113067130066866, "grad_norm": 0.03305623307824135, "learning_rate": 8.556533565033433e-05, "loss": 0.1303, "step": 90600 }, { "epoch": 1.7122511427600016, "grad_norm": 0.05198463052511215, "learning_rate": 8.561255713800009e-05, "loss": 0.1302, "step": 90650 }, { "epoch": 1.7131955725133166, "grad_norm": 0.03155484423041344, "learning_rate": 8.565977862566583e-05, "loss": 0.1301, "step": 90700 }, { "epoch": 1.7141400022666313, "grad_norm": 0.03167435899376869, "learning_rate": 8.570700011333157e-05, "loss": 0.1297, "step": 90750 }, { "epoch": 1.7150844320199463, "grad_norm": 0.03249998763203621, "learning_rate": 8.575422160099732e-05, "loss": 0.13, "step": 90800 }, { "epoch": 1.7160288617732613, "grad_norm": 0.031752586364746094, "learning_rate": 8.580144308866306e-05, "loss": 0.13, "step": 90850 }, { "epoch": 1.7169732915265763, "grad_norm": 0.0341353714466095, "learning_rate": 8.584866457632882e-05, "loss": 0.13, "step": 90900 }, { "epoch": 1.7179177212798913, "grad_norm": 0.03167761489748955, "learning_rate": 8.589588606399457e-05, "loss": 0.13, "step": 90950 }, { "epoch": 1.718862151033206, "grad_norm": 0.030908364802598953, "learning_rate": 8.594310755166031e-05, "loss": 0.1301, "step": 91000 }, { "epoch": 1.719806580786521, "grad_norm": 0.03247930109500885, "learning_rate": 8.599032903932605e-05, "loss": 0.13, "step": 91050 }, { "epoch": 1.720751010539836, "grad_norm": 0.03251555562019348, "learning_rate": 8.603755052699181e-05, "loss": 0.1299, "step": 91100 }, { "epoch": 1.721695440293151, "grad_norm": 0.03408970683813095, "learning_rate": 8.608477201465755e-05, "loss": 0.1303, "step": 91150 }, { "epoch": 1.722639870046466, "grad_norm": 0.03323538228869438, "learning_rate": 8.61319935023233e-05, "loss": 0.13, "step": 91200 }, { "epoch": 1.7235842997997808, "grad_norm": 0.03317233547568321, "learning_rate": 8.617921498998904e-05, "loss": 0.1299, "step": 91250 }, { "epoch": 1.724528729553096, "grad_norm": 0.03204472362995148, "learning_rate": 8.62264364776548e-05, "loss": 0.1297, "step": 91300 }, { "epoch": 1.7254731593064108, "grad_norm": 0.03452823683619499, "learning_rate": 8.627365796532054e-05, "loss": 0.1302, "step": 91350 }, { "epoch": 1.7264175890597258, "grad_norm": 0.03206075727939606, "learning_rate": 8.632087945298629e-05, "loss": 0.1296, "step": 91400 }, { "epoch": 1.7273620188130407, "grad_norm": 0.03215822950005531, "learning_rate": 8.636810094065205e-05, "loss": 0.1302, "step": 91450 }, { "epoch": 1.7283064485663555, "grad_norm": 0.03127072751522064, "learning_rate": 8.641532242831779e-05, "loss": 0.1297, "step": 91500 }, { "epoch": 1.7292508783196707, "grad_norm": 0.03346798196434975, "learning_rate": 8.646254391598353e-05, "loss": 0.1299, "step": 91550 }, { "epoch": 1.7301953080729855, "grad_norm": 0.03361326828598976, "learning_rate": 8.650976540364928e-05, "loss": 0.13, "step": 91600 }, { "epoch": 1.7311397378263005, "grad_norm": 0.03208928555250168, "learning_rate": 8.655698689131502e-05, "loss": 0.13, "step": 91650 }, { "epoch": 1.7320841675796155, "grad_norm": 0.03289501368999481, "learning_rate": 8.660420837898078e-05, "loss": 0.1298, "step": 91700 }, { "epoch": 1.7330285973329302, "grad_norm": 0.031941741704940796, "learning_rate": 8.665142986664653e-05, "loss": 0.1298, "step": 91750 }, { "epoch": 1.7339730270862455, "grad_norm": 0.03291500732302666, "learning_rate": 8.669865135431227e-05, "loss": 0.1296, "step": 91800 }, { "epoch": 1.7349174568395602, "grad_norm": 0.03263208270072937, "learning_rate": 8.674587284197801e-05, "loss": 0.1293, "step": 91850 }, { "epoch": 1.7358618865928752, "grad_norm": 0.03268318250775337, "learning_rate": 8.679309432964377e-05, "loss": 0.1297, "step": 91900 }, { "epoch": 1.7368063163461902, "grad_norm": 0.03185218572616577, "learning_rate": 8.684031581730951e-05, "loss": 0.1301, "step": 91950 }, { "epoch": 1.737750746099505, "grad_norm": 0.03265377879142761, "learning_rate": 8.688753730497526e-05, "loss": 0.13, "step": 92000 }, { "epoch": 1.7386951758528202, "grad_norm": 0.030994277447462082, "learning_rate": 8.6934758792641e-05, "loss": 0.1299, "step": 92050 }, { "epoch": 1.739639605606135, "grad_norm": 0.03463870659470558, "learning_rate": 8.698198028030676e-05, "loss": 0.1298, "step": 92100 }, { "epoch": 1.74058403535945, "grad_norm": 0.03511086106300354, "learning_rate": 8.70292017679725e-05, "loss": 0.1299, "step": 92150 }, { "epoch": 1.741528465112765, "grad_norm": 0.030512243509292603, "learning_rate": 8.707642325563825e-05, "loss": 0.1296, "step": 92200 }, { "epoch": 1.7424728948660797, "grad_norm": 0.030884580686688423, "learning_rate": 8.7123644743304e-05, "loss": 0.1294, "step": 92250 }, { "epoch": 1.743417324619395, "grad_norm": 0.03296820446848869, "learning_rate": 8.717086623096975e-05, "loss": 0.1301, "step": 92300 }, { "epoch": 1.7443617543727097, "grad_norm": 0.03204120323061943, "learning_rate": 8.721808771863549e-05, "loss": 0.1297, "step": 92350 }, { "epoch": 1.7453061841260247, "grad_norm": 0.03161325678229332, "learning_rate": 8.726530920630124e-05, "loss": 0.1299, "step": 92400 }, { "epoch": 1.7462506138793397, "grad_norm": 0.03171123191714287, "learning_rate": 8.731253069396698e-05, "loss": 0.1294, "step": 92450 }, { "epoch": 1.7471950436326547, "grad_norm": 0.03336206078529358, "learning_rate": 8.735975218163274e-05, "loss": 0.1299, "step": 92500 }, { "epoch": 1.7471950436326547, "eval_IntDiv": 0.6764717757341718, "eval_NumCircles": 1844, "eval_SumBottleneck": 121.93734316157848, "eval_Uniqueness": 0.9964329392580513, "eval_Validity": 0.9812, "eval_Validity * Uniqueness": 0.9776999999999999, "eval_loss": 0.2202538549900055, "eval_runtime": 194.5828, "eval_samples_per_second": 51.392, "eval_steps_per_second": 0.406, "step": 92500 }, { "epoch": 1.7481394733859696, "grad_norm": 0.03265482932329178, "learning_rate": 8.740697366929849e-05, "loss": 0.1303, "step": 92550 }, { "epoch": 1.7490839031392844, "grad_norm": 0.03214295580983162, "learning_rate": 8.745419515696423e-05, "loss": 0.1297, "step": 92600 }, { "epoch": 1.7500283328925994, "grad_norm": 0.03226783499121666, "learning_rate": 8.750141664462997e-05, "loss": 0.1298, "step": 92650 }, { "epoch": 1.7509727626459144, "grad_norm": 0.031816188246011734, "learning_rate": 8.754863813229573e-05, "loss": 0.1295, "step": 92700 }, { "epoch": 1.7519171923992294, "grad_norm": 0.03170837461948395, "learning_rate": 8.759585961996148e-05, "loss": 0.1291, "step": 92750 }, { "epoch": 1.7528616221525444, "grad_norm": 0.03050745651125908, "learning_rate": 8.764308110762722e-05, "loss": 0.1297, "step": 92800 }, { "epoch": 1.7538060519058591, "grad_norm": 0.031236059963703156, "learning_rate": 8.769030259529296e-05, "loss": 0.1297, "step": 92850 }, { "epoch": 1.7547504816591744, "grad_norm": 0.03299104794859886, "learning_rate": 8.773752408295872e-05, "loss": 0.1299, "step": 92900 }, { "epoch": 1.7556949114124891, "grad_norm": 0.03372008726000786, "learning_rate": 8.778474557062446e-05, "loss": 0.1293, "step": 92950 }, { "epoch": 1.7566393411658041, "grad_norm": 0.03325498476624489, "learning_rate": 8.783196705829021e-05, "loss": 0.1296, "step": 93000 }, { "epoch": 1.757583770919119, "grad_norm": 0.03384057804942131, "learning_rate": 8.787918854595596e-05, "loss": 0.1299, "step": 93050 }, { "epoch": 1.7585282006724339, "grad_norm": 0.032343607395887375, "learning_rate": 8.79264100336217e-05, "loss": 0.1298, "step": 93100 }, { "epoch": 1.759472630425749, "grad_norm": 0.03339138254523277, "learning_rate": 8.797363152128745e-05, "loss": 0.1299, "step": 93150 }, { "epoch": 1.7604170601790639, "grad_norm": 0.031661685556173325, "learning_rate": 8.80208530089532e-05, "loss": 0.1297, "step": 93200 }, { "epoch": 1.7613614899323788, "grad_norm": 0.03327033296227455, "learning_rate": 8.806807449661894e-05, "loss": 0.1296, "step": 93250 }, { "epoch": 1.7623059196856938, "grad_norm": 0.03704866021871567, "learning_rate": 8.81152959842847e-05, "loss": 0.13, "step": 93300 }, { "epoch": 1.7632503494390086, "grad_norm": 0.03303058072924614, "learning_rate": 8.816251747195045e-05, "loss": 0.1302, "step": 93350 }, { "epoch": 1.7641947791923238, "grad_norm": 0.03383225202560425, "learning_rate": 8.820973895961619e-05, "loss": 0.1298, "step": 93400 }, { "epoch": 1.7651392089456386, "grad_norm": 0.03151782229542732, "learning_rate": 8.825696044728193e-05, "loss": 0.1295, "step": 93450 }, { "epoch": 1.7660836386989536, "grad_norm": 0.03220135718584061, "learning_rate": 8.830418193494768e-05, "loss": 0.1299, "step": 93500 }, { "epoch": 1.7670280684522686, "grad_norm": 0.03270825743675232, "learning_rate": 8.835140342261344e-05, "loss": 0.1299, "step": 93550 }, { "epoch": 1.7679724982055833, "grad_norm": 0.03184273838996887, "learning_rate": 8.839862491027918e-05, "loss": 0.1299, "step": 93600 }, { "epoch": 1.7689169279588985, "grad_norm": 0.032908834517002106, "learning_rate": 8.844584639794492e-05, "loss": 0.1295, "step": 93650 }, { "epoch": 1.7698613577122133, "grad_norm": 0.03238241747021675, "learning_rate": 8.849306788561067e-05, "loss": 0.1295, "step": 93700 }, { "epoch": 1.7708057874655283, "grad_norm": 0.03502850607037544, "learning_rate": 8.854028937327642e-05, "loss": 0.13, "step": 93750 }, { "epoch": 1.7717502172188433, "grad_norm": 0.031221669167280197, "learning_rate": 8.858751086094217e-05, "loss": 0.1297, "step": 93800 }, { "epoch": 1.772694646972158, "grad_norm": 0.03292059525847435, "learning_rate": 8.863473234860792e-05, "loss": 0.1292, "step": 93850 }, { "epoch": 1.7736390767254733, "grad_norm": 0.031278345733881, "learning_rate": 8.868195383627365e-05, "loss": 0.1297, "step": 93900 }, { "epoch": 1.774583506478788, "grad_norm": 0.032782282680273056, "learning_rate": 8.87291753239394e-05, "loss": 0.1298, "step": 93950 }, { "epoch": 1.775527936232103, "grad_norm": 0.031976472586393356, "learning_rate": 8.877639681160516e-05, "loss": 0.1296, "step": 94000 }, { "epoch": 1.776472365985418, "grad_norm": 0.03204074874520302, "learning_rate": 8.88236182992709e-05, "loss": 0.1293, "step": 94050 }, { "epoch": 1.7774167957387328, "grad_norm": 0.03530345484614372, "learning_rate": 8.887083978693665e-05, "loss": 0.1295, "step": 94100 }, { "epoch": 1.778361225492048, "grad_norm": 0.032665058970451355, "learning_rate": 8.891806127460241e-05, "loss": 0.1297, "step": 94150 }, { "epoch": 1.7793056552453628, "grad_norm": 0.031935494393110275, "learning_rate": 8.896528276226815e-05, "loss": 0.1296, "step": 94200 }, { "epoch": 1.7802500849986778, "grad_norm": 0.0330500565469265, "learning_rate": 8.901250424993389e-05, "loss": 0.1296, "step": 94250 }, { "epoch": 1.7811945147519928, "grad_norm": 0.03153182938694954, "learning_rate": 8.905972573759964e-05, "loss": 0.1292, "step": 94300 }, { "epoch": 1.7821389445053077, "grad_norm": 0.03515075519680977, "learning_rate": 8.91069472252654e-05, "loss": 0.1296, "step": 94350 }, { "epoch": 1.7830833742586227, "grad_norm": 0.032303888350725174, "learning_rate": 8.915416871293114e-05, "loss": 0.1294, "step": 94400 }, { "epoch": 1.7840278040119375, "grad_norm": 0.033024366945028305, "learning_rate": 8.920139020059688e-05, "loss": 0.1295, "step": 94450 }, { "epoch": 1.7849722337652525, "grad_norm": 0.032366979867219925, "learning_rate": 8.924861168826263e-05, "loss": 0.1295, "step": 94500 }, { "epoch": 1.7859166635185675, "grad_norm": 0.03495559096336365, "learning_rate": 8.929583317592837e-05, "loss": 0.1296, "step": 94550 }, { "epoch": 1.7868610932718825, "grad_norm": 0.03195580095052719, "learning_rate": 8.934305466359413e-05, "loss": 0.1293, "step": 94600 }, { "epoch": 1.7878055230251975, "grad_norm": 0.03369217738509178, "learning_rate": 8.939027615125988e-05, "loss": 0.1297, "step": 94650 }, { "epoch": 1.7887499527785122, "grad_norm": 0.03430734574794769, "learning_rate": 8.943749763892561e-05, "loss": 0.1294, "step": 94700 }, { "epoch": 1.7896943825318274, "grad_norm": 0.0328482948243618, "learning_rate": 8.948471912659136e-05, "loss": 0.1294, "step": 94750 }, { "epoch": 1.7906388122851422, "grad_norm": 0.03214641660451889, "learning_rate": 8.953194061425712e-05, "loss": 0.1294, "step": 94800 }, { "epoch": 1.7915832420384572, "grad_norm": 0.03139464929699898, "learning_rate": 8.957916210192286e-05, "loss": 0.1295, "step": 94850 }, { "epoch": 1.7925276717917722, "grad_norm": 0.031085209921002388, "learning_rate": 8.962638358958861e-05, "loss": 0.1297, "step": 94900 }, { "epoch": 1.793472101545087, "grad_norm": 0.03182016313076019, "learning_rate": 8.967360507725437e-05, "loss": 0.1295, "step": 94950 }, { "epoch": 1.7944165312984022, "grad_norm": 0.03288981318473816, "learning_rate": 8.972082656492011e-05, "loss": 0.1291, "step": 95000 }, { "epoch": 1.7944165312984022, "eval_IntDiv": 0.6761179369024302, "eval_NumCircles": 1853, "eval_SumBottleneck": 73.73124528243243, "eval_Uniqueness": 0.9966490658001624, "eval_Validity": 0.9848, "eval_Validity * Uniqueness": 0.9814999999999999, "eval_loss": 0.22177205979824066, "eval_runtime": 156.3624, "eval_samples_per_second": 63.954, "eval_steps_per_second": 0.505, "step": 95000 }, { "epoch": 1.795360961051717, "grad_norm": 0.030356988310813904, "learning_rate": 8.976804805258585e-05, "loss": 0.1292, "step": 95050 }, { "epoch": 1.796305390805032, "grad_norm": 0.03299425169825554, "learning_rate": 8.98152695402516e-05, "loss": 0.1297, "step": 95100 }, { "epoch": 1.797249820558347, "grad_norm": 0.034271370619535446, "learning_rate": 8.986249102791736e-05, "loss": 0.1289, "step": 95150 }, { "epoch": 1.7981942503116617, "grad_norm": 0.03240935131907463, "learning_rate": 8.99097125155831e-05, "loss": 0.1295, "step": 95200 }, { "epoch": 1.799138680064977, "grad_norm": 0.03102274425327778, "learning_rate": 8.995693400324884e-05, "loss": 0.1297, "step": 95250 }, { "epoch": 1.8000831098182917, "grad_norm": 0.03209412842988968, "learning_rate": 9.000415549091459e-05, "loss": 0.1294, "step": 95300 }, { "epoch": 1.8010275395716067, "grad_norm": 0.034560251981019974, "learning_rate": 9.005137697858033e-05, "loss": 0.1293, "step": 95350 }, { "epoch": 1.8019719693249217, "grad_norm": 0.03372807800769806, "learning_rate": 9.009859846624609e-05, "loss": 0.1297, "step": 95400 }, { "epoch": 1.8029163990782364, "grad_norm": 0.031143080443143845, "learning_rate": 9.014581995391184e-05, "loss": 0.1292, "step": 95450 }, { "epoch": 1.8038608288315516, "grad_norm": 0.03242100030183792, "learning_rate": 9.019304144157757e-05, "loss": 0.1289, "step": 95500 }, { "epoch": 1.8048052585848664, "grad_norm": 0.031234469264745712, "learning_rate": 9.024026292924332e-05, "loss": 0.1297, "step": 95550 }, { "epoch": 1.8057496883381814, "grad_norm": 0.0313754640519619, "learning_rate": 9.028748441690908e-05, "loss": 0.1294, "step": 95600 }, { "epoch": 1.8066941180914964, "grad_norm": 0.030753374099731445, "learning_rate": 9.033470590457482e-05, "loss": 0.1295, "step": 95650 }, { "epoch": 1.8076385478448111, "grad_norm": 0.03201891854405403, "learning_rate": 9.038192739224057e-05, "loss": 0.129, "step": 95700 }, { "epoch": 1.8085829775981264, "grad_norm": 0.03216942399740219, "learning_rate": 9.042914887990633e-05, "loss": 0.1295, "step": 95750 }, { "epoch": 1.8095274073514411, "grad_norm": 0.03384096920490265, "learning_rate": 9.047637036757207e-05, "loss": 0.1293, "step": 95800 }, { "epoch": 1.8104718371047561, "grad_norm": 0.03245903551578522, "learning_rate": 9.052359185523781e-05, "loss": 0.1292, "step": 95850 }, { "epoch": 1.8114162668580711, "grad_norm": 0.0323839895427227, "learning_rate": 9.057081334290356e-05, "loss": 0.1292, "step": 95900 }, { "epoch": 1.8123606966113859, "grad_norm": 0.03167814761400223, "learning_rate": 9.061803483056932e-05, "loss": 0.1294, "step": 95950 }, { "epoch": 1.813305126364701, "grad_norm": 0.031890254467725754, "learning_rate": 9.066525631823506e-05, "loss": 0.1291, "step": 96000 }, { "epoch": 1.8142495561180159, "grad_norm": 0.03097745031118393, "learning_rate": 9.07124778059008e-05, "loss": 0.1294, "step": 96050 }, { "epoch": 1.8151939858713309, "grad_norm": 0.03142160549759865, "learning_rate": 9.075969929356655e-05, "loss": 0.1293, "step": 96100 }, { "epoch": 1.8161384156246458, "grad_norm": 0.03213433548808098, "learning_rate": 9.080692078123229e-05, "loss": 0.1292, "step": 96150 }, { "epoch": 1.8170828453779608, "grad_norm": 0.03310408070683479, "learning_rate": 9.085414226889805e-05, "loss": 0.1296, "step": 96200 }, { "epoch": 1.8180272751312758, "grad_norm": 0.029789285734295845, "learning_rate": 9.09013637565638e-05, "loss": 0.1295, "step": 96250 }, { "epoch": 1.8189717048845906, "grad_norm": 0.031007548794150352, "learning_rate": 9.094858524422954e-05, "loss": 0.1293, "step": 96300 }, { "epoch": 1.8199161346379056, "grad_norm": 0.0332544706761837, "learning_rate": 9.099580673189528e-05, "loss": 0.1291, "step": 96350 }, { "epoch": 1.8208605643912206, "grad_norm": 0.032597627490758896, "learning_rate": 9.104302821956104e-05, "loss": 0.1291, "step": 96400 }, { "epoch": 1.8218049941445356, "grad_norm": 0.03137396275997162, "learning_rate": 9.109024970722678e-05, "loss": 0.1292, "step": 96450 }, { "epoch": 1.8227494238978506, "grad_norm": 0.03485961630940437, "learning_rate": 9.113747119489253e-05, "loss": 0.1292, "step": 96500 }, { "epoch": 1.8236938536511653, "grad_norm": 0.03189757466316223, "learning_rate": 9.118469268255827e-05, "loss": 0.1293, "step": 96550 }, { "epoch": 1.8246382834044805, "grad_norm": 0.032880473881959915, "learning_rate": 9.123191417022403e-05, "loss": 0.1289, "step": 96600 }, { "epoch": 1.8255827131577953, "grad_norm": 0.03189772740006447, "learning_rate": 9.127913565788977e-05, "loss": 0.1292, "step": 96650 }, { "epoch": 1.8265271429111103, "grad_norm": 0.03686245530843735, "learning_rate": 9.132635714555552e-05, "loss": 0.1292, "step": 96700 }, { "epoch": 1.8274715726644253, "grad_norm": 0.030567971989512444, "learning_rate": 9.137357863322127e-05, "loss": 0.129, "step": 96750 }, { "epoch": 1.82841600241774, "grad_norm": 0.031383056193590164, "learning_rate": 9.142080012088701e-05, "loss": 0.1294, "step": 96800 }, { "epoch": 1.8293604321710553, "grad_norm": 0.03135773539543152, "learning_rate": 9.146802160855276e-05, "loss": 0.1294, "step": 96850 }, { "epoch": 1.83030486192437, "grad_norm": 0.030293315649032593, "learning_rate": 9.151524309621851e-05, "loss": 0.1292, "step": 96900 }, { "epoch": 1.831249291677685, "grad_norm": 0.032779302448034286, "learning_rate": 9.156246458388425e-05, "loss": 0.1294, "step": 96950 }, { "epoch": 1.832193721431, "grad_norm": 0.030849242582917213, "learning_rate": 9.160968607155e-05, "loss": 0.129, "step": 97000 }, { "epoch": 1.8331381511843148, "grad_norm": 0.031763121485710144, "learning_rate": 9.165690755921576e-05, "loss": 0.1291, "step": 97050 }, { "epoch": 1.83408258093763, "grad_norm": 0.03407585993409157, "learning_rate": 9.17041290468815e-05, "loss": 0.1294, "step": 97100 }, { "epoch": 1.8350270106909448, "grad_norm": 0.03244151920080185, "learning_rate": 9.175135053454724e-05, "loss": 0.1294, "step": 97150 }, { "epoch": 1.8359714404442598, "grad_norm": 0.033093202859163284, "learning_rate": 9.1798572022213e-05, "loss": 0.1295, "step": 97200 }, { "epoch": 1.8369158701975747, "grad_norm": 0.03308787941932678, "learning_rate": 9.184579350987873e-05, "loss": 0.1291, "step": 97250 }, { "epoch": 1.8378602999508895, "grad_norm": 0.03181995451450348, "learning_rate": 9.189301499754449e-05, "loss": 0.1293, "step": 97300 }, { "epoch": 1.8388047297042047, "grad_norm": 0.03397463634610176, "learning_rate": 9.194023648521023e-05, "loss": 0.129, "step": 97350 }, { "epoch": 1.8397491594575195, "grad_norm": 0.0319986455142498, "learning_rate": 9.198745797287598e-05, "loss": 0.1292, "step": 97400 }, { "epoch": 1.8406935892108345, "grad_norm": 0.03074694238603115, "learning_rate": 9.203467946054172e-05, "loss": 0.129, "step": 97450 }, { "epoch": 1.8416380189641495, "grad_norm": 0.03126883879303932, "learning_rate": 9.208190094820748e-05, "loss": 0.1295, "step": 97500 }, { "epoch": 1.8416380189641495, "eval_IntDiv": 0.6741635491429127, "eval_NumCircles": 1775, "eval_SumBottleneck": 81.78865202500032, "eval_Uniqueness": 0.9976654486398701, "eval_Validity": 0.9852, "eval_Validity * Uniqueness": 0.9829, "eval_loss": 0.22220973670482635, "eval_runtime": 149.8036, "eval_samples_per_second": 66.754, "eval_steps_per_second": 0.527, "step": 97500 }, { "epoch": 1.8425824487174642, "grad_norm": 0.03375394642353058, "learning_rate": 9.212912243587323e-05, "loss": 0.1292, "step": 97550 }, { "epoch": 1.8435268784707795, "grad_norm": 0.035560403019189835, "learning_rate": 9.217634392353897e-05, "loss": 0.1289, "step": 97600 }, { "epoch": 1.8444713082240942, "grad_norm": 0.03282679244875908, "learning_rate": 9.222356541120471e-05, "loss": 0.1295, "step": 97650 }, { "epoch": 1.8454157379774092, "grad_norm": 0.03246370702981949, "learning_rate": 9.227078689887047e-05, "loss": 0.1291, "step": 97700 }, { "epoch": 1.8463601677307242, "grad_norm": 0.03099025785923004, "learning_rate": 9.231800838653621e-05, "loss": 0.1288, "step": 97750 }, { "epoch": 1.8473045974840392, "grad_norm": 0.03150777518749237, "learning_rate": 9.236522987420196e-05, "loss": 0.129, "step": 97800 }, { "epoch": 1.8482490272373542, "grad_norm": 0.030322782695293427, "learning_rate": 9.241245136186772e-05, "loss": 0.1294, "step": 97850 }, { "epoch": 1.849193456990669, "grad_norm": 0.033207107335329056, "learning_rate": 9.245967284953346e-05, "loss": 0.1291, "step": 97900 }, { "epoch": 1.850137886743984, "grad_norm": 0.030867090448737144, "learning_rate": 9.25068943371992e-05, "loss": 0.1292, "step": 97950 }, { "epoch": 1.851082316497299, "grad_norm": 0.031916942447423935, "learning_rate": 9.255411582486495e-05, "loss": 0.1292, "step": 98000 }, { "epoch": 1.852026746250614, "grad_norm": 0.03201865777373314, "learning_rate": 9.260133731253071e-05, "loss": 0.129, "step": 98050 }, { "epoch": 1.852971176003929, "grad_norm": 0.03251785784959793, "learning_rate": 9.264855880019645e-05, "loss": 0.129, "step": 98100 }, { "epoch": 1.8539156057572437, "grad_norm": 0.036396533250808716, "learning_rate": 9.269578028786219e-05, "loss": 0.1293, "step": 98150 }, { "epoch": 1.854860035510559, "grad_norm": 0.030961332842707634, "learning_rate": 9.274300177552794e-05, "loss": 0.1286, "step": 98200 }, { "epoch": 1.8558044652638737, "grad_norm": 0.03121994435787201, "learning_rate": 9.279022326319368e-05, "loss": 0.129, "step": 98250 }, { "epoch": 1.8567488950171886, "grad_norm": 0.030900532379746437, "learning_rate": 9.283744475085944e-05, "loss": 0.1288, "step": 98300 }, { "epoch": 1.8576933247705036, "grad_norm": 0.03200496360659599, "learning_rate": 9.288466623852519e-05, "loss": 0.129, "step": 98350 }, { "epoch": 1.8586377545238184, "grad_norm": 0.03078722022473812, "learning_rate": 9.293188772619092e-05, "loss": 0.129, "step": 98400 }, { "epoch": 1.8595821842771336, "grad_norm": 0.034765392541885376, "learning_rate": 9.297910921385667e-05, "loss": 0.1294, "step": 98450 }, { "epoch": 1.8605266140304484, "grad_norm": 0.031112344935536385, "learning_rate": 9.302633070152243e-05, "loss": 0.1292, "step": 98500 }, { "epoch": 1.8614710437837634, "grad_norm": 0.03214152902364731, "learning_rate": 9.307355218918817e-05, "loss": 0.1291, "step": 98550 }, { "epoch": 1.8624154735370784, "grad_norm": 0.0314289890229702, "learning_rate": 9.312077367685392e-05, "loss": 0.1289, "step": 98600 }, { "epoch": 1.8633599032903931, "grad_norm": 0.03377971425652504, "learning_rate": 9.316799516451968e-05, "loss": 0.1289, "step": 98650 }, { "epoch": 1.8643043330437084, "grad_norm": 0.03157028928399086, "learning_rate": 9.321521665218542e-05, "loss": 0.1289, "step": 98700 }, { "epoch": 1.8652487627970231, "grad_norm": 0.031073100864887238, "learning_rate": 9.326243813985116e-05, "loss": 0.1284, "step": 98750 }, { "epoch": 1.866193192550338, "grad_norm": 0.032128702849149704, "learning_rate": 9.330965962751691e-05, "loss": 0.1291, "step": 98800 }, { "epoch": 1.867137622303653, "grad_norm": 0.030978592112660408, "learning_rate": 9.335688111518267e-05, "loss": 0.1289, "step": 98850 }, { "epoch": 1.8680820520569679, "grad_norm": 0.029975784942507744, "learning_rate": 9.34041026028484e-05, "loss": 0.1291, "step": 98900 }, { "epoch": 1.869026481810283, "grad_norm": 0.03138572722673416, "learning_rate": 9.345132409051415e-05, "loss": 0.1287, "step": 98950 }, { "epoch": 1.8699709115635978, "grad_norm": 0.032420482486486435, "learning_rate": 9.34985455781799e-05, "loss": 0.1287, "step": 99000 }, { "epoch": 1.8709153413169128, "grad_norm": 0.031986743211746216, "learning_rate": 9.354576706584564e-05, "loss": 0.1293, "step": 99050 }, { "epoch": 1.8718597710702278, "grad_norm": 0.030881498008966446, "learning_rate": 9.35929885535114e-05, "loss": 0.1288, "step": 99100 }, { "epoch": 1.8728042008235426, "grad_norm": 0.032784219831228256, "learning_rate": 9.364021004117715e-05, "loss": 0.1287, "step": 99150 }, { "epoch": 1.8737486305768578, "grad_norm": 0.03237314522266388, "learning_rate": 9.368743152884288e-05, "loss": 0.1291, "step": 99200 }, { "epoch": 1.8746930603301726, "grad_norm": 0.03215375170111656, "learning_rate": 9.373465301650863e-05, "loss": 0.1292, "step": 99250 }, { "epoch": 1.8756374900834876, "grad_norm": 0.032943256199359894, "learning_rate": 9.378187450417439e-05, "loss": 0.1292, "step": 99300 }, { "epoch": 1.8765819198368026, "grad_norm": 0.03276362642645836, "learning_rate": 9.382909599184013e-05, "loss": 0.1291, "step": 99350 }, { "epoch": 1.8775263495901173, "grad_norm": 0.032118942588567734, "learning_rate": 9.387631747950588e-05, "loss": 0.1288, "step": 99400 }, { "epoch": 1.8784707793434325, "grad_norm": 0.03151397779583931, "learning_rate": 9.392353896717164e-05, "loss": 0.129, "step": 99450 }, { "epoch": 1.8794152090967473, "grad_norm": 0.031651269644498825, "learning_rate": 9.397076045483738e-05, "loss": 0.129, "step": 99500 }, { "epoch": 1.8803596388500623, "grad_norm": 0.03145061805844307, "learning_rate": 9.401798194250312e-05, "loss": 0.129, "step": 99550 }, { "epoch": 1.8813040686033773, "grad_norm": 0.03131103515625, "learning_rate": 9.406520343016887e-05, "loss": 0.1289, "step": 99600 }, { "epoch": 1.8822484983566923, "grad_norm": 0.032128430902957916, "learning_rate": 9.411242491783462e-05, "loss": 0.1284, "step": 99650 }, { "epoch": 1.8831929281100073, "grad_norm": 0.03198719024658203, "learning_rate": 9.415964640550037e-05, "loss": 0.1286, "step": 99700 }, { "epoch": 1.884137357863322, "grad_norm": 0.032896533608436584, "learning_rate": 9.42068678931661e-05, "loss": 0.1288, "step": 99750 }, { "epoch": 1.885081787616637, "grad_norm": 0.0340246818959713, "learning_rate": 9.425408938083186e-05, "loss": 0.1285, "step": 99800 }, { "epoch": 1.886026217369952, "grad_norm": 0.031980834901332855, "learning_rate": 9.43013108684976e-05, "loss": 0.1291, "step": 99850 }, { "epoch": 1.886970647123267, "grad_norm": 0.031757574528455734, "learning_rate": 9.434853235616336e-05, "loss": 0.1291, "step": 99900 }, { "epoch": 1.887915076876582, "grad_norm": 0.03182145580649376, "learning_rate": 9.439575384382911e-05, "loss": 0.1288, "step": 99950 }, { "epoch": 1.8888595066298968, "grad_norm": 0.03457492217421532, "learning_rate": 9.444297533149484e-05, "loss": 0.1291, "step": 100000 }, { "epoch": 1.8888595066298968, "eval_IntDiv": 0.6743061801907743, "eval_NumCircles": 1804, "eval_SumBottleneck": 139.18799649352331, "eval_Uniqueness": 0.9962467031852302, "eval_Validity": 0.9858, "eval_Validity * Uniqueness": 0.9821, "eval_loss": 0.22128786146640778, "eval_runtime": 142.7392, "eval_samples_per_second": 70.058, "eval_steps_per_second": 0.553, "step": 100000 }, { "epoch": 1.889803936383212, "grad_norm": 0.0325089767575264, "learning_rate": 9.449019681916059e-05, "loss": 0.1291, "step": 100050 }, { "epoch": 1.8907483661365267, "grad_norm": 0.03152022510766983, "learning_rate": 9.453741830682634e-05, "loss": 0.129, "step": 100100 }, { "epoch": 1.8916927958898417, "grad_norm": 0.03236249089241028, "learning_rate": 9.458463979449209e-05, "loss": 0.1288, "step": 100150 }, { "epoch": 1.8926372256431567, "grad_norm": 0.030793968588113785, "learning_rate": 9.463186128215784e-05, "loss": 0.1289, "step": 100200 }, { "epoch": 1.8935816553964715, "grad_norm": 0.03210464119911194, "learning_rate": 9.46790827698236e-05, "loss": 0.1283, "step": 100250 }, { "epoch": 1.8945260851497867, "grad_norm": 0.03131192922592163, "learning_rate": 9.472630425748933e-05, "loss": 0.1289, "step": 100300 }, { "epoch": 1.8954705149031015, "grad_norm": 0.03122732974588871, "learning_rate": 9.477352574515508e-05, "loss": 0.1286, "step": 100350 }, { "epoch": 1.8964149446564165, "grad_norm": 0.03309931606054306, "learning_rate": 9.482074723282083e-05, "loss": 0.1285, "step": 100400 }, { "epoch": 1.8973593744097315, "grad_norm": 0.03190501779317856, "learning_rate": 9.486796872048658e-05, "loss": 0.1286, "step": 100450 }, { "epoch": 1.8983038041630462, "grad_norm": 0.031672220677137375, "learning_rate": 9.491519020815232e-05, "loss": 0.129, "step": 100500 }, { "epoch": 1.8992482339163614, "grad_norm": 0.033101778477430344, "learning_rate": 9.496241169581806e-05, "loss": 0.1289, "step": 100550 }, { "epoch": 1.9001926636696762, "grad_norm": 0.031027158722281456, "learning_rate": 9.500963318348382e-05, "loss": 0.1281, "step": 100600 }, { "epoch": 1.9011370934229912, "grad_norm": 0.031026804819703102, "learning_rate": 9.505685467114956e-05, "loss": 0.1288, "step": 100650 }, { "epoch": 1.9020815231763062, "grad_norm": 0.030612537637352943, "learning_rate": 9.510407615881531e-05, "loss": 0.1284, "step": 100700 }, { "epoch": 1.903025952929621, "grad_norm": 0.032488863915205, "learning_rate": 9.515129764648107e-05, "loss": 0.1289, "step": 100750 }, { "epoch": 1.9039703826829362, "grad_norm": 0.03325662761926651, "learning_rate": 9.51985191341468e-05, "loss": 0.1287, "step": 100800 }, { "epoch": 1.904914812436251, "grad_norm": 0.033667780458927155, "learning_rate": 9.524574062181255e-05, "loss": 0.1288, "step": 100850 }, { "epoch": 1.905859242189566, "grad_norm": 0.030815908685326576, "learning_rate": 9.52929621094783e-05, "loss": 0.1284, "step": 100900 }, { "epoch": 1.906803671942881, "grad_norm": 0.03072621487081051, "learning_rate": 9.534018359714404e-05, "loss": 0.1287, "step": 100950 }, { "epoch": 1.9077481016961957, "grad_norm": 0.03231118991971016, "learning_rate": 9.53874050848098e-05, "loss": 0.1289, "step": 101000 }, { "epoch": 1.908692531449511, "grad_norm": 0.032014451920986176, "learning_rate": 9.543462657247554e-05, "loss": 0.1286, "step": 101050 }, { "epoch": 1.9096369612028257, "grad_norm": 0.03190544992685318, "learning_rate": 9.54818480601413e-05, "loss": 0.1285, "step": 101100 }, { "epoch": 1.9105813909561407, "grad_norm": 0.032066527754068375, "learning_rate": 9.552906954780703e-05, "loss": 0.1291, "step": 101150 }, { "epoch": 1.9115258207094556, "grad_norm": 0.03224795684218407, "learning_rate": 9.557629103547279e-05, "loss": 0.1286, "step": 101200 }, { "epoch": 1.9124702504627704, "grad_norm": 0.032026659697294235, "learning_rate": 9.562351252313854e-05, "loss": 0.1287, "step": 101250 }, { "epoch": 1.9134146802160856, "grad_norm": 0.03577273339033127, "learning_rate": 9.567073401080428e-05, "loss": 0.1286, "step": 101300 }, { "epoch": 1.9143591099694004, "grad_norm": 0.031189359724521637, "learning_rate": 9.571795549847002e-05, "loss": 0.129, "step": 101350 }, { "epoch": 1.9153035397227154, "grad_norm": 0.03247307613492012, "learning_rate": 9.576517698613578e-05, "loss": 0.1283, "step": 101400 }, { "epoch": 1.9162479694760304, "grad_norm": 0.029580647125840187, "learning_rate": 9.581239847380152e-05, "loss": 0.1285, "step": 101450 }, { "epoch": 1.9171923992293454, "grad_norm": 0.03076835721731186, "learning_rate": 9.585961996146727e-05, "loss": 0.1281, "step": 101500 }, { "epoch": 1.9181368289826604, "grad_norm": 0.03275373578071594, "learning_rate": 9.590684144913303e-05, "loss": 0.1284, "step": 101550 }, { "epoch": 1.9190812587359751, "grad_norm": 0.030566567555069923, "learning_rate": 9.595406293679877e-05, "loss": 0.1287, "step": 101600 }, { "epoch": 1.9200256884892901, "grad_norm": 0.030883299186825752, "learning_rate": 9.600128442446451e-05, "loss": 0.1284, "step": 101650 }, { "epoch": 1.920970118242605, "grad_norm": 0.03114418126642704, "learning_rate": 9.604850591213026e-05, "loss": 0.1285, "step": 101700 }, { "epoch": 1.92191454799592, "grad_norm": 0.032511983066797256, "learning_rate": 9.6095727399796e-05, "loss": 0.1284, "step": 101750 }, { "epoch": 1.922858977749235, "grad_norm": 0.030889932066202164, "learning_rate": 9.614294888746176e-05, "loss": 0.129, "step": 101800 }, { "epoch": 1.9238034075025499, "grad_norm": 0.030872337520122528, "learning_rate": 9.61901703751275e-05, "loss": 0.1285, "step": 101850 }, { "epoch": 1.924747837255865, "grad_norm": 0.03334726765751839, "learning_rate": 9.623739186279325e-05, "loss": 0.1285, "step": 101900 }, { "epoch": 1.9256922670091798, "grad_norm": 0.03152294456958771, "learning_rate": 9.628461335045899e-05, "loss": 0.1283, "step": 101950 }, { "epoch": 1.9266366967624948, "grad_norm": 0.030257461592555046, "learning_rate": 9.633183483812475e-05, "loss": 0.1285, "step": 102000 }, { "epoch": 1.9275811265158098, "grad_norm": 0.032155513763427734, "learning_rate": 9.63790563257905e-05, "loss": 0.1283, "step": 102050 }, { "epoch": 1.9285255562691246, "grad_norm": 0.031235361471772194, "learning_rate": 9.642627781345624e-05, "loss": 0.1284, "step": 102100 }, { "epoch": 1.9294699860224398, "grad_norm": 0.032510943710803986, "learning_rate": 9.647349930112198e-05, "loss": 0.1285, "step": 102150 }, { "epoch": 1.9304144157757546, "grad_norm": 0.031020887196063995, "learning_rate": 9.652072078878774e-05, "loss": 0.1288, "step": 102200 }, { "epoch": 1.9313588455290696, "grad_norm": 0.03475572541356087, "learning_rate": 9.656794227645348e-05, "loss": 0.1281, "step": 102250 }, { "epoch": 1.9323032752823845, "grad_norm": 0.03335932269692421, "learning_rate": 9.661516376411923e-05, "loss": 0.1287, "step": 102300 }, { "epoch": 1.9332477050356993, "grad_norm": 0.03218882158398628, "learning_rate": 9.666238525178499e-05, "loss": 0.1288, "step": 102350 }, { "epoch": 1.9341921347890145, "grad_norm": 0.032306648790836334, "learning_rate": 9.670960673945073e-05, "loss": 0.1284, "step": 102400 }, { "epoch": 1.9351365645423293, "grad_norm": 0.03255116194486618, "learning_rate": 9.675682822711647e-05, "loss": 0.1286, "step": 102450 }, { "epoch": 1.9360809942956443, "grad_norm": 0.031585562974214554, "learning_rate": 9.680404971478222e-05, "loss": 0.1285, "step": 102500 }, { "epoch": 1.9360809942956443, "eval_IntDiv": 0.6759120235585525, "eval_NumCircles": 1816, "eval_SumBottleneck": 125.15657362646701, "eval_Uniqueness": 0.9975661697596593, "eval_Validity": 0.9861, "eval_Validity * Uniqueness": 0.9837, "eval_loss": 0.21980594098567963, "eval_runtime": 171.0924, "eval_samples_per_second": 58.448, "eval_steps_per_second": 0.462, "step": 102500 }, { "epoch": 1.9370254240489593, "grad_norm": 0.031136535108089447, "learning_rate": 9.685127120244796e-05, "loss": 0.1286, "step": 102550 }, { "epoch": 1.937969853802274, "grad_norm": 0.032396815717220306, "learning_rate": 9.689849269011372e-05, "loss": 0.1285, "step": 102600 }, { "epoch": 1.9389142835555893, "grad_norm": 0.0332774892449379, "learning_rate": 9.694571417777946e-05, "loss": 0.1283, "step": 102650 }, { "epoch": 1.939858713308904, "grad_norm": 0.030227508395910263, "learning_rate": 9.699293566544521e-05, "loss": 0.1283, "step": 102700 }, { "epoch": 1.940803143062219, "grad_norm": 0.03064686246216297, "learning_rate": 9.704015715311095e-05, "loss": 0.1287, "step": 102750 }, { "epoch": 1.941747572815534, "grad_norm": 0.03143608197569847, "learning_rate": 9.70873786407767e-05, "loss": 0.1285, "step": 102800 }, { "epoch": 1.9426920025688488, "grad_norm": 0.030528616160154343, "learning_rate": 9.713460012844246e-05, "loss": 0.1284, "step": 102850 }, { "epoch": 1.943636432322164, "grad_norm": 0.03008735179901123, "learning_rate": 9.71818216161082e-05, "loss": 0.1284, "step": 102900 }, { "epoch": 1.9445808620754788, "grad_norm": 0.031211763620376587, "learning_rate": 9.722904310377394e-05, "loss": 0.1287, "step": 102950 }, { "epoch": 1.9455252918287937, "grad_norm": 0.0312972292304039, "learning_rate": 9.72762645914397e-05, "loss": 0.1287, "step": 103000 }, { "epoch": 1.9464697215821087, "grad_norm": 0.03230850026011467, "learning_rate": 9.732348607910544e-05, "loss": 0.1287, "step": 103050 }, { "epoch": 1.9474141513354237, "grad_norm": 0.03144695609807968, "learning_rate": 9.737070756677119e-05, "loss": 0.1285, "step": 103100 }, { "epoch": 1.9483585810887387, "grad_norm": 0.034094564616680145, "learning_rate": 9.741792905443694e-05, "loss": 0.1284, "step": 103150 }, { "epoch": 1.9493030108420535, "grad_norm": 0.03339524567127228, "learning_rate": 9.746515054210269e-05, "loss": 0.1284, "step": 103200 }, { "epoch": 1.9502474405953685, "grad_norm": 0.03027011640369892, "learning_rate": 9.751237202976843e-05, "loss": 0.1282, "step": 103250 }, { "epoch": 1.9511918703486835, "grad_norm": 0.031145894899964333, "learning_rate": 9.755959351743418e-05, "loss": 0.1279, "step": 103300 }, { "epoch": 1.9521363001019985, "grad_norm": 0.03161751478910446, "learning_rate": 9.760681500509993e-05, "loss": 0.1285, "step": 103350 }, { "epoch": 1.9530807298553134, "grad_norm": 0.030371012166142464, "learning_rate": 9.765403649276567e-05, "loss": 0.1288, "step": 103400 }, { "epoch": 1.9540251596086282, "grad_norm": 0.030944732949137688, "learning_rate": 9.770125798043142e-05, "loss": 0.1289, "step": 103450 }, { "epoch": 1.9549695893619432, "grad_norm": 0.03380543738603592, "learning_rate": 9.774847946809717e-05, "loss": 0.1285, "step": 103500 }, { "epoch": 1.9559140191152582, "grad_norm": 0.031203528866171837, "learning_rate": 9.779570095576291e-05, "loss": 0.1281, "step": 103550 }, { "epoch": 1.9568584488685732, "grad_norm": 0.032017335295677185, "learning_rate": 9.784292244342866e-05, "loss": 0.1287, "step": 103600 }, { "epoch": 1.9578028786218882, "grad_norm": 0.03075268119573593, "learning_rate": 9.789014393109442e-05, "loss": 0.1285, "step": 103650 }, { "epoch": 1.958747308375203, "grad_norm": 0.030344190075993538, "learning_rate": 9.793736541876015e-05, "loss": 0.128, "step": 103700 }, { "epoch": 1.9596917381285182, "grad_norm": 0.03319081291556358, "learning_rate": 9.79845869064259e-05, "loss": 0.1284, "step": 103750 }, { "epoch": 1.960636167881833, "grad_norm": 0.03129640966653824, "learning_rate": 9.803180839409165e-05, "loss": 0.128, "step": 103800 }, { "epoch": 1.961580597635148, "grad_norm": 0.030710792168974876, "learning_rate": 9.80790298817574e-05, "loss": 0.1281, "step": 103850 }, { "epoch": 1.962525027388463, "grad_norm": 0.029974179342389107, "learning_rate": 9.812625136942315e-05, "loss": 0.1283, "step": 103900 }, { "epoch": 1.9634694571417777, "grad_norm": 0.03194688633084297, "learning_rate": 9.81734728570889e-05, "loss": 0.1286, "step": 103950 }, { "epoch": 1.9644138868950929, "grad_norm": 0.030003881081938744, "learning_rate": 9.822069434475464e-05, "loss": 0.1283, "step": 104000 }, { "epoch": 1.9653583166484077, "grad_norm": 0.031517744064331055, "learning_rate": 9.826791583242038e-05, "loss": 0.1282, "step": 104050 }, { "epoch": 1.9663027464017226, "grad_norm": 0.03278505429625511, "learning_rate": 9.831513732008614e-05, "loss": 0.1283, "step": 104100 }, { "epoch": 1.9672471761550376, "grad_norm": 0.03307149186730385, "learning_rate": 9.836235880775189e-05, "loss": 0.1284, "step": 104150 }, { "epoch": 1.9681916059083524, "grad_norm": 0.03273303061723709, "learning_rate": 9.840958029541763e-05, "loss": 0.1282, "step": 104200 }, { "epoch": 1.9691360356616676, "grad_norm": 0.030647989362478256, "learning_rate": 9.845680178308337e-05, "loss": 0.1286, "step": 104250 }, { "epoch": 1.9700804654149824, "grad_norm": 0.03141530603170395, "learning_rate": 9.850402327074913e-05, "loss": 0.1282, "step": 104300 }, { "epoch": 1.9710248951682974, "grad_norm": 0.031366102397441864, "learning_rate": 9.855124475841487e-05, "loss": 0.128, "step": 104350 }, { "epoch": 1.9719693249216124, "grad_norm": 0.031711168587207794, "learning_rate": 9.859846624608062e-05, "loss": 0.1283, "step": 104400 }, { "epoch": 1.9729137546749271, "grad_norm": 0.03180047497153282, "learning_rate": 9.864568773374638e-05, "loss": 0.128, "step": 104450 }, { "epoch": 1.9738581844282423, "grad_norm": 0.03191027417778969, "learning_rate": 9.86929092214121e-05, "loss": 0.1281, "step": 104500 }, { "epoch": 1.9748026141815571, "grad_norm": 0.03321731463074684, "learning_rate": 9.874013070907786e-05, "loss": 0.1284, "step": 104550 }, { "epoch": 1.975747043934872, "grad_norm": 0.031075885519385338, "learning_rate": 9.878735219674361e-05, "loss": 0.1288, "step": 104600 }, { "epoch": 1.976691473688187, "grad_norm": 0.031180303543806076, "learning_rate": 9.883457368440935e-05, "loss": 0.1282, "step": 104650 }, { "epoch": 1.9776359034415019, "grad_norm": 0.03217089921236038, "learning_rate": 9.888179517207511e-05, "loss": 0.1283, "step": 104700 }, { "epoch": 1.978580333194817, "grad_norm": 0.03102269023656845, "learning_rate": 9.892901665974086e-05, "loss": 0.1281, "step": 104750 }, { "epoch": 1.9795247629481318, "grad_norm": 0.03151198476552963, "learning_rate": 9.89762381474066e-05, "loss": 0.1283, "step": 104800 }, { "epoch": 1.9804691927014468, "grad_norm": 0.03256242722272873, "learning_rate": 9.902345963507234e-05, "loss": 0.1282, "step": 104850 }, { "epoch": 1.9814136224547618, "grad_norm": 0.030599094927310944, "learning_rate": 9.90706811227381e-05, "loss": 0.1282, "step": 104900 }, { "epoch": 1.9823580522080768, "grad_norm": 0.0326649472117424, "learning_rate": 9.911790261040385e-05, "loss": 0.1284, "step": 104950 }, { "epoch": 1.9833024819613918, "grad_norm": 0.03007500059902668, "learning_rate": 9.916512409806959e-05, "loss": 0.1281, "step": 105000 }, { "epoch": 1.9833024819613918, "eval_IntDiv": 0.6759186923725939, "eval_NumCircles": 1861, "eval_SumBottleneck": 137.85493109307512, "eval_Uniqueness": 0.995020325203252, "eval_Validity": 0.984, "eval_Validity * Uniqueness": 0.9791, "eval_loss": 0.21944665908813477, "eval_runtime": 155.0682, "eval_samples_per_second": 64.488, "eval_steps_per_second": 0.509, "step": 105000 }, { "epoch": 1.9842469117147066, "grad_norm": 0.03170621395111084, "learning_rate": 9.921234558573533e-05, "loss": 0.1284, "step": 105050 }, { "epoch": 1.9851913414680216, "grad_norm": 0.03468237444758415, "learning_rate": 9.925956707340109e-05, "loss": 0.1285, "step": 105100 }, { "epoch": 1.9861357712213366, "grad_norm": 0.03189409151673317, "learning_rate": 9.930678856106683e-05, "loss": 0.1282, "step": 105150 }, { "epoch": 1.9870802009746515, "grad_norm": 0.031356412917375565, "learning_rate": 9.935401004873258e-05, "loss": 0.1283, "step": 105200 }, { "epoch": 1.9880246307279665, "grad_norm": 0.030180856585502625, "learning_rate": 9.940123153639834e-05, "loss": 0.1282, "step": 105250 }, { "epoch": 1.9889690604812813, "grad_norm": 0.031230801716446877, "learning_rate": 9.944845302406406e-05, "loss": 0.1281, "step": 105300 }, { "epoch": 1.9899134902345965, "grad_norm": 0.029161296784877777, "learning_rate": 9.949567451172982e-05, "loss": 0.1285, "step": 105350 }, { "epoch": 1.9908579199879113, "grad_norm": 0.031987473368644714, "learning_rate": 9.954289599939557e-05, "loss": 0.1283, "step": 105400 }, { "epoch": 1.9918023497412263, "grad_norm": 0.029123231768608093, "learning_rate": 9.959011748706131e-05, "loss": 0.1281, "step": 105450 }, { "epoch": 1.9927467794945413, "grad_norm": 0.029776757583022118, "learning_rate": 9.963733897472707e-05, "loss": 0.128, "step": 105500 }, { "epoch": 1.993691209247856, "grad_norm": 0.030581964179873466, "learning_rate": 9.968456046239282e-05, "loss": 0.128, "step": 105550 }, { "epoch": 1.9946356390011712, "grad_norm": 0.030468670651316643, "learning_rate": 9.973178195005856e-05, "loss": 0.1281, "step": 105600 }, { "epoch": 1.995580068754486, "grad_norm": 0.030483776703476906, "learning_rate": 9.97790034377243e-05, "loss": 0.1281, "step": 105650 }, { "epoch": 1.996524498507801, "grad_norm": 0.032915446907281876, "learning_rate": 9.982622492539006e-05, "loss": 0.1283, "step": 105700 }, { "epoch": 1.997468928261116, "grad_norm": 0.03299493342638016, "learning_rate": 9.987344641305581e-05, "loss": 0.1282, "step": 105750 }, { "epoch": 1.9984133580144308, "grad_norm": 0.03074507787823677, "learning_rate": 9.992066790072155e-05, "loss": 0.1283, "step": 105800 }, { "epoch": 1.999357787767746, "grad_norm": 0.031508225947618484, "learning_rate": 9.996788938838729e-05, "loss": 0.1283, "step": 105850 }, { "epoch": 2.0003022175210607, "grad_norm": 0.03270776942372322, "learning_rate": 9.99983210137719e-05, "loss": 0.128, "step": 105900 }, { "epoch": 2.0012466472743755, "grad_norm": 0.02954925037920475, "learning_rate": 9.999307418180903e-05, "loss": 0.128, "step": 105950 }, { "epoch": 2.0021910770276907, "grad_norm": 0.032797809690237045, "learning_rate": 9.998782734984616e-05, "loss": 0.1279, "step": 106000 }, { "epoch": 2.0031355067810055, "grad_norm": 0.03156310319900513, "learning_rate": 9.998258051788331e-05, "loss": 0.1282, "step": 106050 }, { "epoch": 2.0040799365343207, "grad_norm": 0.030284004285931587, "learning_rate": 9.997733368592044e-05, "loss": 0.1284, "step": 106100 }, { "epoch": 2.0050243662876355, "grad_norm": 0.03082447685301304, "learning_rate": 9.997208685395758e-05, "loss": 0.1284, "step": 106150 }, { "epoch": 2.0059687960409507, "grad_norm": 0.03188361972570419, "learning_rate": 9.996684002199472e-05, "loss": 0.1279, "step": 106200 }, { "epoch": 2.0069132257942655, "grad_norm": 0.030592627823352814, "learning_rate": 9.996159319003187e-05, "loss": 0.1278, "step": 106250 }, { "epoch": 2.0078576555475802, "grad_norm": 0.03397824615240097, "learning_rate": 9.995634635806899e-05, "loss": 0.1283, "step": 106300 }, { "epoch": 2.0088020853008954, "grad_norm": 0.029781833291053772, "learning_rate": 9.995109952610614e-05, "loss": 0.1282, "step": 106350 }, { "epoch": 2.00974651505421, "grad_norm": 0.03163611516356468, "learning_rate": 9.994585269414329e-05, "loss": 0.128, "step": 106400 }, { "epoch": 2.0106909448075254, "grad_norm": 0.030900411307811737, "learning_rate": 9.994060586218042e-05, "loss": 0.1282, "step": 106450 }, { "epoch": 2.01163537456084, "grad_norm": 0.03239472210407257, "learning_rate": 9.993535903021755e-05, "loss": 0.1275, "step": 106500 }, { "epoch": 2.012579804314155, "grad_norm": 0.031129390001296997, "learning_rate": 9.99301121982547e-05, "loss": 0.1284, "step": 106550 }, { "epoch": 2.01352423406747, "grad_norm": 0.03226134181022644, "learning_rate": 9.992486536629184e-05, "loss": 0.128, "step": 106600 }, { "epoch": 2.014468663820785, "grad_norm": 0.03175993636250496, "learning_rate": 9.991961853432897e-05, "loss": 0.1276, "step": 106650 }, { "epoch": 2.0154130935741, "grad_norm": 0.030258111655712128, "learning_rate": 9.991437170236612e-05, "loss": 0.1274, "step": 106700 }, { "epoch": 2.016357523327415, "grad_norm": 0.030759736895561218, "learning_rate": 9.990912487040326e-05, "loss": 0.1278, "step": 106750 }, { "epoch": 2.0173019530807297, "grad_norm": 0.031528763473033905, "learning_rate": 9.990387803844039e-05, "loss": 0.1281, "step": 106800 }, { "epoch": 2.018246382834045, "grad_norm": 0.03222572058439255, "learning_rate": 9.989863120647753e-05, "loss": 0.1279, "step": 106850 }, { "epoch": 2.0191908125873597, "grad_norm": 0.031606752425432205, "learning_rate": 9.989338437451468e-05, "loss": 0.1281, "step": 106900 }, { "epoch": 2.020135242340675, "grad_norm": 0.032157402485609055, "learning_rate": 9.988813754255181e-05, "loss": 0.1277, "step": 106950 }, { "epoch": 2.0210796720939896, "grad_norm": 0.031891368329524994, "learning_rate": 9.988289071058895e-05, "loss": 0.1281, "step": 107000 }, { "epoch": 2.0220241018473044, "grad_norm": 0.033382877707481384, "learning_rate": 9.98776438786261e-05, "loss": 0.1278, "step": 107050 }, { "epoch": 2.0229685316006196, "grad_norm": 0.03718525916337967, "learning_rate": 9.987239704666323e-05, "loss": 0.128, "step": 107100 }, { "epoch": 2.0239129613539344, "grad_norm": 0.03011896274983883, "learning_rate": 9.986715021470036e-05, "loss": 0.1275, "step": 107150 }, { "epoch": 2.0248573911072496, "grad_norm": 0.03114982321858406, "learning_rate": 9.986190338273751e-05, "loss": 0.1273, "step": 107200 }, { "epoch": 2.0258018208605644, "grad_norm": 0.02968214824795723, "learning_rate": 9.985665655077466e-05, "loss": 0.1278, "step": 107250 }, { "epoch": 2.026746250613879, "grad_norm": 0.03396786004304886, "learning_rate": 9.985140971881178e-05, "loss": 0.1278, "step": 107300 }, { "epoch": 2.0276906803671944, "grad_norm": 0.030438421294093132, "learning_rate": 9.984616288684893e-05, "loss": 0.1276, "step": 107350 }, { "epoch": 2.028635110120509, "grad_norm": 0.031969599425792694, "learning_rate": 9.984091605488607e-05, "loss": 0.1281, "step": 107400 }, { "epoch": 2.0295795398738243, "grad_norm": 0.03244292363524437, "learning_rate": 9.98356692229232e-05, "loss": 0.1275, "step": 107450 }, { "epoch": 2.030523969627139, "grad_norm": 0.03134356066584587, "learning_rate": 9.983042239096034e-05, "loss": 0.128, "step": 107500 }, { "epoch": 2.030523969627139, "eval_IntDiv": 0.6749105449313759, "eval_NumCircles": 1842, "eval_SumBottleneck": 126.75180840114035, "eval_Uniqueness": 0.9972608298670995, "eval_Validity": 0.9857, "eval_Validity * Uniqueness": 0.983, "eval_loss": 0.22094513475894928, "eval_runtime": 165.9901, "eval_samples_per_second": 60.245, "eval_steps_per_second": 0.476, "step": 107500 }, { "epoch": 2.031468399380454, "grad_norm": 0.03156000375747681, "learning_rate": 9.982517555899749e-05, "loss": 0.1277, "step": 107550 }, { "epoch": 2.032412829133769, "grad_norm": 0.029780549928545952, "learning_rate": 9.981992872703462e-05, "loss": 0.1276, "step": 107600 }, { "epoch": 2.033357258887084, "grad_norm": 0.030690845102071762, "learning_rate": 9.981468189507176e-05, "loss": 0.1277, "step": 107650 }, { "epoch": 2.034301688640399, "grad_norm": 0.03388810530304909, "learning_rate": 9.98094350631089e-05, "loss": 0.1275, "step": 107700 }, { "epoch": 2.035246118393714, "grad_norm": 0.031045276671648026, "learning_rate": 9.980418823114604e-05, "loss": 0.1277, "step": 107750 }, { "epoch": 2.0361905481470286, "grad_norm": 0.032489486038684845, "learning_rate": 9.979894139918317e-05, "loss": 0.1276, "step": 107800 }, { "epoch": 2.037134977900344, "grad_norm": 0.03224669024348259, "learning_rate": 9.979369456722032e-05, "loss": 0.1277, "step": 107850 }, { "epoch": 2.0380794076536586, "grad_norm": 0.03145352378487587, "learning_rate": 9.978844773525745e-05, "loss": 0.1277, "step": 107900 }, { "epoch": 2.039023837406974, "grad_norm": 0.030292874202132225, "learning_rate": 9.978320090329459e-05, "loss": 0.1277, "step": 107950 }, { "epoch": 2.0399682671602886, "grad_norm": 0.03224615007638931, "learning_rate": 9.977795407133173e-05, "loss": 0.1277, "step": 108000 }, { "epoch": 2.0409126969136038, "grad_norm": 0.030627965927124023, "learning_rate": 9.977270723936888e-05, "loss": 0.1279, "step": 108050 }, { "epoch": 2.0418571266669185, "grad_norm": 0.03157993033528328, "learning_rate": 9.976746040740602e-05, "loss": 0.1274, "step": 108100 }, { "epoch": 2.0428015564202333, "grad_norm": 0.03173212707042694, "learning_rate": 9.976221357544315e-05, "loss": 0.1276, "step": 108150 }, { "epoch": 2.0437459861735485, "grad_norm": 0.032537464052438736, "learning_rate": 9.97569667434803e-05, "loss": 0.1274, "step": 108200 }, { "epoch": 2.0446904159268633, "grad_norm": 0.03172621503472328, "learning_rate": 9.975171991151743e-05, "loss": 0.1277, "step": 108250 }, { "epoch": 2.0456348456801785, "grad_norm": 0.031581975519657135, "learning_rate": 9.974647307955456e-05, "loss": 0.1276, "step": 108300 }, { "epoch": 2.0465792754334933, "grad_norm": 0.0315680168569088, "learning_rate": 9.974122624759171e-05, "loss": 0.1279, "step": 108350 }, { "epoch": 2.047523705186808, "grad_norm": 0.030431771650910378, "learning_rate": 9.973597941562885e-05, "loss": 0.1278, "step": 108400 }, { "epoch": 2.0484681349401233, "grad_norm": 0.030450956895947456, "learning_rate": 9.973073258366598e-05, "loss": 0.1273, "step": 108450 }, { "epoch": 2.049412564693438, "grad_norm": 0.03603486344218254, "learning_rate": 9.972548575170313e-05, "loss": 0.1279, "step": 108500 }, { "epoch": 2.0503569944467532, "grad_norm": 0.030933473259210587, "learning_rate": 9.972023891974026e-05, "loss": 0.128, "step": 108550 }, { "epoch": 2.051301424200068, "grad_norm": 0.031134510412812233, "learning_rate": 9.971499208777741e-05, "loss": 0.1277, "step": 108600 }, { "epoch": 2.0522458539533828, "grad_norm": 0.032212257385253906, "learning_rate": 9.970974525581454e-05, "loss": 0.1276, "step": 108650 }, { "epoch": 2.053190283706698, "grad_norm": 0.03120744228363037, "learning_rate": 9.970449842385168e-05, "loss": 0.1275, "step": 108700 }, { "epoch": 2.0541347134600128, "grad_norm": 0.040439531207084656, "learning_rate": 9.969925159188882e-05, "loss": 0.1277, "step": 108750 }, { "epoch": 2.055079143213328, "grad_norm": 0.03126702830195427, "learning_rate": 9.969400475992596e-05, "loss": 0.1278, "step": 108800 }, { "epoch": 2.0560235729666427, "grad_norm": 0.030931178480386734, "learning_rate": 9.96887579279631e-05, "loss": 0.1275, "step": 108850 }, { "epoch": 2.0569680027199575, "grad_norm": 0.031455181539058685, "learning_rate": 9.968351109600024e-05, "loss": 0.1279, "step": 108900 }, { "epoch": 2.0579124324732727, "grad_norm": 0.030301764607429504, "learning_rate": 9.967826426403737e-05, "loss": 0.1276, "step": 108950 }, { "epoch": 2.0588568622265875, "grad_norm": 0.029773209244012833, "learning_rate": 9.967301743207452e-05, "loss": 0.1274, "step": 109000 }, { "epoch": 2.0598012919799027, "grad_norm": 0.03431079909205437, "learning_rate": 9.966777060011165e-05, "loss": 0.1278, "step": 109050 }, { "epoch": 2.0607457217332175, "grad_norm": 0.030635753646492958, "learning_rate": 9.96625237681488e-05, "loss": 0.1276, "step": 109100 }, { "epoch": 2.0616901514865322, "grad_norm": 0.029895437881350517, "learning_rate": 9.965727693618594e-05, "loss": 0.1279, "step": 109150 }, { "epoch": 2.0626345812398474, "grad_norm": 0.030125219374895096, "learning_rate": 9.965203010422307e-05, "loss": 0.1276, "step": 109200 }, { "epoch": 2.063579010993162, "grad_norm": 0.030766785144805908, "learning_rate": 9.964678327226022e-05, "loss": 0.1272, "step": 109250 }, { "epoch": 2.0645234407464774, "grad_norm": 0.030363690108060837, "learning_rate": 9.964153644029735e-05, "loss": 0.1278, "step": 109300 }, { "epoch": 2.065467870499792, "grad_norm": 0.03088587522506714, "learning_rate": 9.963628960833449e-05, "loss": 0.1276, "step": 109350 }, { "epoch": 2.066412300253107, "grad_norm": 0.029841002076864243, "learning_rate": 9.963104277637163e-05, "loss": 0.1275, "step": 109400 }, { "epoch": 2.067356730006422, "grad_norm": 0.030565431341528893, "learning_rate": 9.962579594440877e-05, "loss": 0.1275, "step": 109450 }, { "epoch": 2.068301159759737, "grad_norm": 0.03151451796293259, "learning_rate": 9.96205491124459e-05, "loss": 0.1275, "step": 109500 }, { "epoch": 2.069245589513052, "grad_norm": 0.03095455840229988, "learning_rate": 9.961530228048305e-05, "loss": 0.1274, "step": 109550 }, { "epoch": 2.070190019266367, "grad_norm": 0.031233634799718857, "learning_rate": 9.96100554485202e-05, "loss": 0.1272, "step": 109600 }, { "epoch": 2.0711344490196817, "grad_norm": 0.03180794417858124, "learning_rate": 9.960480861655733e-05, "loss": 0.1279, "step": 109650 }, { "epoch": 2.072078878772997, "grad_norm": 0.031484320759773254, "learning_rate": 9.959956178459446e-05, "loss": 0.1274, "step": 109700 }, { "epoch": 2.0730233085263117, "grad_norm": 0.03033544309437275, "learning_rate": 9.959431495263161e-05, "loss": 0.1275, "step": 109750 }, { "epoch": 2.073967738279627, "grad_norm": 0.03152722120285034, "learning_rate": 9.958906812066874e-05, "loss": 0.1276, "step": 109800 }, { "epoch": 2.0749121680329417, "grad_norm": 0.03036566451191902, "learning_rate": 9.958382128870588e-05, "loss": 0.1278, "step": 109850 }, { "epoch": 2.075856597786257, "grad_norm": 0.03138386458158493, "learning_rate": 9.957857445674303e-05, "loss": 0.1273, "step": 109900 }, { "epoch": 2.0768010275395716, "grad_norm": 0.029914850369095802, "learning_rate": 9.957332762478016e-05, "loss": 0.1274, "step": 109950 }, { "epoch": 2.0777454572928864, "grad_norm": 0.03165780380368233, "learning_rate": 9.95680807928173e-05, "loss": 0.1276, "step": 110000 }, { "epoch": 2.0777454572928864, "eval_IntDiv": 0.674912022821093, "eval_NumCircles": 1802, "eval_SumBottleneck": 140.5363179417604, "eval_Uniqueness": 0.9967568663220837, "eval_Validity": 0.9867, "eval_Validity * Uniqueness": 0.9835, "eval_loss": 0.21939074993133545, "eval_runtime": 152.7536, "eval_samples_per_second": 65.465, "eval_steps_per_second": 0.517, "step": 110000 }, { "epoch": 2.0786898870462016, "grad_norm": 0.030047722160816193, "learning_rate": 9.956283396085444e-05, "loss": 0.1272, "step": 110050 }, { "epoch": 2.0796343167995164, "grad_norm": 0.0321236290037632, "learning_rate": 9.955758712889159e-05, "loss": 0.1273, "step": 110100 }, { "epoch": 2.0805787465528316, "grad_norm": 0.030221659690141678, "learning_rate": 9.955234029692871e-05, "loss": 0.1272, "step": 110150 }, { "epoch": 2.0815231763061464, "grad_norm": 0.0302255991846323, "learning_rate": 9.954709346496586e-05, "loss": 0.1276, "step": 110200 }, { "epoch": 2.082467606059461, "grad_norm": 0.03290421888232231, "learning_rate": 9.9541846633003e-05, "loss": 0.1275, "step": 110250 }, { "epoch": 2.0834120358127763, "grad_norm": 0.03150339052081108, "learning_rate": 9.953659980104014e-05, "loss": 0.1272, "step": 110300 }, { "epoch": 2.084356465566091, "grad_norm": 0.030869511887431145, "learning_rate": 9.953135296907727e-05, "loss": 0.1274, "step": 110350 }, { "epoch": 2.0853008953194063, "grad_norm": 0.03139565512537956, "learning_rate": 9.952610613711442e-05, "loss": 0.1272, "step": 110400 }, { "epoch": 2.086245325072721, "grad_norm": 0.034078408032655716, "learning_rate": 9.952085930515155e-05, "loss": 0.1273, "step": 110450 }, { "epoch": 2.087189754826036, "grad_norm": 0.03308840095996857, "learning_rate": 9.951561247318869e-05, "loss": 0.1276, "step": 110500 }, { "epoch": 2.088134184579351, "grad_norm": 0.031203461810946465, "learning_rate": 9.951036564122583e-05, "loss": 0.1273, "step": 110550 }, { "epoch": 2.089078614332666, "grad_norm": 0.030895423144102097, "learning_rate": 9.950511880926298e-05, "loss": 0.1279, "step": 110600 }, { "epoch": 2.090023044085981, "grad_norm": 0.030569950118660927, "learning_rate": 9.94998719773001e-05, "loss": 0.1275, "step": 110650 }, { "epoch": 2.090967473839296, "grad_norm": 0.030348218977451324, "learning_rate": 9.949462514533725e-05, "loss": 0.1278, "step": 110700 }, { "epoch": 2.0919119035926106, "grad_norm": 0.030427666381001472, "learning_rate": 9.94893783133744e-05, "loss": 0.1271, "step": 110750 }, { "epoch": 2.092856333345926, "grad_norm": 0.030752841383218765, "learning_rate": 9.948413148141152e-05, "loss": 0.1274, "step": 110800 }, { "epoch": 2.0938007630992406, "grad_norm": 0.03096630610525608, "learning_rate": 9.947888464944867e-05, "loss": 0.1274, "step": 110850 }, { "epoch": 2.094745192852556, "grad_norm": 0.030976982787251472, "learning_rate": 9.947363781748581e-05, "loss": 0.1282, "step": 110900 }, { "epoch": 2.0956896226058706, "grad_norm": 0.03303275629878044, "learning_rate": 9.946839098552295e-05, "loss": 0.1274, "step": 110950 }, { "epoch": 2.0966340523591853, "grad_norm": 0.03143987059593201, "learning_rate": 9.946314415356008e-05, "loss": 0.1279, "step": 111000 }, { "epoch": 2.0975784821125005, "grad_norm": 0.032130297273397446, "learning_rate": 9.945789732159723e-05, "loss": 0.1275, "step": 111050 }, { "epoch": 2.0985229118658153, "grad_norm": 0.03030380792915821, "learning_rate": 9.945265048963436e-05, "loss": 0.1271, "step": 111100 }, { "epoch": 2.0994673416191305, "grad_norm": 0.030696799978613853, "learning_rate": 9.94474036576715e-05, "loss": 0.1275, "step": 111150 }, { "epoch": 2.1004117713724453, "grad_norm": 0.034175511449575424, "learning_rate": 9.944215682570864e-05, "loss": 0.1274, "step": 111200 }, { "epoch": 2.1013562011257605, "grad_norm": 0.03142855316400528, "learning_rate": 9.943690999374579e-05, "loss": 0.1273, "step": 111250 }, { "epoch": 2.1023006308790753, "grad_norm": 0.03163035586476326, "learning_rate": 9.943166316178291e-05, "loss": 0.1276, "step": 111300 }, { "epoch": 2.10324506063239, "grad_norm": 0.0320865623652935, "learning_rate": 9.942641632982006e-05, "loss": 0.1275, "step": 111350 }, { "epoch": 2.1041894903857052, "grad_norm": 0.030937623232603073, "learning_rate": 9.94211694978572e-05, "loss": 0.128, "step": 111400 }, { "epoch": 2.10513392013902, "grad_norm": 0.03208814188838005, "learning_rate": 9.941592266589434e-05, "loss": 0.1269, "step": 111450 }, { "epoch": 2.106078349892335, "grad_norm": 0.030605565756559372, "learning_rate": 9.941067583393147e-05, "loss": 0.1276, "step": 111500 }, { "epoch": 2.10702277964565, "grad_norm": 0.03072093427181244, "learning_rate": 9.940542900196862e-05, "loss": 0.1272, "step": 111550 }, { "epoch": 2.1079672093989648, "grad_norm": 0.03066159039735794, "learning_rate": 9.940018217000576e-05, "loss": 0.1277, "step": 111600 }, { "epoch": 2.10891163915228, "grad_norm": 0.03098146803677082, "learning_rate": 9.939493533804289e-05, "loss": 0.1275, "step": 111650 }, { "epoch": 2.1098560689055947, "grad_norm": 0.029735835269093513, "learning_rate": 9.938968850608004e-05, "loss": 0.1272, "step": 111700 }, { "epoch": 2.11080049865891, "grad_norm": 0.03141288086771965, "learning_rate": 9.938444167411717e-05, "loss": 0.127, "step": 111750 }, { "epoch": 2.1117449284122247, "grad_norm": 0.030705709010362625, "learning_rate": 9.93791948421543e-05, "loss": 0.1275, "step": 111800 }, { "epoch": 2.1126893581655395, "grad_norm": 0.029928697273135185, "learning_rate": 9.937394801019145e-05, "loss": 0.1271, "step": 111850 }, { "epoch": 2.1136337879188547, "grad_norm": 0.030462687835097313, "learning_rate": 9.936870117822859e-05, "loss": 0.1278, "step": 111900 }, { "epoch": 2.1145782176721695, "grad_norm": 0.03161010891199112, "learning_rate": 9.936345434626573e-05, "loss": 0.1272, "step": 111950 }, { "epoch": 2.1155226474254847, "grad_norm": 0.03300702944397926, "learning_rate": 9.935820751430287e-05, "loss": 0.1269, "step": 112000 }, { "epoch": 2.1164670771787994, "grad_norm": 0.030708275735378265, "learning_rate": 9.935296068234001e-05, "loss": 0.1274, "step": 112050 }, { "epoch": 2.117411506932114, "grad_norm": 0.03201821818947792, "learning_rate": 9.934771385037715e-05, "loss": 0.1271, "step": 112100 }, { "epoch": 2.1183559366854294, "grad_norm": 0.032169945538043976, "learning_rate": 9.934246701841428e-05, "loss": 0.1273, "step": 112150 }, { "epoch": 2.119300366438744, "grad_norm": 0.03245997428894043, "learning_rate": 9.933722018645143e-05, "loss": 0.1272, "step": 112200 }, { "epoch": 2.1202447961920594, "grad_norm": 0.030417680740356445, "learning_rate": 9.933197335448856e-05, "loss": 0.1273, "step": 112250 }, { "epoch": 2.121189225945374, "grad_norm": 0.02988787367939949, "learning_rate": 9.93267265225257e-05, "loss": 0.1275, "step": 112300 }, { "epoch": 2.122133655698689, "grad_norm": 0.029521912336349487, "learning_rate": 9.932147969056284e-05, "loss": 0.1272, "step": 112350 }, { "epoch": 2.123078085452004, "grad_norm": 0.0316658653318882, "learning_rate": 9.931623285859998e-05, "loss": 0.1273, "step": 112400 }, { "epoch": 2.124022515205319, "grad_norm": 0.0317998081445694, "learning_rate": 9.931098602663713e-05, "loss": 0.1272, "step": 112450 }, { "epoch": 2.124966944958634, "grad_norm": 0.030574927106499672, "learning_rate": 9.930573919467426e-05, "loss": 0.1274, "step": 112500 }, { "epoch": 2.124966944958634, "eval_IntDiv": 0.6756239678011141, "eval_NumCircles": 1807, "eval_SumBottleneck": 142.6990589824803, "eval_Uniqueness": 0.9972544234289201, "eval_Validity": 0.9834, "eval_Validity * Uniqueness": 0.9807000000000001, "eval_loss": 0.221370667219162, "eval_runtime": 161.3033, "eval_samples_per_second": 61.995, "eval_steps_per_second": 0.49, "step": 112500 }, { "epoch": 2.125911374711949, "grad_norm": 0.03285792097449303, "learning_rate": 9.93004923627114e-05, "loss": 0.1276, "step": 112550 }, { "epoch": 2.1268558044652637, "grad_norm": 0.03031335212290287, "learning_rate": 9.929524553074854e-05, "loss": 0.1273, "step": 112600 }, { "epoch": 2.127800234218579, "grad_norm": 0.030399737879633904, "learning_rate": 9.928999869878568e-05, "loss": 0.1268, "step": 112650 }, { "epoch": 2.1287446639718937, "grad_norm": 0.03280104696750641, "learning_rate": 9.928475186682281e-05, "loss": 0.1276, "step": 112700 }, { "epoch": 2.129689093725209, "grad_norm": 0.03185192495584488, "learning_rate": 9.927950503485996e-05, "loss": 0.1272, "step": 112750 }, { "epoch": 2.1306335234785236, "grad_norm": 0.029596658423542976, "learning_rate": 9.927425820289709e-05, "loss": 0.1275, "step": 112800 }, { "epoch": 2.1315779532318384, "grad_norm": 0.032732512801885605, "learning_rate": 9.926901137093424e-05, "loss": 0.1275, "step": 112850 }, { "epoch": 2.1325223829851536, "grad_norm": 0.030049802735447884, "learning_rate": 9.926376453897137e-05, "loss": 0.1275, "step": 112900 }, { "epoch": 2.1334668127384684, "grad_norm": 0.03314054384827614, "learning_rate": 9.925851770700852e-05, "loss": 0.1276, "step": 112950 }, { "epoch": 2.1344112424917836, "grad_norm": 0.03116578608751297, "learning_rate": 9.925327087504565e-05, "loss": 0.1273, "step": 113000 }, { "epoch": 2.1353556722450984, "grad_norm": 0.031439051032066345, "learning_rate": 9.924802404308279e-05, "loss": 0.1272, "step": 113050 }, { "epoch": 2.1363001019984136, "grad_norm": 0.03252581134438515, "learning_rate": 9.924277721111993e-05, "loss": 0.1273, "step": 113100 }, { "epoch": 2.1372445317517283, "grad_norm": 0.03235326707363129, "learning_rate": 9.923753037915707e-05, "loss": 0.1268, "step": 113150 }, { "epoch": 2.138188961505043, "grad_norm": 0.02995842881500721, "learning_rate": 9.92322835471942e-05, "loss": 0.127, "step": 113200 }, { "epoch": 2.1391333912583583, "grad_norm": 0.0337495431303978, "learning_rate": 9.922703671523135e-05, "loss": 0.1271, "step": 113250 }, { "epoch": 2.140077821011673, "grad_norm": 0.031650643795728683, "learning_rate": 9.922178988326848e-05, "loss": 0.1273, "step": 113300 }, { "epoch": 2.141022250764988, "grad_norm": 0.03139448165893555, "learning_rate": 9.921654305130562e-05, "loss": 0.1273, "step": 113350 }, { "epoch": 2.141966680518303, "grad_norm": 0.03124273382127285, "learning_rate": 9.921129621934277e-05, "loss": 0.1273, "step": 113400 }, { "epoch": 2.142911110271618, "grad_norm": 0.03129229694604874, "learning_rate": 9.920604938737991e-05, "loss": 0.1276, "step": 113450 }, { "epoch": 2.143855540024933, "grad_norm": 0.031154261901974678, "learning_rate": 9.920080255541705e-05, "loss": 0.1274, "step": 113500 }, { "epoch": 2.144799969778248, "grad_norm": 0.03015695884823799, "learning_rate": 9.919555572345418e-05, "loss": 0.1273, "step": 113550 }, { "epoch": 2.145744399531563, "grad_norm": 0.03224260360002518, "learning_rate": 9.919030889149133e-05, "loss": 0.1272, "step": 113600 }, { "epoch": 2.146688829284878, "grad_norm": 0.029643189162015915, "learning_rate": 9.918506205952846e-05, "loss": 0.1272, "step": 113650 }, { "epoch": 2.1476332590381926, "grad_norm": 0.04193345084786415, "learning_rate": 9.91798152275656e-05, "loss": 0.1287, "step": 113700 }, { "epoch": 2.148577688791508, "grad_norm": 0.04142722487449646, "learning_rate": 9.917456839560274e-05, "loss": 0.1278, "step": 113750 }, { "epoch": 2.1495221185448226, "grad_norm": 0.030909711495041847, "learning_rate": 9.916932156363988e-05, "loss": 0.1269, "step": 113800 }, { "epoch": 2.1504665482981378, "grad_norm": 0.030999835580587387, "learning_rate": 9.916407473167701e-05, "loss": 0.1275, "step": 113850 }, { "epoch": 2.1514109780514525, "grad_norm": 0.03106130287051201, "learning_rate": 9.915882789971416e-05, "loss": 0.1273, "step": 113900 }, { "epoch": 2.1523554078047673, "grad_norm": 0.030505893751978874, "learning_rate": 9.91535810677513e-05, "loss": 0.1272, "step": 113950 }, { "epoch": 2.1532998375580825, "grad_norm": 0.030803704634308815, "learning_rate": 9.914833423578843e-05, "loss": 0.1269, "step": 114000 }, { "epoch": 2.1542442673113973, "grad_norm": 0.029437560588121414, "learning_rate": 9.914308740382557e-05, "loss": 0.1275, "step": 114050 }, { "epoch": 2.1551886970647125, "grad_norm": 0.03059661202132702, "learning_rate": 9.913784057186272e-05, "loss": 0.1272, "step": 114100 }, { "epoch": 2.1561331268180273, "grad_norm": 0.0304799135774374, "learning_rate": 9.913259373989984e-05, "loss": 0.1268, "step": 114150 }, { "epoch": 2.157077556571342, "grad_norm": 0.03252127394080162, "learning_rate": 9.912734690793699e-05, "loss": 0.1274, "step": 114200 }, { "epoch": 2.1580219863246572, "grad_norm": 0.030883194878697395, "learning_rate": 9.912210007597414e-05, "loss": 0.1269, "step": 114250 }, { "epoch": 2.158966416077972, "grad_norm": 0.03368291258811951, "learning_rate": 9.911685324401127e-05, "loss": 0.1269, "step": 114300 }, { "epoch": 2.1599108458312872, "grad_norm": 0.030355436727404594, "learning_rate": 9.91116064120484e-05, "loss": 0.1271, "step": 114350 }, { "epoch": 2.160855275584602, "grad_norm": 0.034298114478588104, "learning_rate": 9.910635958008555e-05, "loss": 0.1274, "step": 114400 }, { "epoch": 2.1617997053379168, "grad_norm": 0.03156331181526184, "learning_rate": 9.91011127481227e-05, "loss": 0.1273, "step": 114450 }, { "epoch": 2.162744135091232, "grad_norm": 0.03061150386929512, "learning_rate": 9.909586591615982e-05, "loss": 0.1269, "step": 114500 }, { "epoch": 2.1636885648445467, "grad_norm": 0.031174810603260994, "learning_rate": 9.909061908419697e-05, "loss": 0.1271, "step": 114550 }, { "epoch": 2.164632994597862, "grad_norm": 0.02999940887093544, "learning_rate": 9.908537225223411e-05, "loss": 0.1271, "step": 114600 }, { "epoch": 2.1655774243511767, "grad_norm": 0.02999294362962246, "learning_rate": 9.908012542027123e-05, "loss": 0.1269, "step": 114650 }, { "epoch": 2.1665218541044915, "grad_norm": 0.031463947147130966, "learning_rate": 9.907487858830838e-05, "loss": 0.1271, "step": 114700 }, { "epoch": 2.1674662838578067, "grad_norm": 0.02994396723806858, "learning_rate": 9.906963175634553e-05, "loss": 0.1271, "step": 114750 }, { "epoch": 2.1684107136111215, "grad_norm": 0.03058142587542534, "learning_rate": 9.906438492438266e-05, "loss": 0.1269, "step": 114800 }, { "epoch": 2.1693551433644367, "grad_norm": 0.03184689208865166, "learning_rate": 9.90591380924198e-05, "loss": 0.127, "step": 114850 }, { "epoch": 2.1702995731177515, "grad_norm": 0.032390058040618896, "learning_rate": 9.905389126045695e-05, "loss": 0.1271, "step": 114900 }, { "epoch": 2.1712440028710667, "grad_norm": 0.030557969585061073, "learning_rate": 9.904864442849408e-05, "loss": 0.1269, "step": 114950 }, { "epoch": 2.1721884326243814, "grad_norm": 0.030850928276777267, "learning_rate": 9.904339759653121e-05, "loss": 0.127, "step": 115000 }, { "epoch": 2.1721884326243814, "eval_IntDiv": 0.6750459808367719, "eval_NumCircles": 1792, "eval_SumBottleneck": 146.96603321450658, "eval_Uniqueness": 0.9969657125518357, "eval_Validity": 0.9887, "eval_Validity * Uniqueness": 0.9857, "eval_loss": 0.22077137231826782, "eval_runtime": 163.422, "eval_samples_per_second": 61.191, "eval_steps_per_second": 0.483, "step": 115000 }, { "epoch": 2.173132862377696, "grad_norm": 0.030503345653414726, "learning_rate": 9.903815076456836e-05, "loss": 0.1269, "step": 115050 }, { "epoch": 2.1740772921310114, "grad_norm": 0.030602455139160156, "learning_rate": 9.903290393260551e-05, "loss": 0.1267, "step": 115100 }, { "epoch": 2.175021721884326, "grad_norm": 0.028886226937174797, "learning_rate": 9.902765710064263e-05, "loss": 0.127, "step": 115150 }, { "epoch": 2.1759661516376414, "grad_norm": 0.03117545321583748, "learning_rate": 9.902241026867978e-05, "loss": 0.1268, "step": 115200 }, { "epoch": 2.176910581390956, "grad_norm": 0.03284977748990059, "learning_rate": 9.901716343671692e-05, "loss": 0.1269, "step": 115250 }, { "epoch": 2.177855011144271, "grad_norm": 0.03156328201293945, "learning_rate": 9.901191660475406e-05, "loss": 0.1271, "step": 115300 }, { "epoch": 2.178799440897586, "grad_norm": 0.03082215040922165, "learning_rate": 9.900666977279119e-05, "loss": 0.1271, "step": 115350 }, { "epoch": 2.179743870650901, "grad_norm": 0.029946813359856606, "learning_rate": 9.900142294082834e-05, "loss": 0.1274, "step": 115400 }, { "epoch": 2.180688300404216, "grad_norm": 0.03275628015398979, "learning_rate": 9.899617610886547e-05, "loss": 0.1267, "step": 115450 }, { "epoch": 2.181632730157531, "grad_norm": 0.03032122366130352, "learning_rate": 9.89909292769026e-05, "loss": 0.1268, "step": 115500 }, { "epoch": 2.1825771599108457, "grad_norm": 0.030515864491462708, "learning_rate": 9.898568244493975e-05, "loss": 0.1271, "step": 115550 }, { "epoch": 2.183521589664161, "grad_norm": 0.031929418444633484, "learning_rate": 9.898043561297689e-05, "loss": 0.1265, "step": 115600 }, { "epoch": 2.1844660194174756, "grad_norm": 0.029962915927171707, "learning_rate": 9.897518878101402e-05, "loss": 0.127, "step": 115650 }, { "epoch": 2.185410449170791, "grad_norm": 0.03162502497434616, "learning_rate": 9.896994194905117e-05, "loss": 0.1263, "step": 115700 }, { "epoch": 2.1863548789241056, "grad_norm": 0.031597867608070374, "learning_rate": 9.89646951170883e-05, "loss": 0.127, "step": 115750 }, { "epoch": 2.1872993086774204, "grad_norm": 0.02870918996632099, "learning_rate": 9.895944828512545e-05, "loss": 0.1274, "step": 115800 }, { "epoch": 2.1882437384307356, "grad_norm": 0.02880951762199402, "learning_rate": 9.895420145316258e-05, "loss": 0.1268, "step": 115850 }, { "epoch": 2.1891881681840504, "grad_norm": 0.030875254422426224, "learning_rate": 9.894895462119973e-05, "loss": 0.1265, "step": 115900 }, { "epoch": 2.1901325979373656, "grad_norm": 0.030232423916459084, "learning_rate": 9.894370778923687e-05, "loss": 0.1266, "step": 115950 }, { "epoch": 2.1910770276906804, "grad_norm": 0.029422488063573837, "learning_rate": 9.8938460957274e-05, "loss": 0.1271, "step": 116000 }, { "epoch": 2.192021457443995, "grad_norm": 0.02919410541653633, "learning_rate": 9.893321412531115e-05, "loss": 0.1269, "step": 116050 }, { "epoch": 2.1929658871973103, "grad_norm": 0.031369294971227646, "learning_rate": 9.892796729334828e-05, "loss": 0.1272, "step": 116100 }, { "epoch": 2.193910316950625, "grad_norm": 0.0300123393535614, "learning_rate": 9.892272046138541e-05, "loss": 0.1268, "step": 116150 }, { "epoch": 2.1948547467039403, "grad_norm": 0.03247970715165138, "learning_rate": 9.891747362942256e-05, "loss": 0.1269, "step": 116200 }, { "epoch": 2.195799176457255, "grad_norm": 0.030525866895914078, "learning_rate": 9.89122267974597e-05, "loss": 0.1271, "step": 116250 }, { "epoch": 2.19674360621057, "grad_norm": 0.030151113867759705, "learning_rate": 9.890697996549684e-05, "loss": 0.1268, "step": 116300 }, { "epoch": 2.197688035963885, "grad_norm": 0.035363517701625824, "learning_rate": 9.890173313353398e-05, "loss": 0.1269, "step": 116350 }, { "epoch": 2.1986324657172, "grad_norm": 0.03152402490377426, "learning_rate": 9.889648630157111e-05, "loss": 0.1272, "step": 116400 }, { "epoch": 2.199576895470515, "grad_norm": 0.032552462071180344, "learning_rate": 9.889123946960826e-05, "loss": 0.1269, "step": 116450 }, { "epoch": 2.20052132522383, "grad_norm": 0.03141910582780838, "learning_rate": 9.888599263764539e-05, "loss": 0.1267, "step": 116500 }, { "epoch": 2.2014657549771446, "grad_norm": 0.0315852127969265, "learning_rate": 9.888074580568253e-05, "loss": 0.1268, "step": 116550 }, { "epoch": 2.20241018473046, "grad_norm": 0.030032940208911896, "learning_rate": 9.887549897371967e-05, "loss": 0.1269, "step": 116600 }, { "epoch": 2.2033546144837746, "grad_norm": 0.0294108334928751, "learning_rate": 9.887025214175681e-05, "loss": 0.1268, "step": 116650 }, { "epoch": 2.2042990442370898, "grad_norm": 0.032054170966148376, "learning_rate": 9.886500530979396e-05, "loss": 0.127, "step": 116700 }, { "epoch": 2.2052434739904045, "grad_norm": 0.031966883689165115, "learning_rate": 9.885975847783109e-05, "loss": 0.1272, "step": 116750 }, { "epoch": 2.2061879037437198, "grad_norm": 0.03269194811582565, "learning_rate": 9.885451164586824e-05, "loss": 0.1271, "step": 116800 }, { "epoch": 2.2071323334970345, "grad_norm": 0.030014628544449806, "learning_rate": 9.884926481390537e-05, "loss": 0.1267, "step": 116850 }, { "epoch": 2.2080767632503493, "grad_norm": 0.031461410224437714, "learning_rate": 9.88440179819425e-05, "loss": 0.1268, "step": 116900 }, { "epoch": 2.2090211930036645, "grad_norm": 0.033580660820007324, "learning_rate": 9.883877114997965e-05, "loss": 0.1269, "step": 116950 }, { "epoch": 2.2099656227569793, "grad_norm": 0.03246843442320824, "learning_rate": 9.883352431801679e-05, "loss": 0.1267, "step": 117000 }, { "epoch": 2.2109100525102945, "grad_norm": 0.030514543876051903, "learning_rate": 9.882827748605392e-05, "loss": 0.1265, "step": 117050 }, { "epoch": 2.2118544822636093, "grad_norm": 0.030961541458964348, "learning_rate": 9.882303065409107e-05, "loss": 0.1265, "step": 117100 }, { "epoch": 2.212798912016924, "grad_norm": 0.03175503388047218, "learning_rate": 9.88177838221282e-05, "loss": 0.127, "step": 117150 }, { "epoch": 2.2137433417702392, "grad_norm": 0.02957373857498169, "learning_rate": 9.881253699016534e-05, "loss": 0.1272, "step": 117200 }, { "epoch": 2.214687771523554, "grad_norm": 0.031406693160533905, "learning_rate": 9.880729015820248e-05, "loss": 0.1269, "step": 117250 }, { "epoch": 2.215632201276869, "grad_norm": 0.02823270671069622, "learning_rate": 9.880204332623963e-05, "loss": 0.1269, "step": 117300 }, { "epoch": 2.216576631030184, "grad_norm": 0.030367614701390266, "learning_rate": 9.879679649427675e-05, "loss": 0.1269, "step": 117350 }, { "epoch": 2.2175210607834988, "grad_norm": 0.03351715952157974, "learning_rate": 9.87915496623139e-05, "loss": 0.1266, "step": 117400 }, { "epoch": 2.218465490536814, "grad_norm": 0.030430564656853676, "learning_rate": 9.878630283035105e-05, "loss": 0.1267, "step": 117450 }, { "epoch": 2.2194099202901287, "grad_norm": 0.03185087814927101, "learning_rate": 9.878105599838818e-05, "loss": 0.1269, "step": 117500 }, { "epoch": 2.2194099202901287, "eval_IntDiv": 0.6756696524310755, "eval_NumCircles": 1839, "eval_SumBottleneck": 120.41085710404147, "eval_Uniqueness": 0.9964416429442863, "eval_Validity": 0.9836, "eval_Validity * Uniqueness": 0.9801, "eval_loss": 0.22182780504226685, "eval_runtime": 153.7523, "eval_samples_per_second": 65.04, "eval_steps_per_second": 0.514, "step": 117500 }, { "epoch": 2.220354350043444, "grad_norm": 0.03215664625167847, "learning_rate": 9.877580916642531e-05, "loss": 0.1265, "step": 117550 }, { "epoch": 2.2212987797967587, "grad_norm": 0.029117712751030922, "learning_rate": 9.877056233446246e-05, "loss": 0.1266, "step": 117600 }, { "epoch": 2.2222432095500735, "grad_norm": 0.03044295124709606, "learning_rate": 9.87653155024996e-05, "loss": 0.1268, "step": 117650 }, { "epoch": 2.2231876393033887, "grad_norm": 0.030987808480858803, "learning_rate": 9.876006867053673e-05, "loss": 0.1268, "step": 117700 }, { "epoch": 2.2241320690567035, "grad_norm": 0.031435854732990265, "learning_rate": 9.875482183857388e-05, "loss": 0.1267, "step": 117750 }, { "epoch": 2.2250764988100187, "grad_norm": 0.02960273064672947, "learning_rate": 9.874957500661102e-05, "loss": 0.1266, "step": 117800 }, { "epoch": 2.2260209285633334, "grad_norm": 0.029567210003733635, "learning_rate": 9.874432817464814e-05, "loss": 0.1266, "step": 117850 }, { "epoch": 2.226965358316648, "grad_norm": 0.03268927335739136, "learning_rate": 9.873908134268529e-05, "loss": 0.1268, "step": 117900 }, { "epoch": 2.2279097880699634, "grad_norm": 0.03346012905240059, "learning_rate": 9.873383451072244e-05, "loss": 0.1265, "step": 117950 }, { "epoch": 2.228854217823278, "grad_norm": 0.033269863575696945, "learning_rate": 9.872858767875956e-05, "loss": 0.1268, "step": 118000 }, { "epoch": 2.2297986475765934, "grad_norm": 0.030457140877842903, "learning_rate": 9.87233408467967e-05, "loss": 0.1273, "step": 118050 }, { "epoch": 2.230743077329908, "grad_norm": 0.031120477244257927, "learning_rate": 9.871809401483385e-05, "loss": 0.1265, "step": 118100 }, { "epoch": 2.231687507083223, "grad_norm": 0.03034776635468006, "learning_rate": 9.871284718287099e-05, "loss": 0.1265, "step": 118150 }, { "epoch": 2.232631936836538, "grad_norm": 0.02984011545777321, "learning_rate": 9.870760035090812e-05, "loss": 0.127, "step": 118200 }, { "epoch": 2.233576366589853, "grad_norm": 0.030410069972276688, "learning_rate": 9.870235351894527e-05, "loss": 0.1267, "step": 118250 }, { "epoch": 2.234520796343168, "grad_norm": 0.029898902401328087, "learning_rate": 9.869710668698242e-05, "loss": 0.1264, "step": 118300 }, { "epoch": 2.235465226096483, "grad_norm": 0.03175502270460129, "learning_rate": 9.869185985501954e-05, "loss": 0.1267, "step": 118350 }, { "epoch": 2.2364096558497977, "grad_norm": 0.031203893944621086, "learning_rate": 9.868661302305668e-05, "loss": 0.1269, "step": 118400 }, { "epoch": 2.237354085603113, "grad_norm": 0.03148692101240158, "learning_rate": 9.868136619109383e-05, "loss": 0.127, "step": 118450 }, { "epoch": 2.2382985153564277, "grad_norm": 0.030228374525904655, "learning_rate": 9.867611935913095e-05, "loss": 0.1265, "step": 118500 }, { "epoch": 2.239242945109743, "grad_norm": 0.030350271612405777, "learning_rate": 9.86708725271681e-05, "loss": 0.1268, "step": 118550 }, { "epoch": 2.2401873748630576, "grad_norm": 0.03268728405237198, "learning_rate": 9.866562569520525e-05, "loss": 0.1271, "step": 118600 }, { "epoch": 2.241131804616373, "grad_norm": 0.03109091706573963, "learning_rate": 9.866037886324238e-05, "loss": 0.127, "step": 118650 }, { "epoch": 2.2420762343696876, "grad_norm": 0.03193889930844307, "learning_rate": 9.865513203127951e-05, "loss": 0.1269, "step": 118700 }, { "epoch": 2.2430206641230024, "grad_norm": 0.03016296587884426, "learning_rate": 9.864988519931666e-05, "loss": 0.1267, "step": 118750 }, { "epoch": 2.2439650938763176, "grad_norm": 0.029093271121382713, "learning_rate": 9.86446383673538e-05, "loss": 0.1267, "step": 118800 }, { "epoch": 2.2449095236296324, "grad_norm": 0.030138954520225525, "learning_rate": 9.863939153539093e-05, "loss": 0.1269, "step": 118850 }, { "epoch": 2.2458539533829476, "grad_norm": 0.03101114183664322, "learning_rate": 9.863414470342808e-05, "loss": 0.1268, "step": 118900 }, { "epoch": 2.2467983831362623, "grad_norm": 0.030858922749757767, "learning_rate": 9.862889787146521e-05, "loss": 0.1264, "step": 118950 }, { "epoch": 2.247742812889577, "grad_norm": 0.032199710607528687, "learning_rate": 9.862365103950235e-05, "loss": 0.1266, "step": 119000 }, { "epoch": 2.2486872426428923, "grad_norm": 0.03255471587181091, "learning_rate": 9.861840420753949e-05, "loss": 0.127, "step": 119050 }, { "epoch": 2.249631672396207, "grad_norm": 0.03159305080771446, "learning_rate": 9.861315737557664e-05, "loss": 0.1264, "step": 119100 }, { "epoch": 2.2505761021495223, "grad_norm": 0.02929779142141342, "learning_rate": 9.860791054361377e-05, "loss": 0.1269, "step": 119150 }, { "epoch": 2.251520531902837, "grad_norm": 0.029203403741121292, "learning_rate": 9.860266371165091e-05, "loss": 0.1266, "step": 119200 }, { "epoch": 2.252464961656152, "grad_norm": 0.03223557025194168, "learning_rate": 9.859741687968806e-05, "loss": 0.1269, "step": 119250 }, { "epoch": 2.253409391409467, "grad_norm": 0.029391977936029434, "learning_rate": 9.859217004772519e-05, "loss": 0.1265, "step": 119300 }, { "epoch": 2.254353821162782, "grad_norm": 0.030141489580273628, "learning_rate": 9.858692321576232e-05, "loss": 0.1268, "step": 119350 }, { "epoch": 2.255298250916097, "grad_norm": 0.03062259778380394, "learning_rate": 9.858167638379947e-05, "loss": 0.1262, "step": 119400 }, { "epoch": 2.256242680669412, "grad_norm": 0.031231626868247986, "learning_rate": 9.85764295518366e-05, "loss": 0.1267, "step": 119450 }, { "epoch": 2.2571871104227266, "grad_norm": 0.03052443265914917, "learning_rate": 9.857118271987374e-05, "loss": 0.1264, "step": 119500 }, { "epoch": 2.258131540176042, "grad_norm": 0.03437763825058937, "learning_rate": 9.856593588791089e-05, "loss": 0.1266, "step": 119550 }, { "epoch": 2.2590759699293566, "grad_norm": 0.03214403986930847, "learning_rate": 9.856068905594802e-05, "loss": 0.1263, "step": 119600 }, { "epoch": 2.2600203996826718, "grad_norm": 0.031690776348114014, "learning_rate": 9.855544222398517e-05, "loss": 0.1272, "step": 119650 }, { "epoch": 2.2609648294359865, "grad_norm": 0.030563699081540108, "learning_rate": 9.85501953920223e-05, "loss": 0.1266, "step": 119700 }, { "epoch": 2.2619092591893013, "grad_norm": 0.030078794807195663, "learning_rate": 9.854494856005944e-05, "loss": 0.1264, "step": 119750 }, { "epoch": 2.2628536889426165, "grad_norm": 0.032179348170757294, "learning_rate": 9.853970172809658e-05, "loss": 0.1262, "step": 119800 }, { "epoch": 2.2637981186959313, "grad_norm": 0.028874129056930542, "learning_rate": 9.853445489613372e-05, "loss": 0.1264, "step": 119850 }, { "epoch": 2.2647425484492465, "grad_norm": 0.030105454847216606, "learning_rate": 9.852920806417086e-05, "loss": 0.1264, "step": 119900 }, { "epoch": 2.2656869782025613, "grad_norm": 0.03206780552864075, "learning_rate": 9.8523961232208e-05, "loss": 0.1266, "step": 119950 }, { "epoch": 2.2666314079558765, "grad_norm": 0.033804912120103836, "learning_rate": 9.851871440024513e-05, "loss": 0.1263, "step": 120000 }, { "epoch": 2.2666314079558765, "eval_IntDiv": 0.6757013532630584, "eval_NumCircles": 1789, "eval_SumBottleneck": 45.481233858868606, "eval_Uniqueness": 0.9969620253164557, "eval_Validity": 0.9875, "eval_Validity * Uniqueness": 0.9845, "eval_loss": 0.22044317424297333, "eval_runtime": 156.2872, "eval_samples_per_second": 63.985, "eval_steps_per_second": 0.505, "step": 120000 }, { "epoch": 2.2675758377091912, "grad_norm": 0.030944503843784332, "learning_rate": 9.851346756828228e-05, "loss": 0.1268, "step": 120050 }, { "epoch": 2.268520267462506, "grad_norm": 0.03145240619778633, "learning_rate": 9.850822073631941e-05, "loss": 0.1263, "step": 120100 }, { "epoch": 2.2694646972158212, "grad_norm": 0.030586564913392067, "learning_rate": 9.850297390435656e-05, "loss": 0.1271, "step": 120150 }, { "epoch": 2.270409126969136, "grad_norm": 0.03215653821825981, "learning_rate": 9.84977270723937e-05, "loss": 0.1262, "step": 120200 }, { "epoch": 2.2713535567224508, "grad_norm": 0.0300662312656641, "learning_rate": 9.849248024043083e-05, "loss": 0.1261, "step": 120250 }, { "epoch": 2.272297986475766, "grad_norm": 0.03004559315741062, "learning_rate": 9.848723340846798e-05, "loss": 0.1266, "step": 120300 }, { "epoch": 2.2732424162290807, "grad_norm": 0.03180261701345444, "learning_rate": 9.848198657650511e-05, "loss": 0.1265, "step": 120350 }, { "epoch": 2.274186845982396, "grad_norm": 0.03075404278934002, "learning_rate": 9.847673974454224e-05, "loss": 0.1265, "step": 120400 }, { "epoch": 2.2751312757357107, "grad_norm": 0.0336390845477581, "learning_rate": 9.847149291257939e-05, "loss": 0.126, "step": 120450 }, { "epoch": 2.276075705489026, "grad_norm": 0.03066145069897175, "learning_rate": 9.846624608061653e-05, "loss": 0.1263, "step": 120500 }, { "epoch": 2.2770201352423407, "grad_norm": 0.030583713203668594, "learning_rate": 9.846099924865366e-05, "loss": 0.1267, "step": 120550 }, { "epoch": 2.2779645649956555, "grad_norm": 0.03259202465415001, "learning_rate": 9.84557524166908e-05, "loss": 0.1265, "step": 120600 }, { "epoch": 2.2789089947489707, "grad_norm": 0.02979629673063755, "learning_rate": 9.845050558472795e-05, "loss": 0.1266, "step": 120650 }, { "epoch": 2.2798534245022855, "grad_norm": 0.03038039244711399, "learning_rate": 9.844525875276509e-05, "loss": 0.1258, "step": 120700 }, { "epoch": 2.2807978542556, "grad_norm": 0.032037872821092606, "learning_rate": 9.844001192080222e-05, "loss": 0.1266, "step": 120750 }, { "epoch": 2.2817422840089154, "grad_norm": 0.03393993154168129, "learning_rate": 9.843476508883937e-05, "loss": 0.1262, "step": 120800 }, { "epoch": 2.28268671376223, "grad_norm": 0.030017733573913574, "learning_rate": 9.84295182568765e-05, "loss": 0.1266, "step": 120850 }, { "epoch": 2.2836311435155454, "grad_norm": 0.02974378876388073, "learning_rate": 9.842427142491364e-05, "loss": 0.1266, "step": 120900 }, { "epoch": 2.28457557326886, "grad_norm": 0.03195719048380852, "learning_rate": 9.841902459295078e-05, "loss": 0.1266, "step": 120950 }, { "epoch": 2.2855200030221754, "grad_norm": 0.03515315428376198, "learning_rate": 9.841377776098792e-05, "loss": 0.1263, "step": 121000 }, { "epoch": 2.28646443277549, "grad_norm": 0.030088290572166443, "learning_rate": 9.840853092902505e-05, "loss": 0.1261, "step": 121050 }, { "epoch": 2.287408862528805, "grad_norm": 0.029277993366122246, "learning_rate": 9.84032840970622e-05, "loss": 0.1265, "step": 121100 }, { "epoch": 2.28835329228212, "grad_norm": 0.029223978519439697, "learning_rate": 9.839803726509935e-05, "loss": 0.1262, "step": 121150 }, { "epoch": 2.289297722035435, "grad_norm": 0.02957259677350521, "learning_rate": 9.839279043313647e-05, "loss": 0.1263, "step": 121200 }, { "epoch": 2.29024215178875, "grad_norm": 0.03579745069146156, "learning_rate": 9.838754360117362e-05, "loss": 0.1264, "step": 121250 }, { "epoch": 2.291186581542065, "grad_norm": 0.03433266282081604, "learning_rate": 9.838229676921076e-05, "loss": 0.1265, "step": 121300 }, { "epoch": 2.2921310112953797, "grad_norm": 0.02964366041123867, "learning_rate": 9.837704993724788e-05, "loss": 0.1263, "step": 121350 }, { "epoch": 2.293075441048695, "grad_norm": 0.031110644340515137, "learning_rate": 9.837180310528503e-05, "loss": 0.1265, "step": 121400 }, { "epoch": 2.2940198708020096, "grad_norm": 0.029602376744151115, "learning_rate": 9.836655627332218e-05, "loss": 0.1261, "step": 121450 }, { "epoch": 2.294964300555325, "grad_norm": 0.02958512492477894, "learning_rate": 9.836130944135931e-05, "loss": 0.1262, "step": 121500 }, { "epoch": 2.2959087303086396, "grad_norm": 0.03119255229830742, "learning_rate": 9.835606260939645e-05, "loss": 0.1261, "step": 121550 }, { "epoch": 2.2968531600619544, "grad_norm": 0.03125549107789993, "learning_rate": 9.835081577743359e-05, "loss": 0.1263, "step": 121600 }, { "epoch": 2.2977975898152696, "grad_norm": 0.02865816280245781, "learning_rate": 9.834556894547074e-05, "loss": 0.1266, "step": 121650 }, { "epoch": 2.2987420195685844, "grad_norm": 0.03134646266698837, "learning_rate": 9.834032211350786e-05, "loss": 0.1265, "step": 121700 }, { "epoch": 2.2996864493218996, "grad_norm": 0.029626276344060898, "learning_rate": 9.833507528154501e-05, "loss": 0.1265, "step": 121750 }, { "epoch": 2.3006308790752144, "grad_norm": 0.029868055135011673, "learning_rate": 9.832982844958216e-05, "loss": 0.1266, "step": 121800 }, { "epoch": 2.3015753088285296, "grad_norm": 0.031809840351343155, "learning_rate": 9.832458161761928e-05, "loss": 0.1261, "step": 121850 }, { "epoch": 2.3025197385818443, "grad_norm": 0.029713250696659088, "learning_rate": 9.831933478565642e-05, "loss": 0.1266, "step": 121900 }, { "epoch": 2.303464168335159, "grad_norm": 0.028964050114154816, "learning_rate": 9.831408795369357e-05, "loss": 0.1266, "step": 121950 }, { "epoch": 2.3044085980884743, "grad_norm": 0.031115826219320297, "learning_rate": 9.83088411217307e-05, "loss": 0.1263, "step": 122000 }, { "epoch": 2.305353027841789, "grad_norm": 0.03149169310927391, "learning_rate": 9.830359428976784e-05, "loss": 0.1264, "step": 122050 }, { "epoch": 2.306297457595104, "grad_norm": 0.03149883449077606, "learning_rate": 9.829834745780499e-05, "loss": 0.1263, "step": 122100 }, { "epoch": 2.307241887348419, "grad_norm": 0.03026418946683407, "learning_rate": 9.829310062584212e-05, "loss": 0.1264, "step": 122150 }, { "epoch": 2.308186317101734, "grad_norm": 0.02949458360671997, "learning_rate": 9.828785379387925e-05, "loss": 0.1258, "step": 122200 }, { "epoch": 2.309130746855049, "grad_norm": 0.03160266578197479, "learning_rate": 9.82826069619164e-05, "loss": 0.1262, "step": 122250 }, { "epoch": 2.310075176608364, "grad_norm": 0.03194103389978409, "learning_rate": 9.827736012995355e-05, "loss": 0.1269, "step": 122300 }, { "epoch": 2.311019606361679, "grad_norm": 0.03079579956829548, "learning_rate": 9.827211329799067e-05, "loss": 0.1262, "step": 122350 }, { "epoch": 2.311964036114994, "grad_norm": 0.03128531947731972, "learning_rate": 9.826686646602782e-05, "loss": 0.1264, "step": 122400 }, { "epoch": 2.3129084658683086, "grad_norm": 0.030853070318698883, "learning_rate": 9.826161963406496e-05, "loss": 0.126, "step": 122450 }, { "epoch": 2.3138528956216238, "grad_norm": 0.030455121770501137, "learning_rate": 9.82563728021021e-05, "loss": 0.1263, "step": 122500 }, { "epoch": 2.3138528956216238, "eval_IntDiv": 0.6734784812915939, "eval_NumCircles": 1726, "eval_SumBottleneck": 91.7177517297487, "eval_Uniqueness": 0.9955461079056585, "eval_Validity": 0.9879, "eval_Validity * Uniqueness": 0.9834999999999999, "eval_loss": 0.2223573476076126, "eval_runtime": 147.6691, "eval_samples_per_second": 67.719, "eval_steps_per_second": 0.535, "step": 122500 }, { "epoch": 2.3147973253749385, "grad_norm": 0.031210441142320633, "learning_rate": 9.825112597013923e-05, "loss": 0.1266, "step": 122550 }, { "epoch": 2.3157417551282538, "grad_norm": 0.03316907584667206, "learning_rate": 9.824587913817638e-05, "loss": 0.1262, "step": 122600 }, { "epoch": 2.3166861848815685, "grad_norm": 0.031030727550387383, "learning_rate": 9.824063230621351e-05, "loss": 0.1263, "step": 122650 }, { "epoch": 2.3176306146348833, "grad_norm": 0.030012335628271103, "learning_rate": 9.823538547425065e-05, "loss": 0.1261, "step": 122700 }, { "epoch": 2.3185750443881985, "grad_norm": 0.029376914724707603, "learning_rate": 9.82301386422878e-05, "loss": 0.1265, "step": 122750 }, { "epoch": 2.3195194741415133, "grad_norm": 0.030192455276846886, "learning_rate": 9.822489181032493e-05, "loss": 0.1263, "step": 122800 }, { "epoch": 2.3204639038948285, "grad_norm": 0.03015223518013954, "learning_rate": 9.821964497836206e-05, "loss": 0.1264, "step": 122850 }, { "epoch": 2.3214083336481433, "grad_norm": 0.030058734118938446, "learning_rate": 9.821439814639921e-05, "loss": 0.1262, "step": 122900 }, { "epoch": 2.322352763401458, "grad_norm": 0.030630873516201973, "learning_rate": 9.820915131443634e-05, "loss": 0.1262, "step": 122950 }, { "epoch": 2.3232971931547732, "grad_norm": 0.03095577284693718, "learning_rate": 9.820390448247349e-05, "loss": 0.1264, "step": 123000 }, { "epoch": 2.324241622908088, "grad_norm": 0.033833615481853485, "learning_rate": 9.819865765051063e-05, "loss": 0.1265, "step": 123050 }, { "epoch": 2.325186052661403, "grad_norm": 0.0312512032687664, "learning_rate": 9.819341081854777e-05, "loss": 0.1265, "step": 123100 }, { "epoch": 2.326130482414718, "grad_norm": 0.03081582672894001, "learning_rate": 9.81881639865849e-05, "loss": 0.126, "step": 123150 }, { "epoch": 2.3270749121680327, "grad_norm": 0.03029760718345642, "learning_rate": 9.818291715462204e-05, "loss": 0.1261, "step": 123200 }, { "epoch": 2.328019341921348, "grad_norm": 0.031045695766806602, "learning_rate": 9.817767032265919e-05, "loss": 0.1261, "step": 123250 }, { "epoch": 2.3289637716746627, "grad_norm": 0.030072564259171486, "learning_rate": 9.817242349069632e-05, "loss": 0.1262, "step": 123300 }, { "epoch": 2.329908201427978, "grad_norm": 0.03082260861992836, "learning_rate": 9.816717665873346e-05, "loss": 0.1259, "step": 123350 }, { "epoch": 2.3308526311812927, "grad_norm": 0.030818941071629524, "learning_rate": 9.81619298267706e-05, "loss": 0.1262, "step": 123400 }, { "epoch": 2.3317970609346075, "grad_norm": 0.031143147498369217, "learning_rate": 9.815668299480774e-05, "loss": 0.1261, "step": 123450 }, { "epoch": 2.3327414906879227, "grad_norm": 0.032287806272506714, "learning_rate": 9.815143616284488e-05, "loss": 0.126, "step": 123500 }, { "epoch": 2.3336859204412375, "grad_norm": 0.030313432216644287, "learning_rate": 9.814618933088202e-05, "loss": 0.1264, "step": 123550 }, { "epoch": 2.3346303501945527, "grad_norm": 0.030984070152044296, "learning_rate": 9.814094249891915e-05, "loss": 0.1264, "step": 123600 }, { "epoch": 2.3355747799478674, "grad_norm": 0.030631303787231445, "learning_rate": 9.81356956669563e-05, "loss": 0.126, "step": 123650 }, { "epoch": 2.3365192097011827, "grad_norm": 0.0477432906627655, "learning_rate": 9.813044883499343e-05, "loss": 0.1263, "step": 123700 }, { "epoch": 2.3374636394544974, "grad_norm": 0.034352827817201614, "learning_rate": 9.812520200303057e-05, "loss": 0.1262, "step": 123750 }, { "epoch": 2.338408069207812, "grad_norm": 0.032135967165231705, "learning_rate": 9.811995517106772e-05, "loss": 0.1261, "step": 123800 }, { "epoch": 2.3393524989611274, "grad_norm": 0.02987782470881939, "learning_rate": 9.811470833910485e-05, "loss": 0.1262, "step": 123850 }, { "epoch": 2.340296928714442, "grad_norm": 0.031222796067595482, "learning_rate": 9.8109461507142e-05, "loss": 0.1265, "step": 123900 }, { "epoch": 2.341241358467757, "grad_norm": 0.029427967965602875, "learning_rate": 9.810421467517913e-05, "loss": 0.1259, "step": 123950 }, { "epoch": 2.342185788221072, "grad_norm": 0.03199567645788193, "learning_rate": 9.809896784321628e-05, "loss": 0.1262, "step": 124000 }, { "epoch": 2.343130217974387, "grad_norm": 0.03147945553064346, "learning_rate": 9.809372101125341e-05, "loss": 0.1264, "step": 124050 }, { "epoch": 2.344074647727702, "grad_norm": 0.030630670487880707, "learning_rate": 9.808847417929055e-05, "loss": 0.1261, "step": 124100 }, { "epoch": 2.345019077481017, "grad_norm": 0.03085673786699772, "learning_rate": 9.80832273473277e-05, "loss": 0.1262, "step": 124150 }, { "epoch": 2.345963507234332, "grad_norm": 0.029848851263523102, "learning_rate": 9.807798051536483e-05, "loss": 0.1266, "step": 124200 }, { "epoch": 2.346907936987647, "grad_norm": 0.03065461292862892, "learning_rate": 9.807273368340196e-05, "loss": 0.1262, "step": 124250 }, { "epoch": 2.3478523667409616, "grad_norm": 0.030843205749988556, "learning_rate": 9.806748685143911e-05, "loss": 0.1262, "step": 124300 }, { "epoch": 2.348796796494277, "grad_norm": 0.029086943715810776, "learning_rate": 9.806224001947624e-05, "loss": 0.1259, "step": 124350 }, { "epoch": 2.3497412262475916, "grad_norm": 0.03188510984182358, "learning_rate": 9.805699318751338e-05, "loss": 0.1259, "step": 124400 }, { "epoch": 2.350685656000907, "grad_norm": 0.030681289732456207, "learning_rate": 9.805174635555052e-05, "loss": 0.1263, "step": 124450 }, { "epoch": 2.3516300857542216, "grad_norm": 0.029577797278761864, "learning_rate": 9.804649952358767e-05, "loss": 0.1255, "step": 124500 }, { "epoch": 2.3525745155075364, "grad_norm": 0.03054780699312687, "learning_rate": 9.804125269162479e-05, "loss": 0.1264, "step": 124550 }, { "epoch": 2.3535189452608516, "grad_norm": 0.02935425005853176, "learning_rate": 9.803600585966194e-05, "loss": 0.1263, "step": 124600 }, { "epoch": 2.3544633750141664, "grad_norm": 0.030872177332639694, "learning_rate": 9.803075902769909e-05, "loss": 0.126, "step": 124650 }, { "epoch": 2.3554078047674816, "grad_norm": 0.02941545844078064, "learning_rate": 9.802551219573622e-05, "loss": 0.1258, "step": 124700 }, { "epoch": 2.3563522345207963, "grad_norm": 0.12018760293722153, "learning_rate": 9.802026536377335e-05, "loss": 0.1263, "step": 124750 }, { "epoch": 2.357296664274111, "grad_norm": 0.03154360502958298, "learning_rate": 9.80150185318105e-05, "loss": 0.1266, "step": 124800 }, { "epoch": 2.3582410940274263, "grad_norm": 0.03009643964469433, "learning_rate": 9.800977169984764e-05, "loss": 0.1263, "step": 124850 }, { "epoch": 2.359185523780741, "grad_norm": 0.02966955676674843, "learning_rate": 9.800452486788477e-05, "loss": 0.1264, "step": 124900 }, { "epoch": 2.3601299535340563, "grad_norm": 0.03143578767776489, "learning_rate": 9.799927803592192e-05, "loss": 0.1258, "step": 124950 }, { "epoch": 2.361074383287371, "grad_norm": 0.030630165711045265, "learning_rate": 9.799403120395906e-05, "loss": 0.1263, "step": 125000 }, { "epoch": 2.361074383287371, "eval_IntDiv": 0.6751319376924494, "eval_NumCircles": 1830, "eval_SumBottleneck": 109.13830615669166, "eval_Uniqueness": 0.9979726305119108, "eval_Validity": 0.9865, "eval_Validity * Uniqueness": 0.9845, "eval_loss": 0.22188544273376465, "eval_runtime": 159.4144, "eval_samples_per_second": 62.73, "eval_steps_per_second": 0.496, "step": 125000 }, { "epoch": 2.3620188130406863, "grad_norm": 0.03141171112656593, "learning_rate": 9.798878437199618e-05, "loss": 0.1255, "step": 125050 }, { "epoch": 2.362963242794001, "grad_norm": 0.030290568247437477, "learning_rate": 9.798353754003333e-05, "loss": 0.1263, "step": 125100 }, { "epoch": 2.363907672547316, "grad_norm": 0.02947160042822361, "learning_rate": 9.797829070807048e-05, "loss": 0.1259, "step": 125150 }, { "epoch": 2.364852102300631, "grad_norm": 0.03237726166844368, "learning_rate": 9.79730438761076e-05, "loss": 0.1258, "step": 125200 }, { "epoch": 2.365796532053946, "grad_norm": 0.033090878278017044, "learning_rate": 9.796779704414475e-05, "loss": 0.1261, "step": 125250 }, { "epoch": 2.3667409618072606, "grad_norm": 0.028459906578063965, "learning_rate": 9.79625502121819e-05, "loss": 0.1262, "step": 125300 }, { "epoch": 2.367685391560576, "grad_norm": 0.028950702399015427, "learning_rate": 9.795730338021903e-05, "loss": 0.126, "step": 125350 }, { "epoch": 2.3686298213138905, "grad_norm": 0.030603863298892975, "learning_rate": 9.795205654825616e-05, "loss": 0.1264, "step": 125400 }, { "epoch": 2.3695742510672058, "grad_norm": 0.02983209677040577, "learning_rate": 9.794680971629331e-05, "loss": 0.1264, "step": 125450 }, { "epoch": 2.3705186808205205, "grad_norm": 0.030234090983867645, "learning_rate": 9.794156288433046e-05, "loss": 0.1262, "step": 125500 }, { "epoch": 2.3714631105738357, "grad_norm": 0.0312111247330904, "learning_rate": 9.793631605236758e-05, "loss": 0.126, "step": 125550 }, { "epoch": 2.3724075403271505, "grad_norm": 0.029612848535180092, "learning_rate": 9.793106922040473e-05, "loss": 0.126, "step": 125600 }, { "epoch": 2.3733519700804653, "grad_norm": 0.030727945268154144, "learning_rate": 9.792582238844187e-05, "loss": 0.1259, "step": 125650 }, { "epoch": 2.3742963998337805, "grad_norm": 0.029324917122721672, "learning_rate": 9.7920575556479e-05, "loss": 0.1257, "step": 125700 }, { "epoch": 2.3752408295870953, "grad_norm": 0.03091776743531227, "learning_rate": 9.791532872451614e-05, "loss": 0.1261, "step": 125750 }, { "epoch": 2.37618525934041, "grad_norm": 0.03024865873157978, "learning_rate": 9.791008189255329e-05, "loss": 0.1261, "step": 125800 }, { "epoch": 2.3771296890937252, "grad_norm": 0.028509100899100304, "learning_rate": 9.790483506059042e-05, "loss": 0.1262, "step": 125850 }, { "epoch": 2.37807411884704, "grad_norm": 0.029800182208418846, "learning_rate": 9.789958822862756e-05, "loss": 0.1258, "step": 125900 }, { "epoch": 2.379018548600355, "grad_norm": 0.03016243875026703, "learning_rate": 9.78943413966647e-05, "loss": 0.1257, "step": 125950 }, { "epoch": 2.37996297835367, "grad_norm": 0.030023276805877686, "learning_rate": 9.788909456470184e-05, "loss": 0.1256, "step": 126000 }, { "epoch": 2.380907408106985, "grad_norm": 0.031432148069143295, "learning_rate": 9.788384773273897e-05, "loss": 0.1261, "step": 126050 }, { "epoch": 2.3818518378603, "grad_norm": 0.03153073787689209, "learning_rate": 9.787860090077612e-05, "loss": 0.1262, "step": 126100 }, { "epoch": 2.3827962676136147, "grad_norm": 0.03001335822045803, "learning_rate": 9.787335406881325e-05, "loss": 0.1258, "step": 126150 }, { "epoch": 2.38374069736693, "grad_norm": 0.02997543290257454, "learning_rate": 9.786810723685039e-05, "loss": 0.126, "step": 126200 }, { "epoch": 2.3846851271202447, "grad_norm": 0.028755608946084976, "learning_rate": 9.786286040488753e-05, "loss": 0.126, "step": 126250 }, { "epoch": 2.38562955687356, "grad_norm": 0.029783451929688454, "learning_rate": 9.785761357292468e-05, "loss": 0.1259, "step": 126300 }, { "epoch": 2.3865739866268747, "grad_norm": 0.031625546514987946, "learning_rate": 9.785236674096182e-05, "loss": 0.1259, "step": 126350 }, { "epoch": 2.3875184163801895, "grad_norm": 0.031450483947992325, "learning_rate": 9.784711990899895e-05, "loss": 0.1259, "step": 126400 }, { "epoch": 2.3884628461335047, "grad_norm": 0.03207407519221306, "learning_rate": 9.78418730770361e-05, "loss": 0.1258, "step": 126450 }, { "epoch": 2.3894072758868194, "grad_norm": 0.029833300039172173, "learning_rate": 9.783662624507323e-05, "loss": 0.1257, "step": 126500 }, { "epoch": 2.3903517056401347, "grad_norm": 0.03075999952852726, "learning_rate": 9.783137941311036e-05, "loss": 0.1258, "step": 126550 }, { "epoch": 2.3912961353934494, "grad_norm": 0.03014497458934784, "learning_rate": 9.782613258114751e-05, "loss": 0.1257, "step": 126600 }, { "epoch": 2.392240565146764, "grad_norm": 0.03092237189412117, "learning_rate": 9.782088574918465e-05, "loss": 0.1257, "step": 126650 }, { "epoch": 2.3931849949000794, "grad_norm": 0.03071182779967785, "learning_rate": 9.781563891722178e-05, "loss": 0.126, "step": 126700 }, { "epoch": 2.394129424653394, "grad_norm": 0.03460408374667168, "learning_rate": 9.781039208525893e-05, "loss": 0.1257, "step": 126750 }, { "epoch": 2.3950738544067094, "grad_norm": 0.030511287972331047, "learning_rate": 9.780514525329606e-05, "loss": 0.126, "step": 126800 }, { "epoch": 2.396018284160024, "grad_norm": 0.03278229385614395, "learning_rate": 9.779989842133321e-05, "loss": 0.1261, "step": 126850 }, { "epoch": 2.3969627139133394, "grad_norm": 0.029480352997779846, "learning_rate": 9.779465158937034e-05, "loss": 0.1258, "step": 126900 }, { "epoch": 2.397907143666654, "grad_norm": 0.030810458585619926, "learning_rate": 9.778940475740748e-05, "loss": 0.1258, "step": 126950 }, { "epoch": 2.398851573419969, "grad_norm": 0.03149948641657829, "learning_rate": 9.778415792544462e-05, "loss": 0.126, "step": 127000 }, { "epoch": 2.399796003173284, "grad_norm": 0.03035249561071396, "learning_rate": 9.777891109348176e-05, "loss": 0.1259, "step": 127050 }, { "epoch": 2.400740432926599, "grad_norm": 0.032149430364370346, "learning_rate": 9.77736642615189e-05, "loss": 0.1263, "step": 127100 }, { "epoch": 2.4016848626799137, "grad_norm": 0.03196382895112038, "learning_rate": 9.776841742955604e-05, "loss": 0.1259, "step": 127150 }, { "epoch": 2.402629292433229, "grad_norm": 0.0302816741168499, "learning_rate": 9.776317059759317e-05, "loss": 0.1255, "step": 127200 }, { "epoch": 2.4035737221865436, "grad_norm": 0.03058108501136303, "learning_rate": 9.775792376563032e-05, "loss": 0.1262, "step": 127250 }, { "epoch": 2.404518151939859, "grad_norm": 0.04030664265155792, "learning_rate": 9.775267693366745e-05, "loss": 0.1261, "step": 127300 }, { "epoch": 2.4054625816931736, "grad_norm": 0.031995028257369995, "learning_rate": 9.77474301017046e-05, "loss": 0.1258, "step": 127350 }, { "epoch": 2.406407011446489, "grad_norm": 0.030386365950107574, "learning_rate": 9.774218326974174e-05, "loss": 0.126, "step": 127400 }, { "epoch": 2.4073514411998036, "grad_norm": 0.030255388468503952, "learning_rate": 9.773693643777887e-05, "loss": 0.1263, "step": 127450 }, { "epoch": 2.4082958709531184, "grad_norm": 0.031969279050827026, "learning_rate": 9.773168960581602e-05, "loss": 0.1256, "step": 127500 }, { "epoch": 2.4082958709531184, "eval_IntDiv": 0.6749806935758513, "eval_NumCircles": 1832, "eval_SumBottleneck": 17.118232449928158, "eval_Uniqueness": 0.9967634267219582, "eval_Validity": 0.9887, "eval_Validity * Uniqueness": 0.9855, "eval_loss": 0.22204314172267914, "eval_runtime": 178.5349, "eval_samples_per_second": 56.011, "eval_steps_per_second": 0.442, "step": 127500 }, { "epoch": 2.4092403007064336, "grad_norm": 0.03162260726094246, "learning_rate": 9.772644277385315e-05, "loss": 0.1256, "step": 127550 }, { "epoch": 2.4101847304597483, "grad_norm": 0.032319579273462296, "learning_rate": 9.772119594189029e-05, "loss": 0.1256, "step": 127600 }, { "epoch": 2.411129160213063, "grad_norm": 0.03165993094444275, "learning_rate": 9.771594910992743e-05, "loss": 0.1258, "step": 127650 }, { "epoch": 2.4120735899663783, "grad_norm": 0.03178146854043007, "learning_rate": 9.771070227796457e-05, "loss": 0.1261, "step": 127700 }, { "epoch": 2.413018019719693, "grad_norm": 0.03087359108030796, "learning_rate": 9.77054554460017e-05, "loss": 0.1262, "step": 127750 }, { "epoch": 2.4139624494730083, "grad_norm": 0.03073815070092678, "learning_rate": 9.770020861403885e-05, "loss": 0.1256, "step": 127800 }, { "epoch": 2.414906879226323, "grad_norm": 0.031517136842012405, "learning_rate": 9.7694961782076e-05, "loss": 0.1258, "step": 127850 }, { "epoch": 2.4158513089796383, "grad_norm": 0.030842887237668037, "learning_rate": 9.768971495011313e-05, "loss": 0.1258, "step": 127900 }, { "epoch": 2.416795738732953, "grad_norm": 0.02955375239253044, "learning_rate": 9.768446811815026e-05, "loss": 0.1259, "step": 127950 }, { "epoch": 2.417740168486268, "grad_norm": 0.029184196144342422, "learning_rate": 9.767922128618741e-05, "loss": 0.1259, "step": 128000 }, { "epoch": 2.418684598239583, "grad_norm": 0.030931448563933372, "learning_rate": 9.767397445422454e-05, "loss": 0.1258, "step": 128050 }, { "epoch": 2.419629027992898, "grad_norm": 0.030501212924718857, "learning_rate": 9.766872762226168e-05, "loss": 0.1261, "step": 128100 }, { "epoch": 2.420573457746213, "grad_norm": 0.03187808394432068, "learning_rate": 9.766348079029883e-05, "loss": 0.1256, "step": 128150 }, { "epoch": 2.421517887499528, "grad_norm": 0.029216798022389412, "learning_rate": 9.765823395833596e-05, "loss": 0.1262, "step": 128200 }, { "epoch": 2.4224623172528426, "grad_norm": 0.03254800662398338, "learning_rate": 9.76529871263731e-05, "loss": 0.1257, "step": 128250 }, { "epoch": 2.4234067470061578, "grad_norm": 0.032217010855674744, "learning_rate": 9.764774029441024e-05, "loss": 0.1259, "step": 128300 }, { "epoch": 2.4243511767594725, "grad_norm": 0.03511874005198479, "learning_rate": 9.764249346244739e-05, "loss": 0.1258, "step": 128350 }, { "epoch": 2.4252956065127877, "grad_norm": 0.03247033432126045, "learning_rate": 9.763724663048451e-05, "loss": 0.1259, "step": 128400 }, { "epoch": 2.4262400362661025, "grad_norm": 0.030106158927083015, "learning_rate": 9.763199979852166e-05, "loss": 0.1258, "step": 128450 }, { "epoch": 2.4271844660194173, "grad_norm": 0.03078060783445835, "learning_rate": 9.76267529665588e-05, "loss": 0.1258, "step": 128500 }, { "epoch": 2.4281288957727325, "grad_norm": 0.03152476251125336, "learning_rate": 9.762150613459592e-05, "loss": 0.126, "step": 128550 }, { "epoch": 2.4290733255260473, "grad_norm": 0.030316533520817757, "learning_rate": 9.761625930263307e-05, "loss": 0.1255, "step": 128600 }, { "epoch": 2.4300177552793625, "grad_norm": 0.029565759003162384, "learning_rate": 9.761101247067022e-05, "loss": 0.1256, "step": 128650 }, { "epoch": 2.4309621850326772, "grad_norm": 0.029535114765167236, "learning_rate": 9.760576563870735e-05, "loss": 0.1255, "step": 128700 }, { "epoch": 2.4319066147859925, "grad_norm": 0.029632851481437683, "learning_rate": 9.760051880674449e-05, "loss": 0.1262, "step": 128750 }, { "epoch": 2.4328510445393072, "grad_norm": 0.029429327696561813, "learning_rate": 9.759527197478163e-05, "loss": 0.1258, "step": 128800 }, { "epoch": 2.433795474292622, "grad_norm": 0.02927103452384472, "learning_rate": 9.759002514281878e-05, "loss": 0.1255, "step": 128850 }, { "epoch": 2.434739904045937, "grad_norm": 0.032307855784893036, "learning_rate": 9.75847783108559e-05, "loss": 0.1255, "step": 128900 }, { "epoch": 2.435684333799252, "grad_norm": 0.029389536008238792, "learning_rate": 9.757953147889305e-05, "loss": 0.1258, "step": 128950 }, { "epoch": 2.4366287635525667, "grad_norm": 0.03070959821343422, "learning_rate": 9.75742846469302e-05, "loss": 0.1256, "step": 129000 }, { "epoch": 2.437573193305882, "grad_norm": 0.029550153762102127, "learning_rate": 9.756903781496732e-05, "loss": 0.1257, "step": 129050 }, { "epoch": 2.4385176230591967, "grad_norm": 0.03148769214749336, "learning_rate": 9.756379098300446e-05, "loss": 0.1256, "step": 129100 }, { "epoch": 2.439462052812512, "grad_norm": 0.02921866998076439, "learning_rate": 9.755854415104161e-05, "loss": 0.1261, "step": 129150 }, { "epoch": 2.4404064825658267, "grad_norm": 0.03157436475157738, "learning_rate": 9.755329731907875e-05, "loss": 0.1257, "step": 129200 }, { "epoch": 2.441350912319142, "grad_norm": 0.029943101108074188, "learning_rate": 9.754805048711588e-05, "loss": 0.1256, "step": 129250 }, { "epoch": 2.4422953420724567, "grad_norm": 0.03219788894057274, "learning_rate": 9.754280365515303e-05, "loss": 0.1261, "step": 129300 }, { "epoch": 2.4432397718257715, "grad_norm": 0.03058514930307865, "learning_rate": 9.753755682319016e-05, "loss": 0.1262, "step": 129350 }, { "epoch": 2.4441842015790867, "grad_norm": 0.029908526688814163, "learning_rate": 9.75323099912273e-05, "loss": 0.1257, "step": 129400 }, { "epoch": 2.4451286313324014, "grad_norm": 0.03076547384262085, "learning_rate": 9.752706315926444e-05, "loss": 0.1256, "step": 129450 }, { "epoch": 2.446073061085716, "grad_norm": 0.03007439710199833, "learning_rate": 9.752181632730159e-05, "loss": 0.1258, "step": 129500 }, { "epoch": 2.4470174908390314, "grad_norm": 0.030883923172950745, "learning_rate": 9.751656949533871e-05, "loss": 0.1255, "step": 129550 }, { "epoch": 2.447961920592346, "grad_norm": 0.030147844925522804, "learning_rate": 9.751132266337586e-05, "loss": 0.126, "step": 129600 }, { "epoch": 2.4489063503456614, "grad_norm": 0.03255255147814751, "learning_rate": 9.7506075831413e-05, "loss": 0.1258, "step": 129650 }, { "epoch": 2.449850780098976, "grad_norm": 0.03039463423192501, "learning_rate": 9.750082899945014e-05, "loss": 0.1256, "step": 129700 }, { "epoch": 2.4507952098522914, "grad_norm": 0.029357634484767914, "learning_rate": 9.749558216748727e-05, "loss": 0.1247, "step": 129750 }, { "epoch": 2.451739639605606, "grad_norm": 0.03129146248102188, "learning_rate": 9.749033533552442e-05, "loss": 0.1259, "step": 129800 }, { "epoch": 2.452684069358921, "grad_norm": 0.03086383268237114, "learning_rate": 9.748508850356155e-05, "loss": 0.1257, "step": 129850 }, { "epoch": 2.453628499112236, "grad_norm": 0.0311911478638649, "learning_rate": 9.747984167159869e-05, "loss": 0.1256, "step": 129900 }, { "epoch": 2.454572928865551, "grad_norm": 0.029697343707084656, "learning_rate": 9.747459483963584e-05, "loss": 0.1253, "step": 129950 }, { "epoch": 2.455517358618866, "grad_norm": 0.03087482415139675, "learning_rate": 9.746934800767297e-05, "loss": 0.1258, "step": 130000 }, { "epoch": 2.455517358618866, "eval_IntDiv": 0.6738869845251874, "eval_NumCircles": 1752, "eval_SumBottleneck": 108.57887880376416, "eval_Uniqueness": 0.9960590137429264, "eval_Validity": 0.9896, "eval_Validity * Uniqueness": 0.9857, "eval_loss": 0.22618694603443146, "eval_runtime": 153.0975, "eval_samples_per_second": 65.318, "eval_steps_per_second": 0.516, "step": 130000 }, { "epoch": 2.456461788372181, "grad_norm": 0.030074989423155785, "learning_rate": 9.74641011757101e-05, "loss": 0.1254, "step": 130050 }, { "epoch": 2.4574062181254956, "grad_norm": 0.029410509392619133, "learning_rate": 9.745885434374725e-05, "loss": 0.1257, "step": 130100 }, { "epoch": 2.458350647878811, "grad_norm": 0.031873103231191635, "learning_rate": 9.745360751178439e-05, "loss": 0.1255, "step": 130150 }, { "epoch": 2.4592950776321256, "grad_norm": 0.02962912991642952, "learning_rate": 9.744836067982153e-05, "loss": 0.1254, "step": 130200 }, { "epoch": 2.460239507385441, "grad_norm": 0.030474258586764336, "learning_rate": 9.744311384785867e-05, "loss": 0.1254, "step": 130250 }, { "epoch": 2.4611839371387556, "grad_norm": 0.029951393604278564, "learning_rate": 9.743786701589581e-05, "loss": 0.1259, "step": 130300 }, { "epoch": 2.4621283668920704, "grad_norm": 0.030843082815408707, "learning_rate": 9.743262018393295e-05, "loss": 0.1258, "step": 130350 }, { "epoch": 2.4630727966453856, "grad_norm": 0.033163897693157196, "learning_rate": 9.742737335197008e-05, "loss": 0.1258, "step": 130400 }, { "epoch": 2.4640172263987004, "grad_norm": 0.03033023327589035, "learning_rate": 9.742212652000723e-05, "loss": 0.1257, "step": 130450 }, { "epoch": 2.4649616561520156, "grad_norm": 0.029983418062329292, "learning_rate": 9.741687968804436e-05, "loss": 0.1254, "step": 130500 }, { "epoch": 2.4659060859053303, "grad_norm": 0.031683046370744705, "learning_rate": 9.74116328560815e-05, "loss": 0.1254, "step": 130550 }, { "epoch": 2.4668505156586455, "grad_norm": 0.03159486874938011, "learning_rate": 9.740638602411864e-05, "loss": 0.1257, "step": 130600 }, { "epoch": 2.4677949454119603, "grad_norm": 0.03095719777047634, "learning_rate": 9.740113919215578e-05, "loss": 0.1258, "step": 130650 }, { "epoch": 2.468739375165275, "grad_norm": 0.033382389694452286, "learning_rate": 9.739589236019293e-05, "loss": 0.1257, "step": 130700 }, { "epoch": 2.4696838049185903, "grad_norm": 0.031587596982717514, "learning_rate": 9.739064552823006e-05, "loss": 0.1257, "step": 130750 }, { "epoch": 2.470628234671905, "grad_norm": 0.032326068729162216, "learning_rate": 9.73853986962672e-05, "loss": 0.1251, "step": 130800 }, { "epoch": 2.47157266442522, "grad_norm": 0.030911488458514214, "learning_rate": 9.738015186430434e-05, "loss": 0.1256, "step": 130850 }, { "epoch": 2.472517094178535, "grad_norm": 0.02997417375445366, "learning_rate": 9.737490503234148e-05, "loss": 0.1256, "step": 130900 }, { "epoch": 2.47346152393185, "grad_norm": 0.03371577709913254, "learning_rate": 9.736965820037861e-05, "loss": 0.1258, "step": 130950 }, { "epoch": 2.474405953685165, "grad_norm": 0.062081847339868546, "learning_rate": 9.736441136841576e-05, "loss": 0.1265, "step": 131000 }, { "epoch": 2.47535038343848, "grad_norm": 0.029059462249279022, "learning_rate": 9.735916453645289e-05, "loss": 0.1254, "step": 131050 }, { "epoch": 2.476294813191795, "grad_norm": 0.03081386536359787, "learning_rate": 9.735391770449004e-05, "loss": 0.1251, "step": 131100 }, { "epoch": 2.4772392429451098, "grad_norm": 0.030498944222927094, "learning_rate": 9.734867087252717e-05, "loss": 0.1257, "step": 131150 }, { "epoch": 2.4781836726984245, "grad_norm": 0.03168106824159622, "learning_rate": 9.734342404056432e-05, "loss": 0.1255, "step": 131200 }, { "epoch": 2.4791281024517398, "grad_norm": 0.029555438086390495, "learning_rate": 9.733817720860145e-05, "loss": 0.1253, "step": 131250 }, { "epoch": 2.4800725322050545, "grad_norm": 0.030375482514500618, "learning_rate": 9.733293037663859e-05, "loss": 0.1257, "step": 131300 }, { "epoch": 2.4810169619583693, "grad_norm": 0.02995748072862625, "learning_rate": 9.732768354467573e-05, "loss": 0.1254, "step": 131350 }, { "epoch": 2.4819613917116845, "grad_norm": 0.0309746153652668, "learning_rate": 9.732243671271287e-05, "loss": 0.1258, "step": 131400 }, { "epoch": 2.4829058214649993, "grad_norm": 0.032020267099142075, "learning_rate": 9.731718988075e-05, "loss": 0.1257, "step": 131450 }, { "epoch": 2.4838502512183145, "grad_norm": 0.02980688586831093, "learning_rate": 9.731194304878715e-05, "loss": 0.1257, "step": 131500 }, { "epoch": 2.4847946809716293, "grad_norm": 0.02965422347187996, "learning_rate": 9.730669621682428e-05, "loss": 0.1255, "step": 131550 }, { "epoch": 2.4857391107249445, "grad_norm": 0.03347427770495415, "learning_rate": 9.730144938486142e-05, "loss": 0.1255, "step": 131600 }, { "epoch": 2.4866835404782592, "grad_norm": 0.029343770816922188, "learning_rate": 9.729620255289856e-05, "loss": 0.1261, "step": 131650 }, { "epoch": 2.487627970231574, "grad_norm": 0.03250967338681221, "learning_rate": 9.729095572093571e-05, "loss": 0.1252, "step": 131700 }, { "epoch": 2.488572399984889, "grad_norm": 0.028727497905492783, "learning_rate": 9.728570888897283e-05, "loss": 0.1253, "step": 131750 }, { "epoch": 2.489516829738204, "grad_norm": 0.029668500646948814, "learning_rate": 9.728046205700998e-05, "loss": 0.1255, "step": 131800 }, { "epoch": 2.490461259491519, "grad_norm": 0.031547147780656815, "learning_rate": 9.727521522504713e-05, "loss": 0.1254, "step": 131850 }, { "epoch": 2.491405689244834, "grad_norm": 0.0307680182158947, "learning_rate": 9.726996839308426e-05, "loss": 0.1255, "step": 131900 }, { "epoch": 2.4923501189981487, "grad_norm": 0.030757635831832886, "learning_rate": 9.72647215611214e-05, "loss": 0.1253, "step": 131950 }, { "epoch": 2.493294548751464, "grad_norm": 0.029581965878605843, "learning_rate": 9.725947472915854e-05, "loss": 0.1258, "step": 132000 }, { "epoch": 2.4942389785047787, "grad_norm": 0.029111281037330627, "learning_rate": 9.725422789719568e-05, "loss": 0.1255, "step": 132050 }, { "epoch": 2.495183408258094, "grad_norm": 0.029316168278455734, "learning_rate": 9.724898106523281e-05, "loss": 0.1257, "step": 132100 }, { "epoch": 2.4961278380114087, "grad_norm": 0.029891720041632652, "learning_rate": 9.724373423326996e-05, "loss": 0.1252, "step": 132150 }, { "epoch": 2.4970722677647235, "grad_norm": 0.029518865048885345, "learning_rate": 9.72384874013071e-05, "loss": 0.1253, "step": 132200 }, { "epoch": 2.4980166975180387, "grad_norm": 0.03103054314851761, "learning_rate": 9.723324056934423e-05, "loss": 0.1251, "step": 132250 }, { "epoch": 2.4989611272713534, "grad_norm": 0.030240988358855247, "learning_rate": 9.722799373738137e-05, "loss": 0.1256, "step": 132300 }, { "epoch": 2.4999055570246687, "grad_norm": 0.031186047941446304, "learning_rate": 9.722274690541852e-05, "loss": 0.1258, "step": 132350 }, { "epoch": 2.5008499867779834, "grad_norm": 0.03039182908833027, "learning_rate": 9.721750007345564e-05, "loss": 0.1254, "step": 132400 }, { "epoch": 2.5017944165312986, "grad_norm": 0.03073803521692753, "learning_rate": 9.721225324149279e-05, "loss": 0.1255, "step": 132450 }, { "epoch": 2.5027388462846134, "grad_norm": 0.02909904345870018, "learning_rate": 9.720700640952994e-05, "loss": 0.1256, "step": 132500 }, { "epoch": 2.5027388462846134, "eval_IntDiv": 0.6756204959571669, "eval_NumCircles": 1770, "eval_SumBottleneck": 67.2682450513192, "eval_Uniqueness": 0.9966653193209377, "eval_Validity": 0.9896, "eval_Validity * Uniqueness": 0.9863, "eval_loss": 0.22361724078655243, "eval_runtime": 145.5363, "eval_samples_per_second": 68.711, "eval_steps_per_second": 0.543, "step": 132500 }, { "epoch": 2.503683276037928, "grad_norm": 0.030198320746421814, "learning_rate": 9.720175957756707e-05, "loss": 0.1255, "step": 132550 }, { "epoch": 2.5046277057912434, "grad_norm": 0.030344273895025253, "learning_rate": 9.71965127456042e-05, "loss": 0.1254, "step": 132600 }, { "epoch": 2.505572135544558, "grad_norm": 0.031055618077516556, "learning_rate": 9.719126591364135e-05, "loss": 0.1254, "step": 132650 }, { "epoch": 2.506516565297873, "grad_norm": 0.02936367690563202, "learning_rate": 9.718601908167849e-05, "loss": 0.1254, "step": 132700 }, { "epoch": 2.507460995051188, "grad_norm": 0.030568424612283707, "learning_rate": 9.718077224971562e-05, "loss": 0.1255, "step": 132750 }, { "epoch": 2.508405424804503, "grad_norm": 0.028994325548410416, "learning_rate": 9.717552541775277e-05, "loss": 0.1254, "step": 132800 }, { "epoch": 2.509349854557818, "grad_norm": 0.030606715008616447, "learning_rate": 9.717027858578991e-05, "loss": 0.1256, "step": 132850 }, { "epoch": 2.510294284311133, "grad_norm": 0.030216315761208534, "learning_rate": 9.716503175382703e-05, "loss": 0.1259, "step": 132900 }, { "epoch": 2.511238714064448, "grad_norm": 0.030603960156440735, "learning_rate": 9.715978492186418e-05, "loss": 0.1253, "step": 132950 }, { "epoch": 2.512183143817763, "grad_norm": 0.03096739761531353, "learning_rate": 9.715453808990133e-05, "loss": 0.1257, "step": 133000 }, { "epoch": 2.5131275735710776, "grad_norm": 0.02949897013604641, "learning_rate": 9.714929125793846e-05, "loss": 0.1254, "step": 133050 }, { "epoch": 2.514072003324393, "grad_norm": 0.030979987233877182, "learning_rate": 9.71440444259756e-05, "loss": 0.1253, "step": 133100 }, { "epoch": 2.5150164330777076, "grad_norm": 0.029318055137991905, "learning_rate": 9.713879759401274e-05, "loss": 0.1252, "step": 133150 }, { "epoch": 2.5159608628310224, "grad_norm": 0.03115161880850792, "learning_rate": 9.713355076204988e-05, "loss": 0.1253, "step": 133200 }, { "epoch": 2.5169052925843376, "grad_norm": 0.031060202047228813, "learning_rate": 9.712830393008701e-05, "loss": 0.1252, "step": 133250 }, { "epoch": 2.5178497223376524, "grad_norm": 0.03146335855126381, "learning_rate": 9.712305709812416e-05, "loss": 0.1256, "step": 133300 }, { "epoch": 2.5187941520909676, "grad_norm": 0.032398175448179245, "learning_rate": 9.71178102661613e-05, "loss": 0.1255, "step": 133350 }, { "epoch": 2.5197385818442823, "grad_norm": 0.029489295557141304, "learning_rate": 9.711256343419843e-05, "loss": 0.1255, "step": 133400 }, { "epoch": 2.5206830115975976, "grad_norm": 0.030793625861406326, "learning_rate": 9.710731660223558e-05, "loss": 0.1251, "step": 133450 }, { "epoch": 2.5216274413509123, "grad_norm": 0.03075922466814518, "learning_rate": 9.710206977027272e-05, "loss": 0.1256, "step": 133500 }, { "epoch": 2.522571871104227, "grad_norm": 0.029393164440989494, "learning_rate": 9.709682293830986e-05, "loss": 0.1254, "step": 133550 }, { "epoch": 2.5235163008575423, "grad_norm": 0.02911745384335518, "learning_rate": 9.709157610634699e-05, "loss": 0.1254, "step": 133600 }, { "epoch": 2.524460730610857, "grad_norm": 0.03193994238972664, "learning_rate": 9.708632927438414e-05, "loss": 0.1254, "step": 133650 }, { "epoch": 2.525405160364172, "grad_norm": 0.030375948175787926, "learning_rate": 9.708108244242127e-05, "loss": 0.1256, "step": 133700 }, { "epoch": 2.526349590117487, "grad_norm": 0.03206557780504227, "learning_rate": 9.70758356104584e-05, "loss": 0.1253, "step": 133750 }, { "epoch": 2.5272940198708023, "grad_norm": 0.030131135135889053, "learning_rate": 9.707058877849555e-05, "loss": 0.1251, "step": 133800 }, { "epoch": 2.528238449624117, "grad_norm": 0.03141976147890091, "learning_rate": 9.706534194653269e-05, "loss": 0.1248, "step": 133850 }, { "epoch": 2.529182879377432, "grad_norm": 0.03130596503615379, "learning_rate": 9.706009511456982e-05, "loss": 0.1251, "step": 133900 }, { "epoch": 2.530127309130747, "grad_norm": 0.030236775055527687, "learning_rate": 9.705484828260697e-05, "loss": 0.1252, "step": 133950 }, { "epoch": 2.531071738884062, "grad_norm": 0.03183705359697342, "learning_rate": 9.70496014506441e-05, "loss": 0.1256, "step": 134000 }, { "epoch": 2.5320161686373766, "grad_norm": 0.03074331395328045, "learning_rate": 9.704435461868125e-05, "loss": 0.125, "step": 134050 }, { "epoch": 2.5329605983906918, "grad_norm": 0.029482737183570862, "learning_rate": 9.703910778671838e-05, "loss": 0.1248, "step": 134100 }, { "epoch": 2.5339050281440065, "grad_norm": 0.03448597341775894, "learning_rate": 9.703386095475552e-05, "loss": 0.1256, "step": 134150 }, { "epoch": 2.5348494578973217, "grad_norm": 0.0318196676671505, "learning_rate": 9.702861412279267e-05, "loss": 0.1253, "step": 134200 }, { "epoch": 2.5357938876506365, "grad_norm": 0.03066682070493698, "learning_rate": 9.70233672908298e-05, "loss": 0.1251, "step": 134250 }, { "epoch": 2.5367383174039517, "grad_norm": 0.02901112101972103, "learning_rate": 9.701812045886695e-05, "loss": 0.1252, "step": 134300 }, { "epoch": 2.5376827471572665, "grad_norm": 0.029728412628173828, "learning_rate": 9.701287362690408e-05, "loss": 0.1255, "step": 134350 }, { "epoch": 2.5386271769105813, "grad_norm": 0.03380723297595978, "learning_rate": 9.700762679494121e-05, "loss": 0.1252, "step": 134400 }, { "epoch": 2.5395716066638965, "grad_norm": 0.032415639609098434, "learning_rate": 9.700237996297836e-05, "loss": 0.1253, "step": 134450 }, { "epoch": 2.5405160364172112, "grad_norm": 0.031910937279462814, "learning_rate": 9.69971331310155e-05, "loss": 0.1254, "step": 134500 }, { "epoch": 2.541460466170526, "grad_norm": 0.030924534425139427, "learning_rate": 9.699188629905264e-05, "loss": 0.1251, "step": 134550 }, { "epoch": 2.5424048959238412, "grad_norm": 0.03125675022602081, "learning_rate": 9.698663946708978e-05, "loss": 0.1257, "step": 134600 }, { "epoch": 2.543349325677156, "grad_norm": 0.0296334195882082, "learning_rate": 9.698139263512691e-05, "loss": 0.1252, "step": 134650 }, { "epoch": 2.544293755430471, "grad_norm": 0.030433109030127525, "learning_rate": 9.697614580316406e-05, "loss": 0.1252, "step": 134700 }, { "epoch": 2.545238185183786, "grad_norm": 0.02993951551616192, "learning_rate": 9.697089897120119e-05, "loss": 0.1252, "step": 134750 }, { "epoch": 2.546182614937101, "grad_norm": 0.03202015161514282, "learning_rate": 9.696565213923833e-05, "loss": 0.1252, "step": 134800 }, { "epoch": 2.547127044690416, "grad_norm": 0.03057137317955494, "learning_rate": 9.696040530727547e-05, "loss": 0.1254, "step": 134850 }, { "epoch": 2.5480714744437307, "grad_norm": 0.029324673116207123, "learning_rate": 9.695515847531261e-05, "loss": 0.1251, "step": 134900 }, { "epoch": 2.549015904197046, "grad_norm": 0.03202293813228607, "learning_rate": 9.694991164334974e-05, "loss": 0.1254, "step": 134950 }, { "epoch": 2.5499603339503607, "grad_norm": 0.029453586786985397, "learning_rate": 9.694466481138689e-05, "loss": 0.1254, "step": 135000 }, { "epoch": 2.5499603339503607, "eval_IntDiv": 0.6757105462165724, "eval_NumCircles": 1819, "eval_SumBottleneck": 113.6150694080732, "eval_Uniqueness": 0.9959551016280715, "eval_Validity": 0.9889, "eval_Validity * Uniqueness": 0.9849, "eval_loss": 0.22135719656944275, "eval_runtime": 158.3072, "eval_samples_per_second": 63.168, "eval_steps_per_second": 0.499, "step": 135000 }, { "epoch": 2.5509047637036755, "grad_norm": 0.029841803014278412, "learning_rate": 9.693941797942404e-05, "loss": 0.1254, "step": 135050 }, { "epoch": 2.5518491934569907, "grad_norm": 0.02987363375723362, "learning_rate": 9.693417114746117e-05, "loss": 0.1255, "step": 135100 }, { "epoch": 2.5527936232103055, "grad_norm": 0.03126811236143112, "learning_rate": 9.69289243154983e-05, "loss": 0.1251, "step": 135150 }, { "epoch": 2.5537380529636207, "grad_norm": 0.030623845756053925, "learning_rate": 9.692367748353545e-05, "loss": 0.125, "step": 135200 }, { "epoch": 2.5546824827169354, "grad_norm": 0.029703468084335327, "learning_rate": 9.691843065157259e-05, "loss": 0.1254, "step": 135250 }, { "epoch": 2.5556269124702506, "grad_norm": 0.029651472344994545, "learning_rate": 9.691318381960972e-05, "loss": 0.1251, "step": 135300 }, { "epoch": 2.5565713422235654, "grad_norm": 0.029780074954032898, "learning_rate": 9.690793698764687e-05, "loss": 0.1254, "step": 135350 }, { "epoch": 2.55751577197688, "grad_norm": 0.030976980924606323, "learning_rate": 9.6902690155684e-05, "loss": 0.1252, "step": 135400 }, { "epoch": 2.5584602017301954, "grad_norm": 0.03146212920546532, "learning_rate": 9.689744332372113e-05, "loss": 0.1252, "step": 135450 }, { "epoch": 2.55940463148351, "grad_norm": 0.029765963554382324, "learning_rate": 9.689219649175828e-05, "loss": 0.1255, "step": 135500 }, { "epoch": 2.560349061236825, "grad_norm": 0.030256252735853195, "learning_rate": 9.688694965979543e-05, "loss": 0.1251, "step": 135550 }, { "epoch": 2.56129349099014, "grad_norm": 0.03131643310189247, "learning_rate": 9.688170282783255e-05, "loss": 0.125, "step": 135600 }, { "epoch": 2.5622379207434554, "grad_norm": 0.03051631525158882, "learning_rate": 9.68764559958697e-05, "loss": 0.1255, "step": 135650 }, { "epoch": 2.56318235049677, "grad_norm": 0.0293186753988266, "learning_rate": 9.687120916390684e-05, "loss": 0.1252, "step": 135700 }, { "epoch": 2.564126780250085, "grad_norm": 0.030304742977023125, "learning_rate": 9.686596233194398e-05, "loss": 0.1248, "step": 135750 }, { "epoch": 2.5650712100034, "grad_norm": 0.029475709423422813, "learning_rate": 9.686071549998111e-05, "loss": 0.1252, "step": 135800 }, { "epoch": 2.566015639756715, "grad_norm": 0.03071817383170128, "learning_rate": 9.685546866801826e-05, "loss": 0.1251, "step": 135850 }, { "epoch": 2.5669600695100296, "grad_norm": 0.03155483305454254, "learning_rate": 9.68502218360554e-05, "loss": 0.1254, "step": 135900 }, { "epoch": 2.567904499263345, "grad_norm": 0.030977396294474602, "learning_rate": 9.684497500409253e-05, "loss": 0.1252, "step": 135950 }, { "epoch": 2.5688489290166596, "grad_norm": 0.031048251315951347, "learning_rate": 9.683972817212968e-05, "loss": 0.1249, "step": 136000 }, { "epoch": 2.569793358769975, "grad_norm": 0.03027273900806904, "learning_rate": 9.683448134016681e-05, "loss": 0.1252, "step": 136050 }, { "epoch": 2.5707377885232896, "grad_norm": 0.031511738896369934, "learning_rate": 9.682923450820394e-05, "loss": 0.125, "step": 136100 }, { "epoch": 2.571682218276605, "grad_norm": 0.031236708164215088, "learning_rate": 9.682398767624109e-05, "loss": 0.1252, "step": 136150 }, { "epoch": 2.5726266480299196, "grad_norm": 0.030984243378043175, "learning_rate": 9.681874084427824e-05, "loss": 0.1253, "step": 136200 }, { "epoch": 2.5735710777832344, "grad_norm": 0.030252605676651, "learning_rate": 9.681349401231536e-05, "loss": 0.1253, "step": 136250 }, { "epoch": 2.5745155075365496, "grad_norm": 0.032272472977638245, "learning_rate": 9.68082471803525e-05, "loss": 0.1249, "step": 136300 }, { "epoch": 2.5754599372898643, "grad_norm": 0.029683703556656837, "learning_rate": 9.680300034838965e-05, "loss": 0.1254, "step": 136350 }, { "epoch": 2.576404367043179, "grad_norm": 0.030713027343153954, "learning_rate": 9.679775351642679e-05, "loss": 0.1251, "step": 136400 }, { "epoch": 2.5773487967964943, "grad_norm": 0.03206394240260124, "learning_rate": 9.679250668446392e-05, "loss": 0.1252, "step": 136450 }, { "epoch": 2.578293226549809, "grad_norm": 0.03190517798066139, "learning_rate": 9.678725985250107e-05, "loss": 0.125, "step": 136500 }, { "epoch": 2.5792376563031243, "grad_norm": 0.030424444004893303, "learning_rate": 9.67820130205382e-05, "loss": 0.125, "step": 136550 }, { "epoch": 2.580182086056439, "grad_norm": 0.030477305874228477, "learning_rate": 9.677676618857534e-05, "loss": 0.1252, "step": 136600 }, { "epoch": 2.5811265158097543, "grad_norm": 0.030125759541988373, "learning_rate": 9.677151935661248e-05, "loss": 0.1253, "step": 136650 }, { "epoch": 2.582070945563069, "grad_norm": 0.030539261177182198, "learning_rate": 9.676627252464963e-05, "loss": 0.1254, "step": 136700 }, { "epoch": 2.583015375316384, "grad_norm": 0.030906861647963524, "learning_rate": 9.676102569268675e-05, "loss": 0.1253, "step": 136750 }, { "epoch": 2.583959805069699, "grad_norm": 0.02998339757323265, "learning_rate": 9.67557788607239e-05, "loss": 0.1255, "step": 136800 }, { "epoch": 2.584904234823014, "grad_norm": 0.03106423281133175, "learning_rate": 9.675053202876105e-05, "loss": 0.1248, "step": 136850 }, { "epoch": 2.5858486645763286, "grad_norm": 0.03145177289843559, "learning_rate": 9.674528519679818e-05, "loss": 0.1249, "step": 136900 }, { "epoch": 2.5867930943296438, "grad_norm": 0.03156405687332153, "learning_rate": 9.674003836483531e-05, "loss": 0.1245, "step": 136950 }, { "epoch": 2.587737524082959, "grad_norm": 0.0317852720618248, "learning_rate": 9.673479153287246e-05, "loss": 0.1254, "step": 137000 }, { "epoch": 2.5886819538362738, "grad_norm": 0.030165698379278183, "learning_rate": 9.67295447009096e-05, "loss": 0.1252, "step": 137050 }, { "epoch": 2.5896263835895885, "grad_norm": 0.029607661068439484, "learning_rate": 9.672429786894673e-05, "loss": 0.1254, "step": 137100 }, { "epoch": 2.5905708133429037, "grad_norm": 0.0298980250954628, "learning_rate": 9.671905103698388e-05, "loss": 0.125, "step": 137150 }, { "epoch": 2.5915152430962185, "grad_norm": 0.030301345512270927, "learning_rate": 9.671380420502101e-05, "loss": 0.1252, "step": 137200 }, { "epoch": 2.5924596728495333, "grad_norm": 0.0307435505092144, "learning_rate": 9.670855737305815e-05, "loss": 0.125, "step": 137250 }, { "epoch": 2.5934041026028485, "grad_norm": 0.031235698610544205, "learning_rate": 9.670331054109529e-05, "loss": 0.1254, "step": 137300 }, { "epoch": 2.5943485323561633, "grad_norm": 0.029005499556660652, "learning_rate": 9.669806370913244e-05, "loss": 0.1252, "step": 137350 }, { "epoch": 2.5952929621094785, "grad_norm": 0.03244328498840332, "learning_rate": 9.669281687716957e-05, "loss": 0.1253, "step": 137400 }, { "epoch": 2.5962373918627932, "grad_norm": 0.029643896967172623, "learning_rate": 9.668757004520671e-05, "loss": 0.1255, "step": 137450 }, { "epoch": 2.5971818216161084, "grad_norm": 0.03186696022748947, "learning_rate": 9.668232321324386e-05, "loss": 0.1251, "step": 137500 }, { "epoch": 2.5971818216161084, "eval_IntDiv": 0.6745818341458489, "eval_NumCircles": 1768, "eval_SumBottleneck": 84.59764215725035, "eval_Uniqueness": 0.996566696960517, "eval_Validity": 0.9903, "eval_Validity * Uniqueness": 0.9869, "eval_loss": 0.22427041828632355, "eval_runtime": 164.3278, "eval_samples_per_second": 60.854, "eval_steps_per_second": 0.481, "step": 137500 }, { "epoch": 2.598126251369423, "grad_norm": 0.03159765899181366, "learning_rate": 9.667707638128099e-05, "loss": 0.1248, "step": 137550 }, { "epoch": 2.599070681122738, "grad_norm": 0.031029582023620605, "learning_rate": 9.667182954931812e-05, "loss": 0.125, "step": 137600 }, { "epoch": 2.600015110876053, "grad_norm": 0.030903464183211327, "learning_rate": 9.666658271735527e-05, "loss": 0.1252, "step": 137650 }, { "epoch": 2.600959540629368, "grad_norm": 0.029926655814051628, "learning_rate": 9.66613358853924e-05, "loss": 0.1248, "step": 137700 }, { "epoch": 2.6019039703826827, "grad_norm": 0.03032410703599453, "learning_rate": 9.665608905342954e-05, "loss": 0.1246, "step": 137750 }, { "epoch": 2.602848400135998, "grad_norm": 0.03210930898785591, "learning_rate": 9.665084222146669e-05, "loss": 0.1254, "step": 137800 }, { "epoch": 2.6037928298893127, "grad_norm": 0.030375441536307335, "learning_rate": 9.664559538950382e-05, "loss": 0.125, "step": 137850 }, { "epoch": 2.604737259642628, "grad_norm": 0.03106711432337761, "learning_rate": 9.664034855754097e-05, "loss": 0.1255, "step": 137900 }, { "epoch": 2.6056816893959427, "grad_norm": 0.030868416652083397, "learning_rate": 9.66351017255781e-05, "loss": 0.1254, "step": 137950 }, { "epoch": 2.606626119149258, "grad_norm": 0.02921781875193119, "learning_rate": 9.662985489361523e-05, "loss": 0.125, "step": 138000 }, { "epoch": 2.6075705489025727, "grad_norm": 0.03369951620697975, "learning_rate": 9.662460806165238e-05, "loss": 0.1247, "step": 138050 }, { "epoch": 2.6085149786558874, "grad_norm": 0.02885156124830246, "learning_rate": 9.661936122968952e-05, "loss": 0.1252, "step": 138100 }, { "epoch": 2.6094594084092027, "grad_norm": 0.029856203123927116, "learning_rate": 9.661411439772666e-05, "loss": 0.1252, "step": 138150 }, { "epoch": 2.6104038381625174, "grad_norm": 0.03181063011288643, "learning_rate": 9.66088675657638e-05, "loss": 0.1248, "step": 138200 }, { "epoch": 2.611348267915832, "grad_norm": 0.030621390789747238, "learning_rate": 9.660362073380093e-05, "loss": 0.1247, "step": 138250 }, { "epoch": 2.6122926976691474, "grad_norm": 0.029942961409687996, "learning_rate": 9.659837390183808e-05, "loss": 0.1246, "step": 138300 }, { "epoch": 2.613237127422462, "grad_norm": 0.030427340418100357, "learning_rate": 9.659312706987521e-05, "loss": 0.1252, "step": 138350 }, { "epoch": 2.6141815571757774, "grad_norm": 0.030616551637649536, "learning_rate": 9.658788023791236e-05, "loss": 0.1248, "step": 138400 }, { "epoch": 2.615125986929092, "grad_norm": 0.03042016550898552, "learning_rate": 9.65826334059495e-05, "loss": 0.1252, "step": 138450 }, { "epoch": 2.6160704166824074, "grad_norm": 0.03129958733916283, "learning_rate": 9.657738657398663e-05, "loss": 0.1248, "step": 138500 }, { "epoch": 2.617014846435722, "grad_norm": 0.029363177716732025, "learning_rate": 9.657213974202378e-05, "loss": 0.1253, "step": 138550 }, { "epoch": 2.617959276189037, "grad_norm": 0.03179867938160896, "learning_rate": 9.656689291006091e-05, "loss": 0.1251, "step": 138600 }, { "epoch": 2.618903705942352, "grad_norm": 0.030565332621335983, "learning_rate": 9.656164607809804e-05, "loss": 0.1247, "step": 138650 }, { "epoch": 2.619848135695667, "grad_norm": 0.030077271163463593, "learning_rate": 9.655639924613519e-05, "loss": 0.1251, "step": 138700 }, { "epoch": 2.6207925654489816, "grad_norm": 0.03181888908147812, "learning_rate": 9.655115241417232e-05, "loss": 0.1253, "step": 138750 }, { "epoch": 2.621736995202297, "grad_norm": 0.029745711013674736, "learning_rate": 9.654590558220946e-05, "loss": 0.1247, "step": 138800 }, { "epoch": 2.622681424955612, "grad_norm": 0.030187029391527176, "learning_rate": 9.65406587502466e-05, "loss": 0.1251, "step": 138850 }, { "epoch": 2.623625854708927, "grad_norm": 0.030486902222037315, "learning_rate": 9.653541191828375e-05, "loss": 0.1247, "step": 138900 }, { "epoch": 2.6245702844622416, "grad_norm": 0.029948486015200615, "learning_rate": 9.653016508632089e-05, "loss": 0.1247, "step": 138950 }, { "epoch": 2.625514714215557, "grad_norm": 0.03125929832458496, "learning_rate": 9.652491825435802e-05, "loss": 0.1254, "step": 139000 }, { "epoch": 2.6264591439688716, "grad_norm": 0.030087046325206757, "learning_rate": 9.651967142239517e-05, "loss": 0.1249, "step": 139050 }, { "epoch": 2.6274035737221864, "grad_norm": 0.030551616102457047, "learning_rate": 9.65144245904323e-05, "loss": 0.1251, "step": 139100 }, { "epoch": 2.6283480034755016, "grad_norm": 0.029612518846988678, "learning_rate": 9.650917775846944e-05, "loss": 0.1247, "step": 139150 }, { "epoch": 2.6292924332288163, "grad_norm": 0.032431695610284805, "learning_rate": 9.650393092650658e-05, "loss": 0.1249, "step": 139200 }, { "epoch": 2.6302368629821316, "grad_norm": 0.03299001231789589, "learning_rate": 9.649868409454372e-05, "loss": 0.1253, "step": 139250 }, { "epoch": 2.6311812927354463, "grad_norm": 0.029100149869918823, "learning_rate": 9.649343726258085e-05, "loss": 0.125, "step": 139300 }, { "epoch": 2.6321257224887615, "grad_norm": 0.0315014123916626, "learning_rate": 9.6488190430618e-05, "loss": 0.1247, "step": 139350 }, { "epoch": 2.6330701522420763, "grad_norm": 0.03037048503756523, "learning_rate": 9.648294359865513e-05, "loss": 0.125, "step": 139400 }, { "epoch": 2.634014581995391, "grad_norm": 0.030029380694031715, "learning_rate": 9.647769676669227e-05, "loss": 0.1253, "step": 139450 }, { "epoch": 2.6349590117487063, "grad_norm": 0.030272047966718674, "learning_rate": 9.647244993472941e-05, "loss": 0.1248, "step": 139500 }, { "epoch": 2.635903441502021, "grad_norm": 0.034756001085042953, "learning_rate": 9.646720310276656e-05, "loss": 0.1247, "step": 139550 }, { "epoch": 2.636847871255336, "grad_norm": 0.02903776243329048, "learning_rate": 9.646195627080368e-05, "loss": 0.125, "step": 139600 }, { "epoch": 2.637792301008651, "grad_norm": 0.030790897086262703, "learning_rate": 9.645670943884083e-05, "loss": 0.1248, "step": 139650 }, { "epoch": 2.638736730761966, "grad_norm": 0.029581811279058456, "learning_rate": 9.645146260687798e-05, "loss": 0.1245, "step": 139700 }, { "epoch": 2.639681160515281, "grad_norm": 0.0328785739839077, "learning_rate": 9.644621577491511e-05, "loss": 0.1246, "step": 139750 }, { "epoch": 2.640625590268596, "grad_norm": 0.030750280246138573, "learning_rate": 9.644096894295225e-05, "loss": 0.125, "step": 139800 }, { "epoch": 2.641570020021911, "grad_norm": 0.029267912730574608, "learning_rate": 9.643572211098939e-05, "loss": 0.1252, "step": 139850 }, { "epoch": 2.6425144497752258, "grad_norm": 0.029781755059957504, "learning_rate": 9.643047527902653e-05, "loss": 0.1245, "step": 139900 }, { "epoch": 2.6434588795285405, "grad_norm": 0.028933921828866005, "learning_rate": 9.642522844706366e-05, "loss": 0.1244, "step": 139950 }, { "epoch": 2.6444033092818557, "grad_norm": 0.03319871053099632, "learning_rate": 9.641998161510081e-05, "loss": 0.1248, "step": 140000 }, { "epoch": 2.6444033092818557, "eval_IntDiv": 0.676621520181506, "eval_NumCircles": 1821, "eval_SumBottleneck": 79.85021597060303, "eval_Uniqueness": 0.9953507176066303, "eval_Validity": 0.9894, "eval_Validity * Uniqueness": 0.9848, "eval_loss": 0.22644120454788208, "eval_runtime": 187.2469, "eval_samples_per_second": 53.405, "eval_steps_per_second": 0.422, "step": 140000 }, { "epoch": 2.6453477390351705, "grad_norm": 0.031081242486834526, "learning_rate": 9.641473478313796e-05, "loss": 0.125, "step": 140050 }, { "epoch": 2.6462921687884853, "grad_norm": 0.030445747077465057, "learning_rate": 9.640948795117508e-05, "loss": 0.1249, "step": 140100 }, { "epoch": 2.6472365985418005, "grad_norm": 0.031043998897075653, "learning_rate": 9.640424111921222e-05, "loss": 0.1251, "step": 140150 }, { "epoch": 2.6481810282951153, "grad_norm": 0.0316653735935688, "learning_rate": 9.639899428724937e-05, "loss": 0.1248, "step": 140200 }, { "epoch": 2.6491254580484305, "grad_norm": 0.0298308078199625, "learning_rate": 9.63937474552865e-05, "loss": 0.1251, "step": 140250 }, { "epoch": 2.6500698878017452, "grad_norm": 0.02991516701877117, "learning_rate": 9.638850062332364e-05, "loss": 0.1247, "step": 140300 }, { "epoch": 2.6510143175550605, "grad_norm": 0.030179331079125404, "learning_rate": 9.638325379136079e-05, "loss": 0.1249, "step": 140350 }, { "epoch": 2.651958747308375, "grad_norm": 0.030263211578130722, "learning_rate": 9.637800695939792e-05, "loss": 0.1252, "step": 140400 }, { "epoch": 2.65290317706169, "grad_norm": 0.031000308692455292, "learning_rate": 9.637276012743505e-05, "loss": 0.1247, "step": 140450 }, { "epoch": 2.653847606815005, "grad_norm": 0.030651850625872612, "learning_rate": 9.63675132954722e-05, "loss": 0.1247, "step": 140500 }, { "epoch": 2.65479203656832, "grad_norm": 0.03115278296172619, "learning_rate": 9.636226646350935e-05, "loss": 0.1248, "step": 140550 }, { "epoch": 2.6557364663216347, "grad_norm": 0.029112152755260468, "learning_rate": 9.635701963154647e-05, "loss": 0.1247, "step": 140600 }, { "epoch": 2.65668089607495, "grad_norm": 0.029711099341511726, "learning_rate": 9.635177279958362e-05, "loss": 0.1248, "step": 140650 }, { "epoch": 2.657625325828265, "grad_norm": 0.030505096539855003, "learning_rate": 9.634652596762076e-05, "loss": 0.1247, "step": 140700 }, { "epoch": 2.65856975558158, "grad_norm": 0.030927732586860657, "learning_rate": 9.63412791356579e-05, "loss": 0.125, "step": 140750 }, { "epoch": 2.6595141853348947, "grad_norm": 0.03163710609078407, "learning_rate": 9.633603230369503e-05, "loss": 0.1251, "step": 140800 }, { "epoch": 2.66045861508821, "grad_norm": 0.029443474486470222, "learning_rate": 9.633078547173218e-05, "loss": 0.1249, "step": 140850 }, { "epoch": 2.6614030448415247, "grad_norm": 0.029304003342986107, "learning_rate": 9.632553863976931e-05, "loss": 0.1256, "step": 140900 }, { "epoch": 2.6623474745948394, "grad_norm": 0.030231306329369545, "learning_rate": 9.632029180780645e-05, "loss": 0.1247, "step": 140950 }, { "epoch": 2.6632919043481547, "grad_norm": 0.030772240832448006, "learning_rate": 9.63150449758436e-05, "loss": 0.1247, "step": 141000 }, { "epoch": 2.6642363341014694, "grad_norm": 0.029812119901180267, "learning_rate": 9.630979814388073e-05, "loss": 0.1248, "step": 141050 }, { "epoch": 2.6651807638547846, "grad_norm": 0.02923138625919819, "learning_rate": 9.630455131191786e-05, "loss": 0.1247, "step": 141100 }, { "epoch": 2.6661251936080994, "grad_norm": 0.030670765787363052, "learning_rate": 9.629930447995501e-05, "loss": 0.1249, "step": 141150 }, { "epoch": 2.6670696233614146, "grad_norm": 0.02940480411052704, "learning_rate": 9.629405764799214e-05, "loss": 0.1251, "step": 141200 }, { "epoch": 2.6680140531147294, "grad_norm": 0.03155173733830452, "learning_rate": 9.628881081602929e-05, "loss": 0.1246, "step": 141250 }, { "epoch": 2.668958482868044, "grad_norm": 0.0320095494389534, "learning_rate": 9.628356398406642e-05, "loss": 0.1248, "step": 141300 }, { "epoch": 2.6699029126213594, "grad_norm": 0.03052476979792118, "learning_rate": 9.627831715210357e-05, "loss": 0.1246, "step": 141350 }, { "epoch": 2.670847342374674, "grad_norm": 0.030455227941274643, "learning_rate": 9.62730703201407e-05, "loss": 0.1246, "step": 141400 }, { "epoch": 2.671791772127989, "grad_norm": 0.031568173319101334, "learning_rate": 9.626782348817784e-05, "loss": 0.125, "step": 141450 }, { "epoch": 2.672736201881304, "grad_norm": 0.02995588630437851, "learning_rate": 9.626257665621499e-05, "loss": 0.1249, "step": 141500 }, { "epoch": 2.673680631634619, "grad_norm": 0.02990071289241314, "learning_rate": 9.625732982425212e-05, "loss": 0.1248, "step": 141550 }, { "epoch": 2.674625061387934, "grad_norm": 0.03133208677172661, "learning_rate": 9.625208299228926e-05, "loss": 0.1248, "step": 141600 }, { "epoch": 2.675569491141249, "grad_norm": 0.031862758100032806, "learning_rate": 9.62468361603264e-05, "loss": 0.125, "step": 141650 }, { "epoch": 2.676513920894564, "grad_norm": 0.03139256313443184, "learning_rate": 9.624158932836354e-05, "loss": 0.1251, "step": 141700 }, { "epoch": 2.677458350647879, "grad_norm": 0.03260360285639763, "learning_rate": 9.623634249640068e-05, "loss": 0.125, "step": 141750 }, { "epoch": 2.6784027804011936, "grad_norm": 0.02930285967886448, "learning_rate": 9.623109566443782e-05, "loss": 0.1246, "step": 141800 }, { "epoch": 2.679347210154509, "grad_norm": 0.03125821053981781, "learning_rate": 9.622584883247495e-05, "loss": 0.1248, "step": 141850 }, { "epoch": 2.6802916399078236, "grad_norm": 0.031529106199741364, "learning_rate": 9.62206020005121e-05, "loss": 0.1246, "step": 141900 }, { "epoch": 2.6812360696611384, "grad_norm": 0.028520939871668816, "learning_rate": 9.621535516854923e-05, "loss": 0.125, "step": 141950 }, { "epoch": 2.6821804994144536, "grad_norm": 0.030373793095350266, "learning_rate": 9.621010833658637e-05, "loss": 0.1249, "step": 142000 }, { "epoch": 2.6831249291677683, "grad_norm": 0.02937725931406021, "learning_rate": 9.620486150462351e-05, "loss": 0.1246, "step": 142050 }, { "epoch": 2.6840693589210836, "grad_norm": 0.029935287311673164, "learning_rate": 9.619961467266065e-05, "loss": 0.1253, "step": 142100 }, { "epoch": 2.6850137886743983, "grad_norm": 0.029274797067046165, "learning_rate": 9.61943678406978e-05, "loss": 0.1241, "step": 142150 }, { "epoch": 2.6859582184277135, "grad_norm": 0.031093643978238106, "learning_rate": 9.618912100873493e-05, "loss": 0.1247, "step": 142200 }, { "epoch": 2.6869026481810283, "grad_norm": 0.03190628066658974, "learning_rate": 9.618387417677206e-05, "loss": 0.1251, "step": 142250 }, { "epoch": 2.687847077934343, "grad_norm": 0.030768748372793198, "learning_rate": 9.617862734480921e-05, "loss": 0.1251, "step": 142300 }, { "epoch": 2.6887915076876583, "grad_norm": 0.02981323003768921, "learning_rate": 9.617338051284635e-05, "loss": 0.1247, "step": 142350 }, { "epoch": 2.689735937440973, "grad_norm": 0.0291121955960989, "learning_rate": 9.616813368088349e-05, "loss": 0.1247, "step": 142400 }, { "epoch": 2.690680367194288, "grad_norm": 0.031347259879112244, "learning_rate": 9.616288684892063e-05, "loss": 0.1247, "step": 142450 }, { "epoch": 2.691624796947603, "grad_norm": 0.03089527226984501, "learning_rate": 9.615764001695776e-05, "loss": 0.1249, "step": 142500 }, { "epoch": 2.691624796947603, "eval_IntDiv": 0.6731756155207695, "eval_NumCircles": 1726, "eval_SumBottleneck": 152.58847233456203, "eval_Uniqueness": 0.9970674486803519, "eval_Validity": 0.9889, "eval_Validity * Uniqueness": 0.986, "eval_loss": 0.22579021751880646, "eval_runtime": 142.3664, "eval_samples_per_second": 70.241, "eval_steps_per_second": 0.555, "step": 142500 }, { "epoch": 2.6925692267009183, "grad_norm": 0.029169311746954918, "learning_rate": 9.615239318499491e-05, "loss": 0.1247, "step": 142550 }, { "epoch": 2.693513656454233, "grad_norm": 0.029961396008729935, "learning_rate": 9.614714635303204e-05, "loss": 0.125, "step": 142600 }, { "epoch": 2.694458086207548, "grad_norm": 0.029884980991482735, "learning_rate": 9.614189952106918e-05, "loss": 0.1251, "step": 142650 }, { "epoch": 2.695402515960863, "grad_norm": 0.030396319925785065, "learning_rate": 9.613665268910632e-05, "loss": 0.1249, "step": 142700 }, { "epoch": 2.6963469457141778, "grad_norm": 0.031206287443637848, "learning_rate": 9.613140585714346e-05, "loss": 0.1253, "step": 142750 }, { "epoch": 2.6972913754674925, "grad_norm": 0.03108644299209118, "learning_rate": 9.612615902518059e-05, "loss": 0.1248, "step": 142800 }, { "epoch": 2.6982358052208077, "grad_norm": 0.029938185587525368, "learning_rate": 9.612091219321774e-05, "loss": 0.1251, "step": 142850 }, { "epoch": 2.6991802349741225, "grad_norm": 0.030280394479632378, "learning_rate": 9.611566536125489e-05, "loss": 0.1249, "step": 142900 }, { "epoch": 2.7001246647274377, "grad_norm": 0.029538294300436974, "learning_rate": 9.611041852929202e-05, "loss": 0.1246, "step": 142950 }, { "epoch": 2.7010690944807525, "grad_norm": 0.02996234968304634, "learning_rate": 9.610517169732915e-05, "loss": 0.1246, "step": 143000 }, { "epoch": 2.7020135242340677, "grad_norm": 0.03022209368646145, "learning_rate": 9.60999248653663e-05, "loss": 0.1246, "step": 143050 }, { "epoch": 2.7029579539873825, "grad_norm": 0.03174090012907982, "learning_rate": 9.609467803340344e-05, "loss": 0.1248, "step": 143100 }, { "epoch": 2.7039023837406972, "grad_norm": 0.030269909650087357, "learning_rate": 9.608943120144057e-05, "loss": 0.1245, "step": 143150 }, { "epoch": 2.7048468134940125, "grad_norm": 0.031082836911082268, "learning_rate": 9.608418436947772e-05, "loss": 0.1247, "step": 143200 }, { "epoch": 2.7057912432473272, "grad_norm": 0.030190326273441315, "learning_rate": 9.607893753751485e-05, "loss": 0.1246, "step": 143250 }, { "epoch": 2.706735673000642, "grad_norm": 0.03429156914353371, "learning_rate": 9.607369070555198e-05, "loss": 0.1247, "step": 143300 }, { "epoch": 2.707680102753957, "grad_norm": 0.031128844246268272, "learning_rate": 9.606844387358913e-05, "loss": 0.1248, "step": 143350 }, { "epoch": 2.708624532507272, "grad_norm": 0.029816748574376106, "learning_rate": 9.606319704162628e-05, "loss": 0.1248, "step": 143400 }, { "epoch": 2.709568962260587, "grad_norm": 0.029712896794080734, "learning_rate": 9.60579502096634e-05, "loss": 0.1245, "step": 143450 }, { "epoch": 2.710513392013902, "grad_norm": 0.02970869652926922, "learning_rate": 9.605270337770055e-05, "loss": 0.1249, "step": 143500 }, { "epoch": 2.711457821767217, "grad_norm": 0.03232578560709953, "learning_rate": 9.60474565457377e-05, "loss": 0.125, "step": 143550 }, { "epoch": 2.712402251520532, "grad_norm": 0.029967106878757477, "learning_rate": 9.604220971377483e-05, "loss": 0.1245, "step": 143600 }, { "epoch": 2.7133466812738467, "grad_norm": 0.031575459986925125, "learning_rate": 9.603696288181196e-05, "loss": 0.1246, "step": 143650 }, { "epoch": 2.714291111027162, "grad_norm": 0.030580319464206696, "learning_rate": 9.603171604984911e-05, "loss": 0.1248, "step": 143700 }, { "epoch": 2.7152355407804767, "grad_norm": 0.030997775495052338, "learning_rate": 9.602646921788624e-05, "loss": 0.1247, "step": 143750 }, { "epoch": 2.7161799705337915, "grad_norm": 0.030787331983447075, "learning_rate": 9.602122238592338e-05, "loss": 0.1246, "step": 143800 }, { "epoch": 2.7171244002871067, "grad_norm": 0.03288395330309868, "learning_rate": 9.601597555396053e-05, "loss": 0.1244, "step": 143850 }, { "epoch": 2.7180688300404214, "grad_norm": 0.029867641627788544, "learning_rate": 9.601072872199767e-05, "loss": 0.1244, "step": 143900 }, { "epoch": 2.7190132597937366, "grad_norm": 0.02898983284831047, "learning_rate": 9.600548189003479e-05, "loss": 0.1246, "step": 143950 }, { "epoch": 2.7199576895470514, "grad_norm": 0.028879547491669655, "learning_rate": 9.600023505807194e-05, "loss": 0.1243, "step": 144000 }, { "epoch": 2.7209021193003666, "grad_norm": 0.02999992109835148, "learning_rate": 9.599498822610909e-05, "loss": 0.1242, "step": 144050 }, { "epoch": 2.7218465490536814, "grad_norm": 0.030271336436271667, "learning_rate": 9.598974139414622e-05, "loss": 0.1241, "step": 144100 }, { "epoch": 2.722790978806996, "grad_norm": 0.030525656417012215, "learning_rate": 9.598449456218336e-05, "loss": 0.1248, "step": 144150 }, { "epoch": 2.7237354085603114, "grad_norm": 0.031169433146715164, "learning_rate": 9.59792477302205e-05, "loss": 0.125, "step": 144200 }, { "epoch": 2.724679838313626, "grad_norm": 0.03043052740395069, "learning_rate": 9.597400089825764e-05, "loss": 0.1247, "step": 144250 }, { "epoch": 2.725624268066941, "grad_norm": 0.03044126369059086, "learning_rate": 9.596875406629477e-05, "loss": 0.1245, "step": 144300 }, { "epoch": 2.726568697820256, "grad_norm": 0.03046533837914467, "learning_rate": 9.596350723433192e-05, "loss": 0.1249, "step": 144350 }, { "epoch": 2.7275131275735713, "grad_norm": 0.030271925032138824, "learning_rate": 9.595826040236905e-05, "loss": 0.1248, "step": 144400 }, { "epoch": 2.728457557326886, "grad_norm": 0.03144744038581848, "learning_rate": 9.595301357040619e-05, "loss": 0.1249, "step": 144450 }, { "epoch": 2.729401987080201, "grad_norm": 0.02995523437857628, "learning_rate": 9.594776673844333e-05, "loss": 0.125, "step": 144500 }, { "epoch": 2.730346416833516, "grad_norm": 0.032649774104356766, "learning_rate": 9.594251990648048e-05, "loss": 0.125, "step": 144550 }, { "epoch": 2.731290846586831, "grad_norm": 0.02932005189359188, "learning_rate": 9.593727307451762e-05, "loss": 0.1244, "step": 144600 }, { "epoch": 2.7322352763401456, "grad_norm": 0.030243877321481705, "learning_rate": 9.593202624255475e-05, "loss": 0.1246, "step": 144650 }, { "epoch": 2.733179706093461, "grad_norm": 0.0291652362793684, "learning_rate": 9.59267794105919e-05, "loss": 0.1248, "step": 144700 }, { "epoch": 2.7341241358467756, "grad_norm": 0.030636487528681755, "learning_rate": 9.592153257862903e-05, "loss": 0.1246, "step": 144750 }, { "epoch": 2.735068565600091, "grad_norm": 0.02886177785694599, "learning_rate": 9.591628574666616e-05, "loss": 0.1249, "step": 144800 }, { "epoch": 2.7360129953534056, "grad_norm": 0.031016184017062187, "learning_rate": 9.591103891470331e-05, "loss": 0.1245, "step": 144850 }, { "epoch": 2.736957425106721, "grad_norm": 0.031431544572114944, "learning_rate": 9.590579208274045e-05, "loss": 0.1243, "step": 144900 }, { "epoch": 2.7379018548600356, "grad_norm": 0.030993232503533363, "learning_rate": 9.590054525077758e-05, "loss": 0.1243, "step": 144950 }, { "epoch": 2.7388462846133503, "grad_norm": 0.03161017969250679, "learning_rate": 9.589529841881473e-05, "loss": 0.1247, "step": 145000 }, { "epoch": 2.7388462846133503, "eval_IntDiv": 0.6739275077017487, "eval_NumCircles": 1752, "eval_SumBottleneck": 126.31492071434228, "eval_Uniqueness": 0.9965715438136533, "eval_Validity": 0.9917, "eval_Validity * Uniqueness": 0.9883000000000001, "eval_loss": 0.22861789166927338, "eval_runtime": 163.6303, "eval_samples_per_second": 61.113, "eval_steps_per_second": 0.483, "step": 145000 }, { "epoch": 2.7397907143666655, "grad_norm": 0.030252059921622276, "learning_rate": 9.589005158685186e-05, "loss": 0.1245, "step": 145050 }, { "epoch": 2.7407351441199803, "grad_norm": 0.029259683564305305, "learning_rate": 9.588480475488901e-05, "loss": 0.1248, "step": 145100 }, { "epoch": 2.741679573873295, "grad_norm": 0.030730007216334343, "learning_rate": 9.587955792292614e-05, "loss": 0.1245, "step": 145150 }, { "epoch": 2.7426240036266103, "grad_norm": 0.031004605814814568, "learning_rate": 9.587431109096328e-05, "loss": 0.1242, "step": 145200 }, { "epoch": 2.743568433379925, "grad_norm": 0.029607461765408516, "learning_rate": 9.586906425900042e-05, "loss": 0.1244, "step": 145250 }, { "epoch": 2.7445128631332403, "grad_norm": 0.02931045927107334, "learning_rate": 9.586381742703756e-05, "loss": 0.1245, "step": 145300 }, { "epoch": 2.745457292886555, "grad_norm": 0.03089645504951477, "learning_rate": 9.58585705950747e-05, "loss": 0.1245, "step": 145350 }, { "epoch": 2.7464017226398703, "grad_norm": 0.03363144025206566, "learning_rate": 9.585332376311184e-05, "loss": 0.125, "step": 145400 }, { "epoch": 2.747346152393185, "grad_norm": 0.032556138932704926, "learning_rate": 9.584807693114897e-05, "loss": 0.1248, "step": 145450 }, { "epoch": 2.7482905821465, "grad_norm": 0.030517781153321266, "learning_rate": 9.584283009918612e-05, "loss": 0.1245, "step": 145500 }, { "epoch": 2.749235011899815, "grad_norm": 0.03014392964541912, "learning_rate": 9.583758326722325e-05, "loss": 0.1248, "step": 145550 }, { "epoch": 2.7501794416531298, "grad_norm": 0.030192140489816666, "learning_rate": 9.583233643526039e-05, "loss": 0.1242, "step": 145600 }, { "epoch": 2.7511238714064445, "grad_norm": 0.030665041878819466, "learning_rate": 9.582708960329754e-05, "loss": 0.1247, "step": 145650 }, { "epoch": 2.7520683011597598, "grad_norm": 0.031236717477440834, "learning_rate": 9.582184277133467e-05, "loss": 0.125, "step": 145700 }, { "epoch": 2.7530127309130745, "grad_norm": 0.03358257934451103, "learning_rate": 9.581659593937182e-05, "loss": 0.1245, "step": 145750 }, { "epoch": 2.7539571606663897, "grad_norm": 0.029940718784928322, "learning_rate": 9.581134910740895e-05, "loss": 0.125, "step": 145800 }, { "epoch": 2.7549015904197045, "grad_norm": 0.03196457773447037, "learning_rate": 9.580610227544608e-05, "loss": 0.1247, "step": 145850 }, { "epoch": 2.7558460201730197, "grad_norm": 0.029910778626799583, "learning_rate": 9.580085544348323e-05, "loss": 0.1243, "step": 145900 }, { "epoch": 2.7567904499263345, "grad_norm": 0.030390068888664246, "learning_rate": 9.579560861152037e-05, "loss": 0.1244, "step": 145950 }, { "epoch": 2.7577348796796493, "grad_norm": 0.031380731612443924, "learning_rate": 9.57903617795575e-05, "loss": 0.1247, "step": 146000 }, { "epoch": 2.7586793094329645, "grad_norm": 0.03159390762448311, "learning_rate": 9.578511494759465e-05, "loss": 0.1243, "step": 146050 }, { "epoch": 2.7596237391862792, "grad_norm": 0.02936170995235443, "learning_rate": 9.577986811563178e-05, "loss": 0.1246, "step": 146100 }, { "epoch": 2.760568168939594, "grad_norm": 0.0304179135710001, "learning_rate": 9.577462128366893e-05, "loss": 0.1246, "step": 146150 }, { "epoch": 2.761512598692909, "grad_norm": 0.02920597791671753, "learning_rate": 9.576937445170606e-05, "loss": 0.1244, "step": 146200 }, { "epoch": 2.7624570284462244, "grad_norm": 0.02911481447517872, "learning_rate": 9.576412761974321e-05, "loss": 0.1244, "step": 146250 }, { "epoch": 2.763401458199539, "grad_norm": 0.03270099312067032, "learning_rate": 9.575888078778034e-05, "loss": 0.1243, "step": 146300 }, { "epoch": 2.764345887952854, "grad_norm": 0.03294456750154495, "learning_rate": 9.575363395581748e-05, "loss": 0.1246, "step": 146350 }, { "epoch": 2.765290317706169, "grad_norm": 0.031783826649188995, "learning_rate": 9.574838712385463e-05, "loss": 0.1245, "step": 146400 }, { "epoch": 2.766234747459484, "grad_norm": 0.030433081090450287, "learning_rate": 9.574314029189176e-05, "loss": 0.1245, "step": 146450 }, { "epoch": 2.7671791772127987, "grad_norm": 0.029428161680698395, "learning_rate": 9.573789345992889e-05, "loss": 0.1243, "step": 146500 }, { "epoch": 2.768123606966114, "grad_norm": 0.031680453568696976, "learning_rate": 9.573264662796604e-05, "loss": 0.1245, "step": 146550 }, { "epoch": 2.7690680367194287, "grad_norm": 0.02989640273153782, "learning_rate": 9.572739979600317e-05, "loss": 0.124, "step": 146600 }, { "epoch": 2.770012466472744, "grad_norm": 0.03157028183341026, "learning_rate": 9.572215296404031e-05, "loss": 0.1245, "step": 146650 }, { "epoch": 2.7709568962260587, "grad_norm": 0.029746554791927338, "learning_rate": 9.571690613207746e-05, "loss": 0.1249, "step": 146700 }, { "epoch": 2.771901325979374, "grad_norm": 0.03011084347963333, "learning_rate": 9.57116593001146e-05, "loss": 0.1243, "step": 146750 }, { "epoch": 2.7728457557326887, "grad_norm": 0.029405873268842697, "learning_rate": 9.570641246815172e-05, "loss": 0.1243, "step": 146800 }, { "epoch": 2.7737901854860034, "grad_norm": 0.029429055750370026, "learning_rate": 9.570116563618887e-05, "loss": 0.1244, "step": 146850 }, { "epoch": 2.7747346152393186, "grad_norm": 0.030816292390227318, "learning_rate": 9.569591880422602e-05, "loss": 0.1243, "step": 146900 }, { "epoch": 2.7756790449926334, "grad_norm": 0.031051386147737503, "learning_rate": 9.569067197226315e-05, "loss": 0.1242, "step": 146950 }, { "epoch": 2.776623474745948, "grad_norm": 0.030621329322457314, "learning_rate": 9.568542514030029e-05, "loss": 0.124, "step": 147000 }, { "epoch": 2.7775679044992634, "grad_norm": 0.031203530728816986, "learning_rate": 9.568017830833743e-05, "loss": 0.1242, "step": 147050 }, { "epoch": 2.778512334252578, "grad_norm": 0.03024238720536232, "learning_rate": 9.567493147637457e-05, "loss": 0.124, "step": 147100 }, { "epoch": 2.7794567640058934, "grad_norm": 0.0325225330889225, "learning_rate": 9.56696846444117e-05, "loss": 0.1249, "step": 147150 }, { "epoch": 2.780401193759208, "grad_norm": 0.031234536319971085, "learning_rate": 9.566443781244885e-05, "loss": 0.1243, "step": 147200 }, { "epoch": 2.7813456235125233, "grad_norm": 0.03090486489236355, "learning_rate": 9.5659190980486e-05, "loss": 0.1245, "step": 147250 }, { "epoch": 2.782290053265838, "grad_norm": 0.029996473342180252, "learning_rate": 9.565394414852312e-05, "loss": 0.1245, "step": 147300 }, { "epoch": 2.783234483019153, "grad_norm": 0.029790321364998817, "learning_rate": 9.564869731656026e-05, "loss": 0.1248, "step": 147350 }, { "epoch": 2.784178912772468, "grad_norm": 0.031023163348436356, "learning_rate": 9.564345048459741e-05, "loss": 0.1245, "step": 147400 }, { "epoch": 2.785123342525783, "grad_norm": 0.030883966013789177, "learning_rate": 9.563820365263455e-05, "loss": 0.1241, "step": 147450 }, { "epoch": 2.7860677722790976, "grad_norm": 0.029277166351675987, "learning_rate": 9.563295682067168e-05, "loss": 0.124, "step": 147500 }, { "epoch": 2.7860677722790976, "eval_IntDiv": 0.6752212485493365, "eval_NumCircles": 1803, "eval_SumBottleneck": 78.5171148754626, "eval_Uniqueness": 0.9958485216686918, "eval_Validity": 0.9876, "eval_Validity * Uniqueness": 0.9835, "eval_loss": 0.2268691062927246, "eval_runtime": 192.9037, "eval_samples_per_second": 51.839, "eval_steps_per_second": 0.41, "step": 147500 }, { "epoch": 2.787012202032413, "grad_norm": 0.030383141711354256, "learning_rate": 9.562770998870883e-05, "loss": 0.1242, "step": 147550 }, { "epoch": 2.7879566317857276, "grad_norm": 0.030232971534132957, "learning_rate": 9.562246315674596e-05, "loss": 0.1243, "step": 147600 }, { "epoch": 2.788901061539043, "grad_norm": 0.03235278278589249, "learning_rate": 9.56172163247831e-05, "loss": 0.1244, "step": 147650 }, { "epoch": 2.7898454912923576, "grad_norm": 0.032762184739112854, "learning_rate": 9.561196949282024e-05, "loss": 0.1247, "step": 147700 }, { "epoch": 2.790789921045673, "grad_norm": 0.030667833983898163, "learning_rate": 9.560672266085739e-05, "loss": 0.1245, "step": 147750 }, { "epoch": 2.7917343507989876, "grad_norm": 0.029218818992376328, "learning_rate": 9.560147582889451e-05, "loss": 0.1246, "step": 147800 }, { "epoch": 2.7926787805523023, "grad_norm": 0.03019571304321289, "learning_rate": 9.559622899693166e-05, "loss": 0.1243, "step": 147850 }, { "epoch": 2.7936232103056176, "grad_norm": 0.034227512776851654, "learning_rate": 9.55909821649688e-05, "loss": 0.1241, "step": 147900 }, { "epoch": 2.7945676400589323, "grad_norm": 0.030551545321941376, "learning_rate": 9.558573533300594e-05, "loss": 0.1244, "step": 147950 }, { "epoch": 2.795512069812247, "grad_norm": 0.03126870095729828, "learning_rate": 9.558048850104307e-05, "loss": 0.1245, "step": 148000 }, { "epoch": 2.7964564995655623, "grad_norm": 0.03058863990008831, "learning_rate": 9.557524166908022e-05, "loss": 0.1247, "step": 148050 }, { "epoch": 2.7974009293188775, "grad_norm": 0.030744323506951332, "learning_rate": 9.556999483711735e-05, "loss": 0.1245, "step": 148100 }, { "epoch": 2.7983453590721923, "grad_norm": 0.030059538781642914, "learning_rate": 9.556474800515449e-05, "loss": 0.1245, "step": 148150 }, { "epoch": 2.799289788825507, "grad_norm": 0.030162468552589417, "learning_rate": 9.555950117319164e-05, "loss": 0.1245, "step": 148200 }, { "epoch": 2.8002342185788223, "grad_norm": 0.03013281524181366, "learning_rate": 9.555425434122877e-05, "loss": 0.1244, "step": 148250 }, { "epoch": 2.801178648332137, "grad_norm": 0.03206546977162361, "learning_rate": 9.55490075092659e-05, "loss": 0.1245, "step": 148300 }, { "epoch": 2.802123078085452, "grad_norm": 0.030373886227607727, "learning_rate": 9.554376067730305e-05, "loss": 0.1243, "step": 148350 }, { "epoch": 2.803067507838767, "grad_norm": 0.030518220737576485, "learning_rate": 9.553851384534018e-05, "loss": 0.1241, "step": 148400 }, { "epoch": 2.804011937592082, "grad_norm": 0.030005313456058502, "learning_rate": 9.553326701337733e-05, "loss": 0.1246, "step": 148450 }, { "epoch": 2.804956367345397, "grad_norm": 0.0316878966987133, "learning_rate": 9.552802018141447e-05, "loss": 0.1244, "step": 148500 }, { "epoch": 2.8059007970987118, "grad_norm": 0.03115692548453808, "learning_rate": 9.552277334945161e-05, "loss": 0.1246, "step": 148550 }, { "epoch": 2.806845226852027, "grad_norm": 0.030033569782972336, "learning_rate": 9.551752651748875e-05, "loss": 0.1249, "step": 148600 }, { "epoch": 2.8077896566053417, "grad_norm": 0.03339090943336487, "learning_rate": 9.551227968552588e-05, "loss": 0.124, "step": 148650 }, { "epoch": 2.8087340863586565, "grad_norm": 0.02881164848804474, "learning_rate": 9.550703285356303e-05, "loss": 0.1243, "step": 148700 }, { "epoch": 2.8096785161119717, "grad_norm": 0.03055950626730919, "learning_rate": 9.550178602160016e-05, "loss": 0.1246, "step": 148750 }, { "epoch": 2.8106229458652865, "grad_norm": 0.030855553224682808, "learning_rate": 9.54965391896373e-05, "loss": 0.1242, "step": 148800 }, { "epoch": 2.8115673756186013, "grad_norm": 0.029905397444963455, "learning_rate": 9.549129235767444e-05, "loss": 0.1246, "step": 148850 }, { "epoch": 2.8125118053719165, "grad_norm": 0.030197659507393837, "learning_rate": 9.548604552571158e-05, "loss": 0.1247, "step": 148900 }, { "epoch": 2.8134562351252312, "grad_norm": 0.03174937888979912, "learning_rate": 9.548079869374871e-05, "loss": 0.1243, "step": 148950 }, { "epoch": 2.8144006648785465, "grad_norm": 0.0316217839717865, "learning_rate": 9.547555186178586e-05, "loss": 0.1237, "step": 149000 }, { "epoch": 2.8153450946318612, "grad_norm": 0.030198922380805016, "learning_rate": 9.5470305029823e-05, "loss": 0.1244, "step": 149050 }, { "epoch": 2.8162895243851764, "grad_norm": 0.03081279993057251, "learning_rate": 9.546505819786014e-05, "loss": 0.1244, "step": 149100 }, { "epoch": 2.817233954138491, "grad_norm": 0.03092917613685131, "learning_rate": 9.545981136589727e-05, "loss": 0.1244, "step": 149150 }, { "epoch": 2.818178383891806, "grad_norm": 0.031317636370658875, "learning_rate": 9.545456453393441e-05, "loss": 0.125, "step": 149200 }, { "epoch": 2.819122813645121, "grad_norm": 0.03153866529464722, "learning_rate": 9.544931770197156e-05, "loss": 0.124, "step": 149250 }, { "epoch": 2.820067243398436, "grad_norm": 0.032413166016340256, "learning_rate": 9.544407087000869e-05, "loss": 0.1245, "step": 149300 }, { "epoch": 2.8210116731517507, "grad_norm": 0.030098911374807358, "learning_rate": 9.543882403804584e-05, "loss": 0.1248, "step": 149350 }, { "epoch": 2.821956102905066, "grad_norm": 0.029416797682642937, "learning_rate": 9.543357720608297e-05, "loss": 0.1248, "step": 149400 }, { "epoch": 2.822900532658381, "grad_norm": 0.030450457707047462, "learning_rate": 9.54283303741201e-05, "loss": 0.1244, "step": 149450 }, { "epoch": 2.823844962411696, "grad_norm": 0.029822420328855515, "learning_rate": 9.542308354215725e-05, "loss": 0.1241, "step": 149500 }, { "epoch": 2.8247893921650107, "grad_norm": 0.030192460864782333, "learning_rate": 9.541783671019439e-05, "loss": 0.1243, "step": 149550 }, { "epoch": 2.825733821918326, "grad_norm": 0.031042462214827538, "learning_rate": 9.541258987823153e-05, "loss": 0.1242, "step": 149600 }, { "epoch": 2.8266782516716407, "grad_norm": 0.028887039050459862, "learning_rate": 9.540734304626867e-05, "loss": 0.1243, "step": 149650 }, { "epoch": 2.8276226814249554, "grad_norm": 0.03163671866059303, "learning_rate": 9.54020962143058e-05, "loss": 0.1241, "step": 149700 }, { "epoch": 2.8285671111782706, "grad_norm": 0.029494522139430046, "learning_rate": 9.539684938234295e-05, "loss": 0.1242, "step": 149750 }, { "epoch": 2.8295115409315854, "grad_norm": 0.03078319877386093, "learning_rate": 9.539160255038008e-05, "loss": 0.1242, "step": 149800 }, { "epoch": 2.8304559706849, "grad_norm": 0.03046657145023346, "learning_rate": 9.538635571841722e-05, "loss": 0.124, "step": 149850 }, { "epoch": 2.8314004004382154, "grad_norm": 0.030404508113861084, "learning_rate": 9.538110888645436e-05, "loss": 0.1244, "step": 149900 }, { "epoch": 2.8323448301915306, "grad_norm": 0.03017832525074482, "learning_rate": 9.53758620544915e-05, "loss": 0.1244, "step": 149950 }, { "epoch": 2.8332892599448454, "grad_norm": 0.02882099151611328, "learning_rate": 9.537061522252863e-05, "loss": 0.1241, "step": 150000 }, { "epoch": 2.8332892599448454, "eval_IntDiv": 0.674696138225682, "eval_NumCircles": 1738, "eval_SumBottleneck": 163.57836676900493, "eval_Uniqueness": 0.9949576442113756, "eval_Validity": 0.9916, "eval_Validity * Uniqueness": 0.9866, "eval_loss": 0.2306589037179947, "eval_runtime": 144.9366, "eval_samples_per_second": 68.996, "eval_steps_per_second": 0.545, "step": 150000 }, { "epoch": 2.83423368969816, "grad_norm": 0.03028525970876217, "learning_rate": 9.536536839056578e-05, "loss": 0.1244, "step": 150050 }, { "epoch": 2.8351781194514754, "grad_norm": 0.032300401479005814, "learning_rate": 9.536012155860293e-05, "loss": 0.1245, "step": 150100 }, { "epoch": 2.83612254920479, "grad_norm": 0.03092985227704048, "learning_rate": 9.535487472664006e-05, "loss": 0.1245, "step": 150150 }, { "epoch": 2.837066978958105, "grad_norm": 0.030432621017098427, "learning_rate": 9.53496278946772e-05, "loss": 0.1242, "step": 150200 }, { "epoch": 2.83801140871142, "grad_norm": 0.03006182238459587, "learning_rate": 9.534438106271434e-05, "loss": 0.1243, "step": 150250 }, { "epoch": 2.838955838464735, "grad_norm": 0.029931051656603813, "learning_rate": 9.533913423075148e-05, "loss": 0.1244, "step": 150300 }, { "epoch": 2.83990026821805, "grad_norm": 0.030714187771081924, "learning_rate": 9.533388739878861e-05, "loss": 0.1243, "step": 150350 }, { "epoch": 2.840844697971365, "grad_norm": 0.031225161626935005, "learning_rate": 9.532864056682576e-05, "loss": 0.1245, "step": 150400 }, { "epoch": 2.84178912772468, "grad_norm": 0.03055122308433056, "learning_rate": 9.532339373486289e-05, "loss": 0.1242, "step": 150450 }, { "epoch": 2.842733557477995, "grad_norm": 0.0293124970048666, "learning_rate": 9.531814690290003e-05, "loss": 0.1244, "step": 150500 }, { "epoch": 2.8436779872313096, "grad_norm": 0.03088289685547352, "learning_rate": 9.531290007093717e-05, "loss": 0.1242, "step": 150550 }, { "epoch": 2.844622416984625, "grad_norm": 0.029394324868917465, "learning_rate": 9.530765323897432e-05, "loss": 0.1245, "step": 150600 }, { "epoch": 2.8455668467379396, "grad_norm": 0.03036622144281864, "learning_rate": 9.530240640701144e-05, "loss": 0.1244, "step": 150650 }, { "epoch": 2.8465112764912543, "grad_norm": 0.030185358598828316, "learning_rate": 9.529715957504859e-05, "loss": 0.1247, "step": 150700 }, { "epoch": 2.8474557062445696, "grad_norm": 0.0302352923899889, "learning_rate": 9.529191274308574e-05, "loss": 0.1241, "step": 150750 }, { "epoch": 2.8484001359978843, "grad_norm": 0.02973882295191288, "learning_rate": 9.528666591112287e-05, "loss": 0.1243, "step": 150800 }, { "epoch": 2.8493445657511995, "grad_norm": 0.029882898554205894, "learning_rate": 9.528141907916e-05, "loss": 0.1242, "step": 150850 }, { "epoch": 2.8502889955045143, "grad_norm": 0.029836198315024376, "learning_rate": 9.527617224719715e-05, "loss": 0.1243, "step": 150900 }, { "epoch": 2.8512334252578295, "grad_norm": 0.03216365724802017, "learning_rate": 9.527092541523429e-05, "loss": 0.1245, "step": 150950 }, { "epoch": 2.8521778550111443, "grad_norm": 0.02967124804854393, "learning_rate": 9.526567858327142e-05, "loss": 0.1238, "step": 151000 }, { "epoch": 2.853122284764459, "grad_norm": 0.030022861436009407, "learning_rate": 9.526043175130857e-05, "loss": 0.1244, "step": 151050 }, { "epoch": 2.8540667145177743, "grad_norm": 0.02922731637954712, "learning_rate": 9.525518491934571e-05, "loss": 0.1239, "step": 151100 }, { "epoch": 2.855011144271089, "grad_norm": 0.03100123628973961, "learning_rate": 9.524993808738283e-05, "loss": 0.1242, "step": 151150 }, { "epoch": 2.855955574024404, "grad_norm": 0.030239218845963478, "learning_rate": 9.524469125541998e-05, "loss": 0.1243, "step": 151200 }, { "epoch": 2.856900003777719, "grad_norm": 0.02970399707555771, "learning_rate": 9.523944442345713e-05, "loss": 0.1243, "step": 151250 }, { "epoch": 2.8578444335310342, "grad_norm": 0.031216928735375404, "learning_rate": 9.523419759149426e-05, "loss": 0.1242, "step": 151300 }, { "epoch": 2.858788863284349, "grad_norm": 0.02937917597591877, "learning_rate": 9.52289507595314e-05, "loss": 0.1242, "step": 151350 }, { "epoch": 2.8597332930376638, "grad_norm": 0.031808435916900635, "learning_rate": 9.522370392756854e-05, "loss": 0.1246, "step": 151400 }, { "epoch": 2.860677722790979, "grad_norm": 0.029903624206781387, "learning_rate": 9.521845709560568e-05, "loss": 0.1245, "step": 151450 }, { "epoch": 2.8616221525442938, "grad_norm": 0.03264070302248001, "learning_rate": 9.521321026364281e-05, "loss": 0.1245, "step": 151500 }, { "epoch": 2.8625665822976085, "grad_norm": 0.029620274901390076, "learning_rate": 9.520796343167996e-05, "loss": 0.1245, "step": 151550 }, { "epoch": 2.8635110120509237, "grad_norm": 0.030056992545723915, "learning_rate": 9.52027165997171e-05, "loss": 0.1246, "step": 151600 }, { "epoch": 2.8644554418042385, "grad_norm": 0.030014734715223312, "learning_rate": 9.519746976775423e-05, "loss": 0.124, "step": 151650 }, { "epoch": 2.8653998715575537, "grad_norm": 0.03214219957590103, "learning_rate": 9.519222293579137e-05, "loss": 0.1242, "step": 151700 }, { "epoch": 2.8663443013108685, "grad_norm": 0.03271941468119621, "learning_rate": 9.518697610382852e-05, "loss": 0.1242, "step": 151750 }, { "epoch": 2.8672887310641837, "grad_norm": 0.029659178107976913, "learning_rate": 9.518172927186564e-05, "loss": 0.1243, "step": 151800 }, { "epoch": 2.8682331608174985, "grad_norm": 0.03023168444633484, "learning_rate": 9.517648243990279e-05, "loss": 0.1238, "step": 151850 }, { "epoch": 2.8691775905708132, "grad_norm": 0.029718277975916862, "learning_rate": 9.517123560793994e-05, "loss": 0.1243, "step": 151900 }, { "epoch": 2.8701220203241284, "grad_norm": 0.029556551948189735, "learning_rate": 9.516598877597707e-05, "loss": 0.1247, "step": 151950 }, { "epoch": 2.871066450077443, "grad_norm": 0.03250070661306381, "learning_rate": 9.51607419440142e-05, "loss": 0.1243, "step": 152000 }, { "epoch": 2.872010879830758, "grad_norm": 0.03317854180932045, "learning_rate": 9.515549511205135e-05, "loss": 0.1242, "step": 152050 }, { "epoch": 2.872955309584073, "grad_norm": 0.03136292099952698, "learning_rate": 9.515024828008849e-05, "loss": 0.1244, "step": 152100 }, { "epoch": 2.873899739337388, "grad_norm": 0.030933400616049767, "learning_rate": 9.514500144812562e-05, "loss": 0.1242, "step": 152150 }, { "epoch": 2.874844169090703, "grad_norm": 0.030744511634111404, "learning_rate": 9.513975461616277e-05, "loss": 0.1239, "step": 152200 }, { "epoch": 2.875788598844018, "grad_norm": 0.029868680983781815, "learning_rate": 9.51345077841999e-05, "loss": 0.1241, "step": 152250 }, { "epoch": 2.876733028597333, "grad_norm": 0.03094368800520897, "learning_rate": 9.512926095223704e-05, "loss": 0.1242, "step": 152300 }, { "epoch": 2.877677458350648, "grad_norm": 0.03128987178206444, "learning_rate": 9.512401412027418e-05, "loss": 0.1242, "step": 152350 }, { "epoch": 2.8786218881039627, "grad_norm": 0.03019063174724579, "learning_rate": 9.511876728831132e-05, "loss": 0.1241, "step": 152400 }, { "epoch": 2.879566317857278, "grad_norm": 0.030634427443146706, "learning_rate": 9.511352045634846e-05, "loss": 0.1241, "step": 152450 }, { "epoch": 2.8805107476105927, "grad_norm": 0.029716376215219498, "learning_rate": 9.51082736243856e-05, "loss": 0.1239, "step": 152500 }, { "epoch": 2.8805107476105927, "eval_IntDiv": 0.6754511590058381, "eval_NumCircles": 1801, "eval_SumBottleneck": 112.71250499298053, "eval_Uniqueness": 0.9965594009309856, "eval_Validity": 0.9882, "eval_Validity * Uniqueness": 0.9847999999999999, "eval_loss": 0.22836735844612122, "eval_runtime": 151.2834, "eval_samples_per_second": 66.101, "eval_steps_per_second": 0.522, "step": 152500 }, { "epoch": 2.8814551773639074, "grad_norm": 0.030146805569529533, "learning_rate": 9.510302679242275e-05, "loss": 0.1241, "step": 152550 }, { "epoch": 2.8823996071172227, "grad_norm": 0.029940679669380188, "learning_rate": 9.509777996045988e-05, "loss": 0.1242, "step": 152600 }, { "epoch": 2.8833440368705374, "grad_norm": 0.030865265056490898, "learning_rate": 9.509253312849701e-05, "loss": 0.1242, "step": 152650 }, { "epoch": 2.8842884666238526, "grad_norm": 0.029241813346743584, "learning_rate": 9.508728629653416e-05, "loss": 0.1243, "step": 152700 }, { "epoch": 2.8852328963771674, "grad_norm": 0.02956436388194561, "learning_rate": 9.50820394645713e-05, "loss": 0.1242, "step": 152750 }, { "epoch": 2.8861773261304826, "grad_norm": 0.030417531728744507, "learning_rate": 9.507679263260843e-05, "loss": 0.1243, "step": 152800 }, { "epoch": 2.8871217558837974, "grad_norm": 0.028892945498228073, "learning_rate": 9.507154580064558e-05, "loss": 0.1242, "step": 152850 }, { "epoch": 2.888066185637112, "grad_norm": 0.032526008784770966, "learning_rate": 9.506629896868271e-05, "loss": 0.1241, "step": 152900 }, { "epoch": 2.8890106153904274, "grad_norm": 0.030549772083759308, "learning_rate": 9.506105213671986e-05, "loss": 0.1243, "step": 152950 }, { "epoch": 2.889955045143742, "grad_norm": 0.030052652582526207, "learning_rate": 9.505580530475699e-05, "loss": 0.124, "step": 153000 }, { "epoch": 2.890899474897057, "grad_norm": 0.03027515485882759, "learning_rate": 9.505055847279413e-05, "loss": 0.1244, "step": 153050 }, { "epoch": 2.891843904650372, "grad_norm": 0.029869453981518745, "learning_rate": 9.504531164083127e-05, "loss": 0.1243, "step": 153100 }, { "epoch": 2.8927883344036873, "grad_norm": 0.03055277280509472, "learning_rate": 9.504006480886841e-05, "loss": 0.1241, "step": 153150 }, { "epoch": 2.893732764157002, "grad_norm": 0.03320738300681114, "learning_rate": 9.503481797690554e-05, "loss": 0.1241, "step": 153200 }, { "epoch": 2.894677193910317, "grad_norm": 0.029844477772712708, "learning_rate": 9.502957114494269e-05, "loss": 0.1239, "step": 153250 }, { "epoch": 2.895621623663632, "grad_norm": 0.031142182648181915, "learning_rate": 9.502432431297982e-05, "loss": 0.1243, "step": 153300 }, { "epoch": 2.896566053416947, "grad_norm": 0.029807645827531815, "learning_rate": 9.501907748101697e-05, "loss": 0.124, "step": 153350 }, { "epoch": 2.8975104831702616, "grad_norm": 0.02967250533401966, "learning_rate": 9.50138306490541e-05, "loss": 0.1237, "step": 153400 }, { "epoch": 2.898454912923577, "grad_norm": 0.03079136088490486, "learning_rate": 9.500858381709125e-05, "loss": 0.1242, "step": 153450 }, { "epoch": 2.8993993426768916, "grad_norm": 0.03274829685688019, "learning_rate": 9.500333698512839e-05, "loss": 0.1238, "step": 153500 }, { "epoch": 2.900343772430207, "grad_norm": 0.029814649373292923, "learning_rate": 9.499809015316552e-05, "loss": 0.124, "step": 153550 }, { "epoch": 2.9012882021835216, "grad_norm": 0.031251855194568634, "learning_rate": 9.499284332120267e-05, "loss": 0.124, "step": 153600 }, { "epoch": 2.902232631936837, "grad_norm": 0.03163657337427139, "learning_rate": 9.49875964892398e-05, "loss": 0.1245, "step": 153650 }, { "epoch": 2.9031770616901516, "grad_norm": 0.02984117716550827, "learning_rate": 9.498234965727693e-05, "loss": 0.1241, "step": 153700 }, { "epoch": 2.9041214914434663, "grad_norm": 0.03070632554590702, "learning_rate": 9.497710282531408e-05, "loss": 0.1243, "step": 153750 }, { "epoch": 2.9050659211967815, "grad_norm": 0.030731244012713432, "learning_rate": 9.497185599335122e-05, "loss": 0.1242, "step": 153800 }, { "epoch": 2.9060103509500963, "grad_norm": 0.030058221891522408, "learning_rate": 9.496660916138835e-05, "loss": 0.1243, "step": 153850 }, { "epoch": 2.906954780703411, "grad_norm": 0.03684212267398834, "learning_rate": 9.49613623294255e-05, "loss": 0.1238, "step": 153900 }, { "epoch": 2.9078992104567263, "grad_norm": 0.030140936374664307, "learning_rate": 9.495611549746264e-05, "loss": 0.124, "step": 153950 }, { "epoch": 2.908843640210041, "grad_norm": 0.030845334753394127, "learning_rate": 9.495086866549976e-05, "loss": 0.1244, "step": 154000 }, { "epoch": 2.9097880699633563, "grad_norm": 0.032873041927814484, "learning_rate": 9.494562183353691e-05, "loss": 0.1242, "step": 154050 }, { "epoch": 2.910732499716671, "grad_norm": 0.029177797958254814, "learning_rate": 9.494037500157406e-05, "loss": 0.1237, "step": 154100 }, { "epoch": 2.9116769294699862, "grad_norm": 0.03281928971409798, "learning_rate": 9.49351281696112e-05, "loss": 0.1239, "step": 154150 }, { "epoch": 2.912621359223301, "grad_norm": 0.03168530762195587, "learning_rate": 9.492988133764833e-05, "loss": 0.1239, "step": 154200 }, { "epoch": 2.913565788976616, "grad_norm": 0.02998930960893631, "learning_rate": 9.492463450568548e-05, "loss": 0.124, "step": 154250 }, { "epoch": 2.914510218729931, "grad_norm": 0.03214602172374725, "learning_rate": 9.491938767372261e-05, "loss": 0.1239, "step": 154300 }, { "epoch": 2.9154546484832458, "grad_norm": 0.029457084834575653, "learning_rate": 9.491414084175974e-05, "loss": 0.1241, "step": 154350 }, { "epoch": 2.9163990782365605, "grad_norm": 0.03164689242839813, "learning_rate": 9.490889400979689e-05, "loss": 0.1239, "step": 154400 }, { "epoch": 2.9173435079898757, "grad_norm": 0.030171334743499756, "learning_rate": 9.490364717783404e-05, "loss": 0.1244, "step": 154450 }, { "epoch": 2.9182879377431905, "grad_norm": 0.030302755534648895, "learning_rate": 9.489840034587116e-05, "loss": 0.1241, "step": 154500 }, { "epoch": 2.9192323674965057, "grad_norm": 0.029300488531589508, "learning_rate": 9.48931535139083e-05, "loss": 0.1244, "step": 154550 }, { "epoch": 2.9201767972498205, "grad_norm": 0.03065422736108303, "learning_rate": 9.488790668194545e-05, "loss": 0.1241, "step": 154600 }, { "epoch": 2.9211212270031357, "grad_norm": 0.03169218823313713, "learning_rate": 9.488265984998259e-05, "loss": 0.1233, "step": 154650 }, { "epoch": 2.9220656567564505, "grad_norm": 0.03357355296611786, "learning_rate": 9.487741301801972e-05, "loss": 0.124, "step": 154700 }, { "epoch": 2.9230100865097652, "grad_norm": 0.030457772314548492, "learning_rate": 9.487216618605687e-05, "loss": 0.1239, "step": 154750 }, { "epoch": 2.9239545162630804, "grad_norm": 0.030103325843811035, "learning_rate": 9.4866919354094e-05, "loss": 0.1241, "step": 154800 }, { "epoch": 2.924898946016395, "grad_norm": 0.029994463548064232, "learning_rate": 9.486167252213114e-05, "loss": 0.1241, "step": 154850 }, { "epoch": 2.92584337576971, "grad_norm": 0.0303980503231287, "learning_rate": 9.485642569016828e-05, "loss": 0.1241, "step": 154900 }, { "epoch": 2.926787805523025, "grad_norm": 0.029470382258296013, "learning_rate": 9.485117885820543e-05, "loss": 0.1243, "step": 154950 }, { "epoch": 2.9277322352763404, "grad_norm": 0.030892470851540565, "learning_rate": 9.484593202624255e-05, "loss": 0.124, "step": 155000 }, { "epoch": 2.9277322352763404, "eval_IntDiv": 0.6753807574168076, "eval_NumCircles": 1759, "eval_SumBottleneck": 130.98107444634587, "eval_Uniqueness": 0.995960004039996, "eval_Validity": 0.9901, "eval_Validity * Uniqueness": 0.9861, "eval_loss": 0.2264726608991623, "eval_runtime": 150.7609, "eval_samples_per_second": 66.33, "eval_steps_per_second": 0.524, "step": 155000 }, { "epoch": 2.928676665029655, "grad_norm": 0.03193139284849167, "learning_rate": 9.48406851942797e-05, "loss": 0.1239, "step": 155050 }, { "epoch": 2.92962109478297, "grad_norm": 0.0299345962703228, "learning_rate": 9.483543836231685e-05, "loss": 0.1239, "step": 155100 }, { "epoch": 2.930565524536285, "grad_norm": 0.030979815870523453, "learning_rate": 9.483019153035397e-05, "loss": 0.1242, "step": 155150 }, { "epoch": 2.9315099542896, "grad_norm": 0.02980734594166279, "learning_rate": 9.482494469839111e-05, "loss": 0.1241, "step": 155200 }, { "epoch": 2.9324543840429147, "grad_norm": 0.03007327951490879, "learning_rate": 9.481969786642826e-05, "loss": 0.1243, "step": 155250 }, { "epoch": 2.93339881379623, "grad_norm": 0.02995985373854637, "learning_rate": 9.48144510344654e-05, "loss": 0.1239, "step": 155300 }, { "epoch": 2.9343432435495447, "grad_norm": 0.030454132705926895, "learning_rate": 9.480920420250253e-05, "loss": 0.1239, "step": 155350 }, { "epoch": 2.93528767330286, "grad_norm": 0.03090987727046013, "learning_rate": 9.480395737053968e-05, "loss": 0.1238, "step": 155400 }, { "epoch": 2.9362321030561747, "grad_norm": 0.03119453601539135, "learning_rate": 9.479871053857681e-05, "loss": 0.1238, "step": 155450 }, { "epoch": 2.93717653280949, "grad_norm": 0.030893098562955856, "learning_rate": 9.479346370661394e-05, "loss": 0.1242, "step": 155500 }, { "epoch": 2.9381209625628046, "grad_norm": 0.02955041266977787, "learning_rate": 9.478821687465109e-05, "loss": 0.1239, "step": 155550 }, { "epoch": 2.9390653923161194, "grad_norm": 0.030328072607517242, "learning_rate": 9.478297004268823e-05, "loss": 0.1241, "step": 155600 }, { "epoch": 2.9400098220694346, "grad_norm": 0.03025083616375923, "learning_rate": 9.477772321072536e-05, "loss": 0.1241, "step": 155650 }, { "epoch": 2.9409542518227494, "grad_norm": 0.031009269878268242, "learning_rate": 9.477247637876251e-05, "loss": 0.124, "step": 155700 }, { "epoch": 2.941898681576064, "grad_norm": 0.030988579615950584, "learning_rate": 9.476722954679965e-05, "loss": 0.1236, "step": 155750 }, { "epoch": 2.9428431113293794, "grad_norm": 0.03261903300881386, "learning_rate": 9.476198271483679e-05, "loss": 0.1237, "step": 155800 }, { "epoch": 2.943787541082694, "grad_norm": 0.03092227503657341, "learning_rate": 9.475673588287392e-05, "loss": 0.1241, "step": 155850 }, { "epoch": 2.9447319708360093, "grad_norm": 0.029566843062639236, "learning_rate": 9.475148905091107e-05, "loss": 0.124, "step": 155900 }, { "epoch": 2.945676400589324, "grad_norm": 0.02972228266298771, "learning_rate": 9.47462422189482e-05, "loss": 0.1241, "step": 155950 }, { "epoch": 2.9466208303426393, "grad_norm": 0.031306806951761246, "learning_rate": 9.474099538698534e-05, "loss": 0.1238, "step": 156000 }, { "epoch": 2.947565260095954, "grad_norm": 0.03085344098508358, "learning_rate": 9.473574855502249e-05, "loss": 0.1237, "step": 156050 }, { "epoch": 2.948509689849269, "grad_norm": 0.030973223969340324, "learning_rate": 9.473050172305962e-05, "loss": 0.1242, "step": 156100 }, { "epoch": 2.949454119602584, "grad_norm": 0.03048812784254551, "learning_rate": 9.472525489109675e-05, "loss": 0.1237, "step": 156150 }, { "epoch": 2.950398549355899, "grad_norm": 0.03498373180627823, "learning_rate": 9.47200080591339e-05, "loss": 0.1235, "step": 156200 }, { "epoch": 2.9513429791092136, "grad_norm": 0.031036848202347755, "learning_rate": 9.471476122717103e-05, "loss": 0.1237, "step": 156250 }, { "epoch": 2.952287408862529, "grad_norm": 0.030411291867494583, "learning_rate": 9.470951439520818e-05, "loss": 0.124, "step": 156300 }, { "epoch": 2.9532318386158436, "grad_norm": 0.031184542924165726, "learning_rate": 9.470426756324532e-05, "loss": 0.1241, "step": 156350 }, { "epoch": 2.954176268369159, "grad_norm": 0.030569372698664665, "learning_rate": 9.469902073128245e-05, "loss": 0.1238, "step": 156400 }, { "epoch": 2.9551206981224736, "grad_norm": 0.03029923513531685, "learning_rate": 9.46937738993196e-05, "loss": 0.124, "step": 156450 }, { "epoch": 2.956065127875789, "grad_norm": 0.030520964413881302, "learning_rate": 9.468852706735673e-05, "loss": 0.1238, "step": 156500 }, { "epoch": 2.9570095576291036, "grad_norm": 0.03238176926970482, "learning_rate": 9.468328023539388e-05, "loss": 0.124, "step": 156550 }, { "epoch": 2.9579539873824183, "grad_norm": 0.028946757316589355, "learning_rate": 9.467803340343101e-05, "loss": 0.1238, "step": 156600 }, { "epoch": 2.9588984171357335, "grad_norm": 0.029789486899971962, "learning_rate": 9.467278657146815e-05, "loss": 0.1242, "step": 156650 }, { "epoch": 2.9598428468890483, "grad_norm": 0.029594004154205322, "learning_rate": 9.46675397395053e-05, "loss": 0.1239, "step": 156700 }, { "epoch": 2.960787276642363, "grad_norm": 0.03217633441090584, "learning_rate": 9.466229290754243e-05, "loss": 0.1239, "step": 156750 }, { "epoch": 2.9617317063956783, "grad_norm": 0.030481096357107162, "learning_rate": 9.465704607557958e-05, "loss": 0.1237, "step": 156800 }, { "epoch": 2.9626761361489935, "grad_norm": 0.03275182098150253, "learning_rate": 9.465179924361671e-05, "loss": 0.1238, "step": 156850 }, { "epoch": 2.9636205659023083, "grad_norm": 0.03244251012802124, "learning_rate": 9.464655241165384e-05, "loss": 0.124, "step": 156900 }, { "epoch": 2.964564995655623, "grad_norm": 0.04609978571534157, "learning_rate": 9.464130557969099e-05, "loss": 0.1236, "step": 156950 }, { "epoch": 2.9655094254089382, "grad_norm": 0.03171761706471443, "learning_rate": 9.463605874772812e-05, "loss": 0.1238, "step": 157000 }, { "epoch": 2.966453855162253, "grad_norm": 0.029186898842453957, "learning_rate": 9.463081191576526e-05, "loss": 0.1236, "step": 157050 }, { "epoch": 2.967398284915568, "grad_norm": 0.02995595708489418, "learning_rate": 9.46255650838024e-05, "loss": 0.1235, "step": 157100 }, { "epoch": 2.968342714668883, "grad_norm": 0.030154472216963768, "learning_rate": 9.462031825183954e-05, "loss": 0.1238, "step": 157150 }, { "epoch": 2.9692871444221978, "grad_norm": 0.03014478273689747, "learning_rate": 9.461507141987669e-05, "loss": 0.1237, "step": 157200 }, { "epoch": 2.970231574175513, "grad_norm": 0.029089974239468575, "learning_rate": 9.460982458791382e-05, "loss": 0.124, "step": 157250 }, { "epoch": 2.9711760039288277, "grad_norm": 0.031166354194283485, "learning_rate": 9.460457775595097e-05, "loss": 0.1242, "step": 157300 }, { "epoch": 2.972120433682143, "grad_norm": 0.029407722875475883, "learning_rate": 9.45993309239881e-05, "loss": 0.1235, "step": 157350 }, { "epoch": 2.9730648634354577, "grad_norm": 0.03141268342733383, "learning_rate": 9.459408409202524e-05, "loss": 0.1234, "step": 157400 }, { "epoch": 2.9740092931887725, "grad_norm": 0.030987806618213654, "learning_rate": 9.458883726006238e-05, "loss": 0.1238, "step": 157450 }, { "epoch": 2.9749537229420877, "grad_norm": 0.03140963986515999, "learning_rate": 9.458359042809952e-05, "loss": 0.1236, "step": 157500 }, { "epoch": 2.9749537229420877, "eval_IntDiv": 0.6751810883115703, "eval_NumCircles": 1831, "eval_SumBottleneck": 127.51099242035768, "eval_Uniqueness": 0.9972763038434379, "eval_Validity": 0.9913, "eval_Validity * Uniqueness": 0.9885999999999999, "eval_loss": 0.22699880599975586, "eval_runtime": 159.162, "eval_samples_per_second": 62.829, "eval_steps_per_second": 0.496, "step": 157500 }, { "epoch": 2.9758981526954025, "grad_norm": 0.03078465536236763, "learning_rate": 9.457834359613665e-05, "loss": 0.1235, "step": 157550 }, { "epoch": 2.9768425824487172, "grad_norm": 0.030992714688181877, "learning_rate": 9.45730967641738e-05, "loss": 0.1241, "step": 157600 }, { "epoch": 2.9777870122020325, "grad_norm": 0.031937360763549805, "learning_rate": 9.456784993221093e-05, "loss": 0.124, "step": 157650 }, { "epoch": 2.9787314419553472, "grad_norm": 0.030401287600398064, "learning_rate": 9.456260310024807e-05, "loss": 0.1238, "step": 157700 }, { "epoch": 2.9796758717086624, "grad_norm": 0.030253244563937187, "learning_rate": 9.455735626828521e-05, "loss": 0.1241, "step": 157750 }, { "epoch": 2.980620301461977, "grad_norm": 0.03143264353275299, "learning_rate": 9.455210943632236e-05, "loss": 0.124, "step": 157800 }, { "epoch": 2.9815647312152924, "grad_norm": 0.030856089666485786, "learning_rate": 9.454686260435948e-05, "loss": 0.1235, "step": 157850 }, { "epoch": 2.982509160968607, "grad_norm": 0.03179367259144783, "learning_rate": 9.454161577239663e-05, "loss": 0.1238, "step": 157900 }, { "epoch": 2.983453590721922, "grad_norm": 0.029089946299791336, "learning_rate": 9.453636894043378e-05, "loss": 0.1233, "step": 157950 }, { "epoch": 2.984398020475237, "grad_norm": 0.029514018446207047, "learning_rate": 9.453112210847091e-05, "loss": 0.124, "step": 158000 }, { "epoch": 2.985342450228552, "grad_norm": 0.03045920468866825, "learning_rate": 9.452587527650804e-05, "loss": 0.1239, "step": 158050 }, { "epoch": 2.9862868799818667, "grad_norm": 0.030663738027215004, "learning_rate": 9.452062844454519e-05, "loss": 0.124, "step": 158100 }, { "epoch": 2.987231309735182, "grad_norm": 0.030752604827284813, "learning_rate": 9.451538161258233e-05, "loss": 0.1238, "step": 158150 }, { "epoch": 2.9881757394884967, "grad_norm": 0.02938421256840229, "learning_rate": 9.451013478061946e-05, "loss": 0.1241, "step": 158200 }, { "epoch": 2.989120169241812, "grad_norm": 0.02930537797510624, "learning_rate": 9.450488794865661e-05, "loss": 0.1235, "step": 158250 }, { "epoch": 2.9900645989951267, "grad_norm": 0.030464576557278633, "learning_rate": 9.449964111669376e-05, "loss": 0.1234, "step": 158300 }, { "epoch": 2.991009028748442, "grad_norm": 0.031350091099739075, "learning_rate": 9.449439428473088e-05, "loss": 0.1243, "step": 158350 }, { "epoch": 2.9919534585017566, "grad_norm": 0.0305135827511549, "learning_rate": 9.448914745276802e-05, "loss": 0.1236, "step": 158400 }, { "epoch": 2.9928978882550714, "grad_norm": 0.030921433120965958, "learning_rate": 9.448390062080517e-05, "loss": 0.1239, "step": 158450 }, { "epoch": 2.9938423180083866, "grad_norm": 0.039991192519664764, "learning_rate": 9.447865378884229e-05, "loss": 0.1238, "step": 158500 }, { "epoch": 2.9947867477617014, "grad_norm": 0.033750858157873154, "learning_rate": 9.447340695687944e-05, "loss": 0.1243, "step": 158550 }, { "epoch": 2.995731177515016, "grad_norm": 0.030020590871572495, "learning_rate": 9.446816012491659e-05, "loss": 0.1237, "step": 158600 }, { "epoch": 2.9966756072683314, "grad_norm": 0.0305172111839056, "learning_rate": 9.446291329295372e-05, "loss": 0.1237, "step": 158650 }, { "epoch": 2.9976200370216466, "grad_norm": 0.030973752960562706, "learning_rate": 9.445766646099085e-05, "loss": 0.1239, "step": 158700 }, { "epoch": 2.9985644667749614, "grad_norm": 0.030267532914876938, "learning_rate": 9.4452419629028e-05, "loss": 0.1237, "step": 158750 }, { "epoch": 2.999508896528276, "grad_norm": 0.02969502843916416, "learning_rate": 9.444717279706515e-05, "loss": 0.1239, "step": 158800 }, { "epoch": 3.0004533262815913, "grad_norm": 0.03173915296792984, "learning_rate": 9.444192596510227e-05, "loss": 0.1236, "step": 158850 }, { "epoch": 3.001397756034906, "grad_norm": 0.03185234218835831, "learning_rate": 9.443667913313942e-05, "loss": 0.1236, "step": 158900 }, { "epoch": 3.002342185788221, "grad_norm": 0.03149121627211571, "learning_rate": 9.443143230117656e-05, "loss": 0.1234, "step": 158950 }, { "epoch": 3.003286615541536, "grad_norm": 0.030765732750296593, "learning_rate": 9.442618546921368e-05, "loss": 0.1235, "step": 159000 }, { "epoch": 3.004231045294851, "grad_norm": 0.031362440437078476, "learning_rate": 9.442093863725083e-05, "loss": 0.1239, "step": 159050 }, { "epoch": 3.005175475048166, "grad_norm": 0.029362289234995842, "learning_rate": 9.441569180528798e-05, "loss": 0.123, "step": 159100 }, { "epoch": 3.006119904801481, "grad_norm": 0.030735842883586884, "learning_rate": 9.441044497332511e-05, "loss": 0.1234, "step": 159150 }, { "epoch": 3.0070643345547956, "grad_norm": 0.031287066638469696, "learning_rate": 9.440519814136225e-05, "loss": 0.1235, "step": 159200 }, { "epoch": 3.008008764308111, "grad_norm": 0.03278295695781708, "learning_rate": 9.43999513093994e-05, "loss": 0.1236, "step": 159250 }, { "epoch": 3.0089531940614256, "grad_norm": 0.03188945725560188, "learning_rate": 9.439470447743653e-05, "loss": 0.1236, "step": 159300 }, { "epoch": 3.009897623814741, "grad_norm": 0.030972128733992577, "learning_rate": 9.438945764547366e-05, "loss": 0.1232, "step": 159350 }, { "epoch": 3.0108420535680556, "grad_norm": 0.03045603074133396, "learning_rate": 9.438421081351081e-05, "loss": 0.1233, "step": 159400 }, { "epoch": 3.0117864833213708, "grad_norm": 0.031380441039800644, "learning_rate": 9.437896398154794e-05, "loss": 0.1232, "step": 159450 }, { "epoch": 3.0127309130746855, "grad_norm": 0.030158083885908127, "learning_rate": 9.437371714958508e-05, "loss": 0.1236, "step": 159500 }, { "epoch": 3.0136753428280003, "grad_norm": 0.03185613453388214, "learning_rate": 9.436847031762222e-05, "loss": 0.1236, "step": 159550 }, { "epoch": 3.0146197725813155, "grad_norm": 0.030171716585755348, "learning_rate": 9.436322348565937e-05, "loss": 0.1232, "step": 159600 }, { "epoch": 3.0155642023346303, "grad_norm": 0.030458660796284676, "learning_rate": 9.43579766536965e-05, "loss": 0.1236, "step": 159650 }, { "epoch": 3.0165086320879455, "grad_norm": 0.02919768914580345, "learning_rate": 9.435272982173364e-05, "loss": 0.1236, "step": 159700 }, { "epoch": 3.0174530618412603, "grad_norm": 0.033059343695640564, "learning_rate": 9.434748298977079e-05, "loss": 0.1236, "step": 159750 }, { "epoch": 3.018397491594575, "grad_norm": 0.03114180639386177, "learning_rate": 9.434223615780792e-05, "loss": 0.1232, "step": 159800 }, { "epoch": 3.0193419213478903, "grad_norm": 0.030235888436436653, "learning_rate": 9.433698932584506e-05, "loss": 0.1233, "step": 159850 }, { "epoch": 3.020286351101205, "grad_norm": 0.03075767494738102, "learning_rate": 9.43317424938822e-05, "loss": 0.1235, "step": 159900 }, { "epoch": 3.0212307808545202, "grad_norm": 0.030777424573898315, "learning_rate": 9.432649566191934e-05, "loss": 0.1231, "step": 159950 }, { "epoch": 3.022175210607835, "grad_norm": 0.029254883527755737, "learning_rate": 9.432124882995647e-05, "loss": 0.1236, "step": 160000 }, { "epoch": 3.022175210607835, "eval_IntDiv": 0.6755930850853908, "eval_NumCircles": 1790, "eval_SumBottleneck": 77.88659800028454, "eval_Uniqueness": 0.9967712642518414, "eval_Validity": 0.9911, "eval_Validity * Uniqueness": 0.9879, "eval_loss": 0.23043379187583923, "eval_runtime": 147.9287, "eval_samples_per_second": 67.6, "eval_steps_per_second": 0.534, "step": 160000 }, { "epoch": 3.0231196403611498, "grad_norm": 0.031245851889252663, "learning_rate": 9.431600199799362e-05, "loss": 0.1234, "step": 160050 }, { "epoch": 3.024064070114465, "grad_norm": 0.031074659898877144, "learning_rate": 9.431075516603075e-05, "loss": 0.1236, "step": 160100 }, { "epoch": 3.0250084998677798, "grad_norm": 0.030625561252236366, "learning_rate": 9.43055083340679e-05, "loss": 0.1235, "step": 160150 }, { "epoch": 3.025952929621095, "grad_norm": 0.031566619873046875, "learning_rate": 9.430026150210503e-05, "loss": 0.1238, "step": 160200 }, { "epoch": 3.0268973593744097, "grad_norm": 0.030760711058974266, "learning_rate": 9.429501467014217e-05, "loss": 0.1235, "step": 160250 }, { "epoch": 3.0278417891277245, "grad_norm": 0.03177009895443916, "learning_rate": 9.428976783817931e-05, "loss": 0.124, "step": 160300 }, { "epoch": 3.0287862188810397, "grad_norm": 0.030511317774653435, "learning_rate": 9.428452100621645e-05, "loss": 0.1236, "step": 160350 }, { "epoch": 3.0297306486343545, "grad_norm": 0.031585536897182465, "learning_rate": 9.42792741742536e-05, "loss": 0.1235, "step": 160400 }, { "epoch": 3.0306750783876697, "grad_norm": 0.029559988528490067, "learning_rate": 9.427402734229073e-05, "loss": 0.1236, "step": 160450 }, { "epoch": 3.0316195081409845, "grad_norm": 0.03184564784169197, "learning_rate": 9.426878051032786e-05, "loss": 0.1235, "step": 160500 }, { "epoch": 3.0325639378942992, "grad_norm": 0.029830627143383026, "learning_rate": 9.426353367836501e-05, "loss": 0.1236, "step": 160550 }, { "epoch": 3.0335083676476144, "grad_norm": 0.0427539199590683, "learning_rate": 9.425828684640215e-05, "loss": 0.1235, "step": 160600 }, { "epoch": 3.034452797400929, "grad_norm": 0.02963174134492874, "learning_rate": 9.425304001443929e-05, "loss": 0.1232, "step": 160650 }, { "epoch": 3.0353972271542444, "grad_norm": 0.033669885247945786, "learning_rate": 9.424779318247643e-05, "loss": 0.1234, "step": 160700 }, { "epoch": 3.036341656907559, "grad_norm": 0.03216470405459404, "learning_rate": 9.424254635051356e-05, "loss": 0.1234, "step": 160750 }, { "epoch": 3.037286086660874, "grad_norm": 0.030175279825925827, "learning_rate": 9.423729951855071e-05, "loss": 0.1233, "step": 160800 }, { "epoch": 3.038230516414189, "grad_norm": 0.03274207562208176, "learning_rate": 9.423205268658784e-05, "loss": 0.1232, "step": 160850 }, { "epoch": 3.039174946167504, "grad_norm": 0.030740777030587196, "learning_rate": 9.422680585462498e-05, "loss": 0.1235, "step": 160900 }, { "epoch": 3.040119375920819, "grad_norm": 0.03072310984134674, "learning_rate": 9.422155902266212e-05, "loss": 0.1233, "step": 160950 }, { "epoch": 3.041063805674134, "grad_norm": 0.03217470645904541, "learning_rate": 9.421631219069926e-05, "loss": 0.1234, "step": 161000 }, { "epoch": 3.0420082354274487, "grad_norm": 0.03042328543961048, "learning_rate": 9.421106535873639e-05, "loss": 0.1236, "step": 161050 }, { "epoch": 3.042952665180764, "grad_norm": 0.02958352118730545, "learning_rate": 9.420581852677354e-05, "loss": 0.1233, "step": 161100 }, { "epoch": 3.0438970949340787, "grad_norm": 0.029310936108231544, "learning_rate": 9.420057169481069e-05, "loss": 0.1233, "step": 161150 }, { "epoch": 3.044841524687394, "grad_norm": 0.030509455129504204, "learning_rate": 9.419532486284782e-05, "loss": 0.1232, "step": 161200 }, { "epoch": 3.0457859544407087, "grad_norm": 0.03241512179374695, "learning_rate": 9.419007803088495e-05, "loss": 0.1232, "step": 161250 }, { "epoch": 3.046730384194024, "grad_norm": 0.031190838664770126, "learning_rate": 9.41848311989221e-05, "loss": 0.1234, "step": 161300 }, { "epoch": 3.0476748139473386, "grad_norm": 0.029773946851491928, "learning_rate": 9.417958436695923e-05, "loss": 0.1232, "step": 161350 }, { "epoch": 3.0486192437006534, "grad_norm": 0.03056354448199272, "learning_rate": 9.417433753499637e-05, "loss": 0.1234, "step": 161400 }, { "epoch": 3.0495636734539686, "grad_norm": 0.03138606622815132, "learning_rate": 9.416909070303352e-05, "loss": 0.1235, "step": 161450 }, { "epoch": 3.0505081032072834, "grad_norm": 0.030519990250468254, "learning_rate": 9.416384387107065e-05, "loss": 0.1233, "step": 161500 }, { "epoch": 3.0514525329605986, "grad_norm": 0.032704342156648636, "learning_rate": 9.415859703910778e-05, "loss": 0.1236, "step": 161550 }, { "epoch": 3.0523969627139134, "grad_norm": 0.02988733910024166, "learning_rate": 9.415335020714493e-05, "loss": 0.1237, "step": 161600 }, { "epoch": 3.053341392467228, "grad_norm": 0.033243220299482346, "learning_rate": 9.414810337518208e-05, "loss": 0.1234, "step": 161650 }, { "epoch": 3.0542858222205433, "grad_norm": 0.029969921335577965, "learning_rate": 9.41428565432192e-05, "loss": 0.1234, "step": 161700 }, { "epoch": 3.055230251973858, "grad_norm": 0.02988543175160885, "learning_rate": 9.413760971125635e-05, "loss": 0.1236, "step": 161750 }, { "epoch": 3.0561746817271733, "grad_norm": 0.030185097828507423, "learning_rate": 9.41323628792935e-05, "loss": 0.1232, "step": 161800 }, { "epoch": 3.057119111480488, "grad_norm": 0.03167417272925377, "learning_rate": 9.412711604733061e-05, "loss": 0.1234, "step": 161850 }, { "epoch": 3.058063541233803, "grad_norm": 0.031165946274995804, "learning_rate": 9.412186921536776e-05, "loss": 0.1233, "step": 161900 }, { "epoch": 3.059007970987118, "grad_norm": 0.031182730570435524, "learning_rate": 9.411662238340491e-05, "loss": 0.1233, "step": 161950 }, { "epoch": 3.059952400740433, "grad_norm": 0.0320664681494236, "learning_rate": 9.411137555144204e-05, "loss": 0.1231, "step": 162000 }, { "epoch": 3.060896830493748, "grad_norm": 0.03093823790550232, "learning_rate": 9.410612871947918e-05, "loss": 0.1234, "step": 162050 }, { "epoch": 3.061841260247063, "grad_norm": 0.030557693913578987, "learning_rate": 9.410088188751632e-05, "loss": 0.1233, "step": 162100 }, { "epoch": 3.0627856900003776, "grad_norm": 0.030610332265496254, "learning_rate": 9.409563505555347e-05, "loss": 0.1234, "step": 162150 }, { "epoch": 3.063730119753693, "grad_norm": 0.03080502711236477, "learning_rate": 9.409038822359059e-05, "loss": 0.1233, "step": 162200 }, { "epoch": 3.0646745495070076, "grad_norm": 0.029564280062913895, "learning_rate": 9.408514139162774e-05, "loss": 0.1231, "step": 162250 }, { "epoch": 3.065618979260323, "grad_norm": 0.03041326254606247, "learning_rate": 9.407989455966489e-05, "loss": 0.1229, "step": 162300 }, { "epoch": 3.0665634090136376, "grad_norm": 0.03158561512827873, "learning_rate": 9.407464772770201e-05, "loss": 0.1233, "step": 162350 }, { "epoch": 3.0675078387669523, "grad_norm": 0.03127938136458397, "learning_rate": 9.406940089573916e-05, "loss": 0.1234, "step": 162400 }, { "epoch": 3.0684522685202675, "grad_norm": 0.02966582588851452, "learning_rate": 9.40641540637763e-05, "loss": 0.1232, "step": 162450 }, { "epoch": 3.0693966982735823, "grad_norm": 0.0301327146589756, "learning_rate": 9.405890723181344e-05, "loss": 0.1234, "step": 162500 }, { "epoch": 3.0693966982735823, "eval_IntDiv": 0.6741110615181577, "eval_NumCircles": 1800, "eval_SumBottleneck": 155.5064008940473, "eval_Uniqueness": 0.9967728922952803, "eval_Validity": 0.9916, "eval_Validity * Uniqueness": 0.9884000000000001, "eval_loss": 0.22666501998901367, "eval_runtime": 151.6842, "eval_samples_per_second": 65.926, "eval_steps_per_second": 0.521, "step": 162500 }, { "epoch": 3.0703411280268975, "grad_norm": 0.030422020703554153, "learning_rate": 9.405366039985057e-05, "loss": 0.1236, "step": 162550 }, { "epoch": 3.0712855577802123, "grad_norm": 0.03093128278851509, "learning_rate": 9.404841356788772e-05, "loss": 0.1235, "step": 162600 }, { "epoch": 3.072229987533527, "grad_norm": 0.0318017341196537, "learning_rate": 9.404316673592485e-05, "loss": 0.1234, "step": 162650 }, { "epoch": 3.0731744172868423, "grad_norm": 0.03227454051375389, "learning_rate": 9.403791990396199e-05, "loss": 0.1234, "step": 162700 }, { "epoch": 3.074118847040157, "grad_norm": 0.0319363996386528, "learning_rate": 9.403267307199913e-05, "loss": 0.1233, "step": 162750 }, { "epoch": 3.0750632767934722, "grad_norm": 0.030314335599541664, "learning_rate": 9.402742624003628e-05, "loss": 0.1232, "step": 162800 }, { "epoch": 3.076007706546787, "grad_norm": 0.030228281393647194, "learning_rate": 9.40221794080734e-05, "loss": 0.1235, "step": 162850 }, { "epoch": 3.0769521363001022, "grad_norm": 0.032179996371269226, "learning_rate": 9.401693257611055e-05, "loss": 0.1232, "step": 162900 }, { "epoch": 3.077896566053417, "grad_norm": 0.031232589855790138, "learning_rate": 9.40116857441477e-05, "loss": 0.1232, "step": 162950 }, { "epoch": 3.0788409958067318, "grad_norm": 0.030301764607429504, "learning_rate": 9.400643891218483e-05, "loss": 0.1235, "step": 163000 }, { "epoch": 3.079785425560047, "grad_norm": 0.031947989016771317, "learning_rate": 9.400119208022196e-05, "loss": 0.1233, "step": 163050 }, { "epoch": 3.0807298553133617, "grad_norm": 0.03043929859995842, "learning_rate": 9.399594524825911e-05, "loss": 0.1234, "step": 163100 }, { "epoch": 3.081674285066677, "grad_norm": 0.03049435280263424, "learning_rate": 9.399069841629625e-05, "loss": 0.1237, "step": 163150 }, { "epoch": 3.0826187148199917, "grad_norm": 0.03066340461373329, "learning_rate": 9.398545158433338e-05, "loss": 0.1232, "step": 163200 }, { "epoch": 3.0835631445733065, "grad_norm": 0.03302876651287079, "learning_rate": 9.398020475237053e-05, "loss": 0.1232, "step": 163250 }, { "epoch": 3.0845075743266217, "grad_norm": 0.0319611057639122, "learning_rate": 9.397495792040766e-05, "loss": 0.1232, "step": 163300 }, { "epoch": 3.0854520040799365, "grad_norm": 0.03421981260180473, "learning_rate": 9.39697110884448e-05, "loss": 0.1233, "step": 163350 }, { "epoch": 3.0863964338332517, "grad_norm": 0.031150560826063156, "learning_rate": 9.396446425648194e-05, "loss": 0.1233, "step": 163400 }, { "epoch": 3.0873408635865665, "grad_norm": 0.02990487776696682, "learning_rate": 9.395921742451908e-05, "loss": 0.1234, "step": 163450 }, { "epoch": 3.088285293339881, "grad_norm": 0.03053167089819908, "learning_rate": 9.395397059255622e-05, "loss": 0.1236, "step": 163500 }, { "epoch": 3.0892297230931964, "grad_norm": 0.031231245025992393, "learning_rate": 9.394872376059336e-05, "loss": 0.1232, "step": 163550 }, { "epoch": 3.090174152846511, "grad_norm": 0.03200772777199745, "learning_rate": 9.39434769286305e-05, "loss": 0.1236, "step": 163600 }, { "epoch": 3.0911185825998264, "grad_norm": 0.04483465105295181, "learning_rate": 9.393823009666764e-05, "loss": 0.1233, "step": 163650 }, { "epoch": 3.092063012353141, "grad_norm": 0.03081994690001011, "learning_rate": 9.393298326470477e-05, "loss": 0.1228, "step": 163700 }, { "epoch": 3.093007442106456, "grad_norm": 0.03111526556313038, "learning_rate": 9.392773643274192e-05, "loss": 0.1236, "step": 163750 }, { "epoch": 3.093951871859771, "grad_norm": 0.03290475532412529, "learning_rate": 9.392248960077905e-05, "loss": 0.1235, "step": 163800 }, { "epoch": 3.094896301613086, "grad_norm": 0.030884582549333572, "learning_rate": 9.391724276881619e-05, "loss": 0.1233, "step": 163850 }, { "epoch": 3.095840731366401, "grad_norm": 0.02979167178273201, "learning_rate": 9.391199593685334e-05, "loss": 0.1237, "step": 163900 }, { "epoch": 3.096785161119716, "grad_norm": 0.030847247689962387, "learning_rate": 9.390674910489047e-05, "loss": 0.1231, "step": 163950 }, { "epoch": 3.0977295908730307, "grad_norm": 0.03103218600153923, "learning_rate": 9.390150227292762e-05, "loss": 0.1234, "step": 164000 }, { "epoch": 3.098674020626346, "grad_norm": 0.032022085040807724, "learning_rate": 9.389625544096475e-05, "loss": 0.1233, "step": 164050 }, { "epoch": 3.0996184503796607, "grad_norm": 0.03231204301118851, "learning_rate": 9.389100860900188e-05, "loss": 0.1232, "step": 164100 }, { "epoch": 3.100562880132976, "grad_norm": 0.03138069808483124, "learning_rate": 9.388576177703903e-05, "loss": 0.1235, "step": 164150 }, { "epoch": 3.1015073098862906, "grad_norm": 0.03135951980948448, "learning_rate": 9.388051494507617e-05, "loss": 0.1235, "step": 164200 }, { "epoch": 3.1024517396396054, "grad_norm": 0.032286614179611206, "learning_rate": 9.38752681131133e-05, "loss": 0.1232, "step": 164250 }, { "epoch": 3.1033961693929206, "grad_norm": 0.030674278736114502, "learning_rate": 9.387002128115045e-05, "loss": 0.1236, "step": 164300 }, { "epoch": 3.1043405991462354, "grad_norm": 0.030325086787343025, "learning_rate": 9.386477444918758e-05, "loss": 0.1234, "step": 164350 }, { "epoch": 3.1052850288995506, "grad_norm": 0.031174805015325546, "learning_rate": 9.385952761722473e-05, "loss": 0.1228, "step": 164400 }, { "epoch": 3.1062294586528654, "grad_norm": 0.03184359893202782, "learning_rate": 9.385428078526186e-05, "loss": 0.1237, "step": 164450 }, { "epoch": 3.10717388840618, "grad_norm": 0.031295936554670334, "learning_rate": 9.384903395329901e-05, "loss": 0.1233, "step": 164500 }, { "epoch": 3.1081183181594954, "grad_norm": 0.03018672578036785, "learning_rate": 9.384378712133614e-05, "loss": 0.1235, "step": 164550 }, { "epoch": 3.10906274791281, "grad_norm": 0.030191898345947266, "learning_rate": 9.383854028937328e-05, "loss": 0.1236, "step": 164600 }, { "epoch": 3.1100071776661253, "grad_norm": 0.03210653364658356, "learning_rate": 9.383329345741042e-05, "loss": 0.123, "step": 164650 }, { "epoch": 3.11095160741944, "grad_norm": 0.031393129378557205, "learning_rate": 9.382804662544756e-05, "loss": 0.1234, "step": 164700 }, { "epoch": 3.1118960371727553, "grad_norm": 0.029841627925634384, "learning_rate": 9.382279979348469e-05, "loss": 0.1235, "step": 164750 }, { "epoch": 3.11284046692607, "grad_norm": 0.03104235976934433, "learning_rate": 9.381755296152184e-05, "loss": 0.1231, "step": 164800 }, { "epoch": 3.113784896679385, "grad_norm": 0.02976902946829796, "learning_rate": 9.381230612955897e-05, "loss": 0.1235, "step": 164850 }, { "epoch": 3.1147293264327, "grad_norm": 0.03283771499991417, "learning_rate": 9.380705929759611e-05, "loss": 0.1232, "step": 164900 }, { "epoch": 3.115673756186015, "grad_norm": 0.03152434527873993, "learning_rate": 9.380181246563326e-05, "loss": 0.1236, "step": 164950 }, { "epoch": 3.11661818593933, "grad_norm": 0.03260129317641258, "learning_rate": 9.37965656336704e-05, "loss": 0.1234, "step": 165000 }, { "epoch": 3.11661818593933, "eval_IntDiv": 0.6761449903097957, "eval_NumCircles": 1761, "eval_SumBottleneck": 119.13335492781925, "eval_Uniqueness": 0.9972798710457385, "eval_Validity": 0.9926, "eval_Validity * Uniqueness": 0.9899, "eval_loss": 0.22647763788700104, "eval_runtime": 211.0789, "eval_samples_per_second": 47.376, "eval_steps_per_second": 0.374, "step": 165000 } ], "logging_steps": 50, "max_steps": 1058840, "num_input_tokens_seen": 0, "num_train_epochs": 20, "save_steps": 2500, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 10, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 0 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 1.4718070254030815e+19, "train_batch_size": 512, "trial_name": null, "trial_params": null }