{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 0.14379178948882018, "eval_steps": 500, "global_step": 500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "ce_ib": 65.99971008300781, "ce_orig": 0.8247115612030029, "epoch": 0, "kl_loss": 3969.01025390625, "loss_ib": 39.69670104980469, "step": 0 }, { "ce_ib": 61.875301361083984, "ce_orig": 0.3094598948955536, "epoch": 0, "kl_loss": 1816.435302734375, "loss_ib": 18.17053985595703, "step": 0 }, { "ce_ib": 65.33805084228516, "ce_orig": 1.0820972919464111, "epoch": 0, "kl_loss": 4051.13818359375, "loss_ib": 40.517913818359375, "step": 0 }, { "ce_ib": 65.36083221435547, "ce_orig": 0.8601827025413513, "epoch": 0, "kl_loss": 3727.80126953125, "loss_ib": 37.2845458984375, "step": 0 }, { "ce_ib": 64.40461730957031, "ce_orig": 1.3601988554000854, "epoch": 0.00028758357897764035, "kl_loss": 3548.660888671875, "loss_ib": 35.49304962158203, "step": 1 }, { "ce_ib": 66.136474609375, "ce_orig": 0.9451982975006104, "epoch": 0.00028758357897764035, "kl_loss": 4003.119140625, "loss_ib": 40.037803649902344, "step": 1 }, { "ce_ib": 65.30732727050781, "ce_orig": 1.3611608743667603, "epoch": 0.00028758357897764035, "kl_loss": 3076.302490234375, "loss_ib": 30.769554138183594, "step": 1 }, { "ce_ib": 63.613216400146484, "ce_orig": 0.5681392550468445, "epoch": 0.00028758357897764035, "kl_loss": 3922.22265625, "loss_ib": 39.22858810424805, "step": 1 }, { "ce_ib": 65.20169067382812, "ce_orig": 0.9869711399078369, "epoch": 0.0005751671579552807, "kl_loss": 4010.333251953125, "loss_ib": 40.1098518371582, "step": 2 }, { "ce_ib": 64.6613540649414, "ce_orig": 1.0124142169952393, "epoch": 0.0005751671579552807, "kl_loss": 3416.4658203125, "loss_ib": 34.17112350463867, "step": 2 }, { "ce_ib": 64.3924560546875, "ce_orig": 0.825140118598938, "epoch": 0.0005751671579552807, "kl_loss": 3954.5244140625, "loss_ib": 39.55168533325195, "step": 2 }, { "ce_ib": 66.31563568115234, "ce_orig": 1.6114795207977295, "epoch": 0.0005751671579552807, "kl_loss": 3360.53955078125, "loss_ib": 33.61202621459961, "step": 2 }, { "ce_ib": 63.97846603393555, "ce_orig": 1.0248628854751587, "epoch": 0.0008627507369329212, "kl_loss": 3866.74462890625, "loss_ib": 38.67384338378906, "step": 3 }, { "ce_ib": 64.94669342041016, "ce_orig": 0.7158174514770508, "epoch": 0.0008627507369329212, "kl_loss": 3586.52783203125, "loss_ib": 35.87177276611328, "step": 3 }, { "ce_ib": 66.78568267822266, "ce_orig": 1.1728931665420532, "epoch": 0.0008627507369329212, "kl_loss": 3981.269775390625, "loss_ib": 39.81937789916992, "step": 3 }, { "ce_ib": 66.30445861816406, "ce_orig": 0.9273799657821655, "epoch": 0.0008627507369329212, "kl_loss": 3999.728271484375, "loss_ib": 40.00391387939453, "step": 3 }, { "ce_ib": 63.22294616699219, "ce_orig": 0.6721798181533813, "epoch": 0.0011503343159105614, "kl_loss": 3434.2626953125, "loss_ib": 34.34894943237305, "step": 4 }, { "ce_ib": 65.629150390625, "ce_orig": 0.851636528968811, "epoch": 0.0011503343159105614, "kl_loss": 3777.80029296875, "loss_ib": 37.78456497192383, "step": 4 }, { "ce_ib": 65.70416259765625, "ce_orig": 0.8407150506973267, "epoch": 0.0011503343159105614, "kl_loss": 3663.44775390625, "loss_ib": 36.641048431396484, "step": 4 }, { "ce_ib": 65.25149536132812, "ce_orig": 0.8431562781333923, "epoch": 0.0011503343159105614, "kl_loss": 4073.102783203125, "loss_ib": 40.737552642822266, "step": 4 }, { "epoch": 0.0014379178948882019, "grad_norm": Infinity, "learning_rate": 0.0, "loss": 37.6069, "step": 5 }, { "ce_ib": 63.31033706665039, "ce_orig": 0.5193647146224976, "epoch": 0.0014379178948882019, "kl_loss": 3829.75732421875, "loss_ib": 38.30390167236328, "step": 5 }, { "ce_ib": 64.82113647460938, "ce_orig": 0.9080048203468323, "epoch": 0.0014379178948882019, "kl_loss": 4034.60400390625, "loss_ib": 40.35251998901367, "step": 5 }, { "ce_ib": 67.75746154785156, "ce_orig": 1.7583141326904297, "epoch": 0.0014379178948882019, "kl_loss": 3362.895751953125, "loss_ib": 33.6357307434082, "step": 5 }, { "ce_ib": 65.55052947998047, "ce_orig": 1.0019645690917969, "epoch": 0.0014379178948882019, "kl_loss": 3561.7119140625, "loss_ib": 35.62367248535156, "step": 5 }, { "ce_ib": 65.5093765258789, "ce_orig": 1.2022827863693237, "epoch": 0.0017255014738658423, "kl_loss": 3854.793212890625, "loss_ib": 38.554481506347656, "step": 6 }, { "ce_ib": 63.95633316040039, "ce_orig": 0.5561846494674683, "epoch": 0.0017255014738658423, "kl_loss": 3231.163818359375, "loss_ib": 32.31803512573242, "step": 6 }, { "ce_ib": 66.91143798828125, "ce_orig": 1.007911205291748, "epoch": 0.0017255014738658423, "kl_loss": 3694.936767578125, "loss_ib": 36.956058502197266, "step": 6 }, { "ce_ib": 65.86326599121094, "ce_orig": 1.1325939893722534, "epoch": 0.0017255014738658423, "kl_loss": 3653.87255859375, "loss_ib": 36.545310974121094, "step": 6 }, { "ce_ib": 61.93317794799805, "ce_orig": 0.3588999807834625, "epoch": 0.0020130850528434826, "kl_loss": 2617.40478515625, "loss_ib": 26.180240631103516, "step": 7 }, { "ce_ib": 66.48375701904297, "ce_orig": 0.9551417231559753, "epoch": 0.0020130850528434826, "kl_loss": 4009.37158203125, "loss_ib": 40.100364685058594, "step": 7 }, { "ce_ib": 64.68529510498047, "ce_orig": 1.3479645252227783, "epoch": 0.0020130850528434826, "kl_loss": 3682.17919921875, "loss_ib": 36.82826232910156, "step": 7 }, { "ce_ib": 65.71565246582031, "ce_orig": 1.4119635820388794, "epoch": 0.0020130850528434826, "kl_loss": 3543.86865234375, "loss_ib": 35.44525909423828, "step": 7 }, { "ce_ib": 64.79589080810547, "ce_orig": 1.1264829635620117, "epoch": 0.002300668631821123, "kl_loss": 3802.966552734375, "loss_ib": 38.0361442565918, "step": 8 }, { "ce_ib": 64.57544708251953, "ce_orig": 0.8281353712081909, "epoch": 0.002300668631821123, "kl_loss": 4064.0234375, "loss_ib": 40.646690368652344, "step": 8 }, { "ce_ib": 64.70269012451172, "ce_orig": 0.8244958519935608, "epoch": 0.002300668631821123, "kl_loss": 3695.80029296875, "loss_ib": 36.964473724365234, "step": 8 }, { "ce_ib": 66.23006439208984, "ce_orig": 0.7464499473571777, "epoch": 0.002300668631821123, "kl_loss": 3909.509765625, "loss_ib": 39.10171890258789, "step": 8 }, { "ce_ib": 66.00849151611328, "ce_orig": 1.2234286069869995, "epoch": 0.0025882522107987635, "kl_loss": 3269.261962890625, "loss_ib": 32.69921875, "step": 9 }, { "ce_ib": 61.78355407714844, "ce_orig": 0.6015470623970032, "epoch": 0.0025882522107987635, "kl_loss": 3815.06103515625, "loss_ib": 38.15678787231445, "step": 9 }, { "ce_ib": 61.84153747558594, "ce_orig": 0.6827983856201172, "epoch": 0.0025882522107987635, "kl_loss": 3885.240966796875, "loss_ib": 38.85859298706055, "step": 9 }, { "ce_ib": 66.06260681152344, "ce_orig": 1.3108824491500854, "epoch": 0.0025882522107987635, "kl_loss": 3949.405029296875, "loss_ib": 39.50065612792969, "step": 9 }, { "epoch": 0.0028758357897764038, "grad_norm": 518.9179077148438, "learning_rate": 6.369426751592357e-07, "loss": 37.6918, "step": 10 }, { "ce_ib": 64.02448272705078, "ce_orig": 0.762144923210144, "epoch": 0.0028758357897764038, "kl_loss": 3554.281005859375, "loss_ib": 35.54920959472656, "step": 10 }, { "ce_ib": 68.01136016845703, "ce_orig": 1.6496213674545288, "epoch": 0.0028758357897764038, "kl_loss": 3769.318359375, "loss_ib": 37.69998550415039, "step": 10 }, { "ce_ib": 68.6688003540039, "ce_orig": 1.7943211793899536, "epoch": 0.0028758357897764038, "kl_loss": 3359.124267578125, "loss_ib": 33.59811019897461, "step": 10 }, { "ce_ib": 66.47740936279297, "ce_orig": 0.9888946413993835, "epoch": 0.0028758357897764038, "kl_loss": 3657.010009765625, "loss_ib": 36.57674789428711, "step": 10 }, { "ce_ib": 68.97245788574219, "ce_orig": 1.853747844696045, "epoch": 0.003163419368754044, "kl_loss": 3813.30908203125, "loss_ib": 38.13998794555664, "step": 11 }, { "ce_ib": 66.31513214111328, "ce_orig": 1.50633704662323, "epoch": 0.003163419368754044, "kl_loss": 3285.7900390625, "loss_ib": 32.86452865600586, "step": 11 }, { "ce_ib": 63.428436279296875, "ce_orig": 0.9150334000587463, "epoch": 0.003163419368754044, "kl_loss": 3867.107421875, "loss_ib": 38.67741775512695, "step": 11 }, { "ce_ib": 64.99458312988281, "ce_orig": 0.8206988573074341, "epoch": 0.003163419368754044, "kl_loss": 1840.817626953125, "loss_ib": 18.414674758911133, "step": 11 }, { "ce_ib": 64.90898132324219, "ce_orig": 1.1344208717346191, "epoch": 0.0034510029477316847, "kl_loss": 3756.06201171875, "loss_ib": 37.56711196899414, "step": 12 }, { "ce_ib": 65.14974975585938, "ce_orig": 0.8449010848999023, "epoch": 0.0034510029477316847, "kl_loss": 3669.84326171875, "loss_ib": 36.70494842529297, "step": 12 }, { "ce_ib": 61.738800048828125, "ce_orig": 0.8912803530693054, "epoch": 0.0034510029477316847, "kl_loss": 3856.634765625, "loss_ib": 38.5725212097168, "step": 12 }, { "ce_ib": 62.223426818847656, "ce_orig": 0.6894405484199524, "epoch": 0.0034510029477316847, "kl_loss": 3847.307373046875, "loss_ib": 38.47929763793945, "step": 12 }, { "ce_ib": 62.734622955322266, "ce_orig": 0.8210228085517883, "epoch": 0.003738586526709325, "kl_loss": 4047.759765625, "loss_ib": 40.48387145996094, "step": 13 }, { "ce_ib": 63.48801040649414, "ce_orig": 0.6192799806594849, "epoch": 0.003738586526709325, "kl_loss": 3207.78173828125, "loss_ib": 32.084163665771484, "step": 13 }, { "ce_ib": 63.36425018310547, "ce_orig": 0.8307191729545593, "epoch": 0.003738586526709325, "kl_loss": 4154.55859375, "loss_ib": 41.55192184448242, "step": 13 }, { "ce_ib": 63.72712326049805, "ce_orig": 0.6353437304496765, "epoch": 0.003738586526709325, "kl_loss": 3861.010009765625, "loss_ib": 38.61647033691406, "step": 13 }, { "ce_ib": 63.29721450805664, "ce_orig": 1.0746912956237793, "epoch": 0.004026170105686965, "kl_loss": 3788.18603515625, "loss_ib": 37.88819122314453, "step": 14 }, { "ce_ib": 64.876708984375, "ce_orig": 0.2551986575126648, "epoch": 0.004026170105686965, "kl_loss": 3221.554931640625, "loss_ib": 32.2220344543457, "step": 14 }, { "ce_ib": 63.66843032836914, "ce_orig": 0.9092416763305664, "epoch": 0.004026170105686965, "kl_loss": 4153.7578125, "loss_ib": 41.5439453125, "step": 14 }, { "ce_ib": 62.37735366821289, "ce_orig": 0.4772454798221588, "epoch": 0.004026170105686965, "kl_loss": 3842.333984375, "loss_ib": 38.4295768737793, "step": 14 }, { "epoch": 0.004313753684664605, "grad_norm": 522.8844604492188, "learning_rate": 1.4331210191082802e-06, "loss": 37.6292, "step": 15 }, { "ce_ib": 65.9225845336914, "ce_orig": 1.2483989000320435, "epoch": 0.004313753684664605, "kl_loss": 3718.763427734375, "loss_ib": 37.1942253112793, "step": 15 }, { "ce_ib": 62.323360443115234, "ce_orig": 0.6228176951408386, "epoch": 0.004313753684664605, "kl_loss": 3593.427490234375, "loss_ib": 35.94050598144531, "step": 15 }, { "ce_ib": 63.397438049316406, "ce_orig": 1.2859151363372803, "epoch": 0.004313753684664605, "kl_loss": 4189.4609375, "loss_ib": 41.90094757080078, "step": 15 }, { "ce_ib": 63.35916519165039, "ce_orig": 0.7082123160362244, "epoch": 0.004313753684664605, "kl_loss": 3782.929443359375, "loss_ib": 37.835628509521484, "step": 15 }, { "ce_ib": 63.69921112060547, "ce_orig": 0.7915922999382019, "epoch": 0.004601337263642246, "kl_loss": 3295.76953125, "loss_ib": 32.96406555175781, "step": 16 }, { "ce_ib": 64.55254364013672, "ce_orig": 1.4573107957839966, "epoch": 0.004601337263642246, "kl_loss": 3830.550537109375, "loss_ib": 38.31195831298828, "step": 16 }, { "ce_ib": 63.20068359375, "ce_orig": 0.9544379115104675, "epoch": 0.004601337263642246, "kl_loss": 3457.2080078125, "loss_ib": 34.578399658203125, "step": 16 }, { "ce_ib": 67.24832153320312, "ce_orig": 0.8406115174293518, "epoch": 0.004601337263642246, "kl_loss": 4083.5341796875, "loss_ib": 40.842063903808594, "step": 16 }, { "ce_ib": 66.60543060302734, "ce_orig": 1.3419269323349, "epoch": 0.004888920842619887, "kl_loss": 3605.4677734375, "loss_ib": 36.061336517333984, "step": 17 }, { "ce_ib": 62.604434967041016, "ce_orig": 0.6389816999435425, "epoch": 0.004888920842619887, "kl_loss": 4083.78759765625, "loss_ib": 40.84413528442383, "step": 17 }, { "ce_ib": 64.72972106933594, "ce_orig": 1.176672101020813, "epoch": 0.004888920842619887, "kl_loss": 1900.025634765625, "loss_ib": 19.006729125976562, "step": 17 }, { "ce_ib": 65.18509674072266, "ce_orig": 1.2524960041046143, "epoch": 0.004888920842619887, "kl_loss": 3951.653076171875, "loss_ib": 39.523048400878906, "step": 17 }, { "ce_ib": 64.49193572998047, "ce_orig": 1.1009666919708252, "epoch": 0.005176504421597527, "kl_loss": 3485.996826171875, "loss_ib": 34.866416931152344, "step": 18 }, { "ce_ib": 61.90851974487305, "ce_orig": 0.4805839955806732, "epoch": 0.005176504421597527, "kl_loss": 3180.7490234375, "loss_ib": 31.81368064880371, "step": 18 }, { "ce_ib": 65.22083282470703, "ce_orig": 0.80530846118927, "epoch": 0.005176504421597527, "kl_loss": 3836.34423828125, "loss_ib": 38.36996078491211, "step": 18 }, { "ce_ib": 65.64443969726562, "ce_orig": 1.2098023891448975, "epoch": 0.005176504421597527, "kl_loss": 3608.783203125, "loss_ib": 36.09439468383789, "step": 18 }, { "ce_ib": 64.61073303222656, "ce_orig": 1.073931097984314, "epoch": 0.005464088000575167, "kl_loss": 3759.63671875, "loss_ib": 37.60282516479492, "step": 19 }, { "ce_ib": 66.11485290527344, "ce_orig": 1.3443665504455566, "epoch": 0.005464088000575167, "kl_loss": 3318.16650390625, "loss_ib": 33.18827438354492, "step": 19 }, { "ce_ib": 66.71015167236328, "ce_orig": 0.8358739018440247, "epoch": 0.005464088000575167, "kl_loss": 4202.9921875, "loss_ib": 42.036590576171875, "step": 19 }, { "ce_ib": 67.69292449951172, "ce_orig": 1.7301944494247437, "epoch": 0.005464088000575167, "kl_loss": 3555.893310546875, "loss_ib": 35.56570053100586, "step": 19 }, { "epoch": 0.0057516715795528075, "grad_norm": 523.6597900390625, "learning_rate": 2.229299363057325e-06, "loss": 38.0114, "step": 20 }, { "ce_ib": 63.84000015258789, "ce_orig": 0.7589442729949951, "epoch": 0.0057516715795528075, "kl_loss": 4097.67724609375, "loss_ib": 40.983154296875, "step": 20 }, { "ce_ib": 62.5760612487793, "ce_orig": 0.6316663026809692, "epoch": 0.0057516715795528075, "kl_loss": 3378.1162109375, "loss_ib": 33.787418365478516, "step": 20 }, { "ce_ib": 64.90914154052734, "ce_orig": 0.8841529488563538, "epoch": 0.0057516715795528075, "kl_loss": 4190.35009765625, "loss_ib": 41.90998840332031, "step": 20 }, { "ce_ib": 63.49992370605469, "ce_orig": 1.1218868494033813, "epoch": 0.0057516715795528075, "kl_loss": 3893.951171875, "loss_ib": 38.94586181640625, "step": 20 }, { "ce_ib": 62.81148147583008, "ce_orig": 0.7255597710609436, "epoch": 0.006039255158530448, "kl_loss": 4084.71142578125, "loss_ib": 40.8533935546875, "step": 21 }, { "ce_ib": 62.18263244628906, "ce_orig": 0.6901943683624268, "epoch": 0.006039255158530448, "kl_loss": 3732.931396484375, "loss_ib": 37.335533142089844, "step": 21 }, { "ce_ib": 64.20355987548828, "ce_orig": 1.0124316215515137, "epoch": 0.006039255158530448, "kl_loss": 3761.3251953125, "loss_ib": 37.61967086791992, "step": 21 }, { "ce_ib": 61.63228988647461, "ce_orig": 0.5279907584190369, "epoch": 0.006039255158530448, "kl_loss": 3691.64111328125, "loss_ib": 36.92257308959961, "step": 21 }, { "ce_ib": 62.56758499145508, "ce_orig": 0.7798469066619873, "epoch": 0.006326838737508088, "kl_loss": 3670.70166015625, "loss_ib": 36.71327209472656, "step": 22 }, { "ce_ib": 63.57075881958008, "ce_orig": 0.8365420699119568, "epoch": 0.006326838737508088, "kl_loss": 3658.580322265625, "loss_ib": 36.592159271240234, "step": 22 }, { "ce_ib": 61.62807083129883, "ce_orig": 0.5540810823440552, "epoch": 0.006326838737508088, "kl_loss": 3681.03662109375, "loss_ib": 36.8165283203125, "step": 22 }, { "ce_ib": 64.64292907714844, "ce_orig": 1.0211745500564575, "epoch": 0.006326838737508088, "kl_loss": 3909.70458984375, "loss_ib": 39.10350799560547, "step": 22 }, { "ce_ib": 63.90407180786133, "ce_orig": 1.0038657188415527, "epoch": 0.006614422316485728, "kl_loss": 3516.5341796875, "loss_ib": 35.17173385620117, "step": 23 }, { "ce_ib": 64.3149642944336, "ce_orig": 1.43198823928833, "epoch": 0.006614422316485728, "kl_loss": 3473.03955078125, "loss_ib": 34.73682403564453, "step": 23 }, { "ce_ib": 65.7113037109375, "ce_orig": 1.3454030752182007, "epoch": 0.006614422316485728, "kl_loss": 3446.73095703125, "loss_ib": 34.473880767822266, "step": 23 }, { "ce_ib": 64.66767120361328, "ce_orig": 1.1042531728744507, "epoch": 0.006614422316485728, "kl_loss": 3285.74560546875, "loss_ib": 32.863922119140625, "step": 23 }, { "ce_ib": 62.60567092895508, "ce_orig": 0.8803403973579407, "epoch": 0.006902005895463369, "kl_loss": 4045.211669921875, "loss_ib": 40.4583740234375, "step": 24 }, { "ce_ib": 62.218082427978516, "ce_orig": 0.5355222225189209, "epoch": 0.006902005895463369, "kl_loss": 2061.3427734375, "loss_ib": 20.619647979736328, "step": 24 }, { "ce_ib": 62.739349365234375, "ce_orig": 0.7724053263664246, "epoch": 0.006902005895463369, "kl_loss": 3955.72021484375, "loss_ib": 39.5634765625, "step": 24 }, { "ce_ib": 64.84529876708984, "ce_orig": 0.9221442341804504, "epoch": 0.006902005895463369, "kl_loss": 4072.906982421875, "loss_ib": 40.73555374145508, "step": 24 }, { "epoch": 0.00718958947444101, "grad_norm": 500.6357116699219, "learning_rate": 3.0254777070063695e-06, "loss": 37.5291, "step": 25 }, { "ce_ib": 64.90079498291016, "ce_orig": 1.3044438362121582, "epoch": 0.00718958947444101, "kl_loss": 3491.833984375, "loss_ib": 34.924827575683594, "step": 25 }, { "ce_ib": 60.71520233154297, "ce_orig": 0.4326849579811096, "epoch": 0.00718958947444101, "kl_loss": 3640.559326171875, "loss_ib": 36.41166305541992, "step": 25 }, { "ce_ib": 64.01187896728516, "ce_orig": 1.0306893587112427, "epoch": 0.00718958947444101, "kl_loss": 3960.2236328125, "loss_ib": 39.60863494873047, "step": 25 }, { "ce_ib": 64.18307495117188, "ce_orig": 0.9839837551116943, "epoch": 0.00718958947444101, "kl_loss": 3976.920654296875, "loss_ib": 39.7756233215332, "step": 25 }, { "ce_ib": 64.72349548339844, "ce_orig": 1.4616881608963013, "epoch": 0.00747717305341865, "kl_loss": 3761.33935546875, "loss_ib": 37.61986541748047, "step": 26 }, { "ce_ib": 64.97052764892578, "ce_orig": 0.7502491474151611, "epoch": 0.00747717305341865, "kl_loss": 3893.336669921875, "loss_ib": 38.93986129760742, "step": 26 }, { "ce_ib": 65.82380676269531, "ce_orig": 1.34544038772583, "epoch": 0.00747717305341865, "kl_loss": 3513.64404296875, "loss_ib": 35.14302062988281, "step": 26 }, { "ce_ib": 65.6162109375, "ce_orig": 1.0590736865997314, "epoch": 0.00747717305341865, "kl_loss": 3592.0341796875, "loss_ib": 35.926902770996094, "step": 26 }, { "ce_ib": 60.9577522277832, "ce_orig": 0.7530563473701477, "epoch": 0.00776475663239629, "kl_loss": 3584.533203125, "loss_ib": 35.8514289855957, "step": 27 }, { "ce_ib": 62.96725845336914, "ce_orig": 0.7575862407684326, "epoch": 0.00776475663239629, "kl_loss": 4020.78271484375, "loss_ib": 40.2141227722168, "step": 27 }, { "ce_ib": 63.01191329956055, "ce_orig": 0.8695152997970581, "epoch": 0.00776475663239629, "kl_loss": 3717.216064453125, "loss_ib": 37.178462982177734, "step": 27 }, { "ce_ib": 61.84136199951172, "ce_orig": 0.5044524669647217, "epoch": 0.00776475663239629, "kl_loss": 3559.84326171875, "loss_ib": 35.6046142578125, "step": 27 }, { "ce_ib": 62.60879898071289, "ce_orig": 0.7411525249481201, "epoch": 0.00805234021137393, "kl_loss": 3949.431640625, "loss_ib": 39.50057601928711, "step": 28 }, { "ce_ib": 63.889503479003906, "ce_orig": 0.7678407430648804, "epoch": 0.00805234021137393, "kl_loss": 3446.158447265625, "loss_ib": 34.46797180175781, "step": 28 }, { "ce_ib": 64.12403869628906, "ce_orig": 1.3409479856491089, "epoch": 0.00805234021137393, "kl_loss": 3590.536376953125, "loss_ib": 35.91177749633789, "step": 28 }, { "ce_ib": 67.9863510131836, "ce_orig": 1.4907015562057495, "epoch": 0.00805234021137393, "kl_loss": 4102.9951171875, "loss_ib": 41.036746978759766, "step": 28 }, { "ce_ib": 63.33028793334961, "ce_orig": 0.7299618721008301, "epoch": 0.008339923790351571, "kl_loss": 3933.06591796875, "loss_ib": 39.33699035644531, "step": 29 }, { "ce_ib": 65.11859893798828, "ce_orig": 1.07808256149292, "epoch": 0.008339923790351571, "kl_loss": 3267.3017578125, "loss_ib": 32.679527282714844, "step": 29 }, { "ce_ib": 61.750606536865234, "ce_orig": 1.5331333875656128, "epoch": 0.008339923790351571, "kl_loss": 3922.66748046875, "loss_ib": 39.23284912109375, "step": 29 }, { "ce_ib": 63.025821685791016, "ce_orig": 0.9248456954956055, "epoch": 0.008339923790351571, "kl_loss": 3479.8994140625, "loss_ib": 34.8052978515625, "step": 29 }, { "epoch": 0.00862750736932921, "grad_norm": 531.7625732421875, "learning_rate": 3.821656050955414e-06, "loss": 37.9283, "step": 30 }, { "ce_ib": 63.19704055786133, "ce_orig": 0.813347339630127, "epoch": 0.00862750736932921, "kl_loss": 3683.62451171875, "loss_ib": 36.84256362915039, "step": 30 }, { "ce_ib": 64.78852844238281, "ce_orig": 1.25947105884552, "epoch": 0.00862750736932921, "kl_loss": 3672.6279296875, "loss_ib": 36.732757568359375, "step": 30 }, { "ce_ib": 65.48835754394531, "ce_orig": 1.5832844972610474, "epoch": 0.00862750736932921, "kl_loss": 3535.34765625, "loss_ib": 35.360023498535156, "step": 30 }, { "ce_ib": 67.59868621826172, "ce_orig": 1.2523659467697144, "epoch": 0.00862750736932921, "kl_loss": 3592.551513671875, "loss_ib": 35.932273864746094, "step": 30 }, { "ce_ib": 65.58070373535156, "ce_orig": 1.3204323053359985, "epoch": 0.008915090948306852, "kl_loss": 3685.355224609375, "loss_ib": 36.860107421875, "step": 31 }, { "ce_ib": 65.22953033447266, "ce_orig": 1.7766001224517822, "epoch": 0.008915090948306852, "kl_loss": 3778.63427734375, "loss_ib": 37.79286575317383, "step": 31 }, { "ce_ib": 63.3836555480957, "ce_orig": 1.204979419708252, "epoch": 0.008915090948306852, "kl_loss": 3684.710693359375, "loss_ib": 36.85344314575195, "step": 31 }, { "ce_ib": 62.92445755004883, "ce_orig": 0.7449155449867249, "epoch": 0.008915090948306852, "kl_loss": 3957.828857421875, "loss_ib": 39.58457946777344, "step": 31 }, { "ce_ib": 63.693058013916016, "ce_orig": 0.963614821434021, "epoch": 0.009202674527284491, "kl_loss": 3871.184814453125, "loss_ib": 38.71821594238281, "step": 32 }, { "ce_ib": 62.92957305908203, "ce_orig": 0.699960470199585, "epoch": 0.009202674527284491, "kl_loss": 3611.31103515625, "loss_ib": 36.11940383911133, "step": 32 }, { "ce_ib": 61.641639709472656, "ce_orig": 0.5809459686279297, "epoch": 0.009202674527284491, "kl_loss": 3945.29052734375, "loss_ib": 39.459068298339844, "step": 32 }, { "ce_ib": 61.629180908203125, "ce_orig": 0.4764775037765503, "epoch": 0.009202674527284491, "kl_loss": 3752.23681640625, "loss_ib": 37.52853012084961, "step": 32 }, { "ce_ib": 65.62612915039062, "ce_orig": 1.0748307704925537, "epoch": 0.009490258106262132, "kl_loss": 3731.794921875, "loss_ib": 37.32451248168945, "step": 33 }, { "ce_ib": 61.40937423706055, "ce_orig": 1.1108014583587646, "epoch": 0.009490258106262132, "kl_loss": 3651.0771484375, "loss_ib": 36.516910552978516, "step": 33 }, { "ce_ib": 59.90447235107422, "ce_orig": 0.32240188121795654, "epoch": 0.009490258106262132, "kl_loss": 3386.24365234375, "loss_ib": 33.86842727661133, "step": 33 }, { "ce_ib": 62.98430633544922, "ce_orig": 1.2453433275222778, "epoch": 0.009490258106262132, "kl_loss": 3598.07275390625, "loss_ib": 35.98702621459961, "step": 33 }, { "ce_ib": 63.15117263793945, "ce_orig": 0.7339913249015808, "epoch": 0.009777841685239774, "kl_loss": 2625.630859375, "loss_ib": 26.262624740600586, "step": 34 }, { "ce_ib": 61.62659454345703, "ce_orig": 1.0284781455993652, "epoch": 0.009777841685239774, "kl_loss": 3689.47705078125, "loss_ib": 36.90093231201172, "step": 34 }, { "ce_ib": 62.00101852416992, "ce_orig": 0.7457196116447449, "epoch": 0.009777841685239774, "kl_loss": 3870.28466796875, "loss_ib": 38.70904541015625, "step": 34 }, { "ce_ib": 60.758033752441406, "ce_orig": 0.4431888163089752, "epoch": 0.009777841685239774, "kl_loss": 2776.04248046875, "loss_ib": 27.76650047302246, "step": 34 }, { "epoch": 0.010065425264217413, "grad_norm": 514.6280517578125, "learning_rate": 4.6178343949044585e-06, "loss": 36.6953, "step": 35 }, { "ce_ib": 61.88233947753906, "ce_orig": 0.742504894733429, "epoch": 0.010065425264217413, "kl_loss": 3676.15625, "loss_ib": 36.76774978637695, "step": 35 }, { "ce_ib": 65.21971130371094, "ce_orig": 1.4801323413848877, "epoch": 0.010065425264217413, "kl_loss": 3239.951171875, "loss_ib": 32.40603256225586, "step": 35 }, { "ce_ib": 61.43843460083008, "ce_orig": 0.8911157846450806, "epoch": 0.010065425264217413, "kl_loss": 3907.4306640625, "loss_ib": 39.08045196533203, "step": 35 }, { "ce_ib": 60.8431510925293, "ce_orig": 0.6813702583312988, "epoch": 0.010065425264217413, "kl_loss": 3710.92919921875, "loss_ib": 37.11537551879883, "step": 35 }, { "ce_ib": 62.07615280151367, "ce_orig": 0.9490892887115479, "epoch": 0.010353008843195054, "kl_loss": 3473.35009765625, "loss_ib": 34.739707946777344, "step": 36 }, { "ce_ib": 63.5875358581543, "ce_orig": 1.1264761686325073, "epoch": 0.010353008843195054, "kl_loss": 3691.65673828125, "loss_ib": 36.92292785644531, "step": 36 }, { "ce_ib": 61.989559173583984, "ce_orig": 0.7521851062774658, "epoch": 0.010353008843195054, "kl_loss": 3681.02392578125, "loss_ib": 36.816436767578125, "step": 36 }, { "ce_ib": 66.18658447265625, "ce_orig": 1.4330860376358032, "epoch": 0.010353008843195054, "kl_loss": 3735.92529296875, "loss_ib": 37.36587142944336, "step": 36 }, { "ce_ib": 61.510005950927734, "ce_orig": 0.6856619119644165, "epoch": 0.010640592422172693, "kl_loss": 3193.4365234375, "loss_ib": 31.940513610839844, "step": 37 }, { "ce_ib": 65.34510040283203, "ce_orig": 1.6867130994796753, "epoch": 0.010640592422172693, "kl_loss": 3602.250244140625, "loss_ib": 36.02903747558594, "step": 37 }, { "ce_ib": 63.198848724365234, "ce_orig": 1.003406286239624, "epoch": 0.010640592422172693, "kl_loss": 3923.912109375, "loss_ib": 39.24544143676758, "step": 37 }, { "ce_ib": 63.12528610229492, "ce_orig": 1.0664888620376587, "epoch": 0.010640592422172693, "kl_loss": 3344.81298828125, "loss_ib": 33.45444107055664, "step": 37 }, { "ce_ib": 61.980186462402344, "ce_orig": 0.6754278540611267, "epoch": 0.010928176001150335, "kl_loss": 3765.134033203125, "loss_ib": 37.65753936767578, "step": 38 }, { "ce_ib": 64.89917755126953, "ce_orig": 1.3892360925674438, "epoch": 0.010928176001150335, "kl_loss": 3431.3056640625, "loss_ib": 34.31954574584961, "step": 38 }, { "ce_ib": 63.881900787353516, "ce_orig": 0.9926798343658447, "epoch": 0.010928176001150335, "kl_loss": 3779.434814453125, "loss_ib": 37.80073547363281, "step": 38 }, { "ce_ib": 61.26738357543945, "ce_orig": 0.5064423084259033, "epoch": 0.010928176001150335, "kl_loss": 3226.73974609375, "loss_ib": 32.27352523803711, "step": 38 }, { "ce_ib": 61.48027420043945, "ce_orig": 0.6444438099861145, "epoch": 0.011215759580127974, "kl_loss": 3812.853271484375, "loss_ib": 38.13467788696289, "step": 39 }, { "ce_ib": 65.14291381835938, "ce_orig": 1.157513976097107, "epoch": 0.011215759580127974, "kl_loss": 3730.44921875, "loss_ib": 37.311004638671875, "step": 39 }, { "ce_ib": 65.04698944091797, "ce_orig": 1.4464482069015503, "epoch": 0.011215759580127974, "kl_loss": 3499.406005859375, "loss_ib": 35.00056457519531, "step": 39 }, { "ce_ib": 61.870948791503906, "ce_orig": 0.7682390213012695, "epoch": 0.011215759580127974, "kl_loss": 3903.7294921875, "loss_ib": 39.043479919433594, "step": 39 }, { "epoch": 0.011503343159105615, "grad_norm": 530.5418701171875, "learning_rate": 5.414012738853504e-06, "loss": 36.8859, "step": 40 }, { "ce_ib": 66.74645233154297, "ce_orig": 1.7853225469589233, "epoch": 0.011503343159105615, "kl_loss": 3331.3544921875, "loss_ib": 33.32021713256836, "step": 40 }, { "ce_ib": 62.318843841552734, "ce_orig": 0.7977343797683716, "epoch": 0.011503343159105615, "kl_loss": 3502.8125, "loss_ib": 35.034358978271484, "step": 40 }, { "ce_ib": 63.681610107421875, "ce_orig": 1.3478271961212158, "epoch": 0.011503343159105615, "kl_loss": 3501.63134765625, "loss_ib": 35.02267837524414, "step": 40 }, { "ce_ib": 62.9583740234375, "ce_orig": 1.0469328165054321, "epoch": 0.011503343159105615, "kl_loss": 3721.776611328125, "loss_ib": 37.22406005859375, "step": 40 }, { "ce_ib": 61.38816833496094, "ce_orig": 0.7066026926040649, "epoch": 0.011790926738083256, "kl_loss": 3805.5771484375, "loss_ib": 38.06190872192383, "step": 41 }, { "ce_ib": 61.03729248046875, "ce_orig": 0.7563859820365906, "epoch": 0.011790926738083256, "kl_loss": 3660.0556640625, "loss_ib": 36.606658935546875, "step": 41 }, { "ce_ib": 63.25761795043945, "ce_orig": 0.8998059034347534, "epoch": 0.011790926738083256, "kl_loss": 3492.48876953125, "loss_ib": 34.93121337890625, "step": 41 }, { "ce_ib": 62.87449264526367, "ce_orig": 0.9313430190086365, "epoch": 0.011790926738083256, "kl_loss": 3241.703125, "loss_ib": 32.423316955566406, "step": 41 }, { "ce_ib": 64.49095916748047, "ce_orig": 1.71138596534729, "epoch": 0.012078510317060896, "kl_loss": 3664.8984375, "loss_ib": 36.655433654785156, "step": 42 }, { "ce_ib": 61.09724807739258, "ce_orig": 0.7595378756523132, "epoch": 0.012078510317060896, "kl_loss": 3622.4169921875, "loss_ib": 36.230281829833984, "step": 42 }, { "ce_ib": 60.89824676513672, "ce_orig": 0.9210549592971802, "epoch": 0.012078510317060896, "kl_loss": 3331.73388671875, "loss_ib": 33.32342529296875, "step": 42 }, { "ce_ib": 62.15813446044922, "ce_orig": 0.6488374471664429, "epoch": 0.012078510317060896, "kl_loss": 3685.21826171875, "loss_ib": 36.8583984375, "step": 42 }, { "ce_ib": 62.060028076171875, "ce_orig": 0.8468491435050964, "epoch": 0.012366093896038537, "kl_loss": 3631.91064453125, "loss_ib": 36.325313568115234, "step": 43 }, { "ce_ib": 64.66139221191406, "ce_orig": 1.069366693496704, "epoch": 0.012366093896038537, "kl_loss": 3382.873046875, "loss_ib": 33.83519744873047, "step": 43 }, { "ce_ib": 59.3759651184082, "ce_orig": 0.6913302540779114, "epoch": 0.012366093896038537, "kl_loss": 3886.6796875, "loss_ib": 38.87273406982422, "step": 43 }, { "ce_ib": 63.80333709716797, "ce_orig": 1.2420175075531006, "epoch": 0.012366093896038537, "kl_loss": 3315.640625, "loss_ib": 33.162784576416016, "step": 43 }, { "ce_ib": 61.69696044921875, "ce_orig": 0.9505507349967957, "epoch": 0.012653677475016176, "kl_loss": 3327.21044921875, "loss_ib": 33.27827453613281, "step": 44 }, { "ce_ib": 60.231571197509766, "ce_orig": 1.0403425693511963, "epoch": 0.012653677475016176, "kl_loss": 3099.7314453125, "loss_ib": 31.00333595275879, "step": 44 }, { "ce_ib": 60.59477996826172, "ce_orig": 0.9732199907302856, "epoch": 0.012653677475016176, "kl_loss": 3785.45654296875, "loss_ib": 37.86062240600586, "step": 44 }, { "ce_ib": 60.5795783996582, "ce_orig": 0.9181808233261108, "epoch": 0.012653677475016176, "kl_loss": 3470.03466796875, "loss_ib": 34.70640182495117, "step": 44 }, { "epoch": 0.012941261053993817, "grad_norm": 476.64434814453125, "learning_rate": 6.210191082802548e-06, "loss": 35.3798, "step": 45 }, { "ce_ib": 61.55487060546875, "ce_orig": 1.3028727769851685, "epoch": 0.012941261053993817, "kl_loss": 3647.279541015625, "loss_ib": 36.47895050048828, "step": 45 }, { "ce_ib": 60.31386947631836, "ce_orig": 0.6792593598365784, "epoch": 0.012941261053993817, "kl_loss": 3385.7255859375, "loss_ib": 33.863285064697266, "step": 45 }, { "ce_ib": 61.40266036987305, "ce_orig": 0.9505258798599243, "epoch": 0.012941261053993817, "kl_loss": 3687.73779296875, "loss_ib": 36.88351821899414, "step": 45 }, { "ce_ib": 62.62788009643555, "ce_orig": 0.7607139945030212, "epoch": 0.012941261053993817, "kl_loss": 3367.47412109375, "loss_ib": 33.68100357055664, "step": 45 }, { "ce_ib": 60.83255386352539, "ce_orig": 1.0399366617202759, "epoch": 0.013228844632971457, "kl_loss": 3394.5810546875, "loss_ib": 33.9518928527832, "step": 46 }, { "ce_ib": 61.447139739990234, "ce_orig": 0.8051762580871582, "epoch": 0.013228844632971457, "kl_loss": 3173.857421875, "loss_ib": 31.744718551635742, "step": 46 }, { "ce_ib": 61.36168670654297, "ce_orig": 1.1020334959030151, "epoch": 0.013228844632971457, "kl_loss": 3414.359130859375, "loss_ib": 34.14972686767578, "step": 46 }, { "ce_ib": 60.41455841064453, "ce_orig": 0.706063449382782, "epoch": 0.013228844632971457, "kl_loss": 3687.080078125, "loss_ib": 36.8768424987793, "step": 46 }, { "ce_ib": 60.49672317504883, "ce_orig": 0.8405731320381165, "epoch": 0.013516428211949098, "kl_loss": 3867.85693359375, "loss_ib": 38.68461990356445, "step": 47 }, { "ce_ib": 63.74329376220703, "ce_orig": 0.8466535806655884, "epoch": 0.013516428211949098, "kl_loss": 3611.955078125, "loss_ib": 36.12592315673828, "step": 47 }, { "ce_ib": 61.18013381958008, "ce_orig": 0.9858855605125427, "epoch": 0.013516428211949098, "kl_loss": 3885.5107421875, "loss_ib": 38.86122512817383, "step": 47 }, { "ce_ib": 65.59097290039062, "ce_orig": 1.7553099393844604, "epoch": 0.013516428211949098, "kl_loss": 3490.478515625, "loss_ib": 34.91134262084961, "step": 47 }, { "ce_ib": 61.62842559814453, "ce_orig": 0.838309109210968, "epoch": 0.013804011790926739, "kl_loss": 3487.0517578125, "loss_ib": 34.876678466796875, "step": 48 }, { "ce_ib": 62.534908294677734, "ce_orig": 1.5411649942398071, "epoch": 0.013804011790926739, "kl_loss": 3555.408203125, "loss_ib": 35.560333251953125, "step": 48 }, { "ce_ib": 61.39102554321289, "ce_orig": 0.5941852927207947, "epoch": 0.013804011790926739, "kl_loss": 3320.55078125, "loss_ib": 33.211647033691406, "step": 48 }, { "ce_ib": 62.17927551269531, "ce_orig": 1.398880958557129, "epoch": 0.013804011790926739, "kl_loss": 2767.198974609375, "loss_ib": 27.678207397460938, "step": 48 }, { "ce_ib": 61.87635803222656, "ce_orig": 1.1401021480560303, "epoch": 0.014091595369904378, "kl_loss": 3533.70703125, "loss_ib": 35.343257904052734, "step": 49 }, { "ce_ib": 59.036781311035156, "ce_orig": 0.7694017291069031, "epoch": 0.014091595369904378, "kl_loss": 3748.14453125, "loss_ib": 37.48734664916992, "step": 49 }, { "ce_ib": 60.804603576660156, "ce_orig": 1.3716927766799927, "epoch": 0.014091595369904378, "kl_loss": 3407.55224609375, "loss_ib": 34.08160400390625, "step": 49 }, { "ce_ib": 60.6622200012207, "ce_orig": 0.6214744448661804, "epoch": 0.014091595369904378, "kl_loss": 3320.9990234375, "loss_ib": 33.21605682373047, "step": 49 }, { "epoch": 0.01437917894888202, "grad_norm": 510.91943359375, "learning_rate": 7.006369426751593e-06, "loss": 35.2805, "step": 50 }, { "ce_ib": 58.74787139892578, "ce_orig": 0.8769705891609192, "epoch": 0.01437917894888202, "kl_loss": 3581.33544921875, "loss_ib": 35.81922912597656, "step": 50 }, { "ce_ib": 57.18757247924805, "ce_orig": 0.699286699295044, "epoch": 0.01437917894888202, "kl_loss": 3327.9033203125, "loss_ib": 33.284751892089844, "step": 50 }, { "ce_ib": 60.32874298095703, "ce_orig": 0.722357451915741, "epoch": 0.01437917894888202, "kl_loss": 3368.121337890625, "loss_ib": 33.6872444152832, "step": 50 }, { "ce_ib": 63.51592254638672, "ce_orig": 1.0477139949798584, "epoch": 0.01437917894888202, "kl_loss": 3434.626708984375, "loss_ib": 34.35261917114258, "step": 50 }, { "ce_ib": 58.714073181152344, "ce_orig": 0.6123059391975403, "epoch": 0.014666762527859659, "kl_loss": 3747.56982421875, "loss_ib": 37.4815673828125, "step": 51 }, { "ce_ib": 61.6097526550293, "ce_orig": 1.2942873239517212, "epoch": 0.014666762527859659, "kl_loss": 3235.971923828125, "loss_ib": 32.36587905883789, "step": 51 }, { "ce_ib": 58.607505798339844, "ce_orig": 0.6153243184089661, "epoch": 0.014666762527859659, "kl_loss": 3752.208984375, "loss_ib": 37.527950286865234, "step": 51 }, { "ce_ib": 60.741729736328125, "ce_orig": 1.3440642356872559, "epoch": 0.014666762527859659, "kl_loss": 3612.9765625, "loss_ib": 36.13583755493164, "step": 51 }, { "ce_ib": 60.87339782714844, "ce_orig": 0.8129587769508362, "epoch": 0.0149543461068373, "kl_loss": 3125.83642578125, "loss_ib": 31.264450073242188, "step": 52 }, { "ce_ib": 58.96531295776367, "ce_orig": 0.9034717082977295, "epoch": 0.0149543461068373, "kl_loss": 3257.168212890625, "loss_ib": 32.57757568359375, "step": 52 }, { "ce_ib": 60.43812942504883, "ce_orig": 0.8096925020217896, "epoch": 0.0149543461068373, "kl_loss": 3082.474853515625, "loss_ib": 30.830793380737305, "step": 52 }, { "ce_ib": 61.23511505126953, "ce_orig": 1.078736424446106, "epoch": 0.0149543461068373, "kl_loss": 3490.707275390625, "loss_ib": 34.9131965637207, "step": 52 }, { "ce_ib": 60.389286041259766, "ce_orig": 1.2757381200790405, "epoch": 0.015241929685814939, "kl_loss": 3353.767578125, "loss_ib": 33.54371643066406, "step": 53 }, { "ce_ib": 57.41773223876953, "ce_orig": 0.552437424659729, "epoch": 0.015241929685814939, "kl_loss": 2717.25927734375, "loss_ib": 27.178335189819336, "step": 53 }, { "ce_ib": 60.19536590576172, "ce_orig": 0.7778604626655579, "epoch": 0.015241929685814939, "kl_loss": 3204.783203125, "loss_ib": 32.05385208129883, "step": 53 }, { "ce_ib": 61.59130859375, "ce_orig": 1.6185189485549927, "epoch": 0.015241929685814939, "kl_loss": 3477.7470703125, "loss_ib": 34.78363037109375, "step": 53 }, { "ce_ib": 63.59449005126953, "ce_orig": 1.4870353937149048, "epoch": 0.01552951326479258, "kl_loss": 3315.589599609375, "loss_ib": 33.162254333496094, "step": 54 }, { "ce_ib": 59.9765625, "ce_orig": 1.258398175239563, "epoch": 0.01552951326479258, "kl_loss": 3485.625, "loss_ib": 34.862247467041016, "step": 54 }, { "ce_ib": 58.29402160644531, "ce_orig": 0.9382989406585693, "epoch": 0.01552951326479258, "kl_loss": 3394.168701171875, "loss_ib": 33.94751739501953, "step": 54 }, { "ce_ib": 58.97043228149414, "ce_orig": 0.6211685538291931, "epoch": 0.01552951326479258, "kl_loss": 3460.42333984375, "loss_ib": 34.610130310058594, "step": 54 }, { "epoch": 0.01581709684377022, "grad_norm": 469.67340087890625, "learning_rate": 7.802547770700637e-06, "loss": 34.1513, "step": 55 }, { "ce_ib": 61.76213073730469, "ce_orig": 0.8650195002555847, "epoch": 0.01581709684377022, "kl_loss": 3174.44775390625, "loss_ib": 31.750654220581055, "step": 55 }, { "ce_ib": 55.92485809326172, "ce_orig": 0.08637077361345291, "epoch": 0.01581709684377022, "kl_loss": 468.1816101074219, "loss_ib": 4.687408447265625, "step": 55 }, { "ce_ib": 59.152156829833984, "ce_orig": 0.9888356328010559, "epoch": 0.01581709684377022, "kl_loss": 3260.65771484375, "loss_ib": 32.612491607666016, "step": 55 }, { "ce_ib": 60.753597259521484, "ce_orig": 0.837508499622345, "epoch": 0.01581709684377022, "kl_loss": 3544.2236328125, "loss_ib": 35.44831085205078, "step": 55 }, { "ce_ib": 56.82107925415039, "ce_orig": 0.8040409684181213, "epoch": 0.01610468042274786, "kl_loss": 3288.75830078125, "loss_ib": 32.89326477050781, "step": 56 }, { "ce_ib": 58.140541076660156, "ce_orig": 0.666872501373291, "epoch": 0.01610468042274786, "kl_loss": 3718.909912109375, "loss_ib": 37.19491195678711, "step": 56 }, { "ce_ib": 59.2910041809082, "ce_orig": 0.9221104979515076, "epoch": 0.01610468042274786, "kl_loss": 3336.389404296875, "loss_ib": 33.36982345581055, "step": 56 }, { "ce_ib": 61.521507263183594, "ce_orig": 1.3518534898757935, "epoch": 0.01610468042274786, "kl_loss": 3092.3486328125, "loss_ib": 30.929637908935547, "step": 56 }, { "ce_ib": 57.95586013793945, "ce_orig": 0.8081279397010803, "epoch": 0.016392264001725502, "kl_loss": 3491.455810546875, "loss_ib": 34.920352935791016, "step": 57 }, { "ce_ib": 58.949745178222656, "ce_orig": 0.5393152236938477, "epoch": 0.016392264001725502, "kl_loss": 3235.858154296875, "loss_ib": 32.36447525024414, "step": 57 }, { "ce_ib": 60.55893325805664, "ce_orig": 0.7738803029060364, "epoch": 0.016392264001725502, "kl_loss": 2924.27783203125, "loss_ib": 29.24883270263672, "step": 57 }, { "ce_ib": 61.02143478393555, "ce_orig": 1.209029197692871, "epoch": 0.016392264001725502, "kl_loss": 3489.797607421875, "loss_ib": 34.904075622558594, "step": 57 }, { "ce_ib": 60.51230239868164, "ce_orig": 1.1623197793960571, "epoch": 0.016679847580703143, "kl_loss": 3124.18798828125, "loss_ib": 31.2479305267334, "step": 58 }, { "ce_ib": 60.99052429199219, "ce_orig": 1.069433569908142, "epoch": 0.016679847580703143, "kl_loss": 3169.855712890625, "loss_ib": 31.704654693603516, "step": 58 }, { "ce_ib": 58.70066452026367, "ce_orig": 1.0279523134231567, "epoch": 0.016679847580703143, "kl_loss": 3483.8056640625, "loss_ib": 34.84392547607422, "step": 58 }, { "ce_ib": 59.15578842163086, "ce_orig": 1.0242782831192017, "epoch": 0.016679847580703143, "kl_loss": 3071.107421875, "loss_ib": 30.716989517211914, "step": 58 }, { "ce_ib": 61.244327545166016, "ce_orig": 1.7360433340072632, "epoch": 0.01696743115968078, "kl_loss": 2984.33984375, "loss_ib": 29.849523544311523, "step": 59 }, { "ce_ib": 60.01206588745117, "ce_orig": 1.2617676258087158, "epoch": 0.01696743115968078, "kl_loss": 3349.006591796875, "loss_ib": 33.49606704711914, "step": 59 }, { "ce_ib": 56.53895568847656, "ce_orig": 0.5960240960121155, "epoch": 0.01696743115968078, "kl_loss": 3249.41357421875, "loss_ib": 32.49979019165039, "step": 59 }, { "ce_ib": 59.71278762817383, "ce_orig": 0.8869993090629578, "epoch": 0.01696743115968078, "kl_loss": 3232.68505859375, "loss_ib": 32.332820892333984, "step": 59 }, { "epoch": 0.01725501473865842, "grad_norm": 486.4937438964844, "learning_rate": 8.598726114649681e-06, "loss": 33.3977, "step": 60 }, { "ce_ib": 58.857635498046875, "ce_orig": 0.7359964847564697, "epoch": 0.01725501473865842, "kl_loss": 3203.08740234375, "loss_ib": 32.03675842285156, "step": 60 }, { "ce_ib": 59.75052261352539, "ce_orig": 1.0773297548294067, "epoch": 0.01725501473865842, "kl_loss": 3154.876953125, "loss_ib": 31.55474281311035, "step": 60 }, { "ce_ib": 57.949344635009766, "ce_orig": 0.8577583432197571, "epoch": 0.01725501473865842, "kl_loss": 3265.8623046875, "loss_ib": 32.6644172668457, "step": 60 }, { "ce_ib": 59.86404037475586, "ce_orig": 1.3723738193511963, "epoch": 0.01725501473865842, "kl_loss": 2843.7080078125, "loss_ib": 28.443065643310547, "step": 60 }, { "ce_ib": 56.99949645996094, "ce_orig": 0.5773953199386597, "epoch": 0.017542598317636063, "kl_loss": 3343.131103515625, "loss_ib": 33.43701171875, "step": 61 }, { "ce_ib": 60.948787689208984, "ce_orig": 1.6039363145828247, "epoch": 0.017542598317636063, "kl_loss": 3304.048583984375, "loss_ib": 33.04657745361328, "step": 61 }, { "ce_ib": 58.39208221435547, "ce_orig": 0.984937310218811, "epoch": 0.017542598317636063, "kl_loss": 3363.2353515625, "loss_ib": 33.63819122314453, "step": 61 }, { "ce_ib": 59.0418586730957, "ce_orig": 0.783109188079834, "epoch": 0.017542598317636063, "kl_loss": 3394.3154296875, "loss_ib": 33.949058532714844, "step": 61 }, { "ce_ib": 62.10023880004883, "ce_orig": 1.8530871868133545, "epoch": 0.017830181896613704, "kl_loss": 3175.18505859375, "loss_ib": 31.758060455322266, "step": 62 }, { "ce_ib": 56.835514068603516, "ce_orig": 0.7488876581192017, "epoch": 0.017830181896613704, "kl_loss": 2187.16943359375, "loss_ib": 21.877376556396484, "step": 62 }, { "ce_ib": 60.125152587890625, "ce_orig": 1.4274426698684692, "epoch": 0.017830181896613704, "kl_loss": 3222.76611328125, "loss_ib": 32.233673095703125, "step": 62 }, { "ce_ib": 55.86289978027344, "ce_orig": 0.7154338955879211, "epoch": 0.017830181896613704, "kl_loss": 3421.8095703125, "loss_ib": 34.22368240356445, "step": 62 }, { "ce_ib": 59.97455596923828, "ce_orig": 1.2463781833648682, "epoch": 0.018117765475591345, "kl_loss": 2927.573486328125, "loss_ib": 29.2817325592041, "step": 63 }, { "ce_ib": 58.33196258544922, "ce_orig": 0.5972486734390259, "epoch": 0.018117765475591345, "kl_loss": 3288.707763671875, "loss_ib": 32.89291000366211, "step": 63 }, { "ce_ib": 60.974822998046875, "ce_orig": 1.4676904678344727, "epoch": 0.018117765475591345, "kl_loss": 2948.23388671875, "loss_ib": 29.48843765258789, "step": 63 }, { "ce_ib": 57.45879364013672, "ce_orig": 0.7307599782943726, "epoch": 0.018117765475591345, "kl_loss": 2998.276123046875, "loss_ib": 29.988508224487305, "step": 63 }, { "ce_ib": 57.19486618041992, "ce_orig": 0.7821041345596313, "epoch": 0.018405349054568983, "kl_loss": 3225.396728515625, "loss_ib": 32.25968551635742, "step": 64 }, { "ce_ib": 57.73394775390625, "ce_orig": 0.6754387617111206, "epoch": 0.018405349054568983, "kl_loss": 3085.6650390625, "loss_ib": 30.862422943115234, "step": 64 }, { "ce_ib": 55.39207077026367, "ce_orig": 0.5158528685569763, "epoch": 0.018405349054568983, "kl_loss": 3063.913818359375, "loss_ib": 30.644676208496094, "step": 64 }, { "ce_ib": 57.978118896484375, "ce_orig": 0.9754984974861145, "epoch": 0.018405349054568983, "kl_loss": 3214.08251953125, "loss_ib": 32.14662170410156, "step": 64 }, { "epoch": 0.018692932633546624, "grad_norm": 475.1830139160156, "learning_rate": 9.394904458598726e-06, "loss": 32.2213, "step": 65 }, { "ce_ib": 57.8340950012207, "ce_orig": 0.7973042726516724, "epoch": 0.018692932633546624, "kl_loss": 3016.814208984375, "loss_ib": 30.173925399780273, "step": 65 }, { "ce_ib": 56.048274993896484, "ce_orig": 0.7601141929626465, "epoch": 0.018692932633546624, "kl_loss": 3293.418212890625, "loss_ib": 32.93978500366211, "step": 65 }, { "ce_ib": 55.681297302246094, "ce_orig": 0.9179377555847168, "epoch": 0.018692932633546624, "kl_loss": 3359.49755859375, "loss_ib": 33.60054397583008, "step": 65 }, { "ce_ib": 58.35697937011719, "ce_orig": 1.3632832765579224, "epoch": 0.018692932633546624, "kl_loss": 3379.584228515625, "loss_ib": 33.80167770385742, "step": 65 }, { "ce_ib": 60.778778076171875, "ce_orig": 1.0116430521011353, "epoch": 0.018980516212524265, "kl_loss": 3229.637451171875, "loss_ib": 32.302452087402344, "step": 66 }, { "ce_ib": 56.4047737121582, "ce_orig": 1.053054928779602, "epoch": 0.018980516212524265, "kl_loss": 3030.66552734375, "loss_ib": 30.312294006347656, "step": 66 }, { "ce_ib": 57.94568634033203, "ce_orig": 0.946856677532196, "epoch": 0.018980516212524265, "kl_loss": 3040.84765625, "loss_ib": 30.414268493652344, "step": 66 }, { "ce_ib": 56.41437911987305, "ce_orig": 0.7833185195922852, "epoch": 0.018980516212524265, "kl_loss": 3050.6826171875, "loss_ib": 30.512468338012695, "step": 66 }, { "ce_ib": 59.401546478271484, "ce_orig": 1.328580617904663, "epoch": 0.019268099791501906, "kl_loss": 2916.177978515625, "loss_ib": 29.1677188873291, "step": 67 }, { "ce_ib": 57.880680084228516, "ce_orig": 0.7882740497589111, "epoch": 0.019268099791501906, "kl_loss": 3422.02783203125, "loss_ib": 34.22606658935547, "step": 67 }, { "ce_ib": 59.44600296020508, "ce_orig": 0.7883732914924622, "epoch": 0.019268099791501906, "kl_loss": 3327.45703125, "loss_ib": 33.280513763427734, "step": 67 }, { "ce_ib": 59.17395782470703, "ce_orig": 1.088062047958374, "epoch": 0.019268099791501906, "kl_loss": 1573.11181640625, "loss_ib": 15.737035751342773, "step": 67 }, { "ce_ib": 56.406436920166016, "ce_orig": 0.592961847782135, "epoch": 0.019555683370479547, "kl_loss": 3268.48779296875, "loss_ib": 32.69051742553711, "step": 68 }, { "ce_ib": 56.2723274230957, "ce_orig": 0.5646532773971558, "epoch": 0.019555683370479547, "kl_loss": 3152.529296875, "loss_ib": 31.530920028686523, "step": 68 }, { "ce_ib": 55.98052215576172, "ce_orig": 0.5173469185829163, "epoch": 0.019555683370479547, "kl_loss": 2985.48681640625, "loss_ib": 29.86046600341797, "step": 68 }, { "ce_ib": 55.83637237548828, "ce_orig": 0.4308261573314667, "epoch": 0.019555683370479547, "kl_loss": 2723.078369140625, "loss_ib": 27.236366271972656, "step": 68 }, { "ce_ib": 59.32357406616211, "ce_orig": 1.509739637374878, "epoch": 0.019843266949457185, "kl_loss": 2924.435546875, "loss_ib": 29.250288009643555, "step": 69 }, { "ce_ib": 59.09616470336914, "ce_orig": 2.3940815925598145, "epoch": 0.019843266949457185, "kl_loss": 2945.3994140625, "loss_ib": 29.459903717041016, "step": 69 }, { "ce_ib": 55.772178649902344, "ce_orig": 1.207844614982605, "epoch": 0.019843266949457185, "kl_loss": 3110.099365234375, "loss_ib": 31.106569290161133, "step": 69 }, { "ce_ib": 59.807865142822266, "ce_orig": 1.4729925394058228, "epoch": 0.019843266949457185, "kl_loss": 2798.36474609375, "loss_ib": 27.989627838134766, "step": 69 }, { "epoch": 0.020130850528434826, "grad_norm": 451.3029479980469, "learning_rate": 1.0191082802547772e-05, "loss": 31.1615, "step": 70 }, { "ce_ib": 57.67570495605469, "ce_orig": 0.8390839695930481, "epoch": 0.020130850528434826, "kl_loss": 3100.12451171875, "loss_ib": 31.00701141357422, "step": 70 }, { "ce_ib": 56.19687271118164, "ce_orig": 0.4426974654197693, "epoch": 0.020130850528434826, "kl_loss": 2944.1025390625, "loss_ib": 29.446645736694336, "step": 70 }, { "ce_ib": 57.55405044555664, "ce_orig": 1.0506970882415771, "epoch": 0.020130850528434826, "kl_loss": 2788.48095703125, "loss_ib": 27.89056396484375, "step": 70 }, { "ce_ib": 57.250022888183594, "ce_orig": 0.8879465460777283, "epoch": 0.020130850528434826, "kl_loss": 3008.960693359375, "loss_ib": 30.0953311920166, "step": 70 }, { "ce_ib": 56.017364501953125, "ce_orig": 0.8262448310852051, "epoch": 0.020418434107412467, "kl_loss": 3022.1181640625, "loss_ib": 30.226781845092773, "step": 71 }, { "ce_ib": 57.61652755737305, "ce_orig": 0.628873348236084, "epoch": 0.020418434107412467, "kl_loss": 2915.463134765625, "loss_ib": 29.16039276123047, "step": 71 }, { "ce_ib": 56.01335525512695, "ce_orig": 0.9199650883674622, "epoch": 0.020418434107412467, "kl_loss": 2920.94091796875, "loss_ib": 29.215009689331055, "step": 71 }, { "ce_ib": 55.02300262451172, "ce_orig": 0.636806845664978, "epoch": 0.020418434107412467, "kl_loss": 2990.93994140625, "loss_ib": 29.914901733398438, "step": 71 }, { "ce_ib": 58.92692947387695, "ce_orig": 1.6168797016143799, "epoch": 0.020706017686390108, "kl_loss": 2569.22216796875, "loss_ib": 25.6981143951416, "step": 72 }, { "ce_ib": 54.50556182861328, "ce_orig": 0.7561197280883789, "epoch": 0.020706017686390108, "kl_loss": 3147.120361328125, "loss_ib": 31.476654052734375, "step": 72 }, { "ce_ib": 54.70288848876953, "ce_orig": 0.7983661890029907, "epoch": 0.020706017686390108, "kl_loss": 2991.32568359375, "loss_ib": 29.91872787475586, "step": 72 }, { "ce_ib": 55.79477310180664, "ce_orig": 1.1335042715072632, "epoch": 0.020706017686390108, "kl_loss": 2651.6884765625, "loss_ib": 26.522462844848633, "step": 72 }, { "ce_ib": 55.5018424987793, "ce_orig": 0.6628856062889099, "epoch": 0.02099360126536775, "kl_loss": 2991.87646484375, "loss_ib": 29.924312591552734, "step": 73 }, { "ce_ib": 54.66994094848633, "ce_orig": 0.9854854941368103, "epoch": 0.02099360126536775, "kl_loss": 2946.215087890625, "loss_ib": 29.46761703491211, "step": 73 }, { "ce_ib": 58.076210021972656, "ce_orig": 1.3572182655334473, "epoch": 0.02099360126536775, "kl_loss": 3050.9150390625, "loss_ib": 30.514957427978516, "step": 73 }, { "ce_ib": 55.1069221496582, "ce_orig": 0.8574339747428894, "epoch": 0.02099360126536775, "kl_loss": 3119.42724609375, "loss_ib": 31.19978141784668, "step": 73 }, { "ce_ib": 54.855194091796875, "ce_orig": 0.8055992126464844, "epoch": 0.021281184844345387, "kl_loss": 3110.638671875, "loss_ib": 31.11187171936035, "step": 74 }, { "ce_ib": 52.890716552734375, "ce_orig": 0.522036075592041, "epoch": 0.021281184844345387, "kl_loss": 2826.3251953125, "loss_ib": 28.268539428710938, "step": 74 }, { "ce_ib": 54.693538665771484, "ce_orig": 0.729824960231781, "epoch": 0.021281184844345387, "kl_loss": 3347.115966796875, "loss_ib": 33.476627349853516, "step": 74 }, { "ce_ib": 55.074676513671875, "ce_orig": 0.9839091897010803, "epoch": 0.021281184844345387, "kl_loss": 2667.3046875, "loss_ib": 26.67855453491211, "step": 74 }, { "epoch": 0.021568768423323028, "grad_norm": 460.4914245605469, "learning_rate": 1.0987261146496815e-05, "loss": 30.2003, "step": 75 }, { "ce_ib": 55.64740753173828, "ce_orig": 0.6976457238197327, "epoch": 0.021568768423323028, "kl_loss": 2705.426025390625, "loss_ib": 27.059823989868164, "step": 75 }, { "ce_ib": 56.64052963256836, "ce_orig": 1.448681116104126, "epoch": 0.021568768423323028, "kl_loss": 2853.453369140625, "loss_ib": 28.540197372436523, "step": 75 }, { "ce_ib": 55.26200485229492, "ce_orig": 0.7230492234230042, "epoch": 0.021568768423323028, "kl_loss": 3141.7001953125, "loss_ib": 31.422529220581055, "step": 75 }, { "ce_ib": 54.74195098876953, "ce_orig": 0.611904501914978, "epoch": 0.021568768423323028, "kl_loss": 3029.38916015625, "loss_ib": 30.29936408996582, "step": 75 }, { "ce_ib": 54.31443786621094, "ce_orig": 1.1379636526107788, "epoch": 0.02185635200230067, "kl_loss": 3160.546875, "loss_ib": 31.61090087890625, "step": 76 }, { "ce_ib": 53.96803665161133, "ce_orig": 0.7516291737556458, "epoch": 0.02185635200230067, "kl_loss": 3008.7666015625, "loss_ib": 30.093063354492188, "step": 76 }, { "ce_ib": 54.48766326904297, "ce_orig": 1.210386872291565, "epoch": 0.02185635200230067, "kl_loss": 2852.64794921875, "loss_ib": 28.53192901611328, "step": 76 }, { "ce_ib": 54.85871124267578, "ce_orig": 1.4512004852294922, "epoch": 0.02185635200230067, "kl_loss": 3227.62255859375, "loss_ib": 32.28171157836914, "step": 76 }, { "ce_ib": 54.70118713378906, "ce_orig": 1.2653746604919434, "epoch": 0.02214393558127831, "kl_loss": 2925.536865234375, "loss_ib": 29.260839462280273, "step": 77 }, { "ce_ib": 54.4128532409668, "ce_orig": 0.7473430633544922, "epoch": 0.02214393558127831, "kl_loss": 2963.836669921875, "loss_ib": 29.643808364868164, "step": 77 }, { "ce_ib": 56.661434173583984, "ce_orig": 1.4954595565795898, "epoch": 0.02214393558127831, "kl_loss": 2720.67724609375, "loss_ib": 27.212438583374023, "step": 77 }, { "ce_ib": 54.728179931640625, "ce_orig": 0.827836275100708, "epoch": 0.02214393558127831, "kl_loss": 2690.066650390625, "loss_ib": 26.906139373779297, "step": 77 }, { "ce_ib": 53.935279846191406, "ce_orig": 0.7729896903038025, "epoch": 0.022431519160255948, "kl_loss": 3118.779296875, "loss_ib": 31.193185806274414, "step": 78 }, { "ce_ib": 53.90089797973633, "ce_orig": 1.05341637134552, "epoch": 0.022431519160255948, "kl_loss": 2867.553466796875, "loss_ib": 28.680925369262695, "step": 78 }, { "ce_ib": 57.06119155883789, "ce_orig": 1.1991482973098755, "epoch": 0.022431519160255948, "kl_loss": 2615.50390625, "loss_ib": 26.160743713378906, "step": 78 }, { "ce_ib": 55.66145324707031, "ce_orig": 1.2269896268844604, "epoch": 0.022431519160255948, "kl_loss": 2716.58154296875, "loss_ib": 27.1713809967041, "step": 78 }, { "ce_ib": 56.3227424621582, "ce_orig": 1.6050187349319458, "epoch": 0.02271910273923359, "kl_loss": 2608.66943359375, "loss_ib": 26.09232521057129, "step": 79 }, { "ce_ib": 55.02303695678711, "ce_orig": 1.3928401470184326, "epoch": 0.02271910273923359, "kl_loss": 2699.94677734375, "loss_ib": 27.00497055053711, "step": 79 }, { "ce_ib": 53.92034912109375, "ce_orig": 0.8707427978515625, "epoch": 0.02271910273923359, "kl_loss": 2800.906494140625, "loss_ib": 28.01445770263672, "step": 79 }, { "ce_ib": 55.906776428222656, "ce_orig": 1.184428095817566, "epoch": 0.02271910273923359, "kl_loss": 2736.019775390625, "loss_ib": 27.365787506103516, "step": 79 }, { "epoch": 0.02300668631821123, "grad_norm": 423.0335998535156, "learning_rate": 1.178343949044586e-05, "loss": 28.5021, "step": 80 }, { "ce_ib": 54.60192108154297, "ce_orig": 1.0805023908615112, "epoch": 0.02300668631821123, "kl_loss": 2762.3125, "loss_ib": 27.628583908081055, "step": 80 }, { "ce_ib": 54.54481506347656, "ce_orig": 0.9205932021141052, "epoch": 0.02300668631821123, "kl_loss": 2967.17919921875, "loss_ib": 29.67724609375, "step": 80 }, { "ce_ib": 59.29964065551758, "ce_orig": 1.6950358152389526, "epoch": 0.02300668631821123, "kl_loss": 2693.053955078125, "loss_ib": 26.93647003173828, "step": 80 }, { "ce_ib": 52.242156982421875, "ce_orig": 0.9504690766334534, "epoch": 0.02300668631821123, "kl_loss": 2905.36669921875, "loss_ib": 29.05889129638672, "step": 80 }, { "ce_ib": 55.506492614746094, "ce_orig": 1.2976820468902588, "epoch": 0.02329426989718887, "kl_loss": 2749.579345703125, "loss_ib": 27.501344680786133, "step": 81 }, { "ce_ib": 55.9608039855957, "ce_orig": 1.092388391494751, "epoch": 0.02329426989718887, "kl_loss": 2680.87744140625, "loss_ib": 26.814369201660156, "step": 81 }, { "ce_ib": 55.16973114013672, "ce_orig": 1.686485767364502, "epoch": 0.02329426989718887, "kl_loss": 2655.03369140625, "loss_ib": 26.55585479736328, "step": 81 }, { "ce_ib": 54.82407760620117, "ce_orig": 0.9071881175041199, "epoch": 0.02329426989718887, "kl_loss": 2584.10107421875, "loss_ib": 25.846492767333984, "step": 81 }, { "ce_ib": 52.7196044921875, "ce_orig": 0.6356145739555359, "epoch": 0.023581853476166512, "kl_loss": 2775.622802734375, "loss_ib": 27.761497497558594, "step": 82 }, { "ce_ib": 52.03306198120117, "ce_orig": 0.935957133769989, "epoch": 0.023581853476166512, "kl_loss": 2809.512451171875, "loss_ib": 28.100326538085938, "step": 82 }, { "ce_ib": 53.90233612060547, "ce_orig": 1.145911455154419, "epoch": 0.023581853476166512, "kl_loss": 2701.700927734375, "loss_ib": 27.02239990234375, "step": 82 }, { "ce_ib": 53.358924865722656, "ce_orig": 0.881079375743866, "epoch": 0.023581853476166512, "kl_loss": 2774.904296875, "loss_ib": 27.754379272460938, "step": 82 }, { "ce_ib": 51.51953125, "ce_orig": 1.0080299377441406, "epoch": 0.02386943705514415, "kl_loss": 2673.2802734375, "loss_ib": 26.737953186035156, "step": 83 }, { "ce_ib": 54.799827575683594, "ce_orig": 1.211903691291809, "epoch": 0.02386943705514415, "kl_loss": 2386.9873046875, "loss_ib": 23.87535285949707, "step": 83 }, { "ce_ib": 53.07735824584961, "ce_orig": 0.9792759418487549, "epoch": 0.02386943705514415, "kl_loss": 2844.404296875, "loss_ib": 28.449350357055664, "step": 83 }, { "ce_ib": 57.56839370727539, "ce_orig": 1.708152413368225, "epoch": 0.02386943705514415, "kl_loss": 2686.004150390625, "loss_ib": 26.86579704284668, "step": 83 }, { "ce_ib": 56.169593811035156, "ce_orig": 1.0889211893081665, "epoch": 0.02415702063412179, "kl_loss": 2531.922607421875, "loss_ib": 25.32484245300293, "step": 84 }, { "ce_ib": 52.437904357910156, "ce_orig": 0.9348316788673401, "epoch": 0.02415702063412179, "kl_loss": 2593.02294921875, "loss_ib": 25.93547248840332, "step": 84 }, { "ce_ib": 50.439369201660156, "ce_orig": 0.710110068321228, "epoch": 0.02415702063412179, "kl_loss": 2809.076171875, "loss_ib": 28.09580421447754, "step": 84 }, { "ce_ib": 51.97590637207031, "ce_orig": 0.7616681456565857, "epoch": 0.02415702063412179, "kl_loss": 2728.056640625, "loss_ib": 27.285762786865234, "step": 84 }, { "epoch": 0.024444604213099432, "grad_norm": 432.98297119140625, "learning_rate": 1.2579617834394904e-05, "loss": 27.55, "step": 85 }, { "ce_ib": 53.3626594543457, "ce_orig": 1.2040644884109497, "epoch": 0.024444604213099432, "kl_loss": 2776.72802734375, "loss_ib": 27.77261734008789, "step": 85 }, { "ce_ib": 50.8441276550293, "ce_orig": 0.3849184215068817, "epoch": 0.024444604213099432, "kl_loss": 2446.23681640625, "loss_ib": 24.467453002929688, "step": 85 }, { "ce_ib": 56.2274055480957, "ce_orig": 1.5932576656341553, "epoch": 0.024444604213099432, "kl_loss": 2712.46728515625, "loss_ib": 27.130294799804688, "step": 85 }, { "ce_ib": 51.763954162597656, "ce_orig": 0.8911384344100952, "epoch": 0.024444604213099432, "kl_loss": 2615.62939453125, "loss_ib": 26.161468505859375, "step": 85 }, { "ce_ib": 58.18117904663086, "ce_orig": 2.2738187313079834, "epoch": 0.024732187792077073, "kl_loss": 2173.28564453125, "loss_ib": 21.73867416381836, "step": 86 }, { "ce_ib": 52.2686882019043, "ce_orig": 0.9880481958389282, "epoch": 0.024732187792077073, "kl_loss": 2540.4462890625, "loss_ib": 25.40968894958496, "step": 86 }, { "ce_ib": 52.55824661254883, "ce_orig": 0.7514367699623108, "epoch": 0.024732187792077073, "kl_loss": 2694.514404296875, "loss_ib": 26.95039939880371, "step": 86 }, { "ce_ib": 54.02186584472656, "ce_orig": 1.0578229427337646, "epoch": 0.024732187792077073, "kl_loss": 2508.5751953125, "loss_ib": 25.091154098510742, "step": 86 }, { "ce_ib": 51.11041259765625, "ce_orig": 1.0314545631408691, "epoch": 0.025019771371054714, "kl_loss": 2482.1767578125, "loss_ib": 24.82687759399414, "step": 87 }, { "ce_ib": 52.022422790527344, "ce_orig": 0.9868292212486267, "epoch": 0.025019771371054714, "kl_loss": 2379.2041015625, "loss_ib": 23.797243118286133, "step": 87 }, { "ce_ib": 51.21082305908203, "ce_orig": 0.7481355667114258, "epoch": 0.025019771371054714, "kl_loss": 2631.20556640625, "loss_ib": 26.317176818847656, "step": 87 }, { "ce_ib": 55.54100799560547, "ce_orig": 1.7815814018249512, "epoch": 0.025019771371054714, "kl_loss": 2545.77587890625, "loss_ib": 25.46331214904785, "step": 87 }, { "ce_ib": 52.07685470581055, "ce_orig": 0.6155886054039001, "epoch": 0.025307354950032352, "kl_loss": 2352.36767578125, "loss_ib": 23.52888298034668, "step": 88 }, { "ce_ib": 53.431034088134766, "ce_orig": 0.2792898416519165, "epoch": 0.025307354950032352, "kl_loss": 2138.5185546875, "loss_ib": 21.39052963256836, "step": 88 }, { "ce_ib": 51.92123794555664, "ce_orig": 0.8495407104492188, "epoch": 0.025307354950032352, "kl_loss": 2580.02490234375, "loss_ib": 25.80544090270996, "step": 88 }, { "ce_ib": 51.645992279052734, "ce_orig": 0.8546672463417053, "epoch": 0.025307354950032352, "kl_loss": 2461.83203125, "loss_ib": 24.623483657836914, "step": 88 }, { "ce_ib": 54.053565979003906, "ce_orig": 1.8279736042022705, "epoch": 0.025594938529009993, "kl_loss": 2367.5888671875, "loss_ib": 23.681293487548828, "step": 89 }, { "ce_ib": 51.267242431640625, "ce_orig": 1.1525427103042603, "epoch": 0.025594938529009993, "kl_loss": 2426.50537109375, "loss_ib": 24.270179748535156, "step": 89 }, { "ce_ib": 49.84978485107422, "ce_orig": 0.9793948531150818, "epoch": 0.025594938529009993, "kl_loss": 2521.16650390625, "loss_ib": 25.216650009155273, "step": 89 }, { "ce_ib": 53.35862350463867, "ce_orig": 0.9854567646980286, "epoch": 0.025594938529009993, "kl_loss": 2478.33984375, "loss_ib": 24.788734436035156, "step": 89 }, { "epoch": 0.025882522107987634, "grad_norm": 397.4322814941406, "learning_rate": 1.337579617834395e-05, "loss": 25.8688, "step": 90 }, { "ce_ib": 50.910614013671875, "ce_orig": 0.6994275450706482, "epoch": 0.025882522107987634, "kl_loss": 2584.65478515625, "loss_ib": 25.85163688659668, "step": 90 }, { "ce_ib": 53.02171325683594, "ce_orig": 1.0508131980895996, "epoch": 0.025882522107987634, "kl_loss": 2165.5048828125, "loss_ib": 21.660350799560547, "step": 90 }, { "ce_ib": 55.81970977783203, "ce_orig": 2.0338478088378906, "epoch": 0.025882522107987634, "kl_loss": 2277.224609375, "loss_ib": 22.7778263092041, "step": 90 }, { "ce_ib": 52.05428695678711, "ce_orig": 1.1036865711212158, "epoch": 0.025882522107987634, "kl_loss": 2340.133056640625, "loss_ib": 23.40653419494629, "step": 90 }, { "ce_ib": 50.32669448852539, "ce_orig": 0.6009736657142639, "epoch": 0.026170105686965275, "kl_loss": 2234.68017578125, "loss_ib": 22.35183334350586, "step": 91 }, { "ce_ib": 53.1220817565918, "ce_orig": 1.201808214187622, "epoch": 0.026170105686965275, "kl_loss": 2135.09423828125, "loss_ib": 21.35625457763672, "step": 91 }, { "ce_ib": 49.957176208496094, "ce_orig": 1.040064811706543, "epoch": 0.026170105686965275, "kl_loss": 2486.378662109375, "loss_ib": 24.86878204345703, "step": 91 }, { "ce_ib": 50.12799835205078, "ce_orig": 0.863908588886261, "epoch": 0.026170105686965275, "kl_loss": 2400.52392578125, "loss_ib": 24.010250091552734, "step": 91 }, { "ce_ib": 52.6755256652832, "ce_orig": 1.1070929765701294, "epoch": 0.026457689265942913, "kl_loss": 1971.570068359375, "loss_ib": 19.72096824645996, "step": 92 }, { "ce_ib": 49.004791259765625, "ce_orig": 1.1243679523468018, "epoch": 0.026457689265942913, "kl_loss": 2431.189453125, "loss_ib": 24.31679344177246, "step": 92 }, { "ce_ib": 56.39695739746094, "ce_orig": 2.0895683765411377, "epoch": 0.026457689265942913, "kl_loss": 2032.292724609375, "loss_ib": 20.32856559753418, "step": 92 }, { "ce_ib": 48.332069396972656, "ce_orig": 0.7159590721130371, "epoch": 0.026457689265942913, "kl_loss": 2333.5986328125, "loss_ib": 23.3408203125, "step": 92 }, { "ce_ib": 51.314674377441406, "ce_orig": 0.5955004692077637, "epoch": 0.026745272844920554, "kl_loss": 2113.81005859375, "loss_ib": 21.143232345581055, "step": 93 }, { "ce_ib": 50.85389709472656, "ce_orig": 1.063989281654358, "epoch": 0.026745272844920554, "kl_loss": 2374.11474609375, "loss_ib": 23.746232986450195, "step": 93 }, { "ce_ib": 52.245399475097656, "ce_orig": 0.854840099811554, "epoch": 0.026745272844920554, "kl_loss": 1991.779052734375, "loss_ib": 19.923015594482422, "step": 93 }, { "ce_ib": 49.68756103515625, "ce_orig": 0.7530232667922974, "epoch": 0.026745272844920554, "kl_loss": 2126.8818359375, "loss_ib": 21.273786544799805, "step": 93 }, { "ce_ib": 54.24198913574219, "ce_orig": 1.3871289491653442, "epoch": 0.027032856423898195, "kl_loss": 2152.40869140625, "loss_ib": 21.529510498046875, "step": 94 }, { "ce_ib": 51.039283752441406, "ce_orig": 1.1029423475265503, "epoch": 0.027032856423898195, "kl_loss": 2147.513916015625, "loss_ib": 21.480243682861328, "step": 94 }, { "ce_ib": 48.558746337890625, "ce_orig": 0.8018097877502441, "epoch": 0.027032856423898195, "kl_loss": 2464.363525390625, "loss_ib": 24.64849090576172, "step": 94 }, { "ce_ib": 51.13576889038086, "ce_orig": 1.1009808778762817, "epoch": 0.027032856423898195, "kl_loss": 2014.6015625, "loss_ib": 20.1511287689209, "step": 94 }, { "epoch": 0.027320440002875836, "grad_norm": 380.0746154785156, "learning_rate": 1.4171974522292993e-05, "loss": 23.87, "step": 95 }, { "ce_ib": 55.49427795410156, "ce_orig": 1.7911261320114136, "epoch": 0.027320440002875836, "kl_loss": 2262.322265625, "loss_ib": 22.62877082824707, "step": 95 }, { "ce_ib": 49.06692886352539, "ce_orig": 1.022802710533142, "epoch": 0.027320440002875836, "kl_loss": 2229.0361328125, "loss_ib": 22.29526710510254, "step": 95 }, { "ce_ib": 50.922794342041016, "ce_orig": 0.8836882710456848, "epoch": 0.027320440002875836, "kl_loss": 2195.3564453125, "loss_ib": 21.958656311035156, "step": 95 }, { "ce_ib": 49.9268913269043, "ce_orig": 1.0127633810043335, "epoch": 0.027320440002875836, "kl_loss": 2146.888671875, "loss_ib": 21.473878860473633, "step": 95 }, { "ce_ib": 49.77082061767578, "ce_orig": 0.9023265838623047, "epoch": 0.027608023581853477, "kl_loss": 2299.9072265625, "loss_ib": 23.00404930114746, "step": 96 }, { "ce_ib": 47.34916305541992, "ce_orig": 0.5646235346794128, "epoch": 0.027608023581853477, "kl_loss": 2068.25634765625, "loss_ib": 20.687297821044922, "step": 96 }, { "ce_ib": 49.27576446533203, "ce_orig": 0.8970661163330078, "epoch": 0.027608023581853477, "kl_loss": 2058.2939453125, "loss_ib": 20.587865829467773, "step": 96 }, { "ce_ib": 51.644412994384766, "ce_orig": 1.6223132610321045, "epoch": 0.027608023581853477, "kl_loss": 1921.7979736328125, "loss_ib": 19.22314453125, "step": 96 }, { "ce_ib": 49.01395034790039, "ce_orig": 0.74750155210495, "epoch": 0.027895607160831115, "kl_loss": 1786.2314453125, "loss_ib": 17.867216110229492, "step": 97 }, { "ce_ib": 49.16642761230469, "ce_orig": 1.0198180675506592, "epoch": 0.027895607160831115, "kl_loss": 2137.5, "loss_ib": 21.37991714477539, "step": 97 }, { "ce_ib": 51.9681396484375, "ce_orig": 1.1882346868515015, "epoch": 0.027895607160831115, "kl_loss": 2058.308837890625, "loss_ib": 20.588285446166992, "step": 97 }, { "ce_ib": 49.95888900756836, "ce_orig": 0.9148277640342712, "epoch": 0.027895607160831115, "kl_loss": 2065.841552734375, "loss_ib": 20.663410186767578, "step": 97 }, { "ce_ib": 49.571800231933594, "ce_orig": 1.0728422403335571, "epoch": 0.028183190739808756, "kl_loss": 2083.6865234375, "loss_ib": 20.841821670532227, "step": 98 }, { "ce_ib": 49.93168640136719, "ce_orig": 0.8260626792907715, "epoch": 0.028183190739808756, "kl_loss": 1862.836181640625, "loss_ib": 18.63335418701172, "step": 98 }, { "ce_ib": 48.66516876220703, "ce_orig": 0.562609851360321, "epoch": 0.028183190739808756, "kl_loss": 2181.225830078125, "loss_ib": 21.817123413085938, "step": 98 }, { "ce_ib": 47.39895248413086, "ce_orig": 1.3863259553909302, "epoch": 0.028183190739808756, "kl_loss": 2107.5283203125, "loss_ib": 21.080020904541016, "step": 98 }, { "ce_ib": 48.56808090209961, "ce_orig": 0.7511693835258484, "epoch": 0.028470774318786397, "kl_loss": 2047.9061279296875, "loss_ib": 20.483917236328125, "step": 99 }, { "ce_ib": 48.201148986816406, "ce_orig": 1.3514686822891235, "epoch": 0.028470774318786397, "kl_loss": 2207.186279296875, "loss_ib": 22.07668113708496, "step": 99 }, { "ce_ib": 47.37411880493164, "ce_orig": 0.8630917072296143, "epoch": 0.028470774318786397, "kl_loss": 2191.63232421875, "loss_ib": 21.921058654785156, "step": 99 }, { "ce_ib": 50.7148323059082, "ce_orig": 1.3532038927078247, "epoch": 0.028470774318786397, "kl_loss": 2022.049560546875, "loss_ib": 20.225566864013672, "step": 99 }, { "epoch": 0.02875835789776404, "grad_norm": 356.2680358886719, "learning_rate": 1.4968152866242039e-05, "loss": 21.7419, "step": 100 }, { "ce_ib": 47.18466567993164, "ce_orig": 1.1329602003097534, "epoch": 0.02875835789776404, "kl_loss": 1989.36962890625, "loss_ib": 19.898414611816406, "step": 100 }, { "ce_ib": 53.88701248168945, "ce_orig": 2.2805113792419434, "epoch": 0.02875835789776404, "kl_loss": 1755.5928955078125, "loss_ib": 17.561317443847656, "step": 100 }, { "ce_ib": 48.18925094604492, "ce_orig": 0.8274984359741211, "epoch": 0.02875835789776404, "kl_loss": 1906.422119140625, "loss_ib": 19.069040298461914, "step": 100 }, { "ce_ib": 46.921417236328125, "ce_orig": 0.7587900757789612, "epoch": 0.02875835789776404, "kl_loss": 2072.403076171875, "loss_ib": 20.728723526000977, "step": 100 }, { "ce_ib": 53.836181640625, "ce_orig": 2.063023805618286, "epoch": 0.02904594147674168, "kl_loss": 1652.205322265625, "loss_ib": 16.527435302734375, "step": 101 }, { "ce_ib": 47.936073303222656, "ce_orig": 0.6192855834960938, "epoch": 0.02904594147674168, "kl_loss": 1928.050048828125, "loss_ib": 19.285293579101562, "step": 101 }, { "ce_ib": 52.24326705932617, "ce_orig": 1.2729721069335938, "epoch": 0.02904594147674168, "kl_loss": 1928.1400146484375, "loss_ib": 19.286624908447266, "step": 101 }, { "ce_ib": 46.775421142578125, "ce_orig": 0.7013092041015625, "epoch": 0.02904594147674168, "kl_loss": 2082.877685546875, "loss_ib": 20.833454132080078, "step": 101 }, { "ce_ib": 46.20343780517578, "ce_orig": 0.7948331832885742, "epoch": 0.029333525055719317, "kl_loss": 1859.212890625, "loss_ib": 18.59674835205078, "step": 102 }, { "ce_ib": 48.856143951416016, "ce_orig": 1.1838785409927368, "epoch": 0.029333525055719317, "kl_loss": 1660.9873046875, "loss_ib": 16.614757537841797, "step": 102 }, { "ce_ib": 47.809078216552734, "ce_orig": 1.779065728187561, "epoch": 0.029333525055719317, "kl_loss": 1773.1181640625, "loss_ib": 17.7359619140625, "step": 102 }, { "ce_ib": 48.513916015625, "ce_orig": 1.4937797784805298, "epoch": 0.029333525055719317, "kl_loss": 1870.419189453125, "loss_ib": 18.709043502807617, "step": 102 }, { "ce_ib": 50.835166931152344, "ce_orig": 1.46725594997406, "epoch": 0.02962110863469696, "kl_loss": 1848.5126953125, "loss_ib": 18.490209579467773, "step": 103 }, { "ce_ib": 49.164024353027344, "ce_orig": 1.4439281225204468, "epoch": 0.02962110863469696, "kl_loss": 1786.349365234375, "loss_ib": 17.868410110473633, "step": 103 }, { "ce_ib": 47.89384841918945, "ce_orig": 1.4249969720840454, "epoch": 0.02962110863469696, "kl_loss": 1961.390625, "loss_ib": 19.618694305419922, "step": 103 }, { "ce_ib": 50.38489532470703, "ce_orig": 1.2643296718597412, "epoch": 0.02962110863469696, "kl_loss": 1844.09521484375, "loss_ib": 18.44599151611328, "step": 103 }, { "ce_ib": 47.76396942138672, "ce_orig": 0.7680091857910156, "epoch": 0.0299086922136746, "kl_loss": 1581.564697265625, "loss_ib": 15.820423126220703, "step": 104 }, { "ce_ib": 47.076053619384766, "ce_orig": 1.2261803150177002, "epoch": 0.0299086922136746, "kl_loss": 1776.835693359375, "loss_ib": 17.77306365966797, "step": 104 }, { "ce_ib": 47.24263000488281, "ce_orig": 0.8971230983734131, "epoch": 0.0299086922136746, "kl_loss": 1715.18798828125, "loss_ib": 17.15660285949707, "step": 104 }, { "ce_ib": 45.86969757080078, "ce_orig": 0.2927989065647125, "epoch": 0.0299086922136746, "kl_loss": 1346.9228515625, "loss_ib": 13.47381591796875, "step": 104 }, { "epoch": 0.03019627579265224, "grad_norm": 313.57281494140625, "learning_rate": 1.5764331210191083e-05, "loss": 19.1552, "step": 105 }, { "ce_ib": 46.8266487121582, "ce_orig": 1.2301392555236816, "epoch": 0.03019627579265224, "kl_loss": 1715.3831787109375, "loss_ib": 17.15851402282715, "step": 105 }, { "ce_ib": 48.934349060058594, "ce_orig": 1.5663868188858032, "epoch": 0.03019627579265224, "kl_loss": 1713.754638671875, "loss_ib": 17.142438888549805, "step": 105 }, { "ce_ib": 47.73679733276367, "ce_orig": 0.7973002791404724, "epoch": 0.03019627579265224, "kl_loss": 1519.5120849609375, "loss_ib": 15.199894905090332, "step": 105 }, { "ce_ib": 48.780006408691406, "ce_orig": 1.2290194034576416, "epoch": 0.03019627579265224, "kl_loss": 1714.5169677734375, "loss_ib": 17.150047302246094, "step": 105 }, { "ce_ib": 46.12453079223633, "ce_orig": 0.7794104218482971, "epoch": 0.030483859371629878, "kl_loss": 1571.0771484375, "loss_ib": 15.715384483337402, "step": 106 }, { "ce_ib": 46.5201530456543, "ce_orig": 0.8720536231994629, "epoch": 0.030483859371629878, "kl_loss": 1566.1361083984375, "loss_ib": 15.66601276397705, "step": 106 }, { "ce_ib": 44.020755767822266, "ce_orig": 0.22585166990756989, "epoch": 0.030483859371629878, "kl_loss": 1053.362548828125, "loss_ib": 10.538026809692383, "step": 106 }, { "ce_ib": 44.2620735168457, "ce_orig": 0.26073363423347473, "epoch": 0.030483859371629878, "kl_loss": 1120.464599609375, "loss_ib": 11.20907211303711, "step": 106 }, { "ce_ib": 47.4915885925293, "ce_orig": 1.2189853191375732, "epoch": 0.03077144295060752, "kl_loss": 947.7132568359375, "loss_ib": 9.481881141662598, "step": 107 }, { "ce_ib": 47.91807556152344, "ce_orig": 1.3612654209136963, "epoch": 0.03077144295060752, "kl_loss": 1467.544677734375, "loss_ib": 14.680237770080566, "step": 107 }, { "ce_ib": 42.33379364013672, "ce_orig": 0.8033524751663208, "epoch": 0.03077144295060752, "kl_loss": 1744.4759521484375, "loss_ib": 17.448991775512695, "step": 107 }, { "ce_ib": 47.13089370727539, "ce_orig": 0.9136131405830383, "epoch": 0.03077144295060752, "kl_loss": 1629.6527099609375, "loss_ib": 16.301239013671875, "step": 107 }, { "ce_ib": 46.97206115722656, "ce_orig": 1.0767881870269775, "epoch": 0.03105902652958516, "kl_loss": 1675.902099609375, "loss_ib": 16.763717651367188, "step": 108 }, { "ce_ib": 43.823402404785156, "ce_orig": 0.7930386662483215, "epoch": 0.03105902652958516, "kl_loss": 1553.387939453125, "loss_ib": 15.538261413574219, "step": 108 }, { "ce_ib": 45.571510314941406, "ce_orig": 0.781028151512146, "epoch": 0.03105902652958516, "kl_loss": 1472.5889892578125, "loss_ib": 14.730446815490723, "step": 108 }, { "ce_ib": 48.90847396850586, "ce_orig": 1.6240291595458984, "epoch": 0.03105902652958516, "kl_loss": 1453.4114990234375, "loss_ib": 14.539006233215332, "step": 108 }, { "ce_ib": 47.367916107177734, "ce_orig": 0.615014374256134, "epoch": 0.0313466101085628, "kl_loss": 1492.5986328125, "loss_ib": 14.9307222366333, "step": 109 }, { "ce_ib": 46.28598403930664, "ce_orig": 1.3170636892318726, "epoch": 0.0313466101085628, "kl_loss": 1374.111572265625, "loss_ib": 13.745744705200195, "step": 109 }, { "ce_ib": 47.25022506713867, "ce_orig": 1.893700361251831, "epoch": 0.0313466101085628, "kl_loss": 1464.014404296875, "loss_ib": 14.644868850708008, "step": 109 }, { "ce_ib": 43.77083969116211, "ce_orig": 0.5421922206878662, "epoch": 0.0313466101085628, "kl_loss": 1321.385986328125, "loss_ib": 13.218236923217773, "step": 109 }, { "epoch": 0.03163419368754044, "grad_norm": 294.16033935546875, "learning_rate": 1.6560509554140128e-05, "loss": 16.7628, "step": 110 }, { "ce_ib": 47.9586067199707, "ce_orig": 0.962894082069397, "epoch": 0.03163419368754044, "kl_loss": 1451.75830078125, "loss_ib": 14.522378921508789, "step": 110 }, { "ce_ib": 43.98506546020508, "ce_orig": 0.734940767288208, "epoch": 0.03163419368754044, "kl_loss": 1582.23291015625, "loss_ib": 15.826726913452148, "step": 110 }, { "ce_ib": 43.784725189208984, "ce_orig": 1.0270369052886963, "epoch": 0.03163419368754044, "kl_loss": 1439.91748046875, "loss_ib": 14.403553009033203, "step": 110 }, { "ce_ib": 47.88432312011719, "ce_orig": 1.8923044204711914, "epoch": 0.03163419368754044, "kl_loss": 1339.40087890625, "loss_ib": 13.398797035217285, "step": 110 }, { "ce_ib": 45.02385711669922, "ce_orig": 0.563847005367279, "epoch": 0.031921777266518084, "kl_loss": 1429.29736328125, "loss_ib": 14.29747486114502, "step": 111 }, { "ce_ib": 44.20392990112305, "ce_orig": 1.070389986038208, "epoch": 0.031921777266518084, "kl_loss": 1417.1707763671875, "loss_ib": 14.176127433776855, "step": 111 }, { "ce_ib": 47.985328674316406, "ce_orig": 1.82245671749115, "epoch": 0.031921777266518084, "kl_loss": 1312.49853515625, "loss_ib": 13.129783630371094, "step": 111 }, { "ce_ib": 47.73635482788086, "ce_orig": 1.0577436685562134, "epoch": 0.031921777266518084, "kl_loss": 1424.302734375, "loss_ib": 14.247800827026367, "step": 111 }, { "ce_ib": 46.29003143310547, "ce_orig": 1.197394847869873, "epoch": 0.03220936084549572, "kl_loss": 1341.0858154296875, "loss_ib": 13.415486335754395, "step": 112 }, { "ce_ib": 45.729007720947266, "ce_orig": 0.9139751195907593, "epoch": 0.03220936084549572, "kl_loss": 1310.7313232421875, "loss_ib": 13.111886024475098, "step": 112 }, { "ce_ib": 46.864864349365234, "ce_orig": 1.5965396165847778, "epoch": 0.03220936084549572, "kl_loss": 1156.0203857421875, "loss_ib": 11.564889907836914, "step": 112 }, { "ce_ib": 43.946414947509766, "ce_orig": 1.2731986045837402, "epoch": 0.03220936084549572, "kl_loss": 1306.838134765625, "loss_ib": 13.072775840759277, "step": 112 }, { "ce_ib": 44.451026916503906, "ce_orig": 1.2415810823440552, "epoch": 0.032496944424473366, "kl_loss": 1380.1820068359375, "loss_ib": 13.80626392364502, "step": 113 }, { "ce_ib": 45.05312728881836, "ce_orig": 0.7081640362739563, "epoch": 0.032496944424473366, "kl_loss": 1326.8614501953125, "loss_ib": 13.273119926452637, "step": 113 }, { "ce_ib": 45.38166809082031, "ce_orig": 0.49601882696151733, "epoch": 0.032496944424473366, "kl_loss": 1228.1025390625, "loss_ib": 12.285563468933105, "step": 113 }, { "ce_ib": 42.399070739746094, "ce_orig": 1.1342860460281372, "epoch": 0.032496944424473366, "kl_loss": 1330.390380859375, "loss_ib": 13.30814266204834, "step": 113 }, { "ce_ib": 42.90398406982422, "ce_orig": 0.8459790945053101, "epoch": 0.032784528003451004, "kl_loss": 1192.5108642578125, "loss_ib": 11.929399490356445, "step": 114 }, { "ce_ib": 42.922142028808594, "ce_orig": 0.657600462436676, "epoch": 0.032784528003451004, "kl_loss": 1351.73291015625, "loss_ib": 13.521620750427246, "step": 114 }, { "ce_ib": 43.3038215637207, "ce_orig": 0.5711429119110107, "epoch": 0.032784528003451004, "kl_loss": 1127.6776123046875, "loss_ib": 11.281105995178223, "step": 114 }, { "ce_ib": 45.69675064086914, "ce_orig": 1.5162954330444336, "epoch": 0.032784528003451004, "kl_loss": 1221.5166015625, "loss_ib": 12.219735145568848, "step": 114 }, { "epoch": 0.03307211158242864, "grad_norm": 255.8572540283203, "learning_rate": 1.7356687898089173e-05, "loss": 14.1527, "step": 115 }, { "ce_ib": 45.3430061340332, "ce_orig": 1.2573144435882568, "epoch": 0.03307211158242864, "kl_loss": 1201.44775390625, "loss_ib": 12.019010543823242, "step": 115 }, { "ce_ib": 41.08205795288086, "ce_orig": 0.44548746943473816, "epoch": 0.03307211158242864, "kl_loss": 553.1367797851562, "loss_ib": 5.535475730895996, "step": 115 }, { "ce_ib": 42.01618957519531, "ce_orig": 0.9748629927635193, "epoch": 0.03307211158242864, "kl_loss": 1253.167724609375, "loss_ib": 12.53587818145752, "step": 115 }, { "ce_ib": 46.25815200805664, "ce_orig": 1.704155445098877, "epoch": 0.03307211158242864, "kl_loss": 1103.8121337890625, "loss_ib": 11.042746543884277, "step": 115 }, { "ce_ib": 41.26174545288086, "ce_orig": 0.6826565861701965, "epoch": 0.033359695161406286, "kl_loss": 1163.051025390625, "loss_ib": 11.634635925292969, "step": 116 }, { "ce_ib": 40.63665008544922, "ce_orig": 0.900534987449646, "epoch": 0.033359695161406286, "kl_loss": 1172.418212890625, "loss_ib": 11.728245735168457, "step": 116 }, { "ce_ib": 44.31190872192383, "ce_orig": 1.1153950691223145, "epoch": 0.033359695161406286, "kl_loss": 1033.94287109375, "loss_ib": 10.343859672546387, "step": 116 }, { "ce_ib": 43.1805305480957, "ce_orig": 0.9051750302314758, "epoch": 0.033359695161406286, "kl_loss": 1077.079833984375, "loss_ib": 10.775115966796875, "step": 116 }, { "ce_ib": 41.2710075378418, "ce_orig": 0.38958603143692017, "epoch": 0.033647278740383924, "kl_loss": 966.39892578125, "loss_ib": 9.668116569519043, "step": 117 }, { "ce_ib": 42.25935745239258, "ce_orig": 0.8274361491203308, "epoch": 0.033647278740383924, "kl_loss": 1053.1240234375, "loss_ib": 10.535466194152832, "step": 117 }, { "ce_ib": 40.06983947753906, "ce_orig": 0.7041372060775757, "epoch": 0.033647278740383924, "kl_loss": 1147.9034423828125, "loss_ib": 11.483041763305664, "step": 117 }, { "ce_ib": 46.431880950927734, "ce_orig": 1.3825441598892212, "epoch": 0.033647278740383924, "kl_loss": 1083.45751953125, "loss_ib": 10.839218139648438, "step": 117 }, { "ce_ib": 43.25281524658203, "ce_orig": 0.9396786689758301, "epoch": 0.03393486231936156, "kl_loss": 1038.500244140625, "loss_ib": 10.389327049255371, "step": 118 }, { "ce_ib": 40.72803497314453, "ce_orig": 0.5316663980484009, "epoch": 0.03393486231936156, "kl_loss": 935.3412475585938, "loss_ib": 9.357484817504883, "step": 118 }, { "ce_ib": 40.19837951660156, "ce_orig": 0.7874443531036377, "epoch": 0.03393486231936156, "kl_loss": 987.9114379882812, "loss_ib": 9.883133888244629, "step": 118 }, { "ce_ib": 42.92312240600586, "ce_orig": 0.8642221093177795, "epoch": 0.03393486231936156, "kl_loss": 1002.868896484375, "loss_ib": 10.032980918884277, "step": 118 }, { "ce_ib": 43.140602111816406, "ce_orig": 0.9903743863105774, "epoch": 0.034222445898339206, "kl_loss": 945.7418212890625, "loss_ib": 9.461731910705566, "step": 119 }, { "ce_ib": 44.95377731323242, "ce_orig": 0.7084935903549194, "epoch": 0.034222445898339206, "kl_loss": 1001.4967041015625, "loss_ib": 10.019461631774902, "step": 119 }, { "ce_ib": 43.81313705444336, "ce_orig": 1.0507792234420776, "epoch": 0.034222445898339206, "kl_loss": 966.8169555664062, "loss_ib": 9.672550201416016, "step": 119 }, { "ce_ib": 38.509605407714844, "ce_orig": 0.24314048886299133, "epoch": 0.034222445898339206, "kl_loss": 900.1303100585938, "loss_ib": 9.00515365600586, "step": 119 }, { "epoch": 0.03451002947731684, "grad_norm": 213.6476287841797, "learning_rate": 1.8152866242038215e-05, "loss": 11.2209, "step": 120 }, { "ce_ib": 43.3798942565918, "ce_orig": 1.417758822441101, "epoch": 0.03451002947731684, "kl_loss": 874.8845825195312, "loss_ib": 8.753183364868164, "step": 120 }, { "ce_ib": 41.32734298706055, "ce_orig": 0.8705493807792664, "epoch": 0.03451002947731684, "kl_loss": 937.0117797851562, "loss_ib": 9.374250411987305, "step": 120 }, { "ce_ib": 38.6541633605957, "ce_orig": 0.23277077078819275, "epoch": 0.03451002947731684, "kl_loss": 378.5799560546875, "loss_ib": 3.7896647453308105, "step": 120 }, { "ce_ib": 43.36669921875, "ce_orig": 1.0161871910095215, "epoch": 0.03451002947731684, "kl_loss": 853.2371215820312, "loss_ib": 8.536707878112793, "step": 120 }, { "ce_ib": 41.16870880126953, "ce_orig": 0.9253172874450684, "epoch": 0.03479761305629449, "kl_loss": 846.5045776367188, "loss_ib": 8.469161987304688, "step": 121 }, { "ce_ib": 44.02971267700195, "ce_orig": 1.2445998191833496, "epoch": 0.03479761305629449, "kl_loss": 718.2892456054688, "loss_ib": 7.187295436859131, "step": 121 }, { "ce_ib": 43.64518737792969, "ce_orig": 1.7942239046096802, "epoch": 0.03479761305629449, "kl_loss": 756.7442626953125, "loss_ib": 7.571806907653809, "step": 121 }, { "ce_ib": 42.69846725463867, "ce_orig": 0.8896026015281677, "epoch": 0.03479761305629449, "kl_loss": 883.087890625, "loss_ib": 8.835148811340332, "step": 121 }, { "ce_ib": 40.64472579956055, "ce_orig": 0.8089054822921753, "epoch": 0.035085196635272126, "kl_loss": 727.42724609375, "loss_ib": 7.278336524963379, "step": 122 }, { "ce_ib": 41.40364456176758, "ce_orig": 0.8790702819824219, "epoch": 0.035085196635272126, "kl_loss": 701.3001708984375, "loss_ib": 7.017142295837402, "step": 122 }, { "ce_ib": 45.067813873291016, "ce_orig": 0.3258854150772095, "epoch": 0.035085196635272126, "kl_loss": 577.9033203125, "loss_ib": 5.783539772033691, "step": 122 }, { "ce_ib": 44.684349060058594, "ce_orig": 1.5608466863632202, "epoch": 0.035085196635272126, "kl_loss": 660.216796875, "loss_ib": 6.606636047363281, "step": 122 }, { "ce_ib": 42.09290313720703, "ce_orig": 0.7853221297264099, "epoch": 0.03537278021424976, "kl_loss": 688.5507202148438, "loss_ib": 6.889716625213623, "step": 123 }, { "ce_ib": 41.19681930541992, "ce_orig": 1.0058292150497437, "epoch": 0.03537278021424976, "kl_loss": 660.992431640625, "loss_ib": 6.614044189453125, "step": 123 }, { "ce_ib": 41.700340270996094, "ce_orig": 0.7194111347198486, "epoch": 0.03537278021424976, "kl_loss": 460.14190673828125, "loss_ib": 4.605588912963867, "step": 123 }, { "ce_ib": 44.97040939331055, "ce_orig": 1.1617707014083862, "epoch": 0.03537278021424976, "kl_loss": 618.4761962890625, "loss_ib": 6.189259052276611, "step": 123 }, { "ce_ib": 42.433712005615234, "ce_orig": 0.7316823601722717, "epoch": 0.03566036379322741, "kl_loss": 761.43359375, "loss_ib": 7.618578910827637, "step": 124 }, { "ce_ib": 42.72594451904297, "ce_orig": 0.9406179189682007, "epoch": 0.03566036379322741, "kl_loss": 608.378173828125, "loss_ib": 6.088054180145264, "step": 124 }, { "ce_ib": 44.054351806640625, "ce_orig": 1.101775050163269, "epoch": 0.03566036379322741, "kl_loss": 533.7700805664062, "loss_ib": 5.342106342315674, "step": 124 }, { "ce_ib": 41.86262130737305, "ce_orig": 1.2485934495925903, "epoch": 0.03566036379322741, "kl_loss": 604.7998657226562, "loss_ib": 6.05218505859375, "step": 124 }, { "epoch": 0.035947947372205045, "grad_norm": 165.4596405029297, "learning_rate": 1.8949044585987264e-05, "loss": 8.3603, "step": 125 }, { "ce_ib": 41.704227447509766, "ce_orig": 0.7984323501586914, "epoch": 0.035947947372205045, "kl_loss": 570.8909912109375, "loss_ib": 5.713080406188965, "step": 125 }, { "ce_ib": 44.47398376464844, "ce_orig": 1.532689094543457, "epoch": 0.035947947372205045, "kl_loss": 572.6158447265625, "loss_ib": 5.7306060791015625, "step": 125 }, { "ce_ib": 44.11103820800781, "ce_orig": 0.8605639338493347, "epoch": 0.035947947372205045, "kl_loss": 560.5389404296875, "loss_ib": 5.609800338745117, "step": 125 }, { "ce_ib": 42.20602798461914, "ce_orig": 1.0192476511001587, "epoch": 0.035947947372205045, "kl_loss": 583.3988647460938, "loss_ib": 5.83820915222168, "step": 125 }, { "ce_ib": 43.26830291748047, "ce_orig": 0.7587823271751404, "epoch": 0.03623553095118269, "kl_loss": 595.424072265625, "loss_ib": 5.958567142486572, "step": 126 }, { "ce_ib": 42.44752502441406, "ce_orig": 1.2043931484222412, "epoch": 0.03623553095118269, "kl_loss": 496.97802734375, "loss_ib": 4.974024772644043, "step": 126 }, { "ce_ib": 43.29387283325195, "ce_orig": 1.735470175743103, "epoch": 0.03623553095118269, "kl_loss": 459.98992919921875, "loss_ib": 4.604228496551514, "step": 126 }, { "ce_ib": 44.7207145690918, "ce_orig": 1.0822900533676147, "epoch": 0.03623553095118269, "kl_loss": 513.75048828125, "loss_ib": 5.141976833343506, "step": 126 }, { "ce_ib": 43.62824249267578, "ce_orig": 1.2997839450836182, "epoch": 0.03652311453016033, "kl_loss": 499.59527587890625, "loss_ib": 5.0003156661987305, "step": 127 }, { "ce_ib": 45.198951721191406, "ce_orig": 1.4282422065734863, "epoch": 0.03652311453016033, "kl_loss": 442.3271484375, "loss_ib": 4.427791118621826, "step": 127 }, { "ce_ib": 41.611297607421875, "ce_orig": 0.6139658093452454, "epoch": 0.03652311453016033, "kl_loss": 492.67706298828125, "loss_ib": 4.930931568145752, "step": 127 }, { "ce_ib": 43.24065017700195, "ce_orig": 1.5706660747528076, "epoch": 0.03652311453016033, "kl_loss": 477.58251953125, "loss_ib": 4.780148983001709, "step": 127 }, { "ce_ib": 45.77122497558594, "ce_orig": 1.3252004384994507, "epoch": 0.036810698109137965, "kl_loss": 367.55364990234375, "loss_ib": 3.6801135540008545, "step": 128 }, { "ce_ib": 43.11273956298828, "ce_orig": 1.3362116813659668, "epoch": 0.036810698109137965, "kl_loss": 402.22039794921875, "loss_ib": 4.026515007019043, "step": 128 }, { "ce_ib": 43.218231201171875, "ce_orig": 1.3605029582977295, "epoch": 0.036810698109137965, "kl_loss": 467.728759765625, "loss_ib": 4.681609630584717, "step": 128 }, { "ce_ib": 42.986263275146484, "ce_orig": 1.012925386428833, "epoch": 0.036810698109137965, "kl_loss": 461.2456359863281, "loss_ib": 4.61675500869751, "step": 128 }, { "ce_ib": 45.84535598754883, "ce_orig": 0.9996353387832642, "epoch": 0.03709828168811561, "kl_loss": 307.2117919921875, "loss_ib": 3.07670259475708, "step": 129 }, { "ce_ib": 47.88697052001953, "ce_orig": 1.4389865398406982, "epoch": 0.03709828168811561, "kl_loss": 270.8951416015625, "loss_ib": 2.713740110397339, "step": 129 }, { "ce_ib": 44.36796569824219, "ce_orig": 0.28512611985206604, "epoch": 0.03709828168811561, "kl_loss": 424.74493408203125, "loss_ib": 4.251885890960693, "step": 129 }, { "ce_ib": 49.39015197753906, "ce_orig": 1.1395325660705566, "epoch": 0.03709828168811561, "kl_loss": 358.5738220214844, "loss_ib": 3.59067702293396, "step": 129 }, { "epoch": 0.03738586526709325, "grad_norm": 114.32688903808594, "learning_rate": 1.974522292993631e-05, "loss": 5.7247, "step": 130 }, { "ce_ib": 46.33614730834961, "ce_orig": 1.3037816286087036, "epoch": 0.03738586526709325, "kl_loss": 291.12872314453125, "loss_ib": 2.9159207344055176, "step": 130 }, { "ce_ib": 47.692874908447266, "ce_orig": 0.864368736743927, "epoch": 0.03738586526709325, "kl_loss": 327.73089599609375, "loss_ib": 3.282078266143799, "step": 130 }, { "ce_ib": 49.18111038208008, "ce_orig": 1.450368046760559, "epoch": 0.03738586526709325, "kl_loss": 326.9405212402344, "loss_ib": 3.2743234634399414, "step": 130 }, { "ce_ib": 47.151817321777344, "ce_orig": 0.6973881125450134, "epoch": 0.03738586526709325, "kl_loss": 341.2000732421875, "loss_ib": 3.4167158603668213, "step": 130 }, { "ce_ib": 47.11798858642578, "ce_orig": 0.9874345660209656, "epoch": 0.03767344884607089, "kl_loss": 245.39163208007812, "loss_ib": 2.458627939224243, "step": 131 }, { "ce_ib": 48.82184600830078, "ce_orig": 1.7434450387954712, "epoch": 0.03767344884607089, "kl_loss": 233.43666076660156, "loss_ib": 2.3392486572265625, "step": 131 }, { "ce_ib": 52.432861328125, "ce_orig": 1.6617094278335571, "epoch": 0.03767344884607089, "kl_loss": 249.0355682373047, "loss_ib": 2.495598793029785, "step": 131 }, { "ce_ib": 48.34469223022461, "ce_orig": 0.8209026455879211, "epoch": 0.03767344884607089, "kl_loss": 258.18017578125, "loss_ib": 2.5866363048553467, "step": 131 }, { "ce_ib": 49.49347686767578, "ce_orig": 1.1256669759750366, "epoch": 0.03796103242504853, "kl_loss": 249.56777954101562, "loss_ib": 2.500627040863037, "step": 132 }, { "ce_ib": 53.37258529663086, "ce_orig": 1.1655960083007812, "epoch": 0.03796103242504853, "kl_loss": 296.350830078125, "loss_ib": 2.9688453674316406, "step": 132 }, { "ce_ib": 48.557525634765625, "ce_orig": 1.608039140701294, "epoch": 0.03796103242504853, "kl_loss": 236.46792602539062, "loss_ib": 2.369534969329834, "step": 132 }, { "ce_ib": 49.64237594604492, "ce_orig": 1.220885157585144, "epoch": 0.03796103242504853, "kl_loss": 232.15313720703125, "loss_ib": 2.32649564743042, "step": 132 }, { "ce_ib": 53.12397384643555, "ce_orig": 1.4053157567977905, "epoch": 0.03824861600402617, "kl_loss": 148.06582641601562, "loss_ib": 1.4859706163406372, "step": 133 }, { "ce_ib": 46.214569091796875, "ce_orig": 0.5235381722450256, "epoch": 0.03824861600402617, "kl_loss": 216.90960693359375, "loss_ib": 2.173717498779297, "step": 133 }, { "ce_ib": 63.17025375366211, "ce_orig": 1.6942404508590698, "epoch": 0.03824861600402617, "kl_loss": 157.73348999023438, "loss_ib": 1.5836519002914429, "step": 133 }, { "ce_ib": 56.94756317138672, "ce_orig": 1.1503974199295044, "epoch": 0.03824861600402617, "kl_loss": 172.39581298828125, "loss_ib": 1.7296528816223145, "step": 133 }, { "ce_ib": 56.051700592041016, "ce_orig": 1.2757078409194946, "epoch": 0.03853619958300381, "kl_loss": 132.28765869140625, "loss_ib": 1.328481674194336, "step": 134 }, { "ce_ib": 57.61357879638672, "ce_orig": 0.6087625026702881, "epoch": 0.03853619958300381, "kl_loss": 177.25326538085938, "loss_ib": 1.7782940864562988, "step": 134 }, { "ce_ib": 62.553672790527344, "ce_orig": 0.979148805141449, "epoch": 0.03853619958300381, "kl_loss": 148.2458038330078, "loss_ib": 1.4887133836746216, "step": 134 }, { "ce_ib": 59.60444259643555, "ce_orig": 0.786743700504303, "epoch": 0.03853619958300381, "kl_loss": 177.24185180664062, "loss_ib": 1.7783788442611694, "step": 134 }, { "epoch": 0.03882378316198145, "grad_norm": 61.325218200683594, "learning_rate": 2.054140127388535e-05, "loss": 3.423, "step": 135 }, { "ce_ib": 47.83711624145508, "ce_orig": 1.0823129415512085, "epoch": 0.03882378316198145, "kl_loss": 117.60155487060547, "loss_ib": 1.1807992458343506, "step": 135 }, { "ce_ib": 53.23299789428711, "ce_orig": 2.0539369583129883, "epoch": 0.03882378316198145, "kl_loss": 105.29367065429688, "loss_ib": 1.0582599639892578, "step": 135 }, { "ce_ib": 62.1235466003418, "ce_orig": 1.288967251777649, "epoch": 0.03882378316198145, "kl_loss": 117.70156860351562, "loss_ib": 1.1832280158996582, "step": 135 }, { "ce_ib": 60.246185302734375, "ce_orig": 1.0303462743759155, "epoch": 0.03882378316198145, "kl_loss": 119.00950622558594, "loss_ib": 1.1961196660995483, "step": 135 }, { "ce_ib": 64.75760650634766, "ce_orig": 1.0299265384674072, "epoch": 0.039111366740959094, "kl_loss": 97.26797485351562, "loss_ib": 0.9791554808616638, "step": 136 }, { "ce_ib": 59.91645812988281, "ce_orig": 0.9491832256317139, "epoch": 0.039111366740959094, "kl_loss": 101.67373657226562, "loss_ib": 1.0227290391921997, "step": 136 }, { "ce_ib": 64.09386444091797, "ce_orig": 1.0575294494628906, "epoch": 0.039111366740959094, "kl_loss": 86.674072265625, "loss_ib": 0.873150110244751, "step": 136 }, { "ce_ib": 55.84811782836914, "ce_orig": 0.5318177342414856, "epoch": 0.039111366740959094, "kl_loss": 69.2609634399414, "loss_ib": 0.6981943845748901, "step": 136 }, { "ce_ib": 61.201900482177734, "ce_orig": 1.5152733325958252, "epoch": 0.03939895031993673, "kl_loss": 86.82037353515625, "loss_ib": 0.8743239641189575, "step": 137 }, { "ce_ib": 48.1711540222168, "ce_orig": 0.9321234822273254, "epoch": 0.03939895031993673, "kl_loss": 88.01079559326172, "loss_ib": 0.8849250674247742, "step": 137 }, { "ce_ib": 56.62932205200195, "ce_orig": 0.9663710594177246, "epoch": 0.03939895031993673, "kl_loss": 92.86305236816406, "loss_ib": 0.9342934489250183, "step": 137 }, { "ce_ib": 50.61298751831055, "ce_orig": 1.012882113456726, "epoch": 0.03939895031993673, "kl_loss": 100.32122802734375, "loss_ib": 1.0082734823226929, "step": 137 }, { "ce_ib": 52.78557586669922, "ce_orig": 1.3567779064178467, "epoch": 0.03968653389891437, "kl_loss": 75.2830581665039, "loss_ib": 0.7581090927124023, "step": 138 }, { "ce_ib": 52.53969192504883, "ce_orig": 1.0360667705535889, "epoch": 0.03968653389891437, "kl_loss": 80.51203918457031, "loss_ib": 0.81037437915802, "step": 138 }, { "ce_ib": 42.97282028198242, "ce_orig": 0.6911470890045166, "epoch": 0.03968653389891437, "kl_loss": 107.92098236083984, "loss_ib": 1.0835070610046387, "step": 138 }, { "ce_ib": 55.01441192626953, "ce_orig": 1.0413540601730347, "epoch": 0.03968653389891437, "kl_loss": 84.3485107421875, "loss_ib": 0.8489865064620972, "step": 138 }, { "ce_ib": 49.41832733154297, "ce_orig": 0.5004691481590271, "epoch": 0.039974117477892014, "kl_loss": 64.56187438964844, "loss_ib": 0.6505606174468994, "step": 139 }, { "ce_ib": 54.80555725097656, "ce_orig": 0.8709143996238708, "epoch": 0.039974117477892014, "kl_loss": 75.56375122070312, "loss_ib": 0.7611180543899536, "step": 139 }, { "ce_ib": 44.817134857177734, "ce_orig": 1.1028708219528198, "epoch": 0.039974117477892014, "kl_loss": 56.54993438720703, "loss_ib": 0.569981038570404, "step": 139 }, { "ce_ib": 50.21042251586914, "ce_orig": 1.0824670791625977, "epoch": 0.039974117477892014, "kl_loss": 69.47157287597656, "loss_ib": 0.6997367739677429, "step": 139 }, { "epoch": 0.04026170105686965, "grad_norm": 27.144216537475586, "learning_rate": 2.1337579617834397e-05, "loss": 2.0774, "step": 140 }, { "ce_ib": 47.516990661621094, "ce_orig": 1.2334574460983276, "epoch": 0.04026170105686965, "kl_loss": 63.68349838256836, "loss_ib": 0.6415866613388062, "step": 140 }, { "ce_ib": 42.7164306640625, "ce_orig": 0.7245992422103882, "epoch": 0.04026170105686965, "kl_loss": 62.23073196411133, "loss_ib": 0.6265789866447449, "step": 140 }, { "ce_ib": 47.90711212158203, "ce_orig": 0.797220766544342, "epoch": 0.04026170105686965, "kl_loss": 70.8463134765625, "loss_ib": 0.7132538557052612, "step": 140 }, { "ce_ib": 44.96827697753906, "ce_orig": 0.9708709716796875, "epoch": 0.04026170105686965, "kl_loss": 62.58702087402344, "loss_ib": 0.6303670406341553, "step": 140 }, { "ce_ib": 43.66420364379883, "ce_orig": 1.5154752731323242, "epoch": 0.040549284635847296, "kl_loss": 63.67985916137695, "loss_ib": 0.641165018081665, "step": 141 }, { "ce_ib": 39.74589920043945, "ce_orig": 1.1597050428390503, "epoch": 0.040549284635847296, "kl_loss": 68.15312194824219, "loss_ib": 0.6855058073997498, "step": 141 }, { "ce_ib": 38.30898666381836, "ce_orig": 1.208406686782837, "epoch": 0.040549284635847296, "kl_loss": 54.45480728149414, "loss_ib": 0.5483789443969727, "step": 141 }, { "ce_ib": 42.6765022277832, "ce_orig": 1.5113545656204224, "epoch": 0.040549284635847296, "kl_loss": 45.85490417480469, "loss_ib": 0.46281668543815613, "step": 141 }, { "ce_ib": 40.479461669921875, "ce_orig": 1.2261719703674316, "epoch": 0.040836868214824934, "kl_loss": 44.18513488769531, "loss_ib": 0.44589927792549133, "step": 142 }, { "ce_ib": 38.052547454833984, "ce_orig": 0.6562057137489319, "epoch": 0.040836868214824934, "kl_loss": 54.23804473876953, "loss_ib": 0.5461856722831726, "step": 142 }, { "ce_ib": 42.021270751953125, "ce_orig": 0.31955811381340027, "epoch": 0.040836868214824934, "kl_loss": 29.33365249633789, "loss_ib": 0.2975386381149292, "step": 142 }, { "ce_ib": 41.40554428100586, "ce_orig": 0.9634075164794922, "epoch": 0.040836868214824934, "kl_loss": 54.530174255371094, "loss_ib": 0.5494422912597656, "step": 142 }, { "ce_ib": 38.900028228759766, "ce_orig": 1.0080485343933105, "epoch": 0.04112445179380257, "kl_loss": 52.973106384277344, "loss_ib": 0.533621072769165, "step": 143 }, { "ce_ib": 38.12443923950195, "ce_orig": 0.9282627105712891, "epoch": 0.04112445179380257, "kl_loss": 42.263893127441406, "loss_ib": 0.42645135521888733, "step": 143 }, { "ce_ib": 43.536231994628906, "ce_orig": 1.5404144525527954, "epoch": 0.04112445179380257, "kl_loss": 39.663185119628906, "loss_ib": 0.4009854793548584, "step": 143 }, { "ce_ib": 39.83261489868164, "ce_orig": 1.2672309875488281, "epoch": 0.04112445179380257, "kl_loss": 42.35781478881836, "loss_ib": 0.4275614023208618, "step": 143 }, { "ce_ib": 41.01529312133789, "ce_orig": 1.457834005355835, "epoch": 0.041412035372780216, "kl_loss": 34.49407958984375, "loss_ib": 0.3490423262119293, "step": 144 }, { "ce_ib": 29.345317840576172, "ce_orig": 0.3651731610298157, "epoch": 0.041412035372780216, "kl_loss": 68.94469451904297, "loss_ib": 0.6923814415931702, "step": 144 }, { "ce_ib": 34.595951080322266, "ce_orig": 0.5874239802360535, "epoch": 0.041412035372780216, "kl_loss": 42.69541931152344, "loss_ib": 0.43041378259658813, "step": 144 }, { "ce_ib": 33.79957962036133, "ce_orig": 0.6981248259544373, "epoch": 0.041412035372780216, "kl_loss": 43.602195739746094, "loss_ib": 0.43940192461013794, "step": 144 }, { "epoch": 0.041699618951757854, "grad_norm": 11.803001403808594, "learning_rate": 2.2133757961783442e-05, "loss": 1.5408, "step": 145 }, { "ce_ib": 35.549190521240234, "ce_orig": 1.1565806865692139, "epoch": 0.041699618951757854, "kl_loss": 33.884830474853516, "loss_ib": 0.34240320324897766, "step": 145 }, { "ce_ib": 36.85725021362305, "ce_orig": 0.614605188369751, "epoch": 0.041699618951757854, "kl_loss": 38.68310546875, "loss_ib": 0.3905167579650879, "step": 145 }, { "ce_ib": 33.613216400146484, "ce_orig": 0.774656355381012, "epoch": 0.041699618951757854, "kl_loss": 35.071624755859375, "loss_ib": 0.35407754778862, "step": 145 }, { "ce_ib": 38.60401916503906, "ce_orig": 1.3087610006332397, "epoch": 0.041699618951757854, "kl_loss": 27.925447463989258, "loss_ib": 0.28311488032341003, "step": 145 }, { "ce_ib": 31.10846519470215, "ce_orig": 0.8307720422744751, "epoch": 0.0419872025307355, "kl_loss": 35.52260208129883, "loss_ib": 0.358336865901947, "step": 146 }, { "ce_ib": 35.52298355102539, "ce_orig": 0.6402543187141418, "epoch": 0.0419872025307355, "kl_loss": 20.296550750732422, "loss_ib": 0.2065178006887436, "step": 146 }, { "ce_ib": 32.333797454833984, "ce_orig": 0.5773739814758301, "epoch": 0.0419872025307355, "kl_loss": 33.569828033447266, "loss_ib": 0.3389316499233246, "step": 146 }, { "ce_ib": 36.07624816894531, "ce_orig": 1.3285282850265503, "epoch": 0.0419872025307355, "kl_loss": 28.952056884765625, "loss_ib": 0.29312819242477417, "step": 146 }, { "ce_ib": 34.523563385009766, "ce_orig": 1.455711841583252, "epoch": 0.042274786109713136, "kl_loss": 33.6051025390625, "loss_ib": 0.33950334787368774, "step": 147 }, { "ce_ib": 32.496185302734375, "ce_orig": 0.8119601011276245, "epoch": 0.042274786109713136, "kl_loss": 30.560955047607422, "loss_ib": 0.3088591694831848, "step": 147 }, { "ce_ib": 31.24298858642578, "ce_orig": 0.6599155068397522, "epoch": 0.042274786109713136, "kl_loss": 25.330509185791016, "loss_ib": 0.25642937421798706, "step": 147 }, { "ce_ib": 34.15837097167969, "ce_orig": 0.7831727862358093, "epoch": 0.042274786109713136, "kl_loss": 32.8238410949707, "loss_ib": 0.33165425062179565, "step": 147 }, { "ce_ib": 36.50813674926758, "ce_orig": 1.3959016799926758, "epoch": 0.042562369688690774, "kl_loss": 24.21875762939453, "loss_ib": 0.24583838880062103, "step": 148 }, { "ce_ib": 33.1202392578125, "ce_orig": 0.511696457862854, "epoch": 0.042562369688690774, "kl_loss": 32.21922302246094, "loss_ib": 0.32550424337387085, "step": 148 }, { "ce_ib": 31.0117130279541, "ce_orig": 0.6812951564788818, "epoch": 0.042562369688690774, "kl_loss": 24.291759490966797, "loss_ib": 0.24601876735687256, "step": 148 }, { "ce_ib": 31.82808494567871, "ce_orig": 0.6159489750862122, "epoch": 0.042562369688690774, "kl_loss": 21.070880889892578, "loss_ib": 0.21389161050319672, "step": 148 }, { "ce_ib": 30.777088165283203, "ce_orig": 0.6892868280410767, "epoch": 0.04284995326766842, "kl_loss": 22.594371795654297, "loss_ib": 0.22902143001556396, "step": 149 }, { "ce_ib": 37.14453887939453, "ce_orig": 1.9816077947616577, "epoch": 0.04284995326766842, "kl_loss": 44.33348083496094, "loss_ib": 0.44704926013946533, "step": 149 }, { "ce_ib": 28.821805953979492, "ce_orig": 0.8520447611808777, "epoch": 0.04284995326766842, "kl_loss": 25.312294006347656, "loss_ib": 0.25600510835647583, "step": 149 }, { "ce_ib": 34.31684494018555, "ce_orig": 1.2896530628204346, "epoch": 0.04284995326766842, "kl_loss": 29.53026580810547, "loss_ib": 0.2987343370914459, "step": 149 }, { "epoch": 0.043137536846646056, "grad_norm": 6.311826705932617, "learning_rate": 2.2929936305732484e-05, "loss": 1.2869, "step": 150 }, { "ce_ib": 29.53162384033203, "ce_orig": 0.9975224733352661, "epoch": 0.043137536846646056, "kl_loss": 21.389690399169922, "loss_ib": 0.21685007214546204, "step": 150 }, { "ce_ib": 33.31801986694336, "ce_orig": 1.2958406209945679, "epoch": 0.043137536846646056, "kl_loss": 24.239055633544922, "loss_ib": 0.24572233855724335, "step": 150 }, { "ce_ib": 35.665565490722656, "ce_orig": 0.5235558152198792, "epoch": 0.043137536846646056, "kl_loss": 22.637462615966797, "loss_ib": 0.22994117438793182, "step": 150 }, { "ce_ib": 35.29521179199219, "ce_orig": 1.2123780250549316, "epoch": 0.043137536846646056, "kl_loss": 21.82353401184082, "loss_ib": 0.22176486253738403, "step": 150 }, { "ce_ib": 33.05928421020508, "ce_orig": 0.8596100807189941, "epoch": 0.043425120425623694, "kl_loss": 24.44532012939453, "loss_ib": 0.2477591335773468, "step": 151 }, { "ce_ib": 38.77718734741211, "ce_orig": 2.1412835121154785, "epoch": 0.043425120425623694, "kl_loss": 28.010578155517578, "loss_ib": 0.2839834988117218, "step": 151 }, { "ce_ib": 34.24200439453125, "ce_orig": 0.6295925974845886, "epoch": 0.043425120425623694, "kl_loss": 21.05971908569336, "loss_ib": 0.21402138471603394, "step": 151 }, { "ce_ib": 33.19257736206055, "ce_orig": 1.2560220956802368, "epoch": 0.043425120425623694, "kl_loss": 21.76863670349121, "loss_ib": 0.2210056185722351, "step": 151 }, { "ce_ib": 32.58409881591797, "ce_orig": 0.7950013279914856, "epoch": 0.04371270400460134, "kl_loss": 28.509788513183594, "loss_ib": 0.28835630416870117, "step": 152 }, { "ce_ib": 32.49606704711914, "ce_orig": 1.8779208660125732, "epoch": 0.04371270400460134, "kl_loss": 30.838430404663086, "loss_ib": 0.3116339147090912, "step": 152 }, { "ce_ib": 33.429622650146484, "ce_orig": 0.7865967154502869, "epoch": 0.04371270400460134, "kl_loss": 29.228368759155273, "loss_ib": 0.2956266403198242, "step": 152 }, { "ce_ib": 29.401348114013672, "ce_orig": 0.7986537218093872, "epoch": 0.04371270400460134, "kl_loss": 24.602405548095703, "loss_ib": 0.24896419048309326, "step": 152 }, { "ce_ib": 35.428165435791016, "ce_orig": 1.3112716674804688, "epoch": 0.044000287583578976, "kl_loss": 18.217554092407227, "loss_ib": 0.1857183575630188, "step": 153 }, { "ce_ib": 33.20622634887695, "ce_orig": 1.091870903968811, "epoch": 0.044000287583578976, "kl_loss": 18.279142379760742, "loss_ib": 0.18611203134059906, "step": 153 }, { "ce_ib": 32.40380859375, "ce_orig": 1.0627433061599731, "epoch": 0.044000287583578976, "kl_loss": 20.22241973876953, "loss_ib": 0.20546457171440125, "step": 153 }, { "ce_ib": 29.084455490112305, "ce_orig": 0.823095440864563, "epoch": 0.044000287583578976, "kl_loss": 23.27497673034668, "loss_ib": 0.235658198595047, "step": 153 }, { "ce_ib": 30.08700180053711, "ce_orig": 0.6791905164718628, "epoch": 0.04428787116255662, "kl_loss": 17.341888427734375, "loss_ib": 0.17642758786678314, "step": 154 }, { "ce_ib": 28.275983810424805, "ce_orig": 0.40569692850112915, "epoch": 0.04428787116255662, "kl_loss": 19.95773696899414, "loss_ib": 0.20240497589111328, "step": 154 }, { "ce_ib": 33.74617004394531, "ce_orig": 1.7346209287643433, "epoch": 0.04428787116255662, "kl_loss": 18.556991577148438, "loss_ib": 0.18894453346729279, "step": 154 }, { "ce_ib": 30.752422332763672, "ce_orig": 0.71451336145401, "epoch": 0.04428787116255662, "kl_loss": 16.57543182373047, "loss_ib": 0.168829545378685, "step": 154 }, { "epoch": 0.04457545474153426, "grad_norm": 3.4597690105438232, "learning_rate": 2.372611464968153e-05, "loss": 1.2585, "step": 155 }, { "ce_ib": 28.92538833618164, "ce_orig": 1.050588607788086, "epoch": 0.04457545474153426, "kl_loss": 19.674413681030273, "loss_ib": 0.19963666796684265, "step": 155 }, { "ce_ib": 31.494068145751953, "ce_orig": 1.3162670135498047, "epoch": 0.04457545474153426, "kl_loss": 15.291072845458984, "loss_ib": 0.156060129404068, "step": 155 }, { "ce_ib": 31.52849769592285, "ce_orig": 0.6012848615646362, "epoch": 0.04457545474153426, "kl_loss": 15.920844078063965, "loss_ib": 0.1623612940311432, "step": 155 }, { "ce_ib": 33.46098709106445, "ce_orig": 1.0411237478256226, "epoch": 0.04457545474153426, "kl_loss": 17.932607650756836, "loss_ib": 0.1826721727848053, "step": 155 }, { "ce_ib": 34.06367874145508, "ce_orig": 0.7581042647361755, "epoch": 0.044863038320511896, "kl_loss": 22.63808822631836, "loss_ib": 0.22978724539279938, "step": 156 }, { "ce_ib": 30.403427124023438, "ce_orig": 0.5148236751556396, "epoch": 0.044863038320511896, "kl_loss": 14.46303939819336, "loss_ib": 0.14767073094844818, "step": 156 }, { "ce_ib": 29.40231704711914, "ce_orig": 0.7519353032112122, "epoch": 0.044863038320511896, "kl_loss": 21.479459762573242, "loss_ib": 0.21773482859134674, "step": 156 }, { "ce_ib": 27.831212997436523, "ce_orig": 0.80788654088974, "epoch": 0.044863038320511896, "kl_loss": 16.518142700195312, "loss_ib": 0.16796454787254333, "step": 156 }, { "ce_ib": 27.716188430786133, "ce_orig": 0.7496557831764221, "epoch": 0.04515062189948954, "kl_loss": 13.905786514282227, "loss_ib": 0.1418294757604599, "step": 157 }, { "ce_ib": 28.782617568969727, "ce_orig": 0.7090852856636047, "epoch": 0.04515062189948954, "kl_loss": 15.777366638183594, "loss_ib": 0.16065192222595215, "step": 157 }, { "ce_ib": 26.00276756286621, "ce_orig": 0.494842529296875, "epoch": 0.04515062189948954, "kl_loss": 16.35750389099121, "loss_ib": 0.16617530584335327, "step": 157 }, { "ce_ib": 28.558490753173828, "ce_orig": 0.948776364326477, "epoch": 0.04515062189948954, "kl_loss": 15.582597732543945, "loss_ib": 0.15868182480335236, "step": 157 }, { "ce_ib": 34.348106384277344, "ce_orig": 1.4037892818450928, "epoch": 0.04543820547846718, "kl_loss": 15.35753059387207, "loss_ib": 0.15701010823249817, "step": 158 }, { "ce_ib": 30.06648826599121, "ce_orig": 1.0562583208084106, "epoch": 0.04543820547846718, "kl_loss": 13.857028007507324, "loss_ib": 0.14157693088054657, "step": 158 }, { "ce_ib": 33.296878814697266, "ce_orig": 1.184076189994812, "epoch": 0.04543820547846718, "kl_loss": 14.362920761108398, "loss_ib": 0.14695888757705688, "step": 158 }, { "ce_ib": 30.477880477905273, "ce_orig": 0.6938384771347046, "epoch": 0.04543820547846718, "kl_loss": 13.156094551086426, "loss_ib": 0.13460873067378998, "step": 158 }, { "ce_ib": 30.92000961303711, "ce_orig": 0.8126051425933838, "epoch": 0.04572578905744482, "kl_loss": 13.102733612060547, "loss_ib": 0.13411933183670044, "step": 159 }, { "ce_ib": 32.433162689208984, "ce_orig": 1.181881070137024, "epoch": 0.04572578905744482, "kl_loss": 14.020172119140625, "loss_ib": 0.14344502985477448, "step": 159 }, { "ce_ib": 33.700931549072266, "ce_orig": 1.5680264234542847, "epoch": 0.04572578905744482, "kl_loss": 13.899885177612305, "loss_ib": 0.14236894249916077, "step": 159 }, { "ce_ib": 28.371702194213867, "ce_orig": 0.9268200397491455, "epoch": 0.04572578905744482, "kl_loss": 18.150760650634766, "loss_ib": 0.18434476852416992, "step": 159 }, { "epoch": 0.04601337263642246, "grad_norm": 2.066725254058838, "learning_rate": 2.4522292993630575e-05, "loss": 1.0186, "step": 160 }, { "ce_ib": 29.896162033081055, "ce_orig": 0.8601086735725403, "epoch": 0.04601337263642246, "kl_loss": 12.835603713989258, "loss_ib": 0.13134564459323883, "step": 160 }, { "ce_ib": 29.533695220947266, "ce_orig": 1.1664679050445557, "epoch": 0.04601337263642246, "kl_loss": 15.90629768371582, "loss_ib": 0.1620163470506668, "step": 160 }, { "ce_ib": 28.180938720703125, "ce_orig": 0.8322929739952087, "epoch": 0.04601337263642246, "kl_loss": 12.797597885131836, "loss_ib": 0.13079407811164856, "step": 160 }, { "ce_ib": 28.38677215576172, "ce_orig": 0.8806703090667725, "epoch": 0.04601337263642246, "kl_loss": 16.691715240478516, "loss_ib": 0.16975581645965576, "step": 160 }, { "ce_ib": 27.899879455566406, "ce_orig": 0.6471708416938782, "epoch": 0.0463009562154001, "kl_loss": 14.290294647216797, "loss_ib": 0.14569292962551117, "step": 161 }, { "ce_ib": 27.485563278198242, "ce_orig": 0.9937444925308228, "epoch": 0.0463009562154001, "kl_loss": 15.568538665771484, "loss_ib": 0.1584339439868927, "step": 161 }, { "ce_ib": 30.291170120239258, "ce_orig": 0.7304977178573608, "epoch": 0.0463009562154001, "kl_loss": 9.206818580627441, "loss_ib": 0.09509730339050293, "step": 161 }, { "ce_ib": 29.51616859436035, "ce_orig": 1.386801838874817, "epoch": 0.0463009562154001, "kl_loss": 20.9112548828125, "loss_ib": 0.21206416189670563, "step": 161 }, { "ce_ib": 27.004371643066406, "ce_orig": 0.6013516783714294, "epoch": 0.04658853979437774, "kl_loss": 15.80407428741455, "loss_ib": 0.1607411801815033, "step": 162 }, { "ce_ib": 25.159454345703125, "ce_orig": 0.9960594773292542, "epoch": 0.04658853979437774, "kl_loss": 13.249858856201172, "loss_ib": 0.13501453399658203, "step": 162 }, { "ce_ib": 26.201725006103516, "ce_orig": 0.5098617076873779, "epoch": 0.04658853979437774, "kl_loss": 11.842464447021484, "loss_ib": 0.1210448145866394, "step": 162 }, { "ce_ib": 29.0825138092041, "ce_orig": 0.8241496086120605, "epoch": 0.04658853979437774, "kl_loss": 16.010656356811523, "loss_ib": 0.16301481425762177, "step": 162 }, { "ce_ib": 26.992971420288086, "ce_orig": 0.8256320357322693, "epoch": 0.04687612337335538, "kl_loss": 11.819284439086914, "loss_ib": 0.12089213728904724, "step": 163 }, { "ce_ib": 27.297061920166016, "ce_orig": 0.9797989726066589, "epoch": 0.04687612337335538, "kl_loss": 12.12143325805664, "loss_ib": 0.12394402921199799, "step": 163 }, { "ce_ib": 26.038820266723633, "ce_orig": 0.779868483543396, "epoch": 0.04687612337335538, "kl_loss": 12.200529098510742, "loss_ib": 0.12460917234420776, "step": 163 }, { "ce_ib": 30.567201614379883, "ce_orig": 1.4183546304702759, "epoch": 0.04687612337335538, "kl_loss": 11.150833129882812, "loss_ib": 0.11456504464149475, "step": 163 }, { "ce_ib": 27.423969268798828, "ce_orig": 0.6227314472198486, "epoch": 0.047163706952333025, "kl_loss": 11.591859817504883, "loss_ib": 0.11866099387407303, "step": 164 }, { "ce_ib": 31.1706485748291, "ce_orig": 0.592538595199585, "epoch": 0.047163706952333025, "kl_loss": 11.143152236938477, "loss_ib": 0.11454858630895615, "step": 164 }, { "ce_ib": 32.50811004638672, "ce_orig": 0.8140405416488647, "epoch": 0.047163706952333025, "kl_loss": 13.64712905883789, "loss_ib": 0.1397220939397812, "step": 164 }, { "ce_ib": 27.141164779663086, "ce_orig": 0.41711243987083435, "epoch": 0.047163706952333025, "kl_loss": 12.186077117919922, "loss_ib": 0.12457488477230072, "step": 164 }, { "epoch": 0.04745129053131066, "grad_norm": 1.150227665901184, "learning_rate": 2.531847133757962e-05, "loss": 0.983, "step": 165 }, { "ce_ib": 25.222728729248047, "ce_orig": 0.6572214365005493, "epoch": 0.04745129053131066, "kl_loss": 11.52933120727539, "loss_ib": 0.11781557649374008, "step": 165 }, { "ce_ib": 33.31783676147461, "ce_orig": 0.8566097617149353, "epoch": 0.04745129053131066, "kl_loss": 12.30784797668457, "loss_ib": 0.12641026079654694, "step": 165 }, { "ce_ib": 24.890148162841797, "ce_orig": 0.5485845804214478, "epoch": 0.04745129053131066, "kl_loss": 13.047416687011719, "loss_ib": 0.1329631805419922, "step": 165 }, { "ce_ib": 28.270605087280273, "ce_orig": 0.3421739935874939, "epoch": 0.04745129053131066, "kl_loss": 15.006128311157227, "loss_ib": 0.15288834273815155, "step": 165 }, { "ce_ib": 26.621320724487305, "ce_orig": 1.039825439453125, "epoch": 0.0477388741102883, "kl_loss": 11.003231048583984, "loss_ib": 0.11269444227218628, "step": 166 }, { "ce_ib": 17.792619705200195, "ce_orig": 0.09731145948171616, "epoch": 0.0477388741102883, "kl_loss": 6.299266338348389, "loss_ib": 0.06477192044258118, "step": 166 }, { "ce_ib": 29.130701065063477, "ce_orig": 1.3552623987197876, "epoch": 0.0477388741102883, "kl_loss": 12.245400428771973, "loss_ib": 0.12536707520484924, "step": 166 }, { "ce_ib": 29.495161056518555, "ce_orig": 0.5962749123573303, "epoch": 0.0477388741102883, "kl_loss": 11.876587867736816, "loss_ib": 0.12171538919210434, "step": 166 }, { "ce_ib": 28.59954833984375, "ce_orig": 1.011759638786316, "epoch": 0.048026457689265944, "kl_loss": 10.475525856018066, "loss_ib": 0.10761521011590958, "step": 167 }, { "ce_ib": 26.95580291748047, "ce_orig": 0.7863696813583374, "epoch": 0.048026457689265944, "kl_loss": 11.420799255371094, "loss_ib": 0.11690356582403183, "step": 167 }, { "ce_ib": 25.404388427734375, "ce_orig": 0.49368423223495483, "epoch": 0.048026457689265944, "kl_loss": 10.898456573486328, "loss_ib": 0.11152499914169312, "step": 167 }, { "ce_ib": 27.980323791503906, "ce_orig": 0.8852983713150024, "epoch": 0.048026457689265944, "kl_loss": 11.366129875183105, "loss_ib": 0.11645933240652084, "step": 167 }, { "ce_ib": 25.69623374938965, "ce_orig": 0.875866174697876, "epoch": 0.04831404126824358, "kl_loss": 11.159571647644043, "loss_ib": 0.11416534334421158, "step": 168 }, { "ce_ib": 26.52794647216797, "ce_orig": 0.7182326912879944, "epoch": 0.04831404126824358, "kl_loss": 10.362823486328125, "loss_ib": 0.10628102719783783, "step": 168 }, { "ce_ib": 26.30867576599121, "ce_orig": 0.8692768216133118, "epoch": 0.04831404126824358, "kl_loss": 10.388944625854492, "loss_ib": 0.10652031004428864, "step": 168 }, { "ce_ib": 24.659727096557617, "ce_orig": 0.6755059361457825, "epoch": 0.04831404126824358, "kl_loss": 10.561405181884766, "loss_ib": 0.10808002203702927, "step": 168 }, { "ce_ib": 29.72395896911621, "ce_orig": 1.1792970895767212, "epoch": 0.04860162484722123, "kl_loss": 10.214838981628418, "loss_ib": 0.10512077808380127, "step": 169 }, { "ce_ib": 27.70913314819336, "ce_orig": 0.9696344137191772, "epoch": 0.04860162484722123, "kl_loss": 10.429807662963867, "loss_ib": 0.1070689857006073, "step": 169 }, { "ce_ib": 27.571584701538086, "ce_orig": 0.9312324523925781, "epoch": 0.04860162484722123, "kl_loss": 10.552055358886719, "loss_ib": 0.10827770829200745, "step": 169 }, { "ce_ib": 25.53492546081543, "ce_orig": 0.8822551369667053, "epoch": 0.04860162484722123, "kl_loss": 11.001655578613281, "loss_ib": 0.11257004737854004, "step": 169 }, { "epoch": 0.048889208426198864, "grad_norm": 0.8837189674377441, "learning_rate": 2.6114649681528662e-05, "loss": 0.9786, "step": 170 }, { "ce_ib": 25.924278259277344, "ce_orig": 1.155822992324829, "epoch": 0.048889208426198864, "kl_loss": 10.456619262695312, "loss_ib": 0.10715862363576889, "step": 170 }, { "ce_ib": 27.14344024658203, "ce_orig": 1.013275146484375, "epoch": 0.048889208426198864, "kl_loss": 9.088029861450195, "loss_ib": 0.09359464794397354, "step": 170 }, { "ce_ib": 23.778573989868164, "ce_orig": 0.5937850475311279, "epoch": 0.048889208426198864, "kl_loss": 11.208532333374023, "loss_ib": 0.11446317285299301, "step": 170 }, { "ce_ib": 28.437326431274414, "ce_orig": 1.3872705698013306, "epoch": 0.048889208426198864, "kl_loss": 11.0403413772583, "loss_ib": 0.11324714124202728, "step": 170 }, { "ce_ib": 29.6293888092041, "ce_orig": 1.264078974723816, "epoch": 0.0491767920051765, "kl_loss": 10.278146743774414, "loss_ib": 0.10574440658092499, "step": 171 }, { "ce_ib": 23.555601119995117, "ce_orig": 0.5615886449813843, "epoch": 0.0491767920051765, "kl_loss": 10.424758911132812, "loss_ib": 0.10660314559936523, "step": 171 }, { "ce_ib": 29.939388275146484, "ce_orig": 0.7696157097816467, "epoch": 0.0491767920051765, "kl_loss": 10.607294082641602, "loss_ib": 0.10906687378883362, "step": 171 }, { "ce_ib": 21.64013671875, "ce_orig": 0.8276143074035645, "epoch": 0.0491767920051765, "kl_loss": 11.212567329406738, "loss_ib": 0.11428967863321304, "step": 171 }, { "ce_ib": 27.828157424926758, "ce_orig": 0.9696255922317505, "epoch": 0.04946437558415415, "kl_loss": 10.001435279846191, "loss_ib": 0.10279716551303864, "step": 172 }, { "ce_ib": 23.958757400512695, "ce_orig": 0.6945645213127136, "epoch": 0.04946437558415415, "kl_loss": 11.062480926513672, "loss_ib": 0.11302068829536438, "step": 172 }, { "ce_ib": 27.76424217224121, "ce_orig": 0.9959214329719543, "epoch": 0.04946437558415415, "kl_loss": 10.427704811096191, "loss_ib": 0.10705346614122391, "step": 172 }, { "ce_ib": 25.078935623168945, "ce_orig": 0.5796197056770325, "epoch": 0.04946437558415415, "kl_loss": 10.434064865112305, "loss_ib": 0.10684854537248611, "step": 172 }, { "ce_ib": 28.147438049316406, "ce_orig": 0.8044544458389282, "epoch": 0.049751959163131784, "kl_loss": 10.538864135742188, "loss_ib": 0.10820338129997253, "step": 173 }, { "ce_ib": 29.065446853637695, "ce_orig": 0.8273786902427673, "epoch": 0.049751959163131784, "kl_loss": 9.853753089904785, "loss_ib": 0.1014440730214119, "step": 173 }, { "ce_ib": 27.74785614013672, "ce_orig": 1.2104791402816772, "epoch": 0.049751959163131784, "kl_loss": 10.07681655883789, "loss_ib": 0.10354294627904892, "step": 173 }, { "ce_ib": 26.78622817993164, "ce_orig": 1.5120453834533691, "epoch": 0.049751959163131784, "kl_loss": 9.62009334564209, "loss_ib": 0.09887955337762833, "step": 173 }, { "ce_ib": 19.017391204833984, "ce_orig": 0.5162482857704163, "epoch": 0.05003954274210943, "kl_loss": 7.353050231933594, "loss_ib": 0.07543224096298218, "step": 174 }, { "ce_ib": 23.64644432067871, "ce_orig": 0.9337442517280579, "epoch": 0.05003954274210943, "kl_loss": 10.005657196044922, "loss_ib": 0.10242121666669846, "step": 174 }, { "ce_ib": 26.815704345703125, "ce_orig": 0.6984226107597351, "epoch": 0.05003954274210943, "kl_loss": 10.047138214111328, "loss_ib": 0.10315295308828354, "step": 174 }, { "ce_ib": 23.5247859954834, "ce_orig": 0.6298738718032837, "epoch": 0.05003954274210943, "kl_loss": 9.880701065063477, "loss_ib": 0.1011594831943512, "step": 174 }, { "epoch": 0.050327126321087066, "grad_norm": 0.5031439661979675, "learning_rate": 2.6910828025477707e-05, "loss": 0.9779, "step": 175 }, { "ce_ib": 27.915422439575195, "ce_orig": 1.2774735689163208, "epoch": 0.050327126321087066, "kl_loss": 10.713859558105469, "loss_ib": 0.1099301278591156, "step": 175 }, { "ce_ib": 25.17244529724121, "ce_orig": 0.5252784490585327, "epoch": 0.050327126321087066, "kl_loss": 10.287009239196777, "loss_ib": 0.10538733005523682, "step": 175 }, { "ce_ib": 25.812246322631836, "ce_orig": 0.7732113599777222, "epoch": 0.050327126321087066, "kl_loss": 8.927350997924805, "loss_ib": 0.09185472875833511, "step": 175 }, { "ce_ib": 23.02685546875, "ce_orig": 0.7139325141906738, "epoch": 0.050327126321087066, "kl_loss": 10.248601913452148, "loss_ib": 0.10478869825601578, "step": 175 }, { "ce_ib": 22.77245330810547, "ce_orig": 0.8318886756896973, "epoch": 0.050614709900064704, "kl_loss": 10.135682106018066, "loss_ib": 0.1036340594291687, "step": 176 }, { "ce_ib": 27.42522430419922, "ce_orig": 0.9915688037872314, "epoch": 0.050614709900064704, "kl_loss": 10.458263397216797, "loss_ib": 0.10732515156269073, "step": 176 }, { "ce_ib": 24.290016174316406, "ce_orig": 0.7032797932624817, "epoch": 0.050614709900064704, "kl_loss": 10.18847370147705, "loss_ib": 0.10431373119354248, "step": 176 }, { "ce_ib": 27.81938362121582, "ce_orig": 1.1106735467910767, "epoch": 0.050614709900064704, "kl_loss": 9.77632999420166, "loss_ib": 0.100545234978199, "step": 176 }, { "ce_ib": 28.1321964263916, "ce_orig": 1.3234449625015259, "epoch": 0.05090229347904235, "kl_loss": 9.504875183105469, "loss_ib": 0.09786196798086166, "step": 177 }, { "ce_ib": 25.004257202148438, "ce_orig": 0.7698526382446289, "epoch": 0.05090229347904235, "kl_loss": 10.274667739868164, "loss_ib": 0.10524710267782211, "step": 177 }, { "ce_ib": 25.05718421936035, "ce_orig": 0.8450519442558289, "epoch": 0.05090229347904235, "kl_loss": 7.935550689697266, "loss_ib": 0.0818612277507782, "step": 177 }, { "ce_ib": 24.45059585571289, "ce_orig": 0.6560284495353699, "epoch": 0.05090229347904235, "kl_loss": 10.264579772949219, "loss_ib": 0.10509085655212402, "step": 177 }, { "ce_ib": 22.231950759887695, "ce_orig": 0.8478792309761047, "epoch": 0.051189877058019986, "kl_loss": 9.088963508605957, "loss_ib": 0.09311282634735107, "step": 178 }, { "ce_ib": 25.44860076904297, "ce_orig": 0.7396875619888306, "epoch": 0.051189877058019986, "kl_loss": 9.547811508178711, "loss_ib": 0.09802297502756119, "step": 178 }, { "ce_ib": 26.52227783203125, "ce_orig": 1.3045439720153809, "epoch": 0.051189877058019986, "kl_loss": 9.957924842834473, "loss_ib": 0.1022314727306366, "step": 178 }, { "ce_ib": 25.924222946166992, "ce_orig": 1.1649706363677979, "epoch": 0.051189877058019986, "kl_loss": 10.241584777832031, "loss_ib": 0.10500826686620712, "step": 178 }, { "ce_ib": 27.674495697021484, "ce_orig": 0.5262369513511658, "epoch": 0.051477460636997624, "kl_loss": 8.583837509155273, "loss_ib": 0.08860582113265991, "step": 179 }, { "ce_ib": 29.368635177612305, "ce_orig": 1.8323945999145508, "epoch": 0.051477460636997624, "kl_loss": 10.265556335449219, "loss_ib": 0.10559242218732834, "step": 179 }, { "ce_ib": 24.87542152404785, "ce_orig": 0.8622165322303772, "epoch": 0.051477460636997624, "kl_loss": 9.931290626525879, "loss_ib": 0.10180044919252396, "step": 179 }, { "ce_ib": 24.743249893188477, "ce_orig": 0.8221871852874756, "epoch": 0.051477460636997624, "kl_loss": 9.529619216918945, "loss_ib": 0.09777051955461502, "step": 179 }, { "epoch": 0.05176504421597527, "grad_norm": 0.6572920680046082, "learning_rate": 2.7707006369426753e-05, "loss": 0.9762, "step": 180 }, { "ce_ib": 26.228139877319336, "ce_orig": 0.9346477389335632, "epoch": 0.05176504421597527, "kl_loss": 9.228906631469727, "loss_ib": 0.09491188079118729, "step": 180 }, { "ce_ib": 27.96097183227539, "ce_orig": 1.4497267007827759, "epoch": 0.05176504421597527, "kl_loss": 9.41794204711914, "loss_ib": 0.09697551280260086, "step": 180 }, { "ce_ib": 25.501893997192383, "ce_orig": 1.3674439191818237, "epoch": 0.05176504421597527, "kl_loss": 9.394105911254883, "loss_ib": 0.0964912474155426, "step": 180 }, { "ce_ib": 27.754831314086914, "ce_orig": 0.9353328943252563, "epoch": 0.05176504421597527, "kl_loss": 9.990425109863281, "loss_ib": 0.10267972946166992, "step": 180 }, { "ce_ib": 24.477588653564453, "ce_orig": 1.223670482635498, "epoch": 0.052052627794952906, "kl_loss": 9.197659492492676, "loss_ib": 0.09442435204982758, "step": 181 }, { "ce_ib": 23.42432403564453, "ce_orig": 0.34692513942718506, "epoch": 0.052052627794952906, "kl_loss": 9.035377502441406, "loss_ib": 0.09269620478153229, "step": 181 }, { "ce_ib": 27.408384323120117, "ce_orig": 1.0176830291748047, "epoch": 0.052052627794952906, "kl_loss": 8.829448699951172, "loss_ib": 0.09103532880544662, "step": 181 }, { "ce_ib": 20.15254020690918, "ce_orig": 0.4916859269142151, "epoch": 0.052052627794952906, "kl_loss": 8.9959716796875, "loss_ib": 0.09197497367858887, "step": 181 }, { "ce_ib": 28.84882164001465, "ce_orig": 1.4133418798446655, "epoch": 0.05234021137393055, "kl_loss": 9.433625221252441, "loss_ib": 0.09722113609313965, "step": 182 }, { "ce_ib": 24.220762252807617, "ce_orig": 0.7626959085464478, "epoch": 0.05234021137393055, "kl_loss": 9.004999160766602, "loss_ib": 0.09247206151485443, "step": 182 }, { "ce_ib": 26.707427978515625, "ce_orig": 0.950811505317688, "epoch": 0.05234021137393055, "kl_loss": 9.357291221618652, "loss_ib": 0.09624365717172623, "step": 182 }, { "ce_ib": 23.827503204345703, "ce_orig": 0.5993396639823914, "epoch": 0.05234021137393055, "kl_loss": 9.675762176513672, "loss_ib": 0.09914036840200424, "step": 182 }, { "ce_ib": 25.040048599243164, "ce_orig": 1.0414315462112427, "epoch": 0.05262779495290819, "kl_loss": 9.17612075805664, "loss_ib": 0.09426520764827728, "step": 183 }, { "ce_ib": 26.632596969604492, "ce_orig": 1.2410509586334229, "epoch": 0.05262779495290819, "kl_loss": 9.67950439453125, "loss_ib": 0.09945829957723618, "step": 183 }, { "ce_ib": 22.586328506469727, "ce_orig": 0.5787039399147034, "epoch": 0.05262779495290819, "kl_loss": 9.118326187133789, "loss_ib": 0.09344189614057541, "step": 183 }, { "ce_ib": 29.002498626708984, "ce_orig": 1.1482164859771729, "epoch": 0.05262779495290819, "kl_loss": 10.303224563598633, "loss_ib": 0.10593248903751373, "step": 183 }, { "ce_ib": 23.188966751098633, "ce_orig": 0.7345482110977173, "epoch": 0.052915378531885826, "kl_loss": 9.377893447875977, "loss_ib": 0.09609782695770264, "step": 184 }, { "ce_ib": 25.167457580566406, "ce_orig": 1.279574990272522, "epoch": 0.052915378531885826, "kl_loss": 8.157093048095703, "loss_ib": 0.08408767729997635, "step": 184 }, { "ce_ib": 25.17441749572754, "ce_orig": 1.2902156114578247, "epoch": 0.052915378531885826, "kl_loss": 8.778035163879395, "loss_ib": 0.09029779583215714, "step": 184 }, { "ce_ib": 27.5651798248291, "ce_orig": 0.6481632590293884, "epoch": 0.052915378531885826, "kl_loss": 8.615208625793457, "loss_ib": 0.0889086052775383, "step": 184 }, { "epoch": 0.05320296211086347, "grad_norm": 0.774932861328125, "learning_rate": 2.8503184713375798e-05, "loss": 1.0273, "step": 185 }, { "ce_ib": 28.26412582397461, "ce_orig": 0.9693439602851868, "epoch": 0.05320296211086347, "kl_loss": 9.72558307647705, "loss_ib": 0.10008224099874496, "step": 185 }, { "ce_ib": 20.355464935302734, "ce_orig": 0.6961947679519653, "epoch": 0.05320296211086347, "kl_loss": 8.683027267456055, "loss_ib": 0.08886582404375076, "step": 185 }, { "ce_ib": 19.516334533691406, "ce_orig": 0.6023780703544617, "epoch": 0.05320296211086347, "kl_loss": 9.514884948730469, "loss_ib": 0.09710048139095306, "step": 185 }, { "ce_ib": 21.90512466430664, "ce_orig": 0.8949795961380005, "epoch": 0.05320296211086347, "kl_loss": 9.39652156829834, "loss_ib": 0.09615572541952133, "step": 185 }, { "ce_ib": 24.16393280029297, "ce_orig": 0.730219304561615, "epoch": 0.05349054568984111, "kl_loss": 8.413753509521484, "loss_ib": 0.08655392378568649, "step": 186 }, { "ce_ib": 24.4334774017334, "ce_orig": 1.2984904050827026, "epoch": 0.05349054568984111, "kl_loss": 8.700630187988281, "loss_ib": 0.08944965153932571, "step": 186 }, { "ce_ib": 22.994918823242188, "ce_orig": 0.9692792296409607, "epoch": 0.05349054568984111, "kl_loss": 8.794185638427734, "loss_ib": 0.09024134278297424, "step": 186 }, { "ce_ib": 27.755258560180664, "ce_orig": 1.4234228134155273, "epoch": 0.05349054568984111, "kl_loss": 5.130355358123779, "loss_ib": 0.0540790781378746, "step": 186 }, { "ce_ib": 19.920040130615234, "ce_orig": 0.459452748298645, "epoch": 0.05377812926881875, "kl_loss": 7.401340484619141, "loss_ib": 0.07600540667772293, "step": 187 }, { "ce_ib": 22.339643478393555, "ce_orig": 0.7629045844078064, "epoch": 0.05377812926881875, "kl_loss": 8.446830749511719, "loss_ib": 0.08670226484537125, "step": 187 }, { "ce_ib": 23.796178817749023, "ce_orig": 1.3895570039749146, "epoch": 0.05377812926881875, "kl_loss": 9.165254592895508, "loss_ib": 0.0940321609377861, "step": 187 }, { "ce_ib": 21.33721351623535, "ce_orig": 0.2807011902332306, "epoch": 0.05377812926881875, "kl_loss": 8.006156921386719, "loss_ib": 0.08219528943300247, "step": 187 }, { "ce_ib": 20.01226234436035, "ce_orig": 0.7121122479438782, "epoch": 0.05406571284779639, "kl_loss": 8.959085464477539, "loss_ib": 0.09159208089113235, "step": 188 }, { "ce_ib": 19.18909454345703, "ce_orig": 0.7582953572273254, "epoch": 0.05406571284779639, "kl_loss": 8.402653694152832, "loss_ib": 0.08594544231891632, "step": 188 }, { "ce_ib": 23.931289672851562, "ce_orig": 0.8940808773040771, "epoch": 0.05406571284779639, "kl_loss": 8.514259338378906, "loss_ib": 0.08753572404384613, "step": 188 }, { "ce_ib": 20.879886627197266, "ce_orig": 0.5851081609725952, "epoch": 0.05406571284779639, "kl_loss": 9.260396957397461, "loss_ib": 0.09469195455312729, "step": 188 }, { "ce_ib": 20.511985778808594, "ce_orig": 0.8533673882484436, "epoch": 0.05435329642677403, "kl_loss": 8.759720802307129, "loss_ib": 0.08964840322732925, "step": 189 }, { "ce_ib": 23.13450050354004, "ce_orig": 1.0011026859283447, "epoch": 0.05435329642677403, "kl_loss": 8.676036834716797, "loss_ib": 0.08907381445169449, "step": 189 }, { "ce_ib": 22.484384536743164, "ce_orig": 0.5926994681358337, "epoch": 0.05435329642677403, "kl_loss": 9.435342788696289, "loss_ib": 0.09660186618566513, "step": 189 }, { "ce_ib": 21.21821403503418, "ce_orig": 0.8962640166282654, "epoch": 0.05435329642677403, "kl_loss": 8.669075012207031, "loss_ib": 0.08881256729364395, "step": 189 }, { "epoch": 0.05464088000575167, "grad_norm": 0.43721508979797363, "learning_rate": 2.929936305732484e-05, "loss": 1.0218, "step": 190 }, { "ce_ib": 21.65335464477539, "ce_orig": 0.7994527816772461, "epoch": 0.05464088000575167, "kl_loss": 8.212764739990234, "loss_ib": 0.08429298549890518, "step": 190 }, { "ce_ib": 25.716175079345703, "ce_orig": 1.026253342628479, "epoch": 0.05464088000575167, "kl_loss": 8.664275169372559, "loss_ib": 0.08921436965465546, "step": 190 }, { "ce_ib": 19.4307861328125, "ce_orig": 0.8895479440689087, "epoch": 0.05464088000575167, "kl_loss": 8.509403228759766, "loss_ib": 0.0870371162891388, "step": 190 }, { "ce_ib": 21.85231590270996, "ce_orig": 0.7853972911834717, "epoch": 0.05464088000575167, "kl_loss": 8.377355575561523, "loss_ib": 0.08595878630876541, "step": 190 }, { "ce_ib": 21.575359344482422, "ce_orig": 1.0062997341156006, "epoch": 0.05492846358472931, "kl_loss": 9.271797180175781, "loss_ib": 0.0948755070567131, "step": 191 }, { "ce_ib": 18.518245697021484, "ce_orig": 0.6092102527618408, "epoch": 0.05492846358472931, "kl_loss": 8.641265869140625, "loss_ib": 0.08826448023319244, "step": 191 }, { "ce_ib": 25.908557891845703, "ce_orig": 0.7555634379386902, "epoch": 0.05492846358472931, "kl_loss": 9.02600383758545, "loss_ib": 0.09285089373588562, "step": 191 }, { "ce_ib": 22.47454071044922, "ce_orig": 0.5190201997756958, "epoch": 0.05492846358472931, "kl_loss": 9.089900970458984, "loss_ib": 0.09314646571874619, "step": 191 }, { "ce_ib": 19.4965763092041, "ce_orig": 0.8628413081169128, "epoch": 0.055216047163706955, "kl_loss": 9.05790901184082, "loss_ib": 0.09252873808145523, "step": 192 }, { "ce_ib": 24.495662689208984, "ce_orig": 1.0552870035171509, "epoch": 0.055216047163706955, "kl_loss": 8.362863540649414, "loss_ib": 0.0860782042145729, "step": 192 }, { "ce_ib": 24.617902755737305, "ce_orig": 1.3669184446334839, "epoch": 0.055216047163706955, "kl_loss": 8.252336502075195, "loss_ib": 0.08498515188694, "step": 192 }, { "ce_ib": 21.620195388793945, "ce_orig": 0.9216135144233704, "epoch": 0.055216047163706955, "kl_loss": 8.622823715209961, "loss_ib": 0.08839025348424911, "step": 192 }, { "ce_ib": 23.482017517089844, "ce_orig": 1.2965989112854004, "epoch": 0.05550363074268459, "kl_loss": 8.686678886413574, "loss_ib": 0.089214988052845, "step": 193 }, { "ce_ib": 21.503093719482422, "ce_orig": 1.1102378368377686, "epoch": 0.05550363074268459, "kl_loss": 8.758203506469727, "loss_ib": 0.0897323414683342, "step": 193 }, { "ce_ib": 21.88249969482422, "ce_orig": 0.3644579350948334, "epoch": 0.05550363074268459, "kl_loss": 7.924787998199463, "loss_ib": 0.08143612742424011, "step": 193 }, { "ce_ib": 21.49346160888672, "ce_orig": 0.8568457961082458, "epoch": 0.05550363074268459, "kl_loss": 8.320171356201172, "loss_ib": 0.08535105735063553, "step": 193 }, { "ce_ib": 18.73956298828125, "ce_orig": 0.8066674470901489, "epoch": 0.05579121432166223, "kl_loss": 8.048727035522461, "loss_ib": 0.08236122876405716, "step": 194 }, { "ce_ib": 24.636383056640625, "ce_orig": 0.97906494140625, "epoch": 0.05579121432166223, "kl_loss": 7.121569633483887, "loss_ib": 0.07367932796478271, "step": 194 }, { "ce_ib": 20.886672973632812, "ce_orig": 1.25295090675354, "epoch": 0.05579121432166223, "kl_loss": 8.471221923828125, "loss_ib": 0.08680088818073273, "step": 194 }, { "ce_ib": 19.9046630859375, "ce_orig": 0.5161154866218567, "epoch": 0.05579121432166223, "kl_loss": 7.873350143432617, "loss_ib": 0.08072397112846375, "step": 194 }, { "epoch": 0.056078797900639875, "grad_norm": 0.8270230293273926, "learning_rate": 3.0095541401273885e-05, "loss": 0.9806, "step": 195 }, { "ce_ib": 20.66087532043457, "ce_orig": 0.6626381874084473, "epoch": 0.056078797900639875, "kl_loss": 8.434722900390625, "loss_ib": 0.08641331642866135, "step": 195 }, { "ce_ib": 22.705623626708984, "ce_orig": 0.9331481456756592, "epoch": 0.056078797900639875, "kl_loss": 7.2313232421875, "loss_ib": 0.07458379119634628, "step": 195 }, { "ce_ib": 23.993696212768555, "ce_orig": 0.9489652514457703, "epoch": 0.056078797900639875, "kl_loss": 7.374420166015625, "loss_ib": 0.07614357024431229, "step": 195 }, { "ce_ib": 24.617033004760742, "ce_orig": 0.7637354135513306, "epoch": 0.056078797900639875, "kl_loss": 7.686088562011719, "loss_ib": 0.07932259142398834, "step": 195 }, { "ce_ib": 21.54843521118164, "ce_orig": 0.8521741032600403, "epoch": 0.05636638147961751, "kl_loss": 8.026320457458496, "loss_ib": 0.0824180468916893, "step": 196 }, { "ce_ib": 20.1884822845459, "ce_orig": 0.8504369258880615, "epoch": 0.05636638147961751, "kl_loss": 7.845184326171875, "loss_ib": 0.08047069609165192, "step": 196 }, { "ce_ib": 22.211240768432617, "ce_orig": 0.4319168031215668, "epoch": 0.05636638147961751, "kl_loss": 6.318869590759277, "loss_ib": 0.065409816801548, "step": 196 }, { "ce_ib": 20.042993545532227, "ce_orig": 0.6225204467773438, "epoch": 0.05636638147961751, "kl_loss": 8.074682235717773, "loss_ib": 0.08275111764669418, "step": 196 }, { "ce_ib": 13.801077842712402, "ce_orig": 0.4428274929523468, "epoch": 0.05665396505859516, "kl_loss": 7.092032432556152, "loss_ib": 0.07230043411254883, "step": 197 }, { "ce_ib": 19.726043701171875, "ce_orig": 0.5650824904441833, "epoch": 0.05665396505859516, "kl_loss": 7.761396408081055, "loss_ib": 0.07958656549453735, "step": 197 }, { "ce_ib": 23.52407455444336, "ce_orig": 1.374847650527954, "epoch": 0.05665396505859516, "kl_loss": 6.945611000061035, "loss_ib": 0.07180851697921753, "step": 197 }, { "ce_ib": 21.02933120727539, "ce_orig": 0.9913616180419922, "epoch": 0.05665396505859516, "kl_loss": 7.67958402633667, "loss_ib": 0.07889877259731293, "step": 197 }, { "ce_ib": 26.16086196899414, "ce_orig": 1.5300548076629639, "epoch": 0.056941548637572795, "kl_loss": 7.4000701904296875, "loss_ib": 0.0766167864203453, "step": 198 }, { "ce_ib": 20.750835418701172, "ce_orig": 0.9555485844612122, "epoch": 0.056941548637572795, "kl_loss": 7.1511125564575195, "loss_ib": 0.07358621060848236, "step": 198 }, { "ce_ib": 23.05903434753418, "ce_orig": 1.1008634567260742, "epoch": 0.056941548637572795, "kl_loss": 7.473138332366943, "loss_ib": 0.0770372822880745, "step": 198 }, { "ce_ib": 21.61954689025879, "ce_orig": 1.4359227418899536, "epoch": 0.056941548637572795, "kl_loss": 7.772992134094238, "loss_ib": 0.0798918753862381, "step": 198 }, { "ce_ib": 22.668001174926758, "ce_orig": 1.0338892936706543, "epoch": 0.05722913221655043, "kl_loss": 7.578032493591309, "loss_ib": 0.07804711908102036, "step": 199 }, { "ce_ib": 20.854860305786133, "ce_orig": 0.9726830124855042, "epoch": 0.05722913221655043, "kl_loss": 7.427217483520508, "loss_ib": 0.0763576552271843, "step": 199 }, { "ce_ib": 19.557754516601562, "ce_orig": 0.8703896403312683, "epoch": 0.05722913221655043, "kl_loss": 7.243409633636475, "loss_ib": 0.07438986748456955, "step": 199 }, { "ce_ib": 18.793437957763672, "ce_orig": 0.8299582004547119, "epoch": 0.05722913221655043, "kl_loss": 6.471531867980957, "loss_ib": 0.06659466028213501, "step": 199 }, { "epoch": 0.05751671579552808, "grad_norm": 0.6937683820724487, "learning_rate": 3.089171974522293e-05, "loss": 0.982, "step": 200 }, { "ce_ib": 18.451953887939453, "ce_orig": 1.0577921867370605, "epoch": 0.05751671579552808, "kl_loss": 7.2733869552612305, "loss_ib": 0.07457906752824783, "step": 200 }, { "ce_ib": 23.337678909301758, "ce_orig": 1.3253329992294312, "epoch": 0.05751671579552808, "kl_loss": 7.374900817871094, "loss_ib": 0.07608277350664139, "step": 200 }, { "ce_ib": 18.122037887573242, "ce_orig": 0.9964814782142639, "epoch": 0.05751671579552808, "kl_loss": 7.532997131347656, "loss_ib": 0.07714217156171799, "step": 200 }, { "ce_ib": 19.866018295288086, "ce_orig": 0.7532010078430176, "epoch": 0.05751671579552808, "kl_loss": 6.963897705078125, "loss_ib": 0.07162558287382126, "step": 200 }, { "ce_ib": 18.71930503845215, "ce_orig": 0.8960237503051758, "epoch": 0.057804299374505715, "kl_loss": 6.8690900802612305, "loss_ib": 0.07056283205747604, "step": 201 }, { "ce_ib": 22.056734085083008, "ce_orig": 1.0263980627059937, "epoch": 0.057804299374505715, "kl_loss": 6.602439880371094, "loss_ib": 0.06823007017374039, "step": 201 }, { "ce_ib": 24.96833038330078, "ce_orig": 1.6670337915420532, "epoch": 0.057804299374505715, "kl_loss": 6.63405704498291, "loss_ib": 0.06883740425109863, "step": 201 }, { "ce_ib": 17.40508460998535, "ce_orig": 0.3124699592590332, "epoch": 0.057804299374505715, "kl_loss": 6.398665428161621, "loss_ib": 0.06572715938091278, "step": 201 }, { "ce_ib": 13.636467933654785, "ce_orig": 0.5163049697875977, "epoch": 0.05809188295348336, "kl_loss": 6.814591407775879, "loss_ib": 0.06950955837965012, "step": 202 }, { "ce_ib": 18.503398895263672, "ce_orig": 0.8511436581611633, "epoch": 0.05809188295348336, "kl_loss": 4.558845043182373, "loss_ib": 0.047438789159059525, "step": 202 }, { "ce_ib": 22.386396408081055, "ce_orig": 0.974443793296814, "epoch": 0.05809188295348336, "kl_loss": 6.523048400878906, "loss_ib": 0.06746912002563477, "step": 202 }, { "ce_ib": 20.26010513305664, "ce_orig": 0.7885109186172485, "epoch": 0.05809188295348336, "kl_loss": 6.658895015716553, "loss_ib": 0.06861495971679688, "step": 202 }, { "ce_ib": 24.684518814086914, "ce_orig": 1.362154245376587, "epoch": 0.058379466532461, "kl_loss": 5.672746658325195, "loss_ib": 0.05919591709971428, "step": 203 }, { "ce_ib": 18.035612106323242, "ce_orig": 0.6344237923622131, "epoch": 0.058379466532461, "kl_loss": 6.552053451538086, "loss_ib": 0.06732409447431564, "step": 203 }, { "ce_ib": 19.674922943115234, "ce_orig": 1.129352331161499, "epoch": 0.058379466532461, "kl_loss": 6.27418327331543, "loss_ib": 0.06470932066440582, "step": 203 }, { "ce_ib": 12.673866271972656, "ce_orig": 0.2503475248813629, "epoch": 0.058379466532461, "kl_loss": 4.017500877380371, "loss_ib": 0.0414423942565918, "step": 203 }, { "ce_ib": 16.628164291381836, "ce_orig": 0.6799634099006653, "epoch": 0.058667050111438634, "kl_loss": 5.470815181732178, "loss_ib": 0.056370966136455536, "step": 204 }, { "ce_ib": 23.80594825744629, "ce_orig": 1.2403467893600464, "epoch": 0.058667050111438634, "kl_loss": 5.936471462249756, "loss_ib": 0.061745308339595795, "step": 204 }, { "ce_ib": 22.816349029541016, "ce_orig": 1.0042665004730225, "epoch": 0.058667050111438634, "kl_loss": 6.33897066116333, "loss_ib": 0.06567133963108063, "step": 204 }, { "ce_ib": 15.579545021057129, "ce_orig": 0.5806044936180115, "epoch": 0.058667050111438634, "kl_loss": 6.2884297370910645, "loss_ib": 0.06444225460290909, "step": 204 }, { "epoch": 0.05895463369041628, "grad_norm": 0.43801939487457275, "learning_rate": 3.1687898089171976e-05, "loss": 0.9615, "step": 205 }, { "ce_ib": 20.434833526611328, "ce_orig": 0.9689016342163086, "epoch": 0.05895463369041628, "kl_loss": 6.424372673034668, "loss_ib": 0.06628721207380295, "step": 205 }, { "ce_ib": 15.206514358520508, "ce_orig": 0.4593224823474884, "epoch": 0.05895463369041628, "kl_loss": 6.005724906921387, "loss_ib": 0.06157790124416351, "step": 205 }, { "ce_ib": 21.497190475463867, "ce_orig": 1.140707015991211, "epoch": 0.05895463369041628, "kl_loss": 6.157401084899902, "loss_ib": 0.06372372806072235, "step": 205 }, { "ce_ib": 21.64202308654785, "ce_orig": 0.8690503239631653, "epoch": 0.05895463369041628, "kl_loss": 6.049506187438965, "loss_ib": 0.06265926361083984, "step": 205 }, { "ce_ib": 17.65264129638672, "ce_orig": 0.8661278486251831, "epoch": 0.05924221726939392, "kl_loss": 6.142066955566406, "loss_ib": 0.0631859302520752, "step": 206 }, { "ce_ib": 18.6512451171875, "ce_orig": 1.1120545864105225, "epoch": 0.05924221726939392, "kl_loss": 6.5508646965026855, "loss_ib": 0.06737376749515533, "step": 206 }, { "ce_ib": 19.080215454101562, "ce_orig": 1.205805778503418, "epoch": 0.05924221726939392, "kl_loss": 5.709317207336426, "loss_ib": 0.059001192450523376, "step": 206 }, { "ce_ib": 18.595766067504883, "ce_orig": 0.9016050696372986, "epoch": 0.05924221726939392, "kl_loss": 5.711783409118652, "loss_ib": 0.0589774064719677, "step": 206 }, { "ce_ib": 20.492830276489258, "ce_orig": 0.8852484822273254, "epoch": 0.05952980084837156, "kl_loss": 5.075399398803711, "loss_ib": 0.05280327796936035, "step": 207 }, { "ce_ib": 20.912809371948242, "ce_orig": 0.784504771232605, "epoch": 0.05952980084837156, "kl_loss": 3.873704433441162, "loss_ib": 0.04082832112908363, "step": 207 }, { "ce_ib": 16.91316795349121, "ce_orig": 0.7453713417053223, "epoch": 0.05952980084837156, "kl_loss": 4.164481163024902, "loss_ib": 0.04333612695336342, "step": 207 }, { "ce_ib": 23.150854110717773, "ce_orig": 1.8038743734359741, "epoch": 0.05952980084837156, "kl_loss": 6.1978583335876465, "loss_ib": 0.06429366767406464, "step": 207 }, { "ce_ib": 20.63064193725586, "ce_orig": 1.5274888277053833, "epoch": 0.0598173844273492, "kl_loss": 4.736423492431641, "loss_ib": 0.049427296966314316, "step": 208 }, { "ce_ib": 20.130807876586914, "ce_orig": 0.9102981686592102, "epoch": 0.0598173844273492, "kl_loss": 4.98231315612793, "loss_ib": 0.05183621123433113, "step": 208 }, { "ce_ib": 21.33695411682129, "ce_orig": 0.3839934766292572, "epoch": 0.0598173844273492, "kl_loss": 3.1306653022766113, "loss_ib": 0.033440347760915756, "step": 208 }, { "ce_ib": 19.694299697875977, "ce_orig": 0.9525083899497986, "epoch": 0.0598173844273492, "kl_loss": 4.653975486755371, "loss_ib": 0.048509180545806885, "step": 208 }, { "ce_ib": 21.432010650634766, "ce_orig": 1.1178271770477295, "epoch": 0.06010496800632684, "kl_loss": 3.3814926147460938, "loss_ib": 0.035958126187324524, "step": 209 }, { "ce_ib": 19.939306259155273, "ce_orig": 1.0498489141464233, "epoch": 0.06010496800632684, "kl_loss": 4.5651397705078125, "loss_ib": 0.04764533042907715, "step": 209 }, { "ce_ib": 19.62514877319336, "ce_orig": 1.1263172626495361, "epoch": 0.06010496800632684, "kl_loss": 4.4086761474609375, "loss_ib": 0.04604927450418472, "step": 209 }, { "ce_ib": 17.709300994873047, "ce_orig": 1.0799542665481567, "epoch": 0.06010496800632684, "kl_loss": 4.823720932006836, "loss_ib": 0.0500081367790699, "step": 209 }, { "epoch": 0.06039255158530448, "grad_norm": 0.667425274848938, "learning_rate": 3.248407643312102e-05, "loss": 0.9474, "step": 210 }, { "ce_ib": 22.428897857666016, "ce_orig": 1.325988531112671, "epoch": 0.06039255158530448, "kl_loss": 3.7257208824157715, "loss_ib": 0.039500098675489426, "step": 210 }, { "ce_ib": 18.08632469177246, "ce_orig": 0.3834853172302246, "epoch": 0.06039255158530448, "kl_loss": 3.6763598918914795, "loss_ib": 0.03857222944498062, "step": 210 }, { "ce_ib": 18.410423278808594, "ce_orig": 0.5081047415733337, "epoch": 0.06039255158530448, "kl_loss": 3.751244068145752, "loss_ib": 0.03935348242521286, "step": 210 }, { "ce_ib": 17.127031326293945, "ce_orig": 0.6193530559539795, "epoch": 0.06039255158530448, "kl_loss": 4.159435749053955, "loss_ib": 0.04330705851316452, "step": 210 }, { "ce_ib": 21.037677764892578, "ce_orig": 0.9653246998786926, "epoch": 0.06068013516428212, "kl_loss": 3.6135926246643066, "loss_ib": 0.03823969140648842, "step": 211 }, { "ce_ib": 15.933859825134277, "ce_orig": 0.5138083696365356, "epoch": 0.06068013516428212, "kl_loss": 2.297349452972412, "loss_ib": 0.024566879495978355, "step": 211 }, { "ce_ib": 16.323041915893555, "ce_orig": 1.1270829439163208, "epoch": 0.06068013516428212, "kl_loss": 2.4675984382629395, "loss_ib": 0.026308288797736168, "step": 211 }, { "ce_ib": 18.137113571166992, "ce_orig": 0.5509803891181946, "epoch": 0.06068013516428212, "kl_loss": 2.595515251159668, "loss_ib": 0.02776886336505413, "step": 211 }, { "ce_ib": 14.729268074035645, "ce_orig": 0.4266526401042938, "epoch": 0.060967718743259756, "kl_loss": 1.8660860061645508, "loss_ib": 0.020133785903453827, "step": 212 }, { "ce_ib": 19.452571868896484, "ce_orig": 0.8632349967956543, "epoch": 0.060967718743259756, "kl_loss": 2.0922412872314453, "loss_ib": 0.02286767028272152, "step": 212 }, { "ce_ib": 21.427040100097656, "ce_orig": 1.345961332321167, "epoch": 0.060967718743259756, "kl_loss": 1.7945568561553955, "loss_ib": 0.02008827216923237, "step": 212 }, { "ce_ib": 21.80542755126953, "ce_orig": 1.136615514755249, "epoch": 0.060967718743259756, "kl_loss": 1.982521891593933, "loss_ib": 0.022005761042237282, "step": 212 }, { "ce_ib": 23.523645401000977, "ce_orig": 1.9374449253082275, "epoch": 0.0612553023222374, "kl_loss": 2.183800220489502, "loss_ib": 0.02419036626815796, "step": 213 }, { "ce_ib": 23.139501571655273, "ce_orig": 1.261841058731079, "epoch": 0.0612553023222374, "kl_loss": 1.225545048713684, "loss_ib": 0.014569399878382683, "step": 213 }, { "ce_ib": 14.595914840698242, "ce_orig": 0.4094107151031494, "epoch": 0.0612553023222374, "kl_loss": 1.4455546140670776, "loss_ib": 0.01591513678431511, "step": 213 }, { "ce_ib": 18.374540328979492, "ce_orig": 0.9666364789009094, "epoch": 0.0612553023222374, "kl_loss": 1.5520057678222656, "loss_ib": 0.017357511445879936, "step": 213 }, { "ce_ib": 17.489238739013672, "ce_orig": 0.4721967875957489, "epoch": 0.06154288590121504, "kl_loss": 1.1278434991836548, "loss_ib": 0.013027358800172806, "step": 214 }, { "ce_ib": 21.929288864135742, "ce_orig": 0.6112910509109497, "epoch": 0.06154288590121504, "kl_loss": 1.07718026638031, "loss_ib": 0.012964731082320213, "step": 214 }, { "ce_ib": 18.024003982543945, "ce_orig": 0.4354954957962036, "epoch": 0.06154288590121504, "kl_loss": 1.1616055965423584, "loss_ib": 0.013418455608189106, "step": 214 }, { "ce_ib": 19.154476165771484, "ce_orig": 0.9074000120162964, "epoch": 0.06154288590121504, "kl_loss": 1.048647165298462, "loss_ib": 0.01240191888064146, "step": 214 }, { "epoch": 0.06183046948019268, "grad_norm": 0.19470971822738647, "learning_rate": 3.328025477707007e-05, "loss": 0.8823, "step": 215 }, { "ce_ib": 16.662282943725586, "ce_orig": 0.5908299088478088, "epoch": 0.06183046948019268, "kl_loss": 1.0955469608306885, "loss_ib": 0.012621697969734669, "step": 215 }, { "ce_ib": 15.762285232543945, "ce_orig": 0.5801149606704712, "epoch": 0.06183046948019268, "kl_loss": 0.9997921586036682, "loss_ib": 0.011574150063097477, "step": 215 }, { "ce_ib": 20.8988094329834, "ce_orig": 0.9614391922950745, "epoch": 0.06183046948019268, "kl_loss": 0.9723953008651733, "loss_ib": 0.011813833378255367, "step": 215 }, { "ce_ib": 20.39583969116211, "ce_orig": 1.0183390378952026, "epoch": 0.06183046948019268, "kl_loss": 0.9245635867118835, "loss_ib": 0.011285219341516495, "step": 215 }, { "ce_ib": 14.578946113586426, "ce_orig": 0.734819769859314, "epoch": 0.06211805305917032, "kl_loss": 0.8773603439331055, "loss_ib": 0.010231498628854752, "step": 216 }, { "ce_ib": 13.65113639831543, "ce_orig": 0.4453405439853668, "epoch": 0.06211805305917032, "kl_loss": 0.902603030204773, "loss_ib": 0.010391143150627613, "step": 216 }, { "ce_ib": 24.090421676635742, "ce_orig": 1.5431694984436035, "epoch": 0.06211805305917032, "kl_loss": 0.8628696203231812, "loss_ib": 0.011037738062441349, "step": 216 }, { "ce_ib": 16.371984481811523, "ce_orig": 0.6436638832092285, "epoch": 0.06211805305917032, "kl_loss": 0.9481015205383301, "loss_ib": 0.011118213646113873, "step": 216 }, { "ce_ib": 16.45316505432129, "ce_orig": 0.6905233263969421, "epoch": 0.06240563663814796, "kl_loss": 0.8371706008911133, "loss_ib": 0.010017022490501404, "step": 217 }, { "ce_ib": 19.796371459960938, "ce_orig": 0.9113252758979797, "epoch": 0.06240563663814796, "kl_loss": 0.7912114262580872, "loss_ib": 0.00989175122231245, "step": 217 }, { "ce_ib": 20.719688415527344, "ce_orig": 0.6585960388183594, "epoch": 0.06240563663814796, "kl_loss": 0.7871678471565247, "loss_ib": 0.009943647310137749, "step": 217 }, { "ce_ib": 18.301244735717773, "ce_orig": 0.9191728234291077, "epoch": 0.06240563663814796, "kl_loss": 0.7824192643165588, "loss_ib": 0.009654317051172256, "step": 217 }, { "ce_ib": 16.72066879272461, "ce_orig": 0.46977195143699646, "epoch": 0.0626932202171256, "kl_loss": 0.7237412929534912, "loss_ib": 0.008909479714930058, "step": 218 }, { "ce_ib": 16.60516357421875, "ce_orig": 0.8432900309562683, "epoch": 0.0626932202171256, "kl_loss": 0.7562671899795532, "loss_ib": 0.009223188273608685, "step": 218 }, { "ce_ib": 19.466259002685547, "ce_orig": 0.9356642365455627, "epoch": 0.0626932202171256, "kl_loss": 0.7408407926559448, "loss_ib": 0.009355033747851849, "step": 218 }, { "ce_ib": 19.53274917602539, "ce_orig": 0.6844194531440735, "epoch": 0.0626932202171256, "kl_loss": 0.7530844807624817, "loss_ib": 0.009484118781983852, "step": 218 }, { "ce_ib": 22.165111541748047, "ce_orig": 1.2755643129348755, "epoch": 0.06298080379610324, "kl_loss": 0.6112433671951294, "loss_ib": 0.008328944444656372, "step": 219 }, { "ce_ib": 15.414247512817383, "ce_orig": 0.8299206495285034, "epoch": 0.06298080379610324, "kl_loss": 0.7032531499862671, "loss_ib": 0.008573955856263638, "step": 219 }, { "ce_ib": 16.366025924682617, "ce_orig": 0.660663902759552, "epoch": 0.06298080379610324, "kl_loss": 0.6545971632003784, "loss_ib": 0.008182574063539505, "step": 219 }, { "ce_ib": 19.620121002197266, "ce_orig": 1.2592724561691284, "epoch": 0.06298080379610324, "kl_loss": 0.7279493808746338, "loss_ib": 0.009241505526006222, "step": 219 }, { "epoch": 0.06326838737508088, "grad_norm": 0.07929490506649017, "learning_rate": 3.407643312101911e-05, "loss": 0.8749, "step": 220 }, { "ce_ib": 20.658096313476562, "ce_orig": 1.0993177890777588, "epoch": 0.06326838737508088, "kl_loss": 0.6090418100357056, "loss_ib": 0.008156226947903633, "step": 220 }, { "ce_ib": 17.3227481842041, "ce_orig": 0.6923868656158447, "epoch": 0.06326838737508088, "kl_loss": 0.6292073130607605, "loss_ib": 0.008024347946047783, "step": 220 }, { "ce_ib": 15.15152359008789, "ce_orig": 0.697593092918396, "epoch": 0.06326838737508088, "kl_loss": 0.604870617389679, "loss_ib": 0.007563858292996883, "step": 220 }, { "ce_ib": 20.777067184448242, "ce_orig": 1.269119381904602, "epoch": 0.06326838737508088, "kl_loss": 0.6507552862167358, "loss_ib": 0.008585259318351746, "step": 220 }, { "ce_ib": 18.540620803833008, "ce_orig": 1.0002384185791016, "epoch": 0.06355597095405853, "kl_loss": 0.578797459602356, "loss_ib": 0.0076420363038778305, "step": 221 }, { "ce_ib": 13.15246868133545, "ce_orig": 0.25608256459236145, "epoch": 0.06355597095405853, "kl_loss": 0.7502469420433044, "loss_ib": 0.008817716501653194, "step": 221 }, { "ce_ib": 13.858514785766602, "ce_orig": 0.682886004447937, "epoch": 0.06355597095405853, "kl_loss": 0.538476824760437, "loss_ib": 0.006770619656890631, "step": 221 }, { "ce_ib": 17.7680606842041, "ce_orig": 0.6039354801177979, "epoch": 0.06355597095405853, "kl_loss": 0.5650777816772461, "loss_ib": 0.007427583914250135, "step": 221 }, { "ce_ib": 19.38729476928711, "ce_orig": 0.8789693117141724, "epoch": 0.06384355453303617, "kl_loss": 0.6542633771896362, "loss_ib": 0.008481362834572792, "step": 222 }, { "ce_ib": 18.89866065979004, "ce_orig": 0.7741104960441589, "epoch": 0.06384355453303617, "kl_loss": 0.5847321152687073, "loss_ib": 0.007737187203019857, "step": 222 }, { "ce_ib": 21.54572296142578, "ce_orig": 0.7229393124580383, "epoch": 0.06384355453303617, "kl_loss": 0.5832604169845581, "loss_ib": 0.007987176068127155, "step": 222 }, { "ce_ib": 13.869481086730957, "ce_orig": 0.5696704387664795, "epoch": 0.06384355453303617, "kl_loss": 0.5188637375831604, "loss_ib": 0.006575585342943668, "step": 222 }, { "ce_ib": 14.482152938842773, "ce_orig": 0.5589219331741333, "epoch": 0.0641311381120138, "kl_loss": 0.47938820719718933, "loss_ib": 0.006242097355425358, "step": 223 }, { "ce_ib": 16.80389976501465, "ce_orig": 0.5980596542358398, "epoch": 0.0641311381120138, "kl_loss": 0.6172512769699097, "loss_ib": 0.007852902635931969, "step": 223 }, { "ce_ib": 22.49806785583496, "ce_orig": 0.7062133550643921, "epoch": 0.0641311381120138, "kl_loss": 0.5784010887145996, "loss_ib": 0.008033817633986473, "step": 223 }, { "ce_ib": 17.86919593811035, "ce_orig": 0.6028913259506226, "epoch": 0.0641311381120138, "kl_loss": 0.5538998246192932, "loss_ib": 0.007325917482376099, "step": 223 }, { "ce_ib": 21.530719757080078, "ce_orig": 1.1314647197723389, "epoch": 0.06441872169099144, "kl_loss": 0.5061776638031006, "loss_ib": 0.007214848417788744, "step": 224 }, { "ce_ib": 17.580371856689453, "ce_orig": 0.8268778920173645, "epoch": 0.06441872169099144, "kl_loss": 0.5295155644416809, "loss_ib": 0.007053192704916, "step": 224 }, { "ce_ib": 16.985912322998047, "ce_orig": 0.92490553855896, "epoch": 0.06441872169099144, "kl_loss": 0.47081345319747925, "loss_ib": 0.006406725384294987, "step": 224 }, { "ce_ib": 20.34337043762207, "ce_orig": 1.7162299156188965, "epoch": 0.06441872169099144, "kl_loss": 0.5065193772315979, "loss_ib": 0.0070995306596159935, "step": 224 }, { "epoch": 0.06470630526996908, "grad_norm": 0.07722701877355576, "learning_rate": 3.487261146496815e-05, "loss": 0.8907, "step": 225 }, { "ce_ib": 15.637423515319824, "ce_orig": 0.8265129923820496, "epoch": 0.06470630526996908, "kl_loss": 0.6796841025352478, "loss_ib": 0.008360583335161209, "step": 225 }, { "ce_ib": 21.416494369506836, "ce_orig": 1.278948426246643, "epoch": 0.06470630526996908, "kl_loss": 0.48355668783187866, "loss_ib": 0.006977215874940157, "step": 225 }, { "ce_ib": 19.162933349609375, "ce_orig": 0.33566343784332275, "epoch": 0.06470630526996908, "kl_loss": 0.4927806854248047, "loss_ib": 0.006844100076705217, "step": 225 }, { "ce_ib": 17.001327514648438, "ce_orig": 0.8918877840042114, "epoch": 0.06470630526996908, "kl_loss": 0.4844684898853302, "loss_ib": 0.006544817704707384, "step": 225 }, { "ce_ib": 19.425342559814453, "ce_orig": 1.1151187419891357, "epoch": 0.06499388884894673, "kl_loss": 0.44420889019966125, "loss_ib": 0.006384622771292925, "step": 226 }, { "ce_ib": 20.979902267456055, "ce_orig": 1.1682270765304565, "epoch": 0.06499388884894673, "kl_loss": 0.5223791003227234, "loss_ib": 0.007321780547499657, "step": 226 }, { "ce_ib": 21.13734245300293, "ce_orig": 0.6381849050521851, "epoch": 0.06499388884894673, "kl_loss": 0.5622669458389282, "loss_ib": 0.007736403960734606, "step": 226 }, { "ce_ib": 19.859725952148438, "ce_orig": 1.4218535423278809, "epoch": 0.06499388884894673, "kl_loss": 0.5652158260345459, "loss_ib": 0.0076381308026611805, "step": 226 }, { "ce_ib": 18.34955596923828, "ce_orig": 0.8892937302589417, "epoch": 0.06528147242792437, "kl_loss": 0.477683424949646, "loss_ib": 0.006611789111047983, "step": 227 }, { "ce_ib": 16.387413024902344, "ce_orig": 0.5451152324676514, "epoch": 0.06528147242792437, "kl_loss": 0.4405210614204407, "loss_ib": 0.006043951492756605, "step": 227 }, { "ce_ib": 16.179128646850586, "ce_orig": 0.5826038718223572, "epoch": 0.06528147242792437, "kl_loss": 0.4468899965286255, "loss_ib": 0.006086812354624271, "step": 227 }, { "ce_ib": 15.503174781799316, "ce_orig": 0.4542520344257355, "epoch": 0.06528147242792437, "kl_loss": 0.4687623083591461, "loss_ib": 0.006237940862774849, "step": 227 }, { "ce_ib": 17.556617736816406, "ce_orig": 0.6604429483413696, "epoch": 0.06556905600690201, "kl_loss": 0.4429520070552826, "loss_ib": 0.006185181438922882, "step": 228 }, { "ce_ib": 14.565351486206055, "ce_orig": 0.663815438747406, "epoch": 0.06556905600690201, "kl_loss": 0.41016486287117004, "loss_ib": 0.005558183882385492, "step": 228 }, { "ce_ib": 9.793392181396484, "ce_orig": 0.1998930275440216, "epoch": 0.06556905600690201, "kl_loss": 0.5553406476974487, "loss_ib": 0.006532745435833931, "step": 228 }, { "ce_ib": 15.705013275146484, "ce_orig": 0.949131965637207, "epoch": 0.06556905600690201, "kl_loss": 0.5142616033554077, "loss_ib": 0.006713117007166147, "step": 228 }, { "ce_ib": 22.55472755432129, "ce_orig": 1.56355881690979, "epoch": 0.06585663958587964, "kl_loss": 0.508346676826477, "loss_ib": 0.007338939234614372, "step": 229 }, { "ce_ib": 20.364665985107422, "ce_orig": 1.1723278760910034, "epoch": 0.06585663958587964, "kl_loss": 0.4082661271095276, "loss_ib": 0.006119127850979567, "step": 229 }, { "ce_ib": 16.15178680419922, "ce_orig": 0.8450407981872559, "epoch": 0.06585663958587964, "kl_loss": 0.5447847843170166, "loss_ib": 0.007063026074320078, "step": 229 }, { "ce_ib": 18.998653411865234, "ce_orig": 1.2076853513717651, "epoch": 0.06585663958587964, "kl_loss": 0.42832180857658386, "loss_ib": 0.006183082703500986, "step": 229 }, { "epoch": 0.06614422316485728, "grad_norm": 0.07635564357042313, "learning_rate": 3.56687898089172e-05, "loss": 0.8962, "step": 230 }, { "ce_ib": 22.920480728149414, "ce_orig": 1.7977490425109863, "epoch": 0.06614422316485728, "kl_loss": 0.4276275932788849, "loss_ib": 0.0065683238208293915, "step": 230 }, { "ce_ib": 18.89206886291504, "ce_orig": 1.2325646877288818, "epoch": 0.06614422316485728, "kl_loss": 0.42932283878326416, "loss_ib": 0.006182434968650341, "step": 230 }, { "ce_ib": 19.41433334350586, "ce_orig": 1.1008139848709106, "epoch": 0.06614422316485728, "kl_loss": 0.4227140247821808, "loss_ib": 0.006168573163449764, "step": 230 }, { "ce_ib": 16.897308349609375, "ce_orig": 0.8783938884735107, "epoch": 0.06614422316485728, "kl_loss": 0.4387606680393219, "loss_ib": 0.0060773370787501335, "step": 230 }, { "ce_ib": 20.402490615844727, "ce_orig": 0.4892929196357727, "epoch": 0.06643180674383492, "kl_loss": 0.5622318387031555, "loss_ib": 0.007662567310035229, "step": 231 }, { "ce_ib": 18.776615142822266, "ce_orig": 0.8454554080963135, "epoch": 0.06643180674383492, "kl_loss": 0.3648257553577423, "loss_ib": 0.005525919143110514, "step": 231 }, { "ce_ib": 19.490280151367188, "ce_orig": 0.5873563289642334, "epoch": 0.06643180674383492, "kl_loss": 0.49844107031822205, "loss_ib": 0.006933438591659069, "step": 231 }, { "ce_ib": 18.226577758789062, "ce_orig": 0.9095281362533569, "epoch": 0.06643180674383492, "kl_loss": 0.42676785588264465, "loss_ib": 0.006090336479246616, "step": 231 }, { "ce_ib": 14.32204818725586, "ce_orig": 0.4136866331100464, "epoch": 0.06671939032281257, "kl_loss": 0.5454199910163879, "loss_ib": 0.006886404473334551, "step": 232 }, { "ce_ib": 15.030553817749023, "ce_orig": 1.1399730443954468, "epoch": 0.06671939032281257, "kl_loss": 0.3817654848098755, "loss_ib": 0.00532070966437459, "step": 232 }, { "ce_ib": 17.033527374267578, "ce_orig": 0.9704214334487915, "epoch": 0.06671939032281257, "kl_loss": 0.45833879709243774, "loss_ib": 0.006286740303039551, "step": 232 }, { "ce_ib": 16.526573181152344, "ce_orig": 0.6879238486289978, "epoch": 0.06671939032281257, "kl_loss": 0.3568248152732849, "loss_ib": 0.005220905411988497, "step": 232 }, { "ce_ib": 22.991727828979492, "ce_orig": 1.4614430665969849, "epoch": 0.06700697390179021, "kl_loss": 0.42173314094543457, "loss_ib": 0.006516504101455212, "step": 233 }, { "ce_ib": 18.632497787475586, "ce_orig": 0.5046707391738892, "epoch": 0.06700697390179021, "kl_loss": 0.41837000846862793, "loss_ib": 0.006046949420124292, "step": 233 }, { "ce_ib": 18.9344425201416, "ce_orig": 1.0734100341796875, "epoch": 0.06700697390179021, "kl_loss": 0.40839213132858276, "loss_ib": 0.00597736518830061, "step": 233 }, { "ce_ib": 11.921408653259277, "ce_orig": 0.525043785572052, "epoch": 0.06700697390179021, "kl_loss": 0.35900092124938965, "loss_ib": 0.004782150033861399, "step": 233 }, { "ce_ib": 16.360872268676758, "ce_orig": 0.9665996432304382, "epoch": 0.06729455748076785, "kl_loss": 0.352176696062088, "loss_ib": 0.005157853942364454, "step": 234 }, { "ce_ib": 17.86981964111328, "ce_orig": 0.9465886354446411, "epoch": 0.06729455748076785, "kl_loss": 0.39093858003616333, "loss_ib": 0.005696367472410202, "step": 234 }, { "ce_ib": 18.097686767578125, "ce_orig": 0.8353486657142639, "epoch": 0.06729455748076785, "kl_loss": 0.3744758367538452, "loss_ib": 0.005554527044296265, "step": 234 }, { "ce_ib": 22.27129554748535, "ce_orig": 1.4471676349639893, "epoch": 0.06729455748076785, "kl_loss": 0.41227924823760986, "loss_ib": 0.006349921692162752, "step": 234 }, { "epoch": 0.06758214105974548, "grad_norm": 0.08016426116228104, "learning_rate": 3.646496815286624e-05, "loss": 0.8961, "step": 235 }, { "ce_ib": 17.102169036865234, "ce_orig": 0.6802967190742493, "epoch": 0.06758214105974548, "kl_loss": 0.3811526298522949, "loss_ib": 0.005521743092685938, "step": 235 }, { "ce_ib": 23.21323585510254, "ce_orig": 1.7242603302001953, "epoch": 0.06758214105974548, "kl_loss": 0.43173903226852417, "loss_ib": 0.006638714112341404, "step": 235 }, { "ce_ib": 13.367447853088379, "ce_orig": 0.7693591713905334, "epoch": 0.06758214105974548, "kl_loss": 0.33568012714385986, "loss_ib": 0.004693545866757631, "step": 235 }, { "ce_ib": 16.364444732666016, "ce_orig": 0.9041774868965149, "epoch": 0.06758214105974548, "kl_loss": 0.3745976388454437, "loss_ib": 0.005382420960813761, "step": 235 }, { "ce_ib": 17.089984893798828, "ce_orig": 0.8724990487098694, "epoch": 0.06786972463872312, "kl_loss": 0.3381209969520569, "loss_ib": 0.005090207792818546, "step": 236 }, { "ce_ib": 17.797290802001953, "ce_orig": 1.2699850797653198, "epoch": 0.06786972463872312, "kl_loss": 0.4074021279811859, "loss_ib": 0.0058537498116493225, "step": 236 }, { "ce_ib": 10.40896224975586, "ce_orig": 0.2636343240737915, "epoch": 0.06786972463872312, "kl_loss": 0.6993351578712463, "loss_ib": 0.008034247905015945, "step": 236 }, { "ce_ib": 23.780147552490234, "ce_orig": 1.2295787334442139, "epoch": 0.06786972463872312, "kl_loss": 0.47904911637306213, "loss_ib": 0.007168505806475878, "step": 236 }, { "ce_ib": 17.171159744262695, "ce_orig": 1.21332848072052, "epoch": 0.06815730821770077, "kl_loss": 0.34175872802734375, "loss_ib": 0.005134702660143375, "step": 237 }, { "ce_ib": 18.72576904296875, "ce_orig": 0.8414787650108337, "epoch": 0.06815730821770077, "kl_loss": 0.41571539640426636, "loss_ib": 0.006029731128364801, "step": 237 }, { "ce_ib": 18.983478546142578, "ce_orig": 0.5497841238975525, "epoch": 0.06815730821770077, "kl_loss": 0.400782972574234, "loss_ib": 0.005906177684664726, "step": 237 }, { "ce_ib": 15.720340728759766, "ce_orig": 0.6456199884414673, "epoch": 0.06815730821770077, "kl_loss": 0.3572655916213989, "loss_ib": 0.005144690163433552, "step": 237 }, { "ce_ib": 14.64540958404541, "ce_orig": 0.5299506783485413, "epoch": 0.06844489179667841, "kl_loss": 0.3614061176776886, "loss_ib": 0.005078601650893688, "step": 238 }, { "ce_ib": 14.622838973999023, "ce_orig": 0.6512343883514404, "epoch": 0.06844489179667841, "kl_loss": 0.3499015271663666, "loss_ib": 0.004961299244314432, "step": 238 }, { "ce_ib": 18.794681549072266, "ce_orig": 0.5560781359672546, "epoch": 0.06844489179667841, "kl_loss": 0.3744252324104309, "loss_ib": 0.005623720120638609, "step": 238 }, { "ce_ib": 16.820043563842773, "ce_orig": 0.7689210772514343, "epoch": 0.06844489179667841, "kl_loss": 0.3898257613182068, "loss_ib": 0.005580261815339327, "step": 238 }, { "ce_ib": 20.637855529785156, "ce_orig": 1.1541659832000732, "epoch": 0.06873247537565605, "kl_loss": 0.4067099392414093, "loss_ib": 0.006130884867161512, "step": 239 }, { "ce_ib": 14.409849166870117, "ce_orig": 0.6937656402587891, "epoch": 0.06873247537565605, "kl_loss": 0.30936238169670105, "loss_ib": 0.00453460868448019, "step": 239 }, { "ce_ib": 19.96538543701172, "ce_orig": 1.6420783996582031, "epoch": 0.06873247537565605, "kl_loss": 0.3878486752510071, "loss_ib": 0.005875025410205126, "step": 239 }, { "ce_ib": 16.174251556396484, "ce_orig": 0.7331187725067139, "epoch": 0.06873247537565605, "kl_loss": 0.3374932110309601, "loss_ib": 0.004992356989532709, "step": 239 }, { "epoch": 0.06902005895463369, "grad_norm": 0.09181191027164459, "learning_rate": 3.7261146496815283e-05, "loss": 0.9216, "step": 240 }, { "ce_ib": 16.239824295043945, "ce_orig": 0.45115554332733154, "epoch": 0.06902005895463369, "kl_loss": 0.3430927097797394, "loss_ib": 0.005054909270256758, "step": 240 }, { "ce_ib": 20.204030990600586, "ce_orig": 1.1928750276565552, "epoch": 0.06902005895463369, "kl_loss": 0.37950411438941956, "loss_ib": 0.005815444048494101, "step": 240 }, { "ce_ib": 11.103907585144043, "ce_orig": 0.41011255979537964, "epoch": 0.06902005895463369, "kl_loss": 0.3157821595668793, "loss_ib": 0.004268212243914604, "step": 240 }, { "ce_ib": 16.61946678161621, "ce_orig": 0.958586573600769, "epoch": 0.06902005895463369, "kl_loss": 0.472045361995697, "loss_ib": 0.006382400169968605, "step": 240 }, { "ce_ib": 18.43888282775879, "ce_orig": 0.8224636912345886, "epoch": 0.06930764253361132, "kl_loss": 0.31457871198654175, "loss_ib": 0.004989675246179104, "step": 241 }, { "ce_ib": 19.861295700073242, "ce_orig": 0.5294429659843445, "epoch": 0.06930764253361132, "kl_loss": 0.30837568640708923, "loss_ib": 0.0050698863342404366, "step": 241 }, { "ce_ib": 17.056270599365234, "ce_orig": 0.6633943319320679, "epoch": 0.06930764253361132, "kl_loss": 0.3993522524833679, "loss_ib": 0.0056991493329405785, "step": 241 }, { "ce_ib": 13.237872123718262, "ce_orig": 0.6085235476493835, "epoch": 0.06930764253361132, "kl_loss": 0.276342511177063, "loss_ib": 0.0040872120298445225, "step": 241 }, { "ce_ib": 15.212370872497559, "ce_orig": 0.5519753694534302, "epoch": 0.06959522611258898, "kl_loss": 0.3807227611541748, "loss_ib": 0.005328464321792126, "step": 242 }, { "ce_ib": 14.194107055664062, "ce_orig": 0.6263343691825867, "epoch": 0.06959522611258898, "kl_loss": 0.33415570855140686, "loss_ib": 0.004760967567563057, "step": 242 }, { "ce_ib": 18.368473052978516, "ce_orig": 0.8124864101409912, "epoch": 0.06959522611258898, "kl_loss": 0.3696582317352295, "loss_ib": 0.005533429328352213, "step": 242 }, { "ce_ib": 18.977922439575195, "ce_orig": 0.7746420502662659, "epoch": 0.06959522611258898, "kl_loss": 0.3186471462249756, "loss_ib": 0.005084263626486063, "step": 242 }, { "ce_ib": 18.268203735351562, "ce_orig": 0.9710350632667542, "epoch": 0.06988280969156661, "kl_loss": 0.32097768783569336, "loss_ib": 0.005036597140133381, "step": 243 }, { "ce_ib": 20.087373733520508, "ce_orig": 1.0895576477050781, "epoch": 0.06988280969156661, "kl_loss": 0.3057764768600464, "loss_ib": 0.005066501908004284, "step": 243 }, { "ce_ib": 18.099958419799805, "ce_orig": 0.907975971698761, "epoch": 0.06988280969156661, "kl_loss": 0.35890674591064453, "loss_ib": 0.005399063229560852, "step": 243 }, { "ce_ib": 18.00782012939453, "ce_orig": 0.520527184009552, "epoch": 0.06988280969156661, "kl_loss": 0.36176708340644836, "loss_ib": 0.005418452434241772, "step": 243 }, { "ce_ib": 15.336793899536133, "ce_orig": 0.755825936794281, "epoch": 0.07017039327054425, "kl_loss": 0.27832502126693726, "loss_ib": 0.0043169292621314526, "step": 244 }, { "ce_ib": 14.561528205871582, "ce_orig": 0.5862277150154114, "epoch": 0.07017039327054425, "kl_loss": 0.3262811303138733, "loss_ib": 0.004718963988125324, "step": 244 }, { "ce_ib": 21.186973571777344, "ce_orig": 1.1542885303497314, "epoch": 0.07017039327054425, "kl_loss": 0.3798186182975769, "loss_ib": 0.005916883237659931, "step": 244 }, { "ce_ib": 17.660518646240234, "ce_orig": 0.7000678181648254, "epoch": 0.07017039327054425, "kl_loss": 0.40329715609550476, "loss_ib": 0.005799023434519768, "step": 244 }, { "epoch": 0.07045797684952189, "grad_norm": 0.07606582343578339, "learning_rate": 3.805732484076434e-05, "loss": 0.8966, "step": 245 }, { "ce_ib": 17.2858829498291, "ce_orig": 0.6848281025886536, "epoch": 0.07045797684952189, "kl_loss": 0.3115922510623932, "loss_ib": 0.0048445104621350765, "step": 245 }, { "ce_ib": 12.877274513244629, "ce_orig": 0.42091885209083557, "epoch": 0.07045797684952189, "kl_loss": 0.33227574825286865, "loss_ib": 0.004610484931617975, "step": 245 }, { "ce_ib": 19.50572967529297, "ce_orig": 1.2013055086135864, "epoch": 0.07045797684952189, "kl_loss": 0.29557040333747864, "loss_ib": 0.004906277172267437, "step": 245 }, { "ce_ib": 17.724828720092773, "ce_orig": 0.7979478240013123, "epoch": 0.07045797684952189, "kl_loss": 0.3825852870941162, "loss_ib": 0.005598335526883602, "step": 245 }, { "ce_ib": 17.733549118041992, "ce_orig": 1.1459635496139526, "epoch": 0.07074556042849953, "kl_loss": 0.29438281059265137, "loss_ib": 0.004717182833701372, "step": 246 }, { "ce_ib": 16.1971378326416, "ce_orig": 0.13715046644210815, "epoch": 0.07074556042849953, "kl_loss": 0.6951940059661865, "loss_ib": 0.008571653626859188, "step": 246 }, { "ce_ib": 20.530433654785156, "ce_orig": 1.4083482027053833, "epoch": 0.07074556042849953, "kl_loss": 0.35388949513435364, "loss_ib": 0.005591938272118568, "step": 246 }, { "ce_ib": 16.526330947875977, "ce_orig": 0.6567316055297852, "epoch": 0.07074556042849953, "kl_loss": 0.3231682777404785, "loss_ib": 0.004884315654635429, "step": 246 }, { "ce_ib": 14.093873977661133, "ce_orig": 0.871584951877594, "epoch": 0.07103314400747718, "kl_loss": 0.2740858793258667, "loss_ib": 0.004150246270000935, "step": 247 }, { "ce_ib": 21.621118545532227, "ce_orig": 1.2882436513900757, "epoch": 0.07103314400747718, "kl_loss": 0.4834282696247101, "loss_ib": 0.006996394135057926, "step": 247 }, { "ce_ib": 19.13994026184082, "ce_orig": 1.2011432647705078, "epoch": 0.07103314400747718, "kl_loss": 0.31072482466697693, "loss_ib": 0.005021241959184408, "step": 247 }, { "ce_ib": 13.94855785369873, "ce_orig": 0.6923986673355103, "epoch": 0.07103314400747718, "kl_loss": 0.34611976146698, "loss_ib": 0.004856053274124861, "step": 247 }, { "ce_ib": 18.997570037841797, "ce_orig": 1.2123730182647705, "epoch": 0.07132072758645482, "kl_loss": 0.3029173016548157, "loss_ib": 0.004928929731249809, "step": 248 }, { "ce_ib": 18.082622528076172, "ce_orig": 0.7000762224197388, "epoch": 0.07132072758645482, "kl_loss": 0.3445127308368683, "loss_ib": 0.005253389477729797, "step": 248 }, { "ce_ib": 13.205419540405273, "ce_orig": 0.6170308589935303, "epoch": 0.07132072758645482, "kl_loss": 0.2936919927597046, "loss_ib": 0.004257461987435818, "step": 248 }, { "ce_ib": 16.406328201293945, "ce_orig": 0.8249359130859375, "epoch": 0.07132072758645482, "kl_loss": 0.2896481454372406, "loss_ib": 0.004537113942205906, "step": 248 }, { "ce_ib": 19.35923194885254, "ce_orig": 0.9184130430221558, "epoch": 0.07160831116543245, "kl_loss": 0.2877388000488281, "loss_ib": 0.004813311155885458, "step": 249 }, { "ce_ib": 14.84507942199707, "ce_orig": 0.962078332901001, "epoch": 0.07160831116543245, "kl_loss": 0.33685553073883057, "loss_ib": 0.004853063262999058, "step": 249 }, { "ce_ib": 13.66109848022461, "ce_orig": 0.8815235495567322, "epoch": 0.07160831116543245, "kl_loss": 0.2970173954963684, "loss_ib": 0.004336283542215824, "step": 249 }, { "ce_ib": 15.64456844329834, "ce_orig": 0.9901912808418274, "epoch": 0.07160831116543245, "kl_loss": 0.30990880727767944, "loss_ib": 0.004663544707000256, "step": 249 }, { "epoch": 0.07189589474441009, "grad_norm": 0.07667157799005508, "learning_rate": 3.885350318471338e-05, "loss": 0.8786, "step": 250 }, { "ce_ib": 17.655288696289062, "ce_orig": 0.9249431490898132, "epoch": 0.07189589474441009, "kl_loss": 0.24412468075752258, "loss_ib": 0.004206775221973658, "step": 250 }, { "ce_ib": 16.22374153137207, "ce_orig": 0.8454200625419617, "epoch": 0.07189589474441009, "kl_loss": 0.3324206471443176, "loss_ib": 0.004946580622345209, "step": 250 }, { "ce_ib": 18.696596145629883, "ce_orig": 1.0471431016921997, "epoch": 0.07189589474441009, "kl_loss": 0.3605830669403076, "loss_ib": 0.005475489888340235, "step": 250 }, { "ce_ib": 19.617197036743164, "ce_orig": 0.630739152431488, "epoch": 0.07189589474441009, "kl_loss": 0.42468297481536865, "loss_ib": 0.006208549719303846, "step": 250 }, { "ce_ib": 14.190434455871582, "ce_orig": 0.5681670904159546, "epoch": 0.07218347832338773, "kl_loss": 0.2779189646244049, "loss_ib": 0.004198232665657997, "step": 251 }, { "ce_ib": 12.449499130249023, "ce_orig": 0.7335292100906372, "epoch": 0.07218347832338773, "kl_loss": 0.30513036251068115, "loss_ib": 0.004296253435313702, "step": 251 }, { "ce_ib": 17.19744300842285, "ce_orig": 0.664770245552063, "epoch": 0.07218347832338773, "kl_loss": 0.3403986096382141, "loss_ib": 0.005123730283230543, "step": 251 }, { "ce_ib": 16.57467269897461, "ce_orig": 1.2152647972106934, "epoch": 0.07218347832338773, "kl_loss": 0.2757129669189453, "loss_ib": 0.0044145965948700905, "step": 251 }, { "ce_ib": 20.365676879882812, "ce_orig": 0.9634372591972351, "epoch": 0.07247106190236538, "kl_loss": 0.31626924872398376, "loss_ib": 0.005199260078370571, "step": 252 }, { "ce_ib": 18.716487884521484, "ce_orig": 1.0937143564224243, "epoch": 0.07247106190236538, "kl_loss": 0.3098085820674896, "loss_ib": 0.0049697342328727245, "step": 252 }, { "ce_ib": 16.123247146606445, "ce_orig": 1.0408896207809448, "epoch": 0.07247106190236538, "kl_loss": 0.31008970737457275, "loss_ib": 0.004713221453130245, "step": 252 }, { "ce_ib": 17.019351959228516, "ce_orig": 1.1104483604431152, "epoch": 0.07247106190236538, "kl_loss": 0.30466794967651367, "loss_ib": 0.004748614504933357, "step": 252 }, { "ce_ib": 14.710082054138184, "ce_orig": 0.9470803737640381, "epoch": 0.07275864548134302, "kl_loss": 0.37655502557754517, "loss_ib": 0.005236558150500059, "step": 253 }, { "ce_ib": 20.534164428710938, "ce_orig": 0.901342511177063, "epoch": 0.07275864548134302, "kl_loss": 0.3438325524330139, "loss_ib": 0.005491741932928562, "step": 253 }, { "ce_ib": 16.916545867919922, "ce_orig": 0.9539148211479187, "epoch": 0.07275864548134302, "kl_loss": 0.35449427366256714, "loss_ib": 0.005236596800386906, "step": 253 }, { "ce_ib": 15.45893383026123, "ce_orig": 0.6202948689460754, "epoch": 0.07275864548134302, "kl_loss": 0.3998444080352783, "loss_ib": 0.005544337444007397, "step": 253 }, { "ce_ib": 17.64470100402832, "ce_orig": 1.3979955911636353, "epoch": 0.07304622906032066, "kl_loss": 0.31596821546554565, "loss_ib": 0.004924152046442032, "step": 254 }, { "ce_ib": 17.690441131591797, "ce_orig": 0.8207519054412842, "epoch": 0.07304622906032066, "kl_loss": 0.2767926752567291, "loss_ib": 0.0045369709841907024, "step": 254 }, { "ce_ib": 10.424705505371094, "ce_orig": 0.5839744210243225, "epoch": 0.07304622906032066, "kl_loss": 0.22676922380924225, "loss_ib": 0.0033101625740528107, "step": 254 }, { "ce_ib": 20.686954498291016, "ce_orig": 0.6900187730789185, "epoch": 0.07304622906032066, "kl_loss": 0.4284232258796692, "loss_ib": 0.006352927535772324, "step": 254 }, { "epoch": 0.0733338126392983, "grad_norm": 0.06607817858457565, "learning_rate": 3.964968152866242e-05, "loss": 0.846, "step": 255 }, { "ce_ib": 14.843269348144531, "ce_orig": 0.8040740489959717, "epoch": 0.0733338126392983, "kl_loss": 0.37673041224479675, "loss_ib": 0.005251631140708923, "step": 255 }, { "ce_ib": 14.139528274536133, "ce_orig": 0.7245256304740906, "epoch": 0.0733338126392983, "kl_loss": 0.3231876790523529, "loss_ib": 0.004645829554647207, "step": 255 }, { "ce_ib": 24.16304588317871, "ce_orig": 1.9036223888397217, "epoch": 0.0733338126392983, "kl_loss": 0.2994362413883209, "loss_ib": 0.005410667043179274, "step": 255 }, { "ce_ib": 17.201786041259766, "ce_orig": 0.680133044719696, "epoch": 0.0733338126392983, "kl_loss": 0.3443969786167145, "loss_ib": 0.005164148285984993, "step": 255 }, { "ce_ib": 11.843783378601074, "ce_orig": 0.5880969166755676, "epoch": 0.07362139621827593, "kl_loss": 0.2765531539916992, "loss_ib": 0.003949909936636686, "step": 256 }, { "ce_ib": 15.530258178710938, "ce_orig": 0.7509983777999878, "epoch": 0.07362139621827593, "kl_loss": 0.3052097260951996, "loss_ib": 0.004605122841894627, "step": 256 }, { "ce_ib": 18.292640686035156, "ce_orig": 0.9828827977180481, "epoch": 0.07362139621827593, "kl_loss": 0.29785263538360596, "loss_ib": 0.0048077902756631374, "step": 256 }, { "ce_ib": 12.437490463256836, "ce_orig": 0.5975197553634644, "epoch": 0.07362139621827593, "kl_loss": 0.32125842571258545, "loss_ib": 0.004456333350390196, "step": 256 }, { "ce_ib": 17.51129722595215, "ce_orig": 0.6895196437835693, "epoch": 0.07390897979725358, "kl_loss": 0.29928696155548096, "loss_ib": 0.00474399933591485, "step": 257 }, { "ce_ib": 19.982250213623047, "ce_orig": 1.2780667543411255, "epoch": 0.07390897979725358, "kl_loss": 0.4109703004360199, "loss_ib": 0.006107928231358528, "step": 257 }, { "ce_ib": 18.59293556213379, "ce_orig": 0.7878507375717163, "epoch": 0.07390897979725358, "kl_loss": 0.2821478247642517, "loss_ib": 0.004680771846324205, "step": 257 }, { "ce_ib": 16.528976440429688, "ce_orig": 0.9417824149131775, "epoch": 0.07390897979725358, "kl_loss": 0.2769574522972107, "loss_ib": 0.004422471858561039, "step": 257 }, { "ce_ib": 12.966187477111816, "ce_orig": 0.5238648653030396, "epoch": 0.07419656337623122, "kl_loss": 0.31731730699539185, "loss_ib": 0.004469791427254677, "step": 258 }, { "ce_ib": 13.36031723022461, "ce_orig": 0.5534040927886963, "epoch": 0.07419656337623122, "kl_loss": 0.2720886170864105, "loss_ib": 0.00405691796913743, "step": 258 }, { "ce_ib": 19.149700164794922, "ce_orig": 1.4191524982452393, "epoch": 0.07419656337623122, "kl_loss": 0.34151729941368103, "loss_ib": 0.00533014303073287, "step": 258 }, { "ce_ib": 19.49608612060547, "ce_orig": 1.3304085731506348, "epoch": 0.07419656337623122, "kl_loss": 0.303983211517334, "loss_ib": 0.004989440552890301, "step": 258 }, { "ce_ib": 16.158462524414062, "ce_orig": 0.7256084680557251, "epoch": 0.07448414695520886, "kl_loss": 0.3417550027370453, "loss_ib": 0.0050333961844444275, "step": 259 }, { "ce_ib": 15.630940437316895, "ce_orig": 0.45199069380760193, "epoch": 0.07448414695520886, "kl_loss": 0.3961242437362671, "loss_ib": 0.005524335894733667, "step": 259 }, { "ce_ib": 15.765962600708008, "ce_orig": 1.1196238994598389, "epoch": 0.07448414695520886, "kl_loss": 0.25270766019821167, "loss_ib": 0.004103672690689564, "step": 259 }, { "ce_ib": 13.915310859680176, "ce_orig": 0.8033282160758972, "epoch": 0.07448414695520886, "kl_loss": 0.292714923620224, "loss_ib": 0.00431868014857173, "step": 259 }, { "epoch": 0.0747717305341865, "grad_norm": 0.08863961696624756, "learning_rate": 4.044585987261147e-05, "loss": 0.8927, "step": 260 }, { "ce_ib": 15.066596031188965, "ce_orig": 0.8063942193984985, "epoch": 0.0747717305341865, "kl_loss": 0.28827041387557983, "loss_ib": 0.004389363341033459, "step": 260 }, { "ce_ib": 12.796646118164062, "ce_orig": 0.41930192708969116, "epoch": 0.0747717305341865, "kl_loss": 0.2615140378475189, "loss_ib": 0.0038948049768805504, "step": 260 }, { "ce_ib": 14.110474586486816, "ce_orig": 0.68003249168396, "epoch": 0.0747717305341865, "kl_loss": 0.261357843875885, "loss_ib": 0.0040246257558465, "step": 260 }, { "ce_ib": 17.80391502380371, "ce_orig": 0.7285661697387695, "epoch": 0.0747717305341865, "kl_loss": 0.29259398579597473, "loss_ib": 0.00470633152872324, "step": 260 }, { "ce_ib": 10.909024238586426, "ce_orig": 0.47324129939079285, "epoch": 0.07505931411316413, "kl_loss": 0.2249765694141388, "loss_ib": 0.0033406680449843407, "step": 261 }, { "ce_ib": 15.371655464172363, "ce_orig": 0.9706589579582214, "epoch": 0.07505931411316413, "kl_loss": 0.2712176442146301, "loss_ib": 0.004249341785907745, "step": 261 }, { "ce_ib": 13.265528678894043, "ce_orig": 0.8591080904006958, "epoch": 0.07505931411316413, "kl_loss": 0.2495938241481781, "loss_ib": 0.0038224910385906696, "step": 261 }, { "ce_ib": 10.983420372009277, "ce_orig": 0.6682037711143494, "epoch": 0.07505931411316413, "kl_loss": 0.18751020729541779, "loss_ib": 0.0029734440613538027, "step": 261 }, { "ce_ib": 11.951087951660156, "ce_orig": 0.6800048351287842, "epoch": 0.07534689769214178, "kl_loss": 0.3001071512699127, "loss_ib": 0.004196180030703545, "step": 262 }, { "ce_ib": 17.0267276763916, "ce_orig": 0.4345322549343109, "epoch": 0.07534689769214178, "kl_loss": 0.3833320736885071, "loss_ib": 0.005535993259400129, "step": 262 }, { "ce_ib": 18.44808006286621, "ce_orig": 0.9550086259841919, "epoch": 0.07534689769214178, "kl_loss": 0.2870803773403168, "loss_ib": 0.004715611692517996, "step": 262 }, { "ce_ib": 16.392032623291016, "ce_orig": 1.0675876140594482, "epoch": 0.07534689769214178, "kl_loss": 0.30814555287361145, "loss_ib": 0.004720658529549837, "step": 262 }, { "ce_ib": 16.68846321105957, "ce_orig": 0.6256803274154663, "epoch": 0.07563448127111942, "kl_loss": 0.2585268020629883, "loss_ib": 0.004254114348441362, "step": 263 }, { "ce_ib": 12.127674102783203, "ce_orig": 0.5661578178405762, "epoch": 0.07563448127111942, "kl_loss": 0.23702625930309296, "loss_ib": 0.0035830300766974688, "step": 263 }, { "ce_ib": 16.941381454467773, "ce_orig": 0.6445264220237732, "epoch": 0.07563448127111942, "kl_loss": 0.29147881269454956, "loss_ib": 0.004608925897628069, "step": 263 }, { "ce_ib": 11.159895896911621, "ce_orig": 0.6294872164726257, "epoch": 0.07563448127111942, "kl_loss": 0.25180041790008545, "loss_ib": 0.0036339936777949333, "step": 263 }, { "ce_ib": 16.635135650634766, "ce_orig": 1.0586961507797241, "epoch": 0.07592206485009706, "kl_loss": 0.2687499523162842, "loss_ib": 0.004351012874394655, "step": 264 }, { "ce_ib": 12.455622673034668, "ce_orig": 0.8253864049911499, "epoch": 0.07592206485009706, "kl_loss": 0.24592146277427673, "loss_ib": 0.00370477675460279, "step": 264 }, { "ce_ib": 11.99234676361084, "ce_orig": 0.571262776851654, "epoch": 0.07592206485009706, "kl_loss": 0.19673100113868713, "loss_ib": 0.0031665447168052197, "step": 264 }, { "ce_ib": 16.71959114074707, "ce_orig": 0.8490833044052124, "epoch": 0.07592206485009706, "kl_loss": 0.3431280553340912, "loss_ib": 0.005103239323943853, "step": 264 }, { "epoch": 0.0762096484290747, "grad_norm": 0.09324845671653748, "learning_rate": 4.1242038216560514e-05, "loss": 0.8594, "step": 265 }, { "ce_ib": 13.668450355529785, "ce_orig": 0.7410028576850891, "epoch": 0.0762096484290747, "kl_loss": 0.3923606872558594, "loss_ib": 0.005290451925247908, "step": 265 }, { "ce_ib": 16.50493621826172, "ce_orig": 0.904811441898346, "epoch": 0.0762096484290747, "kl_loss": 0.32142162322998047, "loss_ib": 0.004864709917455912, "step": 265 }, { "ce_ib": 14.940958976745605, "ce_orig": 1.0615205764770508, "epoch": 0.0762096484290747, "kl_loss": 0.2736600637435913, "loss_ib": 0.004230696242302656, "step": 265 }, { "ce_ib": 20.21286964416504, "ce_orig": 0.936401903629303, "epoch": 0.0762096484290747, "kl_loss": 0.2895187437534332, "loss_ib": 0.004916474223136902, "step": 265 }, { "ce_ib": 15.859089851379395, "ce_orig": 0.9013702869415283, "epoch": 0.07649723200805233, "kl_loss": 0.2485354244709015, "loss_ib": 0.004071263130754232, "step": 266 }, { "ce_ib": 14.475261688232422, "ce_orig": 0.9954730272293091, "epoch": 0.07649723200805233, "kl_loss": 0.2513744533061981, "loss_ib": 0.003961270209401846, "step": 266 }, { "ce_ib": 20.038143157958984, "ce_orig": 1.3421083688735962, "epoch": 0.07649723200805233, "kl_loss": 0.281283974647522, "loss_ib": 0.00481665413826704, "step": 266 }, { "ce_ib": 22.541851043701172, "ce_orig": 1.7132771015167236, "epoch": 0.07649723200805233, "kl_loss": 0.31567251682281494, "loss_ib": 0.005410910118371248, "step": 266 }, { "ce_ib": 14.337822914123535, "ce_orig": 0.8144393563270569, "epoch": 0.07678481558702999, "kl_loss": 0.31490829586982727, "loss_ib": 0.004582865163683891, "step": 267 }, { "ce_ib": 16.432825088500977, "ce_orig": 0.5571436285972595, "epoch": 0.07678481558702999, "kl_loss": 0.3173448443412781, "loss_ib": 0.004816730972379446, "step": 267 }, { "ce_ib": 18.915435791015625, "ce_orig": 1.2111248970031738, "epoch": 0.07678481558702999, "kl_loss": 0.27650901675224304, "loss_ib": 0.004656633827835321, "step": 267 }, { "ce_ib": 20.70977783203125, "ce_orig": 1.6732383966445923, "epoch": 0.07678481558702999, "kl_loss": 0.32756784558296204, "loss_ib": 0.00534665584564209, "step": 267 }, { "ce_ib": 19.59430503845215, "ce_orig": 1.263615369796753, "epoch": 0.07707239916600762, "kl_loss": 0.2561582028865814, "loss_ib": 0.004521012306213379, "step": 268 }, { "ce_ib": 24.518985748291016, "ce_orig": 2.1271183490753174, "epoch": 0.07707239916600762, "kl_loss": 0.36851945519447327, "loss_ib": 0.006137093063443899, "step": 268 }, { "ce_ib": 16.20216941833496, "ce_orig": 0.524202823638916, "epoch": 0.07707239916600762, "kl_loss": 0.30454859137535095, "loss_ib": 0.00466570258140564, "step": 268 }, { "ce_ib": 16.534713745117188, "ce_orig": 0.59481281042099, "epoch": 0.07707239916600762, "kl_loss": 0.24704763293266296, "loss_ib": 0.004123947583138943, "step": 268 }, { "ce_ib": 15.644123077392578, "ce_orig": 0.9609376788139343, "epoch": 0.07735998274498526, "kl_loss": 0.24495989084243774, "loss_ib": 0.0040140110068023205, "step": 269 }, { "ce_ib": 13.680428504943848, "ce_orig": 0.7830809950828552, "epoch": 0.07735998274498526, "kl_loss": 0.23677141964435577, "loss_ib": 0.0037357567343860865, "step": 269 }, { "ce_ib": 19.454843521118164, "ce_orig": 0.8037047386169434, "epoch": 0.07735998274498526, "kl_loss": 0.33364683389663696, "loss_ib": 0.005281952675431967, "step": 269 }, { "ce_ib": 13.62769889831543, "ce_orig": 0.7561288475990295, "epoch": 0.07735998274498526, "kl_loss": 0.3251601457595825, "loss_ib": 0.004614371340721846, "step": 269 }, { "epoch": 0.0776475663239629, "grad_norm": 0.06999674439430237, "learning_rate": 4.2038216560509556e-05, "loss": 0.8477, "step": 270 }, { "ce_ib": 15.570327758789062, "ce_orig": 0.5456323027610779, "epoch": 0.0776475663239629, "kl_loss": 0.24074603617191315, "loss_ib": 0.003964493051171303, "step": 270 }, { "ce_ib": 12.79995346069336, "ce_orig": 0.5012090802192688, "epoch": 0.0776475663239629, "kl_loss": 0.3022935688495636, "loss_ib": 0.004302930552512407, "step": 270 }, { "ce_ib": 16.223758697509766, "ce_orig": 0.3916482925415039, "epoch": 0.0776475663239629, "kl_loss": 0.27299919724464417, "loss_ib": 0.004352367948740721, "step": 270 }, { "ce_ib": 14.882962226867676, "ce_orig": 0.9101399183273315, "epoch": 0.0776475663239629, "kl_loss": 0.2818550765514374, "loss_ib": 0.004306846763938665, "step": 270 }, { "ce_ib": 15.584421157836914, "ce_orig": 0.616856575012207, "epoch": 0.07793514990294054, "kl_loss": 0.2159929871559143, "loss_ib": 0.003718371968716383, "step": 271 }, { "ce_ib": 14.746891975402832, "ce_orig": 0.5636629462242126, "epoch": 0.07793514990294054, "kl_loss": 0.3384188413619995, "loss_ib": 0.004858877509832382, "step": 271 }, { "ce_ib": 19.72770881652832, "ce_orig": 1.6866846084594727, "epoch": 0.07793514990294054, "kl_loss": 0.2658270597457886, "loss_ib": 0.004631041083484888, "step": 271 }, { "ce_ib": 13.834111213684082, "ce_orig": 0.4504989981651306, "epoch": 0.07793514990294054, "kl_loss": 0.309722900390625, "loss_ib": 0.0044806404039263725, "step": 271 }, { "ce_ib": 16.82283592224121, "ce_orig": 1.4967201948165894, "epoch": 0.07822273348191819, "kl_loss": 0.2537575364112854, "loss_ib": 0.004219858907163143, "step": 272 }, { "ce_ib": 16.692188262939453, "ce_orig": 0.7724244594573975, "epoch": 0.07822273348191819, "kl_loss": 0.3247263431549072, "loss_ib": 0.004916482139378786, "step": 272 }, { "ce_ib": 17.720109939575195, "ce_orig": 1.0197162628173828, "epoch": 0.07822273348191819, "kl_loss": 0.3129570484161377, "loss_ib": 0.004901581443846226, "step": 272 }, { "ce_ib": 11.472055435180664, "ce_orig": 0.7266469597816467, "epoch": 0.07822273348191819, "kl_loss": 0.2540128827095032, "loss_ib": 0.0036873342469334602, "step": 272 }, { "ce_ib": 14.627097129821777, "ce_orig": 0.5554067492485046, "epoch": 0.07851031706089583, "kl_loss": 0.27136164903640747, "loss_ib": 0.004176326096057892, "step": 273 }, { "ce_ib": 12.32707405090332, "ce_orig": 0.832676887512207, "epoch": 0.07851031706089583, "kl_loss": 0.23146983981132507, "loss_ib": 0.0035474055912345648, "step": 273 }, { "ce_ib": 14.380395889282227, "ce_orig": 0.5141070485115051, "epoch": 0.07851031706089583, "kl_loss": 0.2842778265476227, "loss_ib": 0.004280817694962025, "step": 273 }, { "ce_ib": 16.54999351501465, "ce_orig": 1.1931746006011963, "epoch": 0.07851031706089583, "kl_loss": 0.3062623143196106, "loss_ib": 0.004717622417956591, "step": 273 }, { "ce_ib": 16.448566436767578, "ce_orig": 0.9063194394111633, "epoch": 0.07879790063987346, "kl_loss": 0.254788339138031, "loss_ib": 0.004192739725112915, "step": 274 }, { "ce_ib": 20.326473236083984, "ce_orig": 1.289271593093872, "epoch": 0.07879790063987346, "kl_loss": 0.21474193036556244, "loss_ib": 0.004180066287517548, "step": 274 }, { "ce_ib": 14.406719207763672, "ce_orig": 1.0166672468185425, "epoch": 0.07879790063987346, "kl_loss": 0.2415088266134262, "loss_ib": 0.0038557599764317274, "step": 274 }, { "ce_ib": 17.027986526489258, "ce_orig": 1.0573188066482544, "epoch": 0.07879790063987346, "kl_loss": 0.33195120096206665, "loss_ib": 0.0050223106518387794, "step": 274 }, { "epoch": 0.0790854842188511, "grad_norm": 0.08076049387454987, "learning_rate": 4.2834394904458604e-05, "loss": 0.908, "step": 275 }, { "ce_ib": 11.249130249023438, "ce_orig": 0.5311962962150574, "epoch": 0.0790854842188511, "kl_loss": 0.2099292278289795, "loss_ib": 0.0032242052257061005, "step": 275 }, { "ce_ib": 17.736249923706055, "ce_orig": 0.9784615635871887, "epoch": 0.0790854842188511, "kl_loss": 0.27468031644821167, "loss_ib": 0.004520427901297808, "step": 275 }, { "ce_ib": 14.927811622619629, "ce_orig": 0.7807605862617493, "epoch": 0.0790854842188511, "kl_loss": 0.35637491941452026, "loss_ib": 0.005056530237197876, "step": 275 }, { "ce_ib": 12.488973617553711, "ce_orig": 0.8185478448867798, "epoch": 0.0790854842188511, "kl_loss": 0.31116726994514465, "loss_ib": 0.004360570106655359, "step": 275 }, { "ce_ib": 15.501134872436523, "ce_orig": 1.238783597946167, "epoch": 0.07937306779782874, "kl_loss": 0.20382773876190186, "loss_ib": 0.0035883907694369555, "step": 276 }, { "ce_ib": 17.22933578491211, "ce_orig": 1.2730385065078735, "epoch": 0.07937306779782874, "kl_loss": 0.47506648302078247, "loss_ib": 0.006473598536103964, "step": 276 }, { "ce_ib": 13.309030532836914, "ce_orig": 0.5584474802017212, "epoch": 0.07937306779782874, "kl_loss": 0.23811832070350647, "loss_ib": 0.003712086006999016, "step": 276 }, { "ce_ib": 12.37324333190918, "ce_orig": 0.8598084449768066, "epoch": 0.07937306779782874, "kl_loss": 0.20274879038333893, "loss_ib": 0.0032648120541125536, "step": 276 }, { "ce_ib": 18.88533592224121, "ce_orig": 0.7922468781471252, "epoch": 0.07966065137680639, "kl_loss": 0.2773568034172058, "loss_ib": 0.004662101622670889, "step": 277 }, { "ce_ib": 16.412996292114258, "ce_orig": 0.7500933408737183, "epoch": 0.07966065137680639, "kl_loss": 0.27461355924606323, "loss_ib": 0.004387435037642717, "step": 277 }, { "ce_ib": 15.230081558227539, "ce_orig": 1.1697120666503906, "epoch": 0.07966065137680639, "kl_loss": 0.2722022533416748, "loss_ib": 0.00424503069370985, "step": 277 }, { "ce_ib": 15.583248138427734, "ce_orig": 0.8734590411186218, "epoch": 0.07966065137680639, "kl_loss": 0.2992432117462158, "loss_ib": 0.004550756886601448, "step": 277 }, { "ce_ib": 15.06824779510498, "ce_orig": 1.1103448867797852, "epoch": 0.07994823495578403, "kl_loss": 0.2773784101009369, "loss_ib": 0.0042806086130440235, "step": 278 }, { "ce_ib": 19.022869110107422, "ce_orig": 1.0327725410461426, "epoch": 0.07994823495578403, "kl_loss": 0.33331602811813354, "loss_ib": 0.005235447082668543, "step": 278 }, { "ce_ib": 15.828374862670898, "ce_orig": 0.5875866413116455, "epoch": 0.07994823495578403, "kl_loss": 0.1845521628856659, "loss_ib": 0.0034283590503036976, "step": 278 }, { "ce_ib": 10.436365127563477, "ce_orig": 0.6552335023880005, "epoch": 0.07994823495578403, "kl_loss": 0.18279395997524261, "loss_ib": 0.0028715759981423616, "step": 278 }, { "ce_ib": 12.258537292480469, "ce_orig": 0.6182965636253357, "epoch": 0.08023581853476167, "kl_loss": 0.2173025906085968, "loss_ib": 0.00339887966401875, "step": 279 }, { "ce_ib": 16.939525604248047, "ce_orig": 1.2229260206222534, "epoch": 0.08023581853476167, "kl_loss": 0.249847412109375, "loss_ib": 0.004192426800727844, "step": 279 }, { "ce_ib": 16.706846237182617, "ce_orig": 1.1211984157562256, "epoch": 0.08023581853476167, "kl_loss": 0.2522197961807251, "loss_ib": 0.004192882217466831, "step": 279 }, { "ce_ib": 14.674199104309082, "ce_orig": 0.790857195854187, "epoch": 0.08023581853476167, "kl_loss": 0.20820698142051697, "loss_ib": 0.0035494896583259106, "step": 279 }, { "epoch": 0.0805234021137393, "grad_norm": 0.07456893473863602, "learning_rate": 4.3630573248407646e-05, "loss": 0.8909, "step": 280 }, { "ce_ib": 17.366165161132812, "ce_orig": 0.7224763035774231, "epoch": 0.0805234021137393, "kl_loss": 0.2818063497543335, "loss_ib": 0.004554680082947016, "step": 280 }, { "ce_ib": 15.292021751403809, "ce_orig": 0.5337414145469666, "epoch": 0.0805234021137393, "kl_loss": 0.24038422107696533, "loss_ib": 0.003933044150471687, "step": 280 }, { "ce_ib": 13.491898536682129, "ce_orig": 0.5026684999465942, "epoch": 0.0805234021137393, "kl_loss": 0.19754835963249207, "loss_ib": 0.0033246735110878944, "step": 280 }, { "ce_ib": 18.61618995666504, "ce_orig": 1.3851393461227417, "epoch": 0.0805234021137393, "kl_loss": 0.3309285044670105, "loss_ib": 0.005170903634279966, "step": 280 }, { "ce_ib": 12.345269203186035, "ce_orig": 0.6989408135414124, "epoch": 0.08081098569271694, "kl_loss": 0.22234660387039185, "loss_ib": 0.0034579928033053875, "step": 281 }, { "ce_ib": 11.875962257385254, "ce_orig": 0.6694311499595642, "epoch": 0.08081098569271694, "kl_loss": 0.19901394844055176, "loss_ib": 0.003177735721692443, "step": 281 }, { "ce_ib": 17.15048599243164, "ce_orig": 0.5024470090866089, "epoch": 0.08081098569271694, "kl_loss": 0.3105819821357727, "loss_ib": 0.004820868372917175, "step": 281 }, { "ce_ib": 18.85089111328125, "ce_orig": 1.5827473402023315, "epoch": 0.08081098569271694, "kl_loss": 0.2236773669719696, "loss_ib": 0.004121862351894379, "step": 281 }, { "ce_ib": 14.070013999938965, "ce_orig": 0.9050841331481934, "epoch": 0.08109856927169459, "kl_loss": 0.26318368315696716, "loss_ib": 0.00403883820399642, "step": 282 }, { "ce_ib": 15.759684562683105, "ce_orig": 0.9596781134605408, "epoch": 0.08109856927169459, "kl_loss": 0.3149911165237427, "loss_ib": 0.0047258795239031315, "step": 282 }, { "ce_ib": 18.05628776550293, "ce_orig": 0.9637153148651123, "epoch": 0.08109856927169459, "kl_loss": 0.27664974331855774, "loss_ib": 0.004572126083076, "step": 282 }, { "ce_ib": 18.621143341064453, "ce_orig": 1.693290114402771, "epoch": 0.08109856927169459, "kl_loss": 0.2584025263786316, "loss_ib": 0.004446139093488455, "step": 282 }, { "ce_ib": 11.559967041015625, "ce_orig": 0.8692753911018372, "epoch": 0.08138615285067223, "kl_loss": 0.26356419920921326, "loss_ib": 0.0037916384171694517, "step": 283 }, { "ce_ib": 16.148008346557617, "ce_orig": 1.3362113237380981, "epoch": 0.08138615285067223, "kl_loss": 0.316663920879364, "loss_ib": 0.004781439900398254, "step": 283 }, { "ce_ib": 21.178966522216797, "ce_orig": 1.0704444646835327, "epoch": 0.08138615285067223, "kl_loss": 0.310921311378479, "loss_ib": 0.005227109882980585, "step": 283 }, { "ce_ib": 14.54597282409668, "ce_orig": 0.6114582419395447, "epoch": 0.08138615285067223, "kl_loss": 0.2650757431983948, "loss_ib": 0.004105354659259319, "step": 283 }, { "ce_ib": 12.013655662536621, "ce_orig": 0.8571666479110718, "epoch": 0.08167373642964987, "kl_loss": 0.2690030634403229, "loss_ib": 0.003891396103426814, "step": 284 }, { "ce_ib": 16.22176170349121, "ce_orig": 0.6218030452728271, "epoch": 0.08167373642964987, "kl_loss": 0.291636198759079, "loss_ib": 0.004538537934422493, "step": 284 }, { "ce_ib": 16.29920768737793, "ce_orig": 1.2184849977493286, "epoch": 0.08167373642964987, "kl_loss": 0.2997811734676361, "loss_ib": 0.004627732560038567, "step": 284 }, { "ce_ib": 12.09832763671875, "ce_orig": 0.6244350075721741, "epoch": 0.08167373642964987, "kl_loss": 0.2652917504310608, "loss_ib": 0.0038627502508461475, "step": 284 }, { "epoch": 0.0819613200086275, "grad_norm": 0.07042936980724335, "learning_rate": 4.442675159235669e-05, "loss": 0.9056, "step": 285 }, { "ce_ib": 13.477680206298828, "ce_orig": 0.6597225666046143, "epoch": 0.0819613200086275, "kl_loss": 0.26786327362060547, "loss_ib": 0.0040264008566737175, "step": 285 }, { "ce_ib": 16.648954391479492, "ce_orig": 0.7288675904273987, "epoch": 0.0819613200086275, "kl_loss": 0.234561488032341, "loss_ib": 0.004010510165244341, "step": 285 }, { "ce_ib": 16.058998107910156, "ce_orig": 0.9044990539550781, "epoch": 0.0819613200086275, "kl_loss": 0.438146710395813, "loss_ib": 0.0059873671270906925, "step": 285 }, { "ce_ib": 14.675004005432129, "ce_orig": 0.6858831644058228, "epoch": 0.0819613200086275, "kl_loss": 0.41518154740333557, "loss_ib": 0.005619315896183252, "step": 285 }, { "ce_ib": 19.281421661376953, "ce_orig": 1.3555938005447388, "epoch": 0.08224890358760514, "kl_loss": 0.27201730012893677, "loss_ib": 0.004648315254598856, "step": 286 }, { "ce_ib": 14.502872467041016, "ce_orig": 0.7407470345497131, "epoch": 0.08224890358760514, "kl_loss": 0.16434180736541748, "loss_ib": 0.0030937050469219685, "step": 286 }, { "ce_ib": 16.41741180419922, "ce_orig": 1.1262027025222778, "epoch": 0.08224890358760514, "kl_loss": 0.2105521857738495, "loss_ib": 0.0037472627591341734, "step": 286 }, { "ce_ib": 19.66245460510254, "ce_orig": 1.3670978546142578, "epoch": 0.08224890358760514, "kl_loss": 0.2873149514198303, "loss_ib": 0.004839394707232714, "step": 286 }, { "ce_ib": 13.970117568969727, "ce_orig": 0.588868260383606, "epoch": 0.0825364871665828, "kl_loss": 0.27275267243385315, "loss_ib": 0.004124538041651249, "step": 287 }, { "ce_ib": 17.439908981323242, "ce_orig": 1.1837517023086548, "epoch": 0.0825364871665828, "kl_loss": 0.1923927515745163, "loss_ib": 0.0036679182667285204, "step": 287 }, { "ce_ib": 10.239778518676758, "ce_orig": 0.5817263722419739, "epoch": 0.0825364871665828, "kl_loss": 0.2323988527059555, "loss_ib": 0.003347966354340315, "step": 287 }, { "ce_ib": 13.104039192199707, "ce_orig": 0.8184726238250732, "epoch": 0.0825364871665828, "kl_loss": 0.272987425327301, "loss_ib": 0.0040402780286967754, "step": 287 }, { "ce_ib": 11.393816947937012, "ce_orig": 0.882415235042572, "epoch": 0.08282407074556043, "kl_loss": 0.17284469306468964, "loss_ib": 0.0028678285889327526, "step": 288 }, { "ce_ib": 14.922150611877441, "ce_orig": 0.6627479791641235, "epoch": 0.08282407074556043, "kl_loss": 0.20301824808120728, "loss_ib": 0.0035223974846303463, "step": 288 }, { "ce_ib": 17.70345687866211, "ce_orig": 0.603179931640625, "epoch": 0.08282407074556043, "kl_loss": 0.32347768545150757, "loss_ib": 0.005005122162401676, "step": 288 }, { "ce_ib": 11.391678810119629, "ce_orig": 0.6061888337135315, "epoch": 0.08282407074556043, "kl_loss": 0.26528626680374146, "loss_ib": 0.003792030503973365, "step": 288 }, { "ce_ib": 13.464797019958496, "ce_orig": 0.5479658246040344, "epoch": 0.08311165432453807, "kl_loss": 0.21538397669792175, "loss_ib": 0.003500319318845868, "step": 289 }, { "ce_ib": 19.783390045166016, "ce_orig": 1.4441841840744019, "epoch": 0.08311165432453807, "kl_loss": 0.2706390619277954, "loss_ib": 0.004684729501605034, "step": 289 }, { "ce_ib": 16.319841384887695, "ce_orig": 1.0974111557006836, "epoch": 0.08311165432453807, "kl_loss": 0.3325914144515991, "loss_ib": 0.004957898054271936, "step": 289 }, { "ce_ib": 15.902824401855469, "ce_orig": 0.6798999905586243, "epoch": 0.08311165432453807, "kl_loss": 0.2273552566766739, "loss_ib": 0.003863835008814931, "step": 289 }, { "epoch": 0.08339923790351571, "grad_norm": 0.07085248827934265, "learning_rate": 4.522292993630574e-05, "loss": 0.8988, "step": 290 }, { "ce_ib": 12.853606224060059, "ce_orig": 0.5977413654327393, "epoch": 0.08339923790351571, "kl_loss": 0.258215069770813, "loss_ib": 0.003867511171847582, "step": 290 }, { "ce_ib": 13.45907211303711, "ce_orig": 0.7957695722579956, "epoch": 0.08339923790351571, "kl_loss": 0.2829551100730896, "loss_ib": 0.00417545810341835, "step": 290 }, { "ce_ib": 16.264999389648438, "ce_orig": 0.921114444732666, "epoch": 0.08339923790351571, "kl_loss": 0.2568701505661011, "loss_ib": 0.004195201210677624, "step": 290 }, { "ce_ib": 11.070430755615234, "ce_orig": 0.828477680683136, "epoch": 0.08339923790351571, "kl_loss": 0.18585243821144104, "loss_ib": 0.0029655674006789923, "step": 290 }, { "ce_ib": 15.938783645629883, "ce_orig": 0.8985275626182556, "epoch": 0.08368682148249335, "kl_loss": 0.322698712348938, "loss_ib": 0.004820865113288164, "step": 291 }, { "ce_ib": 12.973055839538574, "ce_orig": 0.9591237902641296, "epoch": 0.08368682148249335, "kl_loss": 0.1751486361026764, "loss_ib": 0.0030487917829304934, "step": 291 }, { "ce_ib": 15.191100120544434, "ce_orig": 0.9854549765586853, "epoch": 0.08368682148249335, "kl_loss": 0.2032536417245865, "loss_ib": 0.0035516463685780764, "step": 291 }, { "ce_ib": 15.310328483581543, "ce_orig": 0.8211847543716431, "epoch": 0.08368682148249335, "kl_loss": 0.2667645514011383, "loss_ib": 0.004198677837848663, "step": 291 }, { "ce_ib": 16.732818603515625, "ce_orig": 0.9525948166847229, "epoch": 0.083974405061471, "kl_loss": 0.24904996156692505, "loss_ib": 0.004163781180977821, "step": 292 }, { "ce_ib": 14.454859733581543, "ce_orig": 0.8364003896713257, "epoch": 0.083974405061471, "kl_loss": 0.300500750541687, "loss_ib": 0.0044504934921860695, "step": 292 }, { "ce_ib": 16.7276611328125, "ce_orig": 1.103460431098938, "epoch": 0.083974405061471, "kl_loss": 0.25054287910461426, "loss_ib": 0.004178194794803858, "step": 292 }, { "ce_ib": 18.47587776184082, "ce_orig": 1.1350774765014648, "epoch": 0.083974405061471, "kl_loss": 0.2811344861984253, "loss_ib": 0.00465893279761076, "step": 292 }, { "ce_ib": 15.593929290771484, "ce_orig": 0.7370646595954895, "epoch": 0.08426198864044863, "kl_loss": 0.21932320296764374, "loss_ib": 0.003752624848857522, "step": 293 }, { "ce_ib": 15.527499198913574, "ce_orig": 1.2750834226608276, "epoch": 0.08426198864044863, "kl_loss": 0.23349913954734802, "loss_ib": 0.0038877411279827356, "step": 293 }, { "ce_ib": 12.307111740112305, "ce_orig": 0.68174147605896, "epoch": 0.08426198864044863, "kl_loss": 0.29035478830337524, "loss_ib": 0.004134258721023798, "step": 293 }, { "ce_ib": 11.335613250732422, "ce_orig": 0.65586918592453, "epoch": 0.08426198864044863, "kl_loss": 0.21021895110607147, "loss_ib": 0.0032357508316636086, "step": 293 }, { "ce_ib": 12.788888931274414, "ce_orig": 1.1009180545806885, "epoch": 0.08454957221942627, "kl_loss": 0.2401624619960785, "loss_ib": 0.00368051347322762, "step": 294 }, { "ce_ib": 16.075815200805664, "ce_orig": 0.7001639604568481, "epoch": 0.08454957221942627, "kl_loss": 0.32635319232940674, "loss_ib": 0.00487111322581768, "step": 294 }, { "ce_ib": 12.539616584777832, "ce_orig": 0.7154040932655334, "epoch": 0.08454957221942627, "kl_loss": 0.1870480477809906, "loss_ib": 0.0031244419515132904, "step": 294 }, { "ce_ib": 12.290575981140137, "ce_orig": 0.8135526180267334, "epoch": 0.08454957221942627, "kl_loss": 0.2699443995952606, "loss_ib": 0.003928501624614, "step": 294 }, { "epoch": 0.08483715579840391, "grad_norm": 0.07897292077541351, "learning_rate": 4.601910828025478e-05, "loss": 0.8706, "step": 295 }, { "ce_ib": 18.31114959716797, "ce_orig": 0.6431681513786316, "epoch": 0.08483715579840391, "kl_loss": 0.27935224771499634, "loss_ib": 0.004624637309461832, "step": 295 }, { "ce_ib": 13.731470108032227, "ce_orig": 0.8691681623458862, "epoch": 0.08483715579840391, "kl_loss": 0.19459585845470428, "loss_ib": 0.003319105366244912, "step": 295 }, { "ce_ib": 11.220470428466797, "ce_orig": 0.7137093544006348, "epoch": 0.08483715579840391, "kl_loss": 0.1932218372821808, "loss_ib": 0.003054265398532152, "step": 295 }, { "ce_ib": 13.056318283081055, "ce_orig": 0.5071139931678772, "epoch": 0.08483715579840391, "kl_loss": 0.21704959869384766, "loss_ib": 0.0034761279821395874, "step": 295 }, { "ce_ib": 11.606334686279297, "ce_orig": 0.7217742800712585, "epoch": 0.08512473937738155, "kl_loss": 0.1716514676809311, "loss_ib": 0.002877148101106286, "step": 296 }, { "ce_ib": 17.7640438079834, "ce_orig": 1.607155203819275, "epoch": 0.08512473937738155, "kl_loss": 0.29561007022857666, "loss_ib": 0.004732504952698946, "step": 296 }, { "ce_ib": 17.47099494934082, "ce_orig": 0.9363014698028564, "epoch": 0.08512473937738155, "kl_loss": 0.27039089798927307, "loss_ib": 0.004451008513569832, "step": 296 }, { "ce_ib": 17.832012176513672, "ce_orig": 1.6501764059066772, "epoch": 0.08512473937738155, "kl_loss": 0.5178996324539185, "loss_ib": 0.006962197367101908, "step": 296 }, { "ce_ib": 13.307634353637695, "ce_orig": 0.8553745746612549, "epoch": 0.08541232295635919, "kl_loss": 0.28302001953125, "loss_ib": 0.004160963464528322, "step": 297 }, { "ce_ib": 13.746207237243652, "ce_orig": 0.6645457744598389, "epoch": 0.08541232295635919, "kl_loss": 0.2449042946100235, "loss_ib": 0.0038236635737121105, "step": 297 }, { "ce_ib": 11.31932544708252, "ce_orig": 0.4558902978897095, "epoch": 0.08541232295635919, "kl_loss": 0.1459667682647705, "loss_ib": 0.002591600175946951, "step": 297 }, { "ce_ib": 10.261171340942383, "ce_orig": 0.7316778302192688, "epoch": 0.08541232295635919, "kl_loss": 0.18448230624198914, "loss_ib": 0.002870940137654543, "step": 297 }, { "ce_ib": 15.214677810668945, "ce_orig": 0.7406959533691406, "epoch": 0.08569990653533684, "kl_loss": 0.3475422263145447, "loss_ib": 0.004996889736503363, "step": 298 }, { "ce_ib": 12.732254981994629, "ce_orig": 0.9583520889282227, "epoch": 0.08569990653533684, "kl_loss": 0.2888698875904083, "loss_ib": 0.004161924123764038, "step": 298 }, { "ce_ib": 13.56235408782959, "ce_orig": 0.7003698348999023, "epoch": 0.08569990653533684, "kl_loss": 0.22925713658332825, "loss_ib": 0.00364880682900548, "step": 298 }, { "ce_ib": 17.023927688598633, "ce_orig": 0.7627611756324768, "epoch": 0.08569990653533684, "kl_loss": 0.3114122152328491, "loss_ib": 0.004816514905542135, "step": 298 }, { "ce_ib": 12.935884475708008, "ce_orig": 0.5755088329315186, "epoch": 0.08598749011431447, "kl_loss": 0.23949839174747467, "loss_ib": 0.003688572207465768, "step": 299 }, { "ce_ib": 15.182515144348145, "ce_orig": 0.7093390226364136, "epoch": 0.08598749011431447, "kl_loss": 0.254234254360199, "loss_ib": 0.0040605938993394375, "step": 299 }, { "ce_ib": 10.937736511230469, "ce_orig": 0.7415173649787903, "epoch": 0.08598749011431447, "kl_loss": 0.21827897429466248, "loss_ib": 0.003276563249528408, "step": 299 }, { "ce_ib": 14.389042854309082, "ce_orig": 0.6369369029998779, "epoch": 0.08598749011431447, "kl_loss": 0.25055113434791565, "loss_ib": 0.003944415133446455, "step": 299 }, { "epoch": 0.08627507369329211, "grad_norm": 0.08575107157230377, "learning_rate": 4.681528662420383e-05, "loss": 0.8178, "step": 300 }, { "ce_ib": 15.538275718688965, "ce_orig": 0.7116795778274536, "epoch": 0.08627507369329211, "kl_loss": 0.1944524198770523, "loss_ib": 0.0034983514342457056, "step": 300 }, { "ce_ib": 14.46932315826416, "ce_orig": 1.0576528310775757, "epoch": 0.08627507369329211, "kl_loss": 0.1829913854598999, "loss_ib": 0.0032768461387604475, "step": 300 }, { "ce_ib": 12.83568000793457, "ce_orig": 1.0147863626480103, "epoch": 0.08627507369329211, "kl_loss": 0.25184863805770874, "loss_ib": 0.0038020543288439512, "step": 300 }, { "ce_ib": 11.396459579467773, "ce_orig": 0.6744865775108337, "epoch": 0.08627507369329211, "kl_loss": 0.21117661893367767, "loss_ib": 0.003251412184908986, "step": 300 }, { "ce_ib": 17.51881980895996, "ce_orig": 1.0844104290008545, "epoch": 0.08656265727226975, "kl_loss": 0.24072128534317017, "loss_ib": 0.004159094765782356, "step": 301 }, { "ce_ib": 16.883913040161133, "ce_orig": 0.7893635034561157, "epoch": 0.08656265727226975, "kl_loss": 0.21162733435630798, "loss_ib": 0.0038046645931899548, "step": 301 }, { "ce_ib": 20.599260330200195, "ce_orig": 1.6651158332824707, "epoch": 0.08656265727226975, "kl_loss": 0.26889339089393616, "loss_ib": 0.004748859908431768, "step": 301 }, { "ce_ib": 13.75562858581543, "ce_orig": 0.9824258685112, "epoch": 0.08656265727226975, "kl_loss": 0.2234395146369934, "loss_ib": 0.0036099578719586134, "step": 301 }, { "ce_ib": 13.83020305633545, "ce_orig": 0.5410613417625427, "epoch": 0.08685024085124739, "kl_loss": 0.2865542471408844, "loss_ib": 0.0042485627345740795, "step": 302 }, { "ce_ib": 17.551300048828125, "ce_orig": 0.7735820412635803, "epoch": 0.08685024085124739, "kl_loss": 0.25298500061035156, "loss_ib": 0.004284979775547981, "step": 302 }, { "ce_ib": 14.208580017089844, "ce_orig": 0.8505828380584717, "epoch": 0.08685024085124739, "kl_loss": 0.5346580147743225, "loss_ib": 0.006767437793314457, "step": 302 }, { "ce_ib": 19.750244140625, "ce_orig": 1.176154613494873, "epoch": 0.08685024085124739, "kl_loss": 0.2657851576805115, "loss_ib": 0.004632875788956881, "step": 302 }, { "ce_ib": 14.662118911743164, "ce_orig": 1.080672264099121, "epoch": 0.08713782443022504, "kl_loss": 0.18392251431941986, "loss_ib": 0.003305436810478568, "step": 303 }, { "ce_ib": 11.911545753479004, "ce_orig": 0.9907505512237549, "epoch": 0.08713782443022504, "kl_loss": 0.18622635304927826, "loss_ib": 0.0030534181278198957, "step": 303 }, { "ce_ib": 15.689916610717773, "ce_orig": 1.1870077848434448, "epoch": 0.08713782443022504, "kl_loss": 0.39201515913009644, "loss_ib": 0.005489143077284098, "step": 303 }, { "ce_ib": 12.059552192687988, "ce_orig": 0.5444112420082092, "epoch": 0.08713782443022504, "kl_loss": 0.23845581710338593, "loss_ib": 0.0035905134864151478, "step": 303 }, { "ce_ib": 14.907177925109863, "ce_orig": 1.255871295928955, "epoch": 0.08742540800920268, "kl_loss": 0.22089144587516785, "loss_ib": 0.003699632128700614, "step": 304 }, { "ce_ib": 15.632399559020996, "ce_orig": 1.2641204595565796, "epoch": 0.08742540800920268, "kl_loss": 0.18549595773220062, "loss_ib": 0.0034181992523372173, "step": 304 }, { "ce_ib": 11.078656196594238, "ce_orig": 0.4686051607131958, "epoch": 0.08742540800920268, "kl_loss": 0.2145492285490036, "loss_ib": 0.0032533579505980015, "step": 304 }, { "ce_ib": 16.48569107055664, "ce_orig": 1.2514501810073853, "epoch": 0.08742540800920268, "kl_loss": 0.15880295634269714, "loss_ib": 0.0032365985680371523, "step": 304 }, { "epoch": 0.08771299158818031, "grad_norm": 0.08359609544277191, "learning_rate": 4.761146496815287e-05, "loss": 0.8481, "step": 305 }, { "ce_ib": 20.280155181884766, "ce_orig": 1.9041812419891357, "epoch": 0.08771299158818031, "kl_loss": 0.2823646068572998, "loss_ib": 0.004851661156862974, "step": 305 }, { "ce_ib": 8.3218994140625, "ce_orig": 0.7794256806373596, "epoch": 0.08771299158818031, "kl_loss": 0.15604904294013977, "loss_ib": 0.0023926803842186928, "step": 305 }, { "ce_ib": 11.23653793334961, "ce_orig": 0.9274653792381287, "epoch": 0.08771299158818031, "kl_loss": 0.22056221961975098, "loss_ib": 0.0033292758744210005, "step": 305 }, { "ce_ib": 15.99108600616455, "ce_orig": 0.8273392915725708, "epoch": 0.08771299158818031, "kl_loss": 0.287705659866333, "loss_ib": 0.004476164933294058, "step": 305 }, { "ce_ib": 12.447872161865234, "ce_orig": 1.0994980335235596, "epoch": 0.08800057516715795, "kl_loss": 0.1934283971786499, "loss_ib": 0.0031790712382644415, "step": 306 }, { "ce_ib": 13.02301025390625, "ce_orig": 0.9902395009994507, "epoch": 0.08800057516715795, "kl_loss": 0.18311861157417297, "loss_ib": 0.003133486956357956, "step": 306 }, { "ce_ib": 15.912498474121094, "ce_orig": 0.8098648190498352, "epoch": 0.08800057516715795, "kl_loss": 0.302369087934494, "loss_ib": 0.004614940844476223, "step": 306 }, { "ce_ib": 11.363813400268555, "ce_orig": 0.7102072238922119, "epoch": 0.08800057516715795, "kl_loss": 0.21124617755413055, "loss_ib": 0.0032488428987562656, "step": 306 }, { "ce_ib": 19.32331085205078, "ce_orig": 1.889481544494629, "epoch": 0.08828815874613559, "kl_loss": 0.2169814109802246, "loss_ib": 0.004102144856005907, "step": 307 }, { "ce_ib": 12.5094633102417, "ce_orig": 0.49748650193214417, "epoch": 0.08828815874613559, "kl_loss": 0.19575588405132294, "loss_ib": 0.0032085052225738764, "step": 307 }, { "ce_ib": 11.513327598571777, "ce_orig": 0.46595466136932373, "epoch": 0.08828815874613559, "kl_loss": 0.22934874892234802, "loss_ib": 0.0034448199439793825, "step": 307 }, { "ce_ib": 15.249246597290039, "ce_orig": 0.3422534167766571, "epoch": 0.08828815874613559, "kl_loss": 0.20166319608688354, "loss_ib": 0.0035415564198046923, "step": 307 }, { "ce_ib": 17.809545516967773, "ce_orig": 1.352950096130371, "epoch": 0.08857574232511324, "kl_loss": 0.26321953535079956, "loss_ib": 0.004413149785250425, "step": 308 }, { "ce_ib": 17.206872940063477, "ce_orig": 1.341861605644226, "epoch": 0.08857574232511324, "kl_loss": 0.19497671723365784, "loss_ib": 0.003670454490929842, "step": 308 }, { "ce_ib": 15.39387321472168, "ce_orig": 0.6654926538467407, "epoch": 0.08857574232511324, "kl_loss": 0.25926852226257324, "loss_ib": 0.004132072441279888, "step": 308 }, { "ce_ib": 14.418597221374512, "ce_orig": 0.6665434837341309, "epoch": 0.08857574232511324, "kl_loss": 0.23031118512153625, "loss_ib": 0.0037449717056006193, "step": 308 }, { "ce_ib": 14.938549995422363, "ce_orig": 0.7124409079551697, "epoch": 0.08886332590409088, "kl_loss": 0.28744351863861084, "loss_ib": 0.004368290305137634, "step": 309 }, { "ce_ib": 15.685905456542969, "ce_orig": 1.2443615198135376, "epoch": 0.08886332590409088, "kl_loss": 0.29595404863357544, "loss_ib": 0.004528130870312452, "step": 309 }, { "ce_ib": 15.15534496307373, "ce_orig": 1.0202579498291016, "epoch": 0.08886332590409088, "kl_loss": 0.36547189950942993, "loss_ib": 0.005170253571122885, "step": 309 }, { "ce_ib": 16.149023056030273, "ce_orig": 1.1084511280059814, "epoch": 0.08886332590409088, "kl_loss": 0.20774857699871063, "loss_ib": 0.0036923878360539675, "step": 309 }, { "epoch": 0.08915090948306852, "grad_norm": 0.08066050708293915, "learning_rate": 4.840764331210191e-05, "loss": 0.9081, "step": 310 }, { "ce_ib": 11.725279808044434, "ce_orig": 0.6793712973594666, "epoch": 0.08915090948306852, "kl_loss": 0.21743886172771454, "loss_ib": 0.003346916288137436, "step": 310 }, { "ce_ib": 9.597118377685547, "ce_orig": 0.5881115794181824, "epoch": 0.08915090948306852, "kl_loss": 0.20812270045280457, "loss_ib": 0.0030409388709813356, "step": 310 }, { "ce_ib": 17.555280685424805, "ce_orig": 1.6664210557937622, "epoch": 0.08915090948306852, "kl_loss": 0.3189018964767456, "loss_ib": 0.004944546613842249, "step": 310 }, { "ce_ib": 10.35605239868164, "ce_orig": 0.6129300594329834, "epoch": 0.08915090948306852, "kl_loss": 0.19374847412109375, "loss_ib": 0.0029730896931141615, "step": 310 }, { "ce_ib": 10.367539405822754, "ce_orig": 0.27700501680374146, "epoch": 0.08943849306204615, "kl_loss": 0.37522298097610474, "loss_ib": 0.00478898361325264, "step": 311 }, { "ce_ib": 12.798125267028809, "ce_orig": 0.35544443130493164, "epoch": 0.08943849306204615, "kl_loss": 0.21808908879756927, "loss_ib": 0.003460703417658806, "step": 311 }, { "ce_ib": 18.546096801757812, "ce_orig": 1.2737302780151367, "epoch": 0.08943849306204615, "kl_loss": 0.1624414622783661, "loss_ib": 0.003479024162515998, "step": 311 }, { "ce_ib": 19.247314453125, "ce_orig": 1.827391266822815, "epoch": 0.08943849306204615, "kl_loss": 0.24330879747867584, "loss_ib": 0.0043578194454312325, "step": 311 }, { "ce_ib": 12.14682674407959, "ce_orig": 0.4805859923362732, "epoch": 0.08972607664102379, "kl_loss": 0.2552676796913147, "loss_ib": 0.003767359536141157, "step": 312 }, { "ce_ib": 13.024700164794922, "ce_orig": 0.9543373584747314, "epoch": 0.08972607664102379, "kl_loss": 0.2680973708629608, "loss_ib": 0.0039834436029195786, "step": 312 }, { "ce_ib": 15.072936058044434, "ce_orig": 1.2514426708221436, "epoch": 0.08972607664102379, "kl_loss": 0.19017720222473145, "loss_ib": 0.0034090655390173197, "step": 312 }, { "ce_ib": 11.06240177154541, "ce_orig": 0.6679608225822449, "epoch": 0.08972607664102379, "kl_loss": 0.17655614018440247, "loss_ib": 0.0028718013782054186, "step": 312 }, { "ce_ib": 11.684070587158203, "ce_orig": 0.5835570096969604, "epoch": 0.09001366022000144, "kl_loss": 0.18113084137439728, "loss_ib": 0.0029797153547406197, "step": 313 }, { "ce_ib": 15.398133277893066, "ce_orig": 0.5319973230361938, "epoch": 0.09001366022000144, "kl_loss": 0.2180468738079071, "loss_ib": 0.0037202818784862757, "step": 313 }, { "ce_ib": 18.00635528564453, "ce_orig": 1.5159127712249756, "epoch": 0.09001366022000144, "kl_loss": 0.25306442379951477, "loss_ib": 0.004331279546022415, "step": 313 }, { "ce_ib": 16.58292007446289, "ce_orig": 1.6001865863800049, "epoch": 0.09001366022000144, "kl_loss": 0.2032628208398819, "loss_ib": 0.0036909200716763735, "step": 313 }, { "ce_ib": 9.98106575012207, "ce_orig": 0.5567405223846436, "epoch": 0.09030124379897908, "kl_loss": 0.18281474709510803, "loss_ib": 0.002826254116371274, "step": 314 }, { "ce_ib": 14.181166648864746, "ce_orig": 0.7332763075828552, "epoch": 0.09030124379897908, "kl_loss": 0.2009732574224472, "loss_ib": 0.0034278493840247393, "step": 314 }, { "ce_ib": 14.160673141479492, "ce_orig": 1.0669901371002197, "epoch": 0.09030124379897908, "kl_loss": 0.1853453665971756, "loss_ib": 0.0032695208210498095, "step": 314 }, { "ce_ib": 13.65168285369873, "ce_orig": 0.6072067618370056, "epoch": 0.09030124379897908, "kl_loss": 0.2821107506752014, "loss_ib": 0.004186275415122509, "step": 314 }, { "epoch": 0.09058882737795672, "grad_norm": 0.0828433707356453, "learning_rate": 4.920382165605096e-05, "loss": 0.9224, "step": 315 }, { "ce_ib": 17.264680862426758, "ce_orig": 1.208104133605957, "epoch": 0.09058882737795672, "kl_loss": 0.2404087483882904, "loss_ib": 0.0041305553168058395, "step": 315 }, { "ce_ib": 9.675837516784668, "ce_orig": 0.6803741455078125, "epoch": 0.09058882737795672, "kl_loss": 0.17154952883720398, "loss_ib": 0.002683078870177269, "step": 315 }, { "ce_ib": 7.8654890060424805, "ce_orig": 0.27281931042671204, "epoch": 0.09058882737795672, "kl_loss": 0.3646223545074463, "loss_ib": 0.004432772286236286, "step": 315 }, { "ce_ib": 10.074167251586914, "ce_orig": 0.7812896370887756, "epoch": 0.09058882737795672, "kl_loss": 0.1766500473022461, "loss_ib": 0.002773917280137539, "step": 315 }, { "ce_ib": 9.807964324951172, "ce_orig": 0.7548955082893372, "epoch": 0.09087641095693436, "kl_loss": 0.15925069153308868, "loss_ib": 0.0025733031798154116, "step": 316 }, { "ce_ib": 12.453634262084961, "ce_orig": 0.3912903964519501, "epoch": 0.09087641095693436, "kl_loss": 0.28723639249801636, "loss_ib": 0.004117727279663086, "step": 316 }, { "ce_ib": 15.324727058410645, "ce_orig": 0.6814879179000854, "epoch": 0.09087641095693436, "kl_loss": 0.2591487467288971, "loss_ib": 0.0041239601559937, "step": 316 }, { "ce_ib": 14.351997375488281, "ce_orig": 1.1507986783981323, "epoch": 0.09087641095693436, "kl_loss": 0.1707887053489685, "loss_ib": 0.003143086563795805, "step": 316 }, { "ce_ib": 11.927781105041504, "ce_orig": 0.5891753435134888, "epoch": 0.091163994535912, "kl_loss": 0.2667624056339264, "loss_ib": 0.0038604019209742546, "step": 317 }, { "ce_ib": 13.470232009887695, "ce_orig": 0.6153560280799866, "epoch": 0.091163994535912, "kl_loss": 0.14252835512161255, "loss_ib": 0.002772306790575385, "step": 317 }, { "ce_ib": 14.50222396850586, "ce_orig": 0.888332724571228, "epoch": 0.091163994535912, "kl_loss": 0.16025802493095398, "loss_ib": 0.003052802523598075, "step": 317 }, { "ce_ib": 16.769819259643555, "ce_orig": 1.285980463027954, "epoch": 0.091163994535912, "kl_loss": 0.21203196048736572, "loss_ib": 0.003797301556915045, "step": 317 }, { "ce_ib": 18.3016414642334, "ce_orig": 0.6251075863838196, "epoch": 0.09145157811488965, "kl_loss": 0.22406277060508728, "loss_ib": 0.00407079141587019, "step": 318 }, { "ce_ib": 13.008817672729492, "ce_orig": 0.5530975461006165, "epoch": 0.09145157811488965, "kl_loss": 0.20128408074378967, "loss_ib": 0.0033137225545942783, "step": 318 }, { "ce_ib": 16.728418350219727, "ce_orig": 1.2118330001831055, "epoch": 0.09145157811488965, "kl_loss": 0.23463211953639984, "loss_ib": 0.004019163083285093, "step": 318 }, { "ce_ib": 11.389937400817871, "ce_orig": 0.665806770324707, "epoch": 0.09145157811488965, "kl_loss": 0.44625556468963623, "loss_ib": 0.005601549055427313, "step": 318 }, { "ce_ib": 17.052478790283203, "ce_orig": 1.3070660829544067, "epoch": 0.09173916169386728, "kl_loss": 0.22904498875141144, "loss_ib": 0.003995697479695082, "step": 319 }, { "ce_ib": 16.69203758239746, "ce_orig": 0.9425002336502075, "epoch": 0.09173916169386728, "kl_loss": 0.4092777371406555, "loss_ib": 0.005761981010437012, "step": 319 }, { "ce_ib": 9.762811660766602, "ce_orig": 0.8007186651229858, "epoch": 0.09173916169386728, "kl_loss": 0.19042058289051056, "loss_ib": 0.0028804868925362825, "step": 319 }, { "ce_ib": 15.089471817016602, "ce_orig": 0.9387741088867188, "epoch": 0.09173916169386728, "kl_loss": 0.1873193383216858, "loss_ib": 0.0033821403048932552, "step": 319 }, { "epoch": 0.09202674527284492, "grad_norm": 0.09044753015041351, "learning_rate": 5e-05, "loss": 0.8929, "step": 320 }, { "ce_ib": 8.850724220275879, "ce_orig": 0.6556456089019775, "epoch": 0.09202674527284492, "kl_loss": 0.12834425270557404, "loss_ib": 0.002168514998629689, "step": 320 }, { "ce_ib": 14.284525871276855, "ce_orig": 1.2114744186401367, "epoch": 0.09202674527284492, "kl_loss": 0.2224428355693817, "loss_ib": 0.0036528806667774916, "step": 320 }, { "ce_ib": 16.129127502441406, "ce_orig": 0.861198902130127, "epoch": 0.09202674527284492, "kl_loss": 0.1843017041683197, "loss_ib": 0.0034559296909719706, "step": 320 }, { "ce_ib": 13.054864883422852, "ce_orig": 0.7228923439979553, "epoch": 0.09202674527284492, "kl_loss": 0.20991846919059753, "loss_ib": 0.003404670860618353, "step": 320 }, { "ce_ib": 14.091462135314941, "ce_orig": 0.6277745962142944, "epoch": 0.09231432885182256, "kl_loss": 0.29013434052467346, "loss_ib": 0.004310489632189274, "step": 321 }, { "ce_ib": 11.505946159362793, "ce_orig": 0.8680534958839417, "epoch": 0.09231432885182256, "kl_loss": 0.19910269975662231, "loss_ib": 0.003141621593385935, "step": 321 }, { "ce_ib": 15.06042194366455, "ce_orig": 1.2571470737457275, "epoch": 0.09231432885182256, "kl_loss": 0.18096956610679626, "loss_ib": 0.0033157377038151026, "step": 321 }, { "ce_ib": 14.149365425109863, "ce_orig": 0.4702112078666687, "epoch": 0.09231432885182256, "kl_loss": 0.24852751195430756, "loss_ib": 0.0039002113044261932, "step": 321 }, { "ce_ib": 21.1373348236084, "ce_orig": 1.5176701545715332, "epoch": 0.0926019124308002, "kl_loss": 0.2831588089466095, "loss_ib": 0.004945321474224329, "step": 322 }, { "ce_ib": 14.581371307373047, "ce_orig": 0.9066507816314697, "epoch": 0.0926019124308002, "kl_loss": 0.4094810485839844, "loss_ib": 0.005552947521209717, "step": 322 }, { "ce_ib": 9.24908447265625, "ce_orig": 0.6094862818717957, "epoch": 0.0926019124308002, "kl_loss": 0.16086669266223907, "loss_ib": 0.002533575287088752, "step": 322 }, { "ce_ib": 12.565040588378906, "ce_orig": 0.8015382289886475, "epoch": 0.0926019124308002, "kl_loss": 0.27496886253356934, "loss_ib": 0.0040061925537884235, "step": 322 }, { "ce_ib": 11.96411418914795, "ce_orig": 0.6789979934692383, "epoch": 0.09288949600977785, "kl_loss": 0.14112810790538788, "loss_ib": 0.0026076924987137318, "step": 323 }, { "ce_ib": 14.88967227935791, "ce_orig": 0.8319886326789856, "epoch": 0.09288949600977785, "kl_loss": 0.2537601888179779, "loss_ib": 0.004026568960398436, "step": 323 }, { "ce_ib": 10.79393482208252, "ce_orig": 0.5163490176200867, "epoch": 0.09288949600977785, "kl_loss": 0.1722070872783661, "loss_ib": 0.002801464172080159, "step": 323 }, { "ce_ib": 10.035134315490723, "ce_orig": 0.5581719875335693, "epoch": 0.09288949600977785, "kl_loss": 0.2455272376537323, "loss_ib": 0.003458785591647029, "step": 323 }, { "ce_ib": 15.038890838623047, "ce_orig": 1.1411057710647583, "epoch": 0.09317707958875548, "kl_loss": 0.2383771389722824, "loss_ib": 0.0038876603357493877, "step": 324 }, { "ce_ib": 11.690932273864746, "ce_orig": 0.6252244114875793, "epoch": 0.09317707958875548, "kl_loss": 0.1746075451374054, "loss_ib": 0.002915168646723032, "step": 324 }, { "ce_ib": 14.972967147827148, "ce_orig": 1.1634771823883057, "epoch": 0.09317707958875548, "kl_loss": 0.24864430725574493, "loss_ib": 0.003983739297837019, "step": 324 }, { "ce_ib": 13.491129875183105, "ce_orig": 0.9431242346763611, "epoch": 0.09317707958875548, "kl_loss": 0.19168300926685333, "loss_ib": 0.0032659429125487804, "step": 324 }, { "epoch": 0.09346466316773312, "grad_norm": 0.07285797595977783, "learning_rate": 4.999996988459869e-05, "loss": 0.9029, "step": 325 }, { "ce_ib": 10.874665260314941, "ce_orig": 0.8838172554969788, "epoch": 0.09346466316773312, "kl_loss": 0.21639001369476318, "loss_ib": 0.00325136655010283, "step": 325 }, { "ce_ib": 12.071526527404785, "ce_orig": 0.715691089630127, "epoch": 0.09346466316773312, "kl_loss": 0.17473536729812622, "loss_ib": 0.002954506315290928, "step": 325 }, { "ce_ib": 9.097990036010742, "ce_orig": 0.6916231513023376, "epoch": 0.09346466316773312, "kl_loss": 0.14074796438217163, "loss_ib": 0.0023172786459326744, "step": 325 }, { "ce_ib": 7.898350238800049, "ce_orig": 0.7045942544937134, "epoch": 0.09346466316773312, "kl_loss": 0.19722947478294373, "loss_ib": 0.0027621297631412745, "step": 325 }, { "ce_ib": 19.925533294677734, "ce_orig": 1.8780890703201294, "epoch": 0.09375224674671076, "kl_loss": 0.29034847021102905, "loss_ib": 0.004896038211882114, "step": 326 }, { "ce_ib": 11.936103820800781, "ce_orig": 0.8948700428009033, "epoch": 0.09375224674671076, "kl_loss": 0.22047904133796692, "loss_ib": 0.003398400731384754, "step": 326 }, { "ce_ib": 14.651416778564453, "ce_orig": 1.5577762126922607, "epoch": 0.09375224674671076, "kl_loss": 0.2572871744632721, "loss_ib": 0.004038013052195311, "step": 326 }, { "ce_ib": 14.2105073928833, "ce_orig": 0.6887364983558655, "epoch": 0.09375224674671076, "kl_loss": 0.1484694480895996, "loss_ib": 0.0029057450592517853, "step": 326 }, { "ce_ib": 9.847541809082031, "ce_orig": 0.7175891995429993, "epoch": 0.0940398303256884, "kl_loss": 0.251788467168808, "loss_ib": 0.003502638777717948, "step": 327 }, { "ce_ib": 8.781983375549316, "ce_orig": 0.6928913593292236, "epoch": 0.0940398303256884, "kl_loss": 0.1348564177751541, "loss_ib": 0.0022267624735832214, "step": 327 }, { "ce_ib": 11.540362358093262, "ce_orig": 0.7704603672027588, "epoch": 0.0940398303256884, "kl_loss": 0.16489502787590027, "loss_ib": 0.002802986418828368, "step": 327 }, { "ce_ib": 13.85096263885498, "ce_orig": 0.8789340853691101, "epoch": 0.0940398303256884, "kl_loss": 0.17469263076782227, "loss_ib": 0.003132022451609373, "step": 327 }, { "ce_ib": 9.01992130279541, "ce_orig": 0.39120611548423767, "epoch": 0.09432741390466605, "kl_loss": 0.17137807607650757, "loss_ib": 0.0026157726533710957, "step": 328 }, { "ce_ib": 12.827068328857422, "ce_orig": 0.6231464147567749, "epoch": 0.09432741390466605, "kl_loss": 0.24973925948143005, "loss_ib": 0.003780099330469966, "step": 328 }, { "ce_ib": 13.935663223266602, "ce_orig": 0.9439969062805176, "epoch": 0.09432741390466605, "kl_loss": 0.2583736777305603, "loss_ib": 0.003977302927523851, "step": 328 }, { "ce_ib": 15.863046646118164, "ce_orig": 1.0275061130523682, "epoch": 0.09432741390466605, "kl_loss": 0.22072093188762665, "loss_ib": 0.00379351363517344, "step": 328 }, { "ce_ib": 16.495813369750977, "ce_orig": 1.1426280736923218, "epoch": 0.09461499748364369, "kl_loss": 0.1818699985742569, "loss_ib": 0.0034682813566178083, "step": 329 }, { "ce_ib": 12.4020357131958, "ce_orig": 0.8381017446517944, "epoch": 0.09461499748364369, "kl_loss": 0.16994866728782654, "loss_ib": 0.0029396903701126575, "step": 329 }, { "ce_ib": 10.978039741516113, "ce_orig": 0.6018507480621338, "epoch": 0.09461499748364369, "kl_loss": 0.1774011105298996, "loss_ib": 0.0028718148823827505, "step": 329 }, { "ce_ib": 13.26439380645752, "ce_orig": 0.8519594669342041, "epoch": 0.09461499748364369, "kl_loss": 0.1966477632522583, "loss_ib": 0.003292917041108012, "step": 329 }, { "epoch": 0.09490258106262132, "grad_norm": 0.08392878621816635, "learning_rate": 4.9999879538467306e-05, "loss": 0.9175, "step": 330 }, { "ce_ib": 14.5608549118042, "ce_orig": 1.4586288928985596, "epoch": 0.09490258106262132, "kl_loss": 0.220241978764534, "loss_ib": 0.0036585049238055944, "step": 330 }, { "ce_ib": 16.367464065551758, "ce_orig": 0.7915551662445068, "epoch": 0.09490258106262132, "kl_loss": 0.22915303707122803, "loss_ib": 0.003928276710212231, "step": 330 }, { "ce_ib": 13.064582824707031, "ce_orig": 0.6998893618583679, "epoch": 0.09490258106262132, "kl_loss": 0.38041651248931885, "loss_ib": 0.005110623314976692, "step": 330 }, { "ce_ib": 11.392269134521484, "ce_orig": 0.36753031611442566, "epoch": 0.09490258106262132, "kl_loss": 0.4851597547531128, "loss_ib": 0.0059908246621489525, "step": 330 }, { "ce_ib": 12.86525821685791, "ce_orig": 0.7186346054077148, "epoch": 0.09519016464159896, "kl_loss": 0.15524542331695557, "loss_ib": 0.0028389799408614635, "step": 331 }, { "ce_ib": 14.1820707321167, "ce_orig": 0.8073091506958008, "epoch": 0.09519016464159896, "kl_loss": 0.22929759323596954, "loss_ib": 0.003711183089762926, "step": 331 }, { "ce_ib": 12.15315055847168, "ce_orig": 0.5545368194580078, "epoch": 0.09519016464159896, "kl_loss": 0.22285009920597076, "loss_ib": 0.003443815978243947, "step": 331 }, { "ce_ib": 12.464353561401367, "ce_orig": 0.864552915096283, "epoch": 0.09519016464159896, "kl_loss": 0.2674625515937805, "loss_ib": 0.00392106082290411, "step": 331 }, { "ce_ib": 8.458319664001465, "ce_orig": 0.49817538261413574, "epoch": 0.0954777482205766, "kl_loss": 0.20442625880241394, "loss_ib": 0.002890094416216016, "step": 332 }, { "ce_ib": 15.385281562805176, "ce_orig": 1.422017216682434, "epoch": 0.0954777482205766, "kl_loss": 0.25458666682243347, "loss_ib": 0.004084394313395023, "step": 332 }, { "ce_ib": 13.032305717468262, "ce_orig": 0.5466614365577698, "epoch": 0.0954777482205766, "kl_loss": 0.2672412097454071, "loss_ib": 0.003975642379373312, "step": 332 }, { "ce_ib": 12.244396209716797, "ce_orig": 0.4979858100414276, "epoch": 0.0954777482205766, "kl_loss": 0.1899423450231552, "loss_ib": 0.0031238629017025232, "step": 332 }, { "ce_ib": 9.587015151977539, "ce_orig": 0.3958915174007416, "epoch": 0.09576533179955425, "kl_loss": 0.31766587495803833, "loss_ib": 0.004135360009968281, "step": 333 }, { "ce_ib": 16.561017990112305, "ce_orig": 1.007829189300537, "epoch": 0.09576533179955425, "kl_loss": 0.20323669910430908, "loss_ib": 0.0036884688306599855, "step": 333 }, { "ce_ib": 13.782530784606934, "ce_orig": 0.8161399960517883, "epoch": 0.09576533179955425, "kl_loss": 0.2164289653301239, "loss_ib": 0.00354254269041121, "step": 333 }, { "ce_ib": 9.973050117492676, "ce_orig": 0.6706444025039673, "epoch": 0.09576533179955425, "kl_loss": 0.20162354409694672, "loss_ib": 0.0030135405249893665, "step": 333 }, { "ce_ib": 12.195393562316895, "ce_orig": 0.613254964351654, "epoch": 0.09605291537853189, "kl_loss": 0.2231156826019287, "loss_ib": 0.003450696123763919, "step": 334 }, { "ce_ib": 8.084924697875977, "ce_orig": 0.27541494369506836, "epoch": 0.09605291537853189, "kl_loss": 0.5247204303741455, "loss_ib": 0.006055696401745081, "step": 334 }, { "ce_ib": 11.561151504516602, "ce_orig": 0.5130017995834351, "epoch": 0.09605291537853189, "kl_loss": 0.15488451719284058, "loss_ib": 0.0027049602940678596, "step": 334 }, { "ce_ib": 12.512232780456543, "ce_orig": 0.6367411613464355, "epoch": 0.09605291537853189, "kl_loss": 0.2246486246585846, "loss_ib": 0.003497709520161152, "step": 334 }, { "epoch": 0.09634049895750953, "grad_norm": 0.07655756175518036, "learning_rate": 4.999972896182352e-05, "loss": 0.8394, "step": 335 }, { "ce_ib": 12.717463493347168, "ce_orig": 0.9400395750999451, "epoch": 0.09634049895750953, "kl_loss": 0.17612457275390625, "loss_ib": 0.0030329918954521418, "step": 335 }, { "ce_ib": 12.413676261901855, "ce_orig": 0.973748505115509, "epoch": 0.09634049895750953, "kl_loss": 0.24444803595542908, "loss_ib": 0.0036858480889350176, "step": 335 }, { "ce_ib": 14.029793739318848, "ce_orig": 0.7324392795562744, "epoch": 0.09634049895750953, "kl_loss": 0.18520355224609375, "loss_ib": 0.003255015006288886, "step": 335 }, { "ce_ib": 15.990370750427246, "ce_orig": 0.6844960451126099, "epoch": 0.09634049895750953, "kl_loss": 0.27585840225219727, "loss_ib": 0.004357621073722839, "step": 335 }, { "ce_ib": 14.750761985778809, "ce_orig": 1.194319725036621, "epoch": 0.09662808253648716, "kl_loss": 0.67383873462677, "loss_ib": 0.008213463239371777, "step": 336 }, { "ce_ib": 17.5143985748291, "ce_orig": 1.5835182666778564, "epoch": 0.09662808253648716, "kl_loss": 0.2557618021965027, "loss_ib": 0.0043090577237308025, "step": 336 }, { "ce_ib": 17.389286041259766, "ce_orig": 1.3591183423995972, "epoch": 0.09662808253648716, "kl_loss": 0.27419230341911316, "loss_ib": 0.004480851348489523, "step": 336 }, { "ce_ib": 9.241145133972168, "ce_orig": 0.607307493686676, "epoch": 0.09662808253648716, "kl_loss": 0.11753670126199722, "loss_ib": 0.002099481411278248, "step": 336 }, { "ce_ib": 15.914252281188965, "ce_orig": 1.711224913597107, "epoch": 0.0969156661154648, "kl_loss": 0.2505919933319092, "loss_ib": 0.004097345285117626, "step": 337 }, { "ce_ib": 14.283632278442383, "ce_orig": 0.9926325082778931, "epoch": 0.0969156661154648, "kl_loss": 0.22402063012123108, "loss_ib": 0.0036685692612081766, "step": 337 }, { "ce_ib": 16.994945526123047, "ce_orig": 0.8979167938232422, "epoch": 0.0969156661154648, "kl_loss": 0.22958716750144958, "loss_ib": 0.003995365928858519, "step": 337 }, { "ce_ib": 15.639780044555664, "ce_orig": 0.5237170457839966, "epoch": 0.0969156661154648, "kl_loss": 0.2666119337081909, "loss_ib": 0.004230096936225891, "step": 337 }, { "ce_ib": 18.789344787597656, "ce_orig": 1.6600208282470703, "epoch": 0.09720324969444245, "kl_loss": 0.2622734010219574, "loss_ib": 0.004501668270677328, "step": 338 }, { "ce_ib": 14.16718578338623, "ce_orig": 0.8235701322555542, "epoch": 0.09720324969444245, "kl_loss": 0.1999812126159668, "loss_ib": 0.0034165303222835064, "step": 338 }, { "ce_ib": 15.722373008728027, "ce_orig": 0.8121756315231323, "epoch": 0.09720324969444245, "kl_loss": 0.17169177532196045, "loss_ib": 0.003289154963567853, "step": 338 }, { "ce_ib": 12.625021934509277, "ce_orig": 0.4633500277996063, "epoch": 0.09720324969444245, "kl_loss": 0.17351466417312622, "loss_ib": 0.0029976486694067717, "step": 338 }, { "ce_ib": 14.416272163391113, "ce_orig": 0.5611670613288879, "epoch": 0.09749083327342009, "kl_loss": 0.29108044505119324, "loss_ib": 0.004352431278675795, "step": 339 }, { "ce_ib": 10.808735847473145, "ce_orig": 0.768107533454895, "epoch": 0.09749083327342009, "kl_loss": 0.22904689610004425, "loss_ib": 0.0033713423181325197, "step": 339 }, { "ce_ib": 17.312829971313477, "ce_orig": 1.2763899564743042, "epoch": 0.09749083327342009, "kl_loss": 0.19993865489959717, "loss_ib": 0.003730669617652893, "step": 339 }, { "ce_ib": 17.75509262084961, "ce_orig": 1.1115076541900635, "epoch": 0.09749083327342009, "kl_loss": 0.26826444268226624, "loss_ib": 0.004458153620362282, "step": 339 }, { "epoch": 0.09777841685239773, "grad_norm": 0.07021026313304901, "learning_rate": 4.999951815503011e-05, "loss": 0.8976, "step": 340 }, { "ce_ib": 7.319950103759766, "ce_orig": 0.25490763783454895, "epoch": 0.09777841685239773, "kl_loss": 0.4792310297489166, "loss_ib": 0.005524305161088705, "step": 340 }, { "ce_ib": 14.642142295837402, "ce_orig": 0.5069236755371094, "epoch": 0.09777841685239773, "kl_loss": 0.23783719539642334, "loss_ib": 0.003842586185783148, "step": 340 }, { "ce_ib": 9.56615924835205, "ce_orig": 0.686457633972168, "epoch": 0.09777841685239773, "kl_loss": 0.14670798182487488, "loss_ib": 0.002423695521429181, "step": 340 }, { "ce_ib": 15.014992713928223, "ce_orig": 0.9454907178878784, "epoch": 0.09777841685239773, "kl_loss": 0.18971547484397888, "loss_ib": 0.003398653818294406, "step": 340 }, { "ce_ib": 13.204034805297852, "ce_orig": 0.6687142252922058, "epoch": 0.09806600043137537, "kl_loss": 0.286098837852478, "loss_ib": 0.004181392025202513, "step": 341 }, { "ce_ib": 15.514037132263184, "ce_orig": 0.5012982487678528, "epoch": 0.09806600043137537, "kl_loss": 0.2910040020942688, "loss_ib": 0.004461443517357111, "step": 341 }, { "ce_ib": 12.121696472167969, "ce_orig": 0.6653417348861694, "epoch": 0.09806600043137537, "kl_loss": 0.24229881167411804, "loss_ib": 0.003635157598182559, "step": 341 }, { "ce_ib": 20.12578773498535, "ce_orig": 0.7655023336410522, "epoch": 0.09806600043137537, "kl_loss": 0.22568227350711823, "loss_ib": 0.004269401542842388, "step": 341 }, { "ce_ib": 9.653379440307617, "ce_orig": 0.7402390837669373, "epoch": 0.098353584010353, "kl_loss": 0.1966065615415573, "loss_ib": 0.002931403461843729, "step": 342 }, { "ce_ib": 12.452383995056152, "ce_orig": 0.8609440326690674, "epoch": 0.098353584010353, "kl_loss": 0.14747576415538788, "loss_ib": 0.0027199957985430956, "step": 342 }, { "ce_ib": 11.025045394897461, "ce_orig": 0.6533346772193909, "epoch": 0.098353584010353, "kl_loss": 0.16730177402496338, "loss_ib": 0.002775522181764245, "step": 342 }, { "ce_ib": 16.325525283813477, "ce_orig": 1.0561354160308838, "epoch": 0.098353584010353, "kl_loss": 0.18068361282348633, "loss_ib": 0.003439388470724225, "step": 342 }, { "ce_ib": 17.46106719970703, "ce_orig": 1.6512928009033203, "epoch": 0.09864116758933066, "kl_loss": 0.4481199383735657, "loss_ib": 0.006227306090295315, "step": 343 }, { "ce_ib": 16.864215850830078, "ce_orig": 1.4105547666549683, "epoch": 0.09864116758933066, "kl_loss": 0.22357934713363647, "loss_ib": 0.003922215197235346, "step": 343 }, { "ce_ib": 9.996209144592285, "ce_orig": 0.7162432670593262, "epoch": 0.09864116758933066, "kl_loss": 0.1958695501089096, "loss_ib": 0.00295831635594368, "step": 343 }, { "ce_ib": 8.547676086425781, "ce_orig": 0.41816598176956177, "epoch": 0.09864116758933066, "kl_loss": 0.1747799813747406, "loss_ib": 0.002602567430585623, "step": 343 }, { "ce_ib": 12.569132804870605, "ce_orig": 0.5451200008392334, "epoch": 0.0989287511683083, "kl_loss": 0.22563554346561432, "loss_ib": 0.0035132686607539654, "step": 344 }, { "ce_ib": 12.415586471557617, "ce_orig": 0.7706530690193176, "epoch": 0.0989287511683083, "kl_loss": 0.1709377020597458, "loss_ib": 0.002950935624539852, "step": 344 }, { "ce_ib": 19.655101776123047, "ce_orig": 1.3017544746398926, "epoch": 0.0989287511683083, "kl_loss": 0.29058775305747986, "loss_ib": 0.004871387500315905, "step": 344 }, { "ce_ib": 17.928071975708008, "ce_orig": 1.330518126487732, "epoch": 0.0989287511683083, "kl_loss": 0.23996703326702118, "loss_ib": 0.004192477557808161, "step": 344 }, { "epoch": 0.09921633474728593, "grad_norm": 0.0755721926689148, "learning_rate": 4.999924711859495e-05, "loss": 0.8515, "step": 345 }, { "ce_ib": 14.76935863494873, "ce_orig": 1.2034357786178589, "epoch": 0.09921633474728593, "kl_loss": 0.22408181428909302, "loss_ib": 0.003717753803357482, "step": 345 }, { "ce_ib": 11.515120506286621, "ce_orig": 0.7314639687538147, "epoch": 0.09921633474728593, "kl_loss": 0.19642382860183716, "loss_ib": 0.003115750150755048, "step": 345 }, { "ce_ib": 11.988049507141113, "ce_orig": 0.5762550830841064, "epoch": 0.09921633474728593, "kl_loss": 0.25246232748031616, "loss_ib": 0.0037234281189739704, "step": 345 }, { "ce_ib": 13.44121265411377, "ce_orig": 0.9119555950164795, "epoch": 0.09921633474728593, "kl_loss": 0.19339382648468018, "loss_ib": 0.003278059186413884, "step": 345 }, { "ce_ib": 16.88981819152832, "ce_orig": 1.815802812576294, "epoch": 0.09950391832626357, "kl_loss": 0.22369977831840515, "loss_ib": 0.003925979603081942, "step": 346 }, { "ce_ib": 11.10827350616455, "ce_orig": 0.8919088244438171, "epoch": 0.09950391832626357, "kl_loss": 0.20008933544158936, "loss_ib": 0.0031117205508053303, "step": 346 }, { "ce_ib": 16.906099319458008, "ce_orig": 1.4990653991699219, "epoch": 0.09950391832626357, "kl_loss": 0.19835729897022247, "loss_ib": 0.0036741828080266714, "step": 346 }, { "ce_ib": 8.436453819274902, "ce_orig": 0.6757850050926208, "epoch": 0.09950391832626357, "kl_loss": 0.16680480539798737, "loss_ib": 0.00251169316470623, "step": 346 }, { "ce_ib": 9.981969833374023, "ce_orig": 0.7898837327957153, "epoch": 0.0997915019052412, "kl_loss": 0.13752737641334534, "loss_ib": 0.0023734706919640303, "step": 347 }, { "ce_ib": 12.792706489562988, "ce_orig": 0.8162432909011841, "epoch": 0.0997915019052412, "kl_loss": 0.14307913184165955, "loss_ib": 0.0027100618463009596, "step": 347 }, { "ce_ib": 12.92000675201416, "ce_orig": 1.0188729763031006, "epoch": 0.0997915019052412, "kl_loss": 0.18868780136108398, "loss_ib": 0.0031788786873221397, "step": 347 }, { "ce_ib": 17.870426177978516, "ce_orig": 1.1175206899642944, "epoch": 0.0997915019052412, "kl_loss": 0.2027907520532608, "loss_ib": 0.0038149498868733644, "step": 347 }, { "ce_ib": 15.885435104370117, "ce_orig": 0.41733163595199585, "epoch": 0.10007908548421886, "kl_loss": 0.20918244123458862, "loss_ib": 0.0036803679540753365, "step": 348 }, { "ce_ib": 12.231342315673828, "ce_orig": 0.48961135745048523, "epoch": 0.10007908548421886, "kl_loss": 0.20116449892520905, "loss_ib": 0.003234779229387641, "step": 348 }, { "ce_ib": 9.306249618530273, "ce_orig": 0.6630443334579468, "epoch": 0.10007908548421886, "kl_loss": 0.1751163899898529, "loss_ib": 0.002681788755580783, "step": 348 }, { "ce_ib": 11.609100341796875, "ce_orig": 0.879733145236969, "epoch": 0.10007908548421886, "kl_loss": 0.41010767221450806, "loss_ib": 0.005261986516416073, "step": 348 }, { "ce_ib": 10.676206588745117, "ce_orig": 0.6579650640487671, "epoch": 0.1003666690631965, "kl_loss": 0.2183065414428711, "loss_ib": 0.003250685753300786, "step": 349 }, { "ce_ib": 11.89196491241455, "ce_orig": 0.8634635806083679, "epoch": 0.1003666690631965, "kl_loss": 0.21364440023899078, "loss_ib": 0.003325640456750989, "step": 349 }, { "ce_ib": 17.328413009643555, "ce_orig": 0.9897369146347046, "epoch": 0.1003666690631965, "kl_loss": 0.27497774362564087, "loss_ib": 0.004482618533074856, "step": 349 }, { "ce_ib": 15.745963096618652, "ce_orig": 1.2580201625823975, "epoch": 0.1003666690631965, "kl_loss": 0.24680611491203308, "loss_ib": 0.004042657557874918, "step": 349 }, { "epoch": 0.10065425264217413, "grad_norm": 0.0724608451128006, "learning_rate": 4.999891585317103e-05, "loss": 0.857, "step": 350 }, { "ce_ib": 15.896184921264648, "ce_orig": 0.8773839473724365, "epoch": 0.10065425264217413, "kl_loss": 0.25826671719551086, "loss_ib": 0.004172285553067923, "step": 350 }, { "ce_ib": 10.407938003540039, "ce_orig": 0.7755264639854431, "epoch": 0.10065425264217413, "kl_loss": 0.13498742878437042, "loss_ib": 0.0023906680289655924, "step": 350 }, { "ce_ib": 15.827054023742676, "ce_orig": 1.3559359312057495, "epoch": 0.10065425264217413, "kl_loss": 0.21587374806404114, "loss_ib": 0.0037414426915347576, "step": 350 }, { "ce_ib": 12.431255340576172, "ce_orig": 1.0548380613327026, "epoch": 0.10065425264217413, "kl_loss": 0.17993846535682678, "loss_ib": 0.003042510012164712, "step": 350 }, { "ce_ib": 11.040481567382812, "ce_orig": 0.8403714895248413, "epoch": 0.10094183622115177, "kl_loss": 0.1840890645980835, "loss_ib": 0.002944938838481903, "step": 351 }, { "ce_ib": 15.373204231262207, "ce_orig": 1.075166940689087, "epoch": 0.10094183622115177, "kl_loss": 0.18732014298439026, "loss_ib": 0.003410521661862731, "step": 351 }, { "ce_ib": 12.945959091186523, "ce_orig": 0.897395133972168, "epoch": 0.10094183622115177, "kl_loss": 0.1956326961517334, "loss_ib": 0.0032509227748960257, "step": 351 }, { "ce_ib": 6.2110090255737305, "ce_orig": 0.1484360694885254, "epoch": 0.10094183622115177, "kl_loss": 0.3617279529571533, "loss_ib": 0.0042383805848658085, "step": 351 }, { "ce_ib": 12.221625328063965, "ce_orig": 0.7823323607444763, "epoch": 0.10122941980012941, "kl_loss": 0.18742753565311432, "loss_ib": 0.003096437780186534, "step": 352 }, { "ce_ib": 13.974717140197754, "ce_orig": 0.5945900082588196, "epoch": 0.10122941980012941, "kl_loss": 0.149112731218338, "loss_ib": 0.002888598944991827, "step": 352 }, { "ce_ib": 14.455492973327637, "ce_orig": 0.8753033876419067, "epoch": 0.10122941980012941, "kl_loss": 0.28339695930480957, "loss_ib": 0.004279518499970436, "step": 352 }, { "ce_ib": 12.000777244567871, "ce_orig": 0.676581859588623, "epoch": 0.10122941980012941, "kl_loss": 0.24054169654846191, "loss_ib": 0.0036054945085197687, "step": 352 }, { "ce_ib": 10.058462142944336, "ce_orig": 0.9673516154289246, "epoch": 0.10151700337910706, "kl_loss": 0.18438181281089783, "loss_ib": 0.002849664306268096, "step": 353 }, { "ce_ib": 14.86198616027832, "ce_orig": 0.6923442482948303, "epoch": 0.10151700337910706, "kl_loss": 0.3370734453201294, "loss_ib": 0.004856932908296585, "step": 353 }, { "ce_ib": 16.324743270874023, "ce_orig": 1.7405447959899902, "epoch": 0.10151700337910706, "kl_loss": 0.1804196834564209, "loss_ib": 0.0034366711042821407, "step": 353 }, { "ce_ib": 10.453534126281738, "ce_orig": 0.6495627164840698, "epoch": 0.10151700337910706, "kl_loss": 0.18358883261680603, "loss_ib": 0.0028812417294830084, "step": 353 }, { "ce_ib": 10.957155227661133, "ce_orig": 0.9104872941970825, "epoch": 0.1018045869580847, "kl_loss": 0.18098904192447662, "loss_ib": 0.002905606059357524, "step": 354 }, { "ce_ib": 12.083660125732422, "ce_orig": 0.5857529640197754, "epoch": 0.1018045869580847, "kl_loss": 0.2257942408323288, "loss_ib": 0.0034663083497434855, "step": 354 }, { "ce_ib": 14.075161933898926, "ce_orig": 0.827916145324707, "epoch": 0.1018045869580847, "kl_loss": 0.22436052560806274, "loss_ib": 0.0036511211656033993, "step": 354 }, { "ce_ib": 9.636879920959473, "ce_orig": 0.3787972331047058, "epoch": 0.1018045869580847, "kl_loss": 0.4520171582698822, "loss_ib": 0.005483859684318304, "step": 354 }, { "epoch": 0.10209217053706234, "grad_norm": 0.07327523827552795, "learning_rate": 4.9998524359556445e-05, "loss": 0.8569, "step": 355 }, { "ce_ib": 14.932779312133789, "ce_orig": 0.9075332880020142, "epoch": 0.10209217053706234, "kl_loss": 0.2982865273952484, "loss_ib": 0.004476143047213554, "step": 355 }, { "ce_ib": 14.173552513122559, "ce_orig": 0.8084387183189392, "epoch": 0.10209217053706234, "kl_loss": 0.33803728222846985, "loss_ib": 0.0047977278009057045, "step": 355 }, { "ce_ib": 8.768068313598633, "ce_orig": 0.1545993983745575, "epoch": 0.10209217053706234, "kl_loss": 0.22588716447353363, "loss_ib": 0.003135678358376026, "step": 355 }, { "ce_ib": 11.144165992736816, "ce_orig": 0.8069305419921875, "epoch": 0.10209217053706234, "kl_loss": 0.1619873195886612, "loss_ib": 0.002734289737418294, "step": 355 }, { "ce_ib": 12.587420463562012, "ce_orig": 1.174453616142273, "epoch": 0.10237975411603997, "kl_loss": 0.25647827982902527, "loss_ib": 0.003823524573817849, "step": 356 }, { "ce_ib": 9.973530769348145, "ce_orig": 0.5818334221839905, "epoch": 0.10237975411603997, "kl_loss": 0.14407533407211304, "loss_ib": 0.0024381063412874937, "step": 356 }, { "ce_ib": 12.697566032409668, "ce_orig": 1.0796477794647217, "epoch": 0.10237975411603997, "kl_loss": 0.24205471575260162, "loss_ib": 0.003690303536131978, "step": 356 }, { "ce_ib": 12.71401596069336, "ce_orig": 0.7969520688056946, "epoch": 0.10237975411603997, "kl_loss": 0.2004072666168213, "loss_ib": 0.003275474300608039, "step": 356 }, { "ce_ib": 11.712475776672363, "ce_orig": 0.8881208896636963, "epoch": 0.10266733769501761, "kl_loss": 0.17075558006763458, "loss_ib": 0.0028788032941520214, "step": 357 }, { "ce_ib": 13.805883407592773, "ce_orig": 0.6269095540046692, "epoch": 0.10266733769501761, "kl_loss": 0.2602432370185852, "loss_ib": 0.003983020782470703, "step": 357 }, { "ce_ib": 9.764449119567871, "ce_orig": 0.7314236760139465, "epoch": 0.10266733769501761, "kl_loss": 0.2458636462688446, "loss_ib": 0.0034350811038166285, "step": 357 }, { "ce_ib": 12.507657051086426, "ce_orig": 0.6812151670455933, "epoch": 0.10266733769501761, "kl_loss": 0.19368158280849457, "loss_ib": 0.0031875811982899904, "step": 357 }, { "ce_ib": 11.365423202514648, "ce_orig": 0.6420213580131531, "epoch": 0.10295492127399525, "kl_loss": 0.4926440715789795, "loss_ib": 0.0060629830695688725, "step": 358 }, { "ce_ib": 7.592077255249023, "ce_orig": 0.265299916267395, "epoch": 0.10295492127399525, "kl_loss": 0.4861292541027069, "loss_ib": 0.005620500538498163, "step": 358 }, { "ce_ib": 15.327858924865723, "ce_orig": 0.9397932887077332, "epoch": 0.10295492127399525, "kl_loss": 0.17111369967460632, "loss_ib": 0.003243922721594572, "step": 358 }, { "ce_ib": 13.333529472351074, "ce_orig": 0.787560224533081, "epoch": 0.10295492127399525, "kl_loss": 0.20652362704277039, "loss_ib": 0.00339858909137547, "step": 358 }, { "ce_ib": 13.753911972045898, "ce_orig": 0.3446463644504547, "epoch": 0.1032425048529729, "kl_loss": 0.4839940667152405, "loss_ib": 0.006215331610292196, "step": 359 }, { "ce_ib": 16.900297164916992, "ce_orig": 1.5462009906768799, "epoch": 0.1032425048529729, "kl_loss": 0.1991090476512909, "loss_ib": 0.003681120229884982, "step": 359 }, { "ce_ib": 14.061060905456543, "ce_orig": 0.8726510405540466, "epoch": 0.1032425048529729, "kl_loss": 0.19025549292564392, "loss_ib": 0.003308660816401243, "step": 359 }, { "ce_ib": 13.532440185546875, "ce_orig": 1.3304260969161987, "epoch": 0.1032425048529729, "kl_loss": 0.16146531701087952, "loss_ib": 0.002967897104099393, "step": 359 }, { "epoch": 0.10353008843195054, "grad_norm": 0.08045380562543869, "learning_rate": 4.99980726386944e-05, "loss": 0.9013, "step": 360 }, { "ce_ib": 16.031070709228516, "ce_orig": 0.641457200050354, "epoch": 0.10353008843195054, "kl_loss": 0.3759670853614807, "loss_ib": 0.005362777505069971, "step": 360 }, { "ce_ib": 10.804533004760742, "ce_orig": 0.6665270924568176, "epoch": 0.10353008843195054, "kl_loss": 0.16297683119773865, "loss_ib": 0.0027102213352918625, "step": 360 }, { "ce_ib": 11.559240341186523, "ce_orig": 0.8196082711219788, "epoch": 0.10353008843195054, "kl_loss": 0.1367412805557251, "loss_ib": 0.002523336559534073, "step": 360 }, { "ce_ib": 11.892834663391113, "ce_orig": 0.439602255821228, "epoch": 0.10353008843195054, "kl_loss": 0.3415584862232208, "loss_ib": 0.004604868125170469, "step": 360 }, { "ce_ib": 8.562467575073242, "ce_orig": 0.45625510811805725, "epoch": 0.10381767201092817, "kl_loss": 0.1342378854751587, "loss_ib": 0.0021986253559589386, "step": 361 }, { "ce_ib": 9.903914451599121, "ce_orig": 0.8635908365249634, "epoch": 0.10381767201092817, "kl_loss": 0.22620341181755066, "loss_ib": 0.0032524254638701677, "step": 361 }, { "ce_ib": 17.545305252075195, "ce_orig": 1.781671166419983, "epoch": 0.10381767201092817, "kl_loss": 0.217964768409729, "loss_ib": 0.003934178035706282, "step": 361 }, { "ce_ib": 12.740987777709961, "ce_orig": 0.7617380619049072, "epoch": 0.10381767201092817, "kl_loss": 0.26160410046577454, "loss_ib": 0.003890139749273658, "step": 361 }, { "ce_ib": 10.342143058776855, "ce_orig": 1.0058131217956543, "epoch": 0.10410525558990581, "kl_loss": 0.3163241147994995, "loss_ib": 0.0041974554769694805, "step": 362 }, { "ce_ib": 19.41802406311035, "ce_orig": 1.730543851852417, "epoch": 0.10410525558990581, "kl_loss": 0.23577484488487244, "loss_ib": 0.004299550782889128, "step": 362 }, { "ce_ib": 15.791916847229004, "ce_orig": 1.4829944372177124, "epoch": 0.10410525558990581, "kl_loss": 0.14233699440956116, "loss_ib": 0.003002561628818512, "step": 362 }, { "ce_ib": 9.117117881774902, "ce_orig": 0.4645211696624756, "epoch": 0.10410525558990581, "kl_loss": 0.1363692581653595, "loss_ib": 0.0022754042875021696, "step": 362 }, { "ce_ib": 13.213629722595215, "ce_orig": 1.1761356592178345, "epoch": 0.10439283916888345, "kl_loss": 0.2095613181591034, "loss_ib": 0.0034169761929661036, "step": 363 }, { "ce_ib": 12.37755012512207, "ce_orig": 0.8143442273139954, "epoch": 0.10439283916888345, "kl_loss": 0.14410914480686188, "loss_ib": 0.002678846474736929, "step": 363 }, { "ce_ib": 17.626813888549805, "ce_orig": 1.4411890506744385, "epoch": 0.10439283916888345, "kl_loss": 0.1780979335308075, "loss_ib": 0.0035436605103313923, "step": 363 }, { "ce_ib": 9.846484184265137, "ce_orig": 0.5962998270988464, "epoch": 0.10439283916888345, "kl_loss": 0.1512468159198761, "loss_ib": 0.002497116569429636, "step": 363 }, { "ce_ib": 12.717291831970215, "ce_orig": 0.9116876721382141, "epoch": 0.1046804227478611, "kl_loss": 0.16959382593631744, "loss_ib": 0.00296766753308475, "step": 364 }, { "ce_ib": 12.457673072814941, "ce_orig": 0.09528730809688568, "epoch": 0.1046804227478611, "kl_loss": 0.38302385807037354, "loss_ib": 0.005076006054878235, "step": 364 }, { "ce_ib": 12.967721939086914, "ce_orig": 0.7480602860450745, "epoch": 0.1046804227478611, "kl_loss": 0.41338658332824707, "loss_ib": 0.005430637858808041, "step": 364 }, { "ce_ib": 15.809802055358887, "ce_orig": 1.5115008354187012, "epoch": 0.1046804227478611, "kl_loss": 0.2618887722492218, "loss_ib": 0.004199867602437735, "step": 364 }, { "epoch": 0.10496800632683874, "grad_norm": 0.1035882830619812, "learning_rate": 4.9997560691673194e-05, "loss": 0.9193, "step": 365 }, { "ce_ib": 13.008557319641113, "ce_orig": 0.8673336505889893, "epoch": 0.10496800632683874, "kl_loss": 0.2006014883518219, "loss_ib": 0.003306870348751545, "step": 365 }, { "ce_ib": 9.279165267944336, "ce_orig": 0.656031608581543, "epoch": 0.10496800632683874, "kl_loss": 0.24030038714408875, "loss_ib": 0.0033309203572571278, "step": 365 }, { "ce_ib": 14.56029987335205, "ce_orig": 1.059706211090088, "epoch": 0.10496800632683874, "kl_loss": 0.22321242094039917, "loss_ib": 0.0036881540436297655, "step": 365 }, { "ce_ib": 10.043885231018066, "ce_orig": 0.7288112044334412, "epoch": 0.10496800632683874, "kl_loss": 0.1112736165523529, "loss_ib": 0.002117124618962407, "step": 365 }, { "ce_ib": 14.350020408630371, "ce_orig": 1.2987266778945923, "epoch": 0.10525558990581638, "kl_loss": 0.21527716517448425, "loss_ib": 0.0035877733025699854, "step": 366 }, { "ce_ib": 9.209977149963379, "ce_orig": 0.7698776721954346, "epoch": 0.10525558990581638, "kl_loss": 0.20659813284873962, "loss_ib": 0.0029869787395000458, "step": 366 }, { "ce_ib": 12.112702369689941, "ce_orig": 0.7612364888191223, "epoch": 0.10525558990581638, "kl_loss": 0.2407711148262024, "loss_ib": 0.003618981223553419, "step": 366 }, { "ce_ib": 11.292844772338867, "ce_orig": 0.769523024559021, "epoch": 0.10525558990581638, "kl_loss": 0.23566709458827972, "loss_ib": 0.00348595529794693, "step": 366 }, { "ce_ib": 12.479425430297852, "ce_orig": 0.8336954116821289, "epoch": 0.10554317348479401, "kl_loss": 0.16503103077411652, "loss_ib": 0.0028982528019696474, "step": 367 }, { "ce_ib": 11.297480583190918, "ce_orig": 0.7182275056838989, "epoch": 0.10554317348479401, "kl_loss": 0.2943016290664673, "loss_ib": 0.004072763957083225, "step": 367 }, { "ce_ib": 13.729005813598633, "ce_orig": 1.3682771921157837, "epoch": 0.10554317348479401, "kl_loss": 0.1870647370815277, "loss_ib": 0.0032435478642582893, "step": 367 }, { "ce_ib": 14.036231994628906, "ce_orig": 1.112056851387024, "epoch": 0.10554317348479401, "kl_loss": 0.15229341387748718, "loss_ib": 0.0029265573248267174, "step": 367 }, { "ce_ib": 15.093040466308594, "ce_orig": 1.170424222946167, "epoch": 0.10583075706377165, "kl_loss": 0.2388845682144165, "loss_ib": 0.0038981495890766382, "step": 368 }, { "ce_ib": 15.43298053741455, "ce_orig": 1.196273922920227, "epoch": 0.10583075706377165, "kl_loss": 0.19452136754989624, "loss_ib": 0.0034885117784142494, "step": 368 }, { "ce_ib": 13.480894088745117, "ce_orig": 1.0033950805664062, "epoch": 0.10583075706377165, "kl_loss": 0.24435830116271973, "loss_ib": 0.003791672410443425, "step": 368 }, { "ce_ib": 15.991963386535645, "ce_orig": 1.5334750413894653, "epoch": 0.10583075706377165, "kl_loss": 0.1978762149810791, "loss_ib": 0.0035779583267867565, "step": 368 }, { "ce_ib": 9.99071979522705, "ce_orig": 0.521371066570282, "epoch": 0.1061183406427493, "kl_loss": 0.14332063496112823, "loss_ib": 0.0024322783574461937, "step": 369 }, { "ce_ib": 14.23776912689209, "ce_orig": 1.3547425270080566, "epoch": 0.1061183406427493, "kl_loss": 0.18942734599113464, "loss_ib": 0.0033180504105985165, "step": 369 }, { "ce_ib": 10.9193754196167, "ce_orig": 0.7963501214981079, "epoch": 0.1061183406427493, "kl_loss": 0.19985352456569672, "loss_ib": 0.003090472659096122, "step": 369 }, { "ce_ib": 11.383045196533203, "ce_orig": 0.7126600742340088, "epoch": 0.1061183406427493, "kl_loss": 0.17306244373321533, "loss_ib": 0.002868928946554661, "step": 369 }, { "epoch": 0.10640592422172694, "grad_norm": 0.08818119019269943, "learning_rate": 4.999698851972622e-05, "loss": 0.9172, "step": 370 }, { "ce_ib": 13.027803421020508, "ce_orig": 0.8471740484237671, "epoch": 0.10640592422172694, "kl_loss": 0.1602221429347992, "loss_ib": 0.0029050016310065985, "step": 370 }, { "ce_ib": 12.130885124206543, "ce_orig": 0.5990825891494751, "epoch": 0.10640592422172694, "kl_loss": 0.19608041644096375, "loss_ib": 0.0031738923862576485, "step": 370 }, { "ce_ib": 11.950088500976562, "ce_orig": 0.6112602353096008, "epoch": 0.10640592422172694, "kl_loss": 0.1965973824262619, "loss_ib": 0.0031609826255589724, "step": 370 }, { "ce_ib": 9.864639282226562, "ce_orig": 0.7072968482971191, "epoch": 0.10640592422172694, "kl_loss": 0.1892612874507904, "loss_ib": 0.002879076637327671, "step": 370 }, { "ce_ib": 7.837416648864746, "ce_orig": 0.22909517586231232, "epoch": 0.10669350780070458, "kl_loss": 0.4259476363658905, "loss_ib": 0.005043217912316322, "step": 371 }, { "ce_ib": 16.050464630126953, "ce_orig": 1.3338783979415894, "epoch": 0.10669350780070458, "kl_loss": 0.18167968094348907, "loss_ib": 0.0034218430519104004, "step": 371 }, { "ce_ib": 7.732363224029541, "ce_orig": 0.6679915189743042, "epoch": 0.10669350780070458, "kl_loss": 0.19385015964508057, "loss_ib": 0.00271173776127398, "step": 371 }, { "ce_ib": 17.768779754638672, "ce_orig": 1.290654182434082, "epoch": 0.10669350780070458, "kl_loss": 0.18727800250053406, "loss_ib": 0.0036496578250080347, "step": 371 }, { "ce_ib": 16.024396896362305, "ce_orig": 1.4784846305847168, "epoch": 0.10698109137968222, "kl_loss": 0.17223666608333588, "loss_ib": 0.0033248059917241335, "step": 372 }, { "ce_ib": 9.74294376373291, "ce_orig": 0.5707986950874329, "epoch": 0.10698109137968222, "kl_loss": 0.16291573643684387, "loss_ib": 0.0026034514885395765, "step": 372 }, { "ce_ib": 16.458507537841797, "ce_orig": 0.9432319402694702, "epoch": 0.10698109137968222, "kl_loss": 0.1663103997707367, "loss_ib": 0.0033089546486735344, "step": 372 }, { "ce_ib": 15.392163276672363, "ce_orig": 1.5210273265838623, "epoch": 0.10698109137968222, "kl_loss": 0.22455021739006042, "loss_ib": 0.003784718457609415, "step": 372 }, { "ce_ib": 14.316435813903809, "ce_orig": 0.8189164400100708, "epoch": 0.10726867495865985, "kl_loss": 0.16313040256500244, "loss_ib": 0.0030629474204033613, "step": 373 }, { "ce_ib": 11.636860847473145, "ce_orig": 0.7378359436988831, "epoch": 0.10726867495865985, "kl_loss": 0.1494181752204895, "loss_ib": 0.0026578675024211407, "step": 373 }, { "ce_ib": 17.269123077392578, "ce_orig": 1.541763424873352, "epoch": 0.10726867495865985, "kl_loss": 0.26547926664352417, "loss_ib": 0.004381704609841108, "step": 373 }, { "ce_ib": 10.263904571533203, "ce_orig": 0.8089870810508728, "epoch": 0.10726867495865985, "kl_loss": 0.11840936541557312, "loss_ib": 0.002210484119132161, "step": 373 }, { "ce_ib": 15.512616157531738, "ce_orig": 0.9539732933044434, "epoch": 0.1075562585376375, "kl_loss": 0.28004124760627747, "loss_ib": 0.004351674113422632, "step": 374 }, { "ce_ib": 13.218826293945312, "ce_orig": 0.9203503131866455, "epoch": 0.1075562585376375, "kl_loss": 0.17954644560813904, "loss_ib": 0.003117346903309226, "step": 374 }, { "ce_ib": 12.426115036010742, "ce_orig": 1.001791000366211, "epoch": 0.1075562585376375, "kl_loss": 0.24035847187042236, "loss_ib": 0.003646196098998189, "step": 374 }, { "ce_ib": 13.382880210876465, "ce_orig": 1.0965611934661865, "epoch": 0.1075562585376375, "kl_loss": 0.16744542121887207, "loss_ib": 0.003012742381542921, "step": 374 }, { "epoch": 0.10784384211661514, "grad_norm": 0.0786062702536583, "learning_rate": 4.999635612423198e-05, "loss": 0.8711, "step": 375 }, { "ce_ib": 7.170506477355957, "ce_orig": 0.2852292060852051, "epoch": 0.10784384211661514, "kl_loss": 0.37380170822143555, "loss_ib": 0.004455067683011293, "step": 375 }, { "ce_ib": 10.11276626586914, "ce_orig": 0.5102769136428833, "epoch": 0.10784384211661514, "kl_loss": 0.18036767840385437, "loss_ib": 0.002814953215420246, "step": 375 }, { "ce_ib": 11.423179626464844, "ce_orig": 1.2335662841796875, "epoch": 0.10784384211661514, "kl_loss": 0.19887100160121918, "loss_ib": 0.0031310277990996838, "step": 375 }, { "ce_ib": 14.86428451538086, "ce_orig": 0.6654768586158752, "epoch": 0.10784384211661514, "kl_loss": 0.19978465139865875, "loss_ib": 0.0034842747263610363, "step": 375 }, { "ce_ib": 12.019170761108398, "ce_orig": 0.830958902835846, "epoch": 0.10813142569559278, "kl_loss": 0.19432778656482697, "loss_ib": 0.0031451948452740908, "step": 376 }, { "ce_ib": 15.544536590576172, "ce_orig": 0.608134388923645, "epoch": 0.10813142569559278, "kl_loss": 0.3602546155452728, "loss_ib": 0.005156999919563532, "step": 376 }, { "ce_ib": 10.856096267700195, "ce_orig": 0.7232799530029297, "epoch": 0.10813142569559278, "kl_loss": 0.15802645683288574, "loss_ib": 0.00266587408259511, "step": 376 }, { "ce_ib": 13.540989875793457, "ce_orig": 1.0887871980667114, "epoch": 0.10813142569559278, "kl_loss": 0.19060353934764862, "loss_ib": 0.0032601344864815474, "step": 376 }, { "ce_ib": 13.389488220214844, "ce_orig": 0.8150464296340942, "epoch": 0.10841900927457042, "kl_loss": 0.19611474871635437, "loss_ib": 0.0033000963740050793, "step": 377 }, { "ce_ib": 7.958892822265625, "ce_orig": 0.558684229850769, "epoch": 0.10841900927457042, "kl_loss": 0.12297540158033371, "loss_ib": 0.002025643130764365, "step": 377 }, { "ce_ib": 13.451696395874023, "ce_orig": 0.9451778531074524, "epoch": 0.10841900927457042, "kl_loss": 0.22830717265605927, "loss_ib": 0.003628241363912821, "step": 377 }, { "ce_ib": 11.917108535766602, "ce_orig": 1.090754747390747, "epoch": 0.10841900927457042, "kl_loss": 0.18710459768772125, "loss_ib": 0.003062756499275565, "step": 377 }, { "ce_ib": 11.53650951385498, "ce_orig": 0.4949207007884979, "epoch": 0.10870659285354806, "kl_loss": 0.2471131980419159, "loss_ib": 0.0036247826647013426, "step": 378 }, { "ce_ib": 9.730238914489746, "ce_orig": 0.40288040041923523, "epoch": 0.10870659285354806, "kl_loss": 0.18191629648208618, "loss_ib": 0.0027921865694224834, "step": 378 }, { "ce_ib": 9.56220817565918, "ce_orig": 0.5649886727333069, "epoch": 0.10870659285354806, "kl_loss": 0.17736974358558655, "loss_ib": 0.0027299183420836926, "step": 378 }, { "ce_ib": 16.986759185791016, "ce_orig": 1.3326983451843262, "epoch": 0.10870659285354806, "kl_loss": 0.27190378308296204, "loss_ib": 0.0044177137315273285, "step": 378 }, { "ce_ib": 10.621078491210938, "ce_orig": 0.9211146831512451, "epoch": 0.10899417643252571, "kl_loss": 0.1395106166601181, "loss_ib": 0.002457214053720236, "step": 379 }, { "ce_ib": 8.39609432220459, "ce_orig": 0.679756224155426, "epoch": 0.10899417643252571, "kl_loss": 0.1734372079372406, "loss_ib": 0.0025739814154803753, "step": 379 }, { "ce_ib": 13.126282691955566, "ce_orig": 0.5308454036712646, "epoch": 0.10899417643252571, "kl_loss": 0.23796755075454712, "loss_ib": 0.0036923037841916084, "step": 379 }, { "ce_ib": 15.385143280029297, "ce_orig": 0.9731943607330322, "epoch": 0.10899417643252571, "kl_loss": 0.2400083839893341, "loss_ib": 0.003938598092645407, "step": 379 }, { "epoch": 0.10928176001150335, "grad_norm": 0.07642538100481033, "learning_rate": 4.9995663506714054e-05, "loss": 0.8705, "step": 380 }, { "ce_ib": 10.140104293823242, "ce_orig": 0.55213463306427, "epoch": 0.10928176001150335, "kl_loss": 0.2998710870742798, "loss_ib": 0.004012721125036478, "step": 380 }, { "ce_ib": 12.016203880310059, "ce_orig": 0.2663145363330841, "epoch": 0.10928176001150335, "kl_loss": 0.20258453488349915, "loss_ib": 0.0032274657860398293, "step": 380 }, { "ce_ib": 10.269865989685059, "ce_orig": 0.5478006601333618, "epoch": 0.10928176001150335, "kl_loss": 0.17457614839076996, "loss_ib": 0.0027727477718144655, "step": 380 }, { "ce_ib": 10.28240966796875, "ce_orig": 0.46482110023498535, "epoch": 0.10928176001150335, "kl_loss": 0.14175333082675934, "loss_ib": 0.0024457741528749466, "step": 380 }, { "ce_ib": 18.375350952148438, "ce_orig": 1.6469268798828125, "epoch": 0.10956934359048098, "kl_loss": 0.2459729164838791, "loss_ib": 0.004297263920307159, "step": 381 }, { "ce_ib": 13.591058731079102, "ce_orig": 0.654187798500061, "epoch": 0.10956934359048098, "kl_loss": 0.33038705587387085, "loss_ib": 0.004662976134568453, "step": 381 }, { "ce_ib": 18.45250129699707, "ce_orig": 1.5424803495407104, "epoch": 0.10956934359048098, "kl_loss": 0.25389549136161804, "loss_ib": 0.004384204745292664, "step": 381 }, { "ce_ib": 15.972155570983887, "ce_orig": 1.1866068840026855, "epoch": 0.10956934359048098, "kl_loss": 0.26268285512924194, "loss_ib": 0.004224043805152178, "step": 381 }, { "ce_ib": 10.061860084533691, "ce_orig": 0.5798574090003967, "epoch": 0.10985692716945862, "kl_loss": 0.18744969367980957, "loss_ib": 0.002880682935938239, "step": 382 }, { "ce_ib": 8.527949333190918, "ce_orig": 0.7655165195465088, "epoch": 0.10985692716945862, "kl_loss": 0.19700750708580017, "loss_ib": 0.002822869922965765, "step": 382 }, { "ce_ib": 7.723175525665283, "ce_orig": 0.46251556277275085, "epoch": 0.10985692716945862, "kl_loss": 0.1479792296886444, "loss_ib": 0.0022521098144352436, "step": 382 }, { "ce_ib": 16.92078399658203, "ce_orig": 1.5507680177688599, "epoch": 0.10985692716945862, "kl_loss": 0.17009945213794708, "loss_ib": 0.0033930731005966663, "step": 382 }, { "ce_ib": 11.547307014465332, "ce_orig": 0.9038912057876587, "epoch": 0.11014451074843626, "kl_loss": 0.18578889966011047, "loss_ib": 0.003012619446963072, "step": 383 }, { "ce_ib": 7.641073226928711, "ce_orig": 0.6663032174110413, "epoch": 0.11014451074843626, "kl_loss": 0.12631307542324066, "loss_ib": 0.002027238020673394, "step": 383 }, { "ce_ib": 7.092626094818115, "ce_orig": 0.4686228632926941, "epoch": 0.11014451074843626, "kl_loss": 0.1317451447248459, "loss_ib": 0.002026714151725173, "step": 383 }, { "ce_ib": 9.421049118041992, "ce_orig": 0.6183243989944458, "epoch": 0.11014451074843626, "kl_loss": 0.15724687278270721, "loss_ib": 0.002514573512598872, "step": 383 }, { "ce_ib": 11.571142196655273, "ce_orig": 0.4451025128364563, "epoch": 0.11043209432741391, "kl_loss": 0.2353937327861786, "loss_ib": 0.0035110514145344496, "step": 384 }, { "ce_ib": 16.550886154174805, "ce_orig": 1.2699673175811768, "epoch": 0.11043209432741391, "kl_loss": 0.2898581027984619, "loss_ib": 0.004553669597953558, "step": 384 }, { "ce_ib": 12.445303916931152, "ce_orig": 0.6089316606521606, "epoch": 0.11043209432741391, "kl_loss": 0.5906498432159424, "loss_ib": 0.007151029072701931, "step": 384 }, { "ce_ib": 11.304732322692871, "ce_orig": 0.6872734427452087, "epoch": 0.11043209432741391, "kl_loss": 0.132551908493042, "loss_ib": 0.002455992391332984, "step": 384 }, { "epoch": 0.11071967790639155, "grad_norm": 0.08736824244260788, "learning_rate": 4.999491066884113e-05, "loss": 0.8343, "step": 385 }, { "ce_ib": 12.851602554321289, "ce_orig": 1.4722890853881836, "epoch": 0.11071967790639155, "kl_loss": 0.16855554282665253, "loss_ib": 0.0029707157518714666, "step": 385 }, { "ce_ib": 12.488396644592285, "ce_orig": 1.012579321861267, "epoch": 0.11071967790639155, "kl_loss": 0.24618947505950928, "loss_ib": 0.0037107341922819614, "step": 385 }, { "ce_ib": 9.774558067321777, "ce_orig": 0.6036505103111267, "epoch": 0.11071967790639155, "kl_loss": 0.14310193061828613, "loss_ib": 0.0024084749165922403, "step": 385 }, { "ce_ib": 10.53403091430664, "ce_orig": 0.8375312089920044, "epoch": 0.11071967790639155, "kl_loss": 0.2290131151676178, "loss_ib": 0.00334353419020772, "step": 385 }, { "ce_ib": 13.784265518188477, "ce_orig": 0.7486900091171265, "epoch": 0.11100726148536919, "kl_loss": 0.275905966758728, "loss_ib": 0.004137486219406128, "step": 386 }, { "ce_ib": 13.386645317077637, "ce_orig": 0.8458417654037476, "epoch": 0.11100726148536919, "kl_loss": 0.2864159941673279, "loss_ib": 0.0042028240859508514, "step": 386 }, { "ce_ib": 4.843447685241699, "ce_orig": 0.1851879358291626, "epoch": 0.11100726148536919, "kl_loss": 0.44297945499420166, "loss_ib": 0.0049141389317810535, "step": 386 }, { "ce_ib": 11.102249145507812, "ce_orig": 0.7399924397468567, "epoch": 0.11100726148536919, "kl_loss": 0.2577285170555115, "loss_ib": 0.0036875098012387753, "step": 386 }, { "ce_ib": 13.290738105773926, "ce_orig": 0.8414790034294128, "epoch": 0.11129484506434682, "kl_loss": 0.1596413552761078, "loss_ib": 0.0029254870023578405, "step": 387 }, { "ce_ib": 12.116263389587402, "ce_orig": 1.0983738899230957, "epoch": 0.11129484506434682, "kl_loss": 0.22985008358955383, "loss_ib": 0.0035101270768791437, "step": 387 }, { "ce_ib": 11.536699295043945, "ce_orig": 0.7217467427253723, "epoch": 0.11129484506434682, "kl_loss": 0.23231491446495056, "loss_ib": 0.003476819023489952, "step": 387 }, { "ce_ib": 10.348511695861816, "ce_orig": 0.9353364706039429, "epoch": 0.11129484506434682, "kl_loss": 0.16923439502716064, "loss_ib": 0.0027271949220448732, "step": 387 }, { "ce_ib": 8.719440460205078, "ce_orig": 0.6035894155502319, "epoch": 0.11158242864332446, "kl_loss": 0.22707051038742065, "loss_ib": 0.0031426490750163794, "step": 388 }, { "ce_ib": 12.744837760925293, "ce_orig": 0.7636030316352844, "epoch": 0.11158242864332446, "kl_loss": 0.19510197639465332, "loss_ib": 0.0032255034893751144, "step": 388 }, { "ce_ib": 10.507633209228516, "ce_orig": 0.5344758033752441, "epoch": 0.11158242864332446, "kl_loss": 0.23824182152748108, "loss_ib": 0.0034331816714257, "step": 388 }, { "ce_ib": 13.216085433959961, "ce_orig": 0.9561126232147217, "epoch": 0.11158242864332446, "kl_loss": 0.19082219898700714, "loss_ib": 0.003229830414056778, "step": 388 }, { "ce_ib": 12.790705680847168, "ce_orig": 0.7942649722099304, "epoch": 0.11187001222230211, "kl_loss": 0.19223928451538086, "loss_ib": 0.003201463259756565, "step": 389 }, { "ce_ib": 12.605323791503906, "ce_orig": 0.9660126566886902, "epoch": 0.11187001222230211, "kl_loss": 0.18265745043754578, "loss_ib": 0.0030871068593114614, "step": 389 }, { "ce_ib": 16.678693771362305, "ce_orig": 1.4949008226394653, "epoch": 0.11187001222230211, "kl_loss": 0.2443901002407074, "loss_ib": 0.004111770074814558, "step": 389 }, { "ce_ib": 15.18307876586914, "ce_orig": 1.5530723333358765, "epoch": 0.11187001222230211, "kl_loss": 0.18980354070663452, "loss_ib": 0.0034163433592766523, "step": 389 }, { "epoch": 0.11215759580127975, "grad_norm": 0.0806172788143158, "learning_rate": 4.999409761242696e-05, "loss": 0.889, "step": 390 }, { "ce_ib": 12.329959869384766, "ce_orig": 0.6557547450065613, "epoch": 0.11215759580127975, "kl_loss": 0.11406560242176056, "loss_ib": 0.0023736520670354366, "step": 390 }, { "ce_ib": 10.382856369018555, "ce_orig": 0.36463189125061035, "epoch": 0.11215759580127975, "kl_loss": 0.2578916549682617, "loss_ib": 0.0036172019317746162, "step": 390 }, { "ce_ib": 13.944049835205078, "ce_orig": 0.8022533655166626, "epoch": 0.11215759580127975, "kl_loss": 0.23697403073310852, "loss_ib": 0.0037641453091055155, "step": 390 }, { "ce_ib": 10.437244415283203, "ce_orig": 0.6617816090583801, "epoch": 0.11215759580127975, "kl_loss": 0.15966740250587463, "loss_ib": 0.0026403984520584345, "step": 390 }, { "ce_ib": 11.55241584777832, "ce_orig": 0.7899225950241089, "epoch": 0.11244517938025739, "kl_loss": 0.12170088291168213, "loss_ib": 0.0023722504265606403, "step": 391 }, { "ce_ib": 14.663440704345703, "ce_orig": 0.9394941329956055, "epoch": 0.11244517938025739, "kl_loss": 0.23881687223911285, "loss_ib": 0.00385451246984303, "step": 391 }, { "ce_ib": 9.422616004943848, "ce_orig": 0.5803003907203674, "epoch": 0.11244517938025739, "kl_loss": 0.16054609417915344, "loss_ib": 0.0025477223098278046, "step": 391 }, { "ce_ib": 11.833211898803711, "ce_orig": 0.6175609827041626, "epoch": 0.11244517938025739, "kl_loss": 0.2186504304409027, "loss_ib": 0.0033698254264891148, "step": 391 }, { "ce_ib": 11.895299911499023, "ce_orig": 0.6896355152130127, "epoch": 0.11273276295923502, "kl_loss": 0.17966461181640625, "loss_ib": 0.0029861759394407272, "step": 392 }, { "ce_ib": 11.261984825134277, "ce_orig": 0.7158202528953552, "epoch": 0.11273276295923502, "kl_loss": 0.19520384073257446, "loss_ib": 0.00307823671028018, "step": 392 }, { "ce_ib": 12.316457748413086, "ce_orig": 0.8367967009544373, "epoch": 0.11273276295923502, "kl_loss": 0.2615872323513031, "loss_ib": 0.0038475177716463804, "step": 392 }, { "ce_ib": 10.227145195007324, "ce_orig": 0.7019678950309753, "epoch": 0.11273276295923502, "kl_loss": 0.21493881940841675, "loss_ib": 0.0031721023842692375, "step": 392 }, { "ce_ib": 16.03828239440918, "ce_orig": 1.3268945217132568, "epoch": 0.11302034653821266, "kl_loss": 0.23496520519256592, "loss_ib": 0.003953480161726475, "step": 393 }, { "ce_ib": 7.363077163696289, "ce_orig": 0.6715714335441589, "epoch": 0.11302034653821266, "kl_loss": 0.12172873318195343, "loss_ib": 0.0019535948522388935, "step": 393 }, { "ce_ib": 10.327352523803711, "ce_orig": 0.9410114884376526, "epoch": 0.11302034653821266, "kl_loss": 0.11792122572660446, "loss_ib": 0.0022119474597275257, "step": 393 }, { "ce_ib": 5.172538757324219, "ce_orig": 0.20720714330673218, "epoch": 0.11302034653821266, "kl_loss": 0.41349154710769653, "loss_ib": 0.004652169067412615, "step": 393 }, { "ce_ib": 10.094765663146973, "ce_orig": 0.6660728454589844, "epoch": 0.11330793011719031, "kl_loss": 0.1545972228050232, "loss_ib": 0.0025554485619068146, "step": 394 }, { "ce_ib": 12.061307907104492, "ce_orig": 0.5917040109634399, "epoch": 0.11330793011719031, "kl_loss": 0.19155195355415344, "loss_ib": 0.003121650079265237, "step": 394 }, { "ce_ib": 13.97226333618164, "ce_orig": 1.101852536201477, "epoch": 0.11330793011719031, "kl_loss": 0.19805079698562622, "loss_ib": 0.003377734450623393, "step": 394 }, { "ce_ib": 14.349608421325684, "ce_orig": 0.5646123886108398, "epoch": 0.11330793011719031, "kl_loss": 0.17135578393936157, "loss_ib": 0.0031485187355428934, "step": 394 }, { "epoch": 0.11359551369616795, "grad_norm": 0.08417540043592453, "learning_rate": 4.999322433943038e-05, "loss": 0.8409, "step": 395 }, { "ce_ib": 12.859439849853516, "ce_orig": 0.9198188185691833, "epoch": 0.11359551369616795, "kl_loss": 0.1865035444498062, "loss_ib": 0.0031509792897850275, "step": 395 }, { "ce_ib": 10.23005485534668, "ce_orig": 0.6933926939964294, "epoch": 0.11359551369616795, "kl_loss": 0.14806464314460754, "loss_ib": 0.0025036518927663565, "step": 395 }, { "ce_ib": 14.05105972290039, "ce_orig": 0.6480773687362671, "epoch": 0.11359551369616795, "kl_loss": 0.2830086648464203, "loss_ib": 0.0042351926676929, "step": 395 }, { "ce_ib": 12.827180862426758, "ce_orig": 1.2222548723220825, "epoch": 0.11359551369616795, "kl_loss": 0.19166235625743866, "loss_ib": 0.0031993414741009474, "step": 395 }, { "ce_ib": 14.012380599975586, "ce_orig": 1.3009854555130005, "epoch": 0.11388309727514559, "kl_loss": 0.2228410542011261, "loss_ib": 0.003629648592323065, "step": 396 }, { "ce_ib": 7.52554178237915, "ce_orig": 0.6004323363304138, "epoch": 0.11388309727514559, "kl_loss": 0.15014877915382385, "loss_ib": 0.002254042075946927, "step": 396 }, { "ce_ib": 11.584349632263184, "ce_orig": 0.8162614703178406, "epoch": 0.11388309727514559, "kl_loss": 0.1859622299671173, "loss_ib": 0.003018057206645608, "step": 396 }, { "ce_ib": 11.174099922180176, "ce_orig": 0.7962226271629333, "epoch": 0.11388309727514559, "kl_loss": 0.16366738080978394, "loss_ib": 0.0027540838345885277, "step": 396 }, { "ce_ib": 13.57970905303955, "ce_orig": 1.1856755018234253, "epoch": 0.11417068085412323, "kl_loss": 0.272286593914032, "loss_ib": 0.004080836661159992, "step": 397 }, { "ce_ib": 6.8682122230529785, "ce_orig": 0.43402042984962463, "epoch": 0.11417068085412323, "kl_loss": 0.1285514086484909, "loss_ib": 0.00197233515791595, "step": 397 }, { "ce_ib": 11.961787223815918, "ce_orig": 0.782745897769928, "epoch": 0.11417068085412323, "kl_loss": 0.15355338156223297, "loss_ib": 0.0027317123021930456, "step": 397 }, { "ce_ib": 10.129254341125488, "ce_orig": 0.8172139525413513, "epoch": 0.11417068085412323, "kl_loss": 0.17509959638118744, "loss_ib": 0.0027639211621135473, "step": 397 }, { "ce_ib": 8.069706916809082, "ce_orig": 0.6624881029129028, "epoch": 0.11445826443310086, "kl_loss": 0.12610213458538055, "loss_ib": 0.0020679919980466366, "step": 398 }, { "ce_ib": 7.447951793670654, "ce_orig": 0.44954437017440796, "epoch": 0.11445826443310086, "kl_loss": 0.16658943891525269, "loss_ib": 0.002410689601674676, "step": 398 }, { "ce_ib": 11.109574317932129, "ce_orig": 0.47779056429862976, "epoch": 0.11445826443310086, "kl_loss": 0.23340463638305664, "loss_ib": 0.0034450036473572254, "step": 398 }, { "ce_ib": 15.319025039672852, "ce_orig": 1.082602620124817, "epoch": 0.11445826443310086, "kl_loss": 0.1651686728000641, "loss_ib": 0.0031835888512432575, "step": 398 }, { "ce_ib": 16.39435386657715, "ce_orig": 1.458138108253479, "epoch": 0.11474584801207852, "kl_loss": 0.23157645761966705, "loss_ib": 0.003955199848860502, "step": 399 }, { "ce_ib": 12.060273170471191, "ce_orig": 1.2219758033752441, "epoch": 0.11474584801207852, "kl_loss": 0.18119218945503235, "loss_ib": 0.0030179491732269526, "step": 399 }, { "ce_ib": 9.549758911132812, "ce_orig": 0.5686326026916504, "epoch": 0.11474584801207852, "kl_loss": 0.1396368145942688, "loss_ib": 0.0023513438645750284, "step": 399 }, { "ce_ib": 12.140963554382324, "ce_orig": 0.8329185247421265, "epoch": 0.11474584801207852, "kl_loss": 0.1271989345550537, "loss_ib": 0.002486085519194603, "step": 399 }, { "epoch": 0.11503343159105615, "grad_norm": 0.08466464281082153, "learning_rate": 4.9992290851955325e-05, "loss": 0.8643, "step": 400 }, { "ce_ib": 16.369003295898438, "ce_orig": 0.8453714847564697, "epoch": 0.11503343159105615, "kl_loss": 0.20362722873687744, "loss_ib": 0.0036731725558638573, "step": 400 }, { "ce_ib": 10.80587387084961, "ce_orig": 0.9257553219795227, "epoch": 0.11503343159105615, "kl_loss": 0.18605493009090424, "loss_ib": 0.0029411364812403917, "step": 400 }, { "ce_ib": 6.573936939239502, "ce_orig": 0.6002892851829529, "epoch": 0.11503343159105615, "kl_loss": 0.15251712501049042, "loss_ib": 0.0021825649309903383, "step": 400 }, { "ce_ib": 13.615230560302734, "ce_orig": 1.3942912817001343, "epoch": 0.11503343159105615, "kl_loss": 0.171320840716362, "loss_ib": 0.0030747312121093273, "step": 400 }, { "ce_ib": 12.808405876159668, "ce_orig": 1.0415929555892944, "epoch": 0.11532101517003379, "kl_loss": 0.17026068270206451, "loss_ib": 0.002983447164297104, "step": 401 }, { "ce_ib": 7.786767959594727, "ce_orig": 0.5461778044700623, "epoch": 0.11532101517003379, "kl_loss": 0.1809147298336029, "loss_ib": 0.0025878241285681725, "step": 401 }, { "ce_ib": 9.318531036376953, "ce_orig": 1.0691779851913452, "epoch": 0.11532101517003379, "kl_loss": 0.12710833549499512, "loss_ib": 0.0022029364481568336, "step": 401 }, { "ce_ib": 15.711153030395508, "ce_orig": 1.2399132251739502, "epoch": 0.11532101517003379, "kl_loss": 0.20981115102767944, "loss_ib": 0.003669226774945855, "step": 401 }, { "ce_ib": 13.523634910583496, "ce_orig": 1.0126256942749023, "epoch": 0.11560859874901143, "kl_loss": 0.17583820223808289, "loss_ib": 0.003110745456069708, "step": 402 }, { "ce_ib": 10.453843116760254, "ce_orig": 0.7707417607307434, "epoch": 0.11560859874901143, "kl_loss": 0.13824975490570068, "loss_ib": 0.0024278818164020777, "step": 402 }, { "ce_ib": 12.620675086975098, "ce_orig": 0.9837019443511963, "epoch": 0.11560859874901143, "kl_loss": 0.15091584622859955, "loss_ib": 0.0027712257578969, "step": 402 }, { "ce_ib": 14.844929695129395, "ce_orig": 1.3407633304595947, "epoch": 0.11560859874901143, "kl_loss": 0.30624860525131226, "loss_ib": 0.00454697897657752, "step": 402 }, { "ce_ib": 11.737789154052734, "ce_orig": 1.1215554475784302, "epoch": 0.11589618232798907, "kl_loss": 0.16605661809444427, "loss_ib": 0.002834344981238246, "step": 403 }, { "ce_ib": 11.818507194519043, "ce_orig": 0.4051503837108612, "epoch": 0.11589618232798907, "kl_loss": 0.2137288749217987, "loss_ib": 0.0033191393595188856, "step": 403 }, { "ce_ib": 10.569378852844238, "ce_orig": 0.7266899347305298, "epoch": 0.11589618232798907, "kl_loss": 0.19015324115753174, "loss_ib": 0.002958470256999135, "step": 403 }, { "ce_ib": 10.655888557434082, "ce_orig": 0.640403151512146, "epoch": 0.11589618232798907, "kl_loss": 0.18397970497608185, "loss_ib": 0.0029053858015686274, "step": 403 }, { "ce_ib": 10.284205436706543, "ce_orig": 1.0149288177490234, "epoch": 0.11618376590696672, "kl_loss": 0.16832667589187622, "loss_ib": 0.0027116872370243073, "step": 404 }, { "ce_ib": 13.454412460327148, "ce_orig": 1.0919182300567627, "epoch": 0.11618376590696672, "kl_loss": 0.15390118956565857, "loss_ib": 0.0028844529297202826, "step": 404 }, { "ce_ib": 8.412931442260742, "ce_orig": 0.6086220145225525, "epoch": 0.11618376590696672, "kl_loss": 0.13261398673057556, "loss_ib": 0.002167432801797986, "step": 404 }, { "ce_ib": 16.36043930053711, "ce_orig": 1.389167308807373, "epoch": 0.11618376590696672, "kl_loss": 0.13541021943092346, "loss_ib": 0.002990146167576313, "step": 404 }, { "epoch": 0.11647134948594436, "grad_norm": 0.08868135511875153, "learning_rate": 4.999129715225077e-05, "loss": 0.8893, "step": 405 }, { "ce_ib": 11.492820739746094, "ce_orig": 0.746446967124939, "epoch": 0.11647134948594436, "kl_loss": 0.1755758821964264, "loss_ib": 0.002905040979385376, "step": 405 }, { "ce_ib": 14.550654411315918, "ce_orig": 1.1409695148468018, "epoch": 0.11647134948594436, "kl_loss": 0.16501018404960632, "loss_ib": 0.003105167066678405, "step": 405 }, { "ce_ib": 12.881452560424805, "ce_orig": 1.0264896154403687, "epoch": 0.11647134948594436, "kl_loss": 0.18386085331439972, "loss_ib": 0.003126753494143486, "step": 405 }, { "ce_ib": 15.17376708984375, "ce_orig": 1.3239004611968994, "epoch": 0.11647134948594436, "kl_loss": 0.18682563304901123, "loss_ib": 0.0033856327645480633, "step": 405 }, { "ce_ib": 14.622434616088867, "ce_orig": 1.3146438598632812, "epoch": 0.116758933064922, "kl_loss": 0.18558424711227417, "loss_ib": 0.003318085800856352, "step": 406 }, { "ce_ib": 8.00043773651123, "ce_orig": 0.7650782465934753, "epoch": 0.116758933064922, "kl_loss": 0.14243070781230927, "loss_ib": 0.0022243508137762547, "step": 406 }, { "ce_ib": 11.638957977294922, "ce_orig": 0.927288830280304, "epoch": 0.116758933064922, "kl_loss": 0.14190661907196045, "loss_ib": 0.0025829619262367487, "step": 406 }, { "ce_ib": 8.698803901672363, "ce_orig": 0.4740663766860962, "epoch": 0.116758933064922, "kl_loss": 0.18497580289840698, "loss_ib": 0.0027196381706744432, "step": 406 }, { "ce_ib": 11.999215126037598, "ce_orig": 0.5628153681755066, "epoch": 0.11704651664389963, "kl_loss": 0.261201411485672, "loss_ib": 0.0038119356613606215, "step": 407 }, { "ce_ib": 14.865316390991211, "ce_orig": 1.6626498699188232, "epoch": 0.11704651664389963, "kl_loss": 0.17202956974506378, "loss_ib": 0.003206827212125063, "step": 407 }, { "ce_ib": 11.803093910217285, "ce_orig": 0.8193854093551636, "epoch": 0.11704651664389963, "kl_loss": 0.2457035779953003, "loss_ib": 0.003637345042079687, "step": 407 }, { "ce_ib": 14.206315994262695, "ce_orig": 1.1790286302566528, "epoch": 0.11704651664389963, "kl_loss": 0.21022199094295502, "loss_ib": 0.0035228515043854713, "step": 407 }, { "ce_ib": 9.615798950195312, "ce_orig": 0.5693954229354858, "epoch": 0.11733410022287727, "kl_loss": 0.20928806066513062, "loss_ib": 0.003054460510611534, "step": 408 }, { "ce_ib": 10.448309898376465, "ce_orig": 0.7434052228927612, "epoch": 0.11733410022287727, "kl_loss": 0.18974988162517548, "loss_ib": 0.002942329505458474, "step": 408 }, { "ce_ib": 12.322173118591309, "ce_orig": 0.7398363351821899, "epoch": 0.11733410022287727, "kl_loss": 0.32504746317863464, "loss_ib": 0.004482691641896963, "step": 408 }, { "ce_ib": 11.393105506896973, "ce_orig": 0.2980586290359497, "epoch": 0.11733410022287727, "kl_loss": 0.2762417793273926, "loss_ib": 0.003901728196069598, "step": 408 }, { "ce_ib": 9.13760757446289, "ce_orig": 0.48705342411994934, "epoch": 0.11762168380185492, "kl_loss": 0.2090642750263214, "loss_ib": 0.003004403319209814, "step": 409 }, { "ce_ib": 13.404657363891602, "ce_orig": 1.3054029941558838, "epoch": 0.11762168380185492, "kl_loss": 0.15996284782886505, "loss_ib": 0.0029400940984487534, "step": 409 }, { "ce_ib": 14.58011245727539, "ce_orig": 0.6604776978492737, "epoch": 0.11762168380185492, "kl_loss": 0.17515218257904053, "loss_ib": 0.0032095329370349646, "step": 409 }, { "ce_ib": 12.46037769317627, "ce_orig": 0.969291090965271, "epoch": 0.11762168380185492, "kl_loss": 0.12114151567220688, "loss_ib": 0.002457452705129981, "step": 409 }, { "epoch": 0.11790926738083256, "grad_norm": 0.08972907811403275, "learning_rate": 4.9990243242710764e-05, "loss": 0.8016, "step": 410 }, { "ce_ib": 14.017788887023926, "ce_orig": 1.2842930555343628, "epoch": 0.11790926738083256, "kl_loss": 0.20839394629001617, "loss_ib": 0.0034857182763516903, "step": 410 }, { "ce_ib": 12.625293731689453, "ce_orig": 0.331617534160614, "epoch": 0.11790926738083256, "kl_loss": 0.23530715703964233, "loss_ib": 0.0036156009882688522, "step": 410 }, { "ce_ib": 13.452978134155273, "ce_orig": 0.9680318832397461, "epoch": 0.11790926738083256, "kl_loss": 0.17226648330688477, "loss_ib": 0.003067962359637022, "step": 410 }, { "ce_ib": 13.609016418457031, "ce_orig": 1.1668546199798584, "epoch": 0.11790926738083256, "kl_loss": 0.15326163172721863, "loss_ib": 0.0028935179580003023, "step": 410 }, { "ce_ib": 11.401368141174316, "ce_orig": 0.7574223279953003, "epoch": 0.1181968509598102, "kl_loss": 0.17012295126914978, "loss_ib": 0.002841366222128272, "step": 411 }, { "ce_ib": 13.586700439453125, "ce_orig": 1.1896238327026367, "epoch": 0.1181968509598102, "kl_loss": 0.2817670702934265, "loss_ib": 0.004176340531557798, "step": 411 }, { "ce_ib": 16.24236488342285, "ce_orig": 1.1911630630493164, "epoch": 0.1181968509598102, "kl_loss": 0.19016054272651672, "loss_ib": 0.003525841748341918, "step": 411 }, { "ce_ib": 13.229630470275879, "ce_orig": 0.9971056580543518, "epoch": 0.1181968509598102, "kl_loss": 0.1399802565574646, "loss_ib": 0.0027227657847106457, "step": 411 }, { "ce_ib": 10.67956829071045, "ce_orig": 0.8728124499320984, "epoch": 0.11848443453878783, "kl_loss": 0.15304341912269592, "loss_ib": 0.0025983911473304033, "step": 412 }, { "ce_ib": 7.926272869110107, "ce_orig": 0.4618622958660126, "epoch": 0.11848443453878783, "kl_loss": 0.08525725454092026, "loss_ib": 0.0016451997216790915, "step": 412 }, { "ce_ib": 12.342477798461914, "ce_orig": 0.6581653952598572, "epoch": 0.11848443453878783, "kl_loss": 0.20672234892845154, "loss_ib": 0.0033014710061252117, "step": 412 }, { "ce_ib": 12.10908317565918, "ce_orig": 0.8213714957237244, "epoch": 0.11848443453878783, "kl_loss": 0.23801177740097046, "loss_ib": 0.00359102594666183, "step": 412 }, { "ce_ib": 11.018802642822266, "ce_orig": 0.5446355938911438, "epoch": 0.11877201811776547, "kl_loss": 0.26025596261024475, "loss_ib": 0.0037044398486614227, "step": 413 }, { "ce_ib": 12.422916412353516, "ce_orig": 0.9991008043289185, "epoch": 0.11877201811776547, "kl_loss": 0.37930434942245483, "loss_ib": 0.00503533473238349, "step": 413 }, { "ce_ib": 11.024622917175293, "ce_orig": 0.8313679099082947, "epoch": 0.11877201811776547, "kl_loss": 0.18216568231582642, "loss_ib": 0.002924119122326374, "step": 413 }, { "ce_ib": 12.971683502197266, "ce_orig": 0.9980677366256714, "epoch": 0.11877201811776547, "kl_loss": 0.28354763984680176, "loss_ib": 0.004132644273340702, "step": 413 }, { "ce_ib": 10.75366497039795, "ce_orig": 1.0008810758590698, "epoch": 0.11905960169674312, "kl_loss": 0.21501143276691437, "loss_ib": 0.00322548090480268, "step": 414 }, { "ce_ib": 15.019447326660156, "ce_orig": 1.0870994329452515, "epoch": 0.11905960169674312, "kl_loss": 0.18550065159797668, "loss_ib": 0.003356951056048274, "step": 414 }, { "ce_ib": 13.59741497039795, "ce_orig": 1.1491084098815918, "epoch": 0.11905960169674312, "kl_loss": 0.31042391061782837, "loss_ib": 0.004463980905711651, "step": 414 }, { "ce_ib": 11.30091667175293, "ce_orig": 0.7725252509117126, "epoch": 0.11905960169674312, "kl_loss": 0.19686946272850037, "loss_ib": 0.003098786110058427, "step": 414 }, { "epoch": 0.11934718527572076, "grad_norm": 0.0853128507733345, "learning_rate": 4.998912912587444e-05, "loss": 0.8496, "step": 415 }, { "ce_ib": 10.824992179870605, "ce_orig": 1.003801703453064, "epoch": 0.11934718527572076, "kl_loss": 0.11075378954410553, "loss_ib": 0.0021900369320064783, "step": 415 }, { "ce_ib": 14.990334510803223, "ce_orig": 1.1157439947128296, "epoch": 0.11934718527572076, "kl_loss": 0.18331551551818848, "loss_ib": 0.0033321885857731104, "step": 415 }, { "ce_ib": 10.030242919921875, "ce_orig": 0.7444831728935242, "epoch": 0.11934718527572076, "kl_loss": 0.2142019271850586, "loss_ib": 0.0031450435053557158, "step": 415 }, { "ce_ib": 7.975912570953369, "ce_orig": 0.713485062122345, "epoch": 0.11934718527572076, "kl_loss": 0.20920607447624207, "loss_ib": 0.00288965180516243, "step": 415 }, { "ce_ib": 12.238396644592285, "ce_orig": 1.1776320934295654, "epoch": 0.1196347688546984, "kl_loss": 0.21955502033233643, "loss_ib": 0.0034193897154182196, "step": 416 }, { "ce_ib": 13.989873886108398, "ce_orig": 1.128517746925354, "epoch": 0.1196347688546984, "kl_loss": 0.2628554701805115, "loss_ib": 0.0040275417268276215, "step": 416 }, { "ce_ib": 15.87778091430664, "ce_orig": 1.3535970449447632, "epoch": 0.1196347688546984, "kl_loss": 0.197160542011261, "loss_ib": 0.0035593833308666945, "step": 416 }, { "ce_ib": 8.849984169006348, "ce_orig": 0.872184157371521, "epoch": 0.1196347688546984, "kl_loss": 0.1935926228761673, "loss_ib": 0.0028209243901073933, "step": 416 }, { "ce_ib": 9.946513175964355, "ce_orig": 0.5356448292732239, "epoch": 0.11992235243367604, "kl_loss": 0.2691783308982849, "loss_ib": 0.0036864345893263817, "step": 417 }, { "ce_ib": 13.770381927490234, "ce_orig": 1.427547812461853, "epoch": 0.11992235243367604, "kl_loss": 0.1527450531721115, "loss_ib": 0.002904488705098629, "step": 417 }, { "ce_ib": 12.310346603393555, "ce_orig": 1.485551118850708, "epoch": 0.11992235243367604, "kl_loss": 0.1050770953297615, "loss_ib": 0.0022818055003881454, "step": 417 }, { "ce_ib": 14.205962181091309, "ce_orig": 1.5815967321395874, "epoch": 0.11992235243367604, "kl_loss": 0.26177799701690674, "loss_ib": 0.004038376267999411, "step": 417 }, { "ce_ib": 9.17827320098877, "ce_orig": 0.5437095165252686, "epoch": 0.12020993601265367, "kl_loss": 0.17721109092235565, "loss_ib": 0.0026899382937699556, "step": 418 }, { "ce_ib": 15.857308387756348, "ce_orig": 0.8890218138694763, "epoch": 0.12020993601265367, "kl_loss": 0.35342293977737427, "loss_ib": 0.0051199602894485, "step": 418 }, { "ce_ib": 12.519335746765137, "ce_orig": 0.40189069509506226, "epoch": 0.12020993601265367, "kl_loss": 0.19997818768024445, "loss_ib": 0.0032517153304070234, "step": 418 }, { "ce_ib": 10.383864402770996, "ce_orig": 0.9198765754699707, "epoch": 0.12020993601265367, "kl_loss": 0.1422748863697052, "loss_ib": 0.0024611353874206543, "step": 418 }, { "ce_ib": 4.41956090927124, "ce_orig": 0.15882746875286102, "epoch": 0.12049751959163132, "kl_loss": 0.42377138137817383, "loss_ib": 0.004679669626057148, "step": 419 }, { "ce_ib": 8.898272514343262, "ce_orig": 0.6479420065879822, "epoch": 0.12049751959163132, "kl_loss": 0.14590340852737427, "loss_ib": 0.002348861424252391, "step": 419 }, { "ce_ib": 11.02161693572998, "ce_orig": 0.6498445272445679, "epoch": 0.12049751959163132, "kl_loss": 0.18951579928398132, "loss_ib": 0.0029973196797072887, "step": 419 }, { "ce_ib": 13.597489356994629, "ce_orig": 1.474985122680664, "epoch": 0.12049751959163132, "kl_loss": 0.2165094017982483, "loss_ib": 0.0035248426720499992, "step": 419 }, { "epoch": 0.12078510317060896, "grad_norm": 0.09395145624876022, "learning_rate": 4.998795480442595e-05, "loss": 0.919, "step": 420 }, { "ce_ib": 13.930419921875, "ce_orig": 1.4253751039505005, "epoch": 0.12078510317060896, "kl_loss": 0.25621849298477173, "loss_ib": 0.003955226857215166, "step": 420 }, { "ce_ib": 13.867815017700195, "ce_orig": 1.0413322448730469, "epoch": 0.12078510317060896, "kl_loss": 0.1656143069267273, "loss_ib": 0.003042924450710416, "step": 420 }, { "ce_ib": 9.55808162689209, "ce_orig": 0.8998080492019653, "epoch": 0.12078510317060896, "kl_loss": 0.2003626972436905, "loss_ib": 0.002959434874355793, "step": 420 }, { "ce_ib": 6.539864540100098, "ce_orig": 0.4415733814239502, "epoch": 0.12078510317060896, "kl_loss": 0.16704899072647095, "loss_ib": 0.0023244761396199465, "step": 420 }, { "ce_ib": 13.084672927856445, "ce_orig": 0.9477989077568054, "epoch": 0.1210726867495866, "kl_loss": 0.1585165113210678, "loss_ib": 0.0028936322778463364, "step": 421 }, { "ce_ib": 10.002495765686035, "ce_orig": 0.7920336127281189, "epoch": 0.1210726867495866, "kl_loss": 0.23921585083007812, "loss_ib": 0.0033924079034477472, "step": 421 }, { "ce_ib": 9.44317626953125, "ce_orig": 0.7052544355392456, "epoch": 0.1210726867495866, "kl_loss": 0.1775376945734024, "loss_ib": 0.002719694282859564, "step": 421 }, { "ce_ib": 6.67018985748291, "ce_orig": 0.35514646768569946, "epoch": 0.1210726867495866, "kl_loss": 0.27639925479888916, "loss_ib": 0.0034310114569962025, "step": 421 }, { "ce_ib": 9.008115768432617, "ce_orig": 1.0835165977478027, "epoch": 0.12136027032856424, "kl_loss": 0.1306457817554474, "loss_ib": 0.002207269426435232, "step": 422 }, { "ce_ib": 9.596372604370117, "ce_orig": 0.6315584182739258, "epoch": 0.12136027032856424, "kl_loss": 0.16708403825759888, "loss_ib": 0.002630477538332343, "step": 422 }, { "ce_ib": 10.36826229095459, "ce_orig": 0.8352252840995789, "epoch": 0.12136027032856424, "kl_loss": 0.4174191355705261, "loss_ib": 0.005211017560213804, "step": 422 }, { "ce_ib": 6.275569438934326, "ce_orig": 0.6971433758735657, "epoch": 0.12136027032856424, "kl_loss": 0.10864199697971344, "loss_ib": 0.001713976846076548, "step": 422 }, { "ce_ib": 11.055356979370117, "ce_orig": 0.711353600025177, "epoch": 0.12164785390754188, "kl_loss": 0.223836749792099, "loss_ib": 0.0033439029939472675, "step": 423 }, { "ce_ib": 12.989297866821289, "ce_orig": 0.8257631063461304, "epoch": 0.12164785390754188, "kl_loss": 0.21258409321308136, "loss_ib": 0.003424770664423704, "step": 423 }, { "ce_ib": 7.487967014312744, "ce_orig": 0.5072060227394104, "epoch": 0.12164785390754188, "kl_loss": 0.15735791623592377, "loss_ib": 0.002322375774383545, "step": 423 }, { "ce_ib": 13.437426567077637, "ce_orig": 0.9563009142875671, "epoch": 0.12164785390754188, "kl_loss": 0.1478041410446167, "loss_ib": 0.0028217840008437634, "step": 423 }, { "ce_ib": 12.20171070098877, "ce_orig": 0.7322474718093872, "epoch": 0.12193543748651951, "kl_loss": 0.2593429684638977, "loss_ib": 0.003813600866124034, "step": 424 }, { "ce_ib": 10.579559326171875, "ce_orig": 0.5674452781677246, "epoch": 0.12193543748651951, "kl_loss": 0.24632222950458527, "loss_ib": 0.0035211783833801746, "step": 424 }, { "ce_ib": 12.876055717468262, "ce_orig": 1.14524245262146, "epoch": 0.12193543748651951, "kl_loss": 0.21795441210269928, "loss_ib": 0.003467149566859007, "step": 424 }, { "ce_ib": 8.761207580566406, "ce_orig": 0.9090970754623413, "epoch": 0.12193543748651951, "kl_loss": 0.15418817102909088, "loss_ib": 0.0024180023465305567, "step": 424 }, { "epoch": 0.12222302106549716, "grad_norm": 0.07512833178043365, "learning_rate": 4.9986720281194496e-05, "loss": 0.8761, "step": 425 }, { "ce_ib": 7.6993608474731445, "ce_orig": 0.40163472294807434, "epoch": 0.12222302106549716, "kl_loss": 0.20606671273708344, "loss_ib": 0.0028306031599640846, "step": 425 }, { "ce_ib": 10.682936668395996, "ce_orig": 0.752029538154602, "epoch": 0.12222302106549716, "kl_loss": 0.17551946640014648, "loss_ib": 0.0028234883211553097, "step": 425 }, { "ce_ib": 10.21149730682373, "ce_orig": 0.8434242010116577, "epoch": 0.12222302106549716, "kl_loss": 0.19770103693008423, "loss_ib": 0.0029981599655002356, "step": 425 }, { "ce_ib": 9.649618148803711, "ce_orig": 0.6008751392364502, "epoch": 0.12222302106549716, "kl_loss": 0.2020394206047058, "loss_ib": 0.0029853556770831347, "step": 425 }, { "ce_ib": 11.479440689086914, "ce_orig": 0.9273905158042908, "epoch": 0.1225106046444748, "kl_loss": 0.15146127343177795, "loss_ib": 0.0026625567115843296, "step": 426 }, { "ce_ib": 7.9811859130859375, "ce_orig": 0.25573351979255676, "epoch": 0.1225106046444748, "kl_loss": 0.23791244626045227, "loss_ib": 0.0031772428192198277, "step": 426 }, { "ce_ib": 10.76065444946289, "ce_orig": 0.8275227546691895, "epoch": 0.1225106046444748, "kl_loss": 0.2022540271282196, "loss_ib": 0.0030986058991402388, "step": 426 }, { "ce_ib": 10.59325885772705, "ce_orig": 0.6065911650657654, "epoch": 0.1225106046444748, "kl_loss": 0.2510051429271698, "loss_ib": 0.003569377353414893, "step": 426 }, { "ce_ib": 9.989922523498535, "ce_orig": 0.6457223296165466, "epoch": 0.12279818822345244, "kl_loss": 0.41983091831207275, "loss_ib": 0.005197301506996155, "step": 427 }, { "ce_ib": 14.872665405273438, "ce_orig": 1.3183645009994507, "epoch": 0.12279818822345244, "kl_loss": 0.25291332602500916, "loss_ib": 0.004016399849206209, "step": 427 }, { "ce_ib": 14.173356056213379, "ce_orig": 0.860676646232605, "epoch": 0.12279818822345244, "kl_loss": 0.22176355123519897, "loss_ib": 0.0036349711008369923, "step": 427 }, { "ce_ib": 12.447295188903809, "ce_orig": 1.0465346574783325, "epoch": 0.12279818822345244, "kl_loss": 0.15125788748264313, "loss_ib": 0.00275730830617249, "step": 427 }, { "ce_ib": 11.742615699768066, "ce_orig": 0.8324576616287231, "epoch": 0.12308577180243008, "kl_loss": 0.26873379945755005, "loss_ib": 0.0038615993689745665, "step": 428 }, { "ce_ib": 15.946845054626465, "ce_orig": 1.4635050296783447, "epoch": 0.12308577180243008, "kl_loss": 0.3334965407848358, "loss_ib": 0.004929649643599987, "step": 428 }, { "ce_ib": 11.777470588684082, "ce_orig": 0.8487641215324402, "epoch": 0.12308577180243008, "kl_loss": 0.18009008467197418, "loss_ib": 0.0029786478262394667, "step": 428 }, { "ce_ib": 15.157903671264648, "ce_orig": 1.4350470304489136, "epoch": 0.12308577180243008, "kl_loss": 0.16165342926979065, "loss_ib": 0.003132324665784836, "step": 428 }, { "ce_ib": 6.574849605560303, "ce_orig": 0.35640019178390503, "epoch": 0.12337335538140771, "kl_loss": 0.16976439952850342, "loss_ib": 0.0023551289923489094, "step": 429 }, { "ce_ib": 11.606804847717285, "ce_orig": 0.7963778972625732, "epoch": 0.12337335538140771, "kl_loss": 0.17389288544654846, "loss_ib": 0.002899609040468931, "step": 429 }, { "ce_ib": 11.487293243408203, "ce_orig": 1.072171926498413, "epoch": 0.12337335538140771, "kl_loss": 0.19142760336399078, "loss_ib": 0.0030630051624029875, "step": 429 }, { "ce_ib": 7.667901992797852, "ce_orig": 0.5443602204322815, "epoch": 0.12337335538140771, "kl_loss": 0.1836308240890503, "loss_ib": 0.0026030982844531536, "step": 429 }, { "epoch": 0.12366093896038537, "grad_norm": 0.08391211926937103, "learning_rate": 4.998542555915435e-05, "loss": 0.9167, "step": 430 }, { "ce_ib": 11.157709121704102, "ce_orig": 0.8726559281349182, "epoch": 0.12366093896038537, "kl_loss": 0.19528821110725403, "loss_ib": 0.0030686529353260994, "step": 430 }, { "ce_ib": 12.455047607421875, "ce_orig": 1.3305251598358154, "epoch": 0.12366093896038537, "kl_loss": 0.11633329838514328, "loss_ib": 0.002408837666735053, "step": 430 }, { "ce_ib": 17.702678680419922, "ce_orig": 1.9683383703231812, "epoch": 0.12366093896038537, "kl_loss": 0.21032744646072388, "loss_ib": 0.003873542184010148, "step": 430 }, { "ce_ib": 11.364348411560059, "ce_orig": 1.2615947723388672, "epoch": 0.12366093896038537, "kl_loss": 0.15659835934638977, "loss_ib": 0.0027024184819310904, "step": 430 }, { "ce_ib": 10.107429504394531, "ce_orig": 0.8148799538612366, "epoch": 0.123948522539363, "kl_loss": 0.13077875971794128, "loss_ib": 0.0023185305763036013, "step": 431 }, { "ce_ib": 11.587873458862305, "ce_orig": 1.074462890625, "epoch": 0.123948522539363, "kl_loss": 0.24695566296577454, "loss_ib": 0.0036283438093960285, "step": 431 }, { "ce_ib": 10.614514350891113, "ce_orig": 0.9438521862030029, "epoch": 0.123948522539363, "kl_loss": 0.2546341121196747, "loss_ib": 0.0036077925469726324, "step": 431 }, { "ce_ib": 10.189565658569336, "ce_orig": 0.468057245016098, "epoch": 0.123948522539363, "kl_loss": 0.21918027102947235, "loss_ib": 0.003210759023204446, "step": 431 }, { "ce_ib": 16.234272003173828, "ce_orig": 1.4394607543945312, "epoch": 0.12423610611834064, "kl_loss": 0.16391563415527344, "loss_ib": 0.0032625836320221424, "step": 432 }, { "ce_ib": 13.389922142028809, "ce_orig": 1.0571950674057007, "epoch": 0.12423610611834064, "kl_loss": 0.25300243496894836, "loss_ib": 0.003869016421958804, "step": 432 }, { "ce_ib": 11.05131721496582, "ce_orig": 0.8905650973320007, "epoch": 0.12423610611834064, "kl_loss": 0.1906907856464386, "loss_ib": 0.0030120396986603737, "step": 432 }, { "ce_ib": 8.993093490600586, "ce_orig": 0.7904607653617859, "epoch": 0.12423610611834064, "kl_loss": 0.18500834703445435, "loss_ib": 0.002749392529949546, "step": 432 }, { "ce_ib": 13.643828392028809, "ce_orig": 0.8764438629150391, "epoch": 0.12452368969731828, "kl_loss": 0.25997138023376465, "loss_ib": 0.003964096307754517, "step": 433 }, { "ce_ib": 6.452097415924072, "ce_orig": 0.5795682072639465, "epoch": 0.12452368969731828, "kl_loss": 0.1325344741344452, "loss_ib": 0.001970554469153285, "step": 433 }, { "ce_ib": 10.294032096862793, "ce_orig": 0.34366491436958313, "epoch": 0.12452368969731828, "kl_loss": 0.12770652770996094, "loss_ib": 0.0023064683191478252, "step": 433 }, { "ce_ib": 8.313075065612793, "ce_orig": 0.6022379398345947, "epoch": 0.12452368969731828, "kl_loss": 0.11339238286018372, "loss_ib": 0.0019652312621474266, "step": 433 }, { "ce_ib": 14.330761909484863, "ce_orig": 0.8713304996490479, "epoch": 0.12481127327629592, "kl_loss": 0.22767247259616852, "loss_ib": 0.003709800774231553, "step": 434 }, { "ce_ib": 9.519655227661133, "ce_orig": 0.5508330464363098, "epoch": 0.12481127327629592, "kl_loss": 0.1265774965286255, "loss_ib": 0.002217740286141634, "step": 434 }, { "ce_ib": 12.286112785339355, "ce_orig": 0.8811700344085693, "epoch": 0.12481127327629592, "kl_loss": 0.17079584300518036, "loss_ib": 0.0029365697409957647, "step": 434 }, { "ce_ib": 8.997398376464844, "ce_orig": 0.48554953932762146, "epoch": 0.12481127327629592, "kl_loss": 0.13161113858222961, "loss_ib": 0.0022158510982990265, "step": 434 }, { "epoch": 0.12509885685527355, "grad_norm": 0.08008844405412674, "learning_rate": 4.99840706414248e-05, "loss": 0.8499, "step": 435 }, { "ce_ib": 12.028959274291992, "ce_orig": 0.7656774520874023, "epoch": 0.12509885685527355, "kl_loss": 0.18438570201396942, "loss_ib": 0.0030467526521533728, "step": 435 }, { "ce_ib": 9.531744003295898, "ce_orig": 0.7000839710235596, "epoch": 0.12509885685527355, "kl_loss": 0.1339460015296936, "loss_ib": 0.002292634453624487, "step": 435 }, { "ce_ib": 7.86661958694458, "ce_orig": 0.47849422693252563, "epoch": 0.12509885685527355, "kl_loss": 0.20920854806900024, "loss_ib": 0.0028787474147975445, "step": 435 }, { "ce_ib": 10.296324729919434, "ce_orig": 1.1329785585403442, "epoch": 0.12509885685527355, "kl_loss": 0.17465677857398987, "loss_ib": 0.002776200184598565, "step": 435 }, { "ce_ib": 8.947026252746582, "ce_orig": 0.9858295321464539, "epoch": 0.1253864404342512, "kl_loss": 0.22594591975212097, "loss_ib": 0.0031541618518531322, "step": 436 }, { "ce_ib": 10.008584022521973, "ce_orig": 0.7601190805435181, "epoch": 0.1253864404342512, "kl_loss": 0.18392398953437805, "loss_ib": 0.0028400979936122894, "step": 436 }, { "ce_ib": 18.1694393157959, "ce_orig": 1.7608329057693481, "epoch": 0.1253864404342512, "kl_loss": 0.3656727969646454, "loss_ib": 0.005473671946674585, "step": 436 }, { "ce_ib": 10.617599487304688, "ce_orig": 0.7405425906181335, "epoch": 0.1253864404342512, "kl_loss": 0.23880283534526825, "loss_ib": 0.003449788084253669, "step": 436 }, { "ce_ib": 7.292166233062744, "ce_orig": 0.321105033159256, "epoch": 0.12567402401322886, "kl_loss": 0.573823094367981, "loss_ib": 0.006467447150498629, "step": 437 }, { "ce_ib": 12.345170021057129, "ce_orig": 1.1237767934799194, "epoch": 0.12567402401322886, "kl_loss": 0.12964360415935516, "loss_ib": 0.0025309529155492783, "step": 437 }, { "ce_ib": 9.116506576538086, "ce_orig": 0.351901113986969, "epoch": 0.12567402401322886, "kl_loss": 0.1449497938156128, "loss_ib": 0.0023611485958099365, "step": 437 }, { "ce_ib": 9.928841590881348, "ce_orig": 0.5612432956695557, "epoch": 0.12567402401322886, "kl_loss": 0.17729271948337555, "loss_ib": 0.0027658112812787294, "step": 437 }, { "ce_ib": 8.56289005279541, "ce_orig": 0.5716758966445923, "epoch": 0.12596160759220648, "kl_loss": 0.1342535763978958, "loss_ib": 0.0021988246589899063, "step": 438 }, { "ce_ib": 13.346972465515137, "ce_orig": 0.7096478939056396, "epoch": 0.12596160759220648, "kl_loss": 0.1945207715034485, "loss_ib": 0.0032799046020954847, "step": 438 }, { "ce_ib": 5.58247709274292, "ce_orig": 0.38993921875953674, "epoch": 0.12596160759220648, "kl_loss": 0.3592712879180908, "loss_ib": 0.004150960128754377, "step": 438 }, { "ce_ib": 10.52940845489502, "ce_orig": 0.3933676481246948, "epoch": 0.12596160759220648, "kl_loss": 0.13906532526016235, "loss_ib": 0.0024435939267277718, "step": 438 }, { "ce_ib": 10.115212440490723, "ce_orig": 0.6660525798797607, "epoch": 0.12624919117118413, "kl_loss": 0.28316277265548706, "loss_ib": 0.003843148937448859, "step": 439 }, { "ce_ib": 11.30185317993164, "ce_orig": 0.8098467588424683, "epoch": 0.12624919117118413, "kl_loss": 0.16112932562828064, "loss_ib": 0.002741478616371751, "step": 439 }, { "ce_ib": 7.795021057128906, "ce_orig": 0.6182560324668884, "epoch": 0.12624919117118413, "kl_loss": 0.3065950274467468, "loss_ib": 0.003845452331006527, "step": 439 }, { "ce_ib": 13.468255996704102, "ce_orig": 0.9566720128059387, "epoch": 0.12624919117118413, "kl_loss": 0.2001672387123108, "loss_ib": 0.003348497673869133, "step": 439 }, { "epoch": 0.12653677475016176, "grad_norm": 0.08590603619813919, "learning_rate": 4.998265553127013e-05, "loss": 0.8382, "step": 440 }, { "ce_ib": 11.135417938232422, "ce_orig": 0.9260854125022888, "epoch": 0.12653677475016176, "kl_loss": 0.15384265780448914, "loss_ib": 0.0026519682724028826, "step": 440 }, { "ce_ib": 11.6417818069458, "ce_orig": 0.7246519923210144, "epoch": 0.12653677475016176, "kl_loss": 0.18312156200408936, "loss_ib": 0.002995393704622984, "step": 440 }, { "ce_ib": 11.070989608764648, "ce_orig": 1.1319186687469482, "epoch": 0.12653677475016176, "kl_loss": 0.18624573945999146, "loss_ib": 0.002969556488096714, "step": 440 }, { "ce_ib": 15.00080394744873, "ce_orig": 1.5474122762680054, "epoch": 0.12653677475016176, "kl_loss": 0.17769742012023926, "loss_ib": 0.003277054289355874, "step": 440 }, { "ce_ib": 12.565924644470215, "ce_orig": 0.9930309057235718, "epoch": 0.1268243583291394, "kl_loss": 0.22812071442604065, "loss_ib": 0.003537799697369337, "step": 441 }, { "ce_ib": 8.496469497680664, "ce_orig": 0.7013565301895142, "epoch": 0.1268243583291394, "kl_loss": 0.1900731325149536, "loss_ib": 0.0027503781020641327, "step": 441 }, { "ce_ib": 9.66351318359375, "ce_orig": 0.984688401222229, "epoch": 0.1268243583291394, "kl_loss": 0.11712448298931122, "loss_ib": 0.00213759602047503, "step": 441 }, { "ce_ib": 11.531122207641602, "ce_orig": 0.8578464388847351, "epoch": 0.1268243583291394, "kl_loss": 0.22207866609096527, "loss_ib": 0.003373898798599839, "step": 441 }, { "ce_ib": 11.552083015441895, "ce_orig": 1.012474775314331, "epoch": 0.12711194190811706, "kl_loss": 0.19562029838562012, "loss_ib": 0.003111411351710558, "step": 442 }, { "ce_ib": 8.36318588256836, "ce_orig": 0.7492285966873169, "epoch": 0.12711194190811706, "kl_loss": 0.16260814666748047, "loss_ib": 0.0024623998906463385, "step": 442 }, { "ce_ib": 9.527094841003418, "ce_orig": 0.7202103137969971, "epoch": 0.12711194190811706, "kl_loss": 0.128434419631958, "loss_ib": 0.0022370535880327225, "step": 442 }, { "ce_ib": 11.373018264770508, "ce_orig": 0.8286006450653076, "epoch": 0.12711194190811706, "kl_loss": 0.22360824048519135, "loss_ib": 0.0033733840100467205, "step": 442 }, { "ce_ib": 12.500737190246582, "ce_orig": 1.1852082014083862, "epoch": 0.12739952548709468, "kl_loss": 0.17222145199775696, "loss_ib": 0.0029722880572080612, "step": 443 }, { "ce_ib": 14.716822624206543, "ce_orig": 1.8037943840026855, "epoch": 0.12739952548709468, "kl_loss": 0.22250494360923767, "loss_ib": 0.003696731524541974, "step": 443 }, { "ce_ib": 13.993595123291016, "ce_orig": 1.002560019493103, "epoch": 0.12739952548709468, "kl_loss": 0.1844272017478943, "loss_ib": 0.0032436316832900047, "step": 443 }, { "ce_ib": 9.316429138183594, "ce_orig": 0.4433915317058563, "epoch": 0.12739952548709468, "kl_loss": 0.3312546908855438, "loss_ib": 0.0042441897094249725, "step": 443 }, { "ce_ib": 10.669767379760742, "ce_orig": 0.8024405837059021, "epoch": 0.12768710906607234, "kl_loss": 0.18377812206745148, "loss_ib": 0.002904757857322693, "step": 444 }, { "ce_ib": 8.749341011047363, "ce_orig": 0.44320985674858093, "epoch": 0.12768710906607234, "kl_loss": 0.2103624790906906, "loss_ib": 0.002978558884933591, "step": 444 }, { "ce_ib": 6.491762161254883, "ce_orig": 0.7110791802406311, "epoch": 0.12768710906607234, "kl_loss": 0.12732303142547607, "loss_ib": 0.0019224064890295267, "step": 444 }, { "ce_ib": 14.327024459838867, "ce_orig": 1.2938189506530762, "epoch": 0.12768710906607234, "kl_loss": 0.1754641830921173, "loss_ib": 0.003187343943864107, "step": 444 }, { "epoch": 0.12797469264504996, "grad_norm": 0.07503530383110046, "learning_rate": 4.99811802320997e-05, "loss": 0.8966, "step": 445 }, { "ce_ib": 12.345433235168457, "ce_orig": 0.8386138677597046, "epoch": 0.12797469264504996, "kl_loss": 0.31317782402038574, "loss_ib": 0.004366321489214897, "step": 445 }, { "ce_ib": 11.949541091918945, "ce_orig": 0.5236607193946838, "epoch": 0.12797469264504996, "kl_loss": 0.19711901247501373, "loss_ib": 0.0031661440152674913, "step": 445 }, { "ce_ib": 10.233663558959961, "ce_orig": 0.6846522688865662, "epoch": 0.12797469264504996, "kl_loss": 0.16328191757202148, "loss_ib": 0.002656185533851385, "step": 445 }, { "ce_ib": 8.310503959655762, "ce_orig": 0.7847996950149536, "epoch": 0.12797469264504996, "kl_loss": 0.137738898396492, "loss_ib": 0.002208439400419593, "step": 445 }, { "ce_ib": 6.889098167419434, "ce_orig": 0.5118075609207153, "epoch": 0.1282622762240276, "kl_loss": 0.16013775765895844, "loss_ib": 0.0022902872879058123, "step": 446 }, { "ce_ib": 14.948297500610352, "ce_orig": 1.007593035697937, "epoch": 0.1282622762240276, "kl_loss": 0.17850220203399658, "loss_ib": 0.0032798515167087317, "step": 446 }, { "ce_ib": 10.017216682434082, "ce_orig": 1.0469541549682617, "epoch": 0.1282622762240276, "kl_loss": 0.15087240934371948, "loss_ib": 0.0025104456581175327, "step": 446 }, { "ce_ib": 9.104086875915527, "ce_orig": 0.5955268144607544, "epoch": 0.1282622762240276, "kl_loss": 0.2088235318660736, "loss_ib": 0.002998644020408392, "step": 446 }, { "ce_ib": 7.966549396514893, "ce_orig": 0.7193945646286011, "epoch": 0.12854985980300526, "kl_loss": 0.17041301727294922, "loss_ib": 0.0025007850490510464, "step": 447 }, { "ce_ib": 12.620382308959961, "ce_orig": 0.6646131873130798, "epoch": 0.12854985980300526, "kl_loss": 0.21500855684280396, "loss_ib": 0.0034121237695217133, "step": 447 }, { "ce_ib": 5.8810319900512695, "ce_orig": 0.6042389869689941, "epoch": 0.12854985980300526, "kl_loss": 0.16328245401382446, "loss_ib": 0.0022209277376532555, "step": 447 }, { "ce_ib": 13.061161994934082, "ce_orig": 0.9521631598472595, "epoch": 0.12854985980300526, "kl_loss": 0.17168429493904114, "loss_ib": 0.0030229592230170965, "step": 447 }, { "ce_ib": 8.089184761047363, "ce_orig": 0.7481786608695984, "epoch": 0.12883744338198289, "kl_loss": 0.15286147594451904, "loss_ib": 0.0023375332821160555, "step": 448 }, { "ce_ib": 7.247897624969482, "ce_orig": 0.7153653502464294, "epoch": 0.12883744338198289, "kl_loss": 0.16917859017848969, "loss_ib": 0.0024165755603462458, "step": 448 }, { "ce_ib": 9.982969284057617, "ce_orig": 0.8300044536590576, "epoch": 0.12883744338198289, "kl_loss": 0.1288834512233734, "loss_ib": 0.002287131268531084, "step": 448 }, { "ce_ib": 12.154969215393066, "ce_orig": 0.8374365568161011, "epoch": 0.12883744338198289, "kl_loss": 0.2313854843378067, "loss_ib": 0.003529351670295, "step": 448 }, { "ce_ib": 7.137256622314453, "ce_orig": 0.24174675345420837, "epoch": 0.12912502696096054, "kl_loss": 0.4337605834007263, "loss_ib": 0.005051331594586372, "step": 449 }, { "ce_ib": 13.23520565032959, "ce_orig": 0.9527087807655334, "epoch": 0.12912502696096054, "kl_loss": 0.14814800024032593, "loss_ib": 0.002805000403895974, "step": 449 }, { "ce_ib": 9.36728572845459, "ce_orig": 0.4500534236431122, "epoch": 0.12912502696096054, "kl_loss": 0.12568199634552002, "loss_ib": 0.002193548483774066, "step": 449 }, { "ce_ib": 8.504453659057617, "ce_orig": 0.9163048267364502, "epoch": 0.12912502696096054, "kl_loss": 0.15279194712638855, "loss_ib": 0.0023783647920936346, "step": 449 }, { "epoch": 0.12941261053993816, "grad_norm": 0.09120236337184906, "learning_rate": 4.9979644747467835e-05, "loss": 0.8569, "step": 450 }, { "ce_ib": 12.404295921325684, "ce_orig": 0.7500115036964417, "epoch": 0.12941261053993816, "kl_loss": 0.18148070573806763, "loss_ib": 0.0030552365351468325, "step": 450 }, { "ce_ib": 9.151787757873535, "ce_orig": 0.4986724555492401, "epoch": 0.12941261053993816, "kl_loss": 0.1752292811870575, "loss_ib": 0.0026674713008105755, "step": 450 }, { "ce_ib": 8.871505737304688, "ce_orig": 0.6981923580169678, "epoch": 0.12941261053993816, "kl_loss": 0.14069266617298126, "loss_ib": 0.00229407730512321, "step": 450 }, { "ce_ib": 8.211197853088379, "ce_orig": 0.7622634172439575, "epoch": 0.12941261053993816, "kl_loss": 0.13836929202079773, "loss_ib": 0.00220481283031404, "step": 450 }, { "ce_ib": 7.645545482635498, "ce_orig": 0.5680274963378906, "epoch": 0.1297001941189158, "kl_loss": 0.18493801355361938, "loss_ib": 0.0026139344554394484, "step": 451 }, { "ce_ib": 9.379469871520996, "ce_orig": 0.5945746302604675, "epoch": 0.1297001941189158, "kl_loss": 0.15481063723564148, "loss_ib": 0.0024860533885657787, "step": 451 }, { "ce_ib": 13.473487854003906, "ce_orig": 0.9739643931388855, "epoch": 0.1297001941189158, "kl_loss": 0.2487793266773224, "loss_ib": 0.0038351418916136026, "step": 451 }, { "ce_ib": 9.095867156982422, "ce_orig": 0.7306302785873413, "epoch": 0.1297001941189158, "kl_loss": 0.1404043734073639, "loss_ib": 0.002313630422577262, "step": 451 }, { "ce_ib": 8.908297538757324, "ce_orig": 0.548682451248169, "epoch": 0.12998777769789346, "kl_loss": 0.18304413557052612, "loss_ib": 0.002721270779147744, "step": 452 }, { "ce_ib": 12.341330528259277, "ce_orig": 1.0068693161010742, "epoch": 0.12998777769789346, "kl_loss": 0.21775811910629272, "loss_ib": 0.0034117139875888824, "step": 452 }, { "ce_ib": 7.933249473571777, "ce_orig": 0.6957258582115173, "epoch": 0.12998777769789346, "kl_loss": 0.12882256507873535, "loss_ib": 0.002081550657749176, "step": 452 }, { "ce_ib": 11.709693908691406, "ce_orig": 0.7259184718132019, "epoch": 0.12998777769789346, "kl_loss": 0.20683181285858154, "loss_ib": 0.003239287296310067, "step": 452 }, { "ce_ib": 9.15219783782959, "ce_orig": 0.521969199180603, "epoch": 0.1302753612768711, "kl_loss": 0.16149017214775085, "loss_ib": 0.0025301214773207903, "step": 453 }, { "ce_ib": 10.897204399108887, "ce_orig": 0.9679385423660278, "epoch": 0.1302753612768711, "kl_loss": 0.1327183097600937, "loss_ib": 0.0024169033858925104, "step": 453 }, { "ce_ib": 11.597270965576172, "ce_orig": 0.9538221955299377, "epoch": 0.1302753612768711, "kl_loss": 0.13329055905342102, "loss_ib": 0.002492632484063506, "step": 453 }, { "ce_ib": 14.650552749633789, "ce_orig": 0.9307949542999268, "epoch": 0.1302753612768711, "kl_loss": 0.3576693534851074, "loss_ib": 0.005041748750954866, "step": 453 }, { "ce_ib": 9.383811950683594, "ce_orig": 0.7557501196861267, "epoch": 0.13056294485584874, "kl_loss": 0.1699744164943695, "loss_ib": 0.0026381253264844418, "step": 454 }, { "ce_ib": 16.616901397705078, "ce_orig": 1.1251425743103027, "epoch": 0.13056294485584874, "kl_loss": 0.260105699300766, "loss_ib": 0.0042627472430467606, "step": 454 }, { "ce_ib": 9.158967018127441, "ce_orig": 0.602447509765625, "epoch": 0.13056294485584874, "kl_loss": 0.12641242146492004, "loss_ib": 0.0021800207905471325, "step": 454 }, { "ce_ib": 12.393420219421387, "ce_orig": 1.04123055934906, "epoch": 0.13056294485584874, "kl_loss": 0.21238833665847778, "loss_ib": 0.0033632253762334585, "step": 454 }, { "epoch": 0.13085052843482636, "grad_norm": 0.09227544069290161, "learning_rate": 4.997804908107387e-05, "loss": 0.8765, "step": 455 }, { "ce_ib": 9.478934288024902, "ce_orig": 0.8604238033294678, "epoch": 0.13085052843482636, "kl_loss": 0.09945785254240036, "loss_ib": 0.0019424718338996172, "step": 455 }, { "ce_ib": 7.167737007141113, "ce_orig": 0.7395135164260864, "epoch": 0.13085052843482636, "kl_loss": 0.18323373794555664, "loss_ib": 0.0025491111446172, "step": 455 }, { "ce_ib": 9.015175819396973, "ce_orig": 0.5233743786811829, "epoch": 0.13085052843482636, "kl_loss": 0.22085565328598022, "loss_ib": 0.00311007397249341, "step": 455 }, { "ce_ib": 16.64781951904297, "ce_orig": 1.744786024093628, "epoch": 0.13085052843482636, "kl_loss": 0.17802797257900238, "loss_ib": 0.0034450613893568516, "step": 455 }, { "ce_ib": 10.087674140930176, "ce_orig": 0.6486227512359619, "epoch": 0.13113811201380401, "kl_loss": 0.23665431141853333, "loss_ib": 0.0033753104507923126, "step": 456 }, { "ce_ib": 12.518637657165527, "ce_orig": 1.2168270349502563, "epoch": 0.13113811201380401, "kl_loss": 0.15110589563846588, "loss_ib": 0.002762922551482916, "step": 456 }, { "ce_ib": 13.409689903259277, "ce_orig": 1.1832727193832397, "epoch": 0.13113811201380401, "kl_loss": 0.14149300754070282, "loss_ib": 0.0027558987494558096, "step": 456 }, { "ce_ib": 7.571767807006836, "ce_orig": 0.4468522071838379, "epoch": 0.13113811201380401, "kl_loss": 0.2032560110092163, "loss_ib": 0.002789736958220601, "step": 456 }, { "ce_ib": 16.250171661376953, "ce_orig": 1.4707938432693481, "epoch": 0.13142569559278164, "kl_loss": 0.15541328489780426, "loss_ib": 0.0031791499350219965, "step": 457 }, { "ce_ib": 10.158995628356934, "ce_orig": 0.7189385890960693, "epoch": 0.13142569559278164, "kl_loss": 0.13689836859703064, "loss_ib": 0.0023848831187933683, "step": 457 }, { "ce_ib": 13.75023078918457, "ce_orig": 0.9671751856803894, "epoch": 0.13142569559278164, "kl_loss": 0.20036864280700684, "loss_ib": 0.0033787095453590155, "step": 457 }, { "ce_ib": 12.164261817932129, "ce_orig": 0.6848416328430176, "epoch": 0.13142569559278164, "kl_loss": 0.18254505097866058, "loss_ib": 0.0030418764799833298, "step": 457 }, { "ce_ib": 9.728108406066895, "ce_orig": 0.6200440526008606, "epoch": 0.1317132791717593, "kl_loss": 0.15019859373569489, "loss_ib": 0.002474796725437045, "step": 458 }, { "ce_ib": 13.638520240783691, "ce_orig": 1.041512370109558, "epoch": 0.1317132791717593, "kl_loss": 0.19027158617973328, "loss_ib": 0.0032665678299963474, "step": 458 }, { "ce_ib": 12.803059577941895, "ce_orig": 0.5324247479438782, "epoch": 0.1317132791717593, "kl_loss": 0.18024376034736633, "loss_ib": 0.003082743613049388, "step": 458 }, { "ce_ib": 10.689647674560547, "ce_orig": 0.8073751926422119, "epoch": 0.1317132791717593, "kl_loss": 0.12346737831830978, "loss_ib": 0.002303638495504856, "step": 458 }, { "ce_ib": 5.675622463226318, "ce_orig": 0.3405647575855255, "epoch": 0.13200086275073694, "kl_loss": 0.31278595328330994, "loss_ib": 0.0036954216193407774, "step": 459 }, { "ce_ib": 15.82054615020752, "ce_orig": 1.3749570846557617, "epoch": 0.13200086275073694, "kl_loss": 0.21644842624664307, "loss_ib": 0.00374653865583241, "step": 459 }, { "ce_ib": 10.457240104675293, "ce_orig": 0.5686371326446533, "epoch": 0.13200086275073694, "kl_loss": 0.19664248824119568, "loss_ib": 0.0030121486634016037, "step": 459 }, { "ce_ib": 9.230670928955078, "ce_orig": 0.669769823551178, "epoch": 0.13200086275073694, "kl_loss": 0.15697245299816132, "loss_ib": 0.0024927917402237654, "step": 459 }, { "epoch": 0.13228844632971457, "grad_norm": 0.08651373535394669, "learning_rate": 4.997639323676214e-05, "loss": 0.7999, "step": 460 }, { "ce_ib": 10.430649757385254, "ce_orig": 0.5384361147880554, "epoch": 0.13228844632971457, "kl_loss": 0.240619957447052, "loss_ib": 0.0034492644481360912, "step": 460 }, { "ce_ib": 11.414108276367188, "ce_orig": 0.2244451642036438, "epoch": 0.13228844632971457, "kl_loss": 0.333604633808136, "loss_ib": 0.004477457143366337, "step": 460 }, { "ce_ib": 8.57000732421875, "ce_orig": 0.6421215534210205, "epoch": 0.13228844632971457, "kl_loss": 0.11957961320877075, "loss_ib": 0.002052796771749854, "step": 460 }, { "ce_ib": 9.772636413574219, "ce_orig": 0.7227917909622192, "epoch": 0.13228844632971457, "kl_loss": 0.1671256273984909, "loss_ib": 0.002648519817739725, "step": 460 }, { "ce_ib": 6.091513156890869, "ce_orig": 0.5446451902389526, "epoch": 0.13257602990869222, "kl_loss": 0.15295615792274475, "loss_ib": 0.0021387129090726376, "step": 461 }, { "ce_ib": 10.357866287231445, "ce_orig": 0.7494820356369019, "epoch": 0.13257602990869222, "kl_loss": 0.16398490965366364, "loss_ib": 0.002675635740160942, "step": 461 }, { "ce_ib": 9.155532836914062, "ce_orig": 0.6777340173721313, "epoch": 0.13257602990869222, "kl_loss": 0.16127201914787292, "loss_ib": 0.0025282735005021095, "step": 461 }, { "ce_ib": 10.313591003417969, "ce_orig": 0.7135111689567566, "epoch": 0.13257602990869222, "kl_loss": 0.22754691541194916, "loss_ib": 0.0033068279735744, "step": 461 }, { "ce_ib": 8.072470664978027, "ce_orig": 0.6382450461387634, "epoch": 0.13286361348766984, "kl_loss": 0.12815770506858826, "loss_ib": 0.0020888240542262793, "step": 462 }, { "ce_ib": 11.419739723205566, "ce_orig": 1.4712454080581665, "epoch": 0.13286361348766984, "kl_loss": 0.15876120328903198, "loss_ib": 0.0027295860927551985, "step": 462 }, { "ce_ib": 11.649603843688965, "ce_orig": 0.5335864424705505, "epoch": 0.13286361348766984, "kl_loss": 0.23220552504062653, "loss_ib": 0.0034870156086981297, "step": 462 }, { "ce_ib": 13.856771469116211, "ce_orig": 1.503601312637329, "epoch": 0.13286361348766984, "kl_loss": 0.22454500198364258, "loss_ib": 0.003631127066910267, "step": 462 }, { "ce_ib": 11.232563018798828, "ce_orig": 0.8185619115829468, "epoch": 0.1331511970666475, "kl_loss": 0.14658993482589722, "loss_ib": 0.002589155687019229, "step": 463 }, { "ce_ib": 8.680917739868164, "ce_orig": 0.897162914276123, "epoch": 0.1331511970666475, "kl_loss": 0.16236066818237305, "loss_ib": 0.002491698367521167, "step": 463 }, { "ce_ib": 13.455824851989746, "ce_orig": 0.7123657464981079, "epoch": 0.1331511970666475, "kl_loss": 0.1669284999370575, "loss_ib": 0.0030148671939969063, "step": 463 }, { "ce_ib": 11.438149452209473, "ce_orig": 0.6367284059524536, "epoch": 0.1331511970666475, "kl_loss": 0.17310284078121185, "loss_ib": 0.0028748433105647564, "step": 463 }, { "ce_ib": 9.650132179260254, "ce_orig": 0.877562403678894, "epoch": 0.13343878064562514, "kl_loss": 0.131558358669281, "loss_ib": 0.0022805966436862946, "step": 464 }, { "ce_ib": 10.920985221862793, "ce_orig": 0.9254859089851379, "epoch": 0.13343878064562514, "kl_loss": 0.15900883078575134, "loss_ib": 0.002682186895981431, "step": 464 }, { "ce_ib": 7.144834518432617, "ce_orig": 0.9159427285194397, "epoch": 0.13343878064562514, "kl_loss": 0.12562786042690277, "loss_ib": 0.0019707619212567806, "step": 464 }, { "ce_ib": 7.252218723297119, "ce_orig": 0.5822017192840576, "epoch": 0.13343878064562514, "kl_loss": 0.23755145072937012, "loss_ib": 0.0031007362995296717, "step": 464 }, { "epoch": 0.13372636422460277, "grad_norm": 0.09323103725910187, "learning_rate": 4.997467721852196e-05, "loss": 0.8438, "step": 465 }, { "ce_ib": 13.914019584655762, "ce_orig": 1.2358434200286865, "epoch": 0.13372636422460277, "kl_loss": 0.20358413457870483, "loss_ib": 0.0034272430930286646, "step": 465 }, { "ce_ib": 6.4653425216674805, "ce_orig": 0.5584582090377808, "epoch": 0.13372636422460277, "kl_loss": 0.0890372097492218, "loss_ib": 0.0015369063476100564, "step": 465 }, { "ce_ib": 10.534329414367676, "ce_orig": 0.4327813684940338, "epoch": 0.13372636422460277, "kl_loss": 0.17528124153614044, "loss_ib": 0.0028062453493475914, "step": 465 }, { "ce_ib": 13.77268123626709, "ce_orig": 0.8556481599807739, "epoch": 0.13372636422460277, "kl_loss": 0.20487025380134583, "loss_ib": 0.003425970673561096, "step": 465 }, { "ce_ib": 9.667628288269043, "ce_orig": 0.7900619506835938, "epoch": 0.13401394780358042, "kl_loss": 0.16862963140010834, "loss_ib": 0.002653059083968401, "step": 466 }, { "ce_ib": 11.5745210647583, "ce_orig": 0.5225064158439636, "epoch": 0.13401394780358042, "kl_loss": 0.219425767660141, "loss_ib": 0.0033517098054289818, "step": 466 }, { "ce_ib": 10.800277709960938, "ce_orig": 0.9123367667198181, "epoch": 0.13401394780358042, "kl_loss": 0.2272198349237442, "loss_ib": 0.0033522259909659624, "step": 466 }, { "ce_ib": 8.781864166259766, "ce_orig": 0.7642026543617249, "epoch": 0.13401394780358042, "kl_loss": 0.17208728194236755, "loss_ib": 0.00259905937127769, "step": 466 }, { "ce_ib": 12.304344177246094, "ce_orig": 0.7450142502784729, "epoch": 0.13430153138255804, "kl_loss": 0.1326742172241211, "loss_ib": 0.0025571766309440136, "step": 467 }, { "ce_ib": 9.575723648071289, "ce_orig": 0.648908793926239, "epoch": 0.13430153138255804, "kl_loss": 0.19128626585006714, "loss_ib": 0.0028704351279884577, "step": 467 }, { "ce_ib": 13.457468032836914, "ce_orig": 1.4314584732055664, "epoch": 0.13430153138255804, "kl_loss": 0.20292793214321136, "loss_ib": 0.0033750259317457676, "step": 467 }, { "ce_ib": 8.486967086791992, "ce_orig": 0.6459015011787415, "epoch": 0.13430153138255804, "kl_loss": 0.16141179203987122, "loss_ib": 0.002462814562022686, "step": 467 }, { "ce_ib": 9.87436580657959, "ce_orig": 1.0700461864471436, "epoch": 0.1345891149615357, "kl_loss": 0.24746514856815338, "loss_ib": 0.0034620880614966154, "step": 468 }, { "ce_ib": 10.845966339111328, "ce_orig": 0.6945490837097168, "epoch": 0.1345891149615357, "kl_loss": 0.1763351410627365, "loss_ib": 0.0028479481115937233, "step": 468 }, { "ce_ib": 11.760831832885742, "ce_orig": 0.9512259364128113, "epoch": 0.1345891149615357, "kl_loss": 0.15363314747810364, "loss_ib": 0.002712414599955082, "step": 468 }, { "ce_ib": 9.594245910644531, "ce_orig": 0.6800144910812378, "epoch": 0.1345891149615357, "kl_loss": 0.2686789929866791, "loss_ib": 0.0036462144926190376, "step": 468 }, { "ce_ib": 9.218502044677734, "ce_orig": 0.45141276717185974, "epoch": 0.13487669854051335, "kl_loss": 0.1673453450202942, "loss_ib": 0.0025953035801649094, "step": 469 }, { "ce_ib": 8.04023265838623, "ce_orig": 0.626139223575592, "epoch": 0.13487669854051335, "kl_loss": 0.18813760578632355, "loss_ib": 0.0026853992603719234, "step": 469 }, { "ce_ib": 9.180455207824707, "ce_orig": 0.4675959348678589, "epoch": 0.13487669854051335, "kl_loss": 0.19254645705223083, "loss_ib": 0.0028435098938643932, "step": 469 }, { "ce_ib": 10.131449699401855, "ce_orig": 0.6631660461425781, "epoch": 0.13487669854051335, "kl_loss": 0.14070668816566467, "loss_ib": 0.0024202116765081882, "step": 469 }, { "epoch": 0.13516428211949097, "grad_norm": 0.08323580771684647, "learning_rate": 4.9972901030487616e-05, "loss": 0.8432, "step": 470 }, { "ce_ib": 9.376252174377441, "ce_orig": 0.6429654955863953, "epoch": 0.13516428211949097, "kl_loss": 0.15271279215812683, "loss_ib": 0.002464753109961748, "step": 470 }, { "ce_ib": 7.387055397033691, "ce_orig": 0.4410795569419861, "epoch": 0.13516428211949097, "kl_loss": 0.13434870541095734, "loss_ib": 0.0020821925718337297, "step": 470 }, { "ce_ib": 12.794949531555176, "ce_orig": 0.8125112056732178, "epoch": 0.13516428211949097, "kl_loss": 0.5913262963294983, "loss_ib": 0.007192757446318865, "step": 470 }, { "ce_ib": 7.509584903717041, "ce_orig": 0.8456118106842041, "epoch": 0.13516428211949097, "kl_loss": 0.13973768055438995, "loss_ib": 0.0021483353339135647, "step": 470 }, { "ce_ib": 7.9404191970825195, "ce_orig": 0.7081736326217651, "epoch": 0.13545186569846862, "kl_loss": 0.12523691356182098, "loss_ib": 0.0020464109256863594, "step": 471 }, { "ce_ib": 10.213021278381348, "ce_orig": 0.7080956101417542, "epoch": 0.13545186569846862, "kl_loss": 0.2242983877658844, "loss_ib": 0.003264285856857896, "step": 471 }, { "ce_ib": 9.126559257507324, "ce_orig": 0.7322322726249695, "epoch": 0.13545186569846862, "kl_loss": 0.1383284032344818, "loss_ib": 0.002295939950272441, "step": 471 }, { "ce_ib": 6.414395809173584, "ce_orig": 0.6884047985076904, "epoch": 0.13545186569846862, "kl_loss": 0.11249984800815582, "loss_ib": 0.0017664380138739944, "step": 471 }, { "ce_ib": 5.14065408706665, "ce_orig": 0.2586210370063782, "epoch": 0.13573944927744624, "kl_loss": 0.3770146667957306, "loss_ib": 0.004284211900085211, "step": 472 }, { "ce_ib": 14.23343276977539, "ce_orig": 1.3532360792160034, "epoch": 0.13573944927744624, "kl_loss": 0.18985393643379211, "loss_ib": 0.003321882337331772, "step": 472 }, { "ce_ib": 14.564502716064453, "ce_orig": 1.749810814857483, "epoch": 0.13573944927744624, "kl_loss": 0.15691399574279785, "loss_ib": 0.0030255902092903852, "step": 472 }, { "ce_ib": 8.07909870147705, "ce_orig": 0.5683416724205017, "epoch": 0.13573944927744624, "kl_loss": 0.20622625946998596, "loss_ib": 0.0028701722621917725, "step": 472 }, { "ce_ib": 13.582554817199707, "ce_orig": 1.6216903924942017, "epoch": 0.1360270328564239, "kl_loss": 0.1717289686203003, "loss_ib": 0.0030755449552088976, "step": 473 }, { "ce_ib": 12.75936222076416, "ce_orig": 1.1129322052001953, "epoch": 0.1360270328564239, "kl_loss": 0.18489691615104675, "loss_ib": 0.003124905051663518, "step": 473 }, { "ce_ib": 8.29798412322998, "ce_orig": 0.4912956953048706, "epoch": 0.1360270328564239, "kl_loss": 0.13187135756015778, "loss_ib": 0.002148512052372098, "step": 473 }, { "ce_ib": 6.32996129989624, "ce_orig": 0.5624181628227234, "epoch": 0.1360270328564239, "kl_loss": 0.15103286504745483, "loss_ib": 0.0021433248184621334, "step": 473 }, { "ce_ib": 9.895087242126465, "ce_orig": 0.9939194321632385, "epoch": 0.13631461643540155, "kl_loss": 0.14027726650238037, "loss_ib": 0.00239228131249547, "step": 474 }, { "ce_ib": 10.561649322509766, "ce_orig": 0.8449274897575378, "epoch": 0.13631461643540155, "kl_loss": 0.16884073615074158, "loss_ib": 0.002744572004303336, "step": 474 }, { "ce_ib": 10.697015762329102, "ce_orig": 0.6244873404502869, "epoch": 0.13631461643540155, "kl_loss": 0.16410231590270996, "loss_ib": 0.002710724715143442, "step": 474 }, { "ce_ib": 10.975496292114258, "ce_orig": 0.6514372825622559, "epoch": 0.13631461643540155, "kl_loss": 0.20907053351402283, "loss_ib": 0.003188254777342081, "step": 474 }, { "epoch": 0.13660220001437917, "grad_norm": 0.09574563801288605, "learning_rate": 4.997106467693835e-05, "loss": 0.8712, "step": 475 }, { "ce_ib": 8.283028602600098, "ce_orig": 0.6631106734275818, "epoch": 0.13660220001437917, "kl_loss": 0.19269996881484985, "loss_ib": 0.002755302470177412, "step": 475 }, { "ce_ib": 9.683073997497559, "ce_orig": 0.7057353258132935, "epoch": 0.13660220001437917, "kl_loss": 0.22878339886665344, "loss_ib": 0.0032561414409428835, "step": 475 }, { "ce_ib": 8.93950366973877, "ce_orig": 0.7505787014961243, "epoch": 0.13660220001437917, "kl_loss": 0.1079094409942627, "loss_ib": 0.001973044592887163, "step": 475 }, { "ce_ib": 6.951815128326416, "ce_orig": 0.5303117632865906, "epoch": 0.13660220001437917, "kl_loss": 0.11965961754322052, "loss_ib": 0.0018917776178568602, "step": 475 }, { "ce_ib": 14.84595775604248, "ce_orig": 1.473997950553894, "epoch": 0.13688978359335682, "kl_loss": 0.16360431909561157, "loss_ib": 0.0031206386629492044, "step": 476 }, { "ce_ib": 13.593896865844727, "ce_orig": 1.2449053525924683, "epoch": 0.13688978359335682, "kl_loss": 0.16457515954971313, "loss_ib": 0.003005141159519553, "step": 476 }, { "ce_ib": 9.549323081970215, "ce_orig": 0.7047984004020691, "epoch": 0.13688978359335682, "kl_loss": 0.2452981024980545, "loss_ib": 0.0034079132601618767, "step": 476 }, { "ce_ib": 10.544528007507324, "ce_orig": 0.7549718022346497, "epoch": 0.13688978359335682, "kl_loss": 0.1296602040529251, "loss_ib": 0.0023510546889156103, "step": 476 }, { "ce_ib": 7.901725769042969, "ce_orig": 0.8333771824836731, "epoch": 0.13717736717233445, "kl_loss": 0.11247368156909943, "loss_ib": 0.001914909458719194, "step": 477 }, { "ce_ib": 6.190486431121826, "ce_orig": 0.6102291345596313, "epoch": 0.13717736717233445, "kl_loss": 0.10293813049793243, "loss_ib": 0.0016484298976138234, "step": 477 }, { "ce_ib": 8.575281143188477, "ce_orig": 0.701132595539093, "epoch": 0.13717736717233445, "kl_loss": 0.12163711339235306, "loss_ib": 0.002073899144306779, "step": 477 }, { "ce_ib": 9.477543830871582, "ce_orig": 0.6797293424606323, "epoch": 0.13717736717233445, "kl_loss": 0.13846732676029205, "loss_ib": 0.0023324275389313698, "step": 477 }, { "ce_ib": 8.02422046661377, "ce_orig": 0.7941074371337891, "epoch": 0.1374649507513121, "kl_loss": 0.11544310301542282, "loss_ib": 0.001956852851435542, "step": 478 }, { "ce_ib": 10.08478832244873, "ce_orig": 0.5088381171226501, "epoch": 0.1374649507513121, "kl_loss": 0.26347583532333374, "loss_ib": 0.003643237054347992, "step": 478 }, { "ce_ib": 10.609148025512695, "ce_orig": 1.1123254299163818, "epoch": 0.1374649507513121, "kl_loss": 0.18334609270095825, "loss_ib": 0.0028943754732608795, "step": 478 }, { "ce_ib": 8.124927520751953, "ce_orig": 0.911295473575592, "epoch": 0.1374649507513121, "kl_loss": 0.1195707842707634, "loss_ib": 0.0020082006230950356, "step": 478 }, { "ce_ib": 9.455392837524414, "ce_orig": 0.46617555618286133, "epoch": 0.13775253433028975, "kl_loss": 0.2140653133392334, "loss_ib": 0.003086192300543189, "step": 479 }, { "ce_ib": 12.214388847351074, "ce_orig": 0.7688418030738831, "epoch": 0.13775253433028975, "kl_loss": 0.20302480459213257, "loss_ib": 0.0032516869250684977, "step": 479 }, { "ce_ib": 10.966753005981445, "ce_orig": 0.7571495175361633, "epoch": 0.13775253433028975, "kl_loss": 0.17398342490196228, "loss_ib": 0.0028365093749016523, "step": 479 }, { "ce_ib": 7.949142932891846, "ce_orig": 0.6712113618850708, "epoch": 0.13775253433028975, "kl_loss": 0.16949275135993958, "loss_ib": 0.002489841775968671, "step": 479 }, { "epoch": 0.13804011790926737, "grad_norm": 0.11252865940332413, "learning_rate": 4.996916816229837e-05, "loss": 0.8761, "step": 480 }, { "ce_ib": 11.602306365966797, "ce_orig": 0.8134323358535767, "epoch": 0.13804011790926737, "kl_loss": 0.2448122501373291, "loss_ib": 0.0036083529703319073, "step": 480 }, { "ce_ib": 11.314531326293945, "ce_orig": 0.7367826700210571, "epoch": 0.13804011790926737, "kl_loss": 0.15320701897144318, "loss_ib": 0.002663523191586137, "step": 480 }, { "ce_ib": 12.606677055358887, "ce_orig": 1.1588752269744873, "epoch": 0.13804011790926737, "kl_loss": 0.15930581092834473, "loss_ib": 0.002853725804015994, "step": 480 }, { "ce_ib": 11.054275512695312, "ce_orig": 1.0181690454483032, "epoch": 0.13804011790926737, "kl_loss": 0.11396267265081406, "loss_ib": 0.0022450541146099567, "step": 480 }, { "ce_ib": 14.066468238830566, "ce_orig": 1.4801671504974365, "epoch": 0.13832770148824503, "kl_loss": 0.20112600922584534, "loss_ib": 0.0034179065842181444, "step": 481 }, { "ce_ib": 8.212839126586914, "ce_orig": 0.7344709038734436, "epoch": 0.13832770148824503, "kl_loss": 0.16998212039470673, "loss_ib": 0.002521105110645294, "step": 481 }, { "ce_ib": 12.749667167663574, "ce_orig": 1.22507905960083, "epoch": 0.13832770148824503, "kl_loss": 0.16252657771110535, "loss_ib": 0.0029002325609326363, "step": 481 }, { "ce_ib": 9.067646026611328, "ce_orig": 0.8712934851646423, "epoch": 0.13832770148824503, "kl_loss": 0.14971376955509186, "loss_ib": 0.0024039021227508783, "step": 481 }, { "ce_ib": 7.4774956703186035, "ce_orig": 0.6922398805618286, "epoch": 0.13861528506722265, "kl_loss": 0.17292888462543488, "loss_ib": 0.0024770384188741446, "step": 482 }, { "ce_ib": 12.176875114440918, "ce_orig": 0.8391960859298706, "epoch": 0.13861528506722265, "kl_loss": 0.28599101305007935, "loss_ib": 0.00407759752124548, "step": 482 }, { "ce_ib": 14.910351753234863, "ce_orig": 1.4995876550674438, "epoch": 0.13861528506722265, "kl_loss": 0.20326115190982819, "loss_ib": 0.0035236466210335493, "step": 482 }, { "ce_ib": 14.353828430175781, "ce_orig": 1.3694660663604736, "epoch": 0.13861528506722265, "kl_loss": 0.2608376145362854, "loss_ib": 0.004043758846819401, "step": 482 }, { "ce_ib": 10.655997276306152, "ce_orig": 0.795907735824585, "epoch": 0.1389028686462003, "kl_loss": 0.17903940379619598, "loss_ib": 0.0028559938073158264, "step": 483 }, { "ce_ib": 8.001945495605469, "ce_orig": 0.6496250629425049, "epoch": 0.1389028686462003, "kl_loss": 0.22284536063671112, "loss_ib": 0.003028648206964135, "step": 483 }, { "ce_ib": 15.7087984085083, "ce_orig": 1.539727807044983, "epoch": 0.1389028686462003, "kl_loss": 0.1869555413722992, "loss_ib": 0.003440435044467449, "step": 483 }, { "ce_ib": 11.261712074279785, "ce_orig": 0.7162747383117676, "epoch": 0.1389028686462003, "kl_loss": 0.15583762526512146, "loss_ib": 0.002684547333046794, "step": 483 }, { "ce_ib": 12.349994659423828, "ce_orig": 0.5102917551994324, "epoch": 0.13919045222517795, "kl_loss": 0.21702654659748077, "loss_ib": 0.003405264811590314, "step": 484 }, { "ce_ib": 14.703964233398438, "ce_orig": 1.2549042701721191, "epoch": 0.13919045222517795, "kl_loss": 0.28059592843055725, "loss_ib": 0.004276355262845755, "step": 484 }, { "ce_ib": 14.395584106445312, "ce_orig": 1.6029713153839111, "epoch": 0.13919045222517795, "kl_loss": 0.1588822305202484, "loss_ib": 0.0030283809173852205, "step": 484 }, { "ce_ib": 12.572036743164062, "ce_orig": 1.4179061651229858, "epoch": 0.13919045222517795, "kl_loss": 0.23325228691101074, "loss_ib": 0.0035897265188395977, "step": 484 }, { "epoch": 0.13947803580415558, "grad_norm": 0.09978976100683212, "learning_rate": 4.996721149113682e-05, "loss": 0.9298, "step": 485 }, { "ce_ib": 15.488334655761719, "ce_orig": 1.308066964149475, "epoch": 0.13947803580415558, "kl_loss": 0.17892438173294067, "loss_ib": 0.0033380771055817604, "step": 485 }, { "ce_ib": 10.043342590332031, "ce_orig": 0.9190800786018372, "epoch": 0.13947803580415558, "kl_loss": 0.14057381451129913, "loss_ib": 0.0024100723676383495, "step": 485 }, { "ce_ib": 10.405566215515137, "ce_orig": 0.41310566663742065, "epoch": 0.13947803580415558, "kl_loss": 0.08804390579462051, "loss_ib": 0.001920995651744306, "step": 485 }, { "ce_ib": 12.68533706665039, "ce_orig": 0.9749146103858948, "epoch": 0.13947803580415558, "kl_loss": 0.17658352851867676, "loss_ib": 0.003034368623048067, "step": 485 }, { "ce_ib": 14.109472274780273, "ce_orig": 0.93257075548172, "epoch": 0.13976561938313323, "kl_loss": 0.15330049395561218, "loss_ib": 0.002943952102214098, "step": 486 }, { "ce_ib": 7.845019340515137, "ce_orig": 0.7454962730407715, "epoch": 0.13976561938313323, "kl_loss": 0.18838530778884888, "loss_ib": 0.0026683551259338856, "step": 486 }, { "ce_ib": 9.430821418762207, "ce_orig": 1.0630453824996948, "epoch": 0.13976561938313323, "kl_loss": 0.15098202228546143, "loss_ib": 0.00245290226303041, "step": 486 }, { "ce_ib": 6.5644049644470215, "ce_orig": 0.5489628314971924, "epoch": 0.13976561938313323, "kl_loss": 0.08801446855068207, "loss_ib": 0.001536585041321814, "step": 486 }, { "ce_ib": 11.013578414916992, "ce_orig": 0.7610940933227539, "epoch": 0.14005320296211085, "kl_loss": 0.22202414274215698, "loss_ib": 0.0033215992152690887, "step": 487 }, { "ce_ib": 13.75318717956543, "ce_orig": 0.7965566515922546, "epoch": 0.14005320296211085, "kl_loss": 0.22268138825893402, "loss_ib": 0.003602132434025407, "step": 487 }, { "ce_ib": 11.45129680633545, "ce_orig": 1.317887306213379, "epoch": 0.14005320296211085, "kl_loss": 0.1648291051387787, "loss_ib": 0.002793420571833849, "step": 487 }, { "ce_ib": 9.824847221374512, "ce_orig": 0.6467515230178833, "epoch": 0.14005320296211085, "kl_loss": 0.21943452954292297, "loss_ib": 0.0031768297776579857, "step": 487 }, { "ce_ib": 9.987610816955566, "ce_orig": 0.7534988522529602, "epoch": 0.1403407865410885, "kl_loss": 0.1998450607061386, "loss_ib": 0.0029972116462886333, "step": 488 }, { "ce_ib": 14.38665771484375, "ce_orig": 1.332573413848877, "epoch": 0.1403407865410885, "kl_loss": 0.23315776884555817, "loss_ib": 0.003770243376493454, "step": 488 }, { "ce_ib": 6.623453140258789, "ce_orig": 0.42733436822891235, "epoch": 0.1403407865410885, "kl_loss": 0.14417804777622223, "loss_ib": 0.0021041256841272116, "step": 488 }, { "ce_ib": 12.093878746032715, "ce_orig": 1.1107982397079468, "epoch": 0.1403407865410885, "kl_loss": 0.1123935654759407, "loss_ib": 0.00233332347124815, "step": 488 }, { "ce_ib": 11.833623886108398, "ce_orig": 0.9317137598991394, "epoch": 0.14062837012006615, "kl_loss": 0.4279143214225769, "loss_ib": 0.005462505854666233, "step": 489 }, { "ce_ib": 6.175386428833008, "ce_orig": 0.2635171413421631, "epoch": 0.14062837012006615, "kl_loss": 0.17456625401973724, "loss_ib": 0.0023632009979337454, "step": 489 }, { "ce_ib": 9.941847801208496, "ce_orig": 0.6531252861022949, "epoch": 0.14062837012006615, "kl_loss": 0.17595279216766357, "loss_ib": 0.0027537124697118998, "step": 489 }, { "ce_ib": 7.677126407623291, "ce_orig": 0.688906192779541, "epoch": 0.14062837012006615, "kl_loss": 0.18364465236663818, "loss_ib": 0.0026041590608656406, "step": 489 }, { "epoch": 0.14091595369904378, "grad_norm": 0.0886775329709053, "learning_rate": 4.996519466816778e-05, "loss": 0.9075, "step": 490 }, { "ce_ib": 8.481292724609375, "ce_orig": 0.5066956281661987, "epoch": 0.14091595369904378, "kl_loss": 0.14637017250061035, "loss_ib": 0.002311830874532461, "step": 490 }, { "ce_ib": 14.51606559753418, "ce_orig": 1.596727967262268, "epoch": 0.14091595369904378, "kl_loss": 0.19026514887809753, "loss_ib": 0.0033542579039931297, "step": 490 }, { "ce_ib": 10.839821815490723, "ce_orig": 1.242689609527588, "epoch": 0.14091595369904378, "kl_loss": 0.21338334679603577, "loss_ib": 0.0032178156543523073, "step": 490 }, { "ce_ib": 7.8446831703186035, "ce_orig": 0.968952476978302, "epoch": 0.14091595369904378, "kl_loss": 0.2997243404388428, "loss_ib": 0.003781711682677269, "step": 490 }, { "ce_ib": 11.051322937011719, "ce_orig": 1.4200416803359985, "epoch": 0.14120353727802143, "kl_loss": 0.17061398923397064, "loss_ib": 0.0028112721629440784, "step": 491 }, { "ce_ib": 11.496525764465332, "ce_orig": 1.1261836290359497, "epoch": 0.14120353727802143, "kl_loss": 0.1715063452720642, "loss_ib": 0.002864715876057744, "step": 491 }, { "ce_ib": 15.705190658569336, "ce_orig": 1.4249088764190674, "epoch": 0.14120353727802143, "kl_loss": 0.19172680377960205, "loss_ib": 0.0034877872094511986, "step": 491 }, { "ce_ib": 10.472744941711426, "ce_orig": 0.9399302005767822, "epoch": 0.14120353727802143, "kl_loss": 0.15676361322402954, "loss_ib": 0.0026149104814976454, "step": 491 }, { "ce_ib": 7.808863639831543, "ce_orig": 0.8644165396690369, "epoch": 0.14149112085699905, "kl_loss": 0.09857909381389618, "loss_ib": 0.0017666771309450269, "step": 492 }, { "ce_ib": 9.123184204101562, "ce_orig": 0.736179530620575, "epoch": 0.14149112085699905, "kl_loss": 0.1718408167362213, "loss_ib": 0.0026307266671210527, "step": 492 }, { "ce_ib": 16.71449851989746, "ce_orig": 1.8901475667953491, "epoch": 0.14149112085699905, "kl_loss": 0.21999290585517883, "loss_ib": 0.0038713787216693163, "step": 492 }, { "ce_ib": 14.769342422485352, "ce_orig": 1.0042953491210938, "epoch": 0.14149112085699905, "kl_loss": 0.19468256831169128, "loss_ib": 0.0034237599465996027, "step": 492 }, { "ce_ib": 7.843172073364258, "ce_orig": 0.2853364646434784, "epoch": 0.1417787044359767, "kl_loss": 0.13801902532577515, "loss_ib": 0.002164507517591119, "step": 493 }, { "ce_ib": 10.78830337524414, "ce_orig": 1.1020339727401733, "epoch": 0.1417787044359767, "kl_loss": 0.21507477760314941, "loss_ib": 0.003229578025639057, "step": 493 }, { "ce_ib": 7.485945224761963, "ce_orig": 0.6249547004699707, "epoch": 0.1417787044359767, "kl_loss": 0.0884731262922287, "loss_ib": 0.0016333258245140314, "step": 493 }, { "ce_ib": 10.592840194702148, "ce_orig": 0.6959387063980103, "epoch": 0.1417787044359767, "kl_loss": 0.3251839876174927, "loss_ib": 0.004311123862862587, "step": 493 }, { "ce_ib": 6.683375358581543, "ce_orig": 0.47197264432907104, "epoch": 0.14206628801495436, "kl_loss": 0.1459130495786667, "loss_ib": 0.0021274678874760866, "step": 494 }, { "ce_ib": 8.309039115905762, "ce_orig": 0.34105879068374634, "epoch": 0.14206628801495436, "kl_loss": 0.15694405138492584, "loss_ib": 0.0024003442376852036, "step": 494 }, { "ce_ib": 13.072383880615234, "ce_orig": 1.3826266527175903, "epoch": 0.14206628801495436, "kl_loss": 0.19439606368541718, "loss_ib": 0.003251199144870043, "step": 494 }, { "ce_ib": 8.67587947845459, "ce_orig": 0.5467540621757507, "epoch": 0.14206628801495436, "kl_loss": 0.22117763757705688, "loss_ib": 0.0030793643090873957, "step": 494 }, { "epoch": 0.14235387159393198, "grad_norm": 0.11509755253791809, "learning_rate": 4.996311769825024e-05, "loss": 0.8795, "step": 495 }, { "ce_ib": 7.835722923278809, "ce_orig": 0.5985096096992493, "epoch": 0.14235387159393198, "kl_loss": 0.11672006547451019, "loss_ib": 0.0019507729448378086, "step": 495 }, { "ce_ib": 10.796977996826172, "ce_orig": 1.2538580894470215, "epoch": 0.14235387159393198, "kl_loss": 0.17189006507396698, "loss_ib": 0.0027985982596874237, "step": 495 }, { "ce_ib": 11.224424362182617, "ce_orig": 0.8003069758415222, "epoch": 0.14235387159393198, "kl_loss": 0.11536049842834473, "loss_ib": 0.0022760473657399416, "step": 495 }, { "ce_ib": 9.976873397827148, "ce_orig": 0.9437066316604614, "epoch": 0.14235387159393198, "kl_loss": 0.14582431316375732, "loss_ib": 0.002455930458381772, "step": 495 }, { "ce_ib": 12.75202751159668, "ce_orig": 1.2885056734085083, "epoch": 0.14264145517290963, "kl_loss": 0.17118601500988007, "loss_ib": 0.002987062791362405, "step": 496 }, { "ce_ib": 11.649064064025879, "ce_orig": 0.8830009698867798, "epoch": 0.14264145517290963, "kl_loss": 0.1887287050485611, "loss_ib": 0.0030521934386342764, "step": 496 }, { "ce_ib": 14.029234886169434, "ce_orig": 0.9412078261375427, "epoch": 0.14264145517290963, "kl_loss": 0.14774635434150696, "loss_ib": 0.002880387008190155, "step": 496 }, { "ce_ib": 16.335601806640625, "ce_orig": 2.0776398181915283, "epoch": 0.14264145517290963, "kl_loss": 0.1809537559747696, "loss_ib": 0.003443097695708275, "step": 496 }, { "ce_ib": 9.790528297424316, "ce_orig": 0.9552518129348755, "epoch": 0.14292903875188726, "kl_loss": 0.1889423429965973, "loss_ib": 0.002868476090952754, "step": 497 }, { "ce_ib": 9.869925498962402, "ce_orig": 0.8539248704910278, "epoch": 0.14292903875188726, "kl_loss": 0.19081233441829681, "loss_ib": 0.002895115874707699, "step": 497 }, { "ce_ib": 9.595001220703125, "ce_orig": 0.5288217663764954, "epoch": 0.14292903875188726, "kl_loss": 0.19318905472755432, "loss_ib": 0.002891390584409237, "step": 497 }, { "ce_ib": 9.586201667785645, "ce_orig": 1.1783746480941772, "epoch": 0.14292903875188726, "kl_loss": 0.18821683526039124, "loss_ib": 0.002840788336470723, "step": 497 }, { "ce_ib": 12.379876136779785, "ce_orig": 1.2077107429504395, "epoch": 0.1432166223308649, "kl_loss": 0.14908835291862488, "loss_ib": 0.0027288710698485374, "step": 498 }, { "ce_ib": 11.757010459899902, "ce_orig": 0.6566261649131775, "epoch": 0.1432166223308649, "kl_loss": 0.1946725696325302, "loss_ib": 0.003122426802292466, "step": 498 }, { "ce_ib": 8.702943801879883, "ce_orig": 0.4927518963813782, "epoch": 0.1432166223308649, "kl_loss": 0.10925129801034927, "loss_ib": 0.001962807262316346, "step": 498 }, { "ce_ib": 10.411445617675781, "ce_orig": 0.706779956817627, "epoch": 0.1432166223308649, "kl_loss": 0.17433921992778778, "loss_ib": 0.002784536685794592, "step": 498 }, { "ce_ib": 14.122117042541504, "ce_orig": 1.4039651155471802, "epoch": 0.14350420590984256, "kl_loss": 0.16670997440814972, "loss_ib": 0.0030793112237006426, "step": 499 }, { "ce_ib": 10.383757591247559, "ce_orig": 1.0631924867630005, "epoch": 0.14350420590984256, "kl_loss": 0.16225400567054749, "loss_ib": 0.002660915721207857, "step": 499 }, { "ce_ib": 6.402273654937744, "ce_orig": 0.6313638091087341, "epoch": 0.14350420590984256, "kl_loss": 0.18505465984344482, "loss_ib": 0.0024907737970352173, "step": 499 }, { "ce_ib": 8.23951244354248, "ce_orig": 0.8967234492301941, "epoch": 0.14350420590984256, "kl_loss": 0.13677600026130676, "loss_ib": 0.0021917112171649933, "step": 499 }, { "epoch": 0.14379178948882018, "grad_norm": 0.09538047015666962, "learning_rate": 4.996098058638809e-05, "loss": 0.8901, "step": 500 } ], "logging_steps": 5, "max_steps": 10434, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 2, "trial_name": null, "trial_params": null }