{"step": 0, "train_loss": 12.010697364807129, "lr": 0.0, "tps": 910, "wall": 72.0} {"step": 1, "train_loss": 11.96965503692627, "lr": 4.0000000000000003e-07, "tps": 929, "wall": 141.0} {"step": 2, "train_loss": 11.981226921081543, "lr": 8.000000000000001e-07, "tps": 932, "wall": 210.8} {"step": 3, "train_loss": 11.984458923339844, "lr": 1.2000000000000002e-06, "tps": 946, "wall": 276.8} {"step": 4, "train_loss": 11.962907791137695, "lr": 1.6000000000000001e-06, "tps": 944, "wall": 346.8} {"step": 5, "train_loss": 11.980673789978027, "lr": 2e-06, "tps": 945, "wall": 415.8} {"step": 6, "train_loss": 11.898082733154297, "lr": 2.4000000000000003e-06, "tps": 946, "wall": 484.5} {"step": 7, "train_loss": 11.908851623535156, "lr": 2.8e-06, "tps": 947, "wall": 553.6} {"step": 8, "train_loss": 11.831507682800293, "lr": 3.2000000000000003e-06, "tps": 957, "wall": 616.1} {"step": 9, "train_loss": 11.751951217651367, "lr": 3.6000000000000003e-06, "tps": 937, "wall": 698.7} {"step": 10, "train_loss": 11.724292755126953, "lr": 4e-06, "tps": 944, "wall": 763.6} {"step": 11, "train_loss": 11.649297714233398, "lr": 4.4e-06, "tps": 945, "wall": 832.1} {"step": 12, "train_loss": 11.556442260742188, "lr": 4.800000000000001e-06, "tps": 944, "wall": 901.7} {"step": 13, "train_loss": 11.515082359313965, "lr": 5.200000000000001e-06, "tps": 943, "wall": 972.2} {"step": 14, "train_loss": 11.432888984680176, "lr": 5.6e-06, "tps": 946, "wall": 1039.0} {"step": 15, "train_loss": 11.280614852905273, "lr": 6e-06, "tps": 949, "wall": 1103.8} {"step": 16, "train_loss": 11.243553161621094, "lr": 6.4000000000000006e-06, "tps": 949, "wall": 1173.3} {"step": 17, "train_loss": 11.123882293701172, "lr": 6.8e-06, "tps": 948, "wall": 1244.0} {"step": 18, "train_loss": 11.010810852050781, "lr": 7.2000000000000005e-06, "tps": 948, "wall": 1312.5} {"step": 19, "train_loss": 10.999919891357422, "lr": 7.6e-06, "tps": 950, "wall": 1378.7} {"step": 20, "train_loss": 10.937429428100586, "lr": 8e-06, "tps": 951, "wall": 1447.0} {"step": 21, "train_loss": 10.852409362792969, "lr": 8.400000000000001e-06, "tps": 953, "wall": 1512.7} {"step": 22, "train_loss": 10.72719669342041, "lr": 8.8e-06, "tps": 952, "wall": 1582.8} {"step": 23, "train_loss": 10.672483444213867, "lr": 9.2e-06, "tps": 951, "wall": 1653.1} {"step": 24, "train_loss": 10.674062728881836, "lr": 9.600000000000001e-06, "tps": 951, "wall": 1722.0} {"step": 25, "train_loss": 10.623747825622559, "lr": 1e-05, "tps": 950, "wall": 1792.7} {"step": 26, "train_loss": 10.523874282836914, "lr": 1.0400000000000002e-05, "tps": 951, "wall": 1860.2} {"step": 27, "train_loss": 10.469463348388672, "lr": 1.08e-05, "tps": 950, "wall": 1930.0} {"step": 28, "train_loss": 10.356807708740234, "lr": 1.12e-05, "tps": 950, "wall": 1999.6} {"step": 29, "train_loss": 10.294553756713867, "lr": 1.16e-05, "tps": 948, "wall": 2073.3} {"step": 30, "train_loss": 10.223312377929688, "lr": 1.2e-05, "tps": 947, "wall": 2144.0} {"step": 31, "train_loss": 10.260488510131836, "lr": 1.2400000000000002e-05, "tps": 948, "wall": 2210.1} {"step": 32, "train_loss": 10.180464744567871, "lr": 1.2800000000000001e-05, "tps": 947, "wall": 2281.4} {"step": 33, "train_loss": 10.115972518920898, "lr": 1.32e-05, "tps": 947, "wall": 2352.4} {"step": 34, "train_loss": 10.067770004272461, "lr": 1.36e-05, "tps": 948, "wall": 2418.9} {"step": 35, "train_loss": 10.072193145751953, "lr": 1.4e-05, "tps": 948, "wall": 2488.2} {"step": 36, "train_loss": 10.045570373535156, "lr": 1.4400000000000001e-05, "tps": 947, "wall": 2558.8} {"step": 37, "train_loss": 10.00036907196045, "lr": 1.48e-05, "tps": 948, "wall": 2625.7} {"step": 38, "train_loss": 9.990562438964844, "lr": 1.52e-05, "tps": 948, "wall": 2694.0} {"step": 39, "train_loss": 9.957466125488281, "lr": 1.56e-05, "tps": 948, "wall": 2763.5} {"step": 40, "train_loss": 9.912899017333984, "lr": 1.6e-05, "tps": 948, "wall": 2831.7} {"step": 41, "train_loss": 9.890909194946289, "lr": 1.6400000000000002e-05, "tps": 951, "wall": 2894.3} {"step": 42, "train_loss": 9.889411926269531, "lr": 1.6800000000000002e-05, "tps": 950, "wall": 2963.7} {"step": 43, "train_loss": 9.917186737060547, "lr": 1.72e-05, "tps": 951, "wall": 3030.5} {"step": 44, "train_loss": 9.838390350341797, "lr": 1.76e-05, "tps": 951, "wall": 3100.0} {"step": 45, "train_loss": 9.816900253295898, "lr": 1.8e-05, "tps": 950, "wall": 3170.0} {"step": 46, "train_loss": 9.792354583740234, "lr": 1.84e-05, "tps": 951, "wall": 3237.6} {"step": 47, "train_loss": 9.856487274169922, "lr": 1.88e-05, "tps": 951, "wall": 3306.8} {"step": 48, "train_loss": 9.773977279663086, "lr": 1.9200000000000003e-05, "tps": 950, "wall": 3379.4} {"step": 49, "train_loss": 9.736377716064453, "lr": 1.96e-05, "tps": 949, "wall": 3450.2} {"step": 50, "train_loss": 9.75018310546875, "lr": 2e-05, "tps": 950, "wall": 3516.7} {"step": 51, "train_loss": 9.754556655883789, "lr": 2.04e-05, "tps": 949, "wall": 3588.7} {"step": 52, "train_loss": 9.765791893005371, "lr": 2.0800000000000004e-05, "tps": 950, "wall": 3653.1} {"step": 53, "train_loss": 9.722951889038086, "lr": 2.12e-05, "tps": 951, "wall": 3720.9} {"step": 54, "train_loss": 9.664896011352539, "lr": 2.16e-05, "tps": 951, "wall": 3789.6} {"step": 55, "train_loss": 9.628379821777344, "lr": 2.2000000000000003e-05, "tps": 950, "wall": 3859.4} {"step": 56, "train_loss": 9.626276016235352, "lr": 2.24e-05, "tps": 952, "wall": 3923.7} {"step": 57, "train_loss": 9.62670612335205, "lr": 2.2800000000000002e-05, "tps": 952, "wall": 3992.4} {"step": 58, "train_loss": 9.62191390991211, "lr": 2.32e-05, "tps": 952, "wall": 4060.7} {"step": 59, "train_loss": 9.592965126037598, "lr": 2.36e-05, "tps": 952, "wall": 4130.0} {"step": 60, "train_loss": 9.557229995727539, "lr": 2.4e-05, "tps": 951, "wall": 4199.4} {"step": 61, "train_loss": 9.518532752990723, "lr": 2.44e-05, "tps": 952, "wall": 4264.6} {"step": 62, "train_loss": 9.565384864807129, "lr": 2.4800000000000003e-05, "tps": 953, "wall": 4332.1} {"step": 63, "train_loss": 9.482979774475098, "lr": 2.52e-05, "tps": 952, "wall": 4403.1} {"step": 64, "train_loss": 9.412121772766113, "lr": 2.5600000000000002e-05, "tps": 951, "wall": 4476.1} {"step": 65, "train_loss": 9.506957054138184, "lr": 2.6000000000000002e-05, "tps": 949, "wall": 4557.0} {"step": 66, "train_loss": 9.467164993286133, "lr": 2.64e-05, "tps": 949, "wall": 4626.4} {"step": 67, "train_loss": 9.377189636230469, "lr": 2.68e-05, "tps": 948, "wall": 4696.0} {"step": 68, "train_loss": 9.370645523071289, "lr": 2.72e-05, "tps": 949, "wall": 4764.9} {"step": 69, "train_loss": 9.341726303100586, "lr": 2.7600000000000003e-05, "tps": 948, "wall": 4834.6} {"step": 70, "train_loss": 9.364311218261719, "lr": 2.8e-05, "tps": 949, "wall": 4901.3} {"step": 71, "train_loss": 9.270305633544922, "lr": 2.8400000000000003e-05, "tps": 949, "wall": 4970.5} {"step": 72, "train_loss": 9.281624794006348, "lr": 2.8800000000000002e-05, "tps": 949, "wall": 5039.0} {"step": 73, "train_loss": 9.233774185180664, "lr": 2.92e-05, "tps": 948, "wall": 5111.5} {"step": 74, "train_loss": 9.294072151184082, "lr": 2.96e-05, "tps": 948, "wall": 5182.1} {"step": 75, "train_loss": 9.223991394042969, "lr": 3e-05, "tps": 948, "wall": 5252.6} {"step": 76, "train_loss": 9.157362937927246, "lr": 3.04e-05, "tps": 948, "wall": 5320.3} {"step": 77, "train_loss": 9.209671020507812, "lr": 3.08e-05, "tps": 949, "wall": 5386.0} {"step": 78, "train_loss": 9.179274559020996, "lr": 3.12e-05, "tps": 949, "wall": 5453.8} {"step": 79, "train_loss": 9.085465431213379, "lr": 3.16e-05, "tps": 949, "wall": 5520.9} {"step": 80, "train_loss": 9.1079740524292, "lr": 3.2e-05, "tps": 949, "wall": 5588.9} {"step": 81, "train_loss": 9.08513069152832, "lr": 3.24e-05, "tps": 950, "wall": 5654.1} {"step": 82, "train_loss": 9.015950202941895, "lr": 3.2800000000000004e-05, "tps": 950, "wall": 5725.6} {"step": 83, "train_loss": 9.063796997070312, "lr": 3.32e-05, "tps": 950, "wall": 5794.7} {"step": 84, "train_loss": 8.99737548828125, "lr": 3.3600000000000004e-05, "tps": 949, "wall": 5864.6} {"step": 85, "train_loss": 8.945900917053223, "lr": 3.4e-05, "tps": 950, "wall": 5927.5} {"step": 86, "train_loss": 8.93387222290039, "lr": 3.44e-05, "tps": 950, "wall": 5997.7} {"step": 87, "train_loss": 8.958739280700684, "lr": 3.4800000000000006e-05, "tps": 951, "wall": 6063.6} {"step": 88, "train_loss": 8.918479919433594, "lr": 3.52e-05, "tps": 951, "wall": 6131.5} {"step": 89, "train_loss": 8.855342864990234, "lr": 3.56e-05, "tps": 951, "wall": 6200.0} {"step": 90, "train_loss": 8.866922378540039, "lr": 3.6e-05, "tps": 951, "wall": 6264.9} {"step": 91, "train_loss": 8.829869270324707, "lr": 3.6400000000000004e-05, "tps": 951, "wall": 6336.0} {"step": 92, "train_loss": 8.79916000366211, "lr": 3.68e-05, "tps": 951, "wall": 6402.7} {"step": 93, "train_loss": 8.740850448608398, "lr": 3.72e-05, "tps": 951, "wall": 6473.9} {"step": 94, "train_loss": 8.792409896850586, "lr": 3.76e-05, "tps": 951, "wall": 6544.5} {"step": 95, "train_loss": 8.686039924621582, "lr": 3.8e-05, "tps": 950, "wall": 6618.3} {"step": 96, "train_loss": 8.677000045776367, "lr": 3.8400000000000005e-05, "tps": 950, "wall": 6688.5} {"step": 97, "train_loss": 8.69382095336914, "lr": 3.88e-05, "tps": 950, "wall": 6758.0} {"step": 98, "train_loss": 8.663525581359863, "lr": 3.92e-05, "tps": 950, "wall": 6829.5} {"step": 99, "train_loss": 8.636314392089844, "lr": 3.96e-05, "tps": 949, "wall": 6901.8} {"step": 100, "train_loss": 8.546436309814453, "lr": 4e-05, "tps": 949, "wall": 6971.8} {"step": 101, "train_loss": 8.57101058959961, "lr": 4.0400000000000006e-05, "tps": 949, "wall": 7037.2} {"step": 102, "train_loss": 8.568340301513672, "lr": 4.08e-05, "tps": 950, "wall": 7098.6} {"step": 103, "train_loss": 8.628861427307129, "lr": 4.12e-05, "tps": 950, "wall": 7169.0} {"step": 104, "train_loss": 8.567682266235352, "lr": 4.160000000000001e-05, "tps": 950, "wall": 7236.2} {"step": 105, "train_loss": 8.497370719909668, "lr": 4.2000000000000004e-05, "tps": 950, "wall": 7305.0} {"step": 106, "train_loss": 8.448330879211426, "lr": 4.24e-05, "tps": 951, "wall": 7372.6} {"step": 107, "train_loss": 8.481821060180664, "lr": 4.2800000000000004e-05, "tps": 951, "wall": 7441.1} {"step": 108, "train_loss": 8.367916107177734, "lr": 4.32e-05, "tps": 952, "wall": 7503.3} {"step": 109, "train_loss": 8.396551132202148, "lr": 4.36e-05, "tps": 951, "wall": 7573.5} {"step": 110, "train_loss": 8.405254364013672, "lr": 4.4000000000000006e-05, "tps": 951, "wall": 7644.2} {"step": 111, "train_loss": 8.329368591308594, "lr": 4.44e-05, "tps": 951, "wall": 7710.7} {"step": 112, "train_loss": 8.313891410827637, "lr": 4.48e-05, "tps": 952, "wall": 7777.5} {"step": 113, "train_loss": 8.262480735778809, "lr": 4.52e-05, "tps": 952, "wall": 7845.9} {"step": 114, "train_loss": 8.29344367980957, "lr": 4.5600000000000004e-05, "tps": 952, "wall": 7915.4} {"step": 115, "train_loss": 8.254911422729492, "lr": 4.6e-05, "tps": 952, "wall": 7985.2} {"step": 116, "train_loss": 8.21626091003418, "lr": 4.64e-05, "tps": 951, "wall": 8056.0} {"step": 117, "train_loss": 8.169304847717285, "lr": 4.68e-05, "tps": 951, "wall": 8124.6} {"step": 118, "train_loss": 8.246122360229492, "lr": 4.72e-05, "tps": 951, "wall": 8199.2} {"step": 119, "train_loss": 8.201326370239258, "lr": 4.7600000000000005e-05, "tps": 951, "wall": 8269.0} {"step": 120, "train_loss": 8.185909271240234, "lr": 4.8e-05, "tps": 951, "wall": 8338.2} {"step": 121, "train_loss": 8.069734573364258, "lr": 4.8400000000000004e-05, "tps": 950, "wall": 8408.3} {"step": 122, "train_loss": 8.208276748657227, "lr": 4.88e-05, "tps": 950, "wall": 8479.6} {"step": 123, "train_loss": 8.085567474365234, "lr": 4.92e-05, "tps": 950, "wall": 8551.2} {"step": 124, "train_loss": 8.038138389587402, "lr": 4.9600000000000006e-05, "tps": 950, "wall": 8620.6} {"step": 125, "train_loss": 8.055192947387695, "lr": 5e-05, "tps": 950, "wall": 8690.3} {"step": 126, "train_loss": 7.997938632965088, "lr": 5.04e-05, "tps": 950, "wall": 8757.7} {"step": 127, "train_loss": 7.917834281921387, "lr": 5.08e-05, "tps": 950, "wall": 8827.9} {"step": 128, "train_loss": 8.007091522216797, "lr": 5.1200000000000004e-05, "tps": 950, "wall": 8898.8} {"step": 129, "train_loss": 7.9727630615234375, "lr": 5.16e-05, "tps": 949, "wall": 8969.1} {"step": 130, "train_loss": 8.010106086730957, "lr": 5.2000000000000004e-05, "tps": 950, "wall": 9036.3} {"step": 131, "train_loss": 8.01589298248291, "lr": 5.24e-05, "tps": 949, "wall": 9106.5} {"step": 132, "train_loss": 8.031391143798828, "lr": 5.28e-05, "tps": 949, "wall": 9175.9} {"step": 133, "train_loss": 7.955106735229492, "lr": 5.3200000000000006e-05, "tps": 949, "wall": 9246.2} {"step": 134, "train_loss": 7.808548450469971, "lr": 5.36e-05, "tps": 949, "wall": 9313.0} {"step": 135, "train_loss": 7.913183212280273, "lr": 5.4e-05, "tps": 949, "wall": 9384.5} {"step": 136, "train_loss": 7.795839309692383, "lr": 5.44e-05, "tps": 949, "wall": 9454.6} {"step": 137, "train_loss": 7.834445953369141, "lr": 5.4800000000000004e-05, "tps": 949, "wall": 9525.0} {"step": 138, "train_loss": 7.766136646270752, "lr": 5.520000000000001e-05, "tps": 949, "wall": 9593.7} {"step": 139, "train_loss": 7.865386009216309, "lr": 5.56e-05, "tps": 949, "wall": 9661.5} {"step": 140, "train_loss": 7.720357894897461, "lr": 5.6e-05, "tps": 949, "wall": 9730.2} {"step": 141, "train_loss": 7.792556285858154, "lr": 5.640000000000001e-05, "tps": 949, "wall": 9798.9} {"step": 142, "train_loss": 7.801546096801758, "lr": 5.6800000000000005e-05, "tps": 949, "wall": 9868.0} {"step": 143, "train_loss": 7.684850215911865, "lr": 5.72e-05, "tps": 949, "wall": 9936.3} {"step": 144, "train_loss": 7.762656211853027, "lr": 5.7600000000000004e-05, "tps": 949, "wall": 10007.3} {"step": 145, "train_loss": 7.695272445678711, "lr": 5.8e-05, "tps": 950, "wall": 10070.4} {"step": 146, "train_loss": 7.647067070007324, "lr": 5.84e-05, "tps": 950, "wall": 10135.7} {"step": 147, "train_loss": 7.5962114334106445, "lr": 5.8800000000000006e-05, "tps": 950, "wall": 10202.3} {"step": 148, "train_loss": 7.5769476890563965, "lr": 5.92e-05, "tps": 950, "wall": 10273.5} {"step": 149, "train_loss": 7.548748016357422, "lr": 5.96e-05, "tps": 950, "wall": 10344.3} {"step": 150, "train_loss": 7.6254777908325195, "lr": 6e-05, "tps": 950, "wall": 10415.4} {"step": 151, "train_loss": 7.604466915130615, "lr": 6.0400000000000004e-05, "tps": 950, "wall": 10481.2} {"step": 152, "train_loss": 7.6124372482299805, "lr": 6.08e-05, "tps": 950, "wall": 10545.6} {"step": 153, "train_loss": 7.598109245300293, "lr": 6.120000000000001e-05, "tps": 950, "wall": 10617.3} {"step": 154, "train_loss": 7.537181377410889, "lr": 6.16e-05, "tps": 950, "wall": 10684.7} {"step": 155, "train_loss": 7.536397933959961, "lr": 6.2e-05, "tps": 950, "wall": 10756.2} {"step": 156, "train_loss": 7.611353874206543, "lr": 6.24e-05, "tps": 950, "wall": 10824.0} {"step": 157, "train_loss": 7.585582733154297, "lr": 6.280000000000001e-05, "tps": 950, "wall": 10895.4} {"step": 158, "train_loss": 7.527928352355957, "lr": 6.32e-05, "tps": 950, "wall": 10967.1} {"step": 159, "train_loss": 7.502246856689453, "lr": 6.36e-05, "tps": 950, "wall": 11037.3} {"step": 160, "train_loss": 7.561649322509766, "lr": 6.4e-05, "tps": 950, "wall": 11102.1} {"step": 161, "train_loss": 7.506707191467285, "lr": 6.44e-05, "tps": 950, "wall": 11171.0} {"step": 162, "train_loss": 7.418725967407227, "lr": 6.48e-05, "tps": 950, "wall": 11241.1} {"step": 163, "train_loss": 7.482645034790039, "lr": 6.520000000000001e-05, "tps": 950, "wall": 11304.6} {"step": 164, "train_loss": 7.406603813171387, "lr": 6.560000000000001e-05, "tps": 950, "wall": 11372.8} {"step": 165, "train_loss": 7.5249409675598145, "lr": 6.6e-05, "tps": 950, "wall": 11440.8} {"step": 166, "train_loss": 7.427241325378418, "lr": 6.64e-05, "tps": 950, "wall": 11510.6} {"step": 167, "train_loss": 7.447353363037109, "lr": 6.68e-05, "tps": 950, "wall": 11577.6} {"step": 168, "train_loss": 7.498727798461914, "lr": 6.720000000000001e-05, "tps": 950, "wall": 11647.8} {"step": 169, "train_loss": 7.482230186462402, "lr": 6.76e-05, "tps": 951, "wall": 11713.7} {"step": 170, "train_loss": 7.46236515045166, "lr": 6.8e-05, "tps": 950, "wall": 11786.5} {"step": 171, "train_loss": 7.454972743988037, "lr": 6.840000000000001e-05, "tps": 950, "wall": 11859.2} {"step": 172, "train_loss": 7.340647220611572, "lr": 6.88e-05, "tps": 950, "wall": 11929.2} {"step": 173, "train_loss": 7.350194931030273, "lr": 6.92e-05, "tps": 950, "wall": 11995.7} {"step": 174, "train_loss": 7.376027584075928, "lr": 6.960000000000001e-05, "tps": 950, "wall": 12064.2} {"step": 175, "train_loss": 7.371550559997559, "lr": 7.000000000000001e-05, "tps": 950, "wall": 12135.8} {"step": 176, "train_loss": 7.384304523468018, "lr": 7.04e-05, "tps": 950, "wall": 12208.4} {"step": 177, "train_loss": 7.328788757324219, "lr": 7.08e-05, "tps": 949, "wall": 12280.8} {"step": 178, "train_loss": 7.395209312438965, "lr": 7.12e-05, "tps": 949, "wall": 12352.1} {"step": 179, "train_loss": 7.33361291885376, "lr": 7.159999999999999e-05, "tps": 949, "wall": 12420.2} {"step": 180, "train_loss": 7.377456188201904, "lr": 7.2e-05, "tps": 949, "wall": 12490.0} {"step": 181, "train_loss": 7.323899745941162, "lr": 7.240000000000001e-05, "tps": 949, "wall": 12560.0} {"step": 182, "train_loss": 7.292990207672119, "lr": 7.280000000000001e-05, "tps": 949, "wall": 12631.6} {"step": 183, "train_loss": 7.298776626586914, "lr": 7.32e-05, "tps": 949, "wall": 12698.4} {"step": 184, "train_loss": 7.287654399871826, "lr": 7.36e-05, "tps": 949, "wall": 12766.7} {"step": 185, "train_loss": 7.4055705070495605, "lr": 7.400000000000001e-05, "tps": 949, "wall": 12836.7} {"step": 186, "train_loss": 7.303425312042236, "lr": 7.44e-05, "tps": 949, "wall": 12908.0} {"step": 187, "train_loss": 7.372511863708496, "lr": 7.48e-05, "tps": 949, "wall": 12972.2} {"step": 188, "train_loss": 7.328755855560303, "lr": 7.52e-05, "tps": 950, "wall": 13036.1} {"step": 189, "train_loss": 7.291041374206543, "lr": 7.56e-05, "tps": 949, "wall": 13107.6} {"step": 190, "train_loss": 7.3111162185668945, "lr": 7.6e-05, "tps": 950, "wall": 13173.5} {"step": 191, "train_loss": 7.15685510635376, "lr": 7.640000000000001e-05, "tps": 950, "wall": 13239.9} {"step": 192, "train_loss": 7.15998649597168, "lr": 7.680000000000001e-05, "tps": 950, "wall": 13305.0} {"step": 193, "train_loss": 7.24061393737793, "lr": 7.72e-05, "tps": 950, "wall": 13375.0} {"step": 194, "train_loss": 7.124547004699707, "lr": 7.76e-05, "tps": 950, "wall": 13445.9} {"step": 195, "train_loss": 7.190953731536865, "lr": 7.8e-05, "tps": 950, "wall": 13509.5} {"step": 196, "train_loss": 7.198164939880371, "lr": 7.84e-05, "tps": 950, "wall": 13578.9} {"step": 197, "train_loss": 7.225650787353516, "lr": 7.88e-05, "tps": 950, "wall": 13645.3} {"step": 198, "train_loss": 7.273319721221924, "lr": 7.92e-05, "tps": 951, "wall": 13713.2} {"step": 199, "train_loss": 7.220339298248291, "lr": 7.960000000000001e-05, "tps": 951, "wall": 13778.7} {"step": 200, "train_loss": 7.227572441101074, "lr": 8e-05, "tps": 950, "wall": 13852.0} {"step": 201, "train_loss": 7.183426380157471, "lr": 8.04e-05, "tps": 950, "wall": 13922.3} {"step": 202, "train_loss": 7.148515701293945, "lr": 8.080000000000001e-05, "tps": 950, "wall": 13992.4} {"step": 203, "train_loss": 7.05709981918335, "lr": 8.120000000000001e-05, "tps": 950, "wall": 14061.3} {"step": 204, "train_loss": 7.183977127075195, "lr": 8.16e-05, "tps": 950, "wall": 14131.5} {"step": 205, "train_loss": 7.176589488983154, "lr": 8.2e-05, "tps": 950, "wall": 14202.5} {"step": 206, "train_loss": 7.1453857421875, "lr": 8.24e-05, "tps": 950, "wall": 14271.2} {"step": 207, "train_loss": 7.105539321899414, "lr": 8.28e-05, "tps": 950, "wall": 14342.6} {"step": 208, "train_loss": 7.100157737731934, "lr": 8.320000000000002e-05, "tps": 950, "wall": 14412.4} {"step": 209, "train_loss": 7.05872106552124, "lr": 8.360000000000001e-05, "tps": 950, "wall": 14480.1} {"step": 210, "train_loss": 7.101036071777344, "lr": 8.400000000000001e-05, "tps": 950, "wall": 14550.7} {"step": 211, "train_loss": 7.044875621795654, "lr": 8.44e-05, "tps": 950, "wall": 14615.0} {"step": 212, "train_loss": 7.097972869873047, "lr": 8.48e-05, "tps": 950, "wall": 14686.2} {"step": 213, "train_loss": 6.992912292480469, "lr": 8.52e-05, "tps": 950, "wall": 14756.0} {"step": 214, "train_loss": 7.08118200302124, "lr": 8.560000000000001e-05, "tps": 950, "wall": 14825.2} {"step": 215, "train_loss": 7.1326584815979, "lr": 8.6e-05, "tps": 950, "wall": 14895.4} {"step": 216, "train_loss": 7.148928642272949, "lr": 8.64e-05, "tps": 950, "wall": 14962.4} {"step": 217, "train_loss": 7.109501361846924, "lr": 8.68e-05, "tps": 950, "wall": 15026.5} {"step": 218, "train_loss": 7.008996963500977, "lr": 8.72e-05, "tps": 950, "wall": 15096.3} {"step": 219, "train_loss": 7.075092315673828, "lr": 8.76e-05, "tps": 950, "wall": 15163.2} {"step": 220, "train_loss": 7.020389080047607, "lr": 8.800000000000001e-05, "tps": 950, "wall": 15232.8} {"step": 221, "train_loss": 7.091025352478027, "lr": 8.840000000000001e-05, "tps": 950, "wall": 15300.6} {"step": 222, "train_loss": 7.056920051574707, "lr": 8.88e-05, "tps": 951, "wall": 15366.1} {"step": 223, "train_loss": 7.152129173278809, "lr": 8.92e-05, "tps": 951, "wall": 15435.1} {"step": 224, "train_loss": 7.064220428466797, "lr": 8.96e-05, "tps": 951, "wall": 15501.2} {"step": 225, "train_loss": 6.997412204742432, "lr": 9e-05, "tps": 951, "wall": 15570.4} {"step": 226, "train_loss": 7.063786506652832, "lr": 9.04e-05, "tps": 950, "wall": 15643.5} {"step": 227, "train_loss": 6.965593338012695, "lr": 9.080000000000001e-05, "tps": 950, "wall": 15717.4} {"step": 228, "train_loss": 7.039894104003906, "lr": 9.120000000000001e-05, "tps": 950, "wall": 15787.1} {"step": 229, "train_loss": 6.952626705169678, "lr": 9.16e-05, "tps": 950, "wall": 15855.8} {"step": 230, "train_loss": 6.942599296569824, "lr": 9.2e-05, "tps": 950, "wall": 15924.0} {"step": 231, "train_loss": 7.002662658691406, "lr": 9.240000000000001e-05, "tps": 950, "wall": 15990.5} {"step": 232, "train_loss": 6.943019866943359, "lr": 9.28e-05, "tps": 950, "wall": 16061.0} {"step": 233, "train_loss": 6.960333824157715, "lr": 9.32e-05, "tps": 950, "wall": 16131.9} {"step": 234, "train_loss": 6.937358856201172, "lr": 9.36e-05, "tps": 950, "wall": 16201.5} {"step": 235, "train_loss": 7.024790287017822, "lr": 9.4e-05, "tps": 950, "wall": 16271.5} {"step": 236, "train_loss": 6.930718898773193, "lr": 9.44e-05, "tps": 950, "wall": 16336.1} {"step": 237, "train_loss": 6.937183380126953, "lr": 9.480000000000001e-05, "tps": 950, "wall": 16403.5} {"step": 238, "train_loss": 6.8715739250183105, "lr": 9.520000000000001e-05, "tps": 950, "wall": 16474.3} {"step": 239, "train_loss": 6.93061637878418, "lr": 9.56e-05, "tps": 950, "wall": 16544.3} {"step": 240, "train_loss": 6.979474067687988, "lr": 9.6e-05, "tps": 950, "wall": 16613.8} {"step": 241, "train_loss": 6.921299934387207, "lr": 9.64e-05, "tps": 950, "wall": 16679.0} {"step": 242, "train_loss": 6.957469940185547, "lr": 9.680000000000001e-05, "tps": 950, "wall": 16746.9} {"step": 243, "train_loss": 6.879013538360596, "lr": 9.72e-05, "tps": 950, "wall": 16816.5} {"step": 244, "train_loss": 6.913014888763428, "lr": 9.76e-05, "tps": 950, "wall": 16885.7} {"step": 245, "train_loss": 7.024452209472656, "lr": 9.800000000000001e-05, "tps": 950, "wall": 16954.2} {"step": 246, "train_loss": 6.84881591796875, "lr": 9.84e-05, "tps": 950, "wall": 17026.9} {"step": 247, "train_loss": 6.880790710449219, "lr": 9.88e-05, "tps": 950, "wall": 17097.1} {"step": 248, "train_loss": 6.854176998138428, "lr": 9.920000000000001e-05, "tps": 950, "wall": 17165.3} {"step": 249, "train_loss": 6.880331039428711, "lr": 9.960000000000001e-05, "tps": 950, "wall": 17233.9} {"step": 250, "train_loss": 6.834688663482666, "lr": 0.0001, "tps": 950, "wall": 17300.9} {"step": 251, "train_loss": 6.8714141845703125, "lr": 0.0001004, "tps": 950, "wall": 17371.0} {"step": 252, "train_loss": 6.800280570983887, "lr": 0.0001008, "tps": 950, "wall": 17443.6} {"step": 253, "train_loss": 6.9418511390686035, "lr": 0.0001012, "tps": 950, "wall": 17516.2} {"step": 254, "train_loss": 6.868705749511719, "lr": 0.0001016, "tps": 950, "wall": 17586.5} {"step": 255, "train_loss": 6.815644264221191, "lr": 0.00010200000000000001, "tps": 950, "wall": 17657.7} {"step": 256, "train_loss": 6.77958345413208, "lr": 0.00010240000000000001, "tps": 950, "wall": 17723.7} {"step": 257, "train_loss": 6.937411308288574, "lr": 0.0001028, "tps": 950, "wall": 17793.5} {"step": 258, "train_loss": 6.900570869445801, "lr": 0.0001032, "tps": 950, "wall": 17861.4} {"step": 259, "train_loss": 6.812521457672119, "lr": 0.00010360000000000001, "tps": 950, "wall": 17925.4} {"step": 260, "train_loss": 6.801298141479492, "lr": 0.00010400000000000001, "tps": 950, "wall": 17994.2} {"step": 261, "train_loss": 6.8707661628723145, "lr": 0.0001044, "tps": 950, "wall": 18062.3} {"step": 262, "train_loss": 6.789557456970215, "lr": 0.0001048, "tps": 950, "wall": 18132.6} {"step": 263, "train_loss": 6.859119415283203, "lr": 0.0001052, "tps": 950, "wall": 18201.8} {"step": 264, "train_loss": 6.8055009841918945, "lr": 0.0001056, "tps": 950, "wall": 18270.5} {"step": 265, "train_loss": 6.834200382232666, "lr": 0.00010600000000000002, "tps": 950, "wall": 18339.8} {"step": 266, "train_loss": 6.800358295440674, "lr": 0.00010640000000000001, "tps": 950, "wall": 18408.0} {"step": 267, "train_loss": 6.751619338989258, "lr": 0.00010680000000000001, "tps": 950, "wall": 18478.3} {"step": 268, "train_loss": 6.717314720153809, "lr": 0.0001072, "tps": 950, "wall": 18547.6} {"step": 269, "train_loss": 6.701727867126465, "lr": 0.0001076, "tps": 950, "wall": 18619.3} {"step": 270, "train_loss": 6.80031681060791, "lr": 0.000108, "tps": 950, "wall": 18686.8} {"step": 271, "train_loss": 6.727226257324219, "lr": 0.0001084, "tps": 950, "wall": 18756.3} {"step": 272, "train_loss": 6.743181228637695, "lr": 0.0001088, "tps": 950, "wall": 18826.0} {"step": 273, "train_loss": 6.76618766784668, "lr": 0.00010920000000000001, "tps": 950, "wall": 18894.4} {"step": 274, "train_loss": 6.704598426818848, "lr": 0.00010960000000000001, "tps": 950, "wall": 18962.7} {"step": 275, "train_loss": 6.787660121917725, "lr": 0.00011, "tps": 950, "wall": 19033.8} {"step": 276, "train_loss": 6.824916362762451, "lr": 0.00011040000000000001, "tps": 950, "wall": 19102.8} {"step": 277, "train_loss": 6.768315315246582, "lr": 0.00011080000000000001, "tps": 950, "wall": 19170.7} {"step": 278, "train_loss": 6.778186798095703, "lr": 0.0001112, "tps": 950, "wall": 19240.4} {"step": 279, "train_loss": 6.891635894775391, "lr": 0.0001116, "tps": 950, "wall": 19309.4} {"step": 280, "train_loss": 6.687043190002441, "lr": 0.000112, "tps": 950, "wall": 19378.2} {"step": 281, "train_loss": 6.700618267059326, "lr": 0.0001124, "tps": 950, "wall": 19448.9} {"step": 282, "train_loss": 6.6609787940979, "lr": 0.00011280000000000002, "tps": 950, "wall": 19519.9} {"step": 283, "train_loss": 6.698223114013672, "lr": 0.00011320000000000001, "tps": 950, "wall": 19589.3} {"step": 284, "train_loss": 6.716220378875732, "lr": 0.00011360000000000001, "tps": 950, "wall": 19649.8} {"step": 285, "train_loss": 6.691295146942139, "lr": 0.000114, "tps": 950, "wall": 19718.1} {"step": 286, "train_loss": 6.73696231842041, "lr": 0.0001144, "tps": 950, "wall": 19789.9} {"step": 287, "train_loss": 6.656528472900391, "lr": 0.0001148, "tps": 950, "wall": 19859.5} {"step": 288, "train_loss": 6.752964973449707, "lr": 0.00011520000000000001, "tps": 950, "wall": 19929.0} {"step": 289, "train_loss": 6.674808025360107, "lr": 0.0001156, "tps": 950, "wall": 19998.0} {"step": 290, "train_loss": 6.720906734466553, "lr": 0.000116, "tps": 950, "wall": 20063.6} {"step": 291, "train_loss": 6.663248062133789, "lr": 0.0001164, "tps": 950, "wall": 20131.5} {"step": 292, "train_loss": 6.7036309242248535, "lr": 0.0001168, "tps": 950, "wall": 20202.6} {"step": 293, "train_loss": 6.714572906494141, "lr": 0.00011720000000000002, "tps": 950, "wall": 20274.1} {"step": 294, "train_loss": 6.666934490203857, "lr": 0.00011760000000000001, "tps": 950, "wall": 20344.4} {"step": 295, "train_loss": 6.600334167480469, "lr": 0.00011800000000000001, "tps": 950, "wall": 20414.9} {"step": 296, "train_loss": 6.655667304992676, "lr": 0.0001184, "tps": 950, "wall": 20484.6} {"step": 297, "train_loss": 6.661040782928467, "lr": 0.0001188, "tps": 950, "wall": 20551.0} {"step": 298, "train_loss": 6.632915496826172, "lr": 0.0001192, "tps": 950, "wall": 20620.1} {"step": 299, "train_loss": 6.618807792663574, "lr": 0.00011960000000000001, "tps": 950, "wall": 20689.7} {"step": 300, "train_loss": 6.614377975463867, "lr": 0.00012, "tps": 950, "wall": 20758.5} {"step": 301, "train_loss": 6.662299633026123, "lr": 0.00012040000000000001, "tps": 950, "wall": 20826.1} {"step": 302, "train_loss": 6.521039962768555, "lr": 0.00012080000000000001, "tps": 950, "wall": 20895.3} {"step": 303, "train_loss": 6.576781272888184, "lr": 0.0001212, "tps": 950, "wall": 20965.3} {"step": 304, "train_loss": 6.61014986038208, "lr": 0.0001216, "tps": 950, "wall": 21033.3} {"step": 305, "train_loss": 6.546360969543457, "lr": 0.00012200000000000001, "tps": 950, "wall": 21104.7} {"step": 306, "train_loss": 6.51076602935791, "lr": 0.00012240000000000002, "tps": 950, "wall": 21174.6} {"step": 307, "train_loss": 6.613102912902832, "lr": 0.0001228, "tps": 950, "wall": 21243.1} {"step": 308, "train_loss": 6.706655502319336, "lr": 0.0001232, "tps": 950, "wall": 21311.6} {"step": 309, "train_loss": 6.506377220153809, "lr": 0.0001236, "tps": 949, "wall": 21385.8} {"step": 310, "train_loss": 6.586215019226074, "lr": 0.000124, "tps": 950, "wall": 21452.9} {"step": 311, "train_loss": 6.556800842285156, "lr": 0.00012440000000000002, "tps": 950, "wall": 21522.6} {"step": 312, "train_loss": 6.5988078117370605, "lr": 0.0001248, "tps": 950, "wall": 21592.3} {"step": 313, "train_loss": 6.651913642883301, "lr": 0.0001252, "tps": 950, "wall": 21661.3} {"step": 314, "train_loss": 6.557708740234375, "lr": 0.00012560000000000002, "tps": 949, "wall": 21731.0} {"step": 315, "train_loss": 6.532888412475586, "lr": 0.000126, "tps": 950, "wall": 21794.6} {"step": 316, "train_loss": 6.5781683921813965, "lr": 0.0001264, "tps": 950, "wall": 21862.8} {"step": 317, "train_loss": 6.482700347900391, "lr": 0.0001268, "tps": 950, "wall": 21933.1} {"step": 318, "train_loss": 6.604485988616943, "lr": 0.0001272, "tps": 950, "wall": 21999.1} {"step": 319, "train_loss": 6.4464850425720215, "lr": 0.0001276, "tps": 950, "wall": 22068.6} {"step": 320, "train_loss": 6.5144853591918945, "lr": 0.000128, "tps": 950, "wall": 22137.1} {"step": 321, "train_loss": 6.455866813659668, "lr": 0.0001284, "tps": 950, "wall": 22207.9} {"step": 322, "train_loss": 6.486355781555176, "lr": 0.0001288, "tps": 950, "wall": 22279.8} {"step": 323, "train_loss": 6.4549031257629395, "lr": 0.0001292, "tps": 950, "wall": 22348.9} {"step": 324, "train_loss": 6.530110836029053, "lr": 0.0001296, "tps": 950, "wall": 22414.5} {"step": 325, "train_loss": 6.607028007507324, "lr": 0.00013000000000000002, "tps": 950, "wall": 22485.0} {"step": 326, "train_loss": 6.514010906219482, "lr": 0.00013040000000000003, "tps": 950, "wall": 22554.0} {"step": 327, "train_loss": 6.465014457702637, "lr": 0.0001308, "tps": 950, "wall": 22624.0} {"step": 328, "train_loss": 6.4984540939331055, "lr": 0.00013120000000000002, "tps": 950, "wall": 22688.1} {"step": 329, "train_loss": 6.462447166442871, "lr": 0.0001316, "tps": 950, "wall": 22759.2} {"step": 330, "train_loss": 6.518398761749268, "lr": 0.000132, "tps": 950, "wall": 22829.3} {"step": 331, "train_loss": 6.4680070877075195, "lr": 0.00013240000000000002, "tps": 950, "wall": 22899.9} {"step": 332, "train_loss": 6.447476863861084, "lr": 0.0001328, "tps": 950, "wall": 22970.0} {"step": 333, "train_loss": 6.381522178649902, "lr": 0.0001332, "tps": 950, "wall": 23038.9} {"step": 334, "train_loss": 6.48856782913208, "lr": 0.0001336, "tps": 950, "wall": 23104.9} {"step": 335, "train_loss": 6.46949577331543, "lr": 0.000134, "tps": 950, "wall": 23172.7} {"step": 336, "train_loss": 6.465555191040039, "lr": 0.00013440000000000001, "tps": 950, "wall": 23243.1} {"step": 337, "train_loss": 6.470580101013184, "lr": 0.0001348, "tps": 950, "wall": 23312.5} {"step": 338, "train_loss": 6.36439323425293, "lr": 0.0001352, "tps": 950, "wall": 23382.3} {"step": 339, "train_loss": 6.419361591339111, "lr": 0.0001356, "tps": 950, "wall": 23452.6} {"step": 340, "train_loss": 6.47628116607666, "lr": 0.000136, "tps": 950, "wall": 23519.9} {"step": 341, "train_loss": 6.548401355743408, "lr": 0.00013639999999999998, "tps": 950, "wall": 23589.2} {"step": 342, "train_loss": 6.477028846740723, "lr": 0.00013680000000000002, "tps": 950, "wall": 23659.1} {"step": 343, "train_loss": 6.393309593200684, "lr": 0.00013720000000000003, "tps": 950, "wall": 23727.9} {"step": 344, "train_loss": 6.475951671600342, "lr": 0.0001376, "tps": 950, "wall": 23798.7} {"step": 345, "train_loss": 6.403281211853027, "lr": 0.00013800000000000002, "tps": 949, "wall": 23869.8} {"step": 346, "train_loss": 6.365392684936523, "lr": 0.0001384, "tps": 949, "wall": 23939.0} {"step": 347, "train_loss": 6.390451431274414, "lr": 0.0001388, "tps": 949, "wall": 24009.5} {"step": 348, "train_loss": 6.302589416503906, "lr": 0.00013920000000000002, "tps": 949, "wall": 24078.9} {"step": 349, "train_loss": 6.386647701263428, "lr": 0.0001396, "tps": 950, "wall": 24144.3} {"step": 350, "train_loss": 6.399471282958984, "lr": 0.00014000000000000001, "tps": 950, "wall": 24213.0} {"step": 351, "train_loss": 6.351105690002441, "lr": 0.0001404, "tps": 949, "wall": 24284.1} {"step": 352, "train_loss": 6.503957748413086, "lr": 0.0001408, "tps": 949, "wall": 24354.1} {"step": 353, "train_loss": 6.351240634918213, "lr": 0.00014120000000000002, "tps": 949, "wall": 24421.3} {"step": 354, "train_loss": 6.482774257659912, "lr": 0.0001416, "tps": 950, "wall": 24488.3} {"step": 355, "train_loss": 6.330733776092529, "lr": 0.000142, "tps": 950, "wall": 24556.6} {"step": 356, "train_loss": 6.387248992919922, "lr": 0.0001424, "tps": 950, "wall": 24623.1} {"step": 357, "train_loss": 6.311038017272949, "lr": 0.0001428, "tps": 950, "wall": 24694.3} {"step": 358, "train_loss": 6.391651153564453, "lr": 0.00014319999999999998, "tps": 950, "wall": 24762.6} {"step": 359, "train_loss": 6.444822788238525, "lr": 0.0001436, "tps": 950, "wall": 24830.3} {"step": 360, "train_loss": 6.380366802215576, "lr": 0.000144, "tps": 950, "wall": 24898.5} {"step": 361, "train_loss": 6.473605155944824, "lr": 0.0001444, "tps": 950, "wall": 24964.3} {"step": 362, "train_loss": 6.346048355102539, "lr": 0.00014480000000000002, "tps": 950, "wall": 25030.7} {"step": 363, "train_loss": 6.364605903625488, "lr": 0.0001452, "tps": 950, "wall": 25099.2} {"step": 364, "train_loss": 6.404881954193115, "lr": 0.00014560000000000002, "tps": 950, "wall": 25169.1} {"step": 365, "train_loss": 6.300661563873291, "lr": 0.00014600000000000003, "tps": 950, "wall": 25239.8} {"step": 366, "train_loss": 6.4173736572265625, "lr": 0.0001464, "tps": 950, "wall": 25309.1} {"step": 367, "train_loss": 6.400043964385986, "lr": 0.00014680000000000002, "tps": 950, "wall": 25379.1} {"step": 368, "train_loss": 6.31707763671875, "lr": 0.0001472, "tps": 950, "wall": 25449.1} {"step": 369, "train_loss": 6.348995685577393, "lr": 0.0001476, "tps": 950, "wall": 25520.8} {"step": 370, "train_loss": 6.296699523925781, "lr": 0.00014800000000000002, "tps": 950, "wall": 25591.0} {"step": 371, "train_loss": 6.293729782104492, "lr": 0.0001484, "tps": 950, "wall": 25656.8} {"step": 372, "train_loss": 6.2845258712768555, "lr": 0.0001488, "tps": 950, "wall": 25724.2} {"step": 373, "train_loss": 6.261140823364258, "lr": 0.0001492, "tps": 946, "wall": 25892.5} {"step": 374, "train_loss": 6.251989364624023, "lr": 0.0001496, "tps": 944, "wall": 26007.0} {"step": 375, "train_loss": 6.41848087310791, "lr": 0.00015, "tps": 944, "wall": 26078.7} {"step": 376, "train_loss": 6.346327781677246, "lr": 0.0001504, "tps": 944, "wall": 26147.6} {"step": 377, "train_loss": 6.294341087341309, "lr": 0.0001508, "tps": 944, "wall": 26215.9} {"step": 378, "train_loss": 6.451261520385742, "lr": 0.0001512, "tps": 945, "wall": 26282.5} {"step": 379, "train_loss": 6.352449417114258, "lr": 0.00015160000000000003, "tps": 945, "wall": 26352.8} {"step": 380, "train_loss": 6.299004077911377, "lr": 0.000152, "tps": 944, "wall": 26423.6} {"step": 381, "train_loss": 6.297604560852051, "lr": 0.00015240000000000002, "tps": 944, "wall": 26494.4} {"step": 382, "train_loss": 6.350645065307617, "lr": 0.00015280000000000003, "tps": 944, "wall": 26566.4} {"step": 383, "train_loss": 6.373189926147461, "lr": 0.0001532, "tps": 945, "wall": 26630.3} {"step": 384, "train_loss": 6.249897480010986, "lr": 0.00015360000000000002, "tps": 945, "wall": 26699.6} {"step": 385, "train_loss": 6.31105899810791, "lr": 0.000154, "tps": 944, "wall": 26769.9} {"step": 386, "train_loss": 6.351818084716797, "lr": 0.0001544, "tps": 945, "wall": 26838.5} {"step": 0, "train_loss": 12.010716438293457, "lr": 0.0, "tps": 15150, "wall": 4.3} {"step": 1, "train_loss": 11.969657897949219, "lr": 4.0000000000000003e-07, "tps": 15699, "wall": 8.3} {"step": 2, "train_loss": 11.981173515319824, "lr": 8.000000000000001e-07, "tps": 15849, "wall": 12.4} {"step": 3, "train_loss": 11.984479904174805, "lr": 1.2000000000000002e-06, "tps": 15590, "wall": 16.8} {"step": 4, "train_loss": 11.962882995605469, "lr": 1.6000000000000001e-06, "tps": 15326, "wall": 21.4} {"step": 5, "train_loss": 11.980674743652344, "lr": 2e-06, "tps": 15037, "wall": 26.1} {"step": 6, "train_loss": 11.898042678833008, "lr": 2.4000000000000003e-06, "tps": 14871, "wall": 30.8} {"step": 7, "train_loss": 11.908845901489258, "lr": 2.8e-06, "tps": 14725, "wall": 35.6} {"step": 8, "train_loss": 11.831623077392578, "lr": 3.2000000000000003e-06, "tps": 14659, "wall": 40.2} {"step": 9, "train_loss": 11.751938819885254, "lr": 3.6000000000000003e-06, "tps": 14610, "wall": 44.9} {"step": 10, "train_loss": 11.72433853149414, "lr": 4e-06, "tps": 14576, "wall": 49.5} {"step": 11, "train_loss": 11.649327278137207, "lr": 4.4e-06, "tps": 14546, "wall": 54.1} {"step": 12, "train_loss": 11.556391716003418, "lr": 4.800000000000001e-06, "tps": 14505, "wall": 58.7} {"step": 13, "train_loss": 11.515069007873535, "lr": 5.200000000000001e-06, "tps": 14421, "wall": 63.6} {"step": 14, "train_loss": 11.432933807373047, "lr": 5.6e-06, "tps": 14349, "wall": 68.5} {"step": 15, "train_loss": 11.280631065368652, "lr": 6e-06, "tps": 14257, "wall": 73.5} {"step": 16, "train_loss": 11.243517875671387, "lr": 6.4000000000000006e-06, "tps": 14170, "wall": 78.6} {"step": 17, "train_loss": 11.123958587646484, "lr": 6.8e-06, "tps": 14090, "wall": 83.7} {"step": 18, "train_loss": 11.010825157165527, "lr": 7.2000000000000005e-06, "tps": 14023, "wall": 88.8} {"step": 19, "train_loss": 10.999862670898438, "lr": 7.6e-06, "tps": 13963, "wall": 93.9} {"step": 20, "train_loss": 10.937461853027344, "lr": 8e-06, "tps": 13905, "wall": 99.0} {"step": 21, "train_loss": 10.85239028930664, "lr": 8.400000000000001e-06, "tps": 13869, "wall": 104.0} {"step": 22, "train_loss": 10.727189064025879, "lr": 8.8e-06, "tps": 13818, "wall": 109.1} {"step": 23, "train_loss": 10.672470092773438, "lr": 9.2e-06, "tps": 13662, "wall": 115.1} {"step": 24, "train_loss": 10.674057960510254, "lr": 9.600000000000001e-06, "tps": 13610, "wall": 120.4} {"step": 25, "train_loss": 10.623744010925293, "lr": 1e-05, "tps": 13562, "wall": 125.6} {"step": 26, "train_loss": 10.523907661437988, "lr": 1.0400000000000002e-05, "tps": 13529, "wall": 130.8} {"step": 27, "train_loss": 10.469468116760254, "lr": 1.08e-05, "tps": 13504, "wall": 135.9} {"step": 28, "train_loss": 10.356780052185059, "lr": 1.12e-05, "tps": 13455, "wall": 141.2} {"step": 29, "train_loss": 10.294554710388184, "lr": 1.16e-05, "tps": 13421, "wall": 146.5} {"step": 30, "train_loss": 10.223319053649902, "lr": 1.2e-05, "tps": 13401, "wall": 151.6} {"step": 31, "train_loss": 10.260537147521973, "lr": 1.2400000000000002e-05, "tps": 13380, "wall": 156.7} {"step": 32, "train_loss": 10.180481910705566, "lr": 1.2800000000000001e-05, "tps": 13357, "wall": 161.9} {"step": 33, "train_loss": 10.115983963012695, "lr": 1.32e-05, "tps": 13338, "wall": 167.1} {"step": 34, "train_loss": 10.067758560180664, "lr": 1.36e-05, "tps": 13312, "wall": 172.3} {"step": 35, "train_loss": 10.07221794128418, "lr": 1.4e-05, "tps": 13288, "wall": 177.5} {"step": 36, "train_loss": 10.045547485351562, "lr": 1.4400000000000001e-05, "tps": 13258, "wall": 182.9} {"step": 37, "train_loss": 10.000375747680664, "lr": 1.48e-05, "tps": 13235, "wall": 188.2} {"step": 38, "train_loss": 9.990550994873047, "lr": 1.52e-05, "tps": 13217, "wall": 193.4} {"step": 39, "train_loss": 9.957462310791016, "lr": 1.56e-05, "tps": 13196, "wall": 198.6} {"step": 40, "train_loss": 9.912924766540527, "lr": 1.6e-05, "tps": 13166, "wall": 204.1} {"step": 41, "train_loss": 9.890881538391113, "lr": 1.6400000000000002e-05, "tps": 13146, "wall": 209.4} {"step": 42, "train_loss": 9.889427185058594, "lr": 1.6800000000000002e-05, "tps": 13114, "wall": 214.9} {"step": 43, "train_loss": 9.91720199584961, "lr": 1.72e-05, "tps": 13082, "wall": 220.4} {"step": 44, "train_loss": 9.838401794433594, "lr": 1.76e-05, "tps": 13016, "wall": 226.6} {"step": 45, "train_loss": 9.816916465759277, "lr": 1.8e-05, "tps": 12991, "wall": 232.1} {"step": 46, "train_loss": 9.7923583984375, "lr": 1.84e-05, "tps": 12974, "wall": 237.4} {"step": 47, "train_loss": 9.856515884399414, "lr": 1.88e-05, "tps": 12951, "wall": 242.9} {"step": 48, "train_loss": 9.773988723754883, "lr": 1.9200000000000003e-05, "tps": 12935, "wall": 248.3} {"step": 49, "train_loss": 9.736372947692871, "lr": 1.96e-05, "tps": 12916, "wall": 253.7} {"step": 50, "train_loss": 9.750191688537598, "lr": 2e-05, "tps": 12899, "wall": 259.1} {"step": 51, "train_loss": 9.75458812713623, "lr": 2.04e-05, "tps": 12882, "wall": 264.5} {"step": 52, "train_loss": 9.765801429748535, "lr": 2.0800000000000004e-05, "tps": 12859, "wall": 270.1} {"step": 53, "train_loss": 9.72293472290039, "lr": 2.12e-05, "tps": 12835, "wall": 275.7} {"step": 54, "train_loss": 9.66488265991211, "lr": 2.16e-05, "tps": 12812, "wall": 281.3} {"step": 55, "train_loss": 9.62839412689209, "lr": 2.2000000000000003e-05, "tps": 12788, "wall": 287.0} {"step": 56, "train_loss": 9.626287460327148, "lr": 2.24e-05, "tps": 12760, "wall": 292.7} {"step": 57, "train_loss": 9.62674331665039, "lr": 2.2800000000000002e-05, "tps": 12734, "wall": 298.5} {"step": 58, "train_loss": 9.62192153930664, "lr": 2.32e-05, "tps": 12694, "wall": 304.6} {"step": 59, "train_loss": 9.592950820922852, "lr": 2.36e-05, "tps": 12613, "wall": 311.7} {"step": 0, "train_loss": 12.010716438293457, "lr": 0.0, "tps": 11755, "wall": 5.6} {"step": 1, "train_loss": 11.969657897949219, "lr": 4.0000000000000003e-07, "tps": 12136, "wall": 10.8} {"step": 2, "train_loss": 11.981173515319824, "lr": 8.000000000000001e-07, "tps": 12319, "wall": 16.0} {"step": 3, "train_loss": 11.984479904174805, "lr": 1.2000000000000002e-06, "tps": 12448, "wall": 21.1} {"step": 4, "train_loss": 11.962882995605469, "lr": 1.6000000000000001e-06, "tps": 12529, "wall": 26.2} {"step": 5, "train_loss": 11.980674743652344, "lr": 2e-06, "tps": 12540, "wall": 31.4} {"step": 6, "train_loss": 11.898042678833008, "lr": 2.4000000000000003e-06, "tps": 12597, "wall": 36.4} {"step": 7, "train_loss": 11.908845901489258, "lr": 2.8e-06, "tps": 12652, "wall": 41.4} {"step": 8, "train_loss": 11.831623077392578, "lr": 3.2000000000000003e-06, "tps": 12695, "wall": 46.5} {"step": 9, "train_loss": 11.751938819885254, "lr": 3.6000000000000003e-06, "tps": 12731, "wall": 51.5} {"step": 10, "train_loss": 11.72433853149414, "lr": 4e-06, "tps": 12754, "wall": 56.5} {"step": 11, "train_loss": 11.649327278137207, "lr": 4.4e-06, "tps": 12778, "wall": 61.5} {"step": 12, "train_loss": 11.556391716003418, "lr": 4.800000000000001e-06, "tps": 12793, "wall": 66.6} {"step": 13, "train_loss": 11.515069007873535, "lr": 5.200000000000001e-06, "tps": 12806, "wall": 71.6} {"step": 14, "train_loss": 11.432933807373047, "lr": 5.6e-06, "tps": 12810, "wall": 76.7} {"step": 15, "train_loss": 11.280631065368652, "lr": 6e-06, "tps": 12810, "wall": 81.9} {"step": 16, "train_loss": 11.243517875671387, "lr": 6.4000000000000006e-06, "tps": 12801, "wall": 87.0} {"step": 17, "train_loss": 11.123958587646484, "lr": 6.8e-06, "tps": 12777, "wall": 92.3} {"step": 18, "train_loss": 11.010825157165527, "lr": 7.2000000000000005e-06, "tps": 12757, "wall": 97.6} {"step": 19, "train_loss": 10.999862670898438, "lr": 7.6e-06, "tps": 12737, "wall": 102.9} {"step": 20, "train_loss": 10.937461853027344, "lr": 8e-06, "tps": 12713, "wall": 108.3} {"step": 21, "train_loss": 10.85239028930664, "lr": 8.400000000000001e-06, "tps": 12685, "wall": 113.7} {"step": 22, "train_loss": 10.727189064025879, "lr": 8.8e-06, "tps": 12651, "wall": 119.1} {"step": 23, "train_loss": 10.672470092773438, "lr": 9.2e-06, "tps": 12618, "wall": 124.7} {"step": 24, "train_loss": 10.674057960510254, "lr": 9.600000000000001e-06, "tps": 12580, "wall": 130.2} {"step": 25, "train_loss": 10.623744010925293, "lr": 1e-05, "tps": 12536, "wall": 135.9} {"step": 26, "train_loss": 10.523907661437988, "lr": 1.0400000000000002e-05, "tps": 12490, "wall": 141.7} {"step": 27, "train_loss": 10.469468116760254, "lr": 1.08e-05, "tps": 12441, "wall": 147.5} {"step": 28, "train_loss": 10.356780052185059, "lr": 1.12e-05, "tps": 12385, "wall": 153.4} {"step": 29, "train_loss": 10.294554710388184, "lr": 1.16e-05, "tps": 12330, "wall": 159.5} {"step": 30, "train_loss": 10.223319053649902, "lr": 1.2e-05, "tps": 12275, "wall": 165.5} {"step": 31, "train_loss": 10.260537147521973, "lr": 1.2400000000000002e-05, "tps": 12215, "wall": 171.7} {"step": 32, "train_loss": 10.180481910705566, "lr": 1.2800000000000001e-05, "tps": 12154, "wall": 177.9} {"step": 33, "train_loss": 10.115983963012695, "lr": 1.32e-05, "tps": 12087, "wall": 184.3} {"step": 34, "train_loss": 10.067758560180664, "lr": 1.36e-05, "tps": 12022, "wall": 190.8} {"step": 35, "train_loss": 10.07221794128418, "lr": 1.4e-05, "tps": 11957, "wall": 197.3} {"step": 36, "train_loss": 10.045547485351562, "lr": 1.4400000000000001e-05, "tps": 11890, "wall": 203.9} {"step": 37, "train_loss": 10.000375747680664, "lr": 1.48e-05, "tps": 11826, "wall": 210.6} {"step": 38, "train_loss": 9.990550994873047, "lr": 1.52e-05, "tps": 11751, "wall": 217.5} {"step": 39, "train_loss": 9.957462310791016, "lr": 1.56e-05, "tps": 11680, "wall": 224.4} {"step": 40, "train_loss": 9.912924766540527, "lr": 1.6e-05, "tps": 11612, "wall": 231.4} {"step": 41, "train_loss": 9.890881538391113, "lr": 1.6400000000000002e-05, "tps": 11543, "wall": 238.4} {"step": 42, "train_loss": 9.889427185058594, "lr": 1.6800000000000002e-05, "tps": 11473, "wall": 245.6} {"step": 43, "train_loss": 9.91720199584961, "lr": 1.72e-05, "tps": 11405, "wall": 252.8} {"step": 44, "train_loss": 9.838401794433594, "lr": 1.76e-05, "tps": 11337, "wall": 260.1} {"step": 45, "train_loss": 9.816916465759277, "lr": 1.8e-05, "tps": 11268, "wall": 267.5} {"step": 46, "train_loss": 9.7923583984375, "lr": 1.84e-05, "tps": 11198, "wall": 275.1} {"step": 47, "train_loss": 9.856515884399414, "lr": 1.88e-05, "tps": 11134, "wall": 282.5} {"step": 48, "train_loss": 9.773988723754883, "lr": 1.9200000000000003e-05, "tps": 11071, "wall": 290.1} {"step": 49, "train_loss": 9.736372947692871, "lr": 1.96e-05, "tps": 11007, "wall": 297.7} {"step": 50, "train_loss": 9.750191688537598, "lr": 2e-05, "tps": 10948, "wall": 305.3} {"step": 51, "train_loss": 9.75458812713623, "lr": 2.04e-05, "tps": 10888, "wall": 313.0} {"step": 52, "train_loss": 9.765801429748535, "lr": 2.0800000000000004e-05, "tps": 10834, "wall": 320.6} {"step": 53, "train_loss": 9.72293472290039, "lr": 2.12e-05, "tps": 10779, "wall": 328.3} {"step": 54, "train_loss": 9.66488265991211, "lr": 2.16e-05, "tps": 10722, "wall": 336.2} {"step": 55, "train_loss": 9.62839412689209, "lr": 2.2000000000000003e-05, "tps": 10670, "wall": 343.9} {"step": 56, "train_loss": 9.626287460327148, "lr": 2.24e-05, "tps": 10625, "wall": 351.6} {"step": 57, "train_loss": 9.62674331665039, "lr": 2.2800000000000002e-05, "tps": 10579, "wall": 359.3} {"step": 58, "train_loss": 9.62192153930664, "lr": 2.32e-05, "tps": 10535, "wall": 367.0} {"step": 59, "train_loss": 9.592950820922852, "lr": 2.36e-05, "tps": 10491, "wall": 374.8} {"step": 60, "train_loss": 9.557247161865234, "lr": 2.4e-05, "tps": 10453, "wall": 382.4} {"step": 61, "train_loss": 9.518527030944824, "lr": 2.44e-05, "tps": 10413, "wall": 390.2} {"step": 62, "train_loss": 9.565380096435547, "lr": 2.4800000000000003e-05, "tps": 10373, "wall": 398.0} {"step": 63, "train_loss": 9.482965469360352, "lr": 2.52e-05, "tps": 10338, "wall": 405.7} {"step": 64, "train_loss": 9.412120819091797, "lr": 2.5600000000000002e-05, "tps": 10304, "wall": 413.4} {"step": 65, "train_loss": 9.5069580078125, "lr": 2.6000000000000002e-05, "tps": 10272, "wall": 421.1} {"step": 66, "train_loss": 9.467168807983398, "lr": 2.64e-05, "tps": 10239, "wall": 428.8} {"step": 67, "train_loss": 9.377161026000977, "lr": 2.68e-05, "tps": 10207, "wall": 436.6} {"step": 68, "train_loss": 9.370655059814453, "lr": 2.72e-05, "tps": 10178, "wall": 444.3} {"step": 69, "train_loss": 9.341713905334473, "lr": 2.7600000000000003e-05, "tps": 10148, "wall": 452.1} {"step": 70, "train_loss": 9.364286422729492, "lr": 2.8e-05, "tps": 10122, "wall": 459.7} {"step": 71, "train_loss": 9.270344734191895, "lr": 2.8400000000000003e-05, "tps": 10096, "wall": 467.4} {"step": 72, "train_loss": 9.28166389465332, "lr": 2.8800000000000002e-05, "tps": 10071, "wall": 475.0} {"step": 73, "train_loss": 9.233768463134766, "lr": 2.92e-05, "tps": 10046, "wall": 482.7} {"step": 74, "train_loss": 9.294058799743652, "lr": 2.96e-05, "tps": 10024, "wall": 490.3} {"step": 75, "train_loss": 9.224015235900879, "lr": 3e-05, "tps": 10002, "wall": 497.9} {"step": 76, "train_loss": 9.157353401184082, "lr": 3.04e-05, "tps": 9980, "wall": 505.6} {"step": 77, "train_loss": 9.2096586227417, "lr": 3.08e-05, "tps": 9957, "wall": 513.4} {"step": 78, "train_loss": 9.179288864135742, "lr": 3.12e-05, "tps": 9937, "wall": 521.0} {"step": 79, "train_loss": 9.085453033447266, "lr": 3.16e-05, "tps": 9917, "wall": 528.6} {"step": 80, "train_loss": 9.107942581176758, "lr": 3.2e-05, "tps": 9898, "wall": 536.3} {"step": 81, "train_loss": 9.085135459899902, "lr": 3.24e-05, "tps": 9879, "wall": 544.0} {"step": 82, "train_loss": 9.015960693359375, "lr": 3.2800000000000004e-05, "tps": 9861, "wall": 551.6} {"step": 83, "train_loss": 9.06379508972168, "lr": 3.32e-05, "tps": 9844, "wall": 559.2} {"step": 84, "train_loss": 8.99739933013916, "lr": 3.3600000000000004e-05, "tps": 9826, "wall": 566.9} {"step": 85, "train_loss": 8.945883750915527, "lr": 3.4e-05, "tps": 9806, "wall": 574.7} {"step": 86, "train_loss": 8.933882713317871, "lr": 3.44e-05, "tps": 9790, "wall": 582.4} {"step": 87, "train_loss": 8.958731651306152, "lr": 3.4800000000000006e-05, "tps": 9774, "wall": 590.0} {"step": 88, "train_loss": 8.918476104736328, "lr": 3.52e-05, "tps": 9758, "wall": 597.7} {"step": 89, "train_loss": 8.855347633361816, "lr": 3.56e-05, "tps": 9743, "wall": 605.3} {"step": 90, "train_loss": 8.866905212402344, "lr": 3.6e-05, "tps": 9728, "wall": 613.0} {"step": 91, "train_loss": 8.829865455627441, "lr": 3.6400000000000004e-05, "tps": 9713, "wall": 620.7} {"step": 92, "train_loss": 8.799142837524414, "lr": 3.68e-05, "tps": 9700, "wall": 628.3} {"step": 93, "train_loss": 8.740829467773438, "lr": 3.72e-05, "tps": 9685, "wall": 636.0} {"step": 94, "train_loss": 8.792405128479004, "lr": 3.76e-05, "tps": 9671, "wall": 643.7} {"step": 95, "train_loss": 8.686074256896973, "lr": 3.8e-05, "tps": 9659, "wall": 651.3} {"step": 96, "train_loss": 8.677027702331543, "lr": 3.8400000000000005e-05, "tps": 9646, "wall": 659.0} {"step": 97, "train_loss": 8.693831443786621, "lr": 3.88e-05, "tps": 9634, "wall": 666.6} {"step": 98, "train_loss": 8.663509368896484, "lr": 3.92e-05, "tps": 9621, "wall": 674.3} {"step": 99, "train_loss": 8.636314392089844, "lr": 3.96e-05, "tps": 9609, "wall": 682.0} {"step": 100, "train_loss": 8.546420097351074, "lr": 4e-05, "tps": 9598, "wall": 689.6} {"step": 101, "train_loss": 8.571012496948242, "lr": 4.0400000000000006e-05, "tps": 9584, "wall": 697.4} {"step": 102, "train_loss": 8.568342208862305, "lr": 4.08e-05, "tps": 9573, "wall": 705.1} {"step": 103, "train_loss": 8.628839492797852, "lr": 4.12e-05, "tps": 9561, "wall": 712.8} {"step": 104, "train_loss": 8.5676851272583, "lr": 4.160000000000001e-05, "tps": 9550, "wall": 720.5} {"step": 105, "train_loss": 8.497340202331543, "lr": 4.2000000000000004e-05, "tps": 9540, "wall": 728.2} {"step": 106, "train_loss": 8.448352813720703, "lr": 4.24e-05, "tps": 9530, "wall": 735.8} {"step": 107, "train_loss": 8.481856346130371, "lr": 4.2800000000000004e-05, "tps": 9519, "wall": 743.5} {"step": 108, "train_loss": 8.367953300476074, "lr": 4.32e-05, "tps": 9508, "wall": 751.3} {"step": 109, "train_loss": 8.396543502807617, "lr": 4.36e-05, "tps": 9498, "wall": 759.0} {"step": 110, "train_loss": 8.405295372009277, "lr": 4.4000000000000006e-05, "tps": 9488, "wall": 766.7} {"step": 111, "train_loss": 8.329401969909668, "lr": 4.44e-05, "tps": 9478, "wall": 774.4} {"step": 112, "train_loss": 8.313867568969727, "lr": 4.48e-05, "tps": 9468, "wall": 782.1} {"step": 113, "train_loss": 8.262494087219238, "lr": 4.52e-05, "tps": 9460, "wall": 789.8} {"step": 114, "train_loss": 8.293413162231445, "lr": 4.5600000000000004e-05, "tps": 9450, "wall": 797.4} {"step": 115, "train_loss": 8.254898071289062, "lr": 4.6e-05, "tps": 9441, "wall": 805.2} {"step": 116, "train_loss": 8.216276168823242, "lr": 4.64e-05, "tps": 9431, "wall": 813.0} {"step": 117, "train_loss": 8.169356346130371, "lr": 4.68e-05, "tps": 9421, "wall": 820.8} {"step": 118, "train_loss": 8.24614429473877, "lr": 4.72e-05, "tps": 9413, "wall": 828.5} {"step": 119, "train_loss": 8.201354026794434, "lr": 4.7600000000000005e-05, "tps": 9404, "wall": 836.2} {"step": 120, "train_loss": 8.185944557189941, "lr": 4.8e-05, "tps": 9396, "wall": 843.9} {"step": 121, "train_loss": 8.069718360900879, "lr": 4.8400000000000004e-05, "tps": 9388, "wall": 851.6} {"step": 122, "train_loss": 8.208297729492188, "lr": 4.88e-05, "tps": 9381, "wall": 859.2} {"step": 123, "train_loss": 8.085550308227539, "lr": 4.92e-05, "tps": 9373, "wall": 867.0} {"step": 124, "train_loss": 8.03810977935791, "lr": 4.9600000000000006e-05, "tps": 9364, "wall": 874.7} {"step": 125, "train_loss": 8.05516529083252, "lr": 5e-05, "tps": 9357, "wall": 882.5} {"step": 126, "train_loss": 7.997936725616455, "lr": 5.04e-05, "tps": 9348, "wall": 890.3} {"step": 127, "train_loss": 7.9177446365356445, "lr": 5.08e-05, "tps": 9342, "wall": 897.9} {"step": 128, "train_loss": 8.007017135620117, "lr": 5.1200000000000004e-05, "tps": 9336, "wall": 905.5} {"step": 129, "train_loss": 7.972557067871094, "lr": 5.16e-05, "tps": 9329, "wall": 913.2} {"step": 130, "train_loss": 8.009966850280762, "lr": 5.2000000000000004e-05, "tps": 9322, "wall": 920.9} {"step": 131, "train_loss": 8.015609741210938, "lr": 5.24e-05, "tps": 9315, "wall": 928.6} {"step": 132, "train_loss": 8.031258583068848, "lr": 5.28e-05, "tps": 9308, "wall": 936.4} {"step": 133, "train_loss": 7.954874038696289, "lr": 5.3200000000000006e-05, "tps": 9301, "wall": 944.1} {"step": 134, "train_loss": 7.80820894241333, "lr": 5.36e-05, "tps": 9294, "wall": 951.8} {"step": 135, "train_loss": 7.913119316101074, "lr": 5.4e-05, "tps": 9289, "wall": 959.5} {"step": 136, "train_loss": 7.79510498046875, "lr": 5.44e-05, "tps": 9282, "wall": 967.2} {"step": 137, "train_loss": 7.834118366241455, "lr": 5.4800000000000004e-05, "tps": 9276, "wall": 975.0} {"step": 138, "train_loss": 7.765554428100586, "lr": 5.520000000000001e-05, "tps": 9269, "wall": 982.7} {"step": 139, "train_loss": 7.864133834838867, "lr": 5.56e-05, "tps": 9263, "wall": 990.4} {"step": 140, "train_loss": 7.720888614654541, "lr": 5.6e-05, "tps": 9256, "wall": 998.3} {"step": 141, "train_loss": 7.791794300079346, "lr": 5.640000000000001e-05, "tps": 9250, "wall": 1006.0} {"step": 142, "train_loss": 7.801263809204102, "lr": 5.6800000000000005e-05, "tps": 9244, "wall": 1013.7} {"step": 143, "train_loss": 7.684856414794922, "lr": 5.72e-05, "tps": 9240, "wall": 1021.3} {"step": 144, "train_loss": 7.761735916137695, "lr": 5.7600000000000004e-05, "tps": 9234, "wall": 1029.1} {"step": 145, "train_loss": 7.694338321685791, "lr": 5.8e-05, "tps": 9229, "wall": 1036.8} {"step": 146, "train_loss": 7.6453704833984375, "lr": 5.84e-05, "tps": 9223, "wall": 1044.5} {"step": 147, "train_loss": 7.595042705535889, "lr": 5.8800000000000006e-05, "tps": 9216, "wall": 1052.3} {"step": 148, "train_loss": 7.574378490447998, "lr": 5.92e-05, "tps": 9211, "wall": 1060.1} {"step": 149, "train_loss": 7.547858238220215, "lr": 5.96e-05, "tps": 9205, "wall": 1067.9} {"step": 150, "train_loss": 7.622703552246094, "lr": 6e-05, "tps": 9200, "wall": 1075.6} {"step": 151, "train_loss": 7.601994514465332, "lr": 6.0400000000000004e-05, "tps": 9195, "wall": 1083.3} {"step": 152, "train_loss": 7.610236644744873, "lr": 6.08e-05, "tps": 9190, "wall": 1091.1} {"step": 153, "train_loss": 7.596889972686768, "lr": 6.120000000000001e-05, "tps": 9185, "wall": 1098.7} {"step": 154, "train_loss": 7.53411865234375, "lr": 6.16e-05, "tps": 9180, "wall": 1106.4} {"step": 155, "train_loss": 7.533018589019775, "lr": 6.2e-05, "tps": 9175, "wall": 1114.3} {"step": 156, "train_loss": 7.608554840087891, "lr": 6.24e-05, "tps": 9170, "wall": 1122.0} {"step": 157, "train_loss": 7.584914684295654, "lr": 6.280000000000001e-05, "tps": 9165, "wall": 1129.7} {"step": 158, "train_loss": 7.5255231857299805, "lr": 6.32e-05, "tps": 9161, "wall": 1137.4} {"step": 159, "train_loss": 7.4985432624816895, "lr": 6.36e-05, "tps": 9156, "wall": 1145.2} {"step": 160, "train_loss": 7.560420989990234, "lr": 6.4e-05, "tps": 9152, "wall": 1152.8} {"step": 161, "train_loss": 7.505138397216797, "lr": 6.44e-05, "tps": 9148, "wall": 1160.5} {"step": 162, "train_loss": 7.4167094230651855, "lr": 6.48e-05, "tps": 9144, "wall": 1168.2} {"step": 163, "train_loss": 7.479063987731934, "lr": 6.520000000000001e-05, "tps": 9138, "wall": 1176.1} {"step": 164, "train_loss": 7.403266906738281, "lr": 6.560000000000001e-05, "tps": 9134, "wall": 1183.8} {"step": 165, "train_loss": 7.523157119750977, "lr": 6.6e-05, "tps": 9130, "wall": 1191.5} {"step": 166, "train_loss": 7.427882194519043, "lr": 6.64e-05, "tps": 9126, "wall": 1199.2} {"step": 167, "train_loss": 7.444023132324219, "lr": 6.68e-05, "tps": 9122, "wall": 1206.9} {"step": 168, "train_loss": 7.502746105194092, "lr": 6.720000000000001e-05, "tps": 9118, "wall": 1214.6} {"step": 169, "train_loss": 7.482631683349609, "lr": 6.76e-05, "tps": 9114, "wall": 1222.3} {"step": 170, "train_loss": 7.465363502502441, "lr": 6.8e-05, "tps": 9110, "wall": 1230.1} {"step": 171, "train_loss": 7.453548431396484, "lr": 6.840000000000001e-05, "tps": 9105, "wall": 1237.9} {"step": 172, "train_loss": 7.33956241607666, "lr": 6.88e-05, "tps": 9102, "wall": 1245.6} {"step": 173, "train_loss": 7.356197357177734, "lr": 6.92e-05, "tps": 9098, "wall": 1253.3} {"step": 174, "train_loss": 7.369173526763916, "lr": 6.960000000000001e-05, "tps": 9094, "wall": 1261.0} {"step": 175, "train_loss": 7.375523567199707, "lr": 7.000000000000001e-05, "tps": 9091, "wall": 1268.7} {"step": 176, "train_loss": 7.382493495941162, "lr": 7.04e-05, "tps": 9088, "wall": 1276.3} {"step": 177, "train_loss": 7.334375381469727, "lr": 7.08e-05, "tps": 9084, "wall": 1284.1} {"step": 178, "train_loss": 7.39451789855957, "lr": 7.12e-05, "tps": 9080, "wall": 1291.8} {"step": 179, "train_loss": 7.333327770233154, "lr": 7.159999999999999e-05, "tps": 9077, "wall": 1299.5} {"step": 180, "train_loss": 7.37626838684082, "lr": 7.2e-05, "tps": 9074, "wall": 1307.2} {"step": 181, "train_loss": 7.321794509887695, "lr": 7.240000000000001e-05, "tps": 9070, "wall": 1315.0} {"step": 182, "train_loss": 7.290129661560059, "lr": 7.280000000000001e-05, "tps": 9066, "wall": 1322.7} {"step": 183, "train_loss": 7.301864147186279, "lr": 7.32e-05, "tps": 9063, "wall": 1330.5} {"step": 184, "train_loss": 7.287424087524414, "lr": 7.36e-05, "tps": 9060, "wall": 1338.2} {"step": 185, "train_loss": 7.40167236328125, "lr": 7.400000000000001e-05, "tps": 9056, "wall": 1345.9} {"step": 186, "train_loss": 7.30732536315918, "lr": 7.44e-05, "tps": 9052, "wall": 1353.7} {"step": 187, "train_loss": 7.3695173263549805, "lr": 7.48e-05, "tps": 9049, "wall": 1361.5} {"step": 188, "train_loss": 7.33498477935791, "lr": 7.52e-05, "tps": 9046, "wall": 1369.1} {"step": 189, "train_loss": 7.29096794128418, "lr": 7.56e-05, "tps": 9043, "wall": 1376.9} {"step": 190, "train_loss": 7.324825286865234, "lr": 7.6e-05, "tps": 9040, "wall": 1384.6} {"step": 191, "train_loss": 7.163296699523926, "lr": 7.640000000000001e-05, "tps": 9038, "wall": 1392.2} {"step": 192, "train_loss": 7.160993576049805, "lr": 7.680000000000001e-05, "tps": 9035, "wall": 1399.9} {"step": 193, "train_loss": 7.254158973693848, "lr": 7.72e-05, "tps": 9032, "wall": 1407.6} {"step": 194, "train_loss": 7.130463600158691, "lr": 7.76e-05, "tps": 9028, "wall": 1415.5} {"step": 195, "train_loss": 7.196925163269043, "lr": 7.8e-05, "tps": 9025, "wall": 1423.2} {"step": 196, "train_loss": 7.206007480621338, "lr": 7.84e-05, "tps": 9021, "wall": 1431.0} {"step": 197, "train_loss": 7.2311553955078125, "lr": 7.88e-05, "tps": 9019, "wall": 1438.7} {"step": 198, "train_loss": 7.276366233825684, "lr": 7.92e-05, "tps": 9016, "wall": 1446.4} {"step": 199, "train_loss": 7.229197025299072, "lr": 7.960000000000001e-05, "tps": 9014, "wall": 1454.0} {"step": 200, "train_loss": 7.224910259246826, "lr": 8e-05, "tps": 9011, "wall": 1461.8} {"step": 201, "train_loss": 7.1847076416015625, "lr": 8.04e-05, "tps": 9008, "wall": 1469.5} {"step": 202, "train_loss": 7.146562576293945, "lr": 8.080000000000001e-05, "tps": 9005, "wall": 1477.3} {"step": 203, "train_loss": 7.0555877685546875, "lr": 8.120000000000001e-05, "tps": 9002, "wall": 1485.0} {"step": 204, "train_loss": 7.185199737548828, "lr": 8.16e-05, "tps": 8999, "wall": 1492.8} {"step": 205, "train_loss": 7.175101280212402, "lr": 8.2e-05, "tps": 8997, "wall": 1500.5} {"step": 206, "train_loss": 7.158578872680664, "lr": 8.24e-05, "tps": 8994, "wall": 1508.2} {"step": 207, "train_loss": 7.1070146560668945, "lr": 8.28e-05, "tps": 8991, "wall": 1516.0} {"step": 208, "train_loss": 7.111502647399902, "lr": 8.320000000000002e-05, "tps": 8989, "wall": 1523.7} {"step": 209, "train_loss": 7.058177471160889, "lr": 8.360000000000001e-05, "tps": 8986, "wall": 1531.5} {"step": 210, "train_loss": 7.106117248535156, "lr": 8.400000000000001e-05, "tps": 8984, "wall": 1539.2} {"step": 211, "train_loss": 7.045265197753906, "lr": 8.44e-05, "tps": 8981, "wall": 1546.9} {"step": 212, "train_loss": 7.104379653930664, "lr": 8.48e-05, "tps": 8979, "wall": 1554.6} {"step": 213, "train_loss": 6.994361877441406, "lr": 8.52e-05, "tps": 8976, "wall": 1562.4} {"step": 214, "train_loss": 7.086819171905518, "lr": 8.560000000000001e-05, "tps": 8974, "wall": 1570.1} {"step": 215, "train_loss": 7.129000663757324, "lr": 8.6e-05, "tps": 8972, "wall": 1577.7} {"step": 216, "train_loss": 7.151320457458496, "lr": 8.64e-05, "tps": 8970, "wall": 1585.4} {"step": 217, "train_loss": 7.112557411193848, "lr": 8.68e-05, "tps": 8967, "wall": 1593.3} {"step": 218, "train_loss": 7.019594192504883, "lr": 8.72e-05, "tps": 8965, "wall": 1600.9} {"step": 219, "train_loss": 7.079097747802734, "lr": 8.76e-05, "tps": 8962, "wall": 1608.7} {"step": 220, "train_loss": 7.027222633361816, "lr": 8.800000000000001e-05, "tps": 8960, "wall": 1616.3} {"step": 221, "train_loss": 7.101859092712402, "lr": 8.840000000000001e-05, "tps": 8958, "wall": 1624.1} {"step": 222, "train_loss": 7.060854434967041, "lr": 8.88e-05, "tps": 8956, "wall": 1631.8} {"step": 223, "train_loss": 7.158807277679443, "lr": 8.92e-05, "tps": 8954, "wall": 1639.5} {"step": 224, "train_loss": 7.0644941329956055, "lr": 8.96e-05, "tps": 8951, "wall": 1647.2} {"step": 225, "train_loss": 6.997409343719482, "lr": 9e-05, "tps": 8949, "wall": 1655.0} {"step": 226, "train_loss": 7.068938255310059, "lr": 9.04e-05, "tps": 8947, "wall": 1662.6} {"step": 227, "train_loss": 6.967785358428955, "lr": 9.080000000000001e-05, "tps": 8945, "wall": 1670.4} {"step": 0, "train_loss": 12.010716438293457, "lr": 0.0, "tps": 15208, "wall": 4.3} {"step": 1, "train_loss": 11.969657897949219, "lr": 4.0000000000000003e-07, "tps": 16009, "wall": 8.2} {"step": 2, "train_loss": 11.981173515319824, "lr": 8.000000000000001e-07, "tps": 16050, "wall": 12.2} {"step": 3, "train_loss": 11.984479904174805, "lr": 1.2000000000000002e-06, "tps": 15992, "wall": 16.4} {"step": 4, "train_loss": 11.962882995605469, "lr": 1.6000000000000001e-06, "tps": 15895, "wall": 20.6} {"step": 5, "train_loss": 11.980674743652344, "lr": 2e-06, "tps": 15775, "wall": 24.9} {"step": 6, "train_loss": 11.898042678833008, "lr": 2.4000000000000003e-06, "tps": 15665, "wall": 29.3} {"step": 7, "train_loss": 11.908845901489258, "lr": 2.8e-06, "tps": 15573, "wall": 33.7} {"step": 8, "train_loss": 11.831623077392578, "lr": 3.2000000000000003e-06, "tps": 15485, "wall": 38.1} {"step": 9, "train_loss": 11.751938819885254, "lr": 3.6000000000000003e-06, "tps": 15380, "wall": 42.6} {"step": 10, "train_loss": 11.72433853149414, "lr": 4e-06, "tps": 15280, "wall": 47.2} {"step": 11, "train_loss": 11.649327278137207, "lr": 4.4e-06, "tps": 15181, "wall": 51.8} {"step": 12, "train_loss": 11.556391716003418, "lr": 4.800000000000001e-06, "tps": 15049, "wall": 56.6} {"step": 13, "train_loss": 11.515069007873535, "lr": 5.200000000000001e-06, "tps": 14894, "wall": 61.6} {"step": 14, "train_loss": 11.432933807373047, "lr": 5.6e-06, "tps": 14730, "wall": 66.7} {"step": 15, "train_loss": 11.280631065368652, "lr": 6e-06, "tps": 14576, "wall": 71.9} {"step": 16, "train_loss": 11.243517875671387, "lr": 6.4000000000000006e-06, "tps": 14436, "wall": 77.2} {"step": 17, "train_loss": 11.123958587646484, "lr": 6.8e-06, "tps": 14294, "wall": 82.5} {"step": 18, "train_loss": 11.010825157165527, "lr": 7.2000000000000005e-06, "tps": 14185, "wall": 87.8} {"step": 19, "train_loss": 10.999862670898438, "lr": 7.6e-06, "tps": 14080, "wall": 93.1} {"step": 20, "train_loss": 10.937461853027344, "lr": 8e-06, "tps": 13974, "wall": 98.5} {"step": 21, "train_loss": 10.85239028930664, "lr": 8.400000000000001e-06, "tps": 13877, "wall": 103.9} {"step": 22, "train_loss": 10.727189064025879, "lr": 8.8e-06, "tps": 13789, "wall": 109.3} {"step": 23, "train_loss": 10.672470092773438, "lr": 9.2e-06, "tps": 13710, "wall": 114.7} {"step": 24, "train_loss": 10.674057960510254, "lr": 9.600000000000001e-06, "tps": 13639, "wall": 120.1} {"step": 25, "train_loss": 10.623744010925293, "lr": 1e-05, "tps": 13579, "wall": 125.5} {"step": 26, "train_loss": 10.523907661437988, "lr": 1.0400000000000002e-05, "tps": 13512, "wall": 130.9} {"step": 27, "train_loss": 10.469468116760254, "lr": 1.08e-05, "tps": 13461, "wall": 136.3} {"step": 28, "train_loss": 10.356780052185059, "lr": 1.12e-05, "tps": 13413, "wall": 141.7} {"step": 29, "train_loss": 10.294554710388184, "lr": 1.16e-05, "tps": 13363, "wall": 147.1} {"step": 30, "train_loss": 10.223319053649902, "lr": 1.2e-05, "tps": 13314, "wall": 152.6} {"step": 31, "train_loss": 10.260537147521973, "lr": 1.2400000000000002e-05, "tps": 13269, "wall": 158.0} {"step": 32, "train_loss": 10.180481910705566, "lr": 1.2800000000000001e-05, "tps": 13221, "wall": 163.6} {"step": 33, "train_loss": 10.115983963012695, "lr": 1.32e-05, "tps": 13171, "wall": 169.2} {"step": 34, "train_loss": 10.067758560180664, "lr": 1.36e-05, "tps": 13118, "wall": 174.9} {"step": 35, "train_loss": 10.07221794128418, "lr": 1.4e-05, "tps": 13063, "wall": 180.6} {"step": 36, "train_loss": 10.045547485351562, "lr": 1.4400000000000001e-05, "tps": 13006, "wall": 186.4} {"step": 37, "train_loss": 10.000375747680664, "lr": 1.48e-05, "tps": 12940, "wall": 192.5} {"step": 38, "train_loss": 9.990550994873047, "lr": 1.52e-05, "tps": 12870, "wall": 198.6} {"step": 39, "train_loss": 9.957462310791016, "lr": 1.56e-05, "tps": 12800, "wall": 204.8} {"step": 40, "train_loss": 9.912924766540527, "lr": 1.6e-05, "tps": 12724, "wall": 211.2} {"step": 41, "train_loss": 9.890881538391113, "lr": 1.6400000000000002e-05, "tps": 12645, "wall": 217.7} {"step": 42, "train_loss": 9.889427185058594, "lr": 1.6800000000000002e-05, "tps": 12566, "wall": 224.3} {"step": 43, "train_loss": 9.91720199584961, "lr": 1.72e-05, "tps": 12486, "wall": 230.9} {"step": 44, "train_loss": 9.838401794433594, "lr": 1.76e-05, "tps": 12401, "wall": 237.8} {"step": 45, "train_loss": 9.816916465759277, "lr": 1.8e-05, "tps": 12314, "wall": 244.8} {"step": 46, "train_loss": 9.7923583984375, "lr": 1.84e-05, "tps": 12216, "wall": 252.1} {"step": 47, "train_loss": 9.856515884399414, "lr": 1.88e-05, "tps": 12125, "wall": 259.4} {"step": 48, "train_loss": 9.773988723754883, "lr": 1.9200000000000003e-05, "tps": 12028, "wall": 267.0} {"step": 49, "train_loss": 9.736372947692871, "lr": 1.96e-05, "tps": 11940, "wall": 274.4} {"step": 50, "train_loss": 9.750191688537598, "lr": 2e-05, "tps": 11850, "wall": 282.1} {"step": 51, "train_loss": 9.75458812713623, "lr": 2.04e-05, "tps": 11756, "wall": 289.9} {"step": 52, "train_loss": 9.765801429748535, "lr": 2.0800000000000004e-05, "tps": 11670, "wall": 297.6} {"step": 53, "train_loss": 9.72293472290039, "lr": 2.12e-05, "tps": 11582, "wall": 305.5} {"step": 54, "train_loss": 9.66488265991211, "lr": 2.16e-05, "tps": 11492, "wall": 313.6} {"step": 55, "train_loss": 9.62839412689209, "lr": 2.2000000000000003e-05, "tps": 11409, "wall": 321.7} {"step": 56, "train_loss": 9.626287460327148, "lr": 2.24e-05, "tps": 11328, "wall": 329.7} {"step": 57, "train_loss": 9.62674331665039, "lr": 2.2800000000000002e-05, "tps": 11254, "wall": 337.7} {"step": 58, "train_loss": 9.62192153930664, "lr": 2.32e-05, "tps": 11178, "wall": 345.9} {"step": 59, "train_loss": 9.592950820922852, "lr": 2.36e-05, "tps": 11108, "wall": 354.0} {"step": 60, "train_loss": 9.557247161865234, "lr": 2.4e-05, "tps": 11039, "wall": 362.1} {"step": 61, "train_loss": 9.518527030944824, "lr": 2.44e-05, "tps": 10968, "wall": 370.4} {"step": 62, "train_loss": 9.565380096435547, "lr": 2.4800000000000003e-05, "tps": 10906, "wall": 378.6} {"step": 63, "train_loss": 9.482965469360352, "lr": 2.52e-05, "tps": 10845, "wall": 386.7} {"step": 64, "train_loss": 9.412120819091797, "lr": 2.5600000000000002e-05, "tps": 10791, "wall": 394.8} {"step": 65, "train_loss": 9.5069580078125, "lr": 2.6000000000000002e-05, "tps": 10738, "wall": 402.8} {"step": 66, "train_loss": 9.467168807983398, "lr": 2.64e-05, "tps": 10691, "wall": 410.7} {"step": 67, "train_loss": 9.377161026000977, "lr": 2.68e-05, "tps": 10645, "wall": 418.6} {"step": 68, "train_loss": 9.370655059814453, "lr": 2.72e-05, "tps": 10602, "wall": 426.5} {"step": 69, "train_loss": 9.341713905334473, "lr": 2.7600000000000003e-05, "tps": 10556, "wall": 434.6} {"step": 70, "train_loss": 9.364286422729492, "lr": 2.8e-05, "tps": 10516, "wall": 442.5} {"step": 71, "train_loss": 9.270344734191895, "lr": 2.8400000000000003e-05, "tps": 10473, "wall": 450.5} {"step": 72, "train_loss": 9.28166389465332, "lr": 2.8800000000000002e-05, "tps": 10431, "wall": 458.6} {"step": 73, "train_loss": 9.233768463134766, "lr": 2.92e-05, "tps": 10397, "wall": 466.4} {"step": 74, "train_loss": 9.294058799743652, "lr": 2.96e-05, "tps": 10365, "wall": 474.2} {"step": 75, "train_loss": 9.224015235900879, "lr": 3e-05, "tps": 10335, "wall": 481.9} {"step": 76, "train_loss": 9.157353401184082, "lr": 3.04e-05, "tps": 10306, "wall": 489.6} {"step": 77, "train_loss": 9.2096586227417, "lr": 3.08e-05, "tps": 10276, "wall": 497.4} {"step": 78, "train_loss": 9.179288864135742, "lr": 3.12e-05, "tps": 10248, "wall": 505.2} {"step": 79, "train_loss": 9.085453033447266, "lr": 3.16e-05, "tps": 10222, "wall": 512.9} {"step": 80, "train_loss": 9.107942581176758, "lr": 3.2e-05, "tps": 10198, "wall": 520.5} {"step": 81, "train_loss": 9.085135459899902, "lr": 3.24e-05, "tps": 10173, "wall": 528.2} {"step": 82, "train_loss": 9.015960693359375, "lr": 3.2800000000000004e-05, "tps": 10148, "wall": 536.0} {"step": 83, "train_loss": 9.06379508972168, "lr": 3.32e-05, "tps": 10125, "wall": 543.7} {"step": 84, "train_loss": 8.99739933013916, "lr": 3.3600000000000004e-05, "tps": 10100, "wall": 551.5} {"step": 85, "train_loss": 8.945883750915527, "lr": 3.4e-05, "tps": 10078, "wall": 559.2} {"step": 86, "train_loss": 8.933882713317871, "lr": 3.44e-05, "tps": 10058, "wall": 566.8} {"step": 87, "train_loss": 8.958731651306152, "lr": 3.4800000000000006e-05, "tps": 10039, "wall": 574.5} {"step": 88, "train_loss": 8.918476104736328, "lr": 3.52e-05, "tps": 10020, "wall": 582.1} {"step": 89, "train_loss": 8.855347633361816, "lr": 3.56e-05, "tps": 10001, "wall": 589.7} {"step": 90, "train_loss": 8.866905212402344, "lr": 3.6e-05, "tps": 9983, "wall": 597.4} {"step": 91, "train_loss": 8.829865455627441, "lr": 3.6400000000000004e-05, "tps": 9966, "wall": 604.9} {"step": 92, "train_loss": 8.799142837524414, "lr": 3.68e-05, "tps": 9947, "wall": 612.7} {"step": 93, "train_loss": 8.740829467773438, "lr": 3.72e-05, "tps": 9930, "wall": 620.4} {"step": 94, "train_loss": 8.792405128479004, "lr": 3.76e-05, "tps": 9913, "wall": 628.0} {"step": 95, "train_loss": 8.686074256896973, "lr": 3.8e-05, "tps": 9899, "wall": 635.5} {"step": 96, "train_loss": 8.677027702331543, "lr": 3.8400000000000005e-05, "tps": 9884, "wall": 643.1} {"step": 97, "train_loss": 8.693831443786621, "lr": 3.88e-05, "tps": 9869, "wall": 650.7} {"step": 98, "train_loss": 8.663509368896484, "lr": 3.92e-05, "tps": 9856, "wall": 658.3} {"step": 99, "train_loss": 8.636314392089844, "lr": 3.96e-05, "tps": 9840, "wall": 666.0} {"step": 100, "train_loss": 8.546420097351074, "lr": 4e-05, "tps": 9825, "wall": 673.7} {"step": 101, "train_loss": 8.571012496948242, "lr": 4.0400000000000006e-05, "tps": 9810, "wall": 681.4} {"step": 102, "train_loss": 8.568342208862305, "lr": 4.08e-05, "tps": 9797, "wall": 689.0} {"step": 103, "train_loss": 8.628839492797852, "lr": 4.12e-05, "tps": 9783, "wall": 696.7} {"step": 104, "train_loss": 8.5676851272583, "lr": 4.160000000000001e-05, "tps": 9771, "wall": 704.2} {"step": 105, "train_loss": 8.497340202331543, "lr": 4.2000000000000004e-05, "tps": 9756, "wall": 712.0} {"step": 106, "train_loss": 8.448352813720703, "lr": 4.24e-05, "tps": 9742, "wall": 719.7} {"step": 107, "train_loss": 8.481856346130371, "lr": 4.2800000000000004e-05, "tps": 9730, "wall": 727.4} {"step": 108, "train_loss": 8.367953300476074, "lr": 4.32e-05, "tps": 9716, "wall": 735.1} {"step": 109, "train_loss": 8.396543502807617, "lr": 4.36e-05, "tps": 9704, "wall": 742.8} {"step": 110, "train_loss": 8.405295372009277, "lr": 4.4000000000000006e-05, "tps": 9692, "wall": 750.6} {"step": 111, "train_loss": 8.329401969909668, "lr": 4.44e-05, "tps": 9679, "wall": 758.3} {"step": 112, "train_loss": 8.313867568969727, "lr": 4.48e-05, "tps": 9666, "wall": 766.1} {"step": 113, "train_loss": 8.262494087219238, "lr": 4.52e-05, "tps": 9655, "wall": 773.8} {"step": 114, "train_loss": 8.293413162231445, "lr": 4.5600000000000004e-05, "tps": 9643, "wall": 781.5} {"step": 115, "train_loss": 8.254898071289062, "lr": 4.6e-05, "tps": 9632, "wall": 789.3} {"step": 116, "train_loss": 8.216276168823242, "lr": 4.64e-05, "tps": 9619, "wall": 797.1} {"step": 117, "train_loss": 8.169356346130371, "lr": 4.68e-05, "tps": 9608, "wall": 804.8} {"step": 118, "train_loss": 8.24614429473877, "lr": 4.72e-05, "tps": 9598, "wall": 812.5} {"step": 119, "train_loss": 8.201354026794434, "lr": 4.7600000000000005e-05, "tps": 9588, "wall": 820.2} {"step": 120, "train_loss": 8.185944557189941, "lr": 4.8e-05, "tps": 9576, "wall": 828.0} {"step": 121, "train_loss": 8.069718360900879, "lr": 4.8400000000000004e-05, "tps": 9566, "wall": 835.7} {"step": 122, "train_loss": 8.208297729492188, "lr": 4.88e-05, "tps": 9555, "wall": 843.6} {"step": 123, "train_loss": 8.085550308227539, "lr": 4.92e-05, "tps": 9544, "wall": 851.5} {"step": 124, "train_loss": 8.03810977935791, "lr": 4.9600000000000006e-05, "tps": 9534, "wall": 859.2} {"step": 125, "train_loss": 8.05516529083252, "lr": 5e-05, "tps": 9524, "wall": 867.0} {"step": 126, "train_loss": 7.997936725616455, "lr": 5.04e-05, "tps": 9515, "wall": 874.7} {"step": 127, "train_loss": 7.9177446365356445, "lr": 5.08e-05, "tps": 9507, "wall": 882.3} {"step": 128, "train_loss": 8.007017135620117, "lr": 5.1200000000000004e-05, "tps": 9498, "wall": 890.0} {"step": 129, "train_loss": 7.972557067871094, "lr": 5.16e-05, "tps": 9489, "wall": 897.8} {"step": 130, "train_loss": 8.009966850280762, "lr": 5.2000000000000004e-05, "tps": 9482, "wall": 905.4} {"step": 131, "train_loss": 8.015609741210938, "lr": 5.24e-05, "tps": 9473, "wall": 913.2} {"step": 132, "train_loss": 8.031258583068848, "lr": 5.28e-05, "tps": 9458, "wall": 921.5} {"step": 133, "train_loss": 7.954874038696289, "lr": 5.3200000000000006e-05, "tps": 9444, "wall": 929.8} {"step": 134, "train_loss": 7.80820894241333, "lr": 5.36e-05, "tps": 9434, "wall": 937.8} {"step": 135, "train_loss": 7.913119316101074, "lr": 5.4e-05, "tps": 9425, "wall": 945.6} {"step": 136, "train_loss": 7.79510498046875, "lr": 5.44e-05, "tps": 9415, "wall": 953.6} {"step": 137, "train_loss": 7.834118366241455, "lr": 5.4800000000000004e-05, "tps": 9405, "wall": 961.5} {"step": 138, "train_loss": 7.765554428100586, "lr": 5.520000000000001e-05, "tps": 9394, "wall": 969.6} {"step": 139, "train_loss": 7.864133834838867, "lr": 5.56e-05, "tps": 9385, "wall": 977.5} {"step": 140, "train_loss": 7.720888614654541, "lr": 5.6e-05, "tps": 9377, "wall": 985.4} {"step": 141, "train_loss": 7.791794300079346, "lr": 5.640000000000001e-05, "tps": 9369, "wall": 993.3} {"step": 142, "train_loss": 7.801263809204102, "lr": 5.6800000000000005e-05, "tps": 9361, "wall": 1001.1} {"step": 143, "train_loss": 7.684856414794922, "lr": 5.72e-05, "tps": 9353, "wall": 1009.0} {"step": 144, "train_loss": 7.761735916137695, "lr": 5.7600000000000004e-05, "tps": 9345, "wall": 1016.9} {"step": 145, "train_loss": 7.694338321685791, "lr": 5.8e-05, "tps": 9337, "wall": 1024.7} {"step": 146, "train_loss": 7.6453704833984375, "lr": 5.84e-05, "tps": 9328, "wall": 1032.7} {"step": 147, "train_loss": 7.595042705535889, "lr": 5.8800000000000006e-05, "tps": 9321, "wall": 1040.6} {"step": 148, "train_loss": 7.574378490447998, "lr": 5.92e-05, "tps": 9314, "wall": 1048.3} {"step": 149, "train_loss": 7.547858238220215, "lr": 5.96e-05, "tps": 9308, "wall": 1056.1} {"step": 150, "train_loss": 7.622703552246094, "lr": 6e-05, "tps": 9301, "wall": 1063.9} {"step": 151, "train_loss": 7.601994514465332, "lr": 6.0400000000000004e-05, "tps": 9294, "wall": 1071.7} {"step": 152, "train_loss": 7.610236644744873, "lr": 6.08e-05, "tps": 9288, "wall": 1079.5} {"step": 153, "train_loss": 7.596889972686768, "lr": 6.120000000000001e-05, "tps": 9281, "wall": 1087.4} {"step": 154, "train_loss": 7.53411865234375, "lr": 6.16e-05, "tps": 9274, "wall": 1095.3} {"step": 155, "train_loss": 7.533018589019775, "lr": 6.2e-05, "tps": 9267, "wall": 1103.1} {"step": 156, "train_loss": 7.608554840087891, "lr": 6.24e-05, "tps": 9261, "wall": 1110.9} {"step": 157, "train_loss": 7.584914684295654, "lr": 6.280000000000001e-05, "tps": 9254, "wall": 1118.8} {"step": 158, "train_loss": 7.5255231857299805, "lr": 6.32e-05, "tps": 9249, "wall": 1126.6} {"step": 159, "train_loss": 7.4985432624816895, "lr": 6.36e-05, "tps": 9243, "wall": 1134.4} {"step": 160, "train_loss": 7.560420989990234, "lr": 6.4e-05, "tps": 9237, "wall": 1142.2} {"step": 161, "train_loss": 7.505138397216797, "lr": 6.44e-05, "tps": 9231, "wall": 1150.0} {"step": 162, "train_loss": 7.4167094230651855, "lr": 6.48e-05, "tps": 9224, "wall": 1158.0} {"step": 163, "train_loss": 7.479063987731934, "lr": 6.520000000000001e-05, "tps": 9219, "wall": 1165.8} {"step": 164, "train_loss": 7.403266906738281, "lr": 6.560000000000001e-05, "tps": 9213, "wall": 1173.6} {"step": 165, "train_loss": 7.523157119750977, "lr": 6.6e-05, "tps": 9207, "wall": 1181.5} {"step": 166, "train_loss": 7.427882194519043, "lr": 6.64e-05, "tps": 9202, "wall": 1189.4} {"step": 167, "train_loss": 7.444023132324219, "lr": 6.68e-05, "tps": 9197, "wall": 1197.1} {"step": 168, "train_loss": 7.502746105194092, "lr": 6.720000000000001e-05, "tps": 9190, "wall": 1205.1} {"step": 169, "train_loss": 7.482631683349609, "lr": 6.76e-05, "tps": 9176, "wall": 1214.0} {"step": 170, "train_loss": 7.465363502502441, "lr": 6.8e-05, "tps": 9161, "wall": 1223.2} {"step": 171, "train_loss": 7.453548431396484, "lr": 6.840000000000001e-05, "tps": 9154, "wall": 1231.3} {"step": 172, "train_loss": 7.33956241607666, "lr": 6.88e-05, "tps": 9148, "wall": 1239.3} {"step": 173, "train_loss": 7.356197357177734, "lr": 6.92e-05, "tps": 9143, "wall": 1247.2} {"step": 174, "train_loss": 7.369173526763916, "lr": 6.960000000000001e-05, "tps": 9136, "wall": 1255.2} {"step": 175, "train_loss": 7.375523567199707, "lr": 7.000000000000001e-05, "tps": 9130, "wall": 1263.3} {"step": 176, "train_loss": 7.382493495941162, "lr": 7.04e-05, "tps": 9125, "wall": 1271.2} {"step": 177, "train_loss": 7.334375381469727, "lr": 7.08e-05, "tps": 9119, "wall": 1279.1} {"step": 178, "train_loss": 7.39451789855957, "lr": 7.12e-05, "tps": 9110, "wall": 1287.7} {"step": 179, "train_loss": 7.333327770233154, "lr": 7.159999999999999e-05, "tps": 9103, "wall": 1295.8} {"step": 180, "train_loss": 7.37626838684082, "lr": 7.2e-05, "tps": 9089, "wall": 1305.1} {"step": 181, "train_loss": 7.321794509887695, "lr": 7.240000000000001e-05, "tps": 9074, "wall": 1314.4} {"step": 182, "train_loss": 7.290129661560059, "lr": 7.280000000000001e-05, "tps": 9058, "wall": 1323.9} {"step": 183, "train_loss": 7.301864147186279, "lr": 7.32e-05, "tps": 9041, "wall": 1333.7} {"step": 184, "train_loss": 7.287424087524414, "lr": 7.36e-05, "tps": 9023, "wall": 1343.6} {"step": 185, "train_loss": 7.40167236328125, "lr": 7.400000000000001e-05, "tps": 9005, "wall": 1353.5} {"step": 186, "train_loss": 7.30732536315918, "lr": 7.44e-05, "tps": 8987, "wall": 1363.5} {"step": 187, "train_loss": 7.3695173263549805, "lr": 7.48e-05, "tps": 8968, "wall": 1373.7} {"step": 188, "train_loss": 7.33498477935791, "lr": 7.52e-05, "tps": 8954, "wall": 1383.3} {"step": 189, "train_loss": 7.29096794128418, "lr": 7.56e-05, "tps": 8936, "wall": 1393.4} {"step": 190, "train_loss": 7.324825286865234, "lr": 7.6e-05, "tps": 8919, "wall": 1403.4} {"step": 191, "train_loss": 7.163296699523926, "lr": 7.640000000000001e-05, "tps": 8904, "wall": 1413.1} {"step": 192, "train_loss": 7.160993576049805, "lr": 7.680000000000001e-05, "tps": 8888, "wall": 1423.0} {"step": 193, "train_loss": 7.254158973693848, "lr": 7.72e-05, "tps": 8871, "wall": 1433.1} {"step": 194, "train_loss": 7.130463600158691, "lr": 7.76e-05, "tps": 8856, "wall": 1442.9} {"step": 195, "train_loss": 7.196925163269043, "lr": 7.8e-05, "tps": 8841, "wall": 1452.8} {"step": 196, "train_loss": 7.206007480621338, "lr": 7.84e-05, "tps": 8825, "wall": 1462.9} {"step": 197, "train_loss": 7.2311553955078125, "lr": 7.88e-05, "tps": 8811, "wall": 1472.6} {"step": 198, "train_loss": 7.276366233825684, "lr": 7.92e-05, "tps": 8806, "wall": 1480.9} {"step": 199, "train_loss": 7.229197025299072, "lr": 7.960000000000001e-05, "tps": 8800, "wall": 1489.3} {"step": 200, "train_loss": 7.224910259246826, "lr": 8e-05, "tps": 8794, "wall": 1497.8} {"step": 201, "train_loss": 7.1847076416015625, "lr": 8.04e-05, "tps": 8787, "wall": 1506.5} {"step": 202, "train_loss": 7.146562576293945, "lr": 8.080000000000001e-05, "tps": 8779, "wall": 1515.4} {"step": 203, "train_loss": 7.0555877685546875, "lr": 8.120000000000001e-05, "tps": 8763, "wall": 1525.6} {"step": 204, "train_loss": 7.185199737548828, "lr": 8.16e-05, "tps": 8748, "wall": 1535.8} {"step": 205, "train_loss": 7.175101280212402, "lr": 8.2e-05, "tps": 8733, "wall": 1545.8} {"step": 206, "train_loss": 7.158578872680664, "lr": 8.24e-05, "tps": 8719, "wall": 1555.9} {"step": 207, "train_loss": 7.1070146560668945, "lr": 8.28e-05, "tps": 8704, "wall": 1566.1} {"step": 208, "train_loss": 7.111502647399902, "lr": 8.320000000000002e-05, "tps": 8690, "wall": 1576.2} {"step": 209, "train_loss": 7.058177471160889, "lr": 8.360000000000001e-05, "tps": 8676, "wall": 1586.3} {"step": 210, "train_loss": 7.106117248535156, "lr": 8.400000000000001e-05, "tps": 8661, "wall": 1596.4} {"step": 211, "train_loss": 7.045265197753906, "lr": 8.44e-05, "tps": 8648, "wall": 1606.6} {"step": 212, "train_loss": 7.104379653930664, "lr": 8.48e-05, "tps": 8634, "wall": 1616.6} {"step": 213, "train_loss": 6.994361877441406, "lr": 8.52e-05, "tps": 8621, "wall": 1626.7} {"step": 214, "train_loss": 7.086819171905518, "lr": 8.560000000000001e-05, "tps": 8608, "wall": 1636.7} {"step": 215, "train_loss": 7.129000663757324, "lr": 8.6e-05, "tps": 8595, "wall": 1646.9} {"step": 216, "train_loss": 7.151320457458496, "lr": 8.64e-05, "tps": 8585, "wall": 1656.5} {"step": 217, "train_loss": 7.112557411193848, "lr": 8.68e-05, "tps": 8571, "wall": 1666.7} {"step": 218, "train_loss": 7.019594192504883, "lr": 8.72e-05, "tps": 8555, "wall": 1677.5} {"step": 219, "train_loss": 7.079097747802734, "lr": 8.76e-05, "tps": 8547, "wall": 1686.9} {"step": 220, "train_loss": 7.027222633361816, "lr": 8.800000000000001e-05, "tps": 8534, "wall": 1697.0} {"step": 221, "train_loss": 7.101859092712402, "lr": 8.840000000000001e-05, "tps": 8523, "wall": 1707.0} {"step": 222, "train_loss": 7.060854434967041, "lr": 8.88e-05, "tps": 8513, "wall": 1716.7} {"step": 223, "train_loss": 7.158807277679443, "lr": 8.92e-05, "tps": 8502, "wall": 1726.6} {"step": 224, "train_loss": 7.0644941329956055, "lr": 8.96e-05, "tps": 8490, "wall": 1736.7} {"step": 225, "train_loss": 6.997409343719482, "lr": 9e-05, "tps": 8482, "wall": 1746.1} {"step": 226, "train_loss": 7.068938255310059, "lr": 9.04e-05, "tps": 8470, "wall": 1756.2} {"step": 227, "train_loss": 6.967785358428955, "lr": 9.080000000000001e-05, "tps": 8461, "wall": 1766.0} {"step": 228, "train_loss": 7.041006565093994, "lr": 9.120000000000001e-05, "tps": 8451, "wall": 1775.8} {"step": 229, "train_loss": 6.949634552001953, "lr": 9.16e-05, "tps": 8441, "wall": 1785.6} {"step": 230, "train_loss": 6.94615364074707, "lr": 9.2e-05, "tps": 8433, "wall": 1795.2} {"step": 231, "train_loss": 7.006380081176758, "lr": 9.240000000000001e-05, "tps": 8423, "wall": 1805.0} {"step": 232, "train_loss": 6.948620796203613, "lr": 9.28e-05, "tps": 8413, "wall": 1815.0} {"step": 233, "train_loss": 6.969529151916504, "lr": 9.32e-05, "tps": 8403, "wall": 1824.9} {"step": 234, "train_loss": 6.937190055847168, "lr": 9.36e-05, "tps": 8393, "wall": 1834.8} {"step": 235, "train_loss": 7.02977180480957, "lr": 9.4e-05, "tps": 8384, "wall": 1844.6} {"step": 236, "train_loss": 6.917998790740967, "lr": 9.44e-05, "tps": 8375, "wall": 1854.5} {"step": 237, "train_loss": 6.939247131347656, "lr": 9.480000000000001e-05, "tps": 8367, "wall": 1864.0} {"step": 238, "train_loss": 6.855594158172607, "lr": 9.520000000000001e-05, "tps": 8359, "wall": 1873.7} {"step": 239, "train_loss": 6.915129661560059, "lr": 9.56e-05, "tps": 8351, "wall": 1883.3} {"step": 240, "train_loss": 6.972247123718262, "lr": 9.6e-05, "tps": 8343, "wall": 1893.1} {"step": 241, "train_loss": 6.902806282043457, "lr": 9.64e-05, "tps": 8336, "wall": 1902.5} {"step": 242, "train_loss": 6.944427013397217, "lr": 9.680000000000001e-05, "tps": 8327, "wall": 1912.5} {"step": 243, "train_loss": 6.861973762512207, "lr": 9.72e-05, "tps": 8318, "wall": 1922.2} {"step": 244, "train_loss": 6.898660659790039, "lr": 9.76e-05, "tps": 8309, "wall": 1932.4} {"step": 245, "train_loss": 7.0103302001953125, "lr": 9.800000000000001e-05, "tps": 8302, "wall": 1941.7} {"step": 246, "train_loss": 6.834933757781982, "lr": 9.84e-05, "tps": 8292, "wall": 1952.1} {"step": 247, "train_loss": 6.871231555938721, "lr": 9.88e-05, "tps": 8282, "wall": 1962.4} {"step": 248, "train_loss": 6.844915390014648, "lr": 9.920000000000001e-05, "tps": 8274, "wall": 1972.1} {"step": 249, "train_loss": 6.867319107055664, "lr": 9.960000000000001e-05, "tps": 8267, "wall": 1981.8} {"step": 250, "train_loss": 6.830150604248047, "lr": 0.0001, "tps": 8257, "wall": 1992.0} {"step": 251, "train_loss": 6.861065864562988, "lr": 0.0001004, "tps": 8247, "wall": 2002.4} {"step": 252, "train_loss": 6.793179988861084, "lr": 0.0001008, "tps": 8236, "wall": 2013.0} {"step": 253, "train_loss": 6.928295612335205, "lr": 0.0001012, "tps": 8229, "wall": 2022.7} {"step": 254, "train_loss": 6.860710620880127, "lr": 0.0001016, "tps": 8226, "wall": 2031.5} {"step": 255, "train_loss": 6.808207988739014, "lr": 0.00010200000000000001, "tps": 8223, "wall": 2040.2} {"step": 256, "train_loss": 6.7704949378967285, "lr": 0.00010240000000000001, "tps": 8222, "wall": 2048.4} {"step": 257, "train_loss": 6.92716121673584, "lr": 0.0001028, "tps": 8220, "wall": 2056.8} {"step": 258, "train_loss": 6.888156890869141, "lr": 0.0001032, "tps": 8220, "wall": 2064.9} {"step": 259, "train_loss": 6.802608966827393, "lr": 0.00010360000000000001, "tps": 8218, "wall": 2073.2} {"step": 260, "train_loss": 6.793181896209717, "lr": 0.00010400000000000001, "tps": 8217, "wall": 2081.5} {"step": 261, "train_loss": 6.872438430786133, "lr": 0.0001044, "tps": 8216, "wall": 2089.7} {"step": 262, "train_loss": 6.780069351196289, "lr": 0.0001048, "tps": 8215, "wall": 2097.9} {"step": 263, "train_loss": 6.851951599121094, "lr": 0.0001052, "tps": 8214, "wall": 2106.1} {"step": 264, "train_loss": 6.796478748321533, "lr": 0.0001056, "tps": 8214, "wall": 2114.2} {"step": 265, "train_loss": 6.8257293701171875, "lr": 0.00010600000000000002, "tps": 8213, "wall": 2122.3} {"step": 266, "train_loss": 6.793089866638184, "lr": 0.00010640000000000001, "tps": 8213, "wall": 2130.4} {"step": 267, "train_loss": 6.746341705322266, "lr": 0.00010680000000000001, "tps": 8213, "wall": 2138.3} {"step": 268, "train_loss": 6.707442760467529, "lr": 0.0001072, "tps": 8213, "wall": 2146.3} {"step": 269, "train_loss": 6.698787689208984, "lr": 0.0001076, "tps": 8214, "wall": 2154.2} {"step": 270, "train_loss": 6.797616958618164, "lr": 0.000108, "tps": 8214, "wall": 2162.0} {"step": 271, "train_loss": 6.727644920349121, "lr": 0.0001084, "tps": 8214, "wall": 2170.0} {"step": 272, "train_loss": 6.738304615020752, "lr": 0.0001088, "tps": 8214, "wall": 2178.0} {"step": 273, "train_loss": 6.76308012008667, "lr": 0.00010920000000000001, "tps": 8214, "wall": 2185.9} {"step": 274, "train_loss": 6.700827121734619, "lr": 0.00010960000000000001, "tps": 8215, "wall": 2193.8} {"step": 275, "train_loss": 6.783364295959473, "lr": 0.00011, "tps": 8215, "wall": 2201.6} {"step": 276, "train_loss": 6.816576957702637, "lr": 0.00011040000000000001, "tps": 8216, "wall": 2209.4} {"step": 277, "train_loss": 6.767274379730225, "lr": 0.00011080000000000001, "tps": 8217, "wall": 2217.2} {"step": 278, "train_loss": 6.771701812744141, "lr": 0.0001112, "tps": 8217, "wall": 2225.0} {"step": 279, "train_loss": 6.883213996887207, "lr": 0.0001116, "tps": 8217, "wall": 2232.9} {"step": 280, "train_loss": 6.681258201599121, "lr": 0.000112, "tps": 8217, "wall": 2241.0} {"step": 281, "train_loss": 6.695852279663086, "lr": 0.0001124, "tps": 8218, "wall": 2248.8} {"step": 282, "train_loss": 6.652372360229492, "lr": 0.00011280000000000002, "tps": 8219, "wall": 2256.5} {"step": 283, "train_loss": 6.691885948181152, "lr": 0.00011320000000000001, "tps": 8220, "wall": 2264.2} {"step": 284, "train_loss": 6.7239861488342285, "lr": 0.00011360000000000001, "tps": 8220, "wall": 2272.1} {"step": 285, "train_loss": 6.685210704803467, "lr": 0.000114, "tps": 8221, "wall": 2279.9} {"step": 286, "train_loss": 6.7303466796875, "lr": 0.0001144, "tps": 8221, "wall": 2287.7} {"step": 287, "train_loss": 6.647150993347168, "lr": 0.0001148, "tps": 8221, "wall": 2295.6} {"step": 288, "train_loss": 6.748040199279785, "lr": 0.00011520000000000001, "tps": 8222, "wall": 2303.4} {"step": 289, "train_loss": 6.667152404785156, "lr": 0.0001156, "tps": 8223, "wall": 2311.2} {"step": 290, "train_loss": 6.720929145812988, "lr": 0.000116, "tps": 8223, "wall": 2319.0} {"step": 291, "train_loss": 6.6657233238220215, "lr": 0.0001164, "tps": 8224, "wall": 2326.7} {"step": 292, "train_loss": 6.697333335876465, "lr": 0.0001168, "tps": 8223, "wall": 2335.0} {"step": 293, "train_loss": 6.703644752502441, "lr": 0.00011720000000000002, "tps": 8222, "wall": 2343.2} {"step": 294, "train_loss": 6.6643524169921875, "lr": 0.00011760000000000001, "tps": 8221, "wall": 2351.4} {"step": 295, "train_loss": 6.595453262329102, "lr": 0.00011800000000000001, "tps": 8222, "wall": 2359.2} {"step": 296, "train_loss": 6.646897315979004, "lr": 0.0001184, "tps": 8222, "wall": 2367.1} {"step": 297, "train_loss": 6.663555145263672, "lr": 0.0001188, "tps": 8222, "wall": 2375.1} {"step": 298, "train_loss": 6.621366024017334, "lr": 0.0001192, "tps": 8223, "wall": 2383.0} {"step": 299, "train_loss": 6.61474609375, "lr": 0.00011960000000000001, "tps": 8223, "wall": 2390.8} {"step": 300, "train_loss": 6.614176273345947, "lr": 0.00012, "tps": 8223, "wall": 2398.8} {"step": 301, "train_loss": 6.668420314788818, "lr": 0.00012040000000000001, "tps": 8224, "wall": 2406.5} {"step": 302, "train_loss": 6.533787727355957, "lr": 0.00012080000000000001, "tps": 8224, "wall": 2414.5} {"step": 303, "train_loss": 6.579748153686523, "lr": 0.0001212, "tps": 8224, "wall": 2422.4} {"step": 304, "train_loss": 6.624425888061523, "lr": 0.0001216, "tps": 8224, "wall": 2430.4} {"step": 305, "train_loss": 6.551595687866211, "lr": 0.00012200000000000001, "tps": 8224, "wall": 2438.3} {"step": 306, "train_loss": 6.523261070251465, "lr": 0.00012240000000000002, "tps": 8224, "wall": 2446.2} {"step": 307, "train_loss": 6.631338119506836, "lr": 0.0001228, "tps": 8225, "wall": 2454.0} {"step": 308, "train_loss": 6.712448596954346, "lr": 0.0001232, "tps": 8225, "wall": 2461.9} {"step": 309, "train_loss": 6.5173420906066895, "lr": 0.0001236, "tps": 8226, "wall": 2469.7} {"step": 310, "train_loss": 6.582144737243652, "lr": 0.000124, "tps": 8226, "wall": 2477.7} {"step": 311, "train_loss": 6.5684967041015625, "lr": 0.00012440000000000002, "tps": 8226, "wall": 2485.6} {"step": 312, "train_loss": 6.608975410461426, "lr": 0.0001248, "tps": 8226, "wall": 2493.4} {"step": 313, "train_loss": 6.6701884269714355, "lr": 0.0001252, "tps": 8227, "wall": 2501.2} {"step": 314, "train_loss": 6.567470073699951, "lr": 0.00012560000000000002, "tps": 8227, "wall": 2509.1} {"step": 315, "train_loss": 6.540990829467773, "lr": 0.000126, "tps": 8227, "wall": 2517.0} {"step": 316, "train_loss": 6.5851569175720215, "lr": 0.0001264, "tps": 8228, "wall": 2524.8} {"step": 317, "train_loss": 6.481107234954834, "lr": 0.0001268, "tps": 8228, "wall": 2532.8} {"step": 318, "train_loss": 6.609848976135254, "lr": 0.0001272, "tps": 8228, "wall": 2540.6} {"step": 319, "train_loss": 6.4503583908081055, "lr": 0.0001276, "tps": 8229, "wall": 2548.4} {"step": 320, "train_loss": 6.507472515106201, "lr": 0.000128, "tps": 8229, "wall": 2556.2} {"step": 321, "train_loss": 6.458249092102051, "lr": 0.0001284, "tps": 8230, "wall": 2564.0} {"step": 322, "train_loss": 6.472954750061035, "lr": 0.0001288, "tps": 8230, "wall": 2571.8} {"step": 323, "train_loss": 6.451105117797852, "lr": 0.0001292, "tps": 8231, "wall": 2579.6} {"step": 324, "train_loss": 6.520007133483887, "lr": 0.0001296, "tps": 8231, "wall": 2587.4} {"step": 325, "train_loss": 6.603074073791504, "lr": 0.00013000000000000002, "tps": 8231, "wall": 2595.4} {"step": 326, "train_loss": 6.516155242919922, "lr": 0.00013040000000000003, "tps": 8232, "wall": 2603.2} {"step": 327, "train_loss": 6.4657816886901855, "lr": 0.0001308, "tps": 8232, "wall": 2611.1} {"step": 328, "train_loss": 6.5054473876953125, "lr": 0.00013120000000000002, "tps": 8232, "wall": 2619.0} {"step": 329, "train_loss": 6.458938121795654, "lr": 0.0001316, "tps": 8233, "wall": 2626.8} {"step": 330, "train_loss": 6.521381855010986, "lr": 0.000132, "tps": 8233, "wall": 2634.7} {"step": 331, "train_loss": 6.463772773742676, "lr": 0.00013240000000000002, "tps": 8233, "wall": 2642.7} {"step": 332, "train_loss": 6.451740741729736, "lr": 0.0001328, "tps": 8232, "wall": 2650.9} {"step": 333, "train_loss": 6.378885269165039, "lr": 0.0001332, "tps": 8232, "wall": 2658.8} {"step": 334, "train_loss": 6.495925426483154, "lr": 0.0001336, "tps": 8232, "wall": 2666.9} {"step": 335, "train_loss": 6.472762107849121, "lr": 0.000134, "tps": 8232, "wall": 2674.8} {"step": 336, "train_loss": 6.4720072746276855, "lr": 0.00013440000000000001, "tps": 8232, "wall": 2682.7} {"step": 337, "train_loss": 6.472258567810059, "lr": 0.0001348, "tps": 8232, "wall": 2690.5} {"step": 338, "train_loss": 6.3701701164245605, "lr": 0.0001352, "tps": 8233, "wall": 2698.4} {"step": 339, "train_loss": 6.421249866485596, "lr": 0.0001356, "tps": 8233, "wall": 2706.2} {"step": 340, "train_loss": 6.4820942878723145, "lr": 0.000136, "tps": 8233, "wall": 2714.1} {"step": 341, "train_loss": 6.5441083908081055, "lr": 0.00013639999999999998, "tps": 8234, "wall": 2722.0} {"step": 342, "train_loss": 6.470989227294922, "lr": 0.00013680000000000002, "tps": 8234, "wall": 2729.8} {"step": 343, "train_loss": 6.382760047912598, "lr": 0.00013720000000000003, "tps": 8234, "wall": 2737.7} {"step": 344, "train_loss": 6.468560695648193, "lr": 0.0001376, "tps": 8235, "wall": 2745.5} {"step": 345, "train_loss": 6.399266242980957, "lr": 0.00013800000000000002, "tps": 8235, "wall": 2753.4} {"step": 346, "train_loss": 6.351539611816406, "lr": 0.0001384, "tps": 8235, "wall": 2761.2} {"step": 347, "train_loss": 6.384849548339844, "lr": 0.0001388, "tps": 8235, "wall": 2769.1} {"step": 348, "train_loss": 6.312592506408691, "lr": 0.00013920000000000002, "tps": 8235, "wall": 2777.3} {"step": 349, "train_loss": 6.390865325927734, "lr": 0.0001396, "tps": 8235, "wall": 2785.4} {"step": 350, "train_loss": 6.405248165130615, "lr": 0.00014000000000000001, "tps": 8234, "wall": 2793.4} {"step": 351, "train_loss": 6.351445198059082, "lr": 0.0001404, "tps": 8234, "wall": 2801.5} {"step": 352, "train_loss": 6.5202765464782715, "lr": 0.0001408, "tps": 8233, "wall": 2809.7} {"step": 353, "train_loss": 6.3550567626953125, "lr": 0.00014120000000000002, "tps": 8233, "wall": 2817.7} {"step": 354, "train_loss": 6.469671249389648, "lr": 0.0001416, "tps": 8233, "wall": 2825.7} {"step": 355, "train_loss": 6.326552391052246, "lr": 0.000142, "tps": 8233, "wall": 2833.7} {"step": 356, "train_loss": 6.381911277770996, "lr": 0.0001424, "tps": 8233, "wall": 2841.5} {"step": 357, "train_loss": 6.304686546325684, "lr": 0.0001428, "tps": 8234, "wall": 2849.4} {"step": 358, "train_loss": 6.392787456512451, "lr": 0.00014319999999999998, "tps": 8234, "wall": 2857.2} {"step": 359, "train_loss": 6.445312023162842, "lr": 0.0001436, "tps": 8234, "wall": 2865.0} {"step": 360, "train_loss": 6.3740081787109375, "lr": 0.000144, "tps": 8235, "wall": 2872.9} {"step": 361, "train_loss": 6.481538772583008, "lr": 0.0001444, "tps": 8234, "wall": 2880.9} {"step": 362, "train_loss": 6.353227138519287, "lr": 0.00014480000000000002, "tps": 8234, "wall": 2888.9} {"step": 363, "train_loss": 6.357383728027344, "lr": 0.0001452, "tps": 8234, "wall": 2896.8} {"step": 364, "train_loss": 6.413549423217773, "lr": 0.00014560000000000002, "tps": 8231, "wall": 2905.9} {"step": 365, "train_loss": 6.305184841156006, "lr": 0.00014600000000000003, "tps": 8227, "wall": 2915.5} {"step": 366, "train_loss": 6.423856258392334, "lr": 0.0001464, "tps": 8222, "wall": 2925.2} {"step": 367, "train_loss": 6.398845672607422, "lr": 0.00014680000000000002, "tps": 8217, "wall": 2934.8} {"step": 368, "train_loss": 6.332057952880859, "lr": 0.0001472, "tps": 8212, "wall": 2944.5} {"step": 369, "train_loss": 6.350677967071533, "lr": 0.0001476, "tps": 8208, "wall": 2954.2} {"step": 370, "train_loss": 6.2995924949646, "lr": 0.00014800000000000002, "tps": 8203, "wall": 2963.9} {"step": 371, "train_loss": 6.29654598236084, "lr": 0.0001484, "tps": 8198, "wall": 2973.7} {"step": 372, "train_loss": 6.283391952514648, "lr": 0.0001488, "tps": 8193, "wall": 2983.5} {"step": 373, "train_loss": 6.262945175170898, "lr": 0.0001492, "tps": 8191, "wall": 2992.3} {"step": 374, "train_loss": 6.256057262420654, "lr": 0.0001496, "tps": 8191, "wall": 3000.3} {"step": 375, "train_loss": 6.422400951385498, "lr": 0.00015, "tps": 8190, "wall": 3008.4} {"step": 376, "train_loss": 6.343482494354248, "lr": 0.0001504, "tps": 8190, "wall": 3016.6} {"step": 377, "train_loss": 6.288861274719238, "lr": 0.0001508, "tps": 8190, "wall": 3024.7} {"step": 378, "train_loss": 6.456772804260254, "lr": 0.0001512, "tps": 8189, "wall": 3032.8} {"step": 379, "train_loss": 6.354854583740234, "lr": 0.00015160000000000003, "tps": 8189, "wall": 3040.9} {"step": 380, "train_loss": 6.301961898803711, "lr": 0.000152, "tps": 8189, "wall": 3049.0} {"step": 381, "train_loss": 6.296117782592773, "lr": 0.00015240000000000002, "tps": 8188, "wall": 3057.2} {"step": 382, "train_loss": 6.353492259979248, "lr": 0.00015280000000000003, "tps": 8187, "wall": 3065.5} {"step": 383, "train_loss": 6.376057147979736, "lr": 0.0001532, "tps": 8187, "wall": 3073.8} {"step": 384, "train_loss": 6.251082420349121, "lr": 0.00015360000000000002, "tps": 8186, "wall": 3081.9} {"step": 385, "train_loss": 6.305881977081299, "lr": 0.000154, "tps": 8186, "wall": 3090.0} {"step": 386, "train_loss": 6.346584320068359, "lr": 0.0001544, "tps": 8186, "wall": 3097.9} {"step": 387, "train_loss": 6.2744035720825195, "lr": 0.00015480000000000002, "tps": 8186, "wall": 3106.0} {"step": 388, "train_loss": 6.211904525756836, "lr": 0.0001552, "tps": 8186, "wall": 3114.0} {"step": 389, "train_loss": 6.3420610427856445, "lr": 0.00015560000000000001, "tps": 8186, "wall": 3122.1} {"step": 390, "train_loss": 6.266308307647705, "lr": 0.000156, "tps": 8186, "wall": 3130.1} {"step": 391, "train_loss": 6.272176742553711, "lr": 0.0001564, "tps": 8186, "wall": 3138.3} {"step": 392, "train_loss": 6.15432596206665, "lr": 0.0001568, "tps": 8186, "wall": 3146.2} {"step": 393, "train_loss": 6.2673420906066895, "lr": 0.0001572, "tps": 8186, "wall": 3154.2} {"step": 394, "train_loss": 6.2778639793396, "lr": 0.0001576, "tps": 8186, "wall": 3162.3} {"step": 395, "train_loss": 6.2631449699401855, "lr": 0.000158, "tps": 8186, "wall": 3170.2} {"step": 396, "train_loss": 6.2309699058532715, "lr": 0.0001584, "tps": 8186, "wall": 3178.2} {"step": 397, "train_loss": 6.255127906799316, "lr": 0.00015879999999999998, "tps": 8186, "wall": 3186.1} {"step": 398, "train_loss": 6.258402347564697, "lr": 0.00015920000000000002, "tps": 8186, "wall": 3194.1} {"step": 399, "train_loss": 6.190685272216797, "lr": 0.00015960000000000003, "tps": 8186, "wall": 3202.0} {"step": 400, "train_loss": 6.229249000549316, "lr": 0.00016, "tps": 8187, "wall": 3209.8} {"step": 401, "train_loss": 6.208676815032959, "lr": 0.00016040000000000002, "tps": 8187, "wall": 3217.7} {"step": 402, "train_loss": 6.247330188751221, "lr": 0.0001608, "tps": 8188, "wall": 3225.5} {"step": 403, "train_loss": 6.300992012023926, "lr": 0.00016120000000000002, "tps": 8188, "wall": 3233.4} {"step": 404, "train_loss": 6.185318470001221, "lr": 0.00016160000000000002, "tps": 8188, "wall": 3241.2} {"step": 405, "train_loss": 6.174660682678223, "lr": 0.000162, "tps": 8189, "wall": 3249.0} {"step": 406, "train_loss": 6.233938694000244, "lr": 0.00016240000000000002, "tps": 8189, "wall": 3257.0} {"step": 407, "train_loss": 6.3452324867248535, "lr": 0.0001628, "tps": 8189, "wall": 3264.9} {"step": 408, "train_loss": 6.373632907867432, "lr": 0.0001632, "tps": 8190, "wall": 3272.7} {"step": 409, "train_loss": 6.206953525543213, "lr": 0.0001636, "tps": 8190, "wall": 3280.6} {"step": 410, "train_loss": 6.310626983642578, "lr": 0.000164, "tps": 8190, "wall": 3288.5} {"step": 411, "train_loss": 6.143367767333984, "lr": 0.0001644, "tps": 8190, "wall": 3296.4} {"step": 412, "train_loss": 6.173959732055664, "lr": 0.0001648, "tps": 8191, "wall": 3304.4} {"step": 413, "train_loss": 6.241881370544434, "lr": 0.0001652, "tps": 8191, "wall": 3312.3} {"step": 414, "train_loss": 6.282281398773193, "lr": 0.0001656, "tps": 8191, "wall": 3320.1} {"step": 415, "train_loss": 6.273196220397949, "lr": 0.000166, "tps": 8192, "wall": 3328.0} {"step": 416, "train_loss": 6.259731292724609, "lr": 0.00016640000000000003, "tps": 8192, "wall": 3335.8} {"step": 417, "train_loss": 6.198642253875732, "lr": 0.00016680000000000002, "tps": 8192, "wall": 3343.7} {"step": 418, "train_loss": 6.241038799285889, "lr": 0.00016720000000000003, "tps": 8193, "wall": 3351.6} {"step": 419, "train_loss": 6.095648765563965, "lr": 0.0001676, "tps": 8193, "wall": 3359.4} {"step": 420, "train_loss": 6.195520401000977, "lr": 0.00016800000000000002, "tps": 8193, "wall": 3367.3} {"step": 421, "train_loss": 6.118620872497559, "lr": 0.00016840000000000003, "tps": 8193, "wall": 3375.4} {"step": 422, "train_loss": 6.108532905578613, "lr": 0.0001688, "tps": 8193, "wall": 3383.3} {"step": 423, "train_loss": 6.171170234680176, "lr": 0.00016920000000000002, "tps": 8193, "wall": 3391.2} {"step": 424, "train_loss": 6.139626502990723, "lr": 0.0001696, "tps": 8194, "wall": 3399.1} {"step": 425, "train_loss": 6.237159252166748, "lr": 0.00017, "tps": 8194, "wall": 3406.9} {"step": 426, "train_loss": 6.2342681884765625, "lr": 0.0001704, "tps": 8194, "wall": 3414.8} {"step": 427, "train_loss": 6.223633766174316, "lr": 0.0001708, "tps": 8195, "wall": 3422.7} {"step": 428, "train_loss": 6.151854515075684, "lr": 0.00017120000000000001, "tps": 8194, "wall": 3430.8} {"step": 429, "train_loss": 6.187539100646973, "lr": 0.0001716, "tps": 8194, "wall": 3438.8} {"step": 430, "train_loss": 6.1514892578125, "lr": 0.000172, "tps": 8194, "wall": 3446.8} {"step": 431, "train_loss": 6.133560657501221, "lr": 0.0001724, "tps": 8195, "wall": 3454.7} {"step": 432, "train_loss": 6.230044841766357, "lr": 0.0001728, "tps": 8195, "wall": 3462.7} {"step": 433, "train_loss": 6.226946830749512, "lr": 0.0001732, "tps": 8195, "wall": 3470.5} {"step": 434, "train_loss": 6.128452301025391, "lr": 0.0001736, "tps": 8195, "wall": 3478.5} {"step": 435, "train_loss": 6.129484176635742, "lr": 0.00017400000000000003, "tps": 8195, "wall": 3486.6} {"step": 436, "train_loss": 6.079336166381836, "lr": 0.0001744, "tps": 8195, "wall": 3494.5} {"step": 437, "train_loss": 6.118319511413574, "lr": 0.00017480000000000002, "tps": 8195, "wall": 3502.5} {"step": 438, "train_loss": 6.091137409210205, "lr": 0.0001752, "tps": 8195, "wall": 3510.4} {"step": 439, "train_loss": 6.133516311645508, "lr": 0.0001756, "tps": 8196, "wall": 3518.2} {"step": 440, "train_loss": 6.166476726531982, "lr": 0.00017600000000000002, "tps": 8196, "wall": 3526.1} {"step": 441, "train_loss": 6.0679779052734375, "lr": 0.0001764, "tps": 8196, "wall": 3534.0} {"step": 442, "train_loss": 6.076618194580078, "lr": 0.00017680000000000001, "tps": 8196, "wall": 3541.9} {"step": 443, "train_loss": 6.138522148132324, "lr": 0.0001772, "tps": 8196, "wall": 3549.9} {"step": 444, "train_loss": 6.0238847732543945, "lr": 0.0001776, "tps": 8197, "wall": 3557.8} {"step": 445, "train_loss": 6.180910587310791, "lr": 0.00017800000000000002, "tps": 8197, "wall": 3565.6} {"step": 446, "train_loss": 6.050921440124512, "lr": 0.0001784, "tps": 8197, "wall": 3573.5} {"step": 447, "train_loss": 6.131178379058838, "lr": 0.0001788, "tps": 8197, "wall": 3581.4} {"step": 448, "train_loss": 6.052955150604248, "lr": 0.0001792, "tps": 8198, "wall": 3589.2} {"step": 449, "train_loss": 6.0562310218811035, "lr": 0.0001796, "tps": 8198, "wall": 3597.1} {"step": 450, "train_loss": 6.160515785217285, "lr": 0.00018, "tps": 8198, "wall": 3604.9} {"step": 451, "train_loss": 6.163562297821045, "lr": 0.0001804, "tps": 8198, "wall": 3613.1} {"step": 452, "train_loss": 6.116617679595947, "lr": 0.0001808, "tps": 8198, "wall": 3621.1} {"step": 453, "train_loss": 6.10582971572876, "lr": 0.0001812, "tps": 8198, "wall": 3629.1} {"step": 454, "train_loss": 6.120636940002441, "lr": 0.00018160000000000002, "tps": 8198, "wall": 3637.2} {"step": 455, "train_loss": 6.041521072387695, "lr": 0.000182, "tps": 8197, "wall": 3645.4} {"step": 456, "train_loss": 6.142800331115723, "lr": 0.00018240000000000002, "tps": 8197, "wall": 3653.4} {"step": 457, "train_loss": 6.074841499328613, "lr": 0.00018280000000000003, "tps": 8196, "wall": 3662.1} {"step": 458, "train_loss": 5.9995222091674805, "lr": 0.0001832, "tps": 8196, "wall": 3670.0} {"step": 459, "train_loss": 5.98374605178833, "lr": 0.00018360000000000002, "tps": 8196, "wall": 3678.1} {"step": 460, "train_loss": 6.117372512817383, "lr": 0.000184, "tps": 8195, "wall": 3686.5} {"step": 461, "train_loss": 5.955442905426025, "lr": 0.0001844, "tps": 8195, "wall": 3694.6} {"step": 462, "train_loss": 6.055397987365723, "lr": 0.00018480000000000002, "tps": 8194, "wall": 3703.0} {"step": 463, "train_loss": 6.016414642333984, "lr": 0.0001852, "tps": 8193, "wall": 3711.1} {"step": 464, "train_loss": 6.1722917556762695, "lr": 0.0001856, "tps": 8193, "wall": 3719.3} {"step": 465, "train_loss": 6.0914812088012695, "lr": 0.000186, "tps": 8193, "wall": 3727.3} {"step": 466, "train_loss": 6.0906829833984375, "lr": 0.0001864, "tps": 8192, "wall": 3735.6} {"step": 467, "train_loss": 6.086376667022705, "lr": 0.00018680000000000001, "tps": 8193, "wall": 3743.5} {"step": 468, "train_loss": 6.200233459472656, "lr": 0.0001872, "tps": 8193, "wall": 3751.4} {"step": 469, "train_loss": 6.075436592102051, "lr": 0.0001876, "tps": 8193, "wall": 3759.2} {"step": 470, "train_loss": 6.025042533874512, "lr": 0.000188, "tps": 8193, "wall": 3767.2} {"step": 471, "train_loss": 6.126089096069336, "lr": 0.0001884, "tps": 8193, "wall": 3775.2} {"step": 472, "train_loss": 6.043671131134033, "lr": 0.0001888, "tps": 8194, "wall": 3783.0} {"step": 473, "train_loss": 6.0245256423950195, "lr": 0.00018920000000000002, "tps": 8193, "wall": 3791.1} {"step": 474, "train_loss": 5.942976474761963, "lr": 0.00018960000000000003, "tps": 8194, "wall": 3799.0} {"step": 475, "train_loss": 6.091484546661377, "lr": 0.00019, "tps": 8194, "wall": 3806.9} {"step": 476, "train_loss": 5.985710144042969, "lr": 0.00019040000000000002, "tps": 8194, "wall": 3814.9} {"step": 477, "train_loss": 6.028562545776367, "lr": 0.0001908, "tps": 8194, "wall": 3822.8} {"step": 478, "train_loss": 6.09187126159668, "lr": 0.0001912, "tps": 8194, "wall": 3830.8} {"step": 479, "train_loss": 5.940023422241211, "lr": 0.00019160000000000002, "tps": 8194, "wall": 3838.9} {"step": 480, "train_loss": 6.0169596672058105, "lr": 0.000192, "tps": 8191, "wall": 3848.3} {"step": 481, "train_loss": 6.02901554107666, "lr": 0.00019240000000000001, "tps": 8191, "wall": 3856.2} {"step": 482, "train_loss": 6.03078031539917, "lr": 0.0001928, "tps": 8191, "wall": 3864.2} {"step": 483, "train_loss": 6.1872334480285645, "lr": 0.0001932, "tps": 8191, "wall": 3872.1} {"step": 484, "train_loss": 6.057066917419434, "lr": 0.00019360000000000002, "tps": 8191, "wall": 3880.1} {"step": 485, "train_loss": 6.09598445892334, "lr": 0.000194, "tps": 8192, "wall": 3887.9} {"step": 486, "train_loss": 6.070280075073242, "lr": 0.0001944, "tps": 8192, "wall": 3896.0} {"step": 487, "train_loss": 6.118204116821289, "lr": 0.0001948, "tps": 8192, "wall": 3903.9} {"step": 488, "train_loss": 6.0730791091918945, "lr": 0.0001952, "tps": 8192, "wall": 3911.9} {"step": 489, "train_loss": 5.9558186531066895, "lr": 0.00019559999999999998, "tps": 8192, "wall": 3919.8} {"step": 490, "train_loss": 5.990260124206543, "lr": 0.00019600000000000002, "tps": 8192, "wall": 3927.7} {"step": 491, "train_loss": 6.017838478088379, "lr": 0.00019640000000000003, "tps": 8192, "wall": 3935.6} {"step": 492, "train_loss": 5.985353469848633, "lr": 0.0001968, "tps": 8192, "wall": 3943.7} {"step": 493, "train_loss": 6.053163051605225, "lr": 0.00019720000000000002, "tps": 8192, "wall": 3951.5} {"step": 494, "train_loss": 5.94920015335083, "lr": 0.0001976, "tps": 8192, "wall": 3959.5} {"step": 495, "train_loss": 5.934459209442139, "lr": 0.00019800000000000002, "tps": 8192, "wall": 3967.6} {"step": 496, "train_loss": 6.0132269859313965, "lr": 0.00019840000000000002, "tps": 8192, "wall": 3975.6} {"step": 497, "train_loss": 5.975042819976807, "lr": 0.0001988, "tps": 8193, "wall": 3983.5} {"step": 498, "train_loss": 5.939201831817627, "lr": 0.00019920000000000002, "tps": 8193, "wall": 3991.4} {"step": 499, "train_loss": 5.9232988357543945, "lr": 0.0001996, "tps": 8193, "wall": 3999.3} {"step": 500, "train_loss": 6.008620738983154, "lr": 0.0002, "tps": 8193, "wall": 4007.2} {"step": 501, "train_loss": 5.963677883148193, "lr": 0.00020040000000000002, "tps": 8193, "wall": 4015.1} {"step": 502, "train_loss": 5.872026443481445, "lr": 0.0002008, "tps": 8193, "wall": 4023.2} {"step": 503, "train_loss": 5.97503662109375, "lr": 0.0002012, "tps": 8193, "wall": 4031.2} {"step": 504, "train_loss": 5.958600997924805, "lr": 0.0002016, "tps": 8193, "wall": 4039.1} {"step": 505, "train_loss": 5.948509693145752, "lr": 0.000202, "tps": 8193, "wall": 4047.1} {"step": 506, "train_loss": 5.927149295806885, "lr": 0.0002024, "tps": 8193, "wall": 4055.1} {"step": 507, "train_loss": 5.8611907958984375, "lr": 0.0002028, "tps": 8194, "wall": 4062.9} {"step": 508, "train_loss": 5.98408317565918, "lr": 0.0002032, "tps": 8194, "wall": 4070.8} {"step": 509, "train_loss": 5.938296794891357, "lr": 0.00020360000000000002, "tps": 8194, "wall": 4078.7} {"step": 510, "train_loss": 5.92401647567749, "lr": 0.00020400000000000003, "tps": 8194, "wall": 4086.7} {"step": 511, "train_loss": 5.946033954620361, "lr": 0.0002044, "tps": 8194, "wall": 4094.7} {"step": 512, "train_loss": 5.991347312927246, "lr": 0.00020480000000000002, "tps": 8194, "wall": 4102.7} {"step": 513, "train_loss": 5.962096691131592, "lr": 0.00020520000000000003, "tps": 8194, "wall": 4110.7} {"step": 514, "train_loss": 5.88456392288208, "lr": 0.0002056, "tps": 8194, "wall": 4118.6} {"step": 515, "train_loss": 5.968488693237305, "lr": 0.00020600000000000002, "tps": 8194, "wall": 4126.5} {"step": 516, "train_loss": 5.791565895080566, "lr": 0.0002064, "tps": 8195, "wall": 4134.4} {"step": 517, "train_loss": 5.939478874206543, "lr": 0.0002068, "tps": 8195, "wall": 4142.4} {"step": 518, "train_loss": 5.8717360496521, "lr": 0.00020720000000000002, "tps": 8195, "wall": 4150.3} {"step": 519, "train_loss": 5.9247965812683105, "lr": 0.0002076, "tps": 8195, "wall": 4158.3} {"step": 520, "train_loss": 5.862225532531738, "lr": 0.00020800000000000001, "tps": 8195, "wall": 4166.3} {"step": 521, "train_loss": 5.852553844451904, "lr": 0.0002084, "tps": 8195, "wall": 4174.3} {"step": 522, "train_loss": 5.902935028076172, "lr": 0.0002088, "tps": 8195, "wall": 4182.2} {"step": 523, "train_loss": 5.885616302490234, "lr": 0.0002092, "tps": 8195, "wall": 4190.0} {"step": 524, "train_loss": 5.972059726715088, "lr": 0.0002096, "tps": 8195, "wall": 4198.0} {"step": 525, "train_loss": 5.825538158416748, "lr": 0.00021, "tps": 8195, "wall": 4205.9} {"step": 526, "train_loss": 5.833919048309326, "lr": 0.0002104, "tps": 8195, "wall": 4214.0} {"step": 527, "train_loss": 5.7566022872924805, "lr": 0.00021080000000000003, "tps": 8195, "wall": 4222.0} {"step": 528, "train_loss": 5.81620979309082, "lr": 0.0002112, "tps": 8196, "wall": 4229.9} {"step": 529, "train_loss": 5.892806053161621, "lr": 0.00021160000000000002, "tps": 8196, "wall": 4237.8} {"step": 530, "train_loss": 5.9619460105896, "lr": 0.00021200000000000003, "tps": 8196, "wall": 4245.7} {"step": 531, "train_loss": 5.950444221496582, "lr": 0.0002124, "tps": 8196, "wall": 4253.6} {"step": 532, "train_loss": 5.91858434677124, "lr": 0.00021280000000000002, "tps": 8196, "wall": 4261.6} {"step": 533, "train_loss": 5.906973838806152, "lr": 0.0002132, "tps": 8196, "wall": 4269.5} {"step": 534, "train_loss": 5.911952018737793, "lr": 0.00021360000000000001, "tps": 8196, "wall": 4277.5} {"step": 535, "train_loss": 5.801994323730469, "lr": 0.00021400000000000002, "tps": 8197, "wall": 4285.4} {"step": 536, "train_loss": 5.898230075836182, "lr": 0.0002144, "tps": 8197, "wall": 4293.3} {"step": 537, "train_loss": 5.827934741973877, "lr": 0.00021480000000000002, "tps": 8197, "wall": 4301.3} {"step": 538, "train_loss": 5.765103816986084, "lr": 0.0002152, "tps": 8197, "wall": 4309.2} {"step": 539, "train_loss": 5.8629889488220215, "lr": 0.0002156, "tps": 8197, "wall": 4317.1} {"step": 540, "train_loss": 5.8080596923828125, "lr": 0.000216, "tps": 8197, "wall": 4325.0} {"step": 541, "train_loss": 5.805428504943848, "lr": 0.0002164, "tps": 8197, "wall": 4332.9} {"step": 542, "train_loss": 5.930794715881348, "lr": 0.0002168, "tps": 8197, "wall": 4340.9} {"step": 543, "train_loss": 5.850437641143799, "lr": 0.0002172, "tps": 8198, "wall": 4348.8} {"step": 544, "train_loss": 5.832879066467285, "lr": 0.0002176, "tps": 8198, "wall": 4356.7} {"step": 545, "train_loss": 5.778327465057373, "lr": 0.00021799999999999999, "tps": 8198, "wall": 4364.6} {"step": 546, "train_loss": 5.832293510437012, "lr": 0.00021840000000000002, "tps": 8198, "wall": 4372.3} {"step": 547, "train_loss": 5.870752811431885, "lr": 0.00021880000000000003, "tps": 8198, "wall": 4380.3} {"step": 548, "train_loss": 5.856667995452881, "lr": 0.00021920000000000002, "tps": 8199, "wall": 4388.2} {"step": 549, "train_loss": 5.956472873687744, "lr": 0.00021960000000000003, "tps": 8198, "wall": 4396.3} {"step": 550, "train_loss": 5.719222545623779, "lr": 0.00022, "tps": 8198, "wall": 4404.2} {"step": 551, "train_loss": 5.855328559875488, "lr": 0.00022040000000000002, "tps": 8199, "wall": 4412.2} {"step": 552, "train_loss": 5.769230842590332, "lr": 0.00022080000000000003, "tps": 8199, "wall": 4420.1} {"step": 553, "train_loss": 5.869473934173584, "lr": 0.0002212, "tps": 8199, "wall": 4428.0} {"step": 554, "train_loss": 5.79547643661499, "lr": 0.00022160000000000002, "tps": 8199, "wall": 4436.0} {"step": 555, "train_loss": 5.853137493133545, "lr": 0.000222, "tps": 8199, "wall": 4443.8} {"step": 556, "train_loss": 5.674281120300293, "lr": 0.0002224, "tps": 8199, "wall": 4451.8} {"step": 557, "train_loss": 5.704626560211182, "lr": 0.0002228, "tps": 8199, "wall": 4459.8} {"step": 558, "train_loss": 5.824363708496094, "lr": 0.0002232, "tps": 8199, "wall": 4467.7} {"step": 559, "train_loss": 5.777165412902832, "lr": 0.00022360000000000001, "tps": 8200, "wall": 4475.6} {"step": 560, "train_loss": 5.758789539337158, "lr": 0.000224, "tps": 8200, "wall": 4483.5} {"step": 561, "train_loss": 5.727207660675049, "lr": 0.0002244, "tps": 8200, "wall": 4491.5} {"step": 562, "train_loss": 5.797261714935303, "lr": 0.0002248, "tps": 8200, "wall": 4499.4} {"step": 563, "train_loss": 5.8158183097839355, "lr": 0.0002252, "tps": 8200, "wall": 4507.2} {"step": 564, "train_loss": 5.7206244468688965, "lr": 0.00022560000000000004, "tps": 8200, "wall": 4515.3} {"step": 565, "train_loss": 5.751682281494141, "lr": 0.00022600000000000002, "tps": 8200, "wall": 4523.1} {"step": 566, "train_loss": 5.818722248077393, "lr": 0.00022640000000000003, "tps": 8200, "wall": 4531.1} {"step": 567, "train_loss": 5.815788269042969, "lr": 0.0002268, "tps": 8201, "wall": 4539.0} {"step": 568, "train_loss": 5.678128719329834, "lr": 0.00022720000000000002, "tps": 8201, "wall": 4546.9} {"step": 569, "train_loss": 5.756110191345215, "lr": 0.00022760000000000003, "tps": 8201, "wall": 4554.7} {"step": 570, "train_loss": 5.641219615936279, "lr": 0.000228, "tps": 8201, "wall": 4562.7} {"step": 571, "train_loss": 5.742143630981445, "lr": 0.00022840000000000002, "tps": 8201, "wall": 4570.6} {"step": 572, "train_loss": 5.673131942749023, "lr": 0.0002288, "tps": 8201, "wall": 4578.7} {"step": 573, "train_loss": 5.826358795166016, "lr": 0.00022920000000000001, "tps": 8201, "wall": 4586.6} {"step": 574, "train_loss": 5.7561540603637695, "lr": 0.0002296, "tps": 8201, "wall": 4594.5} {"step": 575, "train_loss": 5.707111358642578, "lr": 0.00023, "tps": 8201, "wall": 4602.4} {"step": 576, "train_loss": 5.80816125869751, "lr": 0.00023040000000000002, "tps": 8201, "wall": 4610.4} {"step": 577, "train_loss": 5.671545028686523, "lr": 0.0002308, "tps": 8202, "wall": 4618.4} {"step": 578, "train_loss": 5.692502975463867, "lr": 0.0002312, "tps": 8202, "wall": 4626.3} {"step": 579, "train_loss": 5.729332447052002, "lr": 0.0002316, "tps": 8201, "wall": 4634.4} {"step": 580, "train_loss": 5.738648891448975, "lr": 0.000232, "tps": 8201, "wall": 4642.5} {"step": 581, "train_loss": 5.798223495483398, "lr": 0.0002324, "tps": 8201, "wall": 4650.4} {"step": 582, "train_loss": 5.741125106811523, "lr": 0.0002328, "tps": 8201, "wall": 4658.4} {"step": 583, "train_loss": 5.749061584472656, "lr": 0.00023320000000000003, "tps": 8201, "wall": 4666.4} {"step": 584, "train_loss": 5.792296409606934, "lr": 0.0002336, "tps": 8201, "wall": 4674.3} {"step": 585, "train_loss": 5.660738468170166, "lr": 0.00023400000000000002, "tps": 8202, "wall": 4682.2} {"step": 586, "train_loss": 5.784145355224609, "lr": 0.00023440000000000003, "tps": 8202, "wall": 4690.1} {"step": 587, "train_loss": 5.6493730545043945, "lr": 0.00023480000000000002, "tps": 8202, "wall": 4698.2} {"step": 588, "train_loss": 5.66927433013916, "lr": 0.00023520000000000002, "tps": 8202, "wall": 4706.1} {"step": 589, "train_loss": 5.701961040496826, "lr": 0.0002356, "tps": 8202, "wall": 4714.0} {"step": 590, "train_loss": 5.692753791809082, "lr": 0.00023600000000000002, "tps": 8202, "wall": 4722.0} {"step": 591, "train_loss": 5.812047481536865, "lr": 0.0002364, "tps": 8202, "wall": 4730.0} {"step": 592, "train_loss": 5.733218669891357, "lr": 0.0002368, "tps": 8202, "wall": 4737.9} {"step": 593, "train_loss": 5.793978691101074, "lr": 0.00023720000000000002, "tps": 8202, "wall": 4745.7} {"step": 594, "train_loss": 5.763716220855713, "lr": 0.0002376, "tps": 8202, "wall": 4753.8} {"step": 595, "train_loss": 5.682308673858643, "lr": 0.000238, "tps": 8202, "wall": 4761.7} {"step": 596, "train_loss": 5.619478225708008, "lr": 0.0002384, "tps": 8203, "wall": 4769.6} {"step": 597, "train_loss": 5.748959064483643, "lr": 0.0002388, "tps": 8203, "wall": 4777.4} {"step": 598, "train_loss": 5.824892520904541, "lr": 0.00023920000000000001, "tps": 8203, "wall": 4785.4} {"step": 599, "train_loss": 5.692966938018799, "lr": 0.0002396, "tps": 8203, "wall": 4793.3} {"step": 600, "train_loss": 5.731812000274658, "lr": 0.00024, "tps": 8203, "wall": 4801.2} {"step": 601, "train_loss": 5.63253927230835, "lr": 0.00024040000000000002, "tps": 8203, "wall": 4809.1} {"step": 602, "train_loss": 5.842336654663086, "lr": 0.00024080000000000003, "tps": 8203, "wall": 4817.0} {"step": 603, "train_loss": 5.676102638244629, "lr": 0.0002412, "tps": 8204, "wall": 4824.9} {"step": 604, "train_loss": 5.660632133483887, "lr": 0.00024160000000000002, "tps": 8204, "wall": 4832.9} {"step": 605, "train_loss": 5.665566921234131, "lr": 0.00024200000000000003, "tps": 8204, "wall": 4840.8} {"step": 606, "train_loss": 5.633821964263916, "lr": 0.0002424, "tps": 8204, "wall": 4848.7} {"step": 607, "train_loss": 5.64265775680542, "lr": 0.00024280000000000002, "tps": 8204, "wall": 4856.6} {"step": 608, "train_loss": 5.6627278327941895, "lr": 0.0002432, "tps": 8204, "wall": 4864.7} {"step": 609, "train_loss": 5.544399738311768, "lr": 0.0002436, "tps": 8204, "wall": 4872.8} {"step": 610, "train_loss": 5.730643272399902, "lr": 0.00024400000000000002, "tps": 8204, "wall": 4880.7} {"step": 611, "train_loss": 5.588254928588867, "lr": 0.00024440000000000003, "tps": 8204, "wall": 4888.6} {"step": 612, "train_loss": 5.5961594581604, "lr": 0.00024480000000000004, "tps": 8204, "wall": 4896.6} {"step": 613, "train_loss": 5.6844892501831055, "lr": 0.0002452, "tps": 8204, "wall": 4904.6} {"step": 614, "train_loss": 5.6194257736206055, "lr": 0.0002456, "tps": 8204, "wall": 4912.5} {"step": 615, "train_loss": 5.705297470092773, "lr": 0.000246, "tps": 8204, "wall": 4920.5} {"step": 616, "train_loss": 5.740699768066406, "lr": 0.0002464, "tps": 8204, "wall": 4928.4} {"step": 617, "train_loss": 5.767560958862305, "lr": 0.00024680000000000004, "tps": 8204, "wall": 4936.4} {"step": 618, "train_loss": 5.573716640472412, "lr": 0.0002472, "tps": 8204, "wall": 4944.4} {"step": 619, "train_loss": 5.685541152954102, "lr": 0.0002476, "tps": 8204, "wall": 4952.2} {"step": 620, "train_loss": 5.730355739593506, "lr": 0.000248, "tps": 8204, "wall": 4960.3} {"step": 621, "train_loss": 5.653598785400391, "lr": 0.0002484, "tps": 8204, "wall": 4968.3} {"step": 622, "train_loss": 5.595381259918213, "lr": 0.00024880000000000003, "tps": 8204, "wall": 4976.2} {"step": 623, "train_loss": 5.7193522453308105, "lr": 0.0002492, "tps": 8204, "wall": 4984.1} {"step": 624, "train_loss": 5.676779270172119, "lr": 0.0002496, "tps": 8204, "wall": 4992.2} {"step": 625, "train_loss": 5.5648016929626465, "lr": 0.00025, "tps": 8205, "wall": 5000.0} {"step": 626, "train_loss": 5.633183479309082, "lr": 0.0002504, "tps": 8205, "wall": 5007.9} {"step": 627, "train_loss": 5.660727024078369, "lr": 0.0002508, "tps": 8205, "wall": 5015.9} {"step": 628, "train_loss": 5.663954257965088, "lr": 0.00025120000000000003, "tps": 8205, "wall": 5023.8} {"step": 629, "train_loss": 5.610518932342529, "lr": 0.0002516, "tps": 8205, "wall": 5031.8} {"step": 630, "train_loss": 5.685047149658203, "lr": 0.000252, "tps": 8205, "wall": 5039.8} {"step": 631, "train_loss": 5.550748825073242, "lr": 0.0002524, "tps": 8205, "wall": 5047.8} {"step": 632, "train_loss": 5.656621932983398, "lr": 0.0002528, "tps": 8205, "wall": 5055.9} {"step": 633, "train_loss": 5.594236373901367, "lr": 0.00025320000000000003, "tps": 8205, "wall": 5063.9} {"step": 634, "train_loss": 5.549386024475098, "lr": 0.0002536, "tps": 8205, "wall": 5071.9} {"step": 635, "train_loss": 5.655777931213379, "lr": 0.000254, "tps": 8205, "wall": 5079.9} {"step": 636, "train_loss": 5.6302170753479, "lr": 0.0002544, "tps": 8205, "wall": 5087.9} {"step": 637, "train_loss": 5.590420722961426, "lr": 0.0002548, "tps": 8204, "wall": 5095.9} {"step": 638, "train_loss": 5.524381160736084, "lr": 0.0002552, "tps": 8205, "wall": 5103.9} {"step": 639, "train_loss": 5.6539740562438965, "lr": 0.0002556, "tps": 8204, "wall": 5111.9} {"step": 640, "train_loss": 5.5590314865112305, "lr": 0.000256, "tps": 8205, "wall": 5119.9} {"step": 641, "train_loss": 5.484954357147217, "lr": 0.0002564, "tps": 8205, "wall": 5127.8} {"step": 642, "train_loss": 5.518410682678223, "lr": 0.0002568, "tps": 8205, "wall": 5135.8} {"step": 643, "train_loss": 5.594386100769043, "lr": 0.0002572, "tps": 8205, "wall": 5143.8} {"step": 644, "train_loss": 5.65074348449707, "lr": 0.0002576, "tps": 8205, "wall": 5151.7} {"step": 645, "train_loss": 5.5826287269592285, "lr": 0.000258, "tps": 8205, "wall": 5159.7} {"step": 646, "train_loss": 5.481391429901123, "lr": 0.0002584, "tps": 8205, "wall": 5167.6} {"step": 647, "train_loss": 5.597357273101807, "lr": 0.00025880000000000006, "tps": 8205, "wall": 5175.7} {"step": 648, "train_loss": 5.683604717254639, "lr": 0.0002592, "tps": 8205, "wall": 5183.6} {"step": 649, "train_loss": 5.512895107269287, "lr": 0.0002596, "tps": 8205, "wall": 5191.5} {"step": 650, "train_loss": 5.613630771636963, "lr": 0.00026000000000000003, "tps": 8205, "wall": 5199.5} {"step": 651, "train_loss": 5.647934913635254, "lr": 0.00026040000000000004, "tps": 8205, "wall": 5207.4} {"step": 652, "train_loss": 5.625419616699219, "lr": 0.00026080000000000005, "tps": 8205, "wall": 5215.4} {"step": 653, "train_loss": 5.686135292053223, "lr": 0.0002612, "tps": 8205, "wall": 5223.3} {"step": 654, "train_loss": 5.611735820770264, "lr": 0.0002616, "tps": 8205, "wall": 5231.4} {"step": 655, "train_loss": 5.581735134124756, "lr": 0.000262, "tps": 8205, "wall": 5239.3} {"step": 656, "train_loss": 5.567470550537109, "lr": 0.00026240000000000004, "tps": 8205, "wall": 5247.2} {"step": 657, "train_loss": 5.6073737144470215, "lr": 0.00026280000000000005, "tps": 8205, "wall": 5255.1} {"step": 658, "train_loss": 5.52794075012207, "lr": 0.0002632, "tps": 8205, "wall": 5263.0} {"step": 659, "train_loss": 5.496123313903809, "lr": 0.0002636, "tps": 8206, "wall": 5270.9} {"step": 660, "train_loss": 5.545600891113281, "lr": 0.000264, "tps": 8206, "wall": 5278.8} {"step": 661, "train_loss": 5.522614002227783, "lr": 0.00026440000000000003, "tps": 8206, "wall": 5286.7} {"step": 662, "train_loss": 5.536319255828857, "lr": 0.00026480000000000004, "tps": 8206, "wall": 5294.7} {"step": 663, "train_loss": 5.586118221282959, "lr": 0.0002652, "tps": 8206, "wall": 5302.6} {"step": 664, "train_loss": 5.544389724731445, "lr": 0.0002656, "tps": 8206, "wall": 5310.5} {"step": 665, "train_loss": 5.458126068115234, "lr": 0.000266, "tps": 8206, "wall": 5318.4} {"step": 666, "train_loss": 5.578784942626953, "lr": 0.0002664, "tps": 8206, "wall": 5326.4} {"step": 667, "train_loss": 5.612828731536865, "lr": 0.00026680000000000003, "tps": 8206, "wall": 5334.3} {"step": 668, "train_loss": 5.488961219787598, "lr": 0.0002672, "tps": 8206, "wall": 5342.2} {"step": 669, "train_loss": 5.570904731750488, "lr": 0.0002676, "tps": 8207, "wall": 5350.1} {"step": 670, "train_loss": 5.555810928344727, "lr": 0.000268, "tps": 8207, "wall": 5358.1} {"step": 671, "train_loss": 5.508840084075928, "lr": 0.0002684, "tps": 8207, "wall": 5366.1} {"step": 672, "train_loss": 5.489246368408203, "lr": 0.00026880000000000003, "tps": 8207, "wall": 5374.0} {"step": 673, "train_loss": 5.58160924911499, "lr": 0.0002692, "tps": 8207, "wall": 5381.8} {"step": 674, "train_loss": 5.46330451965332, "lr": 0.0002696, "tps": 8207, "wall": 5389.8} {"step": 675, "train_loss": 5.525323867797852, "lr": 0.00027, "tps": 8207, "wall": 5397.7} {"step": 676, "train_loss": 5.5003275871276855, "lr": 0.0002704, "tps": 8207, "wall": 5405.7} {"step": 677, "train_loss": 5.504080772399902, "lr": 0.0002708, "tps": 8207, "wall": 5413.6} {"step": 678, "train_loss": 5.542366981506348, "lr": 0.0002712, "tps": 8207, "wall": 5421.7} {"step": 679, "train_loss": 5.587100982666016, "lr": 0.0002716, "tps": 8207, "wall": 5429.6} {"step": 680, "train_loss": 5.535815715789795, "lr": 0.000272, "tps": 8207, "wall": 5437.5} {"step": 681, "train_loss": 5.48971700668335, "lr": 0.0002724, "tps": 8208, "wall": 5445.3} {"step": 682, "train_loss": 5.4615373611450195, "lr": 0.00027279999999999996, "tps": 8208, "wall": 5453.3} {"step": 683, "train_loss": 5.447316646575928, "lr": 0.00027319999999999997, "tps": 8208, "wall": 5461.2} {"step": 684, "train_loss": 5.406307220458984, "lr": 0.00027360000000000004, "tps": 8208, "wall": 5469.1} {"step": 685, "train_loss": 5.48118782043457, "lr": 0.00027400000000000005, "tps": 8208, "wall": 5477.1} {"step": 686, "train_loss": 5.61761474609375, "lr": 0.00027440000000000006, "tps": 8208, "wall": 5485.1} {"step": 687, "train_loss": 5.560122489929199, "lr": 0.0002748, "tps": 8208, "wall": 5493.0} {"step": 688, "train_loss": 5.414003372192383, "lr": 0.0002752, "tps": 8208, "wall": 5500.8} {"step": 689, "train_loss": 5.528520107269287, "lr": 0.00027560000000000003, "tps": 8208, "wall": 5508.8} {"step": 690, "train_loss": 5.448956489562988, "lr": 0.00027600000000000004, "tps": 8208, "wall": 5516.7} {"step": 691, "train_loss": 5.549769401550293, "lr": 0.00027640000000000005, "tps": 8208, "wall": 5524.6} {"step": 692, "train_loss": 5.506220817565918, "lr": 0.0002768, "tps": 8208, "wall": 5532.6} {"step": 693, "train_loss": 5.484633922576904, "lr": 0.0002772, "tps": 8209, "wall": 5540.5} {"step": 694, "train_loss": 5.560054302215576, "lr": 0.0002776, "tps": 8209, "wall": 5548.4} {"step": 695, "train_loss": 5.533147811889648, "lr": 0.00027800000000000004, "tps": 8209, "wall": 5556.2} {"step": 696, "train_loss": 5.502384185791016, "lr": 0.00027840000000000005, "tps": 8209, "wall": 5564.2} {"step": 697, "train_loss": 5.4892778396606445, "lr": 0.0002788, "tps": 8209, "wall": 5572.1} {"step": 698, "train_loss": 5.493578910827637, "lr": 0.0002792, "tps": 8209, "wall": 5580.0} {"step": 699, "train_loss": 5.5006890296936035, "lr": 0.0002796, "tps": 8209, "wall": 5588.0} {"step": 700, "train_loss": 5.460302352905273, "lr": 0.00028000000000000003, "tps": 8209, "wall": 5596.0} {"step": 701, "train_loss": 5.402367115020752, "lr": 0.00028040000000000004, "tps": 8209, "wall": 5603.9} {"step": 702, "train_loss": 5.431836128234863, "lr": 0.0002808, "tps": 8209, "wall": 5611.8} {"step": 703, "train_loss": 5.39325475692749, "lr": 0.0002812, "tps": 8209, "wall": 5619.8} {"step": 704, "train_loss": 5.4990339279174805, "lr": 0.0002816, "tps": 8209, "wall": 5627.7} {"step": 705, "train_loss": 5.477495193481445, "lr": 0.000282, "tps": 8210, "wall": 5635.6} {"step": 706, "train_loss": 5.380888938903809, "lr": 0.00028240000000000003, "tps": 8210, "wall": 5643.5} {"step": 707, "train_loss": 5.513946056365967, "lr": 0.0002828, "tps": 8210, "wall": 5651.6} {"step": 708, "train_loss": 5.438549518585205, "lr": 0.0002832, "tps": 8210, "wall": 5659.4} {"step": 709, "train_loss": 5.512615203857422, "lr": 0.0002836, "tps": 8210, "wall": 5667.3} {"step": 710, "train_loss": 5.452942371368408, "lr": 0.000284, "tps": 8210, "wall": 5675.3} {"step": 711, "train_loss": 5.471718788146973, "lr": 0.0002844, "tps": 8210, "wall": 5683.2} {"step": 712, "train_loss": 5.330721378326416, "lr": 0.0002848, "tps": 8210, "wall": 5691.2} {"step": 713, "train_loss": 5.345630645751953, "lr": 0.0002852, "tps": 8210, "wall": 5699.1} {"step": 714, "train_loss": 5.429271697998047, "lr": 0.0002856, "tps": 8210, "wall": 5707.0} {"step": 715, "train_loss": 5.453914642333984, "lr": 0.000286, "tps": 8210, "wall": 5715.0} {"step": 716, "train_loss": 5.409001350402832, "lr": 0.00028639999999999997, "tps": 8210, "wall": 5723.0} {"step": 717, "train_loss": 5.426086902618408, "lr": 0.0002868, "tps": 8210, "wall": 5730.8} {"step": 718, "train_loss": 5.40101432800293, "lr": 0.0002872, "tps": 8210, "wall": 5738.8} {"step": 719, "train_loss": 5.446428298950195, "lr": 0.0002876, "tps": 8210, "wall": 5746.7} {"step": 720, "train_loss": 5.524192810058594, "lr": 0.000288, "tps": 8211, "wall": 5754.6} {"step": 721, "train_loss": 5.424327850341797, "lr": 0.00028839999999999996, "tps": 8210, "wall": 5762.7} {"step": 722, "train_loss": 5.350529193878174, "lr": 0.0002888, "tps": 8211, "wall": 5770.6} {"step": 723, "train_loss": 5.4665961265563965, "lr": 0.00028920000000000004, "tps": 8210, "wall": 5778.6} {"step": 724, "train_loss": 5.420737266540527, "lr": 0.00028960000000000005, "tps": 8211, "wall": 5786.5} {"step": 725, "train_loss": 5.493924617767334, "lr": 0.00029000000000000006, "tps": 8211, "wall": 5794.5} {"step": 726, "train_loss": 5.513996124267578, "lr": 0.0002904, "tps": 8211, "wall": 5802.4} {"step": 727, "train_loss": 5.376010417938232, "lr": 0.0002908, "tps": 8211, "wall": 5810.4} {"step": 728, "train_loss": 5.395144939422607, "lr": 0.00029120000000000003, "tps": 8211, "wall": 5818.3} {"step": 729, "train_loss": 5.367190361022949, "lr": 0.00029160000000000004, "tps": 8211, "wall": 5826.2} {"step": 730, "train_loss": 5.385706901550293, "lr": 0.00029200000000000005, "tps": 8211, "wall": 5834.2} {"step": 731, "train_loss": 5.429317474365234, "lr": 0.0002924, "tps": 8211, "wall": 5842.2} {"step": 732, "train_loss": 5.367587566375732, "lr": 0.0002928, "tps": 8211, "wall": 5850.2} {"step": 733, "train_loss": 5.35517692565918, "lr": 0.0002932, "tps": 8211, "wall": 5858.1} {"step": 734, "train_loss": 5.443021297454834, "lr": 0.00029360000000000003, "tps": 8211, "wall": 5866.0} {"step": 735, "train_loss": 5.497082233428955, "lr": 0.00029400000000000004, "tps": 8211, "wall": 5873.9} {"step": 736, "train_loss": 5.375549793243408, "lr": 0.0002944, "tps": 8211, "wall": 5881.9} {"step": 737, "train_loss": 5.298451900482178, "lr": 0.0002948, "tps": 8211, "wall": 5889.8} {"step": 738, "train_loss": 5.4498114585876465, "lr": 0.0002952, "tps": 8211, "wall": 5897.8} {"step": 739, "train_loss": 5.410192966461182, "lr": 0.00029560000000000003, "tps": 8212, "wall": 5905.6} {"step": 740, "train_loss": 5.331624507904053, "lr": 0.00029600000000000004, "tps": 8212, "wall": 5913.5} {"step": 741, "train_loss": 5.413943290710449, "lr": 0.0002964, "tps": 8212, "wall": 5921.3} {"step": 742, "train_loss": 5.382948875427246, "lr": 0.0002968, "tps": 8212, "wall": 5929.3} {"step": 743, "train_loss": 5.365107536315918, "lr": 0.0002972, "tps": 8212, "wall": 5937.2} {"step": 744, "train_loss": 5.510809898376465, "lr": 0.0002976, "tps": 8212, "wall": 5945.1} {"step": 745, "train_loss": 5.311875343322754, "lr": 0.000298, "tps": 8212, "wall": 5953.2} {"step": 746, "train_loss": 5.433866500854492, "lr": 0.0002984, "tps": 8212, "wall": 5961.1} {"step": 747, "train_loss": 5.447698593139648, "lr": 0.0002988, "tps": 8212, "wall": 5969.1} {"step": 748, "train_loss": 5.336556434631348, "lr": 0.0002992, "tps": 8212, "wall": 5977.0} {"step": 749, "train_loss": 5.33349609375, "lr": 0.0002996, "tps": 8212, "wall": 5984.9} {"step": 750, "train_loss": 5.408371925354004, "lr": 0.0003, "tps": 8212, "wall": 5992.9} {"step": 751, "train_loss": 5.430371284484863, "lr": 0.0003004, "tps": 8212, "wall": 6000.9} {"step": 752, "train_loss": 5.318763256072998, "lr": 0.0003008, "tps": 8212, "wall": 6008.9} {"step": 753, "train_loss": 5.311625003814697, "lr": 0.0003012, "tps": 8212, "wall": 6016.9} {"step": 754, "train_loss": 5.306049346923828, "lr": 0.0003016, "tps": 8212, "wall": 6024.9} {"step": 755, "train_loss": 5.433687686920166, "lr": 0.00030199999999999997, "tps": 8212, "wall": 6032.9} {"step": 756, "train_loss": 5.375729560852051, "lr": 0.0003024, "tps": 8212, "wall": 6040.8} {"step": 757, "train_loss": 5.309166431427002, "lr": 0.0003028, "tps": 8212, "wall": 6048.8} {"step": 758, "train_loss": 5.38424015045166, "lr": 0.00030320000000000005, "tps": 8212, "wall": 6056.7} {"step": 759, "train_loss": 5.307019233703613, "lr": 0.00030360000000000006, "tps": 8212, "wall": 6064.6} {"step": 760, "train_loss": 5.383220672607422, "lr": 0.000304, "tps": 8212, "wall": 6072.7} {"step": 761, "train_loss": 5.294981479644775, "lr": 0.0003044, "tps": 8212, "wall": 6080.5} {"step": 762, "train_loss": 5.368431568145752, "lr": 0.00030480000000000004, "tps": 8212, "wall": 6088.5} {"step": 763, "train_loss": 5.292013168334961, "lr": 0.00030520000000000005, "tps": 8212, "wall": 6096.4} {"step": 764, "train_loss": 5.4371185302734375, "lr": 0.00030560000000000006, "tps": 8212, "wall": 6104.4} {"step": 765, "train_loss": 5.351200580596924, "lr": 0.000306, "tps": 8213, "wall": 6112.3} {"step": 766, "train_loss": 5.340127468109131, "lr": 0.0003064, "tps": 8213, "wall": 6120.2} {"step": 767, "train_loss": 5.360552787780762, "lr": 0.00030680000000000003, "tps": 8213, "wall": 6128.1} {"step": 768, "train_loss": 5.404268264770508, "lr": 0.00030720000000000004, "tps": 8213, "wall": 6136.0} {"step": 769, "train_loss": 5.331717491149902, "lr": 0.00030760000000000005, "tps": 8213, "wall": 6143.9} {"step": 770, "train_loss": 5.281200408935547, "lr": 0.000308, "tps": 8213, "wall": 6151.8} {"step": 771, "train_loss": 5.344422817230225, "lr": 0.0003084, "tps": 8213, "wall": 6159.8} {"step": 772, "train_loss": 5.264127254486084, "lr": 0.0003088, "tps": 8213, "wall": 6167.7} {"step": 773, "train_loss": 5.276521682739258, "lr": 0.00030920000000000003, "tps": 8213, "wall": 6175.6} {"step": 774, "train_loss": 5.411465644836426, "lr": 0.00030960000000000004, "tps": 8213, "wall": 6183.5} {"step": 775, "train_loss": 5.405810356140137, "lr": 0.00031, "tps": 8213, "wall": 6191.5} {"step": 776, "train_loss": 5.34330940246582, "lr": 0.0003104, "tps": 8213, "wall": 6199.5} {"step": 777, "train_loss": 5.423803806304932, "lr": 0.0003108, "tps": 8213, "wall": 6207.4} {"step": 778, "train_loss": 5.310341835021973, "lr": 0.00031120000000000003, "tps": 8213, "wall": 6215.3} {"step": 779, "train_loss": 5.295477390289307, "lr": 0.0003116, "tps": 8214, "wall": 6223.2} {"step": 780, "train_loss": 5.285206317901611, "lr": 0.000312, "tps": 8214, "wall": 6231.2} {"step": 781, "train_loss": 5.365818023681641, "lr": 0.0003124, "tps": 8214, "wall": 6239.1} {"step": 782, "train_loss": 5.251062393188477, "lr": 0.0003128, "tps": 8214, "wall": 6247.1} {"step": 783, "train_loss": 5.427029609680176, "lr": 0.0003132, "tps": 8214, "wall": 6255.1} {"step": 784, "train_loss": 5.237859725952148, "lr": 0.0003136, "tps": 8214, "wall": 6263.0} {"step": 785, "train_loss": 5.398069858551025, "lr": 0.000314, "tps": 8214, "wall": 6270.9} {"step": 786, "train_loss": 5.259491920471191, "lr": 0.0003144, "tps": 8214, "wall": 6278.8} {"step": 787, "train_loss": 5.332746505737305, "lr": 0.0003148, "tps": 8214, "wall": 6286.9} {"step": 788, "train_loss": 5.263917922973633, "lr": 0.0003152, "tps": 8214, "wall": 6294.8} {"step": 789, "train_loss": 5.2852888107299805, "lr": 0.0003156, "tps": 8214, "wall": 6302.7} {"step": 790, "train_loss": 5.285665988922119, "lr": 0.000316, "tps": 8214, "wall": 6310.7} {"step": 791, "train_loss": 5.28436279296875, "lr": 0.0003164, "tps": 8214, "wall": 6318.8} {"step": 792, "train_loss": 5.239752292633057, "lr": 0.0003168, "tps": 8214, "wall": 6326.7} {"step": 793, "train_loss": 5.344485282897949, "lr": 0.0003172, "tps": 8214, "wall": 6334.7} {"step": 794, "train_loss": 5.3622307777404785, "lr": 0.00031759999999999997, "tps": 8214, "wall": 6342.7} {"step": 795, "train_loss": 5.218603610992432, "lr": 0.00031800000000000003, "tps": 8214, "wall": 6350.7} {"step": 796, "train_loss": 5.362639427185059, "lr": 0.00031840000000000004, "tps": 8214, "wall": 6358.6} {"step": 797, "train_loss": 5.224099159240723, "lr": 0.00031880000000000005, "tps": 8214, "wall": 6366.5} {"step": 798, "train_loss": 5.308069229125977, "lr": 0.00031920000000000006, "tps": 8214, "wall": 6374.5} {"step": 799, "train_loss": 5.212588787078857, "lr": 0.0003196, "tps": 8214, "wall": 6382.6} {"step": 800, "train_loss": 5.349121570587158, "lr": 0.00032, "tps": 8214, "wall": 6390.5} {"step": 801, "train_loss": 5.2957305908203125, "lr": 0.00032040000000000004, "tps": 8214, "wall": 6398.5} {"step": 802, "train_loss": 5.384538650512695, "lr": 0.00032080000000000005, "tps": 8214, "wall": 6406.4} {"step": 803, "train_loss": 5.315651893615723, "lr": 0.00032120000000000006, "tps": 8214, "wall": 6414.4} {"step": 804, "train_loss": 5.32709264755249, "lr": 0.0003216, "tps": 8214, "wall": 6422.5} {"step": 805, "train_loss": 5.431555271148682, "lr": 0.000322, "tps": 8214, "wall": 6430.3} {"step": 806, "train_loss": 5.2603302001953125, "lr": 0.00032240000000000003, "tps": 8214, "wall": 6438.3} {"step": 807, "train_loss": 5.246528625488281, "lr": 0.00032280000000000004, "tps": 8214, "wall": 6446.3} {"step": 808, "train_loss": 5.272825717926025, "lr": 0.00032320000000000005, "tps": 8214, "wall": 6454.2} {"step": 809, "train_loss": 5.279551982879639, "lr": 0.0003236, "tps": 8214, "wall": 6462.1} {"step": 810, "train_loss": 5.212888717651367, "lr": 0.000324, "tps": 8214, "wall": 6469.9} {"step": 811, "train_loss": 5.2370171546936035, "lr": 0.0003244, "tps": 8214, "wall": 6477.9} {"step": 812, "train_loss": 5.105750560760498, "lr": 0.00032480000000000003, "tps": 8215, "wall": 6485.8} {"step": 813, "train_loss": 5.253546237945557, "lr": 0.0003252, "tps": 8214, "wall": 6493.9} {"step": 814, "train_loss": 5.298264503479004, "lr": 0.0003256, "tps": 8214, "wall": 6501.8} {"step": 815, "train_loss": 5.2315521240234375, "lr": 0.000326, "tps": 8215, "wall": 6509.6} {"step": 816, "train_loss": 5.2983832359313965, "lr": 0.0003264, "tps": 8215, "wall": 6517.6} {"step": 817, "train_loss": 5.261338233947754, "lr": 0.00032680000000000003, "tps": 8215, "wall": 6525.5} {"step": 818, "train_loss": 5.300230026245117, "lr": 0.0003272, "tps": 8215, "wall": 6533.5} {"step": 819, "train_loss": 5.317348480224609, "lr": 0.0003276, "tps": 8215, "wall": 6541.4} {"step": 820, "train_loss": 5.232231616973877, "lr": 0.000328, "tps": 8215, "wall": 6549.4} {"step": 821, "train_loss": 5.247647762298584, "lr": 0.0003284, "tps": 8215, "wall": 6557.4} {"step": 822, "train_loss": 5.207674503326416, "lr": 0.0003288, "tps": 8215, "wall": 6565.3} {"step": 823, "train_loss": 5.379413604736328, "lr": 0.0003292, "tps": 8215, "wall": 6573.2} {"step": 824, "train_loss": 5.253627300262451, "lr": 0.0003296, "tps": 8215, "wall": 6581.1} {"step": 825, "train_loss": 5.215616703033447, "lr": 0.00033, "tps": 8215, "wall": 6589.0} {"step": 826, "train_loss": 5.2558393478393555, "lr": 0.0003304, "tps": 8215, "wall": 6596.8} {"step": 827, "train_loss": 5.308377265930176, "lr": 0.0003308, "tps": 8215, "wall": 6604.7} {"step": 828, "train_loss": 5.364165782928467, "lr": 0.0003312, "tps": 8215, "wall": 6612.8} {"step": 829, "train_loss": 5.299557685852051, "lr": 0.0003316, "tps": 8216, "wall": 6620.6} {"step": 830, "train_loss": 5.2443766593933105, "lr": 0.000332, "tps": 8216, "wall": 6628.4} {"step": 831, "train_loss": 5.1883649826049805, "lr": 0.0003324, "tps": 8216, "wall": 6636.4} {"step": 832, "train_loss": 5.2448649406433105, "lr": 0.00033280000000000007, "tps": 8216, "wall": 6644.2} {"step": 833, "train_loss": 5.30685567855835, "lr": 0.0003332, "tps": 8216, "wall": 6652.1} {"step": 834, "train_loss": 5.334205627441406, "lr": 0.00033360000000000003, "tps": 8216, "wall": 6660.0} {"step": 835, "train_loss": 5.226640224456787, "lr": 0.00033400000000000004, "tps": 8216, "wall": 6668.0} {"step": 836, "train_loss": 5.403724193572998, "lr": 0.00033440000000000005, "tps": 8216, "wall": 6676.0} {"step": 837, "train_loss": 5.21420955657959, "lr": 0.00033480000000000006, "tps": 8216, "wall": 6683.8} {"step": 838, "train_loss": 5.371016502380371, "lr": 0.0003352, "tps": 8216, "wall": 6691.9} {"step": 839, "train_loss": 5.256168842315674, "lr": 0.0003356, "tps": 8216, "wall": 6699.7} {"step": 840, "train_loss": 5.276399612426758, "lr": 0.00033600000000000004, "tps": 8216, "wall": 6707.6} {"step": 841, "train_loss": 5.176352500915527, "lr": 0.00033640000000000005, "tps": 8216, "wall": 6715.6} {"step": 842, "train_loss": 5.141754150390625, "lr": 0.00033680000000000006, "tps": 8217, "wall": 6723.4} {"step": 843, "train_loss": 5.177907943725586, "lr": 0.0003372, "tps": 8216, "wall": 6731.5} {"step": 844, "train_loss": 5.133210182189941, "lr": 0.0003376, "tps": 8217, "wall": 6739.4} {"step": 845, "train_loss": 5.192574977874756, "lr": 0.00033800000000000003, "tps": 8217, "wall": 6747.3} {"step": 846, "train_loss": 5.2700114250183105, "lr": 0.00033840000000000004, "tps": 8217, "wall": 6755.1} {"step": 847, "train_loss": 5.3152360916137695, "lr": 0.0003388, "tps": 8217, "wall": 6763.0} {"step": 848, "train_loss": 5.228885650634766, "lr": 0.0003392, "tps": 8217, "wall": 6770.9} {"step": 849, "train_loss": 5.216063499450684, "lr": 0.0003396, "tps": 8217, "wall": 6778.8} {"step": 850, "train_loss": 5.173056602478027, "lr": 0.00034, "tps": 8217, "wall": 6786.7} {"step": 851, "train_loss": 5.231125831604004, "lr": 0.00034040000000000003, "tps": 8217, "wall": 6794.7} {"step": 852, "train_loss": 5.2592058181762695, "lr": 0.0003408, "tps": 8217, "wall": 6802.5} {"step": 853, "train_loss": 5.353560924530029, "lr": 0.0003412, "tps": 8218, "wall": 6810.4} {"step": 854, "train_loss": 5.196814060211182, "lr": 0.0003416, "tps": 8218, "wall": 6818.2} {"step": 855, "train_loss": 5.232926845550537, "lr": 0.000342, "tps": 8218, "wall": 6826.1} {"step": 856, "train_loss": 5.277395725250244, "lr": 0.00034240000000000003, "tps": 8218, "wall": 6834.1} {"step": 857, "train_loss": 5.222734451293945, "lr": 0.0003428, "tps": 8218, "wall": 6841.9} {"step": 858, "train_loss": 5.204154014587402, "lr": 0.0003432, "tps": 8218, "wall": 6849.8} {"step": 859, "train_loss": 5.211606025695801, "lr": 0.0003436, "tps": 8218, "wall": 6857.8} {"step": 860, "train_loss": 5.149078845977783, "lr": 0.000344, "tps": 8218, "wall": 6865.8} {"step": 861, "train_loss": 5.170357704162598, "lr": 0.0003444, "tps": 8218, "wall": 6873.8} {"step": 862, "train_loss": 5.158098220825195, "lr": 0.0003448, "tps": 8218, "wall": 6881.6} {"step": 863, "train_loss": 5.150259971618652, "lr": 0.0003452, "tps": 8218, "wall": 6889.5} {"step": 864, "train_loss": 5.182669639587402, "lr": 0.0003456, "tps": 8218, "wall": 6897.4} {"step": 865, "train_loss": 5.308904647827148, "lr": 0.000346, "tps": 8218, "wall": 6905.3} {"step": 866, "train_loss": 5.136135578155518, "lr": 0.0003464, "tps": 8218, "wall": 6913.3} {"step": 867, "train_loss": 5.256572723388672, "lr": 0.00034679999999999997, "tps": 8218, "wall": 6921.2} {"step": 868, "train_loss": 5.174912452697754, "lr": 0.0003472, "tps": 8219, "wall": 6929.1} {"step": 869, "train_loss": 5.167933464050293, "lr": 0.00034760000000000005, "tps": 8219, "wall": 6936.9} {"step": 870, "train_loss": 5.12449312210083, "lr": 0.00034800000000000006, "tps": 8219, "wall": 6944.8} {"step": 871, "train_loss": 5.183069229125977, "lr": 0.00034840000000000007, "tps": 8219, "wall": 6952.7} {"step": 872, "train_loss": 5.1747612953186035, "lr": 0.0003488, "tps": 8219, "wall": 6960.6} {"step": 873, "train_loss": 5.1776275634765625, "lr": 0.00034920000000000003, "tps": 8219, "wall": 6968.4} {"step": 874, "train_loss": 5.143501281738281, "lr": 0.00034960000000000004, "tps": 8219, "wall": 6976.3} {"step": 875, "train_loss": 5.198053359985352, "lr": 0.00035000000000000005, "tps": 8219, "wall": 6984.2} {"step": 876, "train_loss": 5.229363441467285, "lr": 0.0003504, "tps": 8220, "wall": 6992.1} {"step": 877, "train_loss": 5.172265529632568, "lr": 0.0003508, "tps": 8220, "wall": 6999.9} {"step": 878, "train_loss": 5.196827411651611, "lr": 0.0003512, "tps": 8220, "wall": 7007.7} {"step": 879, "train_loss": 5.136916637420654, "lr": 0.00035160000000000004, "tps": 8220, "wall": 7015.5} {"step": 880, "train_loss": 5.112915992736816, "lr": 0.00035200000000000005, "tps": 8220, "wall": 7023.3} {"step": 881, "train_loss": 5.043799877166748, "lr": 0.0003524, "tps": 8220, "wall": 7031.4} {"step": 882, "train_loss": 5.2116169929504395, "lr": 0.0003528, "tps": 8220, "wall": 7039.4} {"step": 883, "train_loss": 5.219935417175293, "lr": 0.0003532, "tps": 8220, "wall": 7047.2} {"step": 884, "train_loss": 5.250269889831543, "lr": 0.00035360000000000003, "tps": 8220, "wall": 7055.1} {"step": 885, "train_loss": 5.136037349700928, "lr": 0.00035400000000000004, "tps": 8220, "wall": 7063.0} {"step": 886, "train_loss": 5.0916948318481445, "lr": 0.0003544, "tps": 8221, "wall": 7070.8} {"step": 887, "train_loss": 5.07633638381958, "lr": 0.0003548, "tps": 8221, "wall": 7078.8} {"step": 888, "train_loss": 5.043059349060059, "lr": 0.0003552, "tps": 8221, "wall": 7086.7} {"step": 889, "train_loss": 5.079103946685791, "lr": 0.0003556, "tps": 8221, "wall": 7094.6} {"step": 890, "train_loss": 5.281242370605469, "lr": 0.00035600000000000003, "tps": 8221, "wall": 7102.4} {"step": 891, "train_loss": 5.0999908447265625, "lr": 0.0003564, "tps": 8221, "wall": 7110.3} {"step": 892, "train_loss": 5.087121963500977, "lr": 0.0003568, "tps": 8221, "wall": 7118.1} {"step": 893, "train_loss": 5.1715989112854, "lr": 0.0003572, "tps": 8221, "wall": 7126.0} {"step": 894, "train_loss": 5.0790324211120605, "lr": 0.0003576, "tps": 8222, "wall": 7133.8} {"step": 895, "train_loss": 5.222184181213379, "lr": 0.00035800000000000003, "tps": 8222, "wall": 7141.6} {"step": 896, "train_loss": 5.1994500160217285, "lr": 0.0003584, "tps": 8222, "wall": 7149.5} {"step": 897, "train_loss": 5.222716331481934, "lr": 0.0003588, "tps": 8222, "wall": 7157.5} {"step": 898, "train_loss": 5.140061855316162, "lr": 0.0003592, "tps": 8222, "wall": 7165.3} {"step": 899, "train_loss": 5.084072589874268, "lr": 0.0003596, "tps": 8222, "wall": 7173.2} {"step": 900, "train_loss": 5.114589691162109, "lr": 0.00036, "tps": 8222, "wall": 7181.1} {"step": 901, "train_loss": 5.204066753387451, "lr": 0.0003604, "tps": 8222, "wall": 7188.9} {"step": 902, "train_loss": 5.194717884063721, "lr": 0.0003608, "tps": 8222, "wall": 7196.8} {"step": 903, "train_loss": 5.177615165710449, "lr": 0.0003612, "tps": 8223, "wall": 7204.7} {"step": 904, "train_loss": 5.17513370513916, "lr": 0.0003616, "tps": 8223, "wall": 7212.6} {"step": 905, "train_loss": 5.148855209350586, "lr": 0.000362, "tps": 8223, "wall": 7220.5} {"step": 906, "train_loss": 5.141429901123047, "lr": 0.0003624, "tps": 8223, "wall": 7228.3} {"step": 907, "train_loss": 5.106249809265137, "lr": 0.00036280000000000004, "tps": 8223, "wall": 7236.2} {"step": 908, "train_loss": 5.068938255310059, "lr": 0.00036320000000000005, "tps": 8223, "wall": 7244.0} {"step": 909, "train_loss": 5.1794633865356445, "lr": 0.00036360000000000006, "tps": 8223, "wall": 7252.0} {"step": 910, "train_loss": 5.141506671905518, "lr": 0.000364, "tps": 8223, "wall": 7259.7} {"step": 911, "train_loss": 5.150445938110352, "lr": 0.0003644, "tps": 8223, "wall": 7267.6} {"step": 912, "train_loss": 5.152048110961914, "lr": 0.00036480000000000003, "tps": 8223, "wall": 7275.7} {"step": 913, "train_loss": 5.148883819580078, "lr": 0.00036520000000000004, "tps": 8224, "wall": 7283.5} {"step": 914, "train_loss": 5.1529221534729, "lr": 0.00036560000000000005, "tps": 8224, "wall": 7291.3} {"step": 915, "train_loss": 5.162792205810547, "lr": 0.000366, "tps": 8224, "wall": 7299.2} {"step": 916, "train_loss": 5.210881233215332, "lr": 0.0003664, "tps": 8224, "wall": 7307.1} {"step": 917, "train_loss": 5.159272193908691, "lr": 0.0003668, "tps": 8224, "wall": 7314.9} {"step": 918, "train_loss": 5.07550048828125, "lr": 0.00036720000000000004, "tps": 8224, "wall": 7322.8} {"step": 919, "train_loss": 5.165005683898926, "lr": 0.00036760000000000004, "tps": 8224, "wall": 7330.7} {"step": 920, "train_loss": 5.032782554626465, "lr": 0.000368, "tps": 8224, "wall": 7339.0} {"step": 921, "train_loss": 5.116034030914307, "lr": 0.0003684, "tps": 8224, "wall": 7346.9} {"step": 922, "train_loss": 5.0578508377075195, "lr": 0.0003688, "tps": 8224, "wall": 7354.8} {"step": 923, "train_loss": 5.162692070007324, "lr": 0.00036920000000000003, "tps": 8224, "wall": 7362.7} {"step": 924, "train_loss": 5.169073104858398, "lr": 0.00036960000000000004, "tps": 8224, "wall": 7370.6} {"step": 925, "train_loss": 5.106270790100098, "lr": 0.00037, "tps": 8224, "wall": 7378.4} {"step": 926, "train_loss": 5.154305458068848, "lr": 0.0003704, "tps": 8224, "wall": 7386.3} {"step": 927, "train_loss": 5.055850028991699, "lr": 0.0003708, "tps": 8224, "wall": 7394.3} {"step": 928, "train_loss": 5.059996128082275, "lr": 0.0003712, "tps": 8225, "wall": 7402.2} {"step": 929, "train_loss": 5.066558837890625, "lr": 0.00037160000000000003, "tps": 8225, "wall": 7410.0} {"step": 930, "train_loss": 5.116373062133789, "lr": 0.000372, "tps": 8225, "wall": 7417.9} {"step": 931, "train_loss": 5.132394790649414, "lr": 0.0003724, "tps": 8225, "wall": 7425.8} {"step": 932, "train_loss": 5.18654203414917, "lr": 0.0003728, "tps": 8225, "wall": 7433.7} {"step": 933, "train_loss": 5.096957683563232, "lr": 0.0003732, "tps": 8225, "wall": 7441.5} {"step": 934, "train_loss": 5.06719970703125, "lr": 0.00037360000000000003, "tps": 8225, "wall": 7449.5} {"step": 935, "train_loss": 5.094935417175293, "lr": 0.000374, "tps": 8225, "wall": 7457.4} {"step": 936, "train_loss": 5.0611186027526855, "lr": 0.0003744, "tps": 8225, "wall": 7465.3} {"step": 937, "train_loss": 5.013148307800293, "lr": 0.0003748, "tps": 8225, "wall": 7473.2} {"step": 938, "train_loss": 5.238504409790039, "lr": 0.0003752, "tps": 8225, "wall": 7481.0} {"step": 939, "train_loss": 5.125873565673828, "lr": 0.0003756, "tps": 8226, "wall": 7488.9} {"step": 940, "train_loss": 4.999767780303955, "lr": 0.000376, "tps": 8226, "wall": 7496.7} {"step": 941, "train_loss": 5.075995445251465, "lr": 0.0003764, "tps": 8226, "wall": 7504.6} {"step": 942, "train_loss": 5.132859230041504, "lr": 0.0003768, "tps": 8226, "wall": 7512.6} {"step": 943, "train_loss": 5.0206379890441895, "lr": 0.00037720000000000006, "tps": 8226, "wall": 7520.5} {"step": 944, "train_loss": 5.07814359664917, "lr": 0.0003776, "tps": 8226, "wall": 7528.4} {"step": 945, "train_loss": 5.113105773925781, "lr": 0.000378, "tps": 8226, "wall": 7536.3} {"step": 946, "train_loss": 5.10667085647583, "lr": 0.00037840000000000004, "tps": 8226, "wall": 7544.1} {"step": 947, "train_loss": 5.177572727203369, "lr": 0.00037880000000000005, "tps": 8226, "wall": 7552.1} {"step": 948, "train_loss": 5.101136684417725, "lr": 0.00037920000000000006, "tps": 8226, "wall": 7559.9} {"step": 949, "train_loss": 5.039100170135498, "lr": 0.0003796, "tps": 8226, "wall": 7567.9} {"step": 950, "train_loss": 5.061150074005127, "lr": 0.00038, "tps": 8226, "wall": 7575.9} {"step": 951, "train_loss": 5.007184028625488, "lr": 0.00038040000000000003, "tps": 8226, "wall": 7583.7} {"step": 952, "train_loss": 5.0814409255981445, "lr": 0.00038080000000000004, "tps": 8226, "wall": 7591.6} {"step": 953, "train_loss": 5.096714973449707, "lr": 0.00038120000000000005, "tps": 8227, "wall": 7599.5} {"step": 954, "train_loss": 5.081258296966553, "lr": 0.0003816, "tps": 8227, "wall": 7607.3} {"step": 955, "train_loss": 4.90668249130249, "lr": 0.000382, "tps": 8227, "wall": 7615.2} {"step": 956, "train_loss": 4.991013526916504, "lr": 0.0003824, "tps": 8227, "wall": 7623.1} {"step": 957, "train_loss": 5.092946529388428, "lr": 0.00038280000000000003, "tps": 8227, "wall": 7631.1} {"step": 958, "train_loss": 4.96461296081543, "lr": 0.00038320000000000004, "tps": 8227, "wall": 7638.9} {"step": 959, "train_loss": 5.0375847816467285, "lr": 0.0003836, "tps": 8227, "wall": 7646.8} {"step": 960, "train_loss": 4.963925838470459, "lr": 0.000384, "tps": 8227, "wall": 7654.7} {"step": 961, "train_loss": 5.035660743713379, "lr": 0.0003844, "tps": 8227, "wall": 7662.5} {"step": 962, "train_loss": 4.964784145355225, "lr": 0.00038480000000000003, "tps": 8227, "wall": 7670.3} {"step": 963, "train_loss": 4.991646766662598, "lr": 0.00038520000000000004, "tps": 8228, "wall": 7678.2} {"step": 964, "train_loss": 4.992018699645996, "lr": 0.0003856, "tps": 8228, "wall": 7686.0} {"step": 965, "train_loss": 5.0902557373046875, "lr": 0.000386, "tps": 8228, "wall": 7693.9} {"step": 966, "train_loss": 5.067432880401611, "lr": 0.0003864, "tps": 8228, "wall": 7701.8} {"step": 967, "train_loss": 5.043779373168945, "lr": 0.0003868, "tps": 8228, "wall": 7709.6} {"step": 968, "train_loss": 5.089406490325928, "lr": 0.00038720000000000003, "tps": 8228, "wall": 7717.4} {"step": 969, "train_loss": 4.9587602615356445, "lr": 0.0003876, "tps": 8228, "wall": 7725.4} {"step": 970, "train_loss": 5.059728145599365, "lr": 0.000388, "tps": 8228, "wall": 7733.2} {"step": 971, "train_loss": 4.933650016784668, "lr": 0.0003884, "tps": 8228, "wall": 7741.1} {"step": 972, "train_loss": 5.021586894989014, "lr": 0.0003888, "tps": 8229, "wall": 7749.0} {"step": 973, "train_loss": 5.0312910079956055, "lr": 0.00038920000000000003, "tps": 8228, "wall": 7757.0} {"step": 974, "train_loss": 5.045805931091309, "lr": 0.0003896, "tps": 8229, "wall": 7764.9} {"step": 975, "train_loss": 5.06046199798584, "lr": 0.00039, "tps": 8229, "wall": 7772.8} {"step": 976, "train_loss": 5.068984031677246, "lr": 0.0003904, "tps": 8229, "wall": 7780.7} {"step": 977, "train_loss": 4.935007572174072, "lr": 0.0003908, "tps": 8229, "wall": 7788.5} {"step": 978, "train_loss": 5.091857433319092, "lr": 0.00039119999999999997, "tps": 8229, "wall": 7796.4} {"step": 979, "train_loss": 4.997890472412109, "lr": 0.0003916, "tps": 8229, "wall": 7804.3} {"step": 980, "train_loss": 5.0711588859558105, "lr": 0.00039200000000000004, "tps": 8229, "wall": 7812.3} {"step": 981, "train_loss": 4.980260848999023, "lr": 0.00039240000000000005, "tps": 8229, "wall": 7820.2} {"step": 982, "train_loss": 5.0436811447143555, "lr": 0.00039280000000000006, "tps": 8229, "wall": 7828.1} {"step": 983, "train_loss": 5.0046892166137695, "lr": 0.0003932, "tps": 8229, "wall": 7836.0} {"step": 984, "train_loss": 5.021867752075195, "lr": 0.0003936, "tps": 8229, "wall": 7843.9} {"step": 985, "train_loss": 4.956333160400391, "lr": 0.00039400000000000004, "tps": 8229, "wall": 7851.7} {"step": 986, "train_loss": 4.918623447418213, "lr": 0.00039440000000000005, "tps": 8229, "wall": 7859.6} {"step": 987, "train_loss": 4.987807273864746, "lr": 0.00039480000000000006, "tps": 8230, "wall": 7867.4} {"step": 988, "train_loss": 5.071261405944824, "lr": 0.0003952, "tps": 8230, "wall": 7875.4} {"step": 989, "train_loss": 5.012908935546875, "lr": 0.0003956, "tps": 8230, "wall": 7883.4} {"step": 990, "train_loss": 5.039987564086914, "lr": 0.00039600000000000003, "tps": 8230, "wall": 7891.3} {"step": 991, "train_loss": 5.064021587371826, "lr": 0.00039640000000000004, "tps": 8230, "wall": 7899.1} {"step": 992, "train_loss": 5.025051593780518, "lr": 0.00039680000000000005, "tps": 8230, "wall": 7907.0} {"step": 993, "train_loss": 5.032013416290283, "lr": 0.0003972, "tps": 8230, "wall": 7914.8} {"step": 994, "train_loss": 4.972027778625488, "lr": 0.0003976, "tps": 8230, "wall": 7922.7} {"step": 995, "train_loss": 4.994180679321289, "lr": 0.000398, "tps": 8230, "wall": 7930.6} {"step": 996, "train_loss": 5.034337997436523, "lr": 0.00039840000000000003, "tps": 8230, "wall": 7938.5} {"step": 997, "train_loss": 4.910403251647949, "lr": 0.00039880000000000004, "tps": 8230, "wall": 7946.4} {"step": 998, "train_loss": 4.872997760772705, "lr": 0.0003992, "tps": 8230, "wall": 7954.3} {"step": 999, "train_loss": 4.898589134216309, "lr": 0.0003996, "tps": 8230, "wall": 7962.2} {"step": 1000, "train_loss": 4.9435601234436035, "lr": 0.0004, "tps": 8231, "wall": 7970.0, "val_loss_monitor": 4.992207848305834} {"step": 1001, "train_loss": 5.045272350311279, "lr": 0.00039999999898047517, "tps": 8180, "wall": 8026.9} {"step": 1002, "train_loss": 5.061905384063721, "lr": 0.00039999999592190056, "tps": 8181, "wall": 8034.8} {"step": 1003, "train_loss": 4.978282928466797, "lr": 0.00039999999082427625, "tps": 8181, "wall": 8042.8} {"step": 1004, "train_loss": 4.865948677062988, "lr": 0.00039999998368760235, "tps": 8180, "wall": 8050.8} {"step": 1005, "train_loss": 4.9350738525390625, "lr": 0.0003999999745118789, "tps": 8180, "wall": 8058.9} {"step": 1006, "train_loss": 5.010183811187744, "lr": 0.00039999996329710593, "tps": 8181, "wall": 8066.8} {"step": 1007, "train_loss": 5.137956142425537, "lr": 0.00039999995004328374, "tps": 8180, "wall": 8074.8} {"step": 1008, "train_loss": 4.966292381286621, "lr": 0.0003999999347504123, "tps": 8181, "wall": 8082.8} {"step": 1009, "train_loss": 4.946002960205078, "lr": 0.00039999991741849187, "tps": 8181, "wall": 8090.8} {"step": 1010, "train_loss": 5.1181254386901855, "lr": 0.0003999998980475227, "tps": 8181, "wall": 8098.7} {"step": 1011, "train_loss": 4.9694108963012695, "lr": 0.00039999987663750483, "tps": 8181, "wall": 8106.7} {"step": 1012, "train_loss": 4.956024169921875, "lr": 0.0003999998531884387, "tps": 8181, "wall": 8114.7} {"step": 1013, "train_loss": 4.9146552085876465, "lr": 0.00039999982770032446, "tps": 8181, "wall": 8122.6} {"step": 1014, "train_loss": 5.021173477172852, "lr": 0.0003999998001731625, "tps": 8181, "wall": 8130.5} {"step": 1015, "train_loss": 4.948258399963379, "lr": 0.00039999977060695304, "tps": 8181, "wall": 8138.4} {"step": 1016, "train_loss": 4.935249328613281, "lr": 0.00039999973900169643, "tps": 8181, "wall": 8146.5} {"step": 1017, "train_loss": 4.915841102600098, "lr": 0.000399999705357393, "tps": 8181, "wall": 8154.3} {"step": 1018, "train_loss": 4.895730018615723, "lr": 0.0003999996696740432, "tps": 8181, "wall": 8162.2} {"step": 1019, "train_loss": 4.9482879638671875, "lr": 0.00039999963195164743, "tps": 8181, "wall": 8170.1} {"step": 1020, "train_loss": 5.058908939361572, "lr": 0.0003999995921902061, "tps": 8181, "wall": 8178.2} {"step": 1021, "train_loss": 5.04762077331543, "lr": 0.0003999995503897196, "tps": 8181, "wall": 8186.1} {"step": 1022, "train_loss": 4.925821781158447, "lr": 0.0003999995065501884, "tps": 8181, "wall": 8194.0} {"step": 1023, "train_loss": 5.0881476402282715, "lr": 0.00039999946067161316, "tps": 8182, "wall": 8201.9} {"step": 1024, "train_loss": 4.9279584884643555, "lr": 0.0003999994127539943, "tps": 8182, "wall": 8209.8} {"step": 1025, "train_loss": 4.991594314575195, "lr": 0.0003999993627973323, "tps": 8182, "wall": 8217.7} {"step": 1026, "train_loss": 4.989718437194824, "lr": 0.0003999993108016278, "tps": 8182, "wall": 8225.5} {"step": 1027, "train_loss": 4.8588104248046875, "lr": 0.00039999925676688136, "tps": 8182, "wall": 8233.5} {"step": 1028, "train_loss": 4.989034175872803, "lr": 0.0003999992006930936, "tps": 8182, "wall": 8241.4} {"step": 1029, "train_loss": 5.077073097229004, "lr": 0.00039999914258026514, "tps": 8182, "wall": 8249.3} {"step": 1030, "train_loss": 4.923821449279785, "lr": 0.0003999990824283967, "tps": 8182, "wall": 8257.1} {"step": 1031, "train_loss": 4.971362590789795, "lr": 0.0003999990202374889, "tps": 8183, "wall": 8264.9} {"step": 1032, "train_loss": 4.9785966873168945, "lr": 0.0003999989560075425, "tps": 8183, "wall": 8272.9} {"step": 1033, "train_loss": 4.903679847717285, "lr": 0.0003999988897385581, "tps": 8183, "wall": 8280.8} {"step": 1034, "train_loss": 4.953607559204102, "lr": 0.0003999988214305366, "tps": 8183, "wall": 8288.6} {"step": 1035, "train_loss": 5.075329780578613, "lr": 0.0003999987510834787, "tps": 8183, "wall": 8296.6} {"step": 1036, "train_loss": 5.004819869995117, "lr": 0.00039999867869738517, "tps": 8183, "wall": 8304.5} {"step": 1037, "train_loss": 4.959005355834961, "lr": 0.0003999986042722569, "tps": 8183, "wall": 8312.3} {"step": 1038, "train_loss": 4.941742897033691, "lr": 0.0003999985278080947, "tps": 8183, "wall": 8320.1} {"step": 1039, "train_loss": 4.938665390014648, "lr": 0.0003999984493048995, "tps": 8184, "wall": 8328.1} {"step": 1040, "train_loss": 4.962063312530518, "lr": 0.000399998368762672, "tps": 8184, "wall": 8335.9} {"step": 1041, "train_loss": 4.897371292114258, "lr": 0.00039999828618141335, "tps": 8184, "wall": 8343.8} {"step": 1042, "train_loss": 4.994592666625977, "lr": 0.0003999982015611244, "tps": 8184, "wall": 8351.7} {"step": 1043, "train_loss": 4.875363349914551, "lr": 0.000399998114901806, "tps": 8184, "wall": 8359.6} {"step": 1044, "train_loss": 4.871382236480713, "lr": 0.00039999802620345926, "tps": 8184, "wall": 8367.6} {"step": 1045, "train_loss": 4.844536781311035, "lr": 0.0003999979354660851, "tps": 8184, "wall": 8375.4} {"step": 1046, "train_loss": 4.931535720825195, "lr": 0.0003999978426896846, "tps": 8184, "wall": 8383.3} {"step": 1047, "train_loss": 4.924246311187744, "lr": 0.00039999774787425886, "tps": 8184, "wall": 8391.2} {"step": 1048, "train_loss": 4.870777606964111, "lr": 0.00039999765101980883, "tps": 8185, "wall": 8399.1} {"step": 1049, "train_loss": 4.8874897956848145, "lr": 0.00039999755212633567, "tps": 8185, "wall": 8407.0} {"step": 1050, "train_loss": 4.910763263702393, "lr": 0.0003999974511938405, "tps": 8185, "wall": 8414.9} {"step": 1051, "train_loss": 4.872481346130371, "lr": 0.00039999734822232454, "tps": 8185, "wall": 8422.7} {"step": 1052, "train_loss": 4.920723915100098, "lr": 0.00039999724321178884, "tps": 8185, "wall": 8430.6} {"step": 1053, "train_loss": 4.994449138641357, "lr": 0.0003999971361622346, "tps": 8185, "wall": 8438.5} {"step": 1054, "train_loss": 4.8473029136657715, "lr": 0.0003999970270736631, "tps": 8185, "wall": 8446.4} {"step": 1055, "train_loss": 4.9855146408081055, "lr": 0.00039999691594607556, "tps": 8186, "wall": 8454.2} {"step": 1056, "train_loss": 4.9366068840026855, "lr": 0.0003999968027794731, "tps": 8186, "wall": 8462.0} {"step": 1057, "train_loss": 4.922293663024902, "lr": 0.00039999668757385724, "tps": 8186, "wall": 8469.9} {"step": 1058, "train_loss": 4.84320068359375, "lr": 0.0003999965703292291, "tps": 8186, "wall": 8477.9} {"step": 1059, "train_loss": 4.894876480102539, "lr": 0.00039999645104559016, "tps": 8186, "wall": 8485.8} {"step": 1060, "train_loss": 4.787520885467529, "lr": 0.0003999963297229416, "tps": 8186, "wall": 8493.6} {"step": 1061, "train_loss": 4.927883148193359, "lr": 0.00039999620636128495, "tps": 8186, "wall": 8501.6} {"step": 1062, "train_loss": 4.864121437072754, "lr": 0.00039999608096062146, "tps": 8186, "wall": 8509.5} {"step": 1063, "train_loss": 4.885068893432617, "lr": 0.0003999959535209527, "tps": 8186, "wall": 8517.3} {"step": 1064, "train_loss": 4.842036724090576, "lr": 0.00039999582404228, "tps": 8187, "wall": 8525.2} {"step": 1065, "train_loss": 4.873863220214844, "lr": 0.0003999956925246048, "tps": 8187, "wall": 8533.2} {"step": 1066, "train_loss": 4.827798366546631, "lr": 0.0003999955589679288, "tps": 8187, "wall": 8541.0} {"step": 1067, "train_loss": 4.964442253112793, "lr": 0.00039999542337225327, "tps": 8187, "wall": 8548.9} {"step": 1068, "train_loss": 4.928494930267334, "lr": 0.0003999952857375799, "tps": 8187, "wall": 8556.8} {"step": 1069, "train_loss": 4.876481533050537, "lr": 0.00039999514606391015, "tps": 8187, "wall": 8564.6} {"step": 1070, "train_loss": 4.8393731117248535, "lr": 0.00039999500435124565, "tps": 8187, "wall": 8572.4} {"step": 1071, "train_loss": 4.862422466278076, "lr": 0.00039999486059958805, "tps": 8187, "wall": 8580.3} {"step": 1072, "train_loss": 4.824560642242432, "lr": 0.0003999947148089389, "tps": 8188, "wall": 8588.2} {"step": 1073, "train_loss": 4.855657577514648, "lr": 0.0003999945669792999, "tps": 8188, "wall": 8596.1} {"step": 1074, "train_loss": 4.890350341796875, "lr": 0.0003999944171106727, "tps": 8188, "wall": 8603.9} {"step": 1075, "train_loss": 4.86351203918457, "lr": 0.000399994265203059, "tps": 8188, "wall": 8611.9} {"step": 1076, "train_loss": 4.9004364013671875, "lr": 0.0003999941112564605, "tps": 8188, "wall": 8619.8} {"step": 1077, "train_loss": 4.830790042877197, "lr": 0.000399993955270879, "tps": 8188, "wall": 8627.6} {"step": 1078, "train_loss": 4.844696044921875, "lr": 0.00039999379724631624, "tps": 8188, "wall": 8635.5} {"step": 1079, "train_loss": 4.793303489685059, "lr": 0.000399993637182774, "tps": 8188, "wall": 8643.4} {"step": 1080, "train_loss": 4.761898517608643, "lr": 0.00039999347508025407, "tps": 8188, "wall": 8651.4} {"step": 1081, "train_loss": 4.8622941970825195, "lr": 0.00039999331093875843, "tps": 8188, "wall": 8659.2} {"step": 1082, "train_loss": 4.970963954925537, "lr": 0.0003999931447582887, "tps": 8189, "wall": 8667.1} {"step": 1083, "train_loss": 4.852688789367676, "lr": 0.0003999929765388469, "tps": 8189, "wall": 8675.0} {"step": 1084, "train_loss": 4.968208312988281, "lr": 0.00039999280628043494, "tps": 8189, "wall": 8682.9} {"step": 1085, "train_loss": 4.8815107345581055, "lr": 0.00039999263398305475, "tps": 8189, "wall": 8690.7} {"step": 1086, "train_loss": 4.906038761138916, "lr": 0.0003999924596467083, "tps": 8189, "wall": 8698.6} {"step": 1087, "train_loss": 4.837263107299805, "lr": 0.0003999922832713975, "tps": 8189, "wall": 8706.4} {"step": 1088, "train_loss": 4.889171600341797, "lr": 0.0003999921048571244, "tps": 8189, "wall": 8714.4} {"step": 1089, "train_loss": 4.977303504943848, "lr": 0.00039999192440389093, "tps": 8189, "wall": 8722.2} {"step": 1090, "train_loss": 4.847591400146484, "lr": 0.0003999917419116992, "tps": 8190, "wall": 8730.1} {"step": 1091, "train_loss": 4.912111759185791, "lr": 0.00039999155738055137, "tps": 8190, "wall": 8737.9} {"step": 1092, "train_loss": 4.776633262634277, "lr": 0.00039999137081044944, "tps": 8190, "wall": 8745.8} {"step": 1093, "train_loss": 4.87253999710083, "lr": 0.00039999118220139545, "tps": 8190, "wall": 8753.7} {"step": 1094, "train_loss": 4.843990325927734, "lr": 0.0003999909915533916, "tps": 8190, "wall": 8761.6} {"step": 1095, "train_loss": 4.8224968910217285, "lr": 0.00039999079886644015, "tps": 8190, "wall": 8769.4} {"step": 1096, "train_loss": 4.8327789306640625, "lr": 0.00039999060414054317, "tps": 8190, "wall": 8777.4} {"step": 1097, "train_loss": 4.905767917633057, "lr": 0.0003999904073757028, "tps": 8190, "wall": 8785.2} {"step": 1098, "train_loss": 4.7770209312438965, "lr": 0.0003999902085719215, "tps": 8190, "wall": 8793.1} {"step": 1099, "train_loss": 4.912321090698242, "lr": 0.00039999000772920126, "tps": 8191, "wall": 8800.9} {"step": 1100, "train_loss": 4.805744171142578, "lr": 0.00039998980484754447, "tps": 8191, "wall": 8808.8} {"step": 1101, "train_loss": 4.702916622161865, "lr": 0.0003999895999269535, "tps": 8191, "wall": 8816.6} {"step": 1102, "train_loss": 4.796922206878662, "lr": 0.0003999893929674306, "tps": 8191, "wall": 8824.6} {"step": 1103, "train_loss": 4.868038654327393, "lr": 0.0003999891839689781, "tps": 8191, "wall": 8832.4} {"step": 1104, "train_loss": 4.8100972175598145, "lr": 0.00039998897293159834, "tps": 8191, "wall": 8840.4} {"step": 1105, "train_loss": 4.700133323669434, "lr": 0.0003999887598552938, "tps": 8191, "wall": 8848.1} {"step": 1106, "train_loss": 4.774001121520996, "lr": 0.0003999885447400669, "tps": 8191, "wall": 8856.0} {"step": 1107, "train_loss": 4.734935283660889, "lr": 0.00039998832758592, "tps": 8192, "wall": 8863.9} {"step": 1108, "train_loss": 4.742660045623779, "lr": 0.00039998810839285556, "tps": 8192, "wall": 8871.7} {"step": 1109, "train_loss": 4.75625467300415, "lr": 0.0003999878871608761, "tps": 8192, "wall": 8879.6} {"step": 1110, "train_loss": 4.845061302185059, "lr": 0.00039998766388998414, "tps": 8192, "wall": 8887.5} {"step": 1111, "train_loss": 4.7738752365112305, "lr": 0.00039998743858018213, "tps": 8192, "wall": 8895.4} {"step": 1112, "train_loss": 4.799306869506836, "lr": 0.0003999872112314727, "tps": 8192, "wall": 8903.3} {"step": 1113, "train_loss": 4.7935967445373535, "lr": 0.00039998698184385846, "tps": 8192, "wall": 8911.0} {"step": 1114, "train_loss": 4.791575908660889, "lr": 0.00039998675041734194, "tps": 8193, "wall": 8918.9} {"step": 1115, "train_loss": 4.8694539070129395, "lr": 0.0003999865169519257, "tps": 8193, "wall": 8926.7} {"step": 1116, "train_loss": 4.845602512359619, "lr": 0.0003999862814476125, "tps": 8193, "wall": 8934.5} {"step": 1117, "train_loss": 4.830136299133301, "lr": 0.00039998604390440503, "tps": 8193, "wall": 8942.4} {"step": 1118, "train_loss": 4.743980884552002, "lr": 0.00039998580432230586, "tps": 8193, "wall": 8950.2} {"step": 1119, "train_loss": 4.77908182144165, "lr": 0.00039998556270131767, "tps": 8193, "wall": 8958.2} {"step": 1120, "train_loss": 4.857384204864502, "lr": 0.0003999853190414434, "tps": 8193, "wall": 8966.0} {"step": 1121, "train_loss": 4.821906566619873, "lr": 0.0003999850733426857, "tps": 8193, "wall": 8973.9} {"step": 1122, "train_loss": 4.917291641235352, "lr": 0.00039998482560504737, "tps": 8194, "wall": 8981.8} {"step": 1123, "train_loss": 4.870391368865967, "lr": 0.00039998457582853116, "tps": 8194, "wall": 8989.7} {"step": 1124, "train_loss": 4.880152702331543, "lr": 0.0003999843240131399, "tps": 8194, "wall": 8997.6} {"step": 1125, "train_loss": 4.896996021270752, "lr": 0.0003999840701588765, "tps": 8194, "wall": 9005.4} {"step": 1126, "train_loss": 4.845821380615234, "lr": 0.00039998381426574383, "tps": 8194, "wall": 9013.4} {"step": 1127, "train_loss": 4.808712005615234, "lr": 0.00039998355633374483, "tps": 8194, "wall": 9021.3} {"step": 1128, "train_loss": 4.6866841316223145, "lr": 0.00039998329636288234, "tps": 8194, "wall": 9029.2} {"step": 1129, "train_loss": 4.765096664428711, "lr": 0.00039998303435315923, "tps": 8194, "wall": 9037.1} {"step": 1130, "train_loss": 4.739654541015625, "lr": 0.0003999827703045787, "tps": 8194, "wall": 9045.0} {"step": 1131, "train_loss": 5.009300708770752, "lr": 0.0003999825042171435, "tps": 8194, "wall": 9052.9} {"step": 1132, "train_loss": 4.7806315422058105, "lr": 0.0003999822360908569, "tps": 8194, "wall": 9060.8} {"step": 1133, "train_loss": 4.831971168518066, "lr": 0.0003999819659257217, "tps": 8194, "wall": 9068.7} {"step": 1134, "train_loss": 4.897317886352539, "lr": 0.00039998169372174107, "tps": 8194, "wall": 9076.7} {"step": 1135, "train_loss": 4.797842025756836, "lr": 0.00039998141947891806, "tps": 8195, "wall": 9084.5} {"step": 1136, "train_loss": 4.811625003814697, "lr": 0.00039998114319725575, "tps": 8195, "wall": 9092.4} {"step": 1137, "train_loss": 4.796964168548584, "lr": 0.00039998086487675737, "tps": 8195, "wall": 9100.2} {"step": 1138, "train_loss": 4.67112922668457, "lr": 0.000399980584517426, "tps": 8195, "wall": 9108.1} {"step": 1139, "train_loss": 4.776609420776367, "lr": 0.00039998030211926486, "tps": 8195, "wall": 9116.0} {"step": 1140, "train_loss": 4.734410285949707, "lr": 0.0003999800176822771, "tps": 8195, "wall": 9123.8} {"step": 1141, "train_loss": 4.806573867797852, "lr": 0.000399979731206466, "tps": 8195, "wall": 9131.8} {"step": 1142, "train_loss": 4.7178802490234375, "lr": 0.00039997944269183476, "tps": 8195, "wall": 9139.7} {"step": 1143, "train_loss": 4.812088966369629, "lr": 0.0003999791521383866, "tps": 8195, "wall": 9147.6} {"step": 1144, "train_loss": 4.798398494720459, "lr": 0.00039997885954612487, "tps": 8196, "wall": 9155.4} {"step": 1145, "train_loss": 4.74282169342041, "lr": 0.00039997856491505294, "tps": 8196, "wall": 9163.3} {"step": 1146, "train_loss": 4.813595771789551, "lr": 0.00039997826824517406, "tps": 8196, "wall": 9171.1} {"step": 1147, "train_loss": 4.735983371734619, "lr": 0.0003999779695364916, "tps": 8196, "wall": 9179.0} {"step": 1148, "train_loss": 4.80549955368042, "lr": 0.000399977668789009, "tps": 8196, "wall": 9186.9} {"step": 1149, "train_loss": 4.703988552093506, "lr": 0.00039997736600272957, "tps": 8196, "wall": 9194.8} {"step": 1150, "train_loss": 4.714730262756348, "lr": 0.0003999770611776569, "tps": 8196, "wall": 9202.6} {"step": 1151, "train_loss": 4.75101375579834, "lr": 0.0003999767543137943, "tps": 8196, "wall": 9210.5} {"step": 1152, "train_loss": 4.754495143890381, "lr": 0.00039997644541114527, "tps": 8197, "wall": 9218.3} {"step": 1153, "train_loss": 4.7454376220703125, "lr": 0.0003999761344697134, "tps": 8197, "wall": 9226.2} {"step": 1154, "train_loss": 4.7841339111328125, "lr": 0.0003999758214895021, "tps": 8197, "wall": 9234.2} {"step": 1155, "train_loss": 4.770107269287109, "lr": 0.0003999755064705149, "tps": 8197, "wall": 9242.1} {"step": 1156, "train_loss": 4.76100492477417, "lr": 0.00039997518941275545, "tps": 8197, "wall": 9250.0} {"step": 1157, "train_loss": 4.7862420082092285, "lr": 0.00039997487031622733, "tps": 8197, "wall": 9258.0} {"step": 1158, "train_loss": 4.686400413513184, "lr": 0.00039997454918093417, "tps": 8197, "wall": 9265.9} {"step": 1159, "train_loss": 4.771719932556152, "lr": 0.00039997422600687954, "tps": 8197, "wall": 9273.9} {"step": 1160, "train_loss": 4.728001117706299, "lr": 0.0003999739007940672, "tps": 8197, "wall": 9281.6} {"step": 1161, "train_loss": 4.81715202331543, "lr": 0.00039997357354250074, "tps": 8197, "wall": 9289.6} {"step": 1162, "train_loss": 4.696300506591797, "lr": 0.00039997324425218383, "tps": 8197, "wall": 9297.3} {"step": 1163, "train_loss": 4.690386772155762, "lr": 0.00039997291292312036, "tps": 8197, "wall": 9305.2} {"step": 1164, "train_loss": 4.723413944244385, "lr": 0.00039997257955531396, "tps": 8197, "wall": 9313.2} {"step": 1165, "train_loss": 4.683060646057129, "lr": 0.00039997224414876843, "tps": 8198, "wall": 9321.1} {"step": 1166, "train_loss": 4.757824897766113, "lr": 0.0003999719067034877, "tps": 8198, "wall": 9328.9} {"step": 1167, "train_loss": 4.638425350189209, "lr": 0.0003999715672194754, "tps": 8198, "wall": 9336.8} {"step": 1168, "train_loss": 4.738912582397461, "lr": 0.00039997122569673533, "tps": 8198, "wall": 9344.7} {"step": 1169, "train_loss": 4.6077494621276855, "lr": 0.00039997088213527166, "tps": 8198, "wall": 9352.6} {"step": 1170, "train_loss": 4.812661170959473, "lr": 0.000399970536535088, "tps": 8198, "wall": 9360.4} {"step": 1171, "train_loss": 4.661199569702148, "lr": 0.00039997018889618844, "tps": 8198, "wall": 9368.4} {"step": 1172, "train_loss": 4.756358623504639, "lr": 0.00039996983921857676, "tps": 8198, "wall": 9376.3} {"step": 1173, "train_loss": 4.7665486335754395, "lr": 0.00039996948750225706, "tps": 8198, "wall": 9384.2} {"step": 1174, "train_loss": 4.729637145996094, "lr": 0.0003999691337472333, "tps": 8198, "wall": 9392.0} {"step": 1175, "train_loss": 4.756919860839844, "lr": 0.00039996877795350934, "tps": 8199, "wall": 9399.9} {"step": 1176, "train_loss": 4.695396423339844, "lr": 0.0003999684201210894, "tps": 8199, "wall": 9407.8} {"step": 1177, "train_loss": 4.724659442901611, "lr": 0.00039996806024997743, "tps": 8199, "wall": 9415.6} {"step": 1178, "train_loss": 4.706009864807129, "lr": 0.0003999676983401776, "tps": 8199, "wall": 9423.5} {"step": 1179, "train_loss": 4.64346981048584, "lr": 0.0003999673343916939, "tps": 8199, "wall": 9431.6} {"step": 1180, "train_loss": 4.717358112335205, "lr": 0.00039996696840453053, "tps": 8199, "wall": 9439.4} {"step": 1181, "train_loss": 4.6503400802612305, "lr": 0.00039996660037869156, "tps": 8199, "wall": 9447.2} {"step": 1182, "train_loss": 4.71332311630249, "lr": 0.00039996623031418127, "tps": 8199, "wall": 9455.1} {"step": 1183, "train_loss": 4.659783363342285, "lr": 0.00039996585821100374, "tps": 8199, "wall": 9462.9} {"step": 1184, "train_loss": 4.680459976196289, "lr": 0.00039996548406916324, "tps": 8199, "wall": 9470.9} {"step": 1185, "train_loss": 4.79026460647583, "lr": 0.000399965107888664, "tps": 8200, "wall": 9478.7} {"step": 1186, "train_loss": 4.704169273376465, "lr": 0.0003999647296695103, "tps": 8200, "wall": 9486.7} {"step": 1187, "train_loss": 4.551026344299316, "lr": 0.0003999643494117064, "tps": 8200, "wall": 9494.6} {"step": 1188, "train_loss": 4.840258598327637, "lr": 0.00039996396711525656, "tps": 8200, "wall": 9502.5} {"step": 1189, "train_loss": 4.752726078033447, "lr": 0.00039996358278016525, "tps": 8200, "wall": 9510.5} {"step": 1190, "train_loss": 4.670491695404053, "lr": 0.00039996319640643667, "tps": 8200, "wall": 9518.3} {"step": 1191, "train_loss": 4.655618667602539, "lr": 0.00039996280799407526, "tps": 8200, "wall": 9526.2} {"step": 1192, "train_loss": 4.629777431488037, "lr": 0.00039996241754308546, "tps": 8200, "wall": 9534.1} {"step": 1193, "train_loss": 4.701459884643555, "lr": 0.00039996202505347163, "tps": 8200, "wall": 9542.0} {"step": 1194, "train_loss": 4.69545841217041, "lr": 0.00039996163052523836, "tps": 8200, "wall": 9549.8} {"step": 1195, "train_loss": 4.817142009735107, "lr": 0.0003999612339583898, "tps": 8200, "wall": 9557.9} {"step": 1196, "train_loss": 4.762042045593262, "lr": 0.0003999608353529308, "tps": 8200, "wall": 9565.8} {"step": 1197, "train_loss": 4.671631813049316, "lr": 0.0003999604347088657, "tps": 8200, "wall": 9573.6} {"step": 1198, "train_loss": 4.804741859436035, "lr": 0.00039996003202619906, "tps": 8200, "wall": 9581.6} {"step": 1199, "train_loss": 4.73103141784668, "lr": 0.00039995962730493545, "tps": 8200, "wall": 9589.5} {"step": 1200, "train_loss": 4.807280540466309, "lr": 0.00039995922054507935, "tps": 8201, "wall": 9597.3} {"step": 1201, "train_loss": 4.633725643157959, "lr": 0.0003999588117466356, "tps": 8201, "wall": 9605.2} {"step": 1202, "train_loss": 4.719608306884766, "lr": 0.00039995840090960863, "tps": 8201, "wall": 9613.3} {"step": 1203, "train_loss": 4.732734680175781, "lr": 0.00039995798803400313, "tps": 8201, "wall": 9621.1} {"step": 1204, "train_loss": 4.773506164550781, "lr": 0.00039995757311982384, "tps": 8201, "wall": 9629.0} {"step": 1205, "train_loss": 4.679075241088867, "lr": 0.0003999571561670754, "tps": 8201, "wall": 9636.9} {"step": 1206, "train_loss": 4.688185691833496, "lr": 0.0003999567371757626, "tps": 8201, "wall": 9644.8} {"step": 1207, "train_loss": 4.774514675140381, "lr": 0.0003999563161458901, "tps": 8201, "wall": 9652.6} {"step": 1208, "train_loss": 4.667168140411377, "lr": 0.00039995589307746275, "tps": 8201, "wall": 9660.5} {"step": 1209, "train_loss": 4.632888317108154, "lr": 0.0003999554679704853, "tps": 8201, "wall": 9668.4} {"step": 1210, "train_loss": 4.65654993057251, "lr": 0.00039995504082496257, "tps": 8201, "wall": 9676.4} {"step": 1211, "train_loss": 4.634416103363037, "lr": 0.00039995461164089944, "tps": 8201, "wall": 9684.2} {"step": 1212, "train_loss": 4.649348735809326, "lr": 0.00039995418041830063, "tps": 8202, "wall": 9692.1} {"step": 1213, "train_loss": 4.698212146759033, "lr": 0.00039995374715717124, "tps": 8202, "wall": 9700.1} {"step": 1214, "train_loss": 4.654970645904541, "lr": 0.00039995331185751603, "tps": 8202, "wall": 9707.9} {"step": 1215, "train_loss": 4.644562721252441, "lr": 0.00039995287451933994, "tps": 8202, "wall": 9715.8} {"step": 1216, "train_loss": 4.73197603225708, "lr": 0.00039995243514264796, "tps": 8202, "wall": 9723.7} {"step": 1217, "train_loss": 4.783881664276123, "lr": 0.00039995199372744506, "tps": 8202, "wall": 9731.7} {"step": 1218, "train_loss": 4.654913902282715, "lr": 0.00039995155027373625, "tps": 8202, "wall": 9739.6} {"step": 1219, "train_loss": 4.686858177185059, "lr": 0.0003999511047815265, "tps": 8202, "wall": 9747.4} {"step": 1220, "train_loss": 4.658271789550781, "lr": 0.000399950657250821, "tps": 8202, "wall": 9755.2} {"step": 1221, "train_loss": 4.668768405914307, "lr": 0.00039995020768162466, "tps": 8202, "wall": 9763.0} {"step": 1222, "train_loss": 4.77125358581543, "lr": 0.00039994975607394263, "tps": 8203, "wall": 9770.9} {"step": 1223, "train_loss": 4.665433883666992, "lr": 0.00039994930242778, "tps": 8203, "wall": 9778.8} {"step": 1224, "train_loss": 4.702731132507324, "lr": 0.000399948846743142, "tps": 8203, "wall": 9786.7} {"step": 1225, "train_loss": 4.6964216232299805, "lr": 0.0003999483890200337, "tps": 8203, "wall": 9794.6} {"step": 1226, "train_loss": 4.647231101989746, "lr": 0.0003999479292584603, "tps": 8203, "wall": 9802.6} {"step": 1227, "train_loss": 4.897383213043213, "lr": 0.00039994746745842705, "tps": 8203, "wall": 9810.5} {"step": 1228, "train_loss": 4.626866817474365, "lr": 0.00039994700361993914, "tps": 8203, "wall": 9818.4} {"step": 1229, "train_loss": 4.657550811767578, "lr": 0.00039994653774300186, "tps": 8203, "wall": 9826.3} {"step": 1230, "train_loss": 4.634598255157471, "lr": 0.0003999460698276204, "tps": 8203, "wall": 9834.2} {"step": 1231, "train_loss": 4.637929916381836, "lr": 0.0003999455998738002, "tps": 8203, "wall": 9842.0} {"step": 1232, "train_loss": 4.558623790740967, "lr": 0.00039994512788154646, "tps": 8203, "wall": 9850.0} {"step": 1233, "train_loss": 4.664977550506592, "lr": 0.0003999446538508646, "tps": 8203, "wall": 9857.9} {"step": 1234, "train_loss": 4.633219242095947, "lr": 0.00039994417778175997, "tps": 8203, "wall": 9865.7} {"step": 1235, "train_loss": 4.692331314086914, "lr": 0.00039994369967423797, "tps": 8203, "wall": 9873.6} {"step": 1236, "train_loss": 4.728762626647949, "lr": 0.000399943219528304, "tps": 8204, "wall": 9881.4} {"step": 1237, "train_loss": 4.73136043548584, "lr": 0.0003999427373439635, "tps": 8204, "wall": 9889.3} {"step": 1238, "train_loss": 4.644661903381348, "lr": 0.00039994225312122187, "tps": 8204, "wall": 9897.2} {"step": 1239, "train_loss": 4.659997463226318, "lr": 0.0003999417668600848, "tps": 8204, "wall": 9905.1} {"step": 1240, "train_loss": 4.6398420333862305, "lr": 0.00039994127856055755, "tps": 8204, "wall": 9913.1} {"step": 1241, "train_loss": 4.622168064117432, "lr": 0.00039994078822264573, "tps": 8204, "wall": 9921.0} {"step": 1242, "train_loss": 4.694138526916504, "lr": 0.00039994029584635506, "tps": 8204, "wall": 9928.9} {"step": 1243, "train_loss": 4.690127372741699, "lr": 0.00039993980143169085, "tps": 8204, "wall": 9936.7} {"step": 1244, "train_loss": 4.670016765594482, "lr": 0.0003999393049786589, "tps": 8204, "wall": 9944.6} {"step": 1245, "train_loss": 4.816817760467529, "lr": 0.0003999388064872648, "tps": 8204, "wall": 9952.5} {"step": 1246, "train_loss": 4.778169631958008, "lr": 0.0003999383059575141, "tps": 8204, "wall": 9960.3} {"step": 1247, "train_loss": 4.7419843673706055, "lr": 0.0003999378033894126, "tps": 8204, "wall": 9968.2} {"step": 1248, "train_loss": 4.717869758605957, "lr": 0.0003999372987829659, "tps": 8204, "wall": 9976.2} {"step": 1249, "train_loss": 4.587336540222168, "lr": 0.00039993679213817974, "tps": 8205, "wall": 9984.1} {"step": 1250, "train_loss": 4.6892499923706055, "lr": 0.00039993628345505987, "tps": 8205, "wall": 9992.0} {"step": 1251, "train_loss": 4.689759731292725, "lr": 0.0003999357727336121, "tps": 8205, "wall": 9999.9} {"step": 1252, "train_loss": 4.613215446472168, "lr": 0.00039993525997384207, "tps": 8205, "wall": 10007.8} {"step": 1253, "train_loss": 4.622912406921387, "lr": 0.0003999347451757557, "tps": 8205, "wall": 10015.7} {"step": 1254, "train_loss": 4.65015983581543, "lr": 0.00039993422833935877, "tps": 8205, "wall": 10023.6} {"step": 1255, "train_loss": 4.59445333480835, "lr": 0.0003999337094646572, "tps": 8205, "wall": 10031.6} {"step": 1256, "train_loss": 4.6067986488342285, "lr": 0.00039993318855165687, "tps": 8205, "wall": 10039.5} {"step": 1257, "train_loss": 4.576318740844727, "lr": 0.0003999326656003637, "tps": 8205, "wall": 10047.4} {"step": 1258, "train_loss": 4.691201210021973, "lr": 0.00039993214061078347, "tps": 8205, "wall": 10055.3} {"step": 1259, "train_loss": 4.593299865722656, "lr": 0.0003999316135829222, "tps": 8205, "wall": 10063.1} {"step": 1260, "train_loss": 4.659182071685791, "lr": 0.00039993108451678595, "tps": 8205, "wall": 10071.0} {"step": 1261, "train_loss": 4.7067036628723145, "lr": 0.00039993055341238054, "tps": 8205, "wall": 10078.8} {"step": 1262, "train_loss": 4.594326972961426, "lr": 0.0003999300202697122, "tps": 8205, "wall": 10086.8} {"step": 1263, "train_loss": 4.591923236846924, "lr": 0.0003999294850887868, "tps": 8205, "wall": 10094.8} {"step": 1264, "train_loss": 4.577571392059326, "lr": 0.00039992894786961046, "tps": 8206, "wall": 10102.7} {"step": 1265, "train_loss": 4.633742332458496, "lr": 0.00039992840861218925, "tps": 8206, "wall": 10110.6} {"step": 1266, "train_loss": 4.6200385093688965, "lr": 0.0003999278673165293, "tps": 8206, "wall": 10118.5} {"step": 1267, "train_loss": 4.529497146606445, "lr": 0.00039992732398263673, "tps": 8206, "wall": 10126.5} {"step": 1268, "train_loss": 4.572568893432617, "lr": 0.0003999267786105178, "tps": 8206, "wall": 10134.4} {"step": 1269, "train_loss": 4.734988212585449, "lr": 0.00039992623120017846, "tps": 8206, "wall": 10142.4} {"step": 1270, "train_loss": 4.568746566772461, "lr": 0.0003999256817516251, "tps": 8206, "wall": 10150.2} {"step": 1271, "train_loss": 4.618176460266113, "lr": 0.0003999251302648638, "tps": 8206, "wall": 10158.4} {"step": 1272, "train_loss": 4.647491931915283, "lr": 0.00039992457673990097, "tps": 8206, "wall": 10166.2} {"step": 1273, "train_loss": 4.616684913635254, "lr": 0.00039992402117674283, "tps": 8206, "wall": 10174.1} {"step": 1274, "train_loss": 4.615680694580078, "lr": 0.00039992346357539557, "tps": 8206, "wall": 10182.1} {"step": 1275, "train_loss": 4.634770393371582, "lr": 0.0003999229039358656, "tps": 8206, "wall": 10190.0} {"step": 1276, "train_loss": 4.6517333984375, "lr": 0.00039992234225815924, "tps": 8206, "wall": 10197.8} {"step": 1277, "train_loss": 4.660839557647705, "lr": 0.00039992177854228286, "tps": 8206, "wall": 10205.7} {"step": 1278, "train_loss": 4.617219924926758, "lr": 0.00039992121278824283, "tps": 8206, "wall": 10213.8} {"step": 1279, "train_loss": 4.67158317565918, "lr": 0.0003999206449960456, "tps": 8206, "wall": 10221.6} {"step": 1280, "train_loss": 4.51252555847168, "lr": 0.00039992007516569757, "tps": 8206, "wall": 10229.5} {"step": 1281, "train_loss": 4.563910007476807, "lr": 0.00039991950329720517, "tps": 8206, "wall": 10237.3} {"step": 1282, "train_loss": 4.562044620513916, "lr": 0.00039991892939057495, "tps": 8207, "wall": 10245.2} {"step": 1283, "train_loss": 4.676471710205078, "lr": 0.0003999183534458133, "tps": 8207, "wall": 10253.1} {"step": 1284, "train_loss": 4.594236373901367, "lr": 0.00039991777546292685, "tps": 8207, "wall": 10261.1} {"step": 1285, "train_loss": 4.615555763244629, "lr": 0.0003999171954419221, "tps": 8207, "wall": 10269.0} {"step": 1286, "train_loss": 4.5979084968566895, "lr": 0.0003999166133828056, "tps": 8207, "wall": 10277.1} {"step": 1287, "train_loss": 4.5551228523254395, "lr": 0.000399916029285584, "tps": 8207, "wall": 10285.0} {"step": 1288, "train_loss": 4.630454063415527, "lr": 0.00039991544315026386, "tps": 8207, "wall": 10292.9} {"step": 1289, "train_loss": 4.667497634887695, "lr": 0.0003999148549768518, "tps": 8207, "wall": 10300.8} {"step": 1290, "train_loss": 4.622450828552246, "lr": 0.0003999142647653546, "tps": 8207, "wall": 10308.7} {"step": 1291, "train_loss": 4.615522861480713, "lr": 0.0003999136725157789, "tps": 8207, "wall": 10316.6} {"step": 1292, "train_loss": 4.63803243637085, "lr": 0.00039991307822813133, "tps": 8207, "wall": 10324.5} {"step": 1293, "train_loss": 4.609838485717773, "lr": 0.00039991248190241873, "tps": 8207, "wall": 10332.6} {"step": 1294, "train_loss": 4.570164680480957, "lr": 0.00039991188353864776, "tps": 8207, "wall": 10340.5} {"step": 1295, "train_loss": 4.600584983825684, "lr": 0.00039991128313682526, "tps": 8207, "wall": 10348.5} {"step": 1296, "train_loss": 4.613836288452148, "lr": 0.000399910680696958, "tps": 8207, "wall": 10356.3} {"step": 1297, "train_loss": 4.582393169403076, "lr": 0.00039991007621905284, "tps": 8207, "wall": 10364.2} {"step": 1298, "train_loss": 4.559587001800537, "lr": 0.0003999094697031165, "tps": 8207, "wall": 10372.2} {"step": 1299, "train_loss": 4.591813087463379, "lr": 0.0003999088611491561, "tps": 8207, "wall": 10380.1} {"step": 1300, "train_loss": 4.650841236114502, "lr": 0.00039990825055717834, "tps": 8207, "wall": 10387.9} {"step": 1301, "train_loss": 4.512392997741699, "lr": 0.00039990763792719015, "tps": 8207, "wall": 10396.0} {"step": 1302, "train_loss": 4.641554832458496, "lr": 0.00039990702325919857, "tps": 8207, "wall": 10403.9} {"step": 1303, "train_loss": 4.62892484664917, "lr": 0.0003999064065532104, "tps": 8207, "wall": 10411.7} {"step": 1304, "train_loss": 4.535024166107178, "lr": 0.00039990578780923277, "tps": 8207, "wall": 10419.7} {"step": 1305, "train_loss": 4.545868873596191, "lr": 0.00039990516702727264, "tps": 8208, "wall": 10427.6} {"step": 1306, "train_loss": 4.629889488220215, "lr": 0.0003999045442073371, "tps": 8208, "wall": 10435.4} {"step": 1307, "train_loss": 4.573093414306641, "lr": 0.00039990391934943307, "tps": 8208, "wall": 10443.3} {"step": 1308, "train_loss": 4.6078290939331055, "lr": 0.0003999032924535677, "tps": 8208, "wall": 10451.3} {"step": 1309, "train_loss": 4.617202281951904, "lr": 0.0003999026635197482, "tps": 8208, "wall": 10459.4} {"step": 1310, "train_loss": 4.539329528808594, "lr": 0.0003999020325479815, "tps": 8208, "wall": 10467.2} {"step": 1311, "train_loss": 4.575080871582031, "lr": 0.0003999013995382749, "tps": 8208, "wall": 10475.1} {"step": 1312, "train_loss": 4.5195512771606445, "lr": 0.0003999007644906355, "tps": 8208, "wall": 10483.1} {"step": 1313, "train_loss": 4.598353862762451, "lr": 0.0003999001274050705, "tps": 8208, "wall": 10491.2} {"step": 1314, "train_loss": 4.625001430511475, "lr": 0.0003998994882815871, "tps": 8208, "wall": 10499.0} {"step": 1315, "train_loss": 4.59637451171875, "lr": 0.0003998988471201926, "tps": 8208, "wall": 10506.9} {"step": 1316, "train_loss": 4.679962158203125, "lr": 0.0003998982039208942, "tps": 8208, "wall": 10514.9} {"step": 1317, "train_loss": 4.630194664001465, "lr": 0.00039989755868369926, "tps": 8208, "wall": 10522.7} {"step": 1318, "train_loss": 4.51894474029541, "lr": 0.00039989691140861504, "tps": 8208, "wall": 10530.6} {"step": 1319, "train_loss": 4.62994384765625, "lr": 0.00039989626209564885, "tps": 8208, "wall": 10538.6} {"step": 1320, "train_loss": 4.55045223236084, "lr": 0.00039989561074480807, "tps": 8208, "wall": 10546.6} {"step": 1321, "train_loss": 4.627624988555908, "lr": 0.0003998949573561, "tps": 8208, "wall": 10554.5} {"step": 1322, "train_loss": 4.630970478057861, "lr": 0.00039989430192953224, "tps": 8208, "wall": 10562.4} {"step": 1323, "train_loss": 4.497800827026367, "lr": 0.00039989364446511204, "tps": 8208, "wall": 10570.2} {"step": 1324, "train_loss": 4.632914066314697, "lr": 0.00039989298496284696, "tps": 8208, "wall": 10578.3} {"step": 1325, "train_loss": 4.579835414886475, "lr": 0.00039989232342274437, "tps": 8208, "wall": 10586.2} {"step": 1326, "train_loss": 4.537700653076172, "lr": 0.0003998916598448118, "tps": 8208, "wall": 10594.1} {"step": 1327, "train_loss": 4.525162220001221, "lr": 0.0003998909942290568, "tps": 8208, "wall": 10602.1} {"step": 1328, "train_loss": 4.727307319641113, "lr": 0.0003998903265754869, "tps": 8208, "wall": 10610.0} {"step": 1329, "train_loss": 4.524457931518555, "lr": 0.0003998896568841096, "tps": 8209, "wall": 10617.9} {"step": 1330, "train_loss": 4.5882134437561035, "lr": 0.00039988898515493256, "tps": 8209, "wall": 10625.9} {"step": 1331, "train_loss": 4.56532096862793, "lr": 0.0003998883113879633, "tps": 8209, "wall": 10633.9} {"step": 1332, "train_loss": 4.555336952209473, "lr": 0.0003998876355832096, "tps": 8209, "wall": 10641.9} {"step": 1333, "train_loss": 4.492532730102539, "lr": 0.00039988695774067904, "tps": 8209, "wall": 10649.8} {"step": 1334, "train_loss": 4.500787258148193, "lr": 0.00039988627786037925, "tps": 8209, "wall": 10657.7} {"step": 1335, "train_loss": 4.527832508087158, "lr": 0.000399885595942318, "tps": 8209, "wall": 10665.6} {"step": 1336, "train_loss": 4.576085567474365, "lr": 0.00039988491198650295, "tps": 8209, "wall": 10673.5} {"step": 1337, "train_loss": 4.47157096862793, "lr": 0.00039988422599294195, "tps": 8209, "wall": 10681.4} {"step": 1338, "train_loss": 4.608249664306641, "lr": 0.00039988353796164265, "tps": 8209, "wall": 10689.3} {"step": 1339, "train_loss": 4.419526100158691, "lr": 0.0003998828478926129, "tps": 8209, "wall": 10697.4} {"step": 1340, "train_loss": 4.618539333343506, "lr": 0.00039988215578586045, "tps": 8209, "wall": 10705.3} {"step": 1341, "train_loss": 4.608982563018799, "lr": 0.0003998814616413934, "tps": 8209, "wall": 10713.3} {"step": 1342, "train_loss": 4.685171604156494, "lr": 0.0003998807654592193, "tps": 8209, "wall": 10721.1} {"step": 1343, "train_loss": 4.499762058258057, "lr": 0.0003998800672393461, "tps": 8209, "wall": 10729.0} {"step": 1344, "train_loss": 4.520339488983154, "lr": 0.0003998793669817819, "tps": 8209, "wall": 10736.9} {"step": 1345, "train_loss": 4.5678935050964355, "lr": 0.00039987866468653443, "tps": 8209, "wall": 10744.8} {"step": 1346, "train_loss": 4.618645668029785, "lr": 0.00039987796035361166, "tps": 8209, "wall": 10752.9} {"step": 1347, "train_loss": 4.5087103843688965, "lr": 0.0003998772539830217, "tps": 8209, "wall": 10760.8} {"step": 1348, "train_loss": 4.628432750701904, "lr": 0.0003998765455747725, "tps": 8209, "wall": 10768.7} {"step": 1349, "train_loss": 4.475942134857178, "lr": 0.000399875835128872, "tps": 8209, "wall": 10776.5} {"step": 1350, "train_loss": 4.636872291564941, "lr": 0.00039987512264532836, "tps": 8209, "wall": 10784.4} {"step": 1351, "train_loss": 4.560041427612305, "lr": 0.0003998744081241495, "tps": 8209, "wall": 10792.4} {"step": 1352, "train_loss": 4.457737445831299, "lr": 0.0003998736915653437, "tps": 8209, "wall": 10800.3} {"step": 1353, "train_loss": 4.622546195983887, "lr": 0.00039987297296891904, "tps": 8210, "wall": 10808.2} {"step": 1354, "train_loss": 4.517186641693115, "lr": 0.0003998722523348835, "tps": 8210, "wall": 10816.2} {"step": 1355, "train_loss": 4.494877338409424, "lr": 0.00039987152966324544, "tps": 8210, "wall": 10824.2} {"step": 1356, "train_loss": 4.5018463134765625, "lr": 0.0003998708049540128, "tps": 8210, "wall": 10832.0} {"step": 1357, "train_loss": 4.457038402557373, "lr": 0.0003998700782071941, "tps": 8210, "wall": 10840.0} {"step": 1358, "train_loss": 4.5878448486328125, "lr": 0.00039986934942279746, "tps": 8210, "wall": 10847.8} {"step": 1359, "train_loss": 4.60910701751709, "lr": 0.000399868618600831, "tps": 8210, "wall": 10855.8} {"step": 1360, "train_loss": 4.542285442352295, "lr": 0.00039986788574130315, "tps": 8210, "wall": 10863.7} {"step": 1361, "train_loss": 4.529748439788818, "lr": 0.0003998671508442221, "tps": 8210, "wall": 10871.9} {"step": 1362, "train_loss": 4.547299385070801, "lr": 0.0003998664139095963, "tps": 8210, "wall": 10879.7} {"step": 1363, "train_loss": 4.495146751403809, "lr": 0.000399865674937434, "tps": 8210, "wall": 10887.5} {"step": 1364, "train_loss": 4.513406276702881, "lr": 0.00039986493392774367, "tps": 8210, "wall": 10895.5} {"step": 1365, "train_loss": 4.518949508666992, "lr": 0.00039986419088053354, "tps": 8210, "wall": 10903.4} {"step": 1366, "train_loss": 4.533870220184326, "lr": 0.00039986344579581213, "tps": 8210, "wall": 10911.2} {"step": 1367, "train_loss": 4.613901615142822, "lr": 0.0003998626986735879, "tps": 8210, "wall": 10919.1} {"step": 1368, "train_loss": 4.53813362121582, "lr": 0.00039986194951386933, "tps": 8210, "wall": 10927.0} {"step": 1369, "train_loss": 4.469614028930664, "lr": 0.00039986119831666485, "tps": 8210, "wall": 10935.0} {"step": 1370, "train_loss": 4.472394943237305, "lr": 0.00039986044508198297, "tps": 8210, "wall": 10942.9} {"step": 1371, "train_loss": 4.483421802520752, "lr": 0.00039985968980983216, "tps": 8210, "wall": 10950.8} {"step": 1372, "train_loss": 4.545148849487305, "lr": 0.00039985893250022114, "tps": 8210, "wall": 10958.7} {"step": 1373, "train_loss": 4.53466796875, "lr": 0.00039985817315315843, "tps": 8210, "wall": 10966.8} {"step": 1374, "train_loss": 4.522141456604004, "lr": 0.0003998574117686526, "tps": 8210, "wall": 10974.7} {"step": 1375, "train_loss": 4.462009906768799, "lr": 0.0003998566483467122, "tps": 8210, "wall": 10982.7} {"step": 1376, "train_loss": 4.498175144195557, "lr": 0.00039985588288734604, "tps": 8210, "wall": 10990.6} {"step": 1377, "train_loss": 4.501992702484131, "lr": 0.0003998551153905627, "tps": 8210, "wall": 10998.6} {"step": 1378, "train_loss": 4.4826836585998535, "lr": 0.0003998543458563708, "tps": 8210, "wall": 11006.6} {"step": 1379, "train_loss": 4.5459418296813965, "lr": 0.00039985357428477916, "tps": 8210, "wall": 11014.6} {"step": 1380, "train_loss": 4.543052673339844, "lr": 0.0003998528006757965, "tps": 8210, "wall": 11022.6} {"step": 1381, "train_loss": 4.509597301483154, "lr": 0.0003998520250294317, "tps": 8210, "wall": 11030.5} {"step": 1382, "train_loss": 4.515263080596924, "lr": 0.00039985124734569336, "tps": 8210, "wall": 11038.4} {"step": 1383, "train_loss": 4.440272808074951, "lr": 0.0003998504676245903, "tps": 8211, "wall": 11046.4} {"step": 1384, "train_loss": 4.539642333984375, "lr": 0.0003998496858661315, "tps": 8211, "wall": 11054.3} {"step": 1385, "train_loss": 4.560224533081055, "lr": 0.0003998489020703257, "tps": 8211, "wall": 11062.1} {"step": 1386, "train_loss": 4.614431381225586, "lr": 0.0003998481162371818, "tps": 8211, "wall": 11070.1} {"step": 1387, "train_loss": 4.462393760681152, "lr": 0.0003998473283667087, "tps": 8211, "wall": 11077.9} {"step": 1388, "train_loss": 4.621335983276367, "lr": 0.00039984653845891535, "tps": 8211, "wall": 11085.8} {"step": 1389, "train_loss": 4.517425537109375, "lr": 0.0003998457465138107, "tps": 8211, "wall": 11093.7} {"step": 1390, "train_loss": 4.573616027832031, "lr": 0.0003998449525314037, "tps": 8211, "wall": 11101.5} {"step": 1391, "train_loss": 4.508877754211426, "lr": 0.0003998441565117033, "tps": 8211, "wall": 11109.5} {"step": 1392, "train_loss": 4.476749420166016, "lr": 0.0003998433584547186, "tps": 8211, "wall": 11117.5} {"step": 1393, "train_loss": 4.534924507141113, "lr": 0.00039984255836045864, "tps": 8211, "wall": 11125.3} {"step": 1394, "train_loss": 4.490825176239014, "lr": 0.00039984175622893235, "tps": 8211, "wall": 11133.3} {"step": 1395, "train_loss": 4.4903998374938965, "lr": 0.000399840952060149, "tps": 8211, "wall": 11141.2} {"step": 1396, "train_loss": 4.507728099822998, "lr": 0.00039984014585411757, "tps": 8211, "wall": 11149.1} {"step": 1397, "train_loss": 4.478072643280029, "lr": 0.00039983933761084724, "tps": 8211, "wall": 11157.0} {"step": 1398, "train_loss": 4.494084358215332, "lr": 0.0003998385273303472, "tps": 8211, "wall": 11164.9} {"step": 1399, "train_loss": 4.5045552253723145, "lr": 0.00039983771501262664, "tps": 8211, "wall": 11172.9} {"step": 1400, "train_loss": 4.513916492462158, "lr": 0.0003998369006576946, "tps": 8211, "wall": 11180.8} {"step": 1401, "train_loss": 4.464971542358398, "lr": 0.0003998360842655605, "tps": 8211, "wall": 11188.7} {"step": 1402, "train_loss": 4.521989822387695, "lr": 0.0003998352658362335, "tps": 8212, "wall": 11196.5} {"step": 1403, "train_loss": 4.451214790344238, "lr": 0.0003998344453697228, "tps": 8212, "wall": 11204.4} {"step": 1404, "train_loss": 4.464422225952148, "lr": 0.0003998336228660379, "tps": 8212, "wall": 11212.3} {"step": 1405, "train_loss": 4.410032749176025, "lr": 0.0003998327983251879, "tps": 8212, "wall": 11220.0} {"step": 1406, "train_loss": 4.43341588973999, "lr": 0.00039983197174718225, "tps": 8212, "wall": 11228.0} {"step": 1407, "train_loss": 4.585686683654785, "lr": 0.00039983114313203033, "tps": 8212, "wall": 11236.0} {"step": 1408, "train_loss": 4.460929870605469, "lr": 0.00039983031247974146, "tps": 8212, "wall": 11243.9} {"step": 1409, "train_loss": 4.486190319061279, "lr": 0.0003998294797903251, "tps": 8212, "wall": 11251.8} {"step": 1410, "train_loss": 4.576257228851318, "lr": 0.00039982864506379065, "tps": 8212, "wall": 11259.7} {"step": 1411, "train_loss": 4.596654891967773, "lr": 0.0003998278083001476, "tps": 8212, "wall": 11267.5} {"step": 1412, "train_loss": 4.391627311706543, "lr": 0.0003998269694994054, "tps": 8212, "wall": 11275.3} {"step": 1413, "train_loss": 4.523165225982666, "lr": 0.0003998261286615735, "tps": 8212, "wall": 11283.2} {"step": 1414, "train_loss": 4.450710773468018, "lr": 0.00039982528578666156, "tps": 8213, "wall": 11291.0} {"step": 1415, "train_loss": 4.520599842071533, "lr": 0.000399824440874679, "tps": 8213, "wall": 11299.0} {"step": 1416, "train_loss": 4.488309860229492, "lr": 0.00039982359392563556, "tps": 8213, "wall": 11306.8} {"step": 1417, "train_loss": 4.559157371520996, "lr": 0.0003998227449395406, "tps": 8213, "wall": 11314.7} {"step": 1418, "train_loss": 4.454958438873291, "lr": 0.0003998218939164039, "tps": 8213, "wall": 11322.5} {"step": 1419, "train_loss": 4.461142539978027, "lr": 0.00039982104085623503, "tps": 8213, "wall": 11330.3} {"step": 1420, "train_loss": 4.487216472625732, "lr": 0.0003998201857590437, "tps": 8213, "wall": 11338.1} {"step": 1421, "train_loss": 4.474348068237305, "lr": 0.00039981932862483957, "tps": 8213, "wall": 11346.0} {"step": 1422, "train_loss": 4.4344563484191895, "lr": 0.0003998184694536324, "tps": 8213, "wall": 11353.9} {"step": 1423, "train_loss": 4.428739547729492, "lr": 0.00039981760824543184, "tps": 8213, "wall": 11361.7} {"step": 1424, "train_loss": 4.465841770172119, "lr": 0.0003998167450002477, "tps": 8213, "wall": 11369.6} {"step": 1425, "train_loss": 4.483972072601318, "lr": 0.00039981587971808975, "tps": 8214, "wall": 11377.4} {"step": 1426, "train_loss": 4.44539737701416, "lr": 0.0003998150123989678, "tps": 8214, "wall": 11385.2} {"step": 1427, "train_loss": 4.55517578125, "lr": 0.0003998141430428916, "tps": 8214, "wall": 11393.1} {"step": 1428, "train_loss": 4.430209636688232, "lr": 0.0003998132716498711, "tps": 8214, "wall": 11401.0} {"step": 1429, "train_loss": 4.597554683685303, "lr": 0.0003998123982199161, "tps": 8214, "wall": 11408.8} {"step": 1430, "train_loss": 4.435302257537842, "lr": 0.00039981152275303663, "tps": 8214, "wall": 11416.9} {"step": 1431, "train_loss": 4.534822463989258, "lr": 0.0003998106452492424, "tps": 8214, "wall": 11424.7} {"step": 1432, "train_loss": 4.549343585968018, "lr": 0.0003998097657085435, "tps": 8214, "wall": 11432.6} {"step": 1433, "train_loss": 4.464436054229736, "lr": 0.0003998088841309498, "tps": 8214, "wall": 11440.4} {"step": 1434, "train_loss": 4.497504234313965, "lr": 0.0003998080005164714, "tps": 8214, "wall": 11448.3} {"step": 1435, "train_loss": 4.490735054016113, "lr": 0.0003998071148651182, "tps": 8214, "wall": 11456.2} {"step": 1436, "train_loss": 4.422408580780029, "lr": 0.00039980622717690023, "tps": 8214, "wall": 11464.1} {"step": 1437, "train_loss": 4.452938079833984, "lr": 0.00039980533745182764, "tps": 8214, "wall": 11472.1} {"step": 1438, "train_loss": 4.410110950469971, "lr": 0.00039980444568991046, "tps": 8214, "wall": 11479.9} {"step": 1439, "train_loss": 4.412936210632324, "lr": 0.0003998035518911588, "tps": 8214, "wall": 11487.8} {"step": 1440, "train_loss": 4.299249172210693, "lr": 0.00039980265605558274, "tps": 8215, "wall": 11495.6} {"step": 1441, "train_loss": 4.430314540863037, "lr": 0.00039980175818319253, "tps": 8215, "wall": 11503.5} {"step": 1442, "train_loss": 4.431102275848389, "lr": 0.0003998008582739983, "tps": 8215, "wall": 11511.4} {"step": 1443, "train_loss": 4.360854625701904, "lr": 0.0003997999563280101, "tps": 8215, "wall": 11519.3} {"step": 1444, "train_loss": 4.4841742515563965, "lr": 0.00039979905234523833, "tps": 8215, "wall": 11527.1} {"step": 1445, "train_loss": 4.444150447845459, "lr": 0.00039979814632569314, "tps": 8215, "wall": 11535.1} {"step": 1446, "train_loss": 4.537737846374512, "lr": 0.0003997972382693849, "tps": 8215, "wall": 11543.0} {"step": 1447, "train_loss": 4.4780097007751465, "lr": 0.0003997963281763238, "tps": 8215, "wall": 11550.8} {"step": 1448, "train_loss": 4.3389739990234375, "lr": 0.0003997954160465201, "tps": 8215, "wall": 11558.6} {"step": 1449, "train_loss": 4.392765045166016, "lr": 0.0003997945018799842, "tps": 8215, "wall": 11566.6} {"step": 1450, "train_loss": 4.460565090179443, "lr": 0.0003997935856767265, "tps": 8215, "wall": 11574.4} {"step": 1451, "train_loss": 4.418766975402832, "lr": 0.00039979266743675733, "tps": 8215, "wall": 11582.2} {"step": 1452, "train_loss": 4.416629791259766, "lr": 0.0003997917471600871, "tps": 8215, "wall": 11590.1} {"step": 1453, "train_loss": 4.337268829345703, "lr": 0.0003997908248467262, "tps": 8215, "wall": 11598.1} {"step": 1454, "train_loss": 4.500454902648926, "lr": 0.00039978990049668514, "tps": 8216, "wall": 11605.9} {"step": 1455, "train_loss": 4.3884968757629395, "lr": 0.0003997889741099743, "tps": 8216, "wall": 11613.8} {"step": 1456, "train_loss": 4.439655780792236, "lr": 0.00039978804568660434, "tps": 8216, "wall": 11621.7} {"step": 1457, "train_loss": 4.509394645690918, "lr": 0.0003997871152265856, "tps": 8216, "wall": 11629.7} {"step": 1458, "train_loss": 4.498140335083008, "lr": 0.00039978618272992875, "tps": 8216, "wall": 11637.5} {"step": 1459, "train_loss": 4.500428676605225, "lr": 0.0003997852481966442, "tps": 8216, "wall": 11645.3} {"step": 1460, "train_loss": 4.405645847320557, "lr": 0.00039978431162674273, "tps": 8216, "wall": 11653.4} {"step": 1461, "train_loss": 4.518421173095703, "lr": 0.0003997833730202348, "tps": 8216, "wall": 11661.2} {"step": 1462, "train_loss": 4.393247604370117, "lr": 0.00039978243237713106, "tps": 8216, "wall": 11669.0} {"step": 1463, "train_loss": 4.437001705169678, "lr": 0.0003997814896974423, "tps": 8216, "wall": 11677.0} {"step": 1464, "train_loss": 4.486171245574951, "lr": 0.000399780544981179, "tps": 8216, "wall": 11684.9} {"step": 1465, "train_loss": 4.511774063110352, "lr": 0.00039977959822835206, "tps": 8216, "wall": 11692.7} {"step": 1466, "train_loss": 4.441953182220459, "lr": 0.00039977864943897205, "tps": 8216, "wall": 11700.6} {"step": 1467, "train_loss": 4.5688982009887695, "lr": 0.00039977769861304977, "tps": 8216, "wall": 11708.4} {"step": 1468, "train_loss": 4.401706218719482, "lr": 0.000399776745750596, "tps": 8216, "wall": 11716.3} {"step": 1469, "train_loss": 4.404959678649902, "lr": 0.00039977579085162155, "tps": 8216, "wall": 11724.2} {"step": 1470, "train_loss": 4.41892671585083, "lr": 0.0003997748339161372, "tps": 8217, "wall": 11732.1} {"step": 1471, "train_loss": 4.455246448516846, "lr": 0.00039977387494415377, "tps": 8217, "wall": 11739.9} {"step": 1472, "train_loss": 4.367446422576904, "lr": 0.0003997729139356822, "tps": 8217, "wall": 11747.8} {"step": 1473, "train_loss": 4.512764930725098, "lr": 0.0003997719508907333, "tps": 8217, "wall": 11755.7} {"step": 1474, "train_loss": 4.5297393798828125, "lr": 0.00039977098580931805, "tps": 8217, "wall": 11763.5} {"step": 1475, "train_loss": 4.380661487579346, "lr": 0.0003997700186914473, "tps": 8217, "wall": 11771.6} {"step": 1476, "train_loss": 4.393603324890137, "lr": 0.0003997690495371321, "tps": 8217, "wall": 11779.4} {"step": 1477, "train_loss": 4.514737606048584, "lr": 0.0003997680783463834, "tps": 8217, "wall": 11787.3} {"step": 1478, "train_loss": 4.4468793869018555, "lr": 0.00039976710511921215, "tps": 8217, "wall": 11795.1} {"step": 1479, "train_loss": 4.403871059417725, "lr": 0.00039976612985562936, "tps": 8217, "wall": 11802.9} {"step": 1480, "train_loss": 4.437618255615234, "lr": 0.0003997651525556462, "tps": 8217, "wall": 11810.8} {"step": 1481, "train_loss": 4.407041549682617, "lr": 0.0003997641732192736, "tps": 8217, "wall": 11818.7} {"step": 1482, "train_loss": 4.377017021179199, "lr": 0.0003997631918465228, "tps": 8218, "wall": 11826.4} {"step": 1483, "train_loss": 4.383193016052246, "lr": 0.0003997622084374048, "tps": 8218, "wall": 11834.4} {"step": 1484, "train_loss": 4.441775321960449, "lr": 0.0003997612229919308, "tps": 8218, "wall": 11842.4} {"step": 1485, "train_loss": 4.384314060211182, "lr": 0.00039976023551011194, "tps": 8218, "wall": 11850.2} {"step": 1486, "train_loss": 4.345935344696045, "lr": 0.00039975924599195935, "tps": 8218, "wall": 11858.1} {"step": 1487, "train_loss": 4.370238304138184, "lr": 0.0003997582544374843, "tps": 8218, "wall": 11865.9} {"step": 1488, "train_loss": 4.4065327644348145, "lr": 0.00039975726084669807, "tps": 8218, "wall": 11873.9} {"step": 1489, "train_loss": 4.442470073699951, "lr": 0.00039975626521961187, "tps": 8218, "wall": 11881.7} {"step": 1490, "train_loss": 4.467632293701172, "lr": 0.00039975526755623694, "tps": 8218, "wall": 11889.6} {"step": 1491, "train_loss": 4.3543381690979, "lr": 0.00039975426785658467, "tps": 8218, "wall": 11897.6} {"step": 1492, "train_loss": 4.444766998291016, "lr": 0.0003997532661206662, "tps": 8218, "wall": 11905.4} {"step": 1493, "train_loss": 4.327332019805908, "lr": 0.00039975226234849315, "tps": 8218, "wall": 11913.3} {"step": 1494, "train_loss": 4.457636833190918, "lr": 0.00039975125654007667, "tps": 8218, "wall": 11921.2} {"step": 1495, "train_loss": 4.345424175262451, "lr": 0.0003997502486954283, "tps": 8218, "wall": 11929.0} {"step": 1496, "train_loss": 4.392212867736816, "lr": 0.0003997492388145593, "tps": 8218, "wall": 11936.7} {"step": 1497, "train_loss": 4.4364752769470215, "lr": 0.0003997482268974813, "tps": 8219, "wall": 11944.5} {"step": 1498, "train_loss": 4.440369606018066, "lr": 0.0003997472129442055, "tps": 8219, "wall": 11952.5} {"step": 1499, "train_loss": 4.285851001739502, "lr": 0.00039974619695474367, "tps": 8219, "wall": 11960.5} {"step": 1500, "train_loss": 4.392758846282959, "lr": 0.00039974517892910717, "tps": 8219, "wall": 11968.3} {"step": 1501, "train_loss": 4.406935214996338, "lr": 0.00039974415886730755, "tps": 8219, "wall": 11976.2} {"step": 1502, "train_loss": 4.433352470397949, "lr": 0.0003997431367693564, "tps": 8219, "wall": 11984.1} {"step": 1503, "train_loss": 4.3941850662231445, "lr": 0.0003997421126352653, "tps": 8219, "wall": 11992.0} {"step": 1504, "train_loss": 4.289754390716553, "lr": 0.00039974108646504574, "tps": 8219, "wall": 11999.8} {"step": 1505, "train_loss": 4.248438835144043, "lr": 0.0003997400582587095, "tps": 8219, "wall": 12007.6} {"step": 1506, "train_loss": 4.3780598640441895, "lr": 0.0003997390280162681, "tps": 8219, "wall": 12015.6} {"step": 1507, "train_loss": 4.413748741149902, "lr": 0.0003997379957377333, "tps": 8219, "wall": 12023.4} {"step": 1508, "train_loss": 4.47637414932251, "lr": 0.0003997369614231168, "tps": 8219, "wall": 12031.4} {"step": 1509, "train_loss": 4.364847660064697, "lr": 0.00039973592507243025, "tps": 8219, "wall": 12039.2} {"step": 1510, "train_loss": 4.382769584655762, "lr": 0.00039973488668568533, "tps": 8219, "wall": 12047.1} {"step": 1511, "train_loss": 4.44349479675293, "lr": 0.000399733846262894, "tps": 8219, "wall": 12055.0} {"step": 1512, "train_loss": 4.5011372566223145, "lr": 0.0003997328038040679, "tps": 8219, "wall": 12063.0} {"step": 1513, "train_loss": 4.39810037612915, "lr": 0.00039973175930921887, "tps": 8219, "wall": 12070.8} {"step": 1514, "train_loss": 4.536872386932373, "lr": 0.00039973071277835874, "tps": 8219, "wall": 12078.9} {"step": 1515, "train_loss": 4.39614725112915, "lr": 0.00039972966421149937, "tps": 8219, "wall": 12086.8} {"step": 1516, "train_loss": 4.424501895904541, "lr": 0.0003997286136086527, "tps": 8220, "wall": 12094.6} {"step": 1517, "train_loss": 4.489660263061523, "lr": 0.0003997275609698305, "tps": 8220, "wall": 12102.6} {"step": 1518, "train_loss": 4.269589424133301, "lr": 0.0003997265062950447, "tps": 8220, "wall": 12110.4} {"step": 1519, "train_loss": 4.385365009307861, "lr": 0.00039972544958430747, "tps": 8220, "wall": 12118.3} {"step": 1520, "train_loss": 4.531612396240234, "lr": 0.00039972439083763055, "tps": 8220, "wall": 12126.2} {"step": 1521, "train_loss": 4.377907752990723, "lr": 0.00039972333005502606, "tps": 8220, "wall": 12134.2} {"step": 1522, "train_loss": 4.430678844451904, "lr": 0.00039972226723650585, "tps": 8220, "wall": 12142.0} {"step": 1523, "train_loss": 4.4110541343688965, "lr": 0.0003997212023820822, "tps": 8220, "wall": 12149.9} {"step": 1524, "train_loss": 4.368601322174072, "lr": 0.00039972013549176695, "tps": 8220, "wall": 12157.8} {"step": 1525, "train_loss": 4.321864128112793, "lr": 0.0003997190665655723, "tps": 8220, "wall": 12165.6} {"step": 1526, "train_loss": 4.400363445281982, "lr": 0.0003997179956035104, "tps": 8220, "wall": 12173.5} {"step": 1527, "train_loss": 4.4151811599731445, "lr": 0.00039971692260559326, "tps": 8220, "wall": 12181.4} {"step": 1528, "train_loss": 4.45591402053833, "lr": 0.00039971584757183317, "tps": 8220, "wall": 12189.2} {"step": 1529, "train_loss": 4.455726623535156, "lr": 0.00039971477050224216, "tps": 8220, "wall": 12197.2} {"step": 1530, "train_loss": 4.4321794509887695, "lr": 0.0003997136913968325, "tps": 8220, "wall": 12205.1} {"step": 1531, "train_loss": 4.385993957519531, "lr": 0.00039971261025561653, "tps": 8220, "wall": 12213.0} {"step": 1532, "train_loss": 4.458761692047119, "lr": 0.0003997115270786063, "tps": 8220, "wall": 12220.8} {"step": 1533, "train_loss": 4.3189496994018555, "lr": 0.00039971044186581424, "tps": 8221, "wall": 12228.7} {"step": 1534, "train_loss": 4.392651557922363, "lr": 0.0003997093546172525, "tps": 8221, "wall": 12236.5} {"step": 1535, "train_loss": 4.322317123413086, "lr": 0.0003997082653329335, "tps": 8221, "wall": 12244.3} {"step": 1536, "train_loss": 4.4159440994262695, "lr": 0.0003997071740128695, "tps": 8221, "wall": 12252.3} {"step": 1537, "train_loss": 4.400217533111572, "lr": 0.0003997060806570729, "tps": 8221, "wall": 12260.1} {"step": 1538, "train_loss": 4.373973846435547, "lr": 0.0003997049852655562, "tps": 8221, "wall": 12268.0} {"step": 1539, "train_loss": 4.360029220581055, "lr": 0.0003997038878383316, "tps": 8220, "wall": 12277.4} {"step": 1540, "train_loss": 4.349948883056641, "lr": 0.0003997027883754117, "tps": 8220, "wall": 12285.1} {"step": 1541, "train_loss": 4.437762260437012, "lr": 0.00039970168687680893, "tps": 8220, "wall": 12293.0} {"step": 1542, "train_loss": 4.414657115936279, "lr": 0.0003997005833425357, "tps": 8220, "wall": 12300.9} {"step": 1543, "train_loss": 4.346222877502441, "lr": 0.0003996994777726045, "tps": 8220, "wall": 12308.8} {"step": 1544, "train_loss": 4.378623008728027, "lr": 0.00039969837016702787, "tps": 8220, "wall": 12316.7} {"step": 1545, "train_loss": 4.394568920135498, "lr": 0.00039969726052581844, "tps": 8220, "wall": 12324.5} {"step": 1546, "train_loss": 4.452059268951416, "lr": 0.0003996961488489887, "tps": 8221, "wall": 12332.3} {"step": 1547, "train_loss": 4.37922477722168, "lr": 0.00039969503513655126, "tps": 8221, "wall": 12340.2} {"step": 1548, "train_loss": 4.445825576782227, "lr": 0.0003996939193885187, "tps": 8221, "wall": 12348.0} {"step": 1549, "train_loss": 4.439702987670898, "lr": 0.0003996928016049038, "tps": 8221, "wall": 12355.9} {"step": 1550, "train_loss": 4.446392059326172, "lr": 0.00039969168178571906, "tps": 8221, "wall": 12363.7} {"step": 1551, "train_loss": 4.389598846435547, "lr": 0.00039969055993097725, "tps": 8221, "wall": 12371.7} {"step": 1552, "train_loss": 4.454184532165527, "lr": 0.000399689436040691, "tps": 8221, "wall": 12379.5} {"step": 1553, "train_loss": 4.413010597229004, "lr": 0.00039968831011487317, "tps": 8221, "wall": 12387.3} {"step": 1554, "train_loss": 4.390768051147461, "lr": 0.0003996871821535364, "tps": 8221, "wall": 12395.2} {"step": 1555, "train_loss": 4.432257652282715, "lr": 0.0003996860521566935, "tps": 8221, "wall": 12403.1} {"step": 1556, "train_loss": 4.3524065017700195, "lr": 0.0003996849201243574, "tps": 8221, "wall": 12410.9} {"step": 1557, "train_loss": 4.371930122375488, "lr": 0.0003996837860565407, "tps": 8221, "wall": 12418.8} {"step": 1558, "train_loss": 4.493139743804932, "lr": 0.00039968264995325636, "tps": 8221, "wall": 12426.5} {"step": 1559, "train_loss": 4.331891059875488, "lr": 0.0003996815118145173, "tps": 8221, "wall": 12434.5} {"step": 1560, "train_loss": 4.346599102020264, "lr": 0.0003996803716403362, "tps": 8222, "wall": 12442.4} {"step": 1561, "train_loss": 4.362513065338135, "lr": 0.00039967922943072627, "tps": 8222, "wall": 12450.2} {"step": 1562, "train_loss": 4.304070949554443, "lr": 0.00039967808518570023, "tps": 8222, "wall": 12458.1} {"step": 1563, "train_loss": 4.429489612579346, "lr": 0.0003996769389052712, "tps": 8222, "wall": 12465.9} {"step": 1564, "train_loss": 4.461625099182129, "lr": 0.00039967579058945203, "tps": 8222, "wall": 12473.7} {"step": 1565, "train_loss": 4.286694049835205, "lr": 0.0003996746402382558, "tps": 8222, "wall": 12481.5} {"step": 1566, "train_loss": 4.401432037353516, "lr": 0.0003996734878516955, "tps": 8222, "wall": 12489.4} {"step": 1567, "train_loss": 4.425371170043945, "lr": 0.0003996723334297842, "tps": 8222, "wall": 12497.4} {"step": 1568, "train_loss": 4.404685974121094, "lr": 0.0003996711769725351, "tps": 8222, "wall": 12505.3} {"step": 1569, "train_loss": 4.3301239013671875, "lr": 0.000399670018479961, "tps": 8222, "wall": 12513.0} {"step": 1570, "train_loss": 4.396319389343262, "lr": 0.0003996688579520754, "tps": 8222, "wall": 12520.9} {"step": 1571, "train_loss": 4.400292873382568, "lr": 0.0003996676953888911, "tps": 8222, "wall": 12528.8} {"step": 1572, "train_loss": 4.454692363739014, "lr": 0.0003996665307904215, "tps": 8223, "wall": 12536.5} {"step": 1573, "train_loss": 4.403159141540527, "lr": 0.00039966536415667975, "tps": 8223, "wall": 12544.4} {"step": 1574, "train_loss": 4.45076322555542, "lr": 0.000399664195487679, "tps": 8223, "wall": 12552.4} {"step": 1575, "train_loss": 4.4366350173950195, "lr": 0.0003996630247834325, "tps": 8223, "wall": 12560.2} {"step": 1576, "train_loss": 4.421143054962158, "lr": 0.0003996618520439536, "tps": 8223, "wall": 12568.1} {"step": 1577, "train_loss": 4.360937595367432, "lr": 0.00039966067726925547, "tps": 8223, "wall": 12575.8} {"step": 1578, "train_loss": 4.34235954284668, "lr": 0.0003996595004593515, "tps": 8223, "wall": 12583.7} {"step": 1579, "train_loss": 4.397807598114014, "lr": 0.0003996583216142549, "tps": 8223, "wall": 12591.5} {"step": 1580, "train_loss": 4.38392448425293, "lr": 0.0003996571407339792, "tps": 8223, "wall": 12599.2} {"step": 1581, "train_loss": 4.364680290222168, "lr": 0.00039965595781853765, "tps": 8223, "wall": 12607.0} {"step": 1582, "train_loss": 4.4205474853515625, "lr": 0.0003996547728679437, "tps": 8223, "wall": 12615.0} {"step": 1583, "train_loss": 4.372150421142578, "lr": 0.0003996535858822108, "tps": 8223, "wall": 12622.8} {"step": 1584, "train_loss": 4.438732147216797, "lr": 0.0003996523968613524, "tps": 8223, "wall": 12630.7} {"step": 1585, "train_loss": 4.37103796005249, "lr": 0.00039965120580538185, "tps": 8224, "wall": 12638.6} {"step": 1586, "train_loss": 4.4727253913879395, "lr": 0.0003996500127143127, "tps": 8224, "wall": 12646.4} {"step": 1587, "train_loss": 4.356691360473633, "lr": 0.00039964881758815853, "tps": 8224, "wall": 12654.3} {"step": 1588, "train_loss": 4.369088649749756, "lr": 0.0003996476204269328, "tps": 8224, "wall": 12662.0} {"step": 1589, "train_loss": 4.461766242980957, "lr": 0.0003996464212306492, "tps": 8224, "wall": 12669.8} {"step": 1590, "train_loss": 4.519635200500488, "lr": 0.00039964521999932113, "tps": 8224, "wall": 12677.9} {"step": 1591, "train_loss": 4.3410844802856445, "lr": 0.0003996440167329623, "tps": 8224, "wall": 12685.7} {"step": 1592, "train_loss": 4.385713577270508, "lr": 0.00039964281143158633, "tps": 8224, "wall": 12693.5} {"step": 1593, "train_loss": 4.4057512283325195, "lr": 0.0003996416040952069, "tps": 8224, "wall": 12701.4} {"step": 1594, "train_loss": 4.3889946937561035, "lr": 0.0003996403947238377, "tps": 8224, "wall": 12709.2} {"step": 1595, "train_loss": 4.331186771392822, "lr": 0.0003996391833174923, "tps": 8224, "wall": 12717.1} {"step": 1596, "train_loss": 4.365958213806152, "lr": 0.00039963796987618457, "tps": 8224, "wall": 12725.0} {"step": 1597, "train_loss": 4.410674571990967, "lr": 0.00039963675439992814, "tps": 8224, "wall": 12732.9} {"step": 1598, "train_loss": 4.452185153961182, "lr": 0.00039963553688873694, "tps": 8224, "wall": 12740.8} {"step": 1599, "train_loss": 4.4350175857543945, "lr": 0.0003996343173426246, "tps": 8225, "wall": 12748.6} {"step": 1600, "train_loss": 4.370882987976074, "lr": 0.00039963309576160496, "tps": 8225, "wall": 12756.5} {"step": 1601, "train_loss": 4.433296203613281, "lr": 0.000399631872145692, "tps": 8225, "wall": 12764.3} {"step": 1602, "train_loss": 4.324623107910156, "lr": 0.0003996306464948994, "tps": 8225, "wall": 12772.3} {"step": 1603, "train_loss": 4.536214828491211, "lr": 0.0003996294188092411, "tps": 8225, "wall": 12780.1} {"step": 1604, "train_loss": 4.382420539855957, "lr": 0.00039962818908873107, "tps": 8225, "wall": 12788.0} {"step": 1605, "train_loss": 4.320723056793213, "lr": 0.0003996269573333831, "tps": 8225, "wall": 12796.0} {"step": 1606, "train_loss": 4.387574672698975, "lr": 0.00039962572354321137, "tps": 8225, "wall": 12803.7} {"step": 1607, "train_loss": 4.410020351409912, "lr": 0.0003996244877182297, "tps": 8225, "wall": 12811.5} {"step": 1608, "train_loss": 4.2790632247924805, "lr": 0.00039962324985845206, "tps": 8225, "wall": 12819.5} {"step": 1609, "train_loss": 4.437352657318115, "lr": 0.00039962200996389253, "tps": 8225, "wall": 12827.2} {"step": 1610, "train_loss": 4.309732913970947, "lr": 0.0003996207680345652, "tps": 8225, "wall": 12835.1} {"step": 1611, "train_loss": 4.337502479553223, "lr": 0.00039961952407048404, "tps": 8225, "wall": 12842.9} {"step": 1612, "train_loss": 4.4231791496276855, "lr": 0.00039961827807166327, "tps": 8225, "wall": 12850.7} {"step": 1613, "train_loss": 4.312328815460205, "lr": 0.00039961703003811686, "tps": 8225, "wall": 12858.7} {"step": 1614, "train_loss": 4.294538497924805, "lr": 0.0003996157799698591, "tps": 8226, "wall": 12866.4} {"step": 1615, "train_loss": 4.251206398010254, "lr": 0.00039961452786690396, "tps": 8226, "wall": 12874.2} {"step": 1616, "train_loss": 4.28125, "lr": 0.00039961327372926576, "tps": 8226, "wall": 12882.1} {"step": 1617, "train_loss": 4.399332523345947, "lr": 0.00039961201755695874, "tps": 8226, "wall": 12889.9} {"step": 1618, "train_loss": 4.361268997192383, "lr": 0.00039961075934999695, "tps": 8226, "wall": 12897.8} {"step": 1619, "train_loss": 4.464192867279053, "lr": 0.00039960949910839485, "tps": 8226, "wall": 12905.6} {"step": 1620, "train_loss": 4.312042236328125, "lr": 0.00039960823683216664, "tps": 8226, "wall": 12913.4} {"step": 1621, "train_loss": 4.327540397644043, "lr": 0.0003996069725213266, "tps": 8226, "wall": 12921.2} {"step": 1622, "train_loss": 4.323060035705566, "lr": 0.000399605706175889, "tps": 8226, "wall": 12929.0} {"step": 1623, "train_loss": 4.331927299499512, "lr": 0.00039960443779586837, "tps": 8226, "wall": 12936.9} {"step": 1624, "train_loss": 4.2773027420043945, "lr": 0.0003996031673812788, "tps": 8227, "wall": 12944.6} {"step": 1625, "train_loss": 4.344051837921143, "lr": 0.00039960189493213493, "tps": 8227, "wall": 12952.5} {"step": 1626, "train_loss": 4.432026386260986, "lr": 0.00039960062044845104, "tps": 8227, "wall": 12960.4} {"step": 1627, "train_loss": 4.406363010406494, "lr": 0.0003995993439302416, "tps": 8227, "wall": 12968.2} {"step": 1628, "train_loss": 4.399316787719727, "lr": 0.0003995980653775211, "tps": 8227, "wall": 12976.1} {"step": 1629, "train_loss": 4.266620635986328, "lr": 0.0003995967847903039, "tps": 8227, "wall": 12984.0} {"step": 1630, "train_loss": 4.366299152374268, "lr": 0.00039959550216860475, "tps": 8227, "wall": 12991.8} {"step": 1631, "train_loss": 4.380943298339844, "lr": 0.000399594217512438, "tps": 8227, "wall": 12999.5} {"step": 1632, "train_loss": 4.35617733001709, "lr": 0.00039959293082181827, "tps": 8227, "wall": 13007.3} {"step": 1633, "train_loss": 4.2943315505981445, "lr": 0.00039959164209676, "tps": 8227, "wall": 13015.1} {"step": 1634, "train_loss": 4.333253383636475, "lr": 0.00039959035133727797, "tps": 8227, "wall": 13022.9} {"step": 1635, "train_loss": 4.169354438781738, "lr": 0.00039958905854338666, "tps": 8228, "wall": 13030.7} {"step": 1636, "train_loss": 4.429441928863525, "lr": 0.00039958776371510084, "tps": 8227, "wall": 13038.7} {"step": 1637, "train_loss": 4.239395618438721, "lr": 0.0003995864668524351, "tps": 8228, "wall": 13046.4} {"step": 1638, "train_loss": 4.363236427307129, "lr": 0.0003995851679554042, "tps": 8228, "wall": 13054.4} {"step": 1639, "train_loss": 4.317258834838867, "lr": 0.0003995838670240227, "tps": 8228, "wall": 13062.2} {"step": 1640, "train_loss": 4.33726167678833, "lr": 0.0003995825640583055, "tps": 8228, "wall": 13069.9} {"step": 1641, "train_loss": 4.342668056488037, "lr": 0.0003995812590582672, "tps": 8228, "wall": 13077.8} {"step": 1642, "train_loss": 4.303609371185303, "lr": 0.00039957995202392275, "tps": 8228, "wall": 13085.6} {"step": 1643, "train_loss": 4.369996070861816, "lr": 0.000399578642955287, "tps": 8228, "wall": 13093.6} {"step": 1644, "train_loss": 4.4680399894714355, "lr": 0.00039957733185237455, "tps": 8228, "wall": 13101.5} {"step": 1645, "train_loss": 4.406850337982178, "lr": 0.0003995760187152004, "tps": 8228, "wall": 13109.4} {"step": 1646, "train_loss": 4.329588890075684, "lr": 0.00039957470354377937, "tps": 8228, "wall": 13117.2} {"step": 1647, "train_loss": 4.4019293785095215, "lr": 0.0003995733863381264, "tps": 8228, "wall": 13125.0} {"step": 1648, "train_loss": 4.370950222015381, "lr": 0.00039957206709825637, "tps": 8228, "wall": 13132.8} {"step": 1649, "train_loss": 4.44463586807251, "lr": 0.0003995707458241843, "tps": 8229, "wall": 13140.6} {"step": 1650, "train_loss": 4.452391624450684, "lr": 0.0003995694225159251, "tps": 8229, "wall": 13148.4} {"step": 1651, "train_loss": 4.363387107849121, "lr": 0.00039956809717349375, "tps": 8229, "wall": 13156.4} {"step": 1652, "train_loss": 4.418005466461182, "lr": 0.0003995667697969052, "tps": 8229, "wall": 13164.3} {"step": 1653, "train_loss": 4.355794429779053, "lr": 0.0003995654403861747, "tps": 8229, "wall": 13172.1} {"step": 1654, "train_loss": 4.354413986206055, "lr": 0.0003995641089413171, "tps": 8229, "wall": 13180.0} {"step": 1655, "train_loss": 4.2779388427734375, "lr": 0.0003995627754623476, "tps": 8229, "wall": 13187.8} {"step": 1656, "train_loss": 4.253943920135498, "lr": 0.00039956143994928126, "tps": 8229, "wall": 13195.6} {"step": 1657, "train_loss": 4.252686023712158, "lr": 0.0003995601024021332, "tps": 8229, "wall": 13203.5} {"step": 1658, "train_loss": 4.365013122558594, "lr": 0.00039955876282091857, "tps": 8229, "wall": 13211.3} {"step": 1659, "train_loss": 4.2375102043151855, "lr": 0.0003995574212056526, "tps": 8229, "wall": 13219.2} {"step": 1660, "train_loss": 4.386535167694092, "lr": 0.0003995560775563504, "tps": 8229, "wall": 13227.0} {"step": 1661, "train_loss": 4.392304420471191, "lr": 0.0003995547318730273, "tps": 8229, "wall": 13234.8} {"step": 1662, "train_loss": 4.386415004730225, "lr": 0.00039955338415569844, "tps": 8230, "wall": 13242.5} {"step": 1663, "train_loss": 4.337930202484131, "lr": 0.00039955203440437915, "tps": 8230, "wall": 13250.4} {"step": 1664, "train_loss": 4.4096198081970215, "lr": 0.00039955068261908467, "tps": 8230, "wall": 13258.2} {"step": 1665, "train_loss": 4.344628810882568, "lr": 0.0003995493287998303, "tps": 8230, "wall": 13266.1} {"step": 1666, "train_loss": 4.256573677062988, "lr": 0.00039954797294663156, "tps": 8230, "wall": 13273.9} {"step": 1667, "train_loss": 4.369065284729004, "lr": 0.00039954661505950357, "tps": 8230, "wall": 13281.7} {"step": 1668, "train_loss": 4.356021881103516, "lr": 0.0003995452551384619, "tps": 8230, "wall": 13289.5} {"step": 1669, "train_loss": 4.337020397186279, "lr": 0.00039954389318352175, "tps": 8230, "wall": 13297.3} {"step": 1670, "train_loss": 4.324562072753906, "lr": 0.00039954252919469877, "tps": 8230, "wall": 13305.2} {"step": 1671, "train_loss": 4.301239013671875, "lr": 0.0003995411631720082, "tps": 8230, "wall": 13313.1} {"step": 1672, "train_loss": 4.31462287902832, "lr": 0.0003995397951154657, "tps": 8230, "wall": 13320.8} {"step": 1673, "train_loss": 4.290858745574951, "lr": 0.0003995384250250867, "tps": 8230, "wall": 13328.6} {"step": 1674, "train_loss": 4.327287673950195, "lr": 0.0003995370529008866, "tps": 8231, "wall": 13336.4} {"step": 1675, "train_loss": 4.371038436889648, "lr": 0.00039953567874288114, "tps": 8231, "wall": 13344.3} {"step": 1676, "train_loss": 4.202077388763428, "lr": 0.00039953430255108575, "tps": 8231, "wall": 13352.1} {"step": 1677, "train_loss": 4.371878623962402, "lr": 0.0003995329243255161, "tps": 8231, "wall": 13359.9} {"step": 1678, "train_loss": 4.275742053985596, "lr": 0.0003995315440661878, "tps": 8231, "wall": 13367.7} {"step": 1679, "train_loss": 4.2530317306518555, "lr": 0.00039953016177311643, "tps": 8231, "wall": 13375.5} {"step": 1680, "train_loss": 4.323309898376465, "lr": 0.0003995287774463177, "tps": 8231, "wall": 13383.3} {"step": 1681, "train_loss": 4.318470001220703, "lr": 0.00039952739108580724, "tps": 8231, "wall": 13391.2} {"step": 1682, "train_loss": 4.330247402191162, "lr": 0.0003995260026916007, "tps": 8231, "wall": 13399.1} {"step": 1683, "train_loss": 4.218991756439209, "lr": 0.000399524612263714, "tps": 8231, "wall": 13406.9} {"step": 1684, "train_loss": 4.382482528686523, "lr": 0.00039952321980216273, "tps": 8231, "wall": 13414.7} {"step": 1685, "train_loss": 4.370102882385254, "lr": 0.00039952182530696276, "tps": 8231, "wall": 13422.5} {"step": 1686, "train_loss": 4.37052059173584, "lr": 0.0003995204287781298, "tps": 8232, "wall": 13430.3} {"step": 1687, "train_loss": 4.289381980895996, "lr": 0.00039951903021567977, "tps": 8232, "wall": 13438.0} {"step": 1688, "train_loss": 4.333766460418701, "lr": 0.0003995176296196284, "tps": 8232, "wall": 13445.8} {"step": 1689, "train_loss": 4.3545403480529785, "lr": 0.0003995162269899916, "tps": 8232, "wall": 13453.7} {"step": 1690, "train_loss": 4.3246870040893555, "lr": 0.0003995148223267853, "tps": 8232, "wall": 13461.5} {"step": 1691, "train_loss": 4.384580612182617, "lr": 0.0003995134156300254, "tps": 8232, "wall": 13469.3} {"step": 1692, "train_loss": 4.290839672088623, "lr": 0.0003995120068997278, "tps": 8232, "wall": 13477.0} {"step": 1693, "train_loss": 4.306334495544434, "lr": 0.00039951059613590843, "tps": 8232, "wall": 13484.8} {"step": 1694, "train_loss": 4.350961208343506, "lr": 0.0003995091833385833, "tps": 8232, "wall": 13492.6} {"step": 1695, "train_loss": 4.27387809753418, "lr": 0.0003995077685077685, "tps": 8233, "wall": 13500.3} {"step": 1696, "train_loss": 4.344853401184082, "lr": 0.00039950635164347995, "tps": 8233, "wall": 13508.1} {"step": 1697, "train_loss": 4.353573799133301, "lr": 0.00039950493274573375, "tps": 8233, "wall": 13516.0} {"step": 1698, "train_loss": 4.319220066070557, "lr": 0.000399503511814546, "tps": 8233, "wall": 13523.8} {"step": 1699, "train_loss": 4.319931507110596, "lr": 0.0003995020888499327, "tps": 8233, "wall": 13531.6} {"step": 1700, "train_loss": 4.268070220947266, "lr": 0.00039950066385191003, "tps": 8233, "wall": 13539.4} {"step": 1701, "train_loss": 4.389842987060547, "lr": 0.00039949923682049414, "tps": 8233, "wall": 13547.2} {"step": 1702, "train_loss": 4.328927993774414, "lr": 0.0003994978077557012, "tps": 8233, "wall": 13554.9} {"step": 1703, "train_loss": 4.454225540161133, "lr": 0.0003994963766575474, "tps": 8233, "wall": 13562.8} {"step": 1704, "train_loss": 4.301184177398682, "lr": 0.00039949494352604887, "tps": 8233, "wall": 13570.5} {"step": 1705, "train_loss": 4.324665546417236, "lr": 0.000399493508361222, "tps": 8233, "wall": 13578.4} {"step": 1706, "train_loss": 4.229001045227051, "lr": 0.00039949207116308285, "tps": 8234, "wall": 13586.2} {"step": 1707, "train_loss": 4.392392158508301, "lr": 0.00039949063193164786, "tps": 8234, "wall": 13594.0} {"step": 1708, "train_loss": 4.2571210861206055, "lr": 0.00039948919066693325, "tps": 8234, "wall": 13601.9} {"step": 1709, "train_loss": 4.403139114379883, "lr": 0.0003994877473689555, "tps": 8234, "wall": 13609.7} {"step": 1710, "train_loss": 4.368639945983887, "lr": 0.00039948630203773066, "tps": 8234, "wall": 13617.5} {"step": 1711, "train_loss": 4.380156517028809, "lr": 0.0003994848546732754, "tps": 8234, "wall": 13625.3} {"step": 1712, "train_loss": 4.3276543617248535, "lr": 0.00039948340527560595, "tps": 8234, "wall": 13633.1} {"step": 1713, "train_loss": 4.318974494934082, "lr": 0.0003994819538447388, "tps": 8234, "wall": 13640.9} {"step": 1714, "train_loss": 4.250965118408203, "lr": 0.00039948050038069035, "tps": 8234, "wall": 13648.7} {"step": 1715, "train_loss": 4.267594337463379, "lr": 0.00039947904488347704, "tps": 8234, "wall": 13656.5} {"step": 1716, "train_loss": 4.26502799987793, "lr": 0.0003994775873531155, "tps": 8234, "wall": 13664.3} {"step": 1717, "train_loss": 4.356215000152588, "lr": 0.00039947612778962205, "tps": 8235, "wall": 13672.1} {"step": 1718, "train_loss": 4.279736042022705, "lr": 0.00039947466619301344, "tps": 8235, "wall": 13680.0} {"step": 1719, "train_loss": 4.1749653816223145, "lr": 0.000399473202563306, "tps": 8235, "wall": 13687.7} {"step": 1720, "train_loss": 4.24863862991333, "lr": 0.00039947173690051634, "tps": 8235, "wall": 13695.6} {"step": 1721, "train_loss": 4.319100379943848, "lr": 0.0003994702692046613, "tps": 8235, "wall": 13703.3} {"step": 1722, "train_loss": 4.1915459632873535, "lr": 0.00039946879947575723, "tps": 8235, "wall": 13711.1} {"step": 1723, "train_loss": 4.422854423522949, "lr": 0.0003994673277138209, "tps": 8235, "wall": 13719.0} {"step": 1724, "train_loss": 4.179982662200928, "lr": 0.000399465853918869, "tps": 8235, "wall": 13726.7} {"step": 1725, "train_loss": 4.388463020324707, "lr": 0.0003994643780909182, "tps": 8235, "wall": 13734.5} {"step": 1726, "train_loss": 4.3172173500061035, "lr": 0.00039946290022998523, "tps": 8235, "wall": 13742.2} {"step": 1727, "train_loss": 4.371799468994141, "lr": 0.0003994614203360868, "tps": 8236, "wall": 13750.0} {"step": 1728, "train_loss": 4.266278266906738, "lr": 0.00039945993840923965, "tps": 8236, "wall": 13758.0} {"step": 1729, "train_loss": 4.273404598236084, "lr": 0.0003994584544494607, "tps": 8236, "wall": 13765.7} {"step": 1730, "train_loss": 4.365301132202148, "lr": 0.0003994569684567666, "tps": 8236, "wall": 13773.6} {"step": 1731, "train_loss": 4.267486095428467, "lr": 0.0003994554804311743, "tps": 8236, "wall": 13781.4} {"step": 1732, "train_loss": 4.384615421295166, "lr": 0.0003994539903727005, "tps": 8236, "wall": 13789.2} {"step": 1733, "train_loss": 4.313955307006836, "lr": 0.0003994524982813623, "tps": 8236, "wall": 13796.9} {"step": 1734, "train_loss": 4.311763286590576, "lr": 0.00039945100415717644, "tps": 8236, "wall": 13804.6} {"step": 1735, "train_loss": 4.300256729125977, "lr": 0.00039944950800015997, "tps": 8236, "wall": 13812.5} {"step": 1736, "train_loss": 4.313724040985107, "lr": 0.00039944800981032963, "tps": 8236, "wall": 13820.3} {"step": 1737, "train_loss": 4.290371417999268, "lr": 0.0003994465095877026, "tps": 8236, "wall": 13828.1} {"step": 1738, "train_loss": 4.286742210388184, "lr": 0.00039944500733229586, "tps": 8237, "wall": 13835.8} {"step": 1739, "train_loss": 4.3327250480651855, "lr": 0.0003994435030441263, "tps": 8237, "wall": 13843.6} {"step": 1740, "train_loss": 4.300056457519531, "lr": 0.0003994419967232111, "tps": 8237, "wall": 13851.3} {"step": 1741, "train_loss": 4.273721218109131, "lr": 0.0003994404883695672, "tps": 8237, "wall": 13859.2} {"step": 1742, "train_loss": 4.313580513000488, "lr": 0.00039943897798321173, "tps": 8237, "wall": 13867.7} {"step": 1743, "train_loss": 4.300393581390381, "lr": 0.0003994374655641618, "tps": 8237, "wall": 13875.6} {"step": 1744, "train_loss": 4.360512733459473, "lr": 0.0003994359511124346, "tps": 8237, "wall": 13883.3} {"step": 1745, "train_loss": 4.181862831115723, "lr": 0.00039943443462804725, "tps": 8237, "wall": 13891.2} {"step": 1746, "train_loss": 4.332045078277588, "lr": 0.0003994329161110169, "tps": 8237, "wall": 13898.9} {"step": 1747, "train_loss": 4.203501224517822, "lr": 0.0003994313955613607, "tps": 8237, "wall": 13906.6} {"step": 1748, "train_loss": 4.286258220672607, "lr": 0.000399429872979096, "tps": 8237, "wall": 13914.4} {"step": 1749, "train_loss": 4.266307830810547, "lr": 0.0003994283483642399, "tps": 8237, "wall": 13922.1} {"step": 1750, "train_loss": 4.266120433807373, "lr": 0.0003994268217168099, "tps": 8237, "wall": 13929.9} {"step": 1751, "train_loss": 4.271501064300537, "lr": 0.0003994252930368231, "tps": 8237, "wall": 13937.8} {"step": 1752, "train_loss": 4.335542678833008, "lr": 0.0003994237623242969, "tps": 8238, "wall": 13945.6} {"step": 1753, "train_loss": 4.4548492431640625, "lr": 0.0003994222295792486, "tps": 8238, "wall": 13953.4} {"step": 1754, "train_loss": 4.340343952178955, "lr": 0.0003994206948016956, "tps": 8238, "wall": 13961.1} {"step": 1755, "train_loss": 4.28239631652832, "lr": 0.0003994191579916552, "tps": 8238, "wall": 13968.9} {"step": 1756, "train_loss": 4.288127422332764, "lr": 0.00039941761914914493, "tps": 8238, "wall": 13976.6} {"step": 1757, "train_loss": 4.262441635131836, "lr": 0.00039941607827418215, "tps": 8238, "wall": 13984.4} {"step": 1758, "train_loss": 4.360592365264893, "lr": 0.0003994145353667843, "tps": 8238, "wall": 13992.3} {"step": 1759, "train_loss": 4.262928485870361, "lr": 0.00039941299042696893, "tps": 8238, "wall": 14000.1} {"step": 1760, "train_loss": 4.369897842407227, "lr": 0.00039941144345475346, "tps": 8238, "wall": 14007.8} {"step": 1761, "train_loss": 4.2184319496154785, "lr": 0.0003994098944501555, "tps": 8239, "wall": 14015.6} {"step": 1762, "train_loss": 4.2881622314453125, "lr": 0.0003994083434131925, "tps": 8239, "wall": 14023.3} {"step": 1763, "train_loss": 4.311666488647461, "lr": 0.0003994067903438821, "tps": 8239, "wall": 14031.1} {"step": 1764, "train_loss": 4.241363525390625, "lr": 0.0003994052352422418, "tps": 8239, "wall": 14038.9} {"step": 1765, "train_loss": 4.3177080154418945, "lr": 0.0003994036781082894, "tps": 8239, "wall": 14046.6} {"step": 1766, "train_loss": 4.295700550079346, "lr": 0.0003994021189420424, "tps": 8239, "wall": 14054.4} {"step": 1767, "train_loss": 4.267152786254883, "lr": 0.0003994005577435184, "tps": 8239, "wall": 14062.2} {"step": 1768, "train_loss": 4.343614101409912, "lr": 0.0003993989945127353, "tps": 8239, "wall": 14069.9} {"step": 1769, "train_loss": 4.296828746795654, "lr": 0.00039939742924971066, "tps": 8239, "wall": 14077.7} {"step": 1770, "train_loss": 4.156832218170166, "lr": 0.00039939586195446216, "tps": 8240, "wall": 14085.4} {"step": 1771, "train_loss": 4.209266662597656, "lr": 0.0003993942926270077, "tps": 8240, "wall": 14093.2} {"step": 1772, "train_loss": 4.349416255950928, "lr": 0.000399392721267365, "tps": 8240, "wall": 14101.0} {"step": 1773, "train_loss": 4.234566688537598, "lr": 0.00039939114787555184, "tps": 8240, "wall": 14108.7} {"step": 1774, "train_loss": 4.312314033508301, "lr": 0.000399389572451586, "tps": 8240, "wall": 14116.6} {"step": 1775, "train_loss": 4.214340686798096, "lr": 0.00039938799499548543, "tps": 8240, "wall": 14124.4} {"step": 1776, "train_loss": 4.272163391113281, "lr": 0.00039938641550726797, "tps": 8240, "wall": 14132.2} {"step": 1777, "train_loss": 4.278409004211426, "lr": 0.0003993848339869514, "tps": 8240, "wall": 14140.0} {"step": 1778, "train_loss": 4.241714954376221, "lr": 0.0003993832504345538, "tps": 8240, "wall": 14147.7} {"step": 1779, "train_loss": 4.152773857116699, "lr": 0.00039938166485009303, "tps": 8240, "wall": 14155.4} {"step": 1780, "train_loss": 4.333730697631836, "lr": 0.000399380077233587, "tps": 8241, "wall": 14163.2} {"step": 1781, "train_loss": 4.278159141540527, "lr": 0.0003993784875850538, "tps": 8241, "wall": 14170.9} {"step": 1782, "train_loss": 4.36543607711792, "lr": 0.0003993768959045114, "tps": 8241, "wall": 14178.8} {"step": 1783, "train_loss": 4.324662208557129, "lr": 0.00039937530219197776, "tps": 8241, "wall": 14186.6} {"step": 1784, "train_loss": 4.297322750091553, "lr": 0.00039937370644747106, "tps": 8241, "wall": 14194.4} {"step": 1785, "train_loss": 4.126680374145508, "lr": 0.0003993721086710093, "tps": 8241, "wall": 14202.2} {"step": 1786, "train_loss": 4.349955081939697, "lr": 0.00039937050886261054, "tps": 8241, "wall": 14209.9} {"step": 1787, "train_loss": 4.306846618652344, "lr": 0.000399368907022293, "tps": 8241, "wall": 14217.7} {"step": 1788, "train_loss": 4.369693756103516, "lr": 0.00039936730315007473, "tps": 8241, "wall": 14225.4} {"step": 1789, "train_loss": 4.25449275970459, "lr": 0.000399365697245974, "tps": 8241, "wall": 14233.2} {"step": 1790, "train_loss": 4.345077037811279, "lr": 0.0003993640893100089, "tps": 8241, "wall": 14241.1} {"step": 1791, "train_loss": 4.276242256164551, "lr": 0.0003993624793421977, "tps": 8242, "wall": 14248.8} {"step": 1792, "train_loss": 4.227108955383301, "lr": 0.00039936086734255864, "tps": 8242, "wall": 14256.5} {"step": 1793, "train_loss": 4.279947757720947, "lr": 0.00039935925331111005, "tps": 8242, "wall": 14264.1} {"step": 1794, "train_loss": 4.387248992919922, "lr": 0.00039935763724787006, "tps": 8242, "wall": 14271.9} {"step": 1795, "train_loss": 4.236542701721191, "lr": 0.000399356019152857, "tps": 8242, "wall": 14279.7} {"step": 1796, "train_loss": 4.253355979919434, "lr": 0.00039935439902608934, "tps": 8242, "wall": 14287.5} {"step": 1797, "train_loss": 4.168915271759033, "lr": 0.0003993527768675853, "tps": 8242, "wall": 14295.3} {"step": 1798, "train_loss": 4.2043914794921875, "lr": 0.0003993511526773633, "tps": 8242, "wall": 14303.0} {"step": 1799, "train_loss": 4.207451820373535, "lr": 0.0003993495264554418, "tps": 8243, "wall": 14310.7} {"step": 1800, "train_loss": 4.235585689544678, "lr": 0.0003993478982018391, "tps": 8243, "wall": 14318.5} {"step": 1801, "train_loss": 4.289872646331787, "lr": 0.00039934626791657366, "tps": 8243, "wall": 14326.3} {"step": 1802, "train_loss": 4.208775043487549, "lr": 0.0003993446355996641, "tps": 8243, "wall": 14334.1} {"step": 1803, "train_loss": 4.361788749694824, "lr": 0.00039934300125112873, "tps": 8243, "wall": 14341.8} {"step": 1804, "train_loss": 4.212436199188232, "lr": 0.0003993413648709862, "tps": 8243, "wall": 14349.5} {"step": 1805, "train_loss": 4.35902738571167, "lr": 0.00039933972645925497, "tps": 8243, "wall": 14357.4} {"step": 1806, "train_loss": 4.353546142578125, "lr": 0.0003993380860159536, "tps": 8243, "wall": 14365.1} {"step": 1807, "train_loss": 4.20766019821167, "lr": 0.00039933644354110074, "tps": 8243, "wall": 14372.9} {"step": 1808, "train_loss": 4.241876125335693, "lr": 0.00039933479903471485, "tps": 8244, "wall": 14380.6} {"step": 1809, "train_loss": 4.235961437225342, "lr": 0.0003993331524968147, "tps": 8244, "wall": 14388.4} {"step": 1810, "train_loss": 4.427000999450684, "lr": 0.0003993315039274189, "tps": 8244, "wall": 14396.2} {"step": 1811, "train_loss": 4.297969818115234, "lr": 0.0003993298533265461, "tps": 8244, "wall": 14403.9} {"step": 1812, "train_loss": 4.191615104675293, "lr": 0.00039932820069421505, "tps": 8244, "wall": 14411.9} {"step": 1813, "train_loss": 4.206923007965088, "lr": 0.00039932654603044447, "tps": 8244, "wall": 14419.6} {"step": 1814, "train_loss": 4.274007320404053, "lr": 0.000399324889335253, "tps": 8244, "wall": 14427.4} {"step": 1815, "train_loss": 4.329958915710449, "lr": 0.00039932323060865954, "tps": 8244, "wall": 14435.1} {"step": 1816, "train_loss": 4.328815460205078, "lr": 0.00039932156985068276, "tps": 8244, "wall": 14442.9} {"step": 1817, "train_loss": 4.328554630279541, "lr": 0.0003993199070613416, "tps": 8244, "wall": 14450.7} {"step": 1818, "train_loss": 4.234221935272217, "lr": 0.00039931824224065485, "tps": 8245, "wall": 14458.4} {"step": 1819, "train_loss": 4.3619914054870605, "lr": 0.0003993165753886413, "tps": 8245, "wall": 14466.2} {"step": 1820, "train_loss": 4.31520938873291, "lr": 0.00039931490650531987, "tps": 8245, "wall": 14474.1} {"step": 1821, "train_loss": 4.258465766906738, "lr": 0.0003993132355907095, "tps": 8245, "wall": 14481.9} {"step": 1822, "train_loss": 4.259907245635986, "lr": 0.0003993115626448291, "tps": 8245, "wall": 14489.6} {"step": 1823, "train_loss": 4.212600231170654, "lr": 0.00039930988766769763, "tps": 8245, "wall": 14497.5} {"step": 1824, "train_loss": 4.257474422454834, "lr": 0.000399308210659334, "tps": 8245, "wall": 14505.6} {"step": 1825, "train_loss": 4.302183628082275, "lr": 0.00039930653161975737, "tps": 8245, "wall": 14513.3} {"step": 1826, "train_loss": 4.216691970825195, "lr": 0.0003993048505489865, "tps": 8245, "wall": 14521.2} {"step": 1827, "train_loss": 4.181943416595459, "lr": 0.0003993031674470407, "tps": 8245, "wall": 14529.0} {"step": 1828, "train_loss": 4.262084484100342, "lr": 0.00039930148231393886, "tps": 8245, "wall": 14536.8} {"step": 1829, "train_loss": 4.2806925773620605, "lr": 0.0003992997951497002, "tps": 8245, "wall": 14544.6} {"step": 1830, "train_loss": 4.196146011352539, "lr": 0.0003992981059543437, "tps": 8245, "wall": 14552.3} {"step": 1831, "train_loss": 4.271555423736572, "lr": 0.0003992964147278885, "tps": 8245, "wall": 14560.1} {"step": 1832, "train_loss": 4.3527421951293945, "lr": 0.0003992947214703539, "tps": 8246, "wall": 14567.9} {"step": 1833, "train_loss": 4.336941242218018, "lr": 0.000399293026181759, "tps": 8246, "wall": 14575.7} {"step": 1834, "train_loss": 4.3032755851745605, "lr": 0.000399291328862123, "tps": 8246, "wall": 14583.5} {"step": 1835, "train_loss": 4.2916669845581055, "lr": 0.0003992896295114651, "tps": 8246, "wall": 14591.2} {"step": 1836, "train_loss": 4.259749889373779, "lr": 0.0003992879281298045, "tps": 8246, "wall": 14599.2} {"step": 1837, "train_loss": 4.291693687438965, "lr": 0.00039928622471716073, "tps": 8246, "wall": 14607.0} {"step": 1838, "train_loss": 4.238137722015381, "lr": 0.0003992845192735528, "tps": 8246, "wall": 14614.7} {"step": 1839, "train_loss": 4.182566165924072, "lr": 0.00039928281179900014, "tps": 8246, "wall": 14622.5} {"step": 1840, "train_loss": 4.3063812255859375, "lr": 0.00039928110229352204, "tps": 8246, "wall": 14630.3} {"step": 1841, "train_loss": 4.326638698577881, "lr": 0.00039927939075713796, "tps": 8246, "wall": 14638.0} {"step": 1842, "train_loss": 4.301968097686768, "lr": 0.0003992776771898673, "tps": 8246, "wall": 14645.7} {"step": 1843, "train_loss": 4.177729606628418, "lr": 0.00039927596159172935, "tps": 8246, "wall": 14653.7} {"step": 1844, "train_loss": 4.342338562011719, "lr": 0.0003992742439627436, "tps": 8247, "wall": 14661.5} {"step": 1845, "train_loss": 4.324954986572266, "lr": 0.00039927252430292957, "tps": 8247, "wall": 14669.3} {"step": 1846, "train_loss": 4.243705749511719, "lr": 0.00039927080261230666, "tps": 8247, "wall": 14677.1} {"step": 1847, "train_loss": 4.25351095199585, "lr": 0.00039926907889089436, "tps": 8247, "wall": 14684.9} {"step": 1848, "train_loss": 4.212452411651611, "lr": 0.0003992673531387123, "tps": 8247, "wall": 14692.7} {"step": 1849, "train_loss": 4.245655536651611, "lr": 0.0003992656253557799, "tps": 8247, "wall": 14700.4} {"step": 1850, "train_loss": 4.309330463409424, "lr": 0.0003992638955421168, "tps": 8247, "wall": 14708.2} {"step": 1851, "train_loss": 4.203622817993164, "lr": 0.0003992621636977427, "tps": 8247, "wall": 14716.1} {"step": 1852, "train_loss": 4.274515151977539, "lr": 0.00039926042982267704, "tps": 8247, "wall": 14723.9} {"step": 1853, "train_loss": 4.170333385467529, "lr": 0.0003992586939169395, "tps": 8247, "wall": 14731.7} {"step": 1854, "train_loss": 4.300251007080078, "lr": 0.0003992569559805498, "tps": 8247, "wall": 14739.4} {"step": 1855, "train_loss": 4.295590877532959, "lr": 0.00039925521601352765, "tps": 8248, "wall": 14747.2} {"step": 1856, "train_loss": 4.133167743682861, "lr": 0.00039925347401589264, "tps": 8248, "wall": 14755.0} {"step": 1857, "train_loss": 4.178982734680176, "lr": 0.0003992517299876646, "tps": 8248, "wall": 14762.9} {"step": 1858, "train_loss": 4.313704490661621, "lr": 0.0003992499839288633, "tps": 8248, "wall": 14770.6} {"step": 1859, "train_loss": 4.150111198425293, "lr": 0.00039924823583950845, "tps": 8248, "wall": 14778.5} {"step": 1860, "train_loss": 4.315151214599609, "lr": 0.0003992464857196199, "tps": 8248, "wall": 14786.2} {"step": 1861, "train_loss": 4.2477617263793945, "lr": 0.00039924473356921746, "tps": 8248, "wall": 14794.0} {"step": 1862, "train_loss": 4.230588436126709, "lr": 0.000399242979388321, "tps": 8248, "wall": 14801.7} {"step": 1863, "train_loss": 4.256988048553467, "lr": 0.0003992412231769504, "tps": 8248, "wall": 14809.5} {"step": 1864, "train_loss": 4.2403459548950195, "lr": 0.0003992394649351255, "tps": 8248, "wall": 14817.2} {"step": 1865, "train_loss": 4.153286457061768, "lr": 0.0003992377046628662, "tps": 8248, "wall": 14825.1} {"step": 1866, "train_loss": 4.179260730743408, "lr": 0.00039923594236019255, "tps": 8248, "wall": 14832.9} {"step": 1867, "train_loss": 4.296149253845215, "lr": 0.0003992341780271244, "tps": 8249, "wall": 14840.6} {"step": 1868, "train_loss": 4.178200721740723, "lr": 0.00039923241166368184, "tps": 8249, "wall": 14848.4} {"step": 1869, "train_loss": 4.293901443481445, "lr": 0.0003992306432698847, "tps": 8249, "wall": 14856.2} {"step": 1870, "train_loss": 4.241929531097412, "lr": 0.00039922887284575326, "tps": 8249, "wall": 14863.9} {"step": 1871, "train_loss": 4.172014236450195, "lr": 0.0003992271003913074, "tps": 8249, "wall": 14871.6} {"step": 1872, "train_loss": 4.181382179260254, "lr": 0.0003992253259065673, "tps": 8249, "wall": 14879.4} {"step": 1873, "train_loss": 4.134922504425049, "lr": 0.00039922354939155296, "tps": 8249, "wall": 14887.0} {"step": 1874, "train_loss": 4.3134541511535645, "lr": 0.0003992217708462846, "tps": 8249, "wall": 14894.9} {"step": 1875, "train_loss": 4.134208679199219, "lr": 0.0003992199902707823, "tps": 8249, "wall": 14902.7} {"step": 1876, "train_loss": 4.290909290313721, "lr": 0.0003992182076650662, "tps": 8250, "wall": 14910.4} {"step": 1877, "train_loss": 4.322070121765137, "lr": 0.00039921642302915666, "tps": 8250, "wall": 14918.1} {"step": 1878, "train_loss": 4.270356178283691, "lr": 0.0003992146363630737, "tps": 8250, "wall": 14925.9} {"step": 1879, "train_loss": 4.272197246551514, "lr": 0.0003992128476668377, "tps": 8250, "wall": 14933.7} {"step": 1880, "train_loss": 4.340170860290527, "lr": 0.0003992110569404688, "tps": 8250, "wall": 14941.4} {"step": 1881, "train_loss": 4.211117744445801, "lr": 0.0003992092641839874, "tps": 8250, "wall": 14949.2} {"step": 1882, "train_loss": 4.259397983551025, "lr": 0.00039920746939741373, "tps": 8250, "wall": 14957.0} {"step": 1883, "train_loss": 4.232878684997559, "lr": 0.0003992056725807682, "tps": 8250, "wall": 14964.9} {"step": 1884, "train_loss": 4.392290115356445, "lr": 0.0003992038737340711, "tps": 8250, "wall": 14972.5} {"step": 1885, "train_loss": 4.264921188354492, "lr": 0.00039920207285734275, "tps": 8250, "wall": 14980.2} {"step": 1886, "train_loss": 4.2690839767456055, "lr": 0.0003992002699506037, "tps": 8251, "wall": 14988.0} {"step": 1887, "train_loss": 4.30490779876709, "lr": 0.0003991984650138743, "tps": 8251, "wall": 14995.8} {"step": 1888, "train_loss": 4.242253303527832, "lr": 0.00039919665804717496, "tps": 8251, "wall": 15003.5} {"step": 1889, "train_loss": 4.239110946655273, "lr": 0.00039919484905052624, "tps": 8251, "wall": 15011.3} {"step": 1890, "train_loss": 4.183483123779297, "lr": 0.0003991930380239485, "tps": 8251, "wall": 15019.2} {"step": 1891, "train_loss": 4.256083965301514, "lr": 0.0003991912249674624, "tps": 8251, "wall": 15027.0} {"step": 1892, "train_loss": 4.250791549682617, "lr": 0.00039918940988108837, "tps": 8251, "wall": 15034.7} {"step": 1893, "train_loss": 4.2762932777404785, "lr": 0.000399187592764847, "tps": 8251, "wall": 15042.6} {"step": 1894, "train_loss": 4.252388954162598, "lr": 0.0003991857736187589, "tps": 8251, "wall": 15050.4} {"step": 1895, "train_loss": 4.353893280029297, "lr": 0.00039918395244284465, "tps": 8251, "wall": 15058.1} {"step": 1896, "train_loss": 4.215836524963379, "lr": 0.00039918212923712495, "tps": 8251, "wall": 15065.9} {"step": 1897, "train_loss": 4.173960208892822, "lr": 0.0003991803040016203, "tps": 8251, "wall": 15073.8} {"step": 1898, "train_loss": 4.346343040466309, "lr": 0.00039917847673635155, "tps": 8252, "wall": 15081.5} {"step": 1899, "train_loss": 4.260683059692383, "lr": 0.0003991766474413393, "tps": 8252, "wall": 15089.3} {"step": 1900, "train_loss": 4.126276016235352, "lr": 0.0003991748161166043, "tps": 8252, "wall": 15097.1} {"step": 1901, "train_loss": 4.214418888092041, "lr": 0.00039917298276216727, "tps": 8252, "wall": 15104.9} {"step": 1902, "train_loss": 4.304847240447998, "lr": 0.000399171147378049, "tps": 8252, "wall": 15112.7} {"step": 1903, "train_loss": 4.203917503356934, "lr": 0.0003991693099642703, "tps": 8252, "wall": 15120.5} {"step": 1904, "train_loss": 4.27485466003418, "lr": 0.00039916747052085196, "tps": 8252, "wall": 15128.3} {"step": 1905, "train_loss": 4.181604862213135, "lr": 0.0003991656290478148, "tps": 8252, "wall": 15136.2} {"step": 1906, "train_loss": 4.215717792510986, "lr": 0.0003991637855451797, "tps": 8252, "wall": 15144.0} {"step": 1907, "train_loss": 4.224186420440674, "lr": 0.00039916194001296757, "tps": 8252, "wall": 15151.8} {"step": 1908, "train_loss": 4.305672645568848, "lr": 0.0003991600924511993, "tps": 8252, "wall": 15159.5} {"step": 1909, "train_loss": 4.229226112365723, "lr": 0.0003991582428598958, "tps": 8252, "wall": 15167.3} {"step": 1910, "train_loss": 4.1029205322265625, "lr": 0.00039915639123907804, "tps": 8252, "wall": 15175.1} {"step": 1911, "train_loss": 4.196858882904053, "lr": 0.00039915453758876694, "tps": 8252, "wall": 15183.0} {"step": 1912, "train_loss": 4.276641845703125, "lr": 0.00039915268190898355, "tps": 8253, "wall": 15190.8} {"step": 1913, "train_loss": 4.20978307723999, "lr": 0.000399150824199749, "tps": 8253, "wall": 15198.6} {"step": 1914, "train_loss": 4.2507734298706055, "lr": 0.00039914896446108407, "tps": 8253, "wall": 15206.4} {"step": 1915, "train_loss": 4.143156051635742, "lr": 0.00039914710269301005, "tps": 8253, "wall": 15214.3} {"step": 1916, "train_loss": 4.219441890716553, "lr": 0.000399145238895548, "tps": 8253, "wall": 15222.1} {"step": 1917, "train_loss": 4.181357383728027, "lr": 0.0003991433730687189, "tps": 8253, "wall": 15230.0} {"step": 1918, "train_loss": 4.094117641448975, "lr": 0.000399141505212544, "tps": 8253, "wall": 15237.7} {"step": 1919, "train_loss": 4.20632791519165, "lr": 0.0003991396353270445, "tps": 8253, "wall": 15245.6} {"step": 1920, "train_loss": 4.225602149963379, "lr": 0.00039913776341224145, "tps": 8253, "wall": 15253.5} {"step": 1921, "train_loss": 4.255648612976074, "lr": 0.0003991358894681562, "tps": 8253, "wall": 15261.3} {"step": 1922, "train_loss": 4.236549377441406, "lr": 0.0003991340134948098, "tps": 8253, "wall": 15269.2} {"step": 1923, "train_loss": 4.161081790924072, "lr": 0.00039913213549222374, "tps": 8253, "wall": 15277.0} {"step": 1924, "train_loss": 4.081216335296631, "lr": 0.000399130255460419, "tps": 8253, "wall": 15284.9} {"step": 1925, "train_loss": 4.132081031799316, "lr": 0.0003991283733994172, "tps": 8253, "wall": 15292.7} {"step": 1926, "train_loss": 4.237725734710693, "lr": 0.0003991264893092394, "tps": 8253, "wall": 15300.5} {"step": 1927, "train_loss": 4.235710144042969, "lr": 0.00039912460318990704, "tps": 8253, "wall": 15308.4} {"step": 1928, "train_loss": 4.2365007400512695, "lr": 0.0003991227150414415, "tps": 8253, "wall": 15316.3} {"step": 1929, "train_loss": 4.253073692321777, "lr": 0.00039912082486386416, "tps": 8253, "wall": 15324.1} {"step": 1930, "train_loss": 4.19178581237793, "lr": 0.00039911893265719644, "tps": 8253, "wall": 15332.0} {"step": 1931, "train_loss": 4.149759292602539, "lr": 0.0003991170384214597, "tps": 8254, "wall": 15339.8} {"step": 1932, "train_loss": 4.236352443695068, "lr": 0.00039911514215667555, "tps": 8254, "wall": 15347.6} {"step": 1933, "train_loss": 4.321640491485596, "lr": 0.0003991132438628653, "tps": 8254, "wall": 15355.5} {"step": 1934, "train_loss": 4.269175052642822, "lr": 0.00039911134354005053, "tps": 8254, "wall": 15363.4} {"step": 1935, "train_loss": 4.236247539520264, "lr": 0.00039910944118825285, "tps": 8254, "wall": 15371.2} {"step": 1936, "train_loss": 4.273247241973877, "lr": 0.00039910753680749364, "tps": 8254, "wall": 15379.1} {"step": 1937, "train_loss": 4.256158351898193, "lr": 0.0003991056303977946, "tps": 8254, "wall": 15386.8} {"step": 1938, "train_loss": 4.263798236846924, "lr": 0.0003991037219591773, "tps": 8254, "wall": 15394.7} {"step": 1939, "train_loss": 4.276469707489014, "lr": 0.0003991018114916634, "tps": 8254, "wall": 15402.6} {"step": 1940, "train_loss": 4.131449222564697, "lr": 0.0003990998989952744, "tps": 8254, "wall": 15410.4} {"step": 1941, "train_loss": 4.184836387634277, "lr": 0.0003990979844700321, "tps": 8254, "wall": 15418.2} {"step": 1942, "train_loss": 4.194834232330322, "lr": 0.0003990960679159581, "tps": 8254, "wall": 15426.0} {"step": 1943, "train_loss": 4.152342319488525, "lr": 0.0003990941493330742, "tps": 8254, "wall": 15434.0} {"step": 1944, "train_loss": 4.150484561920166, "lr": 0.00039909222872140204, "tps": 8254, "wall": 15441.8} {"step": 1945, "train_loss": 4.206022262573242, "lr": 0.00039909030608096353, "tps": 8254, "wall": 15449.6} {"step": 1946, "train_loss": 4.1881914138793945, "lr": 0.0003990883814117802, "tps": 8254, "wall": 15457.5} {"step": 1947, "train_loss": 4.241501808166504, "lr": 0.0003990864547138741, "tps": 8254, "wall": 15465.3} {"step": 1948, "train_loss": 4.221035480499268, "lr": 0.0003990845259872669, "tps": 8254, "wall": 15473.2} {"step": 1949, "train_loss": 4.261132717132568, "lr": 0.0003990825952319805, "tps": 8254, "wall": 15481.0} {"step": 1950, "train_loss": 4.1850152015686035, "lr": 0.0003990806624480368, "tps": 8255, "wall": 15488.7} {"step": 1951, "train_loss": 4.250789642333984, "lr": 0.00039907872763545767, "tps": 8255, "wall": 15496.7} {"step": 1952, "train_loss": 4.107629299163818, "lr": 0.00039907679079426503, "tps": 8255, "wall": 15504.5} {"step": 1953, "train_loss": 4.172806739807129, "lr": 0.0003990748519244808, "tps": 8255, "wall": 15512.4} {"step": 1954, "train_loss": 4.1173858642578125, "lr": 0.000399072911026127, "tps": 8255, "wall": 15520.2} {"step": 1955, "train_loss": 4.146478176116943, "lr": 0.0003990709680992255, "tps": 8255, "wall": 15528.0} {"step": 1956, "train_loss": 4.169149398803711, "lr": 0.00039906902314379845, "tps": 8255, "wall": 15535.8} {"step": 1957, "train_loss": 4.226391315460205, "lr": 0.0003990670761598677, "tps": 8255, "wall": 15543.6} {"step": 1958, "train_loss": 4.184098243713379, "lr": 0.0003990651271474556, "tps": 8255, "wall": 15551.5} {"step": 1959, "train_loss": 4.180622100830078, "lr": 0.00039906317610658397, "tps": 8255, "wall": 15559.4} {"step": 1960, "train_loss": 4.189942836761475, "lr": 0.000399061223037275, "tps": 8255, "wall": 15567.2} {"step": 1961, "train_loss": 4.296084403991699, "lr": 0.0003990592679395508, "tps": 8255, "wall": 15575.0} {"step": 1962, "train_loss": 4.165223121643066, "lr": 0.0003990573108134335, "tps": 8255, "wall": 15582.8} {"step": 1963, "train_loss": 4.1560587882995605, "lr": 0.00039905535165894534, "tps": 8255, "wall": 15590.7} {"step": 1964, "train_loss": 4.1885175704956055, "lr": 0.00039905339047610844, "tps": 8255, "wall": 15598.5} {"step": 1965, "train_loss": 4.2100324630737305, "lr": 0.00039905142726494503, "tps": 8255, "wall": 15606.3} {"step": 1966, "train_loss": 4.192905902862549, "lr": 0.00039904946202547745, "tps": 8255, "wall": 15614.3} {"step": 1967, "train_loss": 4.090229034423828, "lr": 0.0003990474947577278, "tps": 8255, "wall": 15622.0} {"step": 1968, "train_loss": 4.149113178253174, "lr": 0.00039904552546171846, "tps": 8256, "wall": 15629.8} {"step": 1969, "train_loss": 4.099058151245117, "lr": 0.0003990435541374717, "tps": 8256, "wall": 15637.6} {"step": 1970, "train_loss": 4.274134159088135, "lr": 0.00039904158078500997, "tps": 8256, "wall": 15645.5} {"step": 1971, "train_loss": 4.130117416381836, "lr": 0.0003990396054043554, "tps": 8256, "wall": 15653.4} {"step": 1972, "train_loss": 4.291894435882568, "lr": 0.00039903762799553056, "tps": 8256, "wall": 15661.2} {"step": 1973, "train_loss": 4.177754878997803, "lr": 0.0003990356485585578, "tps": 8256, "wall": 15669.2} {"step": 1974, "train_loss": 4.202975273132324, "lr": 0.00039903366709345955, "tps": 8256, "wall": 15677.2} {"step": 1975, "train_loss": 4.1980366706848145, "lr": 0.00039903168360025816, "tps": 8256, "wall": 15685.0} {"step": 1976, "train_loss": 4.100544452667236, "lr": 0.0003990296980789762, "tps": 8256, "wall": 15692.8} {"step": 1977, "train_loss": 4.277813911437988, "lr": 0.00039902771052963614, "tps": 8256, "wall": 15700.6} {"step": 1978, "train_loss": 4.176630973815918, "lr": 0.0003990257209522605, "tps": 8256, "wall": 15708.5} {"step": 1979, "train_loss": 4.213395595550537, "lr": 0.0003990237293468717, "tps": 8256, "wall": 15716.3} {"step": 1980, "train_loss": 4.132573127746582, "lr": 0.0003990217357134925, "tps": 8256, "wall": 15724.1} {"step": 1981, "train_loss": 4.245491027832031, "lr": 0.0003990197400521454, "tps": 8256, "wall": 15732.1} {"step": 1982, "train_loss": 4.164012908935547, "lr": 0.000399017742362853, "tps": 8256, "wall": 15739.9} {"step": 1983, "train_loss": 4.159972190856934, "lr": 0.0003990157426456379, "tps": 8256, "wall": 15747.8} {"step": 1984, "train_loss": 4.1664018630981445, "lr": 0.0003990137409005229, "tps": 8256, "wall": 15755.6} {"step": 1985, "train_loss": 4.261380195617676, "lr": 0.0003990117371275304, "tps": 8256, "wall": 15763.5} {"step": 1986, "train_loss": 4.272646903991699, "lr": 0.0003990097313266833, "tps": 8256, "wall": 15771.4} {"step": 1987, "train_loss": 4.287563800811768, "lr": 0.00039900772349800434, "tps": 8256, "wall": 15779.2} {"step": 1988, "train_loss": 4.257627010345459, "lr": 0.0003990057136415162, "tps": 8256, "wall": 15787.0} {"step": 1989, "train_loss": 4.122962951660156, "lr": 0.00039900370175724155, "tps": 8256, "wall": 15794.7} {"step": 1990, "train_loss": 4.2148942947387695, "lr": 0.0003990016878452034, "tps": 8257, "wall": 15802.5} {"step": 1991, "train_loss": 4.168492317199707, "lr": 0.00039899967190542434, "tps": 8257, "wall": 15810.4} {"step": 1992, "train_loss": 4.244843006134033, "lr": 0.0003989976539379274, "tps": 8257, "wall": 15818.3} {"step": 1993, "train_loss": 4.172220706939697, "lr": 0.00039899563394273535, "tps": 8257, "wall": 15826.1} {"step": 1994, "train_loss": 4.1328020095825195, "lr": 0.00039899361191987105, "tps": 8257, "wall": 15833.9} {"step": 1995, "train_loss": 4.250286102294922, "lr": 0.0003989915878693574, "tps": 8257, "wall": 15841.7} {"step": 1996, "train_loss": 4.106930255889893, "lr": 0.0003989895617912174, "tps": 8257, "wall": 15849.6} {"step": 1997, "train_loss": 4.326920032501221, "lr": 0.0003989875336854739, "tps": 8257, "wall": 15857.5} {"step": 1998, "train_loss": 4.222195148468018, "lr": 0.00039898550355215, "tps": 8257, "wall": 15865.3} {"step": 1999, "train_loss": 4.2502970695495605, "lr": 0.0003989834713912687, "tps": 8257, "wall": 15873.2} {"step": 2000, "train_loss": 4.101815223693848, "lr": 0.00039898143720285277, "tps": 8257, "wall": 15881.0, "val_loss_monitor": 4.194191261104088} {"step": 2001, "train_loss": 4.149109840393066, "lr": 0.00039897940098692557, "tps": 8232, "wall": 15937.5} {"step": 2002, "train_loss": 4.124473571777344, "lr": 0.00039897736274350994, "tps": 8232, "wall": 15945.4} {"step": 2003, "train_loss": 4.228590965270996, "lr": 0.0003989753224726292, "tps": 8232, "wall": 15953.3} {"step": 2004, "train_loss": 4.132325172424316, "lr": 0.00039897328017430623, "tps": 8232, "wall": 15961.1} {"step": 2005, "train_loss": 4.274881362915039, "lr": 0.0003989712358485643, "tps": 8232, "wall": 15969.1} {"step": 2006, "train_loss": 4.256635665893555, "lr": 0.00039896918949542645, "tps": 8232, "wall": 15977.2} {"step": 2007, "train_loss": 4.224767684936523, "lr": 0.00039896714111491605, "tps": 8232, "wall": 15985.0} {"step": 2008, "train_loss": 4.156439781188965, "lr": 0.00039896509070705606, "tps": 8232, "wall": 15992.9} {"step": 2009, "train_loss": 4.132124423980713, "lr": 0.00039896303827186995, "tps": 8232, "wall": 16000.8} {"step": 2010, "train_loss": 4.210198879241943, "lr": 0.0003989609838093809, "tps": 8232, "wall": 16008.7} {"step": 2011, "train_loss": 4.028721809387207, "lr": 0.00039895892731961203, "tps": 8232, "wall": 16016.6} {"step": 2012, "train_loss": 4.22627067565918, "lr": 0.0003989568688025868, "tps": 8232, "wall": 16024.5} {"step": 2013, "train_loss": 4.178215026855469, "lr": 0.00039895480825832846, "tps": 8232, "wall": 16032.6} {"step": 2014, "train_loss": 4.100836277008057, "lr": 0.0003989527456868604, "tps": 8232, "wall": 16040.4} {"step": 2015, "train_loss": 4.068551540374756, "lr": 0.00039895068108820593, "tps": 8232, "wall": 16048.3} {"step": 2016, "train_loss": 4.126698970794678, "lr": 0.00039894861446238846, "tps": 8232, "wall": 16056.2} {"step": 2017, "train_loss": 4.09868049621582, "lr": 0.0003989465458094314, "tps": 8232, "wall": 16064.0} {"step": 2018, "train_loss": 4.173244953155518, "lr": 0.0003989444751293582, "tps": 8232, "wall": 16071.9} {"step": 2019, "train_loss": 4.215710639953613, "lr": 0.00039894240242219236, "tps": 8232, "wall": 16079.8} {"step": 2020, "train_loss": 4.293146133422852, "lr": 0.0003989403276879572, "tps": 8232, "wall": 16087.6} {"step": 2021, "train_loss": 4.175570487976074, "lr": 0.00039893825092667635, "tps": 8232, "wall": 16095.6} {"step": 2022, "train_loss": 4.287879943847656, "lr": 0.0003989361721383734, "tps": 8232, "wall": 16103.4} {"step": 2023, "train_loss": 4.145168304443359, "lr": 0.00039893409132307176, "tps": 8233, "wall": 16111.1} {"step": 2024, "train_loss": 4.189172744750977, "lr": 0.000398932008480795, "tps": 8233, "wall": 16119.1} {"step": 2025, "train_loss": 4.211763381958008, "lr": 0.00039892992361156685, "tps": 8233, "wall": 16126.8} {"step": 2026, "train_loss": 4.149174690246582, "lr": 0.0003989278367154108, "tps": 8233, "wall": 16134.7} {"step": 2027, "train_loss": 4.140087127685547, "lr": 0.0003989257477923505, "tps": 8233, "wall": 16142.5} {"step": 2028, "train_loss": 4.163764476776123, "lr": 0.00039892365684240976, "tps": 8233, "wall": 16150.2} {"step": 2029, "train_loss": 4.166100025177002, "lr": 0.0003989215638656121, "tps": 8233, "wall": 16158.2} {"step": 2030, "train_loss": 4.167536735534668, "lr": 0.0003989194688619812, "tps": 8233, "wall": 16166.0} {"step": 2031, "train_loss": 4.294244766235352, "lr": 0.0003989173718315411, "tps": 8233, "wall": 16173.9} {"step": 2032, "train_loss": 4.182240009307861, "lr": 0.0003989152727743151, "tps": 8233, "wall": 16181.6} {"step": 2033, "train_loss": 4.162364959716797, "lr": 0.0003989131716903273, "tps": 8233, "wall": 16189.4} {"step": 2034, "train_loss": 4.178505897521973, "lr": 0.0003989110685796014, "tps": 8233, "wall": 16197.2} {"step": 2035, "train_loss": 4.219072341918945, "lr": 0.00039890896344216124, "tps": 8233, "wall": 16205.0} {"step": 2036, "train_loss": 4.119536876678467, "lr": 0.0003989068562780307, "tps": 8234, "wall": 16212.8} {"step": 2037, "train_loss": 4.190798282623291, "lr": 0.00039890474708723355, "tps": 8234, "wall": 16220.5} {"step": 2038, "train_loss": 4.193461894989014, "lr": 0.0003989026358697938, "tps": 8234, "wall": 16228.2} {"step": 2039, "train_loss": 4.1887335777282715, "lr": 0.00039890052262573527, "tps": 8234, "wall": 16236.1} {"step": 2040, "train_loss": 4.22591495513916, "lr": 0.000398898407355082, "tps": 8234, "wall": 16243.8} {"step": 2041, "train_loss": 4.111476421356201, "lr": 0.00039889629005785787, "tps": 8234, "wall": 16251.7} {"step": 2042, "train_loss": 4.160743713378906, "lr": 0.0003988941707340868, "tps": 8234, "wall": 16259.5} {"step": 2043, "train_loss": 4.071552276611328, "lr": 0.000398892049383793, "tps": 8234, "wall": 16267.3} {"step": 2044, "train_loss": 4.223559379577637, "lr": 0.0003988899260070004, "tps": 8234, "wall": 16275.2} {"step": 2045, "train_loss": 4.176201343536377, "lr": 0.00039888780060373294, "tps": 8234, "wall": 16283.0} {"step": 2046, "train_loss": 4.13601016998291, "lr": 0.0003988856731740148, "tps": 8234, "wall": 16290.8} {"step": 2047, "train_loss": 4.122195720672607, "lr": 0.00039888354371787015, "tps": 8234, "wall": 16298.7} {"step": 2048, "train_loss": 4.206895351409912, "lr": 0.00039888141223532304, "tps": 8234, "wall": 16307.0} {"step": 2049, "train_loss": 4.182774543762207, "lr": 0.00039887927872639764, "tps": 8234, "wall": 16315.2} {"step": 2050, "train_loss": 4.297541618347168, "lr": 0.000398877143191118, "tps": 8234, "wall": 16323.5} {"step": 2051, "train_loss": 4.1685991287231445, "lr": 0.00039887500562950845, "tps": 8233, "wall": 16332.5} {"step": 2052, "train_loss": 4.157918930053711, "lr": 0.00039887286604159313, "tps": 8233, "wall": 16342.1} {"step": 2053, "train_loss": 4.220697402954102, "lr": 0.00039887072442739633, "tps": 8232, "wall": 16350.3} {"step": 2054, "train_loss": 4.173562526702881, "lr": 0.0003988685807869422, "tps": 8232, "wall": 16358.3} {"step": 2055, "train_loss": 4.2167792320251465, "lr": 0.0003988664351202553, "tps": 8232, "wall": 16366.1} {"step": 2056, "train_loss": 4.053380012512207, "lr": 0.0003988642874273596, "tps": 8233, "wall": 16374.0} {"step": 2057, "train_loss": 4.120952129364014, "lr": 0.00039886213770827967, "tps": 8232, "wall": 16382.1} {"step": 2058, "train_loss": 4.264501094818115, "lr": 0.00039885998596303967, "tps": 8232, "wall": 16390.2} {"step": 2059, "train_loss": 4.121362686157227, "lr": 0.0003988578321916641, "tps": 8232, "wall": 16398.2} {"step": 2060, "train_loss": 4.251139163970947, "lr": 0.00039885567639417736, "tps": 8232, "wall": 16406.1} {"step": 2061, "train_loss": 4.044054985046387, "lr": 0.00039885351857060384, "tps": 8232, "wall": 16414.2} {"step": 2062, "train_loss": 4.167842864990234, "lr": 0.000398851358720968, "tps": 8232, "wall": 16421.9} {"step": 2063, "train_loss": 4.204665660858154, "lr": 0.00039884919684529424, "tps": 8232, "wall": 16430.0} {"step": 2064, "train_loss": 4.094421863555908, "lr": 0.0003988470329436072, "tps": 8232, "wall": 16438.0} {"step": 2065, "train_loss": 4.217576026916504, "lr": 0.0003988448670159312, "tps": 8232, "wall": 16446.0} {"step": 2066, "train_loss": 4.206545829772949, "lr": 0.00039884269906229086, "tps": 8232, "wall": 16454.2} {"step": 2067, "train_loss": 4.251287937164307, "lr": 0.0003988405290827108, "tps": 8232, "wall": 16462.5} {"step": 2068, "train_loss": 4.131955146789551, "lr": 0.00039883835707721555, "tps": 8232, "wall": 16470.4} {"step": 2069, "train_loss": 4.215571403503418, "lr": 0.0003988361830458297, "tps": 8232, "wall": 16478.5} {"step": 2070, "train_loss": 4.260306358337402, "lr": 0.00039883400698857794, "tps": 8232, "wall": 16486.8} {"step": 2071, "train_loss": 4.131473064422607, "lr": 0.00039883182890548477, "tps": 8232, "wall": 16495.3} {"step": 2072, "train_loss": 4.190277576446533, "lr": 0.000398829648796575, "tps": 8231, "wall": 16503.5} {"step": 2073, "train_loss": 4.245358467102051, "lr": 0.0003988274666618734, "tps": 8231, "wall": 16511.7} {"step": 2074, "train_loss": 4.157098293304443, "lr": 0.0003988252825014045, "tps": 8231, "wall": 16519.6} {"step": 2075, "train_loss": 4.164256572723389, "lr": 0.00039882309631519315, "tps": 8232, "wall": 16527.3} {"step": 2076, "train_loss": 4.110271453857422, "lr": 0.00039882090810326406, "tps": 8232, "wall": 16535.2} {"step": 2077, "train_loss": 4.302127361297607, "lr": 0.0003988187178656421, "tps": 8231, "wall": 16543.3} {"step": 2078, "train_loss": 4.1703596115112305, "lr": 0.000398816525602352, "tps": 8231, "wall": 16551.5} {"step": 2079, "train_loss": 4.147554397583008, "lr": 0.00039881433131341864, "tps": 8231, "wall": 16559.7} {"step": 2080, "train_loss": 4.220151424407959, "lr": 0.0003988121349988668, "tps": 8231, "wall": 16567.6} {"step": 2081, "train_loss": 4.129532814025879, "lr": 0.0003988099366587214, "tps": 8231, "wall": 16576.1} {"step": 2082, "train_loss": 4.147375106811523, "lr": 0.00039880773629300746, "tps": 8231, "wall": 16584.0} {"step": 2083, "train_loss": 4.217823028564453, "lr": 0.0003988055339017498, "tps": 8231, "wall": 16591.8} {"step": 2084, "train_loss": 4.154336452484131, "lr": 0.00039880332948497336, "tps": 8231, "wall": 16599.5} {"step": 2085, "train_loss": 4.150912284851074, "lr": 0.00039880112304270315, "tps": 8231, "wall": 16607.3} {"step": 2086, "train_loss": 4.057307243347168, "lr": 0.00039879891457496406, "tps": 8231, "wall": 16615.1} {"step": 2087, "train_loss": 4.239006996154785, "lr": 0.00039879670408178125, "tps": 8231, "wall": 16622.9} {"step": 2088, "train_loss": 4.225438594818115, "lr": 0.0003987944915631797, "tps": 8231, "wall": 16630.8} {"step": 2089, "train_loss": 4.167706489562988, "lr": 0.00039879227701918453, "tps": 8231, "wall": 16638.9} {"step": 2090, "train_loss": 4.147353172302246, "lr": 0.0003987900604498207, "tps": 8231, "wall": 16646.8} {"step": 2091, "train_loss": 4.267417907714844, "lr": 0.00039878784185511345, "tps": 8232, "wall": 16654.7} {"step": 2092, "train_loss": 4.142530918121338, "lr": 0.0003987856212350878, "tps": 8232, "wall": 16662.6} {"step": 2093, "train_loss": 4.18541145324707, "lr": 0.000398783398589769, "tps": 8232, "wall": 16670.4} {"step": 2094, "train_loss": 4.238128185272217, "lr": 0.0003987811739191822, "tps": 8232, "wall": 16678.2} {"step": 2095, "train_loss": 4.151575565338135, "lr": 0.00039877894722335257, "tps": 8232, "wall": 16685.9} {"step": 2096, "train_loss": 4.150160789489746, "lr": 0.00039877671850230533, "tps": 8232, "wall": 16693.8} {"step": 2097, "train_loss": 4.2440948486328125, "lr": 0.00039877448775606575, "tps": 8232, "wall": 16701.8} {"step": 2098, "train_loss": 4.080045223236084, "lr": 0.00039877225498465913, "tps": 8232, "wall": 16709.8} {"step": 2099, "train_loss": 4.143349647521973, "lr": 0.00039877002018811074, "tps": 8232, "wall": 16717.5} {"step": 2100, "train_loss": 4.148801326751709, "lr": 0.0003987677833664459, "tps": 8232, "wall": 16725.4} {"step": 2101, "train_loss": 4.1677422523498535, "lr": 0.00039876554451968984, "tps": 8232, "wall": 16733.2} {"step": 2102, "train_loss": 4.15775728225708, "lr": 0.00039876330364786814, "tps": 8232, "wall": 16741.1} {"step": 2103, "train_loss": 4.131258964538574, "lr": 0.000398761060751006, "tps": 8232, "wall": 16749.0} {"step": 2104, "train_loss": 4.18812894821167, "lr": 0.00039875881582912895, "tps": 8232, "wall": 16757.0} {"step": 2105, "train_loss": 4.139420509338379, "lr": 0.00039875656888226226, "tps": 8232, "wall": 16764.8} {"step": 2106, "train_loss": 4.059701919555664, "lr": 0.0003987543199104316, "tps": 8232, "wall": 16772.6} {"step": 2107, "train_loss": 4.076533317565918, "lr": 0.0003987520689136623, "tps": 8232, "wall": 16780.5} {"step": 2108, "train_loss": 4.195845603942871, "lr": 0.0003987498158919799, "tps": 8232, "wall": 16788.5} {"step": 2109, "train_loss": 4.183465480804443, "lr": 0.00039874756084540985, "tps": 8232, "wall": 16796.3} {"step": 2110, "train_loss": 4.093130111694336, "lr": 0.0003987453037739778, "tps": 8232, "wall": 16804.1} {"step": 2111, "train_loss": 4.162564277648926, "lr": 0.0003987430446777093, "tps": 8232, "wall": 16812.0} {"step": 2112, "train_loss": 4.186951160430908, "lr": 0.0003987407835566299, "tps": 8233, "wall": 16819.8} {"step": 2113, "train_loss": 4.105319023132324, "lr": 0.0003987385204107652, "tps": 8233, "wall": 16827.5} {"step": 2114, "train_loss": 4.210760593414307, "lr": 0.00039873625524014094, "tps": 8233, "wall": 16835.3} {"step": 2115, "train_loss": 4.08756160736084, "lr": 0.0003987339880447827, "tps": 8233, "wall": 16843.2} {"step": 2116, "train_loss": 4.1487579345703125, "lr": 0.00039873171882471616, "tps": 8233, "wall": 16851.0} {"step": 2117, "train_loss": 4.295212745666504, "lr": 0.000398729447579967, "tps": 8233, "wall": 16858.9} {"step": 2118, "train_loss": 4.097927093505859, "lr": 0.00039872717431056103, "tps": 8233, "wall": 16866.6} {"step": 2119, "train_loss": 4.178301811218262, "lr": 0.00039872489901652397, "tps": 8233, "wall": 16874.5} {"step": 2120, "train_loss": 4.164144515991211, "lr": 0.00039872262169788155, "tps": 8233, "wall": 16882.3} {"step": 2121, "train_loss": 4.039958477020264, "lr": 0.0003987203423546596, "tps": 8233, "wall": 16890.0} {"step": 2122, "train_loss": 4.1389265060424805, "lr": 0.000398718060986884, "tps": 8233, "wall": 16898.0} {"step": 2123, "train_loss": 4.132968425750732, "lr": 0.0003987157775945805, "tps": 8233, "wall": 16906.1} {"step": 2124, "train_loss": 4.152246475219727, "lr": 0.000398713492177775, "tps": 8233, "wall": 16913.9} {"step": 2125, "train_loss": 4.150088787078857, "lr": 0.00039871120473649344, "tps": 8233, "wall": 16922.9} {"step": 2126, "train_loss": 4.141258716583252, "lr": 0.00039870891527076164, "tps": 8233, "wall": 16931.1} {"step": 2127, "train_loss": 4.174232482910156, "lr": 0.0003987066237806056, "tps": 8232, "wall": 16939.4} {"step": 2128, "train_loss": 4.125637531280518, "lr": 0.0003987043302660512, "tps": 8232, "wall": 16947.2} {"step": 2129, "train_loss": 4.201503276824951, "lr": 0.0003987020347271245, "tps": 8233, "wall": 16955.0} {"step": 2130, "train_loss": 4.1935811042785645, "lr": 0.0003986997371638515, "tps": 8233, "wall": 16962.8} {"step": 2131, "train_loss": 4.153715133666992, "lr": 0.0003986974375762582, "tps": 8233, "wall": 16970.9} {"step": 2132, "train_loss": 4.044655799865723, "lr": 0.0003986951359643707, "tps": 8233, "wall": 16978.6} {"step": 2133, "train_loss": 4.139624118804932, "lr": 0.000398692832328215, "tps": 8233, "wall": 16986.5} {"step": 2134, "train_loss": 4.153742790222168, "lr": 0.00039869052666781726, "tps": 8233, "wall": 16994.4} {"step": 2135, "train_loss": 4.136318683624268, "lr": 0.00039868821898320355, "tps": 8233, "wall": 17002.2} {"step": 2136, "train_loss": 4.255443572998047, "lr": 0.0003986859092744, "tps": 8233, "wall": 17010.0} {"step": 2137, "train_loss": 4.245987415313721, "lr": 0.00039868359754143283, "tps": 8233, "wall": 17017.9} {"step": 2138, "train_loss": 4.202544212341309, "lr": 0.0003986812837843282, "tps": 8233, "wall": 17026.1} {"step": 2139, "train_loss": 4.090260982513428, "lr": 0.0003986789680031123, "tps": 8233, "wall": 17034.3} {"step": 2140, "train_loss": 4.060917377471924, "lr": 0.0003986766501978114, "tps": 8233, "wall": 17042.6} {"step": 2141, "train_loss": 4.122195243835449, "lr": 0.0003986743303684517, "tps": 8232, "wall": 17051.0} {"step": 2142, "train_loss": 4.098852634429932, "lr": 0.00039867200851505957, "tps": 8232, "wall": 17059.1} {"step": 2143, "train_loss": 4.213517665863037, "lr": 0.0003986696846376612, "tps": 8232, "wall": 17066.9} {"step": 2144, "train_loss": 4.133699417114258, "lr": 0.0003986673587362831, "tps": 8232, "wall": 17074.8} {"step": 2145, "train_loss": 4.1883440017700195, "lr": 0.00039866503081095137, "tps": 8232, "wall": 17082.7} {"step": 2146, "train_loss": 4.297508716583252, "lr": 0.00039866270086169256, "tps": 8232, "wall": 17090.9} {"step": 2147, "train_loss": 4.187790870666504, "lr": 0.00039866036888853306, "tps": 8232, "wall": 17099.0} {"step": 2148, "train_loss": 4.125323295593262, "lr": 0.0003986580348914991, "tps": 8232, "wall": 17107.4} {"step": 2149, "train_loss": 4.144757270812988, "lr": 0.0003986556988706174, "tps": 8232, "wall": 17115.4} {"step": 2150, "train_loss": 4.05948543548584, "lr": 0.0003986533608259142, "tps": 8232, "wall": 17123.4} {"step": 2151, "train_loss": 4.172745227813721, "lr": 0.00039865102075741605, "tps": 8232, "wall": 17131.3} {"step": 2152, "train_loss": 4.149352550506592, "lr": 0.0003986486786651495, "tps": 8232, "wall": 17139.3} {"step": 2153, "train_loss": 4.220414161682129, "lr": 0.00039864633454914105, "tps": 8232, "wall": 17147.1} {"step": 2154, "train_loss": 4.142090797424316, "lr": 0.00039864398840941726, "tps": 8232, "wall": 17155.0} {"step": 2155, "train_loss": 4.163522720336914, "lr": 0.0003986416402460047, "tps": 8232, "wall": 17162.8} {"step": 2156, "train_loss": 4.168607711791992, "lr": 0.00039863929005892995, "tps": 8232, "wall": 17170.5} {"step": 2157, "train_loss": 4.086388111114502, "lr": 0.0003986369378482198, "tps": 8232, "wall": 17178.5} {"step": 2158, "train_loss": 4.142261028289795, "lr": 0.00039863458361390057, "tps": 8232, "wall": 17186.4} {"step": 2159, "train_loss": 4.126718997955322, "lr": 0.0003986322273559992, "tps": 8232, "wall": 17194.2} {"step": 2160, "train_loss": 4.210928440093994, "lr": 0.0003986298690745423, "tps": 8232, "wall": 17202.2} {"step": 2161, "train_loss": 4.11500358581543, "lr": 0.0003986275087695565, "tps": 8232, "wall": 17210.2} {"step": 2162, "train_loss": 4.151077747344971, "lr": 0.0003986251464410687, "tps": 8232, "wall": 17218.1} {"step": 2163, "train_loss": 4.127845287322998, "lr": 0.00039862278208910556, "tps": 8232, "wall": 17225.8} {"step": 2164, "train_loss": 4.146788120269775, "lr": 0.00039862041571369386, "tps": 8232, "wall": 17233.9} {"step": 2165, "train_loss": 4.1682024002075195, "lr": 0.0003986180473148604, "tps": 8232, "wall": 17241.9} {"step": 2166, "train_loss": 4.0570783615112305, "lr": 0.0003986156768926321, "tps": 8232, "wall": 17250.0} {"step": 2167, "train_loss": 4.105431079864502, "lr": 0.0003986133044470358, "tps": 8232, "wall": 17258.4} {"step": 2168, "train_loss": 4.077175617218018, "lr": 0.00039861092997809825, "tps": 8232, "wall": 17266.7} {"step": 2169, "train_loss": 4.109577178955078, "lr": 0.00039860855348584635, "tps": 8232, "wall": 17274.5} {"step": 2170, "train_loss": 4.194184303283691, "lr": 0.0003986061749703072, "tps": 8232, "wall": 17282.3} {"step": 2171, "train_loss": 4.147461414337158, "lr": 0.0003986037944315076, "tps": 8232, "wall": 17290.1} {"step": 2172, "train_loss": 4.110749244689941, "lr": 0.00039860141186947456, "tps": 8232, "wall": 17298.1} {"step": 2173, "train_loss": 4.228323936462402, "lr": 0.00039859902728423506, "tps": 8232, "wall": 17306.0} {"step": 2174, "train_loss": 4.092558860778809, "lr": 0.00039859664067581614, "tps": 8232, "wall": 17313.7} {"step": 2175, "train_loss": 4.158108234405518, "lr": 0.0003985942520442448, "tps": 8232, "wall": 17321.8} {"step": 2176, "train_loss": 4.174701690673828, "lr": 0.0003985918613895481, "tps": 8232, "wall": 17329.8} {"step": 2177, "train_loss": 4.0862298011779785, "lr": 0.00039858946871175314, "tps": 8232, "wall": 17338.1} {"step": 2178, "train_loss": 4.158327579498291, "lr": 0.00039858707401088704, "tps": 8232, "wall": 17346.7} {"step": 2179, "train_loss": 4.14375638961792, "lr": 0.00039858467728697683, "tps": 8232, "wall": 17354.9} {"step": 2180, "train_loss": 4.11359977722168, "lr": 0.00039858227854004983, "tps": 8232, "wall": 17362.8} {"step": 2181, "train_loss": 4.138995170593262, "lr": 0.00039857987777013303, "tps": 8232, "wall": 17370.7} {"step": 2182, "train_loss": 4.088939189910889, "lr": 0.0003985774749772537, "tps": 8232, "wall": 17378.6} {"step": 2183, "train_loss": 4.159228801727295, "lr": 0.0003985750701614392, "tps": 8232, "wall": 17386.5} {"step": 2184, "train_loss": 4.153986930847168, "lr": 0.00039857266332271656, "tps": 8232, "wall": 17394.4} {"step": 2185, "train_loss": 4.1478071212768555, "lr": 0.00039857025446111315, "tps": 8232, "wall": 17402.3} {"step": 2186, "train_loss": 4.055820941925049, "lr": 0.0003985678435766562, "tps": 8232, "wall": 17410.3} {"step": 2187, "train_loss": 4.111093521118164, "lr": 0.0003985654306693731, "tps": 8232, "wall": 17418.5} {"step": 2188, "train_loss": 4.185079097747803, "lr": 0.0003985630157392911, "tps": 8232, "wall": 17426.4} {"step": 2189, "train_loss": 4.134875297546387, "lr": 0.00039856059878643765, "tps": 8232, "wall": 17434.2} {"step": 2190, "train_loss": 4.123824119567871, "lr": 0.0003985581798108401, "tps": 8232, "wall": 17442.0} {"step": 2191, "train_loss": 4.153932571411133, "lr": 0.00039855575881252576, "tps": 8232, "wall": 17449.8} {"step": 2192, "train_loss": 4.167076110839844, "lr": 0.0003985533357915221, "tps": 8232, "wall": 17457.6} {"step": 2193, "train_loss": 4.1608076095581055, "lr": 0.00039855091074785664, "tps": 8231, "wall": 17468.6} {"step": 2194, "train_loss": 4.079793453216553, "lr": 0.0003985484836815568, "tps": 8229, "wall": 17481.0} {"step": 2195, "train_loss": 4.113667011260986, "lr": 0.00039854605459265006, "tps": 8226, "wall": 17493.3} {"step": 2196, "train_loss": 4.194798469543457, "lr": 0.000398543623481164, "tps": 8227, "wall": 17501.2} {"step": 2197, "train_loss": 4.082360744476318, "lr": 0.0003985411903471261, "tps": 8227, "wall": 17508.9} {"step": 2198, "train_loss": 4.1796417236328125, "lr": 0.0003985387551905639, "tps": 8225, "wall": 17519.7} {"step": 2199, "train_loss": 4.067371368408203, "lr": 0.00039853631801150505, "tps": 8225, "wall": 17528.4} {"step": 2200, "train_loss": 4.1565022468566895, "lr": 0.00039853387880997717, "tps": 8225, "wall": 17537.2} {"step": 2201, "train_loss": 4.192437171936035, "lr": 0.0003985314375860078, "tps": 8224, "wall": 17545.9} {"step": 2202, "train_loss": 4.15106201171875, "lr": 0.0003985289943396246, "tps": 8224, "wall": 17554.5} {"step": 2203, "train_loss": 4.148452281951904, "lr": 0.00039852654907085536, "tps": 8224, "wall": 17563.2} {"step": 2204, "train_loss": 4.137076377868652, "lr": 0.0003985241017797277, "tps": 8223, "wall": 17571.9} {"step": 2205, "train_loss": 4.1314496994018555, "lr": 0.0003985216524662694, "tps": 8223, "wall": 17580.6} {"step": 2206, "train_loss": 4.118042945861816, "lr": 0.0003985192011305081, "tps": 8223, "wall": 17589.3} {"step": 2207, "train_loss": 4.090348243713379, "lr": 0.0003985167477724717, "tps": 8222, "wall": 17598.1} {"step": 2208, "train_loss": 4.107318878173828, "lr": 0.00039851429239218787, "tps": 8222, "wall": 17606.6} {"step": 2209, "train_loss": 4.116876602172852, "lr": 0.00039851183498968443, "tps": 8222, "wall": 17614.7} {"step": 2210, "train_loss": 4.060361862182617, "lr": 0.00039850937556498933, "tps": 8222, "wall": 17622.6} {"step": 2211, "train_loss": 4.13803243637085, "lr": 0.0003985069141181304, "tps": 8222, "wall": 17630.9} {"step": 2212, "train_loss": 4.187274932861328, "lr": 0.00039850445064913546, "tps": 8222, "wall": 17639.1} {"step": 2213, "train_loss": 4.086998462677002, "lr": 0.0003985019851580324, "tps": 8222, "wall": 17647.1} {"step": 2214, "train_loss": 4.124454975128174, "lr": 0.00039849951764484926, "tps": 8221, "wall": 17655.7} {"step": 2215, "train_loss": 4.164516925811768, "lr": 0.0003984970481096139, "tps": 8221, "wall": 17663.8} {"step": 2216, "train_loss": 4.108913421630859, "lr": 0.0003984945765523543, "tps": 8221, "wall": 17673.2} {"step": 2217, "train_loss": 4.14548397064209, "lr": 0.0003984921029730985, "tps": 8220, "wall": 17683.1} {"step": 2218, "train_loss": 4.0541768074035645, "lr": 0.00039848962737187453, "tps": 8219, "wall": 17693.0} {"step": 2219, "train_loss": 4.0912251472473145, "lr": 0.0003984871497487104, "tps": 8218, "wall": 17702.3} {"step": 2220, "train_loss": 4.182229042053223, "lr": 0.0003984846701036341, "tps": 8218, "wall": 17710.5} {"step": 2221, "train_loss": 4.06156063079834, "lr": 0.0003984821884366739, "tps": 8218, "wall": 17718.9} {"step": 2222, "train_loss": 3.953092575073242, "lr": 0.00039847970474785776, "tps": 8218, "wall": 17727.5} {"step": 2223, "train_loss": 4.058444976806641, "lr": 0.0003984772190372139, "tps": 8218, "wall": 17735.7} {"step": 2224, "train_loss": 4.082152843475342, "lr": 0.00039847473130477044, "tps": 8217, "wall": 17743.8} {"step": 2225, "train_loss": 4.1533284187316895, "lr": 0.0003984722415505556, "tps": 8217, "wall": 17751.9} {"step": 2226, "train_loss": 4.058980941772461, "lr": 0.0003984697497745974, "tps": 8217, "wall": 17760.4} {"step": 2227, "train_loss": 4.2789306640625, "lr": 0.0003984672559769244, "tps": 8217, "wall": 17768.5} {"step": 2228, "train_loss": 4.085078716278076, "lr": 0.0003984647601575646, "tps": 8217, "wall": 17777.1} {"step": 2229, "train_loss": 4.102916717529297, "lr": 0.00039846226231654634, "tps": 8216, "wall": 17786.6} {"step": 2230, "train_loss": 4.065319538116455, "lr": 0.0003984597624538979, "tps": 8215, "wall": 17796.1} {"step": 2231, "train_loss": 4.044780254364014, "lr": 0.00039845726056964763, "tps": 8215, "wall": 17805.6} {"step": 2232, "train_loss": 3.9464635848999023, "lr": 0.0003984547566638239, "tps": 8214, "wall": 17815.1} {"step": 2233, "train_loss": 4.162283897399902, "lr": 0.00039845225073645497, "tps": 8213, "wall": 17824.8} {"step": 2234, "train_loss": 4.13631010055542, "lr": 0.0003984497427875693, "tps": 8212, "wall": 17834.3} {"step": 2235, "train_loss": 4.085916042327881, "lr": 0.00039844723281719533, "tps": 8212, "wall": 17843.9} {"step": 2236, "train_loss": 4.214929103851318, "lr": 0.00039844472082536145, "tps": 8211, "wall": 17853.6} {"step": 2237, "train_loss": 4.179731369018555, "lr": 0.00039844220681209603, "tps": 8210, "wall": 17863.4} {"step": 2238, "train_loss": 4.162860870361328, "lr": 0.00039843969077742777, "tps": 8209, "wall": 17872.9} {"step": 2239, "train_loss": 4.181973457336426, "lr": 0.00039843717272138496, "tps": 8209, "wall": 17882.6} {"step": 2240, "train_loss": 4.101703643798828, "lr": 0.0003984346526439962, "tps": 8208, "wall": 17892.3} {"step": 2241, "train_loss": 4.133056163787842, "lr": 0.00039843213054529007, "tps": 8207, "wall": 17902.1} {"step": 2242, "train_loss": 4.20131254196167, "lr": 0.00039842960642529513, "tps": 8206, "wall": 17911.8} {"step": 2243, "train_loss": 4.16014289855957, "lr": 0.0003984270802840399, "tps": 8205, "wall": 17921.5} {"step": 2244, "train_loss": 4.060423851013184, "lr": 0.00039842455212155315, "tps": 8205, "wall": 17931.3} {"step": 2245, "train_loss": 4.101911544799805, "lr": 0.0003984220219378633, "tps": 8204, "wall": 17940.9} {"step": 2246, "train_loss": 4.161965370178223, "lr": 0.00039841948973299917, "tps": 8203, "wall": 17950.6} {"step": 2247, "train_loss": 4.095888614654541, "lr": 0.0003984169555069894, "tps": 8202, "wall": 17960.5} {"step": 2248, "train_loss": 4.12378454208374, "lr": 0.00039841441925986276, "tps": 8201, "wall": 17970.2} {"step": 2249, "train_loss": 4.0462493896484375, "lr": 0.00039841188099164784, "tps": 8201, "wall": 17979.4} {"step": 2250, "train_loss": 4.149685859680176, "lr": 0.0003984093407023736, "tps": 8201, "wall": 17988.1} {"step": 2251, "train_loss": 3.9583704471588135, "lr": 0.0003984067983920686, "tps": 8200, "wall": 17996.7} {"step": 2252, "train_loss": 4.0601677894592285, "lr": 0.0003984042540607618, "tps": 8200, "wall": 18005.5} {"step": 2253, "train_loss": 4.185407638549805, "lr": 0.00039840170770848193, "tps": 8200, "wall": 18014.1} {"step": 2254, "train_loss": 4.186232566833496, "lr": 0.0003983991593352579, "tps": 8199, "wall": 18022.7} {"step": 2255, "train_loss": 4.147280216217041, "lr": 0.0003983966089411185, "tps": 8199, "wall": 18031.4} {"step": 2256, "train_loss": 4.019291400909424, "lr": 0.0003983940565260926, "tps": 8199, "wall": 18040.2} {"step": 2257, "train_loss": 4.178249359130859, "lr": 0.00039839150209020925, "tps": 8198, "wall": 18048.7} {"step": 2258, "train_loss": 4.09194803237915, "lr": 0.0003983889456334973, "tps": 8198, "wall": 18057.2} {"step": 2259, "train_loss": 3.9798824787139893, "lr": 0.00039838638715598574, "tps": 8198, "wall": 18065.5} {"step": 2260, "train_loss": 4.0774736404418945, "lr": 0.00039838382665770354, "tps": 8198, "wall": 18074.1} {"step": 2261, "train_loss": 4.107024192810059, "lr": 0.0003983812641386797, "tps": 8198, "wall": 18082.7} {"step": 2262, "train_loss": 4.119085311889648, "lr": 0.0003983786995989432, "tps": 8197, "wall": 18091.1} {"step": 2263, "train_loss": 4.1814117431640625, "lr": 0.00039837613303852316, "tps": 8197, "wall": 18099.4} {"step": 2264, "train_loss": 4.111677169799805, "lr": 0.0003983735644574487, "tps": 8197, "wall": 18107.9} {"step": 2265, "train_loss": 4.091769695281982, "lr": 0.00039837099385574883, "tps": 8197, "wall": 18116.4} {"step": 2266, "train_loss": 4.094053268432617, "lr": 0.00039836842123345265, "tps": 8197, "wall": 18124.7} {"step": 2267, "train_loss": 4.1557793617248535, "lr": 0.0003983658465905893, "tps": 8196, "wall": 18133.0} {"step": 2268, "train_loss": 4.0928778648376465, "lr": 0.00039836326992718807, "tps": 8196, "wall": 18141.3} {"step": 2269, "train_loss": 4.195437908172607, "lr": 0.00039836069124327806, "tps": 8196, "wall": 18149.5} {"step": 2270, "train_loss": 4.163545608520508, "lr": 0.0003983581105388885, "tps": 8196, "wall": 18157.7} {"step": 2271, "train_loss": 4.071491241455078, "lr": 0.0003983555278140486, "tps": 8195, "wall": 18167.4} {"step": 2272, "train_loss": 4.129642486572266, "lr": 0.0003983529430687876, "tps": 8195, "wall": 18176.9} {"step": 2273, "train_loss": 4.139116287231445, "lr": 0.00039835035630313484, "tps": 8194, "wall": 18185.4} {"step": 2274, "train_loss": 4.0284037590026855, "lr": 0.00039834776751711964, "tps": 8194, "wall": 18193.9} {"step": 2275, "train_loss": 4.008245944976807, "lr": 0.00039834517671077116, "tps": 8194, "wall": 18202.2} {"step": 2276, "train_loss": 4.136421203613281, "lr": 0.00039834258388411894, "tps": 8194, "wall": 18210.4} {"step": 2277, "train_loss": 4.0165486335754395, "lr": 0.0003983399890371923, "tps": 8194, "wall": 18218.7} {"step": 2278, "train_loss": 4.146952152252197, "lr": 0.0003983373921700206, "tps": 8194, "wall": 18226.7} {"step": 2279, "train_loss": 4.092480659484863, "lr": 0.0003983347932826333, "tps": 8194, "wall": 18234.7} {"step": 2280, "train_loss": 4.052053451538086, "lr": 0.0003983321923750598, "tps": 8194, "wall": 18242.7} {"step": 2281, "train_loss": 4.141684532165527, "lr": 0.00039832958944732954, "tps": 8194, "wall": 18250.6} {"step": 2282, "train_loss": 4.090565204620361, "lr": 0.0003983269844994721, "tps": 8194, "wall": 18258.7} {"step": 2283, "train_loss": 4.068453788757324, "lr": 0.0003983243775315169, "tps": 8194, "wall": 18266.6} {"step": 2284, "train_loss": 4.17002534866333, "lr": 0.0003983217685434935, "tps": 8194, "wall": 18274.6} {"step": 2285, "train_loss": 4.09297513961792, "lr": 0.0003983191575354315, "tps": 8194, "wall": 18282.6} {"step": 2286, "train_loss": 4.067611217498779, "lr": 0.0003983165445073604, "tps": 8194, "wall": 18290.8} {"step": 2287, "train_loss": 4.136112689971924, "lr": 0.00039831392945930983, "tps": 8194, "wall": 18299.1} {"step": 2288, "train_loss": 4.063094139099121, "lr": 0.0003983113123913094, "tps": 8193, "wall": 18308.8} {"step": 2289, "train_loss": 3.9892072677612305, "lr": 0.0003983086933033888, "tps": 8192, "wall": 18318.5} {"step": 2290, "train_loss": 4.0395827293396, "lr": 0.0003983060721955777, "tps": 8192, "wall": 18327.9} {"step": 2291, "train_loss": 4.14064359664917, "lr": 0.00039830344906790577, "tps": 8191, "wall": 18336.0} {"step": 2292, "train_loss": 4.075397491455078, "lr": 0.0003983008239204027, "tps": 8192, "wall": 18344.0} {"step": 2293, "train_loss": 4.096182823181152, "lr": 0.00039829819675309824, "tps": 8191, "wall": 18352.1} {"step": 2294, "train_loss": 4.130499839782715, "lr": 0.00039829556756602213, "tps": 8191, "wall": 18360.5} {"step": 2295, "train_loss": 4.0736470222473145, "lr": 0.00039829293635920427, "tps": 8191, "wall": 18369.2} {"step": 2296, "train_loss": 4.1014933586120605, "lr": 0.0003982903031326743, "tps": 8191, "wall": 18377.7} {"step": 2297, "train_loss": 4.1258721351623535, "lr": 0.0003982876678864622, "tps": 8191, "wall": 18386.0} {"step": 2298, "train_loss": 4.106794357299805, "lr": 0.0003982850306205977, "tps": 8191, "wall": 18394.2} {"step": 2299, "train_loss": 4.144443988800049, "lr": 0.0003982823913351108, "tps": 8190, "wall": 18402.5} {"step": 2300, "train_loss": 4.06464958190918, "lr": 0.00039827975003003133, "tps": 8190, "wall": 18410.8} {"step": 2301, "train_loss": 4.0337090492248535, "lr": 0.0003982771067053891, "tps": 8190, "wall": 18419.3} {"step": 2302, "train_loss": 4.125198841094971, "lr": 0.0003982744613612142, "tps": 8190, "wall": 18428.2} {"step": 2303, "train_loss": 4.05255126953125, "lr": 0.00039827181399753665, "tps": 8189, "wall": 18438.3} {"step": 2304, "train_loss": 4.151566982269287, "lr": 0.00039826916461438623, "tps": 8188, "wall": 18446.8} {"step": 2305, "train_loss": 4.126660346984863, "lr": 0.0003982665132117931, "tps": 8188, "wall": 18455.0} {"step": 2306, "train_loss": 4.1122236251831055, "lr": 0.00039826385978978726, "tps": 8188, "wall": 18463.2} {"step": 2307, "train_loss": 4.03790283203125, "lr": 0.00039826120434839884, "tps": 8188, "wall": 18471.3} {"step": 2308, "train_loss": 4.195583343505859, "lr": 0.00039825854688765774, "tps": 8188, "wall": 18479.4} {"step": 2309, "train_loss": 4.080143928527832, "lr": 0.0003982558874075942, "tps": 8188, "wall": 18487.9} {"step": 2310, "train_loss": 4.079603672027588, "lr": 0.00039825322590823846, "tps": 8188, "wall": 18496.2} {"step": 2311, "train_loss": 4.045477867126465, "lr": 0.0003982505623896204, "tps": 8188, "wall": 18504.2} {"step": 2312, "train_loss": 4.077966690063477, "lr": 0.0003982478968517704, "tps": 8188, "wall": 18512.3} {"step": 2313, "train_loss": 4.1130690574646, "lr": 0.0003982452292947185, "tps": 8188, "wall": 18520.3} {"step": 2314, "train_loss": 4.157153129577637, "lr": 0.000398242559718495, "tps": 8188, "wall": 18528.4} {"step": 2315, "train_loss": 4.150197982788086, "lr": 0.0003982398881231302, "tps": 8188, "wall": 18536.7} {"step": 2316, "train_loss": 4.04819393157959, "lr": 0.0003982372145086543, "tps": 8188, "wall": 18545.0} {"step": 2317, "train_loss": 4.139155387878418, "lr": 0.00039823453887509756, "tps": 8187, "wall": 18554.0} {"step": 2318, "train_loss": 4.144802570343018, "lr": 0.0003982318612224904, "tps": 8186, "wall": 18563.4} {"step": 2319, "train_loss": 4.020670413970947, "lr": 0.000398229181550863, "tps": 8186, "wall": 18572.9} {"step": 2320, "train_loss": 4.074458122253418, "lr": 0.00039822649986024576, "tps": 8185, "wall": 18582.2} {"step": 2321, "train_loss": 4.147770404815674, "lr": 0.0003982238161506692, "tps": 8185, "wall": 18591.6} {"step": 2322, "train_loss": 4.095615863800049, "lr": 0.0003982211304221635, "tps": 8184, "wall": 18601.1} {"step": 2323, "train_loss": 4.15355110168457, "lr": 0.00039821844267475925, "tps": 8183, "wall": 18610.5} {"step": 2324, "train_loss": 4.068856716156006, "lr": 0.00039821575290848685, "tps": 8183, "wall": 18620.2} {"step": 2325, "train_loss": 4.145378112792969, "lr": 0.00039821306112337667, "tps": 8182, "wall": 18630.2} {"step": 2326, "train_loss": 4.025833606719971, "lr": 0.0003982103673194594, "tps": 8181, "wall": 18639.9} {"step": 2327, "train_loss": 4.107869625091553, "lr": 0.0003982076714967654, "tps": 8180, "wall": 18649.8} {"step": 2328, "train_loss": 4.142786979675293, "lr": 0.00039820497365532524, "tps": 8179, "wall": 18660.8} {"step": 2329, "train_loss": 4.047732353210449, "lr": 0.00039820227379516954, "tps": 8178, "wall": 18671.2} {"step": 2330, "train_loss": 4.090080261230469, "lr": 0.0003981995719163288, "tps": 8177, "wall": 18681.5} {"step": 2331, "train_loss": 4.08812141418457, "lr": 0.00039819686801883364, "tps": 8176, "wall": 18692.2} {"step": 2332, "train_loss": 4.081151008605957, "lr": 0.0003981941621027148, "tps": 8174, "wall": 18702.9} {"step": 2333, "train_loss": 4.054259777069092, "lr": 0.0003981914541680028, "tps": 8173, "wall": 18714.4} {"step": 2334, "train_loss": 3.9896111488342285, "lr": 0.0003981887442147284, "tps": 8171, "wall": 18726.2} {"step": 2335, "train_loss": 4.052223205566406, "lr": 0.0003981860322429223, "tps": 8170, "wall": 18737.9} {"step": 2336, "train_loss": 4.08847188949585, "lr": 0.0003981833182526151, "tps": 8165, "wall": 18757.6} {"step": 2337, "train_loss": 4.070720672607422, "lr": 0.0003981806022438377, "tps": 8162, "wall": 18772.6} {"step": 2338, "train_loss": 4.140042781829834, "lr": 0.00039817788421662076, "tps": 8161, "wall": 18781.0} {"step": 2339, "train_loss": 4.115926265716553, "lr": 0.00039817516417099506, "tps": 8161, "wall": 18789.4} {"step": 2340, "train_loss": 3.9902241230010986, "lr": 0.0003981724421069916, "tps": 8161, "wall": 18798.3} {"step": 2341, "train_loss": 4.055506706237793, "lr": 0.00039816971802464097, "tps": 8160, "wall": 18807.8} {"step": 2342, "train_loss": 4.068941593170166, "lr": 0.00039816699192397415, "tps": 8160, "wall": 18817.4} {"step": 2343, "train_loss": 4.160626411437988, "lr": 0.000398164263805022, "tps": 8159, "wall": 18826.2} {"step": 2344, "train_loss": 4.137358665466309, "lr": 0.00039816153366781546, "tps": 8159, "wall": 18835.7} {"step": 2345, "train_loss": 4.128082752227783, "lr": 0.00039815880151238545, "tps": 8158, "wall": 18845.2} {"step": 2346, "train_loss": 4.009490013122559, "lr": 0.0003981560673387628, "tps": 8157, "wall": 18854.8} {"step": 2347, "train_loss": 4.111088275909424, "lr": 0.0003981533311469787, "tps": 8157, "wall": 18863.9} {"step": 2348, "train_loss": 4.0983147621154785, "lr": 0.000398150592937064, "tps": 8156, "wall": 18873.4} {"step": 2349, "train_loss": 4.120238304138184, "lr": 0.0003981478527090497, "tps": 8156, "wall": 18882.9} {"step": 2350, "train_loss": 4.0527825355529785, "lr": 0.0003981451104629669, "tps": 8155, "wall": 18892.4} {"step": 2351, "train_loss": 4.1038055419921875, "lr": 0.0003981423661988466, "tps": 8154, "wall": 18902.0} {"step": 2352, "train_loss": 4.000622749328613, "lr": 0.00039813961991672, "tps": 8153, "wall": 18912.0} {"step": 2353, "train_loss": 4.105041027069092, "lr": 0.0003981368716166182, "tps": 8153, "wall": 18921.3} {"step": 2354, "train_loss": 4.1041388511657715, "lr": 0.00039813412129857217, "tps": 8152, "wall": 18930.3} {"step": 2355, "train_loss": 4.077672481536865, "lr": 0.00039813136896261326, "tps": 8152, "wall": 18939.4} {"step": 2356, "train_loss": 4.010402679443359, "lr": 0.00039812861460877255, "tps": 8152, "wall": 18948.2} {"step": 2357, "train_loss": 4.108839511871338, "lr": 0.0003981258582370812, "tps": 8151, "wall": 18957.2} {"step": 2358, "train_loss": 4.031752586364746, "lr": 0.00039812309984757054, "tps": 8151, "wall": 18966.2} {"step": 2359, "train_loss": 4.232316493988037, "lr": 0.00039812033944027175, "tps": 8150, "wall": 18975.3} {"step": 2360, "train_loss": 3.989715576171875, "lr": 0.0003981175770152162, "tps": 8150, "wall": 18984.1} {"step": 2361, "train_loss": 4.035110950469971, "lr": 0.000398114812572435, "tps": 8150, "wall": 18993.1} {"step": 2362, "train_loss": 3.986477851867676, "lr": 0.00039811204611195963, "tps": 8149, "wall": 19001.9} {"step": 2363, "train_loss": 4.097870349884033, "lr": 0.0003981092776338213, "tps": 8149, "wall": 19011.0} {"step": 2364, "train_loss": 4.093055248260498, "lr": 0.00039810650713805146, "tps": 8148, "wall": 19020.0} {"step": 2365, "train_loss": 4.050332069396973, "lr": 0.00039810373462468153, "tps": 8148, "wall": 19028.7} {"step": 2366, "train_loss": 4.184586524963379, "lr": 0.00039810096009374276, "tps": 8148, "wall": 19037.8} {"step": 2367, "train_loss": 4.098074913024902, "lr": 0.00039809818354526676, "tps": 8147, "wall": 19046.5} {"step": 2368, "train_loss": 3.9968481063842773, "lr": 0.0003980954049792849, "tps": 8147, "wall": 19055.5} {"step": 2369, "train_loss": 4.023069381713867, "lr": 0.0003980926243958286, "tps": 8147, "wall": 19064.4} {"step": 2370, "train_loss": 4.15001106262207, "lr": 0.00039808984179492946, "tps": 8146, "wall": 19073.3} {"step": 2371, "train_loss": 4.140623092651367, "lr": 0.000398087057176619, "tps": 8146, "wall": 19082.1} {"step": 2372, "train_loss": 4.187007427215576, "lr": 0.00039808427054092863, "tps": 8146, "wall": 19091.0} {"step": 2373, "train_loss": 4.017231464385986, "lr": 0.00039808148188789005, "tps": 8145, "wall": 19100.2} {"step": 2374, "train_loss": 4.132759094238281, "lr": 0.0003980786912175348, "tps": 8145, "wall": 19109.1} {"step": 2375, "train_loss": 4.004693508148193, "lr": 0.0003980758985298945, "tps": 8144, "wall": 19118.1} {"step": 2376, "train_loss": 4.1204118728637695, "lr": 0.0003980731038250008, "tps": 8144, "wall": 19127.0} {"step": 2377, "train_loss": 4.098705291748047, "lr": 0.0003980703071028854, "tps": 8144, "wall": 19135.9} {"step": 2378, "train_loss": 4.0378098487854, "lr": 0.00039806750836357985, "tps": 8143, "wall": 19144.6} {"step": 2379, "train_loss": 4.110062122344971, "lr": 0.00039806470760711597, "tps": 8143, "wall": 19153.4} {"step": 2380, "train_loss": 4.148690223693848, "lr": 0.0003980619048335254, "tps": 8143, "wall": 19162.4} {"step": 2381, "train_loss": 4.168468475341797, "lr": 0.00039805910004284, "tps": 8142, "wall": 19171.2} {"step": 2382, "train_loss": 4.079953670501709, "lr": 0.0003980562932350914, "tps": 8142, "wall": 19180.2} {"step": 2383, "train_loss": 4.121803283691406, "lr": 0.00039805348441031155, "tps": 8142, "wall": 19189.0} {"step": 2384, "train_loss": 4.1568779945373535, "lr": 0.00039805067356853217, "tps": 8141, "wall": 19198.0} {"step": 2385, "train_loss": 4.125864028930664, "lr": 0.00039804786070978513, "tps": 8141, "wall": 19206.6} {"step": 2386, "train_loss": 4.0479865074157715, "lr": 0.00039804504583410233, "tps": 8140, "wall": 19215.7} {"step": 2387, "train_loss": 4.051701545715332, "lr": 0.0003980422289415156, "tps": 8140, "wall": 19224.6} {"step": 2388, "train_loss": 4.003537178039551, "lr": 0.00039803941003205685, "tps": 8140, "wall": 19233.4} {"step": 2389, "train_loss": 4.089040279388428, "lr": 0.00039803658910575804, "tps": 8140, "wall": 19242.1} {"step": 2390, "train_loss": 4.1222920417785645, "lr": 0.00039803376616265107, "tps": 8139, "wall": 19250.9} {"step": 2391, "train_loss": 4.236099720001221, "lr": 0.000398030941202768, "tps": 8139, "wall": 19259.9} {"step": 2392, "train_loss": 4.073434352874756, "lr": 0.00039802811422614084, "tps": 8138, "wall": 19268.7} {"step": 2393, "train_loss": 3.9602222442626953, "lr": 0.0003980252852328015, "tps": 8138, "wall": 19277.6} {"step": 2394, "train_loss": 4.165871620178223, "lr": 0.00039802245422278215, "tps": 8138, "wall": 19286.7} {"step": 2395, "train_loss": 4.037109375, "lr": 0.0003980196211961148, "tps": 8137, "wall": 19296.1} {"step": 2396, "train_loss": 4.064733028411865, "lr": 0.00039801678615283153, "tps": 8137, "wall": 19305.2} {"step": 2397, "train_loss": 4.037590026855469, "lr": 0.0003980139490929645, "tps": 8136, "wall": 19314.2} {"step": 2398, "train_loss": 3.969398021697998, "lr": 0.0003980111100165458, "tps": 8136, "wall": 19323.1} {"step": 2399, "train_loss": 4.022239685058594, "lr": 0.00039800826892360765, "tps": 8136, "wall": 19332.1} {"step": 2400, "train_loss": 4.192785739898682, "lr": 0.0003980054258141822, "tps": 8135, "wall": 19341.1} {"step": 2401, "train_loss": 4.0900373458862305, "lr": 0.0003980025806883016, "tps": 8135, "wall": 19350.0} {"step": 2402, "train_loss": 4.100881099700928, "lr": 0.0003979997335459982, "tps": 8134, "wall": 19358.8} {"step": 2403, "train_loss": 4.0675048828125, "lr": 0.0003979968843873041, "tps": 8134, "wall": 19367.7} {"step": 2404, "train_loss": 4.177422046661377, "lr": 0.0003979940332122517, "tps": 8134, "wall": 19376.5} {"step": 2405, "train_loss": 3.999478816986084, "lr": 0.0003979911800208733, "tps": 8133, "wall": 19385.4} {"step": 2406, "train_loss": 4.097501754760742, "lr": 0.0003979883248132012, "tps": 8133, "wall": 19394.4} {"step": 2407, "train_loss": 4.1311211585998535, "lr": 0.0003979854675892677, "tps": 8133, "wall": 19403.2} {"step": 2408, "train_loss": 4.103408336639404, "lr": 0.0003979826083491052, "tps": 8132, "wall": 19412.1} {"step": 2409, "train_loss": 4.042229175567627, "lr": 0.0003979797470927461, "tps": 8132, "wall": 19420.4} {"step": 2410, "train_loss": 4.090813636779785, "lr": 0.0003979768838202227, "tps": 8132, "wall": 19429.5} {"step": 2411, "train_loss": 3.9836983680725098, "lr": 0.00039797401853156766, "tps": 8132, "wall": 19438.3} {"step": 2412, "train_loss": 3.9417409896850586, "lr": 0.0003979711512268132, "tps": 8131, "wall": 19447.2} {"step": 2413, "train_loss": 4.037329196929932, "lr": 0.000397968281905992, "tps": 8131, "wall": 19456.2} {"step": 2414, "train_loss": 4.193700790405273, "lr": 0.00039796541056913643, "tps": 8130, "wall": 19465.0} {"step": 2415, "train_loss": 4.124484062194824, "lr": 0.0003979625372162791, "tps": 8130, "wall": 19474.1} {"step": 2416, "train_loss": 4.071821212768555, "lr": 0.00039795966184745247, "tps": 8130, "wall": 19482.9} {"step": 2417, "train_loss": 4.1050825119018555, "lr": 0.0003979567844626892, "tps": 8129, "wall": 19492.1} {"step": 2418, "train_loss": 3.9870967864990234, "lr": 0.0003979539050620218, "tps": 8129, "wall": 19501.1} {"step": 2419, "train_loss": 4.023258209228516, "lr": 0.00039795102364548294, "tps": 8129, "wall": 19509.9} {"step": 2420, "train_loss": 4.023440837860107, "lr": 0.00039794814021310536, "tps": 8128, "wall": 19518.9} {"step": 2421, "train_loss": 4.134433746337891, "lr": 0.0003979452547649215, "tps": 8128, "wall": 19527.7} {"step": 2422, "train_loss": 4.218094825744629, "lr": 0.00039794236730096425, "tps": 8128, "wall": 19536.5} {"step": 2423, "train_loss": 4.129400253295898, "lr": 0.00039793947782126616, "tps": 8127, "wall": 19545.4} {"step": 2424, "train_loss": 4.032871723175049, "lr": 0.00039793658632586014, "tps": 8127, "wall": 19554.3} {"step": 2425, "train_loss": 4.025307655334473, "lr": 0.00039793369281477875, "tps": 8126, "wall": 19563.3} {"step": 2426, "train_loss": 4.166590213775635, "lr": 0.0003979307972880549, "tps": 8126, "wall": 19572.3} {"step": 2427, "train_loss": 4.107674598693848, "lr": 0.00039792789974572136, "tps": 8126, "wall": 19581.2} {"step": 2428, "train_loss": 4.046412944793701, "lr": 0.0003979250001878109, "tps": 8125, "wall": 19590.1} {"step": 2429, "train_loss": 4.00986909866333, "lr": 0.00039792209861435647, "tps": 8125, "wall": 19599.0} {"step": 2430, "train_loss": 4.080301284790039, "lr": 0.00039791919502539085, "tps": 8125, "wall": 19607.7} {"step": 2431, "train_loss": 4.035521030426025, "lr": 0.00039791628942094696, "tps": 8125, "wall": 19616.3} {"step": 2432, "train_loss": 4.09724235534668, "lr": 0.0003979133818010577, "tps": 8124, "wall": 19624.9} {"step": 2433, "train_loss": 4.044577598571777, "lr": 0.0003979104721657561, "tps": 8124, "wall": 19633.6} {"step": 2434, "train_loss": 4.094155788421631, "lr": 0.00039790756051507497, "tps": 8124, "wall": 19642.2} {"step": 2435, "train_loss": 3.9805781841278076, "lr": 0.0003979046468490474, "tps": 8124, "wall": 19650.7} {"step": 2436, "train_loss": 4.099203586578369, "lr": 0.0003979017311677064, "tps": 8123, "wall": 19659.3} {"step": 2437, "train_loss": 4.120710372924805, "lr": 0.0003978988134710849, "tps": 8123, "wall": 19668.3} {"step": 2438, "train_loss": 4.110302448272705, "lr": 0.00039789589375921605, "tps": 8122, "wall": 19678.4} {"step": 2439, "train_loss": 4.0051589012146, "lr": 0.0003978929720321329, "tps": 8121, "wall": 19688.2} {"step": 2440, "train_loss": 4.095966815948486, "lr": 0.0003978900482898685, "tps": 8121, "wall": 19697.9} {"step": 2441, "train_loss": 4.059842586517334, "lr": 0.00039788712253245606, "tps": 8121, "wall": 19705.9} {"step": 2442, "train_loss": 4.087954998016357, "lr": 0.00039788419475992866, "tps": 8121, "wall": 19713.8} {"step": 2443, "train_loss": 4.156579971313477, "lr": 0.00039788126497231947, "tps": 8121, "wall": 19721.8} {"step": 2444, "train_loss": 4.013286113739014, "lr": 0.0003978783331696617, "tps": 8121, "wall": 19729.8} {"step": 2445, "train_loss": 4.084534645080566, "lr": 0.00039787539935198855, "tps": 8121, "wall": 19737.8} {"step": 2446, "train_loss": 4.084088325500488, "lr": 0.00039787246351933323, "tps": 8121, "wall": 19745.7} {"step": 2447, "train_loss": 4.090554237365723, "lr": 0.000397869525671729, "tps": 8121, "wall": 19753.7} {"step": 2448, "train_loss": 4.147721767425537, "lr": 0.00039786658580920917, "tps": 8121, "wall": 19761.9} {"step": 2449, "train_loss": 3.9706077575683594, "lr": 0.0003978636439318071, "tps": 8121, "wall": 19770.1} {"step": 2450, "train_loss": 4.101555824279785, "lr": 0.000397860700039556, "tps": 8121, "wall": 19778.1} {"step": 2451, "train_loss": 4.031877517700195, "lr": 0.0003978577541324892, "tps": 8121, "wall": 19786.1} {"step": 2452, "train_loss": 4.043636798858643, "lr": 0.0003978548062106403, "tps": 8121, "wall": 19794.0} {"step": 2453, "train_loss": 4.089889049530029, "lr": 0.0003978518562740424, "tps": 8121, "wall": 19801.9} {"step": 2454, "train_loss": 4.009161949157715, "lr": 0.0003978489043227291, "tps": 8121, "wall": 19809.9} {"step": 2455, "train_loss": 4.06187105178833, "lr": 0.00039784595035673376, "tps": 8121, "wall": 19818.1} {"step": 2456, "train_loss": 4.0253825187683105, "lr": 0.0003978429943760899, "tps": 8121, "wall": 19826.2} {"step": 2457, "train_loss": 4.128584861755371, "lr": 0.000397840036380831, "tps": 8121, "wall": 19834.2} {"step": 2458, "train_loss": 4.140567779541016, "lr": 0.0003978370763709905, "tps": 8121, "wall": 19842.1} {"step": 2459, "train_loss": 4.000917434692383, "lr": 0.000397834114346602, "tps": 8121, "wall": 19850.0} {"step": 2460, "train_loss": 4.058790683746338, "lr": 0.0003978311503076991, "tps": 8121, "wall": 19858.0} {"step": 2461, "train_loss": 4.0583882331848145, "lr": 0.0003978281842543152, "tps": 8121, "wall": 19865.9} {"step": 2462, "train_loss": 3.972414970397949, "lr": 0.000397825216186484, "tps": 8121, "wall": 19874.0} {"step": 2463, "train_loss": 4.126299858093262, "lr": 0.00039782224610423924, "tps": 8121, "wall": 19881.9} {"step": 2464, "train_loss": 4.105301856994629, "lr": 0.00039781927400761434, "tps": 8122, "wall": 19889.9} {"step": 2465, "train_loss": 4.03827428817749, "lr": 0.0003978162998966431, "tps": 8122, "wall": 19897.7} {"step": 2466, "train_loss": 4.034860610961914, "lr": 0.00039781332377135934, "tps": 8122, "wall": 19905.7} {"step": 2467, "train_loss": 4.077364921569824, "lr": 0.00039781034563179647, "tps": 8122, "wall": 19913.4} {"step": 2468, "train_loss": 4.132662773132324, "lr": 0.0003978073654779885, "tps": 8122, "wall": 19921.3} {"step": 2469, "train_loss": 4.1622467041015625, "lr": 0.00039780438330996897, "tps": 8122, "wall": 19929.4} {"step": 2470, "train_loss": 4.131066799163818, "lr": 0.00039780139912777183, "tps": 8122, "wall": 19937.4} {"step": 2471, "train_loss": 4.189774513244629, "lr": 0.0003977984129314308, "tps": 8122, "wall": 19945.3} {"step": 2472, "train_loss": 4.041950702667236, "lr": 0.00039779542472097974, "tps": 8122, "wall": 19953.2} {"step": 2473, "train_loss": 4.086331844329834, "lr": 0.00039779243449645244, "tps": 8122, "wall": 19961.2} {"step": 2474, "train_loss": 4.080138206481934, "lr": 0.0003977894422578829, "tps": 8122, "wall": 19969.1} {"step": 2475, "train_loss": 4.065690040588379, "lr": 0.0003977864480053049, "tps": 8122, "wall": 19977.0} {"step": 2476, "train_loss": 4.10250997543335, "lr": 0.0003977834517387524, "tps": 8122, "wall": 19984.9} {"step": 2477, "train_loss": 4.123254776000977, "lr": 0.00039778045345825936, "tps": 8122, "wall": 19993.1} {"step": 2478, "train_loss": 4.068857192993164, "lr": 0.0003977774531638597, "tps": 8122, "wall": 20001.1} {"step": 2479, "train_loss": 3.9939403533935547, "lr": 0.0003977744508555874, "tps": 8122, "wall": 20008.9} {"step": 2480, "train_loss": 4.109786033630371, "lr": 0.0003977714465334766, "tps": 8122, "wall": 20016.8} {"step": 2481, "train_loss": 4.079831600189209, "lr": 0.0003977684401975612, "tps": 8122, "wall": 20024.7} {"step": 2482, "train_loss": 4.021622180938721, "lr": 0.00039776543184787523, "tps": 8123, "wall": 20032.7} {"step": 2483, "train_loss": 3.9369702339172363, "lr": 0.0003977624214844529, "tps": 8123, "wall": 20040.6} {"step": 2484, "train_loss": 4.090121269226074, "lr": 0.0003977594091073282, "tps": 8123, "wall": 20048.6} {"step": 2485, "train_loss": 4.100613594055176, "lr": 0.00039775639471653537, "tps": 8123, "wall": 20056.6} {"step": 2486, "train_loss": 4.041265487670898, "lr": 0.00039775337831210835, "tps": 8123, "wall": 20064.5} {"step": 2487, "train_loss": 4.14351749420166, "lr": 0.0003977503598940816, "tps": 8123, "wall": 20072.3} {"step": 2488, "train_loss": 3.967548370361328, "lr": 0.00039774733946248904, "tps": 8123, "wall": 20080.4} {"step": 2489, "train_loss": 3.937567710876465, "lr": 0.000397744317017365, "tps": 8123, "wall": 20088.3} {"step": 2490, "train_loss": 4.031781196594238, "lr": 0.0003977412925587438, "tps": 8123, "wall": 20096.4} {"step": 2491, "train_loss": 4.008172035217285, "lr": 0.0003977382660866596, "tps": 8123, "wall": 20104.3} {"step": 2492, "train_loss": 4.044496059417725, "lr": 0.00039773523760114674, "tps": 8123, "wall": 20112.4} {"step": 2493, "train_loss": 4.075611114501953, "lr": 0.0003977322071022394, "tps": 8123, "wall": 20120.3} {"step": 2494, "train_loss": 4.006170272827148, "lr": 0.0003977291745899721, "tps": 8123, "wall": 20128.2} {"step": 2495, "train_loss": 3.9916648864746094, "lr": 0.000397726140064379, "tps": 8123, "wall": 20136.1} {"step": 2496, "train_loss": 4.019881725311279, "lr": 0.00039772310352549465, "tps": 8123, "wall": 20144.0} {"step": 2497, "train_loss": 4.080031394958496, "lr": 0.00039772006497335326, "tps": 8123, "wall": 20152.0} {"step": 2498, "train_loss": 4.03270149230957, "lr": 0.0003977170244079895, "tps": 8123, "wall": 20160.1} {"step": 2499, "train_loss": 4.057666778564453, "lr": 0.0003977139818294376, "tps": 8123, "wall": 20168.1} {"step": 2500, "train_loss": 4.002631187438965, "lr": 0.0003977109372377321, "tps": 8123, "wall": 20176.1} {"step": 2501, "train_loss": 4.088200569152832, "lr": 0.0003977078906329075, "tps": 8123, "wall": 20184.0} {"step": 2502, "train_loss": 4.0762619972229, "lr": 0.0003977048420149983, "tps": 8123, "wall": 20191.9} {"step": 2503, "train_loss": 4.076669692993164, "lr": 0.000397701791384039, "tps": 8123, "wall": 20199.8} {"step": 2504, "train_loss": 4.0855865478515625, "lr": 0.0003976987387400643, "tps": 8124, "wall": 20207.6} {"step": 2505, "train_loss": 4.093549728393555, "lr": 0.00039769568408310857, "tps": 8124, "wall": 20215.5} {"step": 2506, "train_loss": 4.080039024353027, "lr": 0.0003976926274132065, "tps": 8124, "wall": 20223.4} {"step": 2507, "train_loss": 3.9497876167297363, "lr": 0.00039768956873039287, "tps": 8124, "wall": 20231.2} {"step": 2508, "train_loss": 4.166049957275391, "lr": 0.00039768650803470205, "tps": 8124, "wall": 20239.2} {"step": 2509, "train_loss": 4.069238662719727, "lr": 0.0003976834453261689, "tps": 8124, "wall": 20247.1} {"step": 2510, "train_loss": 4.045438766479492, "lr": 0.0003976803806048281, "tps": 8124, "wall": 20255.1} {"step": 2511, "train_loss": 4.131802558898926, "lr": 0.0003976773138707143, "tps": 8124, "wall": 20263.0} {"step": 2512, "train_loss": 4.0445146560668945, "lr": 0.0003976742451238623, "tps": 8124, "wall": 20271.0} {"step": 2513, "train_loss": 3.9464526176452637, "lr": 0.00039767117436430684, "tps": 8124, "wall": 20278.8} {"step": 2514, "train_loss": 4.055555820465088, "lr": 0.0003976681015920827, "tps": 8124, "wall": 20286.9} {"step": 2515, "train_loss": 4.060767650604248, "lr": 0.00039766502680722463, "tps": 8124, "wall": 20295.0} {"step": 2516, "train_loss": 4.017880439758301, "lr": 0.00039766195000976763, "tps": 8124, "wall": 20302.9} {"step": 2517, "train_loss": 4.021117687225342, "lr": 0.0003976588711997464, "tps": 8124, "wall": 20310.9} {"step": 2518, "train_loss": 4.126641273498535, "lr": 0.00039765579037719583, "tps": 8124, "wall": 20318.8} {"step": 2519, "train_loss": 4.0223846435546875, "lr": 0.0003976527075421509, "tps": 8124, "wall": 20326.7} {"step": 2520, "train_loss": 4.059442043304443, "lr": 0.0003976496226946465, "tps": 8124, "wall": 20334.6} {"step": 2521, "train_loss": 4.068333148956299, "lr": 0.00039764653583471756, "tps": 8124, "wall": 20343.2} {"step": 2522, "train_loss": 4.09769868850708, "lr": 0.00039764344696239905, "tps": 8124, "wall": 20351.2} {"step": 2523, "train_loss": 4.098891735076904, "lr": 0.00039764035607772595, "tps": 8124, "wall": 20359.3} {"step": 2524, "train_loss": 4.073235511779785, "lr": 0.00039763726318073323, "tps": 8124, "wall": 20367.2} {"step": 2525, "train_loss": 4.056885242462158, "lr": 0.0003976341682714561, "tps": 8124, "wall": 20375.1} {"step": 2526, "train_loss": 4.1270341873168945, "lr": 0.00039763107134992945, "tps": 8124, "wall": 20383.2} {"step": 2527, "train_loss": 4.128920078277588, "lr": 0.0003976279724161883, "tps": 8124, "wall": 20391.0} {"step": 2528, "train_loss": 3.9797463417053223, "lr": 0.0003976248714702681, "tps": 8124, "wall": 20398.9} {"step": 2001, "train_loss": 4.145802021026611, "lr": 0.00039897940098692557, "tps": 29084491, "wall": 4.5} {"step": 2002, "train_loss": 4.192625999450684, "lr": 0.00039897736274350994, "tps": 14608198, "wall": 9.0} {"step": 2003, "train_loss": 4.125477313995361, "lr": 0.0003989753224726292, "tps": 9987597, "wall": 13.1} {"step": 2004, "train_loss": 4.281839847564697, "lr": 0.00039897328017430623, "tps": 7539520, "wall": 17.4} {"step": 2005, "train_loss": 4.130866527557373, "lr": 0.0003989712358485643, "tps": 6038214, "wall": 21.8} {"step": 2006, "train_loss": 4.207844257354736, "lr": 0.00039896918949542645, "tps": 5025138, "wall": 26.2} {"step": 2007, "train_loss": 4.161769866943359, "lr": 0.00039896714111491605, "tps": 4220691, "wall": 31.2} {"step": 2008, "train_loss": 4.275393962860107, "lr": 0.00039896509070705606, "tps": 3687034, "wall": 35.7} {"step": 2009, "train_loss": 4.231445789337158, "lr": 0.00039896303827186995, "tps": 3272225, "wall": 40.3} {"step": 2010, "train_loss": 4.2308855056762695, "lr": 0.0003989609838093809, "tps": 2940085, "wall": 44.8} {"step": 2011, "train_loss": 4.142087459564209, "lr": 0.00039895892731961203, "tps": 2665488, "wall": 49.5} {"step": 2012, "train_loss": 4.2411370277404785, "lr": 0.0003989568688025868, "tps": 2432874, "wall": 54.2} {"step": 2013, "train_loss": 4.1261467933654785, "lr": 0.00039895480825832846, "tps": 2205761, "wall": 59.8} {"step": 2014, "train_loss": 4.156797409057617, "lr": 0.0003989527456868604, "tps": 2032158, "wall": 65.0} {"step": 2015, "train_loss": 4.307425022125244, "lr": 0.00039895068108820593, "tps": 1854992, "wall": 71.2} {"step": 2016, "train_loss": 4.173663139343262, "lr": 0.00039894861446238846, "tps": 1715726, "wall": 77.0} {"step": 2017, "train_loss": 4.13433313369751, "lr": 0.0003989465458094314, "tps": 1606353, "wall": 82.3} {"step": 2018, "train_loss": 4.249319553375244, "lr": 0.0003989444751293582, "tps": 1509147, "wall": 87.7} {"step": 2019, "train_loss": 4.21440315246582, "lr": 0.00039894240242219236, "tps": 1422262, "wall": 93.1} {"step": 2020, "train_loss": 4.211029529571533, "lr": 0.0003989403276879572, "tps": 1343770, "wall": 98.6} {"step": 2021, "train_loss": 4.27194881439209, "lr": 0.00039893825092667635, "tps": 1274162, "wall": 104.0} {"step": 2022, "train_loss": 4.238604545593262, "lr": 0.0003989361721383734, "tps": 1212571, "wall": 109.3} {"step": 2023, "train_loss": 4.19783353805542, "lr": 0.00039893409132307176, "tps": 1156240, "wall": 114.7} {"step": 2024, "train_loss": 4.1190009117126465, "lr": 0.000398932008480795, "tps": 1104351, "wall": 120.2} {"step": 2025, "train_loss": 4.178001403808594, "lr": 0.00039892992361156685, "tps": 1058195, "wall": 125.5} {"step": 2026, "train_loss": 4.124128818511963, "lr": 0.0003989278367154108, "tps": 1015753, "wall": 130.8} {"step": 2027, "train_loss": 4.202582836151123, "lr": 0.0003989257477923505, "tps": 976847, "wall": 136.1} {"step": 2028, "train_loss": 4.278439998626709, "lr": 0.00039892365684240976, "tps": 940826, "wall": 141.3} {"step": 2029, "train_loss": 4.179559707641602, "lr": 0.0003989215638656121, "tps": 907081, "wall": 146.7} {"step": 2030, "train_loss": 4.213678359985352, "lr": 0.0003989194688619812, "tps": 875562, "wall": 152.0} {"step": 2031, "train_loss": 4.15058708190918, "lr": 0.0003989173718315411, "tps": 846074, "wall": 157.4} {"step": 2032, "train_loss": 4.200195789337158, "lr": 0.0003989152727743151, "tps": 818189, "wall": 162.8} {"step": 2033, "train_loss": 4.208986759185791, "lr": 0.0003989131716903273, "tps": 792078, "wall": 168.3} {"step": 2034, "train_loss": 4.05858039855957, "lr": 0.0003989110685796014, "tps": 767285, "wall": 173.8} {"step": 2035, "train_loss": 4.227958679199219, "lr": 0.00039890896344216124, "tps": 743956, "wall": 179.4} {"step": 2036, "train_loss": 4.194838523864746, "lr": 0.0003989068562780307, "tps": 722216, "wall": 184.8} {"step": 2037, "train_loss": 4.214662075042725, "lr": 0.00039890474708723355, "tps": 701842, "wall": 190.3} {"step": 2038, "train_loss": 4.166149139404297, "lr": 0.0003989026358697938, "tps": 682013, "wall": 195.9} {"step": 2039, "train_loss": 4.095802307128906, "lr": 0.00039890052262573527, "tps": 663292, "wall": 201.6} {"step": 2040, "train_loss": 4.180076599121094, "lr": 0.000398898407355082, "tps": 645118, "wall": 207.3} {"step": 2041, "train_loss": 4.113349914550781, "lr": 0.00039889629005785787, "tps": 627608, "wall": 213.2} {"step": 2042, "train_loss": 4.239883899688721, "lr": 0.0003988941707340868, "tps": 610628, "wall": 219.3} {"step": 2043, "train_loss": 4.074393272399902, "lr": 0.000398892049383793, "tps": 594470, "wall": 225.3} {"step": 2044, "train_loss": 4.24578857421875, "lr": 0.0003988899260070004, "tps": 578916, "wall": 231.5} {"step": 2045, "train_loss": 4.07546329498291, "lr": 0.00039888780060373294, "tps": 563629, "wall": 237.9} {"step": 2046, "train_loss": 4.227598667144775, "lr": 0.0003988856731740148, "tps": 548871, "wall": 244.4} {"step": 2047, "train_loss": 4.045393466949463, "lr": 0.00039888354371787015, "tps": 534781, "wall": 251.0} {"step": 2048, "train_loss": 4.236889362335205, "lr": 0.00039888141223532304, "tps": 521072, "wall": 257.7} {"step": 2049, "train_loss": 4.244922637939453, "lr": 0.00039887927872639764, "tps": 507740, "wall": 264.6} {"step": 2050, "train_loss": 4.153323650360107, "lr": 0.000398877143191118, "tps": 495013, "wall": 271.5} {"step": 2051, "train_loss": 4.113892078399658, "lr": 0.00039887500562950845, "tps": 482658, "wall": 278.6} {"step": 2052, "train_loss": 4.207523345947266, "lr": 0.00039887286604159313, "tps": 470866, "wall": 285.7} {"step": 2053, "train_loss": 4.253358840942383, "lr": 0.00039887072442739633, "tps": 459454, "wall": 293.0} {"step": 2054, "train_loss": 4.183430194854736, "lr": 0.0003988685807869422, "tps": 448352, "wall": 300.4} {"step": 2055, "train_loss": 4.147868633270264, "lr": 0.0003988664351202553, "tps": 437728, "wall": 307.8} {"step": 2056, "train_loss": 4.12426233291626, "lr": 0.0003988642874273596, "tps": 427445, "wall": 315.4} {"step": 2057, "train_loss": 4.187397003173828, "lr": 0.00039886213770827967, "tps": 417582, "wall": 323.0} {"step": 2058, "train_loss": 4.190308094024658, "lr": 0.00039885998596303967, "tps": 407972, "wall": 330.8} {"step": 2059, "train_loss": 4.17612361907959, "lr": 0.0003988578321916641, "tps": 398847, "wall": 338.5} {"step": 2060, "train_loss": 4.288812160491943, "lr": 0.00039885567639417736, "tps": 389937, "wall": 346.4} {"step": 2061, "train_loss": 4.224678039550781, "lr": 0.00039885351857060384, "tps": 381329, "wall": 354.4} {"step": 2062, "train_loss": 4.188549995422363, "lr": 0.000398851358720968, "tps": 372967, "wall": 362.5} {"step": 2063, "train_loss": 4.25001335144043, "lr": 0.00039884919684529424, "tps": 365122, "wall": 370.5} {"step": 2064, "train_loss": 4.152125835418701, "lr": 0.0003988470329436072, "tps": 357668, "wall": 378.4} {"step": 2065, "train_loss": 4.134777069091797, "lr": 0.0003988448670159312, "tps": 350428, "wall": 386.4} {"step": 2066, "train_loss": 4.2266035079956055, "lr": 0.00039884269906229086, "tps": 343509, "wall": 394.4} {"step": 2067, "train_loss": 4.2569074630737305, "lr": 0.0003988405290827108, "tps": 336852, "wall": 402.3} {"step": 2068, "train_loss": 4.134617805480957, "lr": 0.00039883835707721555, "tps": 330368, "wall": 410.4} {"step": 2069, "train_loss": 4.119653701782227, "lr": 0.0003988361830458297, "tps": 324148, "wall": 418.5} {"step": 2070, "train_loss": 4.268721580505371, "lr": 0.00039883400698857794, "tps": 318248, "wall": 426.5} {"step": 2071, "train_loss": 4.199428558349609, "lr": 0.00039883182890548477, "tps": 311607, "wall": 435.8} {"step": 2072, "train_loss": 4.14913272857666, "lr": 0.000398829648796575, "tps": 306216, "wall": 443.7} {"step": 2073, "train_loss": 4.186805248260498, "lr": 0.0003988274666618734, "tps": 300942, "wall": 451.7} {"step": 2074, "train_loss": 4.092137336730957, "lr": 0.0003988252825014045, "tps": 295821, "wall": 459.7} {"step": 2075, "train_loss": 4.2058234214782715, "lr": 0.00039882309631519315, "tps": 290970, "wall": 467.6} {"step": 2076, "train_loss": 4.237617492675781, "lr": 0.00039882090810326406, "tps": 286302, "wall": 475.4} {"step": 2077, "train_loss": 4.191257953643799, "lr": 0.0003988187178656421, "tps": 280830, "wall": 484.9} {"step": 2078, "train_loss": 4.25652551651001, "lr": 0.000398816525602352, "tps": 275921, "wall": 493.8} {"step": 2079, "train_loss": 4.304065704345703, "lr": 0.00039881433131341864, "tps": 271755, "wall": 501.6} {"step": 2080, "train_loss": 4.097171783447266, "lr": 0.0003988121349988668, "tps": 267701, "wall": 509.4} {"step": 2081, "train_loss": 4.1681694984436035, "lr": 0.0003988099366587214, "tps": 263778, "wall": 517.3} {"step": 2082, "train_loss": 4.154562950134277, "lr": 0.00039880773629300746, "tps": 259928, "wall": 525.2} {"step": 2083, "train_loss": 4.177040100097656, "lr": 0.0003988055339017498, "tps": 256288, "wall": 532.9} {"step": 2084, "train_loss": 4.172863006591797, "lr": 0.00039880332948497336, "tps": 252684, "wall": 540.8} {"step": 2085, "train_loss": 4.219720840454102, "lr": 0.00039880112304270315, "tps": 249289, "wall": 548.4} {"step": 2086, "train_loss": 4.183227062225342, "lr": 0.00039879891457496406, "tps": 245937, "wall": 556.1} {"step": 2087, "train_loss": 4.143647193908691, "lr": 0.00039879670408178125, "tps": 242677, "wall": 563.9} {"step": 2088, "train_loss": 4.184206962585449, "lr": 0.0003987944915631797, "tps": 239537, "wall": 571.5} {"step": 2089, "train_loss": 4.211633682250977, "lr": 0.00039879227701918453, "tps": 236484, "wall": 579.2} {"step": 2090, "train_loss": 4.148477554321289, "lr": 0.0003987900604498207, "tps": 233520, "wall": 586.8} {"step": 2091, "train_loss": 4.114526748657227, "lr": 0.00039878784185511345, "tps": 230598, "wall": 594.5} {"step": 2092, "train_loss": 4.187132835388184, "lr": 0.0003987856212350878, "tps": 227722, "wall": 602.3} {"step": 2093, "train_loss": 4.177909851074219, "lr": 0.000398783398589769, "tps": 224948, "wall": 610.1} {"step": 2094, "train_loss": 4.210122108459473, "lr": 0.0003987811739191822, "tps": 222262, "wall": 617.7} {"step": 2095, "train_loss": 4.140332221984863, "lr": 0.00039877894722335257, "tps": 219632, "wall": 625.4} {"step": 2096, "train_loss": 4.13720703125, "lr": 0.00039877671850230533, "tps": 217029, "wall": 633.2} {"step": 2097, "train_loss": 4.12257719039917, "lr": 0.00039877448775606575, "tps": 214520, "wall": 640.9} {"step": 2098, "train_loss": 4.210001468658447, "lr": 0.00039877225498465913, "tps": 212095, "wall": 648.6} {"step": 2099, "train_loss": 4.215959072113037, "lr": 0.00039877002018811074, "tps": 209691, "wall": 656.3} {"step": 2100, "train_loss": 4.1891093254089355, "lr": 0.0003987677833664459, "tps": 207314, "wall": 664.2} {"step": 2101, "train_loss": 4.047127723693848, "lr": 0.00039876554451968984, "tps": 205061, "wall": 671.8} {"step": 2102, "train_loss": 4.13638973236084, "lr": 0.00039876330364786814, "tps": 202817, "wall": 679.5} {"step": 2103, "train_loss": 4.098830223083496, "lr": 0.000398761060751006, "tps": 200620, "wall": 687.3} {"step": 2104, "train_loss": 4.10334587097168, "lr": 0.00039875881582912895, "tps": 198480, "wall": 695.0} {"step": 2105, "train_loss": 4.160007476806641, "lr": 0.00039875656888226226, "tps": 196386, "wall": 702.8} {"step": 2106, "train_loss": 4.228237628936768, "lr": 0.0003987543199104316, "tps": 194342, "wall": 710.5} {"step": 2107, "train_loss": 4.1244354248046875, "lr": 0.0003987520689136623, "tps": 192282, "wall": 718.5} {"step": 2108, "train_loss": 4.212455749511719, "lr": 0.0003987498158919799, "tps": 190333, "wall": 726.2} {"step": 2109, "train_loss": 4.142996788024902, "lr": 0.00039874756084540985, "tps": 188401, "wall": 734.0} {"step": 2110, "train_loss": 4.168865203857422, "lr": 0.0003987453037739778, "tps": 186529, "wall": 741.7} {"step": 2111, "train_loss": 4.1185712814331055, "lr": 0.0003987430446777093, "tps": 184677, "wall": 749.5} {"step": 2112, "train_loss": 4.1562910079956055, "lr": 0.0003987407835566299, "tps": 182884, "wall": 757.2} {"step": 2113, "train_loss": 4.183867931365967, "lr": 0.0003987385204107652, "tps": 181086, "wall": 765.1} {"step": 2114, "train_loss": 4.1178202629089355, "lr": 0.00039873625524014094, "tps": 179336, "wall": 772.9} {"step": 2115, "train_loss": 4.155092239379883, "lr": 0.0003987339880447827, "tps": 177584, "wall": 780.9} {"step": 2116, "train_loss": 4.1310224533081055, "lr": 0.00039873171882471616, "tps": 175932, "wall": 788.6} {"step": 2117, "train_loss": 4.180204391479492, "lr": 0.000398729447579967, "tps": 174294, "wall": 796.4} {"step": 2118, "train_loss": 4.122966766357422, "lr": 0.00039872717431056103, "tps": 172685, "wall": 804.2} {"step": 2119, "train_loss": 4.222507476806641, "lr": 0.00039872489901652397, "tps": 171101, "wall": 812.0} {"step": 2120, "train_loss": 4.223474979400635, "lr": 0.00039872262169788155, "tps": 169563, "wall": 819.8} {"step": 2121, "train_loss": 4.1579790115356445, "lr": 0.0003987203423546596, "tps": 168039, "wall": 827.6} {"step": 2122, "train_loss": 4.189184188842773, "lr": 0.000398718060986884, "tps": 166531, "wall": 835.5} {"step": 2123, "train_loss": 4.159430027008057, "lr": 0.0003987157775945805, "tps": 165032, "wall": 843.5} {"step": 2124, "train_loss": 4.158581733703613, "lr": 0.000398713492177775, "tps": 163592, "wall": 851.3} {"step": 2125, "train_loss": 4.16079568862915, "lr": 0.00039871120473649344, "tps": 162168, "wall": 859.2} {"step": 2126, "train_loss": 4.134448528289795, "lr": 0.00039870891527076164, "tps": 160775, "wall": 867.0} {"step": 2127, "train_loss": 4.188441276550293, "lr": 0.0003987066237806056, "tps": 159406, "wall": 874.9} {"step": 2128, "train_loss": 4.136590480804443, "lr": 0.0003987043302660512, "tps": 158076, "wall": 882.7} {"step": 2129, "train_loss": 4.165887355804443, "lr": 0.0003987020347271245, "tps": 156751, "wall": 890.5} {"step": 2130, "train_loss": 4.174256324768066, "lr": 0.0003986997371638515, "tps": 155440, "wall": 898.5} {"step": 2131, "train_loss": 4.1447343826293945, "lr": 0.0003986974375762582, "tps": 154167, "wall": 906.3} {"step": 2132, "train_loss": 4.257042407989502, "lr": 0.0003986951359643707, "tps": 152921, "wall": 914.1} {"step": 2133, "train_loss": 4.104767322540283, "lr": 0.000398692832328215, "tps": 151671, "wall": 922.1} {"step": 2134, "train_loss": 4.040945529937744, "lr": 0.00039869052666781726, "tps": 150477, "wall": 929.8} {"step": 2135, "train_loss": 4.05164909362793, "lr": 0.00039868821898320355, "tps": 149298, "wall": 937.6} {"step": 2136, "train_loss": 4.3260698318481445, "lr": 0.0003986859092744, "tps": 148120, "wall": 945.5} {"step": 2137, "train_loss": 4.197805881500244, "lr": 0.00039868359754143283, "tps": 146974, "wall": 953.3} {"step": 2138, "train_loss": 4.081225872039795, "lr": 0.0003986812837843282, "tps": 145821, "wall": 961.3} {"step": 2139, "train_loss": 4.269128799438477, "lr": 0.0003986789680031123, "tps": 144707, "wall": 969.2} {"step": 2140, "train_loss": 4.066225051879883, "lr": 0.0003986766501978114, "tps": 143610, "wall": 977.0} {"step": 2141, "train_loss": 4.178093433380127, "lr": 0.0003986743303684517, "tps": 142515, "wall": 985.0} {"step": 2142, "train_loss": 4.150821208953857, "lr": 0.00039867200851505957, "tps": 141456, "wall": 992.8} {"step": 2143, "train_loss": 4.255518436431885, "lr": 0.0003986696846376612, "tps": 140402, "wall": 1000.8} {"step": 2144, "train_loss": 4.263809680938721, "lr": 0.0003986673587362831, "tps": 139371, "wall": 1008.6} {"step": 2145, "train_loss": 4.176678657531738, "lr": 0.00039866503081095137, "tps": 138342, "wall": 1016.6} {"step": 2146, "train_loss": 4.085152626037598, "lr": 0.00039866270086169256, "tps": 137335, "wall": 1024.5} {"step": 2147, "train_loss": 4.097204208374023, "lr": 0.00039866036888853306, "tps": 136361, "wall": 1032.3} {"step": 2148, "train_loss": 4.155244827270508, "lr": 0.0003986580348914991, "tps": 135394, "wall": 1040.2} {"step": 2149, "train_loss": 4.135390281677246, "lr": 0.0003986556988706174, "tps": 134444, "wall": 1048.0} {"step": 2150, "train_loss": 4.008167266845703, "lr": 0.0003986533608259142, "tps": 133505, "wall": 1055.9} {"step": 2151, "train_loss": 4.128597259521484, "lr": 0.00039865102075741605, "tps": 132576, "wall": 1063.8} {"step": 2152, "train_loss": 4.153010368347168, "lr": 0.0003986486786651495, "tps": 131665, "wall": 1071.6} {"step": 2153, "train_loss": 4.1951189041137695, "lr": 0.00039864633454914105, "tps": 130751, "wall": 1079.6} {"step": 2154, "train_loss": 4.136593341827393, "lr": 0.00039864398840941726, "tps": 129860, "wall": 1087.5} {"step": 2155, "train_loss": 4.067377090454102, "lr": 0.0003986416402460047, "tps": 129000, "wall": 1095.3} {"step": 2156, "train_loss": 4.136727333068848, "lr": 0.00039863929005892995, "tps": 128141, "wall": 1103.2} {"step": 2157, "train_loss": 4.113605499267578, "lr": 0.0003986369378482198, "tps": 127283, "wall": 1111.1} {"step": 2158, "train_loss": 4.210951805114746, "lr": 0.00039863458361390057, "tps": 126449, "wall": 1119.0} {"step": 2159, "train_loss": 4.094762802124023, "lr": 0.0003986322273559992, "tps": 125618, "wall": 1126.9} {"step": 2160, "train_loss": 4.146851062774658, "lr": 0.0003986298690745423, "tps": 124797, "wall": 1134.8} {"step": 2161, "train_loss": 4.297077655792236, "lr": 0.0003986275087695565, "tps": 123987, "wall": 1142.8} {"step": 2162, "train_loss": 4.055533409118652, "lr": 0.0003986251464410687, "tps": 123205, "wall": 1150.6} {"step": 2163, "train_loss": 4.161843299865723, "lr": 0.00039862278208910556, "tps": 122421, "wall": 1158.5} {"step": 2164, "train_loss": 4.055643081665039, "lr": 0.00039862041571369386, "tps": 121659, "wall": 1166.2} {"step": 2165, "train_loss": 4.117963790893555, "lr": 0.0003986180473148604, "tps": 120894, "wall": 1174.2} {"step": 2166, "train_loss": 4.276895523071289, "lr": 0.0003986156768926321, "tps": 120147, "wall": 1182.0} {"step": 2167, "train_loss": 4.040958404541016, "lr": 0.0003986133044470358, "tps": 119413, "wall": 1189.8} {"step": 2168, "train_loss": 4.088466167449951, "lr": 0.00039861092997809825, "tps": 118673, "wall": 1197.8} {"step": 2169, "train_loss": 4.108015537261963, "lr": 0.00039860855348584635, "tps": 117948, "wall": 1205.7} {"step": 2170, "train_loss": 4.204493045806885, "lr": 0.0003986061749703072, "tps": 117241, "wall": 1213.6} {"step": 2171, "train_loss": 4.1450324058532715, "lr": 0.0003986037944315076, "tps": 116537, "wall": 1221.4} {"step": 2172, "train_loss": 4.209976673126221, "lr": 0.00039860141186947456, "tps": 115839, "wall": 1229.4} {"step": 2173, "train_loss": 4.006438255310059, "lr": 0.00039859902728423506, "tps": 115163, "wall": 1237.2} {"step": 2174, "train_loss": 4.105752468109131, "lr": 0.00039859664067581614, "tps": 114485, "wall": 1245.1} {"step": 2175, "train_loss": 4.227029323577881, "lr": 0.0003985942520442448, "tps": 113830, "wall": 1252.8} {"step": 2176, "train_loss": 4.125975608825684, "lr": 0.0003985918613895481, "tps": 113162, "wall": 1260.8} {"step": 2177, "train_loss": 4.143192291259766, "lr": 0.00039858946871175314, "tps": 112508, "wall": 1268.7} {"step": 2178, "train_loss": 4.130281925201416, "lr": 0.00039858707401088704, "tps": 111868, "wall": 1276.5} {"step": 2179, "train_loss": 4.144658088684082, "lr": 0.00039858467728697683, "tps": 111233, "wall": 1284.4} {"step": 2180, "train_loss": 4.02517557144165, "lr": 0.00039858227854004983, "tps": 110618, "wall": 1292.1} {"step": 2181, "train_loss": 4.202719688415527, "lr": 0.00039857987777013303, "tps": 109993, "wall": 1300.1} {"step": 2182, "train_loss": 4.1064581871032715, "lr": 0.0003985774749772537, "tps": 109379, "wall": 1308.0} {"step": 2183, "train_loss": 4.178147315979004, "lr": 0.0003985750701614392, "tps": 108776, "wall": 1315.8} {"step": 2184, "train_loss": 4.128682613372803, "lr": 0.00039857266332271656, "tps": 108173, "wall": 1323.8} {"step": 2185, "train_loss": 4.1747145652771, "lr": 0.00039857025446111315, "tps": 107582, "wall": 1331.6} {"step": 2186, "train_loss": 4.244251251220703, "lr": 0.0003985678435766562, "tps": 107004, "wall": 1339.5} {"step": 2187, "train_loss": 4.182286262512207, "lr": 0.0003985654306693731, "tps": 106427, "wall": 1347.3} {"step": 2188, "train_loss": 4.181619167327881, "lr": 0.0003985630157392911, "tps": 105854, "wall": 1355.2} {"step": 2189, "train_loss": 4.183427333831787, "lr": 0.00039856059878643765, "tps": 105290, "wall": 1363.1} {"step": 2190, "train_loss": 4.014970779418945, "lr": 0.0003985581798108401, "tps": 104738, "wall": 1370.9} {"step": 2191, "train_loss": 4.288435935974121, "lr": 0.00039855575881252576, "tps": 104173, "wall": 1379.0} {"step": 2192, "train_loss": 4.028695106506348, "lr": 0.0003985533357915221, "tps": 103624, "wall": 1386.9} {"step": 2193, "train_loss": 3.9978737831115723, "lr": 0.00039855091074785664, "tps": 103090, "wall": 1394.8} {"step": 2194, "train_loss": 4.118136405944824, "lr": 0.0003985484836815568, "tps": 102558, "wall": 1402.6} {"step": 2195, "train_loss": 4.0816330909729, "lr": 0.00039854605459265006, "tps": 102035, "wall": 1410.5} {"step": 2196, "train_loss": 4.170027732849121, "lr": 0.000398543623481164, "tps": 101518, "wall": 1418.3} {"step": 2197, "train_loss": 4.049556255340576, "lr": 0.0003985411903471261, "tps": 100999, "wall": 1426.2} {"step": 2198, "train_loss": 4.145646572113037, "lr": 0.0003985387551905639, "tps": 100489, "wall": 1434.1} {"step": 2199, "train_loss": 4.209890365600586, "lr": 0.00039853631801150505, "tps": 99976, "wall": 1442.1} {"step": 2200, "train_loss": 4.194787502288818, "lr": 0.00039853387880997717, "tps": 99482, "wall": 1449.9} {"step": 2201, "train_loss": 4.2133331298828125, "lr": 0.0003985314375860078, "tps": 98993, "wall": 1457.8} {"step": 2202, "train_loss": 4.177229404449463, "lr": 0.0003985289943396246, "tps": 98506, "wall": 1465.7} {"step": 2203, "train_loss": 4.141175270080566, "lr": 0.00039852654907085536, "tps": 98024, "wall": 1473.5} {"step": 2204, "train_loss": 4.027212142944336, "lr": 0.0003985241017797277, "tps": 97548, "wall": 1481.4} {"step": 2205, "train_loss": 4.086610794067383, "lr": 0.0003985216524662694, "tps": 97074, "wall": 1489.3} {"step": 2206, "train_loss": 4.146800518035889, "lr": 0.0003985192011305081, "tps": 96601, "wall": 1497.3} {"step": 2207, "train_loss": 4.104382038116455, "lr": 0.0003985167477724717, "tps": 96141, "wall": 1505.1} {"step": 2208, "train_loss": 4.073602676391602, "lr": 0.00039851429239218787, "tps": 95690, "wall": 1512.9} {"step": 2209, "train_loss": 4.1510396003723145, "lr": 0.00039851183498968443, "tps": 95236, "wall": 1520.8} {"step": 2210, "train_loss": 4.030197620391846, "lr": 0.00039850937556498933, "tps": 94787, "wall": 1528.7} {"step": 2211, "train_loss": 4.095216751098633, "lr": 0.0003985069141181304, "tps": 94343, "wall": 1536.6} {"step": 2212, "train_loss": 4.062718391418457, "lr": 0.00039850445064913546, "tps": 93908, "wall": 1544.4} {"step": 2213, "train_loss": 4.113574981689453, "lr": 0.0003985019851580324, "tps": 93473, "wall": 1552.3} {"step": 2214, "train_loss": 4.066205024719238, "lr": 0.00039849951764484926, "tps": 93045, "wall": 1560.1} {"step": 2215, "train_loss": 4.188573837280273, "lr": 0.0003984970481096139, "tps": 92618, "wall": 1568.0} {"step": 2216, "train_loss": 4.139085292816162, "lr": 0.0003984945765523543, "tps": 92197, "wall": 1575.9} {"step": 2217, "train_loss": 4.11831521987915, "lr": 0.0003984921029730985, "tps": 91787, "wall": 1583.6} {"step": 2218, "train_loss": 4.1297502517700195, "lr": 0.00039848962737187453, "tps": 91374, "wall": 1591.5} {"step": 2219, "train_loss": 4.102137565612793, "lr": 0.0003984871497487104, "tps": 90970, "wall": 1599.3} {"step": 2220, "train_loss": 4.176304340362549, "lr": 0.0003984846701036341, "tps": 90567, "wall": 1607.2} {"step": 2221, "train_loss": 4.126327991485596, "lr": 0.0003984821884366739, "tps": 90168, "wall": 1615.0} {"step": 2222, "train_loss": 4.2008490562438965, "lr": 0.00039847970474785776, "tps": 89770, "wall": 1622.9} {"step": 2223, "train_loss": 4.153561592102051, "lr": 0.0003984772190372139, "tps": 89374, "wall": 1630.8} {"step": 2224, "train_loss": 4.2051472663879395, "lr": 0.00039847473130477044, "tps": 88989, "wall": 1638.6} {"step": 2225, "train_loss": 4.207070827484131, "lr": 0.0003984722415505556, "tps": 88610, "wall": 1646.3} {"step": 2226, "train_loss": 4.119147300720215, "lr": 0.0003984697497745974, "tps": 88229, "wall": 1654.2} {"step": 2227, "train_loss": 4.035331726074219, "lr": 0.0003984672559769244, "tps": 87853, "wall": 1662.0} {"step": 2228, "train_loss": 4.144516944885254, "lr": 0.0003984647601575646, "tps": 87482, "wall": 1669.8} {"step": 2229, "train_loss": 4.19715690612793, "lr": 0.00039846226231654634, "tps": 87103, "wall": 1677.8} {"step": 2230, "train_loss": 4.0552287101745605, "lr": 0.0003984597624538979, "tps": 86735, "wall": 1685.7} {"step": 2231, "train_loss": 4.111765384674072, "lr": 0.00039845726056964763, "tps": 86374, "wall": 1693.5} {"step": 2232, "train_loss": 4.057106018066406, "lr": 0.0003984547566638239, "tps": 86010, "wall": 1701.4} {"step": 2233, "train_loss": 4.104503631591797, "lr": 0.00039845225073645497, "tps": 85658, "wall": 1709.2} {"step": 2234, "train_loss": 4.198787689208984, "lr": 0.0003984497427875693, "tps": 85305, "wall": 1717.0} {"step": 2235, "train_loss": 4.075185775756836, "lr": 0.00039844723281719533, "tps": 84957, "wall": 1724.9} {"step": 2236, "train_loss": 4.104541301727295, "lr": 0.00039844472082536145, "tps": 84610, "wall": 1732.7} {"step": 2237, "train_loss": 4.1716203689575195, "lr": 0.00039844220681209603, "tps": 84260, "wall": 1740.7} {"step": 2238, "train_loss": 4.187696933746338, "lr": 0.00039843969077742777, "tps": 83919, "wall": 1748.5} {"step": 2239, "train_loss": 4.07736873626709, "lr": 0.00039843717272138496, "tps": 83583, "wall": 1756.3} {"step": 2240, "train_loss": 4.123912334442139, "lr": 0.0003984346526439962, "tps": 83250, "wall": 1764.2} {"step": 2241, "train_loss": 4.089344501495361, "lr": 0.00039843213054529007, "tps": 82920, "wall": 1772.0} {"step": 2242, "train_loss": 4.117767810821533, "lr": 0.00039842960642529513, "tps": 82589, "wall": 1779.9} {"step": 2243, "train_loss": 4.155259609222412, "lr": 0.0003984270802840399, "tps": 82267, "wall": 1787.6} {"step": 2244, "train_loss": 4.085402011871338, "lr": 0.00039842455212155315, "tps": 81947, "wall": 1795.4} {"step": 2245, "train_loss": 4.155410289764404, "lr": 0.0003984220219378633, "tps": 81622, "wall": 1803.3} {"step": 2246, "train_loss": 4.111049175262451, "lr": 0.00039841948973299917, "tps": 81303, "wall": 1811.2} {"step": 2247, "train_loss": 4.147103786468506, "lr": 0.0003984169555069894, "tps": 80993, "wall": 1819.0} {"step": 2248, "train_loss": 4.0974578857421875, "lr": 0.00039841441925986276, "tps": 80682, "wall": 1826.8} {"step": 2249, "train_loss": 4.170638084411621, "lr": 0.00039841188099164784, "tps": 80373, "wall": 1834.6} {"step": 2250, "train_loss": 4.142326354980469, "lr": 0.0003984093407023736, "tps": 80064, "wall": 1842.5} {"step": 2251, "train_loss": 4.061264991760254, "lr": 0.0003984067983920686, "tps": 79760, "wall": 1850.4} {"step": 2252, "train_loss": 4.042818069458008, "lr": 0.0003984042540607618, "tps": 79455, "wall": 1858.3} {"step": 2253, "train_loss": 4.090697765350342, "lr": 0.00039840170770848193, "tps": 79155, "wall": 1866.2} {"step": 2254, "train_loss": 4.202269554138184, "lr": 0.0003983991593352579, "tps": 78863, "wall": 1873.9} {"step": 2255, "train_loss": 4.172260284423828, "lr": 0.0003983966089411185, "tps": 78567, "wall": 1881.8} {"step": 2256, "train_loss": 4.1606125831604, "lr": 0.0003983940565260926, "tps": 78272, "wall": 1889.7} {"step": 2257, "train_loss": 4.019503593444824, "lr": 0.00039839150209020925, "tps": 77987, "wall": 1897.5} {"step": 2258, "train_loss": 4.149927139282227, "lr": 0.0003983889456334973, "tps": 77703, "wall": 1905.3} {"step": 2259, "train_loss": 4.184685230255127, "lr": 0.00039838638715598574, "tps": 77417, "wall": 1913.2} {"step": 2260, "train_loss": 3.9965553283691406, "lr": 0.00039838382665770354, "tps": 77134, "wall": 1921.0} {"step": 2261, "train_loss": 4.064606189727783, "lr": 0.0003983812641386797, "tps": 76858, "wall": 1928.8} {"step": 2262, "train_loss": 4.169511318206787, "lr": 0.0003983786995989432, "tps": 76580, "wall": 1936.6} {"step": 2263, "train_loss": 4.200756072998047, "lr": 0.00039837613303852316, "tps": 76308, "wall": 1944.4} {"step": 2264, "train_loss": 4.163677215576172, "lr": 0.0003983735644574487, "tps": 76035, "wall": 1952.2} {"step": 2265, "train_loss": 3.962285280227661, "lr": 0.00039837099385574883, "tps": 75767, "wall": 1960.0} {"step": 2266, "train_loss": 4.05844783782959, "lr": 0.00039836842123345265, "tps": 75498, "wall": 1967.9} {"step": 2267, "train_loss": 4.118271827697754, "lr": 0.0003983658465905893, "tps": 75232, "wall": 1975.7} {"step": 2268, "train_loss": 4.139843463897705, "lr": 0.00039836326992718807, "tps": 74964, "wall": 1983.6} {"step": 2269, "train_loss": 4.066067695617676, "lr": 0.00039836069124327806, "tps": 74702, "wall": 1991.4} {"step": 2270, "train_loss": 4.116683006286621, "lr": 0.0003983581105388885, "tps": 74443, "wall": 1999.3} {"step": 2271, "train_loss": 4.115011692047119, "lr": 0.0003983555278140486, "tps": 74189, "wall": 2007.0} {"step": 2272, "train_loss": 4.118719577789307, "lr": 0.0003983529430687876, "tps": 73932, "wall": 2014.8} {"step": 2273, "train_loss": 4.0402936935424805, "lr": 0.00039835035630313484, "tps": 73682, "wall": 2022.6} {"step": 2274, "train_loss": 4.195669651031494, "lr": 0.00039834776751711964, "tps": 73430, "wall": 2030.4} {"step": 2275, "train_loss": 4.076787948608398, "lr": 0.00039834517671077116, "tps": 73179, "wall": 2038.3} {"step": 2276, "train_loss": 4.100205898284912, "lr": 0.00039834258388411894, "tps": 72928, "wall": 2046.2} {"step": 2277, "train_loss": 4.143035411834717, "lr": 0.0003983399890371923, "tps": 72685, "wall": 2053.9} {"step": 2278, "train_loss": 4.115997791290283, "lr": 0.0003983373921700206, "tps": 72444, "wall": 2061.7} {"step": 2279, "train_loss": 4.161862373352051, "lr": 0.0003983347932826333, "tps": 72204, "wall": 2069.4} {"step": 2280, "train_loss": 4.223713397979736, "lr": 0.0003983321923750598, "tps": 71964, "wall": 2077.2} {"step": 2281, "train_loss": 4.072429656982422, "lr": 0.00039832958944732954, "tps": 71725, "wall": 2085.1} {"step": 2282, "train_loss": 4.099658012390137, "lr": 0.0003983269844994721, "tps": 71487, "wall": 2092.9} {"step": 2283, "train_loss": 4.046543121337891, "lr": 0.0003983243775315169, "tps": 71250, "wall": 2100.8} {"step": 2284, "train_loss": 4.14891242980957, "lr": 0.0003983217685434935, "tps": 71018, "wall": 2108.6} {"step": 2285, "train_loss": 4.142426490783691, "lr": 0.0003983191575354315, "tps": 70787, "wall": 2116.4} {"step": 2286, "train_loss": 4.139308452606201, "lr": 0.0003983165445073604, "tps": 70556, "wall": 2124.3} {"step": 2287, "train_loss": 4.139186859130859, "lr": 0.00039831392945930983, "tps": 70326, "wall": 2132.1} {"step": 2288, "train_loss": 4.090997219085693, "lr": 0.0003983113123913094, "tps": 70101, "wall": 2139.9} {"step": 2289, "train_loss": 4.083323001861572, "lr": 0.0003983086933033888, "tps": 69876, "wall": 2147.8} {"step": 2290, "train_loss": 4.137155055999756, "lr": 0.0003983060721955777, "tps": 69655, "wall": 2155.5} {"step": 2291, "train_loss": 4.204738616943359, "lr": 0.00039830344906790577, "tps": 69431, "wall": 2163.4} {"step": 2292, "train_loss": 4.079315662384033, "lr": 0.0003983008239204027, "tps": 69210, "wall": 2171.3} {"step": 2293, "train_loss": 4.115787982940674, "lr": 0.00039829819675309824, "tps": 68993, "wall": 2179.1} {"step": 2294, "train_loss": 4.141183853149414, "lr": 0.00039829556756602213, "tps": 68775, "wall": 2186.9} {"step": 2295, "train_loss": 4.073363304138184, "lr": 0.00039829293635920427, "tps": 68562, "wall": 2194.7} {"step": 2296, "train_loss": 4.107643127441406, "lr": 0.0003982903031326743, "tps": 68350, "wall": 2202.4} {"step": 2297, "train_loss": 4.134932994842529, "lr": 0.0003982876678864622, "tps": 68136, "wall": 2210.3} {"step": 2298, "train_loss": 4.186768054962158, "lr": 0.0003982850306205977, "tps": 67924, "wall": 2218.2} {"step": 2299, "train_loss": 4.183795928955078, "lr": 0.0003982823913351108, "tps": 67715, "wall": 2226.0} {"step": 2300, "train_loss": 4.01875638961792, "lr": 0.00039827975003003133, "tps": 67511, "wall": 2233.7} {"step": 2301, "train_loss": 4.160346508026123, "lr": 0.0003982771067053891, "tps": 67305, "wall": 2241.5} {"step": 2302, "train_loss": 4.086655616760254, "lr": 0.0003982744613612142, "tps": 67099, "wall": 2249.3} {"step": 2303, "train_loss": 4.069009780883789, "lr": 0.00039827181399753665, "tps": 66899, "wall": 2257.0} {"step": 2304, "train_loss": 4.055678844451904, "lr": 0.00039826916461438623, "tps": 66695, "wall": 2264.9} {"step": 2305, "train_loss": 4.077876567840576, "lr": 0.0003982665132117931, "tps": 66496, "wall": 2272.7} {"step": 2306, "train_loss": 4.0725555419921875, "lr": 0.00039826385978978726, "tps": 66294, "wall": 2280.6} {"step": 2307, "train_loss": 4.034894943237305, "lr": 0.00039826120434839884, "tps": 66097, "wall": 2288.4} {"step": 2308, "train_loss": 4.136098384857178, "lr": 0.00039825854688765774, "tps": 65901, "wall": 2296.2} {"step": 2309, "train_loss": 4.100866317749023, "lr": 0.0003982558874075942, "tps": 65706, "wall": 2304.0} {"step": 2310, "train_loss": 3.984637498855591, "lr": 0.00039825322590823846, "tps": 65513, "wall": 2311.8} {"step": 2311, "train_loss": 4.121760845184326, "lr": 0.0003982505623896204, "tps": 65320, "wall": 2319.6} {"step": 2312, "train_loss": 4.1092705726623535, "lr": 0.0003982478968517704, "tps": 65131, "wall": 2327.4} {"step": 2313, "train_loss": 4.174176216125488, "lr": 0.0003982452292947185, "tps": 64941, "wall": 2335.2} {"step": 2314, "train_loss": 4.178606986999512, "lr": 0.000398242559718495, "tps": 64749, "wall": 2343.1} {"step": 2315, "train_loss": 4.103673458099365, "lr": 0.0003982398881231302, "tps": 64562, "wall": 2350.9} {"step": 2316, "train_loss": 4.026176452636719, "lr": 0.0003982372145086543, "tps": 64379, "wall": 2358.6} {"step": 2317, "train_loss": 4.14836311340332, "lr": 0.00039823453887509756, "tps": 64193, "wall": 2366.5} {"step": 2318, "train_loss": 4.023296356201172, "lr": 0.0003982318612224904, "tps": 64009, "wall": 2374.3} {"step": 2319, "train_loss": 4.112288951873779, "lr": 0.000398229181550863, "tps": 63827, "wall": 2382.1} {"step": 2320, "train_loss": 4.011273384094238, "lr": 0.00039822649986024576, "tps": 63646, "wall": 2389.9} {"step": 2321, "train_loss": 4.172989845275879, "lr": 0.0003982238161506692, "tps": 63463, "wall": 2397.8} {"step": 2322, "train_loss": 4.0827789306640625, "lr": 0.0003982211304221635, "tps": 63282, "wall": 2405.7} {"step": 2323, "train_loss": 4.042238235473633, "lr": 0.00039821844267475925, "tps": 63102, "wall": 2413.6} {"step": 2324, "train_loss": 3.9735641479492188, "lr": 0.00039821575290848685, "tps": 62929, "wall": 2421.3} {"step": 2325, "train_loss": 4.055991172790527, "lr": 0.00039821306112337667, "tps": 62752, "wall": 2429.2} {"step": 2326, "train_loss": 4.155922889709473, "lr": 0.0003982103673194594, "tps": 62578, "wall": 2437.0} {"step": 2327, "train_loss": 4.202306270599365, "lr": 0.0003982076714967654, "tps": 62405, "wall": 2444.8} {"step": 2328, "train_loss": 4.064650535583496, "lr": 0.00039820497365532524, "tps": 62232, "wall": 2452.6} {"step": 2329, "train_loss": 4.022428512573242, "lr": 0.00039820227379516954, "tps": 62057, "wall": 2460.6} {"step": 2330, "train_loss": 4.029287338256836, "lr": 0.0003981995719163288, "tps": 61887, "wall": 2468.4} {"step": 2331, "train_loss": 4.168396949768066, "lr": 0.00039819686801883364, "tps": 61718, "wall": 2476.2} {"step": 2332, "train_loss": 4.024905681610107, "lr": 0.0003981941621027148, "tps": 61551, "wall": 2484.0} {"step": 2333, "train_loss": 4.071229457855225, "lr": 0.0003981914541680028, "tps": 61385, "wall": 2491.8} {"step": 2334, "train_loss": 3.9933924674987793, "lr": 0.0003981887442147284, "tps": 61220, "wall": 2499.6} {"step": 2335, "train_loss": 4.185302734375, "lr": 0.0003981860322429223, "tps": 61054, "wall": 2507.5} {"step": 2336, "train_loss": 4.068891525268555, "lr": 0.0003981833182526151, "tps": 60891, "wall": 2515.3} {"step": 2337, "train_loss": 4.108921527862549, "lr": 0.0003981806022438377, "tps": 60725, "wall": 2523.2} {"step": 2338, "train_loss": 4.137894153594971, "lr": 0.00039817788421662076, "tps": 60562, "wall": 2531.1} {"step": 2339, "train_loss": 4.013745307922363, "lr": 0.00039817516417099506, "tps": 60402, "wall": 2538.9} {"step": 2340, "train_loss": 4.035479545593262, "lr": 0.0003981724421069916, "tps": 60241, "wall": 2546.8} {"step": 2341, "train_loss": 4.067152976989746, "lr": 0.00039816971802464097, "tps": 60080, "wall": 2554.7} {"step": 2342, "train_loss": 4.314428806304932, "lr": 0.00039816699192397415, "tps": 59923, "wall": 2562.4} {"step": 2343, "train_loss": 4.125273704528809, "lr": 0.000398164263805022, "tps": 59764, "wall": 2570.4} {"step": 2344, "train_loss": 4.06879997253418, "lr": 0.00039816153366781546, "tps": 59606, "wall": 2578.3} {"step": 2345, "train_loss": 4.095512866973877, "lr": 0.00039815880151238545, "tps": 59453, "wall": 2586.0} {"step": 2346, "train_loss": 4.075422763824463, "lr": 0.0003981560673387628, "tps": 59297, "wall": 2593.9} {"step": 2347, "train_loss": 4.0941643714904785, "lr": 0.0003981533311469787, "tps": 59144, "wall": 2601.8} {"step": 2348, "train_loss": 4.028543472290039, "lr": 0.000398150592937064, "tps": 58993, "wall": 2609.5} {"step": 2349, "train_loss": 4.051512718200684, "lr": 0.0003981478527090497, "tps": 58842, "wall": 2617.3} {"step": 2350, "train_loss": 4.015130996704102, "lr": 0.0003981451104629669, "tps": 58693, "wall": 2625.1} {"step": 2351, "train_loss": 4.155356407165527, "lr": 0.0003981423661988466, "tps": 58543, "wall": 2632.9} {"step": 2352, "train_loss": 4.02768087387085, "lr": 0.00039813961991672, "tps": 58390, "wall": 2641.0} {"step": 2353, "train_loss": 4.159884452819824, "lr": 0.0003981368716166182, "tps": 58242, "wall": 2648.8} {"step": 2354, "train_loss": 4.120230674743652, "lr": 0.00039813412129857217, "tps": 58093, "wall": 2656.7} {"step": 2355, "train_loss": 4.149228096008301, "lr": 0.00039813136896261326, "tps": 57948, "wall": 2664.5} {"step": 2356, "train_loss": 4.0469841957092285, "lr": 0.00039812861460877255, "tps": 57803, "wall": 2672.3} {"step": 2357, "train_loss": 4.086186408996582, "lr": 0.0003981258582370812, "tps": 57659, "wall": 2680.1} {"step": 2358, "train_loss": 4.069652557373047, "lr": 0.00039812309984757054, "tps": 57516, "wall": 2687.9} {"step": 2359, "train_loss": 4.056861877441406, "lr": 0.00039812033944027175, "tps": 57373, "wall": 2695.8} {"step": 2360, "train_loss": 4.05601692199707, "lr": 0.0003981175770152162, "tps": 57227, "wall": 2703.8} {"step": 2361, "train_loss": 4.0534210205078125, "lr": 0.000398114812572435, "tps": 57086, "wall": 2711.6} {"step": 2362, "train_loss": 4.1273417472839355, "lr": 0.00039811204611195963, "tps": 56947, "wall": 2719.4} {"step": 2363, "train_loss": 4.026924133300781, "lr": 0.0003981092776338213, "tps": 56808, "wall": 2727.2} {"step": 2364, "train_loss": 4.048425674438477, "lr": 0.00039810650713805146, "tps": 56670, "wall": 2735.0} {"step": 2365, "train_loss": 4.107121467590332, "lr": 0.00039810373462468153, "tps": 56533, "wall": 2742.8} {"step": 2366, "train_loss": 4.030457496643066, "lr": 0.00039810096009374276, "tps": 56397, "wall": 2750.5} {"step": 2367, "train_loss": 4.205898284912109, "lr": 0.00039809818354526676, "tps": 56260, "wall": 2758.4} {"step": 2368, "train_loss": 3.9408936500549316, "lr": 0.0003980954049792849, "tps": 56124, "wall": 2766.2} {"step": 2369, "train_loss": 4.029017925262451, "lr": 0.0003980926243958286, "tps": 55990, "wall": 2774.0} {"step": 2370, "train_loss": 3.954906702041626, "lr": 0.00039808984179492946, "tps": 55857, "wall": 2781.8} {"step": 2371, "train_loss": 4.032158851623535, "lr": 0.000398087057176619, "tps": 55723, "wall": 2789.7} {"step": 2372, "train_loss": 3.9593677520751953, "lr": 0.00039808427054092863, "tps": 55592, "wall": 2797.4} {"step": 2373, "train_loss": 4.0895562171936035, "lr": 0.00039808148188789005, "tps": 55460, "wall": 2805.3} {"step": 2374, "train_loss": 3.986157178878784, "lr": 0.0003980786912175348, "tps": 55329, "wall": 2813.1} {"step": 2375, "train_loss": 3.968684196472168, "lr": 0.0003980758985298945, "tps": 55196, "wall": 2821.1} {"step": 2376, "train_loss": 4.123434543609619, "lr": 0.0003980731038250008, "tps": 55068, "wall": 2828.8} {"step": 2377, "train_loss": 4.140021800994873, "lr": 0.0003980703071028854, "tps": 54941, "wall": 2836.5} {"step": 2378, "train_loss": 4.146013259887695, "lr": 0.00039806750836357985, "tps": 54814, "wall": 2844.3} {"step": 2379, "train_loss": 4.124205112457275, "lr": 0.00039806470760711597, "tps": 54686, "wall": 2852.2} {"step": 2380, "train_loss": 4.190645217895508, "lr": 0.0003980619048335254, "tps": 54560, "wall": 2860.0} {"step": 2381, "train_loss": 4.021661281585693, "lr": 0.00039805910004284, "tps": 54434, "wall": 2867.8} {"step": 2382, "train_loss": 4.082065582275391, "lr": 0.0003980562932350914, "tps": 54312, "wall": 2875.5} {"step": 2383, "train_loss": 4.107576370239258, "lr": 0.00039805348441031155, "tps": 54184, "wall": 2883.4} {"step": 2384, "train_loss": 4.127214431762695, "lr": 0.00039805067356853217, "tps": 54062, "wall": 2891.2} {"step": 2385, "train_loss": 3.982377290725708, "lr": 0.00039804786070978513, "tps": 53939, "wall": 2899.0} {"step": 2386, "train_loss": 4.087425231933594, "lr": 0.00039804504583410233, "tps": 53816, "wall": 2906.8} {"step": 2387, "train_loss": 4.073875904083252, "lr": 0.0003980422289415156, "tps": 53695, "wall": 2914.6} {"step": 2388, "train_loss": 4.1170501708984375, "lr": 0.00039803941003205685, "tps": 53573, "wall": 2922.4} {"step": 2389, "train_loss": 3.997580051422119, "lr": 0.00039803658910575804, "tps": 53454, "wall": 2930.2} {"step": 2390, "train_loss": 4.175814151763916, "lr": 0.00039803376616265107, "tps": 53331, "wall": 2938.1} {"step": 2391, "train_loss": 4.158722877502441, "lr": 0.000398030941202768, "tps": 53214, "wall": 2945.9} {"step": 2392, "train_loss": 4.1319756507873535, "lr": 0.00039802811422614084, "tps": 53094, "wall": 2953.7} {"step": 2393, "train_loss": 3.9874861240386963, "lr": 0.0003980252852328015, "tps": 52976, "wall": 2961.6} {"step": 2394, "train_loss": 4.064061164855957, "lr": 0.00039802245422278215, "tps": 52859, "wall": 2969.4} {"step": 2395, "train_loss": 4.141298294067383, "lr": 0.0003980196211961148, "tps": 52742, "wall": 2977.2} {"step": 2396, "train_loss": 4.053956985473633, "lr": 0.00039801678615283153, "tps": 52628, "wall": 2984.9} {"step": 2397, "train_loss": 4.106665134429932, "lr": 0.0003980139490929645, "tps": 52513, "wall": 2992.7} {"step": 2398, "train_loss": 4.07529354095459, "lr": 0.0003980111100165458, "tps": 52396, "wall": 3000.6} {"step": 2399, "train_loss": 4.1151885986328125, "lr": 0.00039800826892360765, "tps": 52283, "wall": 3008.3} {"step": 2400, "train_loss": 3.9920437335968018, "lr": 0.0003980054258141822, "tps": 52170, "wall": 3016.1} {"step": 2401, "train_loss": 4.050049781799316, "lr": 0.0003980025806883016, "tps": 52055, "wall": 3024.0} {"step": 2402, "train_loss": 4.079014778137207, "lr": 0.0003979997335459982, "tps": 51943, "wall": 3031.8} {"step": 2403, "train_loss": 4.097654342651367, "lr": 0.0003979968843873041, "tps": 51830, "wall": 3039.7} {"step": 2404, "train_loss": 4.1760406494140625, "lr": 0.0003979940332122517, "tps": 51720, "wall": 3047.4} {"step": 2405, "train_loss": 4.052252292633057, "lr": 0.0003979911800208733, "tps": 51608, "wall": 3055.3} {"step": 2406, "train_loss": 4.13243293762207, "lr": 0.0003979883248132012, "tps": 51495, "wall": 3063.3} {"step": 2407, "train_loss": 4.030791759490967, "lr": 0.0003979854675892677, "tps": 51385, "wall": 3071.1} {"step": 2408, "train_loss": 4.1117987632751465, "lr": 0.0003979826083491052, "tps": 51275, "wall": 3079.0} {"step": 2409, "train_loss": 4.177726745605469, "lr": 0.0003979797470927461, "tps": 51165, "wall": 3086.9} {"step": 2410, "train_loss": 4.046040058135986, "lr": 0.0003979768838202227, "tps": 51058, "wall": 3094.6} {"step": 2411, "train_loss": 4.091002941131592, "lr": 0.00039797401853156766, "tps": 50951, "wall": 3102.4} {"step": 2412, "train_loss": 3.9688940048217773, "lr": 0.0003979711512268132, "tps": 50843, "wall": 3110.3} {"step": 2413, "train_loss": 4.01952600479126, "lr": 0.000397968281905992, "tps": 50734, "wall": 3118.2} {"step": 2414, "train_loss": 4.058213233947754, "lr": 0.00039796541056913643, "tps": 50629, "wall": 3126.0} {"step": 2415, "train_loss": 4.201067924499512, "lr": 0.0003979625372162791, "tps": 50524, "wall": 3133.8} {"step": 2416, "train_loss": 4.134298324584961, "lr": 0.00039795966184745247, "tps": 50419, "wall": 3141.7} {"step": 2417, "train_loss": 4.015198707580566, "lr": 0.0003979567844626892, "tps": 50314, "wall": 3149.5} {"step": 2418, "train_loss": 3.9883501529693604, "lr": 0.0003979539050620218, "tps": 50210, "wall": 3157.3} {"step": 2419, "train_loss": 4.118770599365234, "lr": 0.00039795102364548294, "tps": 50107, "wall": 3165.1} {"step": 2420, "train_loss": 3.969036102294922, "lr": 0.00039794814021310536, "tps": 50005, "wall": 3172.9} {"step": 2421, "train_loss": 4.080994606018066, "lr": 0.0003979452547649215, "tps": 49901, "wall": 3180.8} {"step": 2422, "train_loss": 4.055082321166992, "lr": 0.00039794236730096425, "tps": 49800, "wall": 3188.6} {"step": 2423, "train_loss": 4.039809703826904, "lr": 0.00039793947782126616, "tps": 49698, "wall": 3196.4} {"step": 2424, "train_loss": 4.11482048034668, "lr": 0.00039793658632586014, "tps": 49598, "wall": 3204.2} {"step": 2425, "train_loss": 3.950626850128174, "lr": 0.00039793369281477875, "tps": 49497, "wall": 3212.1} {"step": 2426, "train_loss": 4.097086429595947, "lr": 0.0003979307972880549, "tps": 49398, "wall": 3219.9} {"step": 2427, "train_loss": 4.151244163513184, "lr": 0.00039792789974572136, "tps": 49299, "wall": 3227.6} {"step": 2428, "train_loss": 4.121669769287109, "lr": 0.0003979250001878109, "tps": 49201, "wall": 3235.4} {"step": 2429, "train_loss": 4.115208148956299, "lr": 0.00039792209861435647, "tps": 49100, "wall": 3243.4} {"step": 2430, "train_loss": 4.12854528427124, "lr": 0.00039791919502539085, "tps": 49002, "wall": 3251.2} {"step": 2431, "train_loss": 4.053583145141602, "lr": 0.00039791628942094696, "tps": 48907, "wall": 3258.9} {"step": 2432, "train_loss": 4.01942253112793, "lr": 0.0003979133818010577, "tps": 48810, "wall": 3266.7} {"step": 2433, "train_loss": 4.114048957824707, "lr": 0.0003979104721657561, "tps": 48714, "wall": 3274.4} {"step": 2434, "train_loss": 4.171957015991211, "lr": 0.00039790756051507497, "tps": 48619, "wall": 3282.2} {"step": 2435, "train_loss": 4.114206790924072, "lr": 0.0003979046468490474, "tps": 48522, "wall": 3290.1} {"step": 2436, "train_loss": 4.080237865447998, "lr": 0.0003979017311677064, "tps": 48425, "wall": 3298.1} {"step": 2437, "train_loss": 4.083822250366211, "lr": 0.0003978988134710849, "tps": 48331, "wall": 3305.8} {"step": 2438, "train_loss": 4.08329439163208, "lr": 0.00039789589375921605, "tps": 48237, "wall": 3313.6} {"step": 2439, "train_loss": 4.0294904708862305, "lr": 0.0003978929720321329, "tps": 48144, "wall": 3321.4} {"step": 2440, "train_loss": 4.023241996765137, "lr": 0.0003978900482898685, "tps": 48050, "wall": 3329.2} {"step": 2441, "train_loss": 4.103673934936523, "lr": 0.00039788712253245606, "tps": 47957, "wall": 3337.1} {"step": 2442, "train_loss": 3.9660558700561523, "lr": 0.00039788419475992866, "tps": 47865, "wall": 3344.9} {"step": 2443, "train_loss": 4.058381080627441, "lr": 0.00039788126497231947, "tps": 47773, "wall": 3352.7} {"step": 2444, "train_loss": 4.0946760177612305, "lr": 0.0003978783331696617, "tps": 47680, "wall": 3360.6} {"step": 2445, "train_loss": 3.9960410594940186, "lr": 0.00039787539935198855, "tps": 47589, "wall": 3368.4} {"step": 2446, "train_loss": 4.103318214416504, "lr": 0.00039787246351933323, "tps": 47499, "wall": 3376.1} {"step": 2447, "train_loss": 4.045658588409424, "lr": 0.000397869525671729, "tps": 47409, "wall": 3383.9} {"step": 2448, "train_loss": 4.147482395172119, "lr": 0.00039786658580920917, "tps": 47320, "wall": 3391.7} {"step": 2449, "train_loss": 4.073973178863525, "lr": 0.0003978636439318071, "tps": 47230, "wall": 3399.5} {"step": 2450, "train_loss": 4.0319905281066895, "lr": 0.000397860700039556, "tps": 47140, "wall": 3407.5} {"step": 2451, "train_loss": 4.19234561920166, "lr": 0.0003978577541324892, "tps": 47051, "wall": 3415.3} {"step": 2452, "train_loss": 4.115302085876465, "lr": 0.0003978548062106403, "tps": 46962, "wall": 3423.2} {"step": 2453, "train_loss": 4.0810089111328125, "lr": 0.0003978518562740424, "tps": 46875, "wall": 3430.9} {"step": 2454, "train_loss": 4.082207202911377, "lr": 0.0003978489043227291, "tps": 46788, "wall": 3438.7} {"step": 2455, "train_loss": 4.1905436515808105, "lr": 0.00039784595035673376, "tps": 46702, "wall": 3446.5} {"step": 2456, "train_loss": 4.052116870880127, "lr": 0.0003978429943760899, "tps": 46615, "wall": 3454.2} {"step": 2457, "train_loss": 4.088222980499268, "lr": 0.000397840036380831, "tps": 46529, "wall": 3462.1} {"step": 2458, "train_loss": 4.013913154602051, "lr": 0.0003978370763709905, "tps": 46443, "wall": 3469.8} {"step": 2459, "train_loss": 4.006776809692383, "lr": 0.000397834114346602, "tps": 46355, "wall": 3477.8} {"step": 2460, "train_loss": 4.007327079772949, "lr": 0.0003978311503076991, "tps": 46270, "wall": 3485.7} {"step": 2461, "train_loss": 4.063332557678223, "lr": 0.0003978281842543152, "tps": 46186, "wall": 3493.5} {"step": 2462, "train_loss": 3.9713571071624756, "lr": 0.000397825216186484, "tps": 46102, "wall": 3501.2} {"step": 2463, "train_loss": 4.030953407287598, "lr": 0.00039782224610423924, "tps": 46018, "wall": 3509.1} {"step": 2464, "train_loss": 3.9820473194122314, "lr": 0.00039781927400761434, "tps": 45934, "wall": 3516.9} {"step": 2465, "train_loss": 4.074384689331055, "lr": 0.0003978162998966431, "tps": 45851, "wall": 3524.7} {"step": 2466, "train_loss": 4.046972274780273, "lr": 0.00039781332377135934, "tps": 45768, "wall": 3532.5} {"step": 2467, "train_loss": 4.058201313018799, "lr": 0.00039781034563179647, "tps": 45684, "wall": 3540.5} {"step": 2468, "train_loss": 4.106270790100098, "lr": 0.0003978073654779885, "tps": 45603, "wall": 3548.2} {"step": 2469, "train_loss": 4.085744857788086, "lr": 0.00039780438330996897, "tps": 45521, "wall": 3556.0} {"step": 2470, "train_loss": 4.107892036437988, "lr": 0.00039780139912777183, "tps": 45439, "wall": 3563.8} {"step": 2471, "train_loss": 4.004459381103516, "lr": 0.0003977984129314308, "tps": 45358, "wall": 3571.6} {"step": 2472, "train_loss": 4.1520915031433105, "lr": 0.00039779542472097974, "tps": 45277, "wall": 3579.5} {"step": 2473, "train_loss": 4.052597999572754, "lr": 0.00039779243449645244, "tps": 45198, "wall": 3587.2} {"step": 2474, "train_loss": 4.037246227264404, "lr": 0.0003977894422578829, "tps": 45118, "wall": 3595.0} {"step": 2475, "train_loss": 4.00693416595459, "lr": 0.0003977864480053049, "tps": 45037, "wall": 3602.9} {"step": 2476, "train_loss": 4.112747669219971, "lr": 0.0003977834517387524, "tps": 44958, "wall": 3610.7} {"step": 2477, "train_loss": 4.086609363555908, "lr": 0.00039778045345825936, "tps": 44879, "wall": 3618.5} {"step": 2478, "train_loss": 4.0265913009643555, "lr": 0.0003977774531638597, "tps": 44800, "wall": 3626.4} {"step": 2479, "train_loss": 4.111158847808838, "lr": 0.0003977744508555874, "tps": 44723, "wall": 3634.1} {"step": 2480, "train_loss": 4.018764495849609, "lr": 0.0003977714465334766, "tps": 44645, "wall": 3641.9} {"step": 2481, "train_loss": 4.019192218780518, "lr": 0.0003977684401975612, "tps": 44569, "wall": 3649.6} {"step": 2482, "train_loss": 4.01228666305542, "lr": 0.00039776543184787523, "tps": 44489, "wall": 3657.6} {"step": 2483, "train_loss": 4.155197620391846, "lr": 0.0003977624214844529, "tps": 44414, "wall": 3665.3} {"step": 2484, "train_loss": 4.066738605499268, "lr": 0.0003977594091073282, "tps": 44338, "wall": 3673.0} {"step": 2485, "train_loss": 3.97617244720459, "lr": 0.00039775639471653537, "tps": 44261, "wall": 3680.9} {"step": 2486, "train_loss": 4.0903801918029785, "lr": 0.00039775337831210835, "tps": 44186, "wall": 3688.6} {"step": 2487, "train_loss": 4.094852447509766, "lr": 0.0003977503598940816, "tps": 44110, "wall": 3696.5} {"step": 2488, "train_loss": 4.126517295837402, "lr": 0.00039774733946248904, "tps": 44035, "wall": 3704.2} {"step": 2489, "train_loss": 4.1680216789245605, "lr": 0.000397744317017365, "tps": 43960, "wall": 3712.1} {"step": 2490, "train_loss": 4.0334320068359375, "lr": 0.0003977412925587438, "tps": 43884, "wall": 3720.0} {"step": 2491, "train_loss": 4.073098659515381, "lr": 0.0003977382660866596, "tps": 43810, "wall": 3727.8} {"step": 2492, "train_loss": 4.117696762084961, "lr": 0.00039773523760114674, "tps": 43736, "wall": 3735.6} {"step": 2493, "train_loss": 4.034548759460449, "lr": 0.0003977322071022394, "tps": 43663, "wall": 3743.3} {"step": 2494, "train_loss": 4.117891311645508, "lr": 0.0003977291745899721, "tps": 43590, "wall": 3751.1} {"step": 2495, "train_loss": 4.019540786743164, "lr": 0.000397726140064379, "tps": 43516, "wall": 3759.0} {"step": 2496, "train_loss": 4.070634365081787, "lr": 0.00039772310352549465, "tps": 43444, "wall": 3766.7} {"step": 2497, "train_loss": 4.097146511077881, "lr": 0.00039772006497335326, "tps": 43372, "wall": 3774.5} {"step": 2498, "train_loss": 3.997687816619873, "lr": 0.0003977170244079895, "tps": 43299, "wall": 3782.4} {"step": 2499, "train_loss": 4.046095848083496, "lr": 0.0003977139818294376, "tps": 43227, "wall": 3790.2} {"step": 2500, "train_loss": 4.062174320220947, "lr": 0.0003977109372377321, "tps": 43156, "wall": 3797.9} {"step": 2501, "train_loss": 4.134237766265869, "lr": 0.0003977078906329075, "tps": 43086, "wall": 3805.6} {"step": 2502, "train_loss": 4.010129451751709, "lr": 0.0003977048420149983, "tps": 43015, "wall": 3813.4} {"step": 2503, "train_loss": 3.9735641479492188, "lr": 0.000397701791384039, "tps": 42944, "wall": 3821.3} {"step": 2504, "train_loss": 4.0218353271484375, "lr": 0.0003976987387400643, "tps": 42873, "wall": 3829.1} {"step": 2505, "train_loss": 4.114602088928223, "lr": 0.00039769568408310857, "tps": 42804, "wall": 3836.8} {"step": 2506, "train_loss": 3.992131471633911, "lr": 0.0003976926274132065, "tps": 42732, "wall": 3844.8} {"step": 2507, "train_loss": 3.9688076972961426, "lr": 0.00039768956873039287, "tps": 42662, "wall": 3852.6} {"step": 2508, "train_loss": 3.868197441101074, "lr": 0.00039768650803470205, "tps": 42594, "wall": 3860.4} {"step": 2509, "train_loss": 4.100766181945801, "lr": 0.0003976834453261689, "tps": 42526, "wall": 3868.1} {"step": 2510, "train_loss": 4.067473411560059, "lr": 0.0003976803806048281, "tps": 42457, "wall": 3875.9} {"step": 2511, "train_loss": 3.9933576583862305, "lr": 0.0003976773138707143, "tps": 42389, "wall": 3883.7} {"step": 2512, "train_loss": 4.0072479248046875, "lr": 0.0003976742451238623, "tps": 42321, "wall": 3891.4} {"step": 2513, "train_loss": 4.180713653564453, "lr": 0.00039767117436430684, "tps": 42251, "wall": 3899.4} {"step": 2514, "train_loss": 4.065741539001465, "lr": 0.0003976681015920827, "tps": 42184, "wall": 3907.2} {"step": 2515, "train_loss": 4.0203423500061035, "lr": 0.00039766502680722463, "tps": 42117, "wall": 3915.0} {"step": 2516, "train_loss": 4.1566386222839355, "lr": 0.00039766195000976763, "tps": 42050, "wall": 3922.7} {"step": 2517, "train_loss": 4.023316383361816, "lr": 0.0003976588711997464, "tps": 41984, "wall": 3930.5} {"step": 2518, "train_loss": 4.065987586975098, "lr": 0.00039765579037719583, "tps": 41918, "wall": 3938.2} {"step": 2519, "train_loss": 4.014237880706787, "lr": 0.0003976527075421509, "tps": 41852, "wall": 3946.0} {"step": 2520, "train_loss": 3.9799299240112305, "lr": 0.0003976496226946465, "tps": 41786, "wall": 3953.8} {"step": 2521, "train_loss": 4.026676654815674, "lr": 0.00039764653583471756, "tps": 41719, "wall": 3961.8} {"step": 2522, "train_loss": 3.9814224243164062, "lr": 0.00039764344696239905, "tps": 41653, "wall": 3969.6} {"step": 2523, "train_loss": 4.074336051940918, "lr": 0.00039764035607772595, "tps": 41588, "wall": 3977.3} {"step": 2524, "train_loss": 4.066098213195801, "lr": 0.00039763726318073323, "tps": 41524, "wall": 3985.0} {"step": 2525, "train_loss": 4.0432538986206055, "lr": 0.0003976341682714561, "tps": 41460, "wall": 3992.8} {"step": 2526, "train_loss": 3.958580493927002, "lr": 0.00039763107134992945, "tps": 41395, "wall": 4000.6} {"step": 2527, "train_loss": 4.044558525085449, "lr": 0.0003976279724161883, "tps": 41330, "wall": 4008.6} {"step": 2528, "train_loss": 3.919283866882324, "lr": 0.0003976248714702681, "tps": 41266, "wall": 4016.4} {"step": 2529, "train_loss": 3.9438796043395996, "lr": 0.0003976217685122036, "tps": 41201, "wall": 4024.3} {"step": 2530, "train_loss": 4.066356658935547, "lr": 0.0003976186635420301, "tps": 41138, "wall": 4032.0} {"step": 2531, "train_loss": 4.059117794036865, "lr": 0.00039761555655978283, "tps": 41075, "wall": 4039.8} {"step": 2532, "train_loss": 4.0470051765441895, "lr": 0.0003976124475654968, "tps": 41012, "wall": 4047.6} {"step": 2533, "train_loss": 4.104137420654297, "lr": 0.00039760933655920747, "tps": 40949, "wall": 4055.4} {"step": 2534, "train_loss": 4.014195442199707, "lr": 0.0003976062235409499, "tps": 40887, "wall": 4063.2} {"step": 2535, "train_loss": 4.083380222320557, "lr": 0.00039760310851075947, "tps": 40825, "wall": 4071.0} {"step": 2536, "train_loss": 4.004104137420654, "lr": 0.00039759999146867143, "tps": 40761, "wall": 4079.0} {"step": 2537, "train_loss": 4.117093086242676, "lr": 0.00039759687241472104, "tps": 40700, "wall": 4086.7} {"step": 2538, "train_loss": 3.9816250801086426, "lr": 0.0003975937513489437, "tps": 40640, "wall": 4094.4} {"step": 2539, "train_loss": 4.053915500640869, "lr": 0.0003975906282713747, "tps": 40578, "wall": 4102.2} {"step": 2540, "train_loss": 4.122499942779541, "lr": 0.0003975875031820495, "tps": 40518, "wall": 4109.9} {"step": 2541, "train_loss": 3.9378936290740967, "lr": 0.00039758437608100345, "tps": 40458, "wall": 4117.6} {"step": 2542, "train_loss": 3.989767551422119, "lr": 0.00039758124696827194, "tps": 40398, "wall": 4125.3} {"step": 2543, "train_loss": 4.150173187255859, "lr": 0.00039757811584389046, "tps": 40338, "wall": 4133.1} {"step": 2544, "train_loss": 4.027575969696045, "lr": 0.00039757498270789454, "tps": 40275, "wall": 4141.2} {"step": 2545, "train_loss": 4.0729522705078125, "lr": 0.00039757184756031955, "tps": 40216, "wall": 4149.0} {"step": 2546, "train_loss": 4.100533962249756, "lr": 0.0003975687104012011, "tps": 40156, "wall": 4156.8} {"step": 2547, "train_loss": 4.047323703765869, "lr": 0.0003975655712305747, "tps": 40097, "wall": 4164.5} {"step": 2548, "train_loss": 4.03289794921875, "lr": 0.00039756243004847585, "tps": 40038, "wall": 4172.3} {"step": 2549, "train_loss": 3.998011589050293, "lr": 0.0003975592868549402, "tps": 39978, "wall": 4180.1} {"step": 2550, "train_loss": 4.0661702156066895, "lr": 0.0003975561416500034, "tps": 39920, "wall": 4187.9} {"step": 2551, "train_loss": 3.981369972229004, "lr": 0.00039755299443370093, "tps": 39862, "wall": 4195.7} {"step": 2552, "train_loss": 4.08026647567749, "lr": 0.00039754984520606857, "tps": 39802, "wall": 4203.6} {"step": 2553, "train_loss": 4.01491117477417, "lr": 0.000397546693967142, "tps": 39744, "wall": 4211.3} {"step": 2554, "train_loss": 3.9919867515563965, "lr": 0.00039754354071695687, "tps": 39686, "wall": 4219.2} {"step": 2555, "train_loss": 4.035799026489258, "lr": 0.0003975403854555489, "tps": 39629, "wall": 4226.9} {"step": 2556, "train_loss": 4.0825090408325195, "lr": 0.00039753722818295376, "tps": 39572, "wall": 4234.7} {"step": 2557, "train_loss": 3.917111873626709, "lr": 0.0003975340688992074, "tps": 39514, "wall": 4242.5} {"step": 2558, "train_loss": 3.9006009101867676, "lr": 0.00039753090760434546, "tps": 39457, "wall": 4250.3} {"step": 2559, "train_loss": 4.060683250427246, "lr": 0.0003975277442984038, "tps": 39400, "wall": 4258.2} {"step": 2560, "train_loss": 3.953965425491333, "lr": 0.0003975245789814182, "tps": 39343, "wall": 4265.9} {"step": 2561, "train_loss": 4.054921627044678, "lr": 0.00039752141165342464, "tps": 39287, "wall": 4273.7} {"step": 2562, "train_loss": 3.9789113998413086, "lr": 0.0003975182423144589, "tps": 39231, "wall": 4281.5} {"step": 2563, "train_loss": 3.977506399154663, "lr": 0.0003975150709645569, "tps": 39175, "wall": 4289.3} {"step": 2564, "train_loss": 4.103030204772949, "lr": 0.00039751189760375453, "tps": 39118, "wall": 4297.2} {"step": 2565, "train_loss": 3.9817967414855957, "lr": 0.00039750872223208786, "tps": 39063, "wall": 4304.9} {"step": 2566, "train_loss": 3.97174072265625, "lr": 0.0003975055448495927, "tps": 39008, "wall": 4312.7} {"step": 2567, "train_loss": 3.940997362136841, "lr": 0.00039750236545630524, "tps": 38952, "wall": 4320.6} {"step": 2568, "train_loss": 4.144424915313721, "lr": 0.0003974991840522613, "tps": 38898, "wall": 4328.2} {"step": 2569, "train_loss": 3.925861120223999, "lr": 0.00039749600063749706, "tps": 38843, "wall": 4336.0} {"step": 2570, "train_loss": 4.08493709564209, "lr": 0.0003974928152120484, "tps": 38789, "wall": 4343.8} {"step": 2571, "train_loss": 3.8966822624206543, "lr": 0.0003974896277759516, "tps": 38735, "wall": 4351.5} {"step": 2572, "train_loss": 3.9405012130737305, "lr": 0.0003974864383292427, "tps": 38682, "wall": 4359.2} {"step": 2573, "train_loss": 3.8964877128601074, "lr": 0.0003974832468719578, "tps": 38628, "wall": 4367.0} {"step": 2574, "train_loss": 4.115567684173584, "lr": 0.00039748005340413314, "tps": 38574, "wall": 4374.8} {"step": 2575, "train_loss": 4.01022481918335, "lr": 0.0003974768579258048, "tps": 38519, "wall": 4382.7} {"step": 2576, "train_loss": 4.021203994750977, "lr": 0.00039747366043700903, "tps": 38466, "wall": 4390.5} {"step": 2577, "train_loss": 4.0868706703186035, "lr": 0.00039747046093778195, "tps": 38413, "wall": 4398.3} {"step": 2578, "train_loss": 3.9242358207702637, "lr": 0.00039746725942816, "tps": 38360, "wall": 4406.1} {"step": 2579, "train_loss": 4.026534080505371, "lr": 0.0003974640559081793, "tps": 38307, "wall": 4413.9} {"step": 2580, "train_loss": 4.055980205535889, "lr": 0.0003974608503778761, "tps": 38254, "wall": 4421.7} {"step": 2581, "train_loss": 4.048495292663574, "lr": 0.00039745764283728686, "tps": 38201, "wall": 4429.5} {"step": 2582, "train_loss": 4.127167224884033, "lr": 0.00039745443328644784, "tps": 38147, "wall": 4437.5} {"step": 2583, "train_loss": 4.023582935333252, "lr": 0.00039745122172539537, "tps": 38095, "wall": 4445.2} {"step": 2584, "train_loss": 4.0963029861450195, "lr": 0.0003974480081541658, "tps": 38044, "wall": 4452.9} {"step": 2585, "train_loss": 3.9988961219787598, "lr": 0.0003974447925727957, "tps": 37993, "wall": 4460.7} {"step": 2586, "train_loss": 3.989609718322754, "lr": 0.0003974415749813214, "tps": 37941, "wall": 4468.5} {"step": 2587, "train_loss": 4.0670366287231445, "lr": 0.0003974383553797793, "tps": 37889, "wall": 4476.3} {"step": 2588, "train_loss": 3.907592296600342, "lr": 0.0003974351337682059, "tps": 37838, "wall": 4484.1} {"step": 2589, "train_loss": 3.982320785522461, "lr": 0.0003974319101466377, "tps": 37787, "wall": 4491.9} {"step": 2590, "train_loss": 4.011566162109375, "lr": 0.0003974286845151112, "tps": 37735, "wall": 4499.8} {"step": 2591, "train_loss": 3.9205334186553955, "lr": 0.000397425456873663, "tps": 37685, "wall": 4507.6} {"step": 2592, "train_loss": 4.045749664306641, "lr": 0.0003974222272223297, "tps": 37635, "wall": 4515.3} {"step": 2593, "train_loss": 3.9702892303466797, "lr": 0.0003974189955611477, "tps": 37584, "wall": 4523.2} {"step": 2594, "train_loss": 4.128228187561035, "lr": 0.00039741576189015375, "tps": 37535, "wall": 4530.8} {"step": 2595, "train_loss": 4.0612993240356445, "lr": 0.0003974125262093844, "tps": 37486, "wall": 4538.5} {"step": 2596, "train_loss": 3.968933582305908, "lr": 0.0003974092885188764, "tps": 37436, "wall": 4546.3} {"step": 2597, "train_loss": 3.9180569648742676, "lr": 0.00039740604881866644, "tps": 37386, "wall": 4554.1} {"step": 2598, "train_loss": 4.059494972229004, "lr": 0.0003974028071087911, "tps": 37336, "wall": 4562.0} {"step": 2599, "train_loss": 4.129970073699951, "lr": 0.0003973995633892872, "tps": 37287, "wall": 4569.7} {"step": 2600, "train_loss": 3.961146116256714, "lr": 0.0003973963176601914, "tps": 37239, "wall": 4577.4} {"step": 2601, "train_loss": 4.121356010437012, "lr": 0.00039739306992154057, "tps": 37190, "wall": 4585.1} {"step": 2602, "train_loss": 4.021687030792236, "lr": 0.00039738982017337144, "tps": 37141, "wall": 4593.0} {"step": 2603, "train_loss": 4.102410316467285, "lr": 0.0003973865684157208, "tps": 37093, "wall": 4600.7} {"step": 2604, "train_loss": 3.959165096282959, "lr": 0.00039738331464862553, "tps": 37045, "wall": 4608.5} {"step": 2605, "train_loss": 3.9874649047851562, "lr": 0.00039738005887212253, "tps": 36996, "wall": 4616.2} {"step": 2606, "train_loss": 4.0310516357421875, "lr": 0.0003973768010862485, "tps": 36948, "wall": 4624.1} {"step": 2607, "train_loss": 3.9850239753723145, "lr": 0.00039737354129104055, "tps": 36899, "wall": 4631.9} {"step": 2608, "train_loss": 3.9725170135498047, "lr": 0.00039737027948653556, "tps": 36852, "wall": 4639.7} {"step": 2609, "train_loss": 4.098959922790527, "lr": 0.0003973670156727704, "tps": 36804, "wall": 4647.4} {"step": 2610, "train_loss": 3.8479995727539062, "lr": 0.00039736374984978206, "tps": 36757, "wall": 4655.2} {"step": 2611, "train_loss": 4.011435508728027, "lr": 0.00039736048201760766, "tps": 36711, "wall": 4662.9} {"step": 2612, "train_loss": 3.9788074493408203, "lr": 0.000397357212176284, "tps": 36664, "wall": 4670.7} {"step": 2613, "train_loss": 4.0013580322265625, "lr": 0.00039735394032584836, "tps": 36616, "wall": 4678.5} {"step": 2614, "train_loss": 4.062136650085449, "lr": 0.00039735066646633767, "tps": 36570, "wall": 4686.3} {"step": 2615, "train_loss": 3.9610700607299805, "lr": 0.00039734739059778896, "tps": 36523, "wall": 4694.0} {"step": 2616, "train_loss": 4.106359481811523, "lr": 0.00039734411272023955, "tps": 36477, "wall": 4701.8} {"step": 2617, "train_loss": 4.136634826660156, "lr": 0.00039734083283372634, "tps": 36430, "wall": 4709.6} {"step": 2618, "train_loss": 4.0652079582214355, "lr": 0.0003973375509382865, "tps": 36384, "wall": 4717.4} {"step": 2619, "train_loss": 4.023749828338623, "lr": 0.00039733426703395745, "tps": 36338, "wall": 4725.1} {"step": 2620, "train_loss": 4.05648136138916, "lr": 0.00039733098112077614, "tps": 36292, "wall": 4732.9} {"step": 2621, "train_loss": 4.10801887512207, "lr": 0.0003973276931987799, "tps": 36245, "wall": 4740.8} {"step": 2622, "train_loss": 4.038548946380615, "lr": 0.000397324403268006, "tps": 36199, "wall": 4748.7} {"step": 2623, "train_loss": 3.9642157554626465, "lr": 0.0003973211113284916, "tps": 36154, "wall": 4756.4} {"step": 2624, "train_loss": 4.021328926086426, "lr": 0.0003973178173802741, "tps": 36109, "wall": 4764.2} {"step": 2625, "train_loss": 4.051713943481445, "lr": 0.0003973145214233908, "tps": 36064, "wall": 4771.9} {"step": 2626, "train_loss": 4.013710021972656, "lr": 0.00039731122345787896, "tps": 36019, "wall": 4779.7} {"step": 2627, "train_loss": 3.9653046131134033, "lr": 0.000397307923483776, "tps": 35975, "wall": 4787.4} {"step": 2628, "train_loss": 4.094355583190918, "lr": 0.00039730462150111925, "tps": 35930, "wall": 4795.2} {"step": 2629, "train_loss": 4.0278639793396, "lr": 0.0003973013175099462, "tps": 35884, "wall": 4803.2} {"step": 2630, "train_loss": 4.032105445861816, "lr": 0.00039729801151029427, "tps": 35840, "wall": 4810.9} {"step": 2631, "train_loss": 4.093425273895264, "lr": 0.0003972947035022008, "tps": 35796, "wall": 4818.7} {"step": 2632, "train_loss": 4.00864315032959, "lr": 0.0003972913934857034, "tps": 35752, "wall": 4826.4} {"step": 2633, "train_loss": 3.9961371421813965, "lr": 0.0003972880814608394, "tps": 35709, "wall": 4834.1} {"step": 2634, "train_loss": 3.9752237796783447, "lr": 0.0003972847674276466, "tps": 35665, "wall": 4841.9} {"step": 2635, "train_loss": 3.9898996353149414, "lr": 0.00039728145138616226, "tps": 35622, "wall": 4849.6} {"step": 2636, "train_loss": 4.086550712585449, "lr": 0.000397278133336424, "tps": 35577, "wall": 4857.5} {"step": 2637, "train_loss": 4.015591144561768, "lr": 0.0003972748132784695, "tps": 35535, "wall": 4865.1} {"step": 2638, "train_loss": 4.022855758666992, "lr": 0.0003972714912123363, "tps": 35492, "wall": 4872.9} {"step": 2639, "train_loss": 3.9483118057250977, "lr": 0.0003972681671380621, "tps": 35449, "wall": 4880.6} {"step": 2640, "train_loss": 4.139676094055176, "lr": 0.00039726484105568455, "tps": 35406, "wall": 4888.4} {"step": 2641, "train_loss": 3.934488534927368, "lr": 0.00039726151296524124, "tps": 35363, "wall": 4896.2} {"step": 2642, "train_loss": 3.8756237030029297, "lr": 0.00039725818286676985, "tps": 35321, "wall": 4903.8} {"step": 2643, "train_loss": 3.9975240230560303, "lr": 0.00039725485076030833, "tps": 35278, "wall": 4911.7} {"step": 2644, "train_loss": 4.05492639541626, "lr": 0.00039725151664589414, "tps": 35236, "wall": 4919.5} {"step": 2645, "train_loss": 4.0167717933654785, "lr": 0.0003972481805235652, "tps": 35193, "wall": 4927.2} {"step": 2646, "train_loss": 4.014433860778809, "lr": 0.0003972448423933593, "tps": 35151, "wall": 4935.0} {"step": 2647, "train_loss": 3.954319477081299, "lr": 0.00039724150225531427, "tps": 35110, "wall": 4942.7} {"step": 2648, "train_loss": 4.073493480682373, "lr": 0.00039723816010946785, "tps": 35068, "wall": 4950.4} {"step": 2649, "train_loss": 4.044408798217773, "lr": 0.00039723481595585805, "tps": 35027, "wall": 4958.1} {"step": 2650, "train_loss": 3.926898956298828, "lr": 0.00039723146979452257, "tps": 34985, "wall": 4965.9} {"step": 2651, "train_loss": 4.059828758239746, "lr": 0.0003972281216254995, "tps": 34943, "wall": 4973.7} {"step": 2652, "train_loss": 4.019600868225098, "lr": 0.00039722477144882664, "tps": 34901, "wall": 4981.6} {"step": 2653, "train_loss": 4.060701847076416, "lr": 0.000397221419264542, "tps": 34860, "wall": 4989.3} {"step": 2654, "train_loss": 4.0947370529174805, "lr": 0.00039721806507268353, "tps": 34819, "wall": 4997.1} {"step": 2655, "train_loss": 4.070834159851074, "lr": 0.0003972147088732892, "tps": 34778, "wall": 5004.9} {"step": 2656, "train_loss": 4.063259124755859, "lr": 0.00039721135066639703, "tps": 34737, "wall": 5012.7} {"step": 2657, "train_loss": 4.051886081695557, "lr": 0.00039720799045204515, "tps": 34697, "wall": 5020.4} {"step": 2658, "train_loss": 3.975496768951416, "lr": 0.0003972046282302716, "tps": 34657, "wall": 5028.1} {"step": 2659, "train_loss": 3.994394302368164, "lr": 0.0003972012640011144, "tps": 34617, "wall": 5035.7} {"step": 2660, "train_loss": 3.9311585426330566, "lr": 0.0003971978977646117, "tps": 34576, "wall": 5043.6} {"step": 2661, "train_loss": 3.9542222023010254, "lr": 0.0003971945295208016, "tps": 34536, "wall": 5051.3} {"step": 2662, "train_loss": 3.9834470748901367, "lr": 0.00039719115926972233, "tps": 34497, "wall": 5059.0} {"step": 2663, "train_loss": 3.9672183990478516, "lr": 0.00039718778701141195, "tps": 34457, "wall": 5066.8} {"step": 2664, "train_loss": 4.032522201538086, "lr": 0.00039718441274590876, "tps": 34417, "wall": 5074.5} {"step": 2665, "train_loss": 3.9947452545166016, "lr": 0.000397181036473251, "tps": 34378, "wall": 5082.2} {"step": 2666, "train_loss": 3.9463186264038086, "lr": 0.00039717765819347685, "tps": 34339, "wall": 5089.9} {"step": 2667, "train_loss": 4.049162864685059, "lr": 0.00039717427790662455, "tps": 34299, "wall": 5097.8} {"step": 2668, "train_loss": 4.093946933746338, "lr": 0.0003971708956127325, "tps": 34261, "wall": 5105.4} {"step": 2669, "train_loss": 3.973722457885742, "lr": 0.0003971675113118389, "tps": 34222, "wall": 5113.1} {"step": 2670, "train_loss": 3.9716763496398926, "lr": 0.0003971641250039823, "tps": 34183, "wall": 5120.8} {"step": 2671, "train_loss": 4.0372514724731445, "lr": 0.0003971607366892008, "tps": 34144, "wall": 5128.5} {"step": 2672, "train_loss": 3.9647891521453857, "lr": 0.00039715734636753294, "tps": 34106, "wall": 5136.2} {"step": 2673, "train_loss": 3.9508056640625, "lr": 0.000397153954039017, "tps": 34068, "wall": 5143.9} {"step": 2674, "train_loss": 4.040524959564209, "lr": 0.0003971505597036915, "tps": 34029, "wall": 5151.6} {"step": 2675, "train_loss": 3.9764404296875, "lr": 0.00039714716336159496, "tps": 33991, "wall": 5159.4} {"step": 2676, "train_loss": 4.001646518707275, "lr": 0.0003971437650127656, "tps": 33952, "wall": 5167.2} {"step": 2677, "train_loss": 3.9513540267944336, "lr": 0.00039714036465724226, "tps": 33915, "wall": 5174.8} {"step": 2678, "train_loss": 3.97178316116333, "lr": 0.00039713696229506316, "tps": 33877, "wall": 5182.5} {"step": 2679, "train_loss": 4.066734790802002, "lr": 0.000397133557926267, "tps": 33840, "wall": 5190.1} {"step": 2680, "train_loss": 4.036040306091309, "lr": 0.00039713015155089243, "tps": 33803, "wall": 5197.7} {"step": 2681, "train_loss": 4.111115455627441, "lr": 0.0003971267431689778, "tps": 33766, "wall": 5205.4} {"step": 2682, "train_loss": 4.048572540283203, "lr": 0.0003971233327805619, "tps": 33729, "wall": 5213.1} {"step": 2683, "train_loss": 3.925917148590088, "lr": 0.0003971199203856833, "tps": 33691, "wall": 5220.9} {"step": 2684, "train_loss": 3.9027414321899414, "lr": 0.00039711650598438057, "tps": 33654, "wall": 5228.5} {"step": 2685, "train_loss": 3.991903066635132, "lr": 0.0003971130895766925, "tps": 33617, "wall": 5236.2} {"step": 2686, "train_loss": 4.033533096313477, "lr": 0.0003971096711626579, "tps": 33581, "wall": 5243.9} {"step": 2687, "train_loss": 4.101654052734375, "lr": 0.00039710625074231525, "tps": 33545, "wall": 5251.5} {"step": 2688, "train_loss": 4.028979301452637, "lr": 0.00039710282831570344, "tps": 33509, "wall": 5259.1} {"step": 2689, "train_loss": 3.9373369216918945, "lr": 0.00039709940388286117, "tps": 33472, "wall": 5266.7} {"step": 2690, "train_loss": 4.0307230949401855, "lr": 0.00039709597744382735, "tps": 33436, "wall": 5274.3} {"step": 2691, "train_loss": 3.916783332824707, "lr": 0.00039709254899864064, "tps": 33400, "wall": 5282.1} {"step": 2692, "train_loss": 4.049739837646484, "lr": 0.00039708911854734, "tps": 33364, "wall": 5289.8} {"step": 2693, "train_loss": 3.985553026199341, "lr": 0.00039708568608996423, "tps": 33329, "wall": 5297.3} {"step": 2694, "train_loss": 4.012138366699219, "lr": 0.00039708225162655227, "tps": 33293, "wall": 5304.9} {"step": 2695, "train_loss": 4.006622791290283, "lr": 0.00039707881515714294, "tps": 33257, "wall": 5312.6} {"step": 2696, "train_loss": 4.096653938293457, "lr": 0.00039707537668177517, "tps": 33221, "wall": 5320.3} {"step": 2697, "train_loss": 3.9545083045959473, "lr": 0.00039707193620048804, "tps": 33186, "wall": 5328.0} {"step": 2698, "train_loss": 3.938699722290039, "lr": 0.0003970684937133204, "tps": 33151, "wall": 5335.6} {"step": 2699, "train_loss": 4.036637306213379, "lr": 0.00039706504922031125, "tps": 33115, "wall": 5343.3} {"step": 2700, "train_loss": 4.030667781829834, "lr": 0.0003970616027214997, "tps": 33080, "wall": 5351.0} {"step": 2701, "train_loss": 4.0242838859558105, "lr": 0.0003970581542169247, "tps": 33045, "wall": 5358.6} {"step": 2702, "train_loss": 4.002585411071777, "lr": 0.00039705470370662534, "tps": 33010, "wall": 5366.3} {"step": 2703, "train_loss": 4.048553466796875, "lr": 0.0003970512511906408, "tps": 32975, "wall": 5373.9} {"step": 2704, "train_loss": 3.957789182662964, "lr": 0.00039704779666901004, "tps": 32941, "wall": 5381.5} {"step": 2705, "train_loss": 3.9895665645599365, "lr": 0.00039704434014177227, "tps": 32906, "wall": 5389.2} {"step": 2706, "train_loss": 4.0916972160339355, "lr": 0.00039704088160896664, "tps": 32872, "wall": 5396.8} {"step": 2707, "train_loss": 3.9480457305908203, "lr": 0.00039703742107063234, "tps": 32836, "wall": 5404.6} {"step": 2708, "train_loss": 4.043571949005127, "lr": 0.00039703395852680847, "tps": 32802, "wall": 5412.2} {"step": 2709, "train_loss": 3.8858113288879395, "lr": 0.0003970304939775344, "tps": 32768, "wall": 5419.9} {"step": 2710, "train_loss": 4.0598368644714355, "lr": 0.0003970270274228494, "tps": 32734, "wall": 5427.5} {"step": 2711, "train_loss": 4.006821155548096, "lr": 0.00039702355886279256, "tps": 32700, "wall": 5435.2} {"step": 2712, "train_loss": 4.037762641906738, "lr": 0.0003970200882974033, "tps": 32667, "wall": 5442.8} {"step": 2713, "train_loss": 3.9324374198913574, "lr": 0.00039701661572672084, "tps": 32633, "wall": 5450.4} {"step": 2714, "train_loss": 3.9732065200805664, "lr": 0.0003970131411507847, "tps": 32598, "wall": 5458.2} {"step": 2715, "train_loss": 4.090514183044434, "lr": 0.00039700966456963406, "tps": 32565, "wall": 5465.8} {"step": 2716, "train_loss": 4.057394027709961, "lr": 0.00039700618598330833, "tps": 32531, "wall": 5473.5} {"step": 2717, "train_loss": 3.9530129432678223, "lr": 0.00039700270539184696, "tps": 32498, "wall": 5481.1} {"step": 2718, "train_loss": 4.032914161682129, "lr": 0.0003969992227952894, "tps": 32464, "wall": 5488.8} {"step": 2719, "train_loss": 3.9210240840911865, "lr": 0.0003969957381936751, "tps": 32431, "wall": 5496.4} {"step": 2720, "train_loss": 4.009640693664551, "lr": 0.0003969922515870434, "tps": 32399, "wall": 5504.0} {"step": 2721, "train_loss": 4.071334362030029, "lr": 0.000396988762975434, "tps": 32366, "wall": 5511.6} {"step": 2722, "train_loss": 4.023709774017334, "lr": 0.0003969852723588863, "tps": 32332, "wall": 5519.4} {"step": 2723, "train_loss": 3.9553110599517822, "lr": 0.00039698177973743984, "tps": 32299, "wall": 5527.0} {"step": 2724, "train_loss": 4.021442890167236, "lr": 0.00039697828511113417, "tps": 32266, "wall": 5534.6} {"step": 2725, "train_loss": 3.9838624000549316, "lr": 0.0003969747884800089, "tps": 32234, "wall": 5542.2} {"step": 2726, "train_loss": 4.055780410766602, "lr": 0.00039697128984410367, "tps": 32202, "wall": 5549.9} {"step": 2727, "train_loss": 4.030447006225586, "lr": 0.00039696778920345814, "tps": 32169, "wall": 5557.5} {"step": 2728, "train_loss": 3.9677586555480957, "lr": 0.0003969642865581119, "tps": 32137, "wall": 5565.1} {"step": 2729, "train_loss": 4.006028175354004, "lr": 0.00039696078190810464, "tps": 32105, "wall": 5572.6} {"step": 2730, "train_loss": 3.9867379665374756, "lr": 0.0003969572752534761, "tps": 32072, "wall": 5580.4} {"step": 2731, "train_loss": 3.933250904083252, "lr": 0.00039695376659426595, "tps": 32040, "wall": 5588.0} {"step": 2732, "train_loss": 4.0203776359558105, "lr": 0.0003969502559305139, "tps": 32008, "wall": 5595.7} {"step": 2733, "train_loss": 3.933255195617676, "lr": 0.0003969467432622599, "tps": 31976, "wall": 5603.3} {"step": 2734, "train_loss": 3.9962081909179688, "lr": 0.0003969432285895435, "tps": 31944, "wall": 5611.0} {"step": 2735, "train_loss": 4.001854419708252, "lr": 0.00039693971191240475, "tps": 31912, "wall": 5618.6} {"step": 2736, "train_loss": 4.068254470825195, "lr": 0.0003969361932308833, "tps": 31881, "wall": 5626.3} {"step": 2737, "train_loss": 3.988924026489258, "lr": 0.00039693267254501904, "tps": 31849, "wall": 5633.9} {"step": 2738, "train_loss": 3.9446463584899902, "lr": 0.00039692914985485196, "tps": 31817, "wall": 5641.7} {"step": 2739, "train_loss": 4.022808074951172, "lr": 0.00039692562516042187, "tps": 31786, "wall": 5649.3} {"step": 2740, "train_loss": 4.047013759613037, "lr": 0.00039692209846176876, "tps": 31755, "wall": 5656.9} {"step": 2741, "train_loss": 3.8749704360961914, "lr": 0.00039691856975893254, "tps": 31723, "wall": 5664.5} {"step": 2742, "train_loss": 3.9809324741363525, "lr": 0.00039691503905195315, "tps": 31692, "wall": 5672.2} {"step": 2743, "train_loss": 4.013530731201172, "lr": 0.00039691150634087066, "tps": 31661, "wall": 5679.9} {"step": 2744, "train_loss": 3.993234634399414, "lr": 0.000396907971625725, "tps": 31629, "wall": 5687.5} {"step": 2745, "train_loss": 4.107979774475098, "lr": 0.00039690443490655636, "tps": 31599, "wall": 5695.1} {"step": 2746, "train_loss": 3.889991283416748, "lr": 0.00039690089618340467, "tps": 31568, "wall": 5702.8} {"step": 2747, "train_loss": 4.007807731628418, "lr": 0.00039689735545631006, "tps": 31537, "wall": 5710.4} {"step": 2748, "train_loss": 4.121071815490723, "lr": 0.0003968938127253126, "tps": 31507, "wall": 5718.0} {"step": 2749, "train_loss": 3.9855785369873047, "lr": 0.00039689026799045253, "tps": 31476, "wall": 5725.7} {"step": 2750, "train_loss": 3.984215259552002, "lr": 0.0003968867212517699, "tps": 31446, "wall": 5733.3} {"step": 2751, "train_loss": 4.029077053070068, "lr": 0.0003968831725093049, "tps": 31415, "wall": 5740.9} {"step": 2752, "train_loss": 3.9388041496276855, "lr": 0.00039687962176309776, "tps": 31385, "wall": 5748.5} {"step": 2753, "train_loss": 3.942721366882324, "lr": 0.0003968760690131887, "tps": 31355, "wall": 5756.1} {"step": 2754, "train_loss": 3.9306516647338867, "lr": 0.000396872514259618, "tps": 31324, "wall": 5763.9} {"step": 2755, "train_loss": 3.915309429168701, "lr": 0.00039686895750242585, "tps": 31294, "wall": 5771.5} {"step": 2756, "train_loss": 4.115179061889648, "lr": 0.0003968653987416526, "tps": 31264, "wall": 5779.1} {"step": 2757, "train_loss": 3.9812021255493164, "lr": 0.00039686183797733854, "tps": 31235, "wall": 5786.6} {"step": 2758, "train_loss": 3.964853286743164, "lr": 0.000396858275209524, "tps": 31205, "wall": 5794.3} {"step": 2759, "train_loss": 4.02365779876709, "lr": 0.0003968547104382494, "tps": 31175, "wall": 5801.9} {"step": 2760, "train_loss": 3.9546713829040527, "lr": 0.000396851143663555, "tps": 31145, "wall": 5809.6} {"step": 2761, "train_loss": 4.014625549316406, "lr": 0.00039684757488548126, "tps": 31115, "wall": 5817.4} {"step": 2762, "train_loss": 3.99678373336792, "lr": 0.00039684400410406874, "tps": 31085, "wall": 5825.0} {"step": 2763, "train_loss": 4.024501323699951, "lr": 0.0003968404313193577, "tps": 31056, "wall": 5832.7} {"step": 2764, "train_loss": 3.8542025089263916, "lr": 0.00039683685653138864, "tps": 31026, "wall": 5840.3} {"step": 2765, "train_loss": 3.988025188446045, "lr": 0.00039683327974020217, "tps": 30997, "wall": 5848.0} {"step": 2766, "train_loss": 4.022045135498047, "lr": 0.0003968297009458387, "tps": 30968, "wall": 5855.6} {"step": 2767, "train_loss": 3.957911252975464, "lr": 0.0003968261201483389, "tps": 30939, "wall": 5863.2} {"step": 2768, "train_loss": 3.9929652214050293, "lr": 0.0003968225373477432, "tps": 30910, "wall": 5870.7} {"step": 2769, "train_loss": 4.032459259033203, "lr": 0.0003968189525440921, "tps": 30881, "wall": 5878.5} {"step": 2770, "train_loss": 3.9494316577911377, "lr": 0.0003968153657374265, "tps": 30852, "wall": 5886.1} {"step": 2771, "train_loss": 3.9617128372192383, "lr": 0.0003968117769277868, "tps": 30824, "wall": 5893.6} {"step": 2772, "train_loss": 3.994619131088257, "lr": 0.00039680818611521375, "tps": 30795, "wall": 5901.3} {"step": 2773, "train_loss": 3.957423210144043, "lr": 0.00039680459329974804, "tps": 30766, "wall": 5909.0} {"step": 2774, "train_loss": 3.924534559249878, "lr": 0.0003968009984814303, "tps": 30737, "wall": 5916.6} {"step": 2775, "train_loss": 4.041910171508789, "lr": 0.0003967974016603012, "tps": 30709, "wall": 5924.2} {"step": 2776, "train_loss": 4.086296081542969, "lr": 0.00039679380283640174, "tps": 30681, "wall": 5931.8} {"step": 2777, "train_loss": 4.028632164001465, "lr": 0.0003967902020097724, "tps": 30652, "wall": 5939.5} {"step": 2778, "train_loss": 4.0785980224609375, "lr": 0.0003967865991804541, "tps": 30624, "wall": 5947.0} {"step": 2779, "train_loss": 3.9258921146392822, "lr": 0.00039678299434848765, "tps": 30596, "wall": 5954.7} {"step": 2780, "train_loss": 3.8994293212890625, "lr": 0.00039677938751391385, "tps": 30568, "wall": 5962.3} {"step": 2781, "train_loss": 3.9456677436828613, "lr": 0.00039677577867677365, "tps": 30540, "wall": 5969.9} {"step": 2782, "train_loss": 4.008321762084961, "lr": 0.0003967721678371078, "tps": 30512, "wall": 5977.5} {"step": 2783, "train_loss": 3.9059860706329346, "lr": 0.0003967685549949573, "tps": 30484, "wall": 5985.0} {"step": 2784, "train_loss": 4.058193206787109, "lr": 0.0003967649401503631, "tps": 30456, "wall": 5992.7} {"step": 2785, "train_loss": 3.924478530883789, "lr": 0.000396761323303366, "tps": 30429, "wall": 6000.3} {"step": 2786, "train_loss": 4.159354209899902, "lr": 0.00039675770445400714, "tps": 30401, "wall": 6007.9} {"step": 2787, "train_loss": 3.9545090198516846, "lr": 0.0003967540836023274, "tps": 30373, "wall": 6015.6} {"step": 2788, "train_loss": 4.0511956214904785, "lr": 0.00039675046074836787, "tps": 30346, "wall": 6023.1} {"step": 2789, "train_loss": 3.9912338256835938, "lr": 0.00039674683589216957, "tps": 30318, "wall": 6030.8} {"step": 2790, "train_loss": 3.9932172298431396, "lr": 0.00039674320903377344, "tps": 30291, "wall": 6038.4} {"step": 2791, "train_loss": 4.01436710357666, "lr": 0.00039673958017322073, "tps": 30264, "wall": 6045.9} {"step": 2792, "train_loss": 4.015635967254639, "lr": 0.00039673594931055253, "tps": 30237, "wall": 6053.5} {"step": 2793, "train_loss": 3.9578232765197754, "lr": 0.00039673231644580994, "tps": 30209, "wall": 6061.2} {"step": 2794, "train_loss": 4.005667686462402, "lr": 0.0003967286815790341, "tps": 30182, "wall": 6068.8} {"step": 2795, "train_loss": 4.032871246337891, "lr": 0.0003967250447102662, "tps": 30156, "wall": 6076.3} {"step": 2796, "train_loss": 3.9122369289398193, "lr": 0.00039672140583954735, "tps": 30129, "wall": 6083.9} {"step": 2797, "train_loss": 4.0887064933776855, "lr": 0.0003967177649669189, "tps": 30102, "wall": 6091.5} {"step": 2798, "train_loss": 3.936075210571289, "lr": 0.0003967141220924221, "tps": 30076, "wall": 6099.1} {"step": 2799, "train_loss": 4.036337852478027, "lr": 0.00039671047721609817, "tps": 30049, "wall": 6106.7} {"step": 2800, "train_loss": 3.8797926902770996, "lr": 0.00039670683033798834, "tps": 30022, "wall": 6114.2} {"step": 2801, "train_loss": 4.034870624542236, "lr": 0.00039670318145813404, "tps": 29995, "wall": 6121.9} {"step": 2802, "train_loss": 3.974935531616211, "lr": 0.00039669953057657647, "tps": 29969, "wall": 6129.5} {"step": 2803, "train_loss": 4.080513954162598, "lr": 0.00039669587769335704, "tps": 29943, "wall": 6137.1} {"step": 2804, "train_loss": 4.021453857421875, "lr": 0.00039669222280851727, "tps": 29916, "wall": 6144.7} {"step": 2805, "train_loss": 3.9900782108306885, "lr": 0.0003966885659220983, "tps": 29890, "wall": 6152.3} {"step": 2806, "train_loss": 4.040282249450684, "lr": 0.0003966849070341418, "tps": 29864, "wall": 6159.8} {"step": 2807, "train_loss": 3.9174578189849854, "lr": 0.00039668124614468907, "tps": 29838, "wall": 6167.5} {"step": 2808, "train_loss": 3.958747148513794, "lr": 0.00039667758325378165, "tps": 29812, "wall": 6175.0} {"step": 2809, "train_loss": 3.9884016513824463, "lr": 0.00039667391836146094, "tps": 29785, "wall": 6182.7} {"step": 2810, "train_loss": 4.014026165008545, "lr": 0.00039667025146776855, "tps": 29759, "wall": 6190.3} {"step": 2811, "train_loss": 3.9487173557281494, "lr": 0.000396666582572746, "tps": 29733, "wall": 6197.9} {"step": 2812, "train_loss": 3.9074788093566895, "lr": 0.00039666291167643497, "tps": 29707, "wall": 6205.5} {"step": 2813, "train_loss": 3.8422789573669434, "lr": 0.00039665923877887677, "tps": 29681, "wall": 6213.2} {"step": 2814, "train_loss": 3.949228286743164, "lr": 0.0003966555638801132, "tps": 29656, "wall": 6220.7} {"step": 2815, "train_loss": 4.009418964385986, "lr": 0.00039665188698018584, "tps": 29630, "wall": 6228.3} {"step": 2816, "train_loss": 3.938164234161377, "lr": 0.0003966482080791364, "tps": 29605, "wall": 6235.8} {"step": 2817, "train_loss": 4.012817859649658, "lr": 0.0003966445271770064, "tps": 29578, "wall": 6243.7} {"step": 2818, "train_loss": 3.9725446701049805, "lr": 0.0003966408442738377, "tps": 29553, "wall": 6251.2} {"step": 2819, "train_loss": 4.0286712646484375, "lr": 0.000396637159369672, "tps": 29528, "wall": 6258.8} {"step": 2820, "train_loss": 3.982132911682129, "lr": 0.00039663347246455096, "tps": 29503, "wall": 6266.4} {"step": 2821, "train_loss": 4.002749919891357, "lr": 0.00039662978355851637, "tps": 29478, "wall": 6273.9} {"step": 2822, "train_loss": 4.044594764709473, "lr": 0.00039662609265161004, "tps": 29453, "wall": 6281.4} {"step": 2823, "train_loss": 3.9885969161987305, "lr": 0.0003966223997438738, "tps": 29427, "wall": 6289.0} {"step": 2824, "train_loss": 4.1315813064575195, "lr": 0.00039661870483534943, "tps": 29403, "wall": 6296.6} {"step": 2825, "train_loss": 4.008669853210449, "lr": 0.0003966150079260788, "tps": 29377, "wall": 6304.3} {"step": 2826, "train_loss": 3.934767246246338, "lr": 0.0003966113090161039, "tps": 29352, "wall": 6311.9} {"step": 2827, "train_loss": 3.920681953430176, "lr": 0.0003966076081054665, "tps": 29327, "wall": 6319.5} {"step": 2828, "train_loss": 4.006000518798828, "lr": 0.00039660390519420847, "tps": 29302, "wall": 6327.1} {"step": 2829, "train_loss": 4.116545677185059, "lr": 0.00039660020028237195, "tps": 29278, "wall": 6334.7} {"step": 2830, "train_loss": 4.040176868438721, "lr": 0.00039659649336999875, "tps": 29253, "wall": 6342.3} {"step": 2831, "train_loss": 4.011125564575195, "lr": 0.00039659278445713095, "tps": 29229, "wall": 6349.8} {"step": 2832, "train_loss": 3.9175376892089844, "lr": 0.0003965890735438105, "tps": 29203, "wall": 6357.6} {"step": 2833, "train_loss": 3.97564697265625, "lr": 0.00039658536063007954, "tps": 29179, "wall": 6365.1} {"step": 2834, "train_loss": 4.071181774139404, "lr": 0.00039658164571598, "tps": 29154, "wall": 6372.7} {"step": 2835, "train_loss": 3.986354351043701, "lr": 0.00039657792880155407, "tps": 29130, "wall": 6380.3} {"step": 2836, "train_loss": 3.9786996841430664, "lr": 0.00039657420988684376, "tps": 29106, "wall": 6387.8} {"step": 2837, "train_loss": 3.968688488006592, "lr": 0.0003965704889718913, "tps": 29082, "wall": 6395.3} {"step": 2838, "train_loss": 3.969285488128662, "lr": 0.00039656676605673877, "tps": 29058, "wall": 6402.9} {"step": 2839, "train_loss": 4.1358137130737305, "lr": 0.0003965630411414283, "tps": 29031, "wall": 6411.1} {"step": 2840, "train_loss": 3.9874281883239746, "lr": 0.00039655931422600226, "tps": 29005, "wall": 6419.0} {"step": 2841, "train_loss": 4.030692100524902, "lr": 0.0003965555853105027, "tps": 28981, "wall": 6426.7} {"step": 2842, "train_loss": 3.912888526916504, "lr": 0.0003965518543949719, "tps": 28957, "wall": 6434.2} {"step": 2843, "train_loss": 3.891169309616089, "lr": 0.0003965481214794521, "tps": 28933, "wall": 6441.9} {"step": 2844, "train_loss": 3.943584442138672, "lr": 0.0003965443865639857, "tps": 28909, "wall": 6449.5} {"step": 2845, "train_loss": 3.899841785430908, "lr": 0.00039654064964861493, "tps": 28885, "wall": 6457.0} {"step": 2846, "train_loss": 3.9306912422180176, "lr": 0.00039653691073338217, "tps": 28861, "wall": 6464.6} {"step": 2847, "train_loss": 4.004018783569336, "lr": 0.00039653316981832967, "tps": 28838, "wall": 6472.1} {"step": 2848, "train_loss": 4.015224456787109, "lr": 0.0003965294269034999, "tps": 28814, "wall": 6479.8} {"step": 2849, "train_loss": 3.977483034133911, "lr": 0.00039652568198893516, "tps": 28791, "wall": 6487.3} {"step": 2850, "train_loss": 3.969130039215088, "lr": 0.0003965219350746781, "tps": 28767, "wall": 6494.9} {"step": 2851, "train_loss": 3.8916141986846924, "lr": 0.0003965181861607709, "tps": 28744, "wall": 6502.5} {"step": 2852, "train_loss": 3.9872076511383057, "lr": 0.00039651443524725614, "tps": 28720, "wall": 6510.0} {"step": 2853, "train_loss": 4.056666374206543, "lr": 0.00039651068233417634, "tps": 28697, "wall": 6517.6} {"step": 2854, "train_loss": 4.090041637420654, "lr": 0.000396506927421574, "tps": 28674, "wall": 6525.3} {"step": 2855, "train_loss": 3.9797041416168213, "lr": 0.0003965031705094916, "tps": 28650, "wall": 6532.8} {"step": 2856, "train_loss": 3.9951579570770264, "lr": 0.00039649941159797177, "tps": 28627, "wall": 6540.5} {"step": 2857, "train_loss": 4.073162078857422, "lr": 0.000396495650687057, "tps": 28603, "wall": 6548.2} {"step": 2858, "train_loss": 3.9942493438720703, "lr": 0.0003964918877767899, "tps": 28580, "wall": 6555.8} {"step": 2859, "train_loss": 4.022785186767578, "lr": 0.0003964881228672132, "tps": 28556, "wall": 6563.5} {"step": 2860, "train_loss": 4.021141052246094, "lr": 0.00039648435595836956, "tps": 28533, "wall": 6571.1} {"step": 2861, "train_loss": 3.9403862953186035, "lr": 0.00039648058705030154, "tps": 28511, "wall": 6578.6} {"step": 2862, "train_loss": 3.9255847930908203, "lr": 0.00039647681614305195, "tps": 28488, "wall": 6586.3} {"step": 2863, "train_loss": 3.9677093029022217, "lr": 0.0003964730432366634, "tps": 28465, "wall": 6593.9} {"step": 2864, "train_loss": 3.987785816192627, "lr": 0.0003964692683311786, "tps": 28441, "wall": 6601.6} {"step": 2865, "train_loss": 3.9556097984313965, "lr": 0.00039646549142664046, "tps": 28418, "wall": 6609.2} {"step": 2866, "train_loss": 4.082913398742676, "lr": 0.00039646171252309166, "tps": 28396, "wall": 6616.8} {"step": 2867, "train_loss": 3.9072439670562744, "lr": 0.00039645793162057497, "tps": 28373, "wall": 6624.3} {"step": 2868, "train_loss": 4.030656814575195, "lr": 0.0003964541487191334, "tps": 28350, "wall": 6632.0} {"step": 2869, "train_loss": 3.9699175357818604, "lr": 0.0003964503638188096, "tps": 28328, "wall": 6639.5} {"step": 2870, "train_loss": 3.9492299556732178, "lr": 0.0003964465769196466, "tps": 28305, "wall": 6647.2} {"step": 2871, "train_loss": 3.959669589996338, "lr": 0.0003964427880216872, "tps": 28283, "wall": 6654.7} {"step": 2872, "train_loss": 3.9682998657226562, "lr": 0.0003964389971249743, "tps": 28260, "wall": 6662.5} {"step": 2873, "train_loss": 3.948421001434326, "lr": 0.00039643520422955096, "tps": 28238, "wall": 6670.1} {"step": 2874, "train_loss": 4.039671897888184, "lr": 0.00039643140933546004, "tps": 28215, "wall": 6677.7} {"step": 2875, "train_loss": 3.934171438217163, "lr": 0.0003964276124427446, "tps": 28193, "wall": 6685.3} {"step": 2876, "train_loss": 4.022180557250977, "lr": 0.00039642381355144764, "tps": 28170, "wall": 6693.0} {"step": 2877, "train_loss": 3.9629907608032227, "lr": 0.0003964200126616122, "tps": 28149, "wall": 6700.5} {"step": 2878, "train_loss": 3.995779514312744, "lr": 0.0003964162097732813, "tps": 28127, "wall": 6708.1} {"step": 2879, "train_loss": 3.9151601791381836, "lr": 0.00039641240488649793, "tps": 28104, "wall": 6715.7} {"step": 2880, "train_loss": 3.9119770526885986, "lr": 0.0003964085980013054, "tps": 28082, "wall": 6723.5} {"step": 2881, "train_loss": 3.9535624980926514, "lr": 0.0003964047891177467, "tps": 28059, "wall": 6731.1} {"step": 2882, "train_loss": 3.879967212677002, "lr": 0.00039640097823586497, "tps": 28038, "wall": 6738.7} {"step": 2883, "train_loss": 4.042379379272461, "lr": 0.00039639716535570346, "tps": 28016, "wall": 6746.3} {"step": 2884, "train_loss": 4.011753559112549, "lr": 0.00039639335047730526, "tps": 27994, "wall": 6753.9} {"step": 2885, "train_loss": 4.025374412536621, "lr": 0.0003963895336007137, "tps": 27972, "wall": 6761.6} {"step": 2886, "train_loss": 3.945545196533203, "lr": 0.00039638571472597195, "tps": 27950, "wall": 6769.2} {"step": 2887, "train_loss": 3.9645590782165527, "lr": 0.00039638189385312326, "tps": 27928, "wall": 6776.8} {"step": 2888, "train_loss": 3.8971962928771973, "lr": 0.00039637807098221096, "tps": 27906, "wall": 6784.5} {"step": 2889, "train_loss": 3.8867080211639404, "lr": 0.0003963742461132783, "tps": 27885, "wall": 6792.1} {"step": 2890, "train_loss": 3.945997714996338, "lr": 0.0003963704192463687, "tps": 27863, "wall": 6799.7} {"step": 2891, "train_loss": 4.153015613555908, "lr": 0.0003963665903815254, "tps": 27841, "wall": 6807.4} {"step": 2892, "train_loss": 3.893566846847534, "lr": 0.0003963627595187918, "tps": 27820, "wall": 6814.9} {"step": 2893, "train_loss": 3.917215347290039, "lr": 0.00039635892665821135, "tps": 27799, "wall": 6822.5} {"step": 2894, "train_loss": 4.007583141326904, "lr": 0.0003963550917998275, "tps": 27778, "wall": 6830.1} {"step": 2895, "train_loss": 3.905059337615967, "lr": 0.0003963512549436835, "tps": 27756, "wall": 6837.8} {"step": 2896, "train_loss": 4.074444770812988, "lr": 0.00039634741608982304, "tps": 27735, "wall": 6845.4} {"step": 2897, "train_loss": 4.074591636657715, "lr": 0.00039634357523828947, "tps": 27714, "wall": 6853.0} {"step": 2898, "train_loss": 3.973888635635376, "lr": 0.00039633973238912634, "tps": 27693, "wall": 6860.5} {"step": 2899, "train_loss": 3.965054988861084, "lr": 0.0003963358875423772, "tps": 27672, "wall": 6868.0} {"step": 2900, "train_loss": 3.968080759048462, "lr": 0.0003963320406980856, "tps": 27650, "wall": 6875.7} {"step": 2901, "train_loss": 3.952850818634033, "lr": 0.000396328191856295, "tps": 27630, "wall": 6883.2} {"step": 2902, "train_loss": 4.021788120269775, "lr": 0.0003963243410170492, "tps": 27609, "wall": 6890.9} {"step": 2903, "train_loss": 4.022318363189697, "lr": 0.00039632048818039175, "tps": 27587, "wall": 6898.6} {"step": 2904, "train_loss": 4.027184009552002, "lr": 0.0003963166333463662, "tps": 27566, "wall": 6906.3} {"step": 2905, "train_loss": 3.9998016357421875, "lr": 0.00039631277651501636, "tps": 27546, "wall": 6913.8} {"step": 2906, "train_loss": 3.945232391357422, "lr": 0.0003963089176863858, "tps": 27525, "wall": 6921.4} {"step": 2907, "train_loss": 3.927506446838379, "lr": 0.00039630505686051825, "tps": 27504, "wall": 6929.0} {"step": 2908, "train_loss": 3.9522523880004883, "lr": 0.00039630119403745754, "tps": 27483, "wall": 6936.7} {"step": 2909, "train_loss": 3.942749500274658, "lr": 0.00039629732921724737, "tps": 27462, "wall": 6944.3} {"step": 2910, "train_loss": 3.9679346084594727, "lr": 0.0003962934623999315, "tps": 27442, "wall": 6951.9} {"step": 2911, "train_loss": 3.9376134872436523, "lr": 0.0003962895935855538, "tps": 27421, "wall": 6959.6} {"step": 2912, "train_loss": 3.936567783355713, "lr": 0.000396285722774158, "tps": 27400, "wall": 6967.3} {"step": 2913, "train_loss": 4.002707481384277, "lr": 0.0003962818499657879, "tps": 27379, "wall": 6974.9} {"step": 2914, "train_loss": 4.001238822937012, "lr": 0.00039627797516048757, "tps": 27359, "wall": 6982.6} {"step": 2915, "train_loss": 3.9652085304260254, "lr": 0.0003962740983583008, "tps": 27338, "wall": 6990.2} {"step": 2916, "train_loss": 3.9617700576782227, "lr": 0.0003962702195592714, "tps": 27318, "wall": 6997.7} {"step": 2917, "train_loss": 3.99485445022583, "lr": 0.00039626633876344356, "tps": 27298, "wall": 7005.3} {"step": 2918, "train_loss": 4.017065048217773, "lr": 0.0003962624559708611, "tps": 27278, "wall": 7013.0} {"step": 2919, "train_loss": 3.9052767753601074, "lr": 0.00039625857118156794, "tps": 27257, "wall": 7020.7} {"step": 2920, "train_loss": 3.9460344314575195, "lr": 0.00039625468439560813, "tps": 27237, "wall": 7028.3} {"step": 2921, "train_loss": 3.911953926086426, "lr": 0.0003962507956130258, "tps": 27217, "wall": 7035.9} {"step": 2922, "train_loss": 3.952524423599243, "lr": 0.00039624690483386484, "tps": 27196, "wall": 7043.5} {"step": 2923, "train_loss": 3.9074149131774902, "lr": 0.00039624301205816947, "tps": 27176, "wall": 7051.1} {"step": 2924, "train_loss": 4.004453182220459, "lr": 0.00039623911728598366, "tps": 27156, "wall": 7058.7} {"step": 2925, "train_loss": 4.032917022705078, "lr": 0.0003962352205173516, "tps": 27136, "wall": 7066.4} {"step": 2926, "train_loss": 3.950735092163086, "lr": 0.0003962313217523175, "tps": 27116, "wall": 7074.0} {"step": 2927, "train_loss": 4.043909072875977, "lr": 0.0003962274209909254, "tps": 27096, "wall": 7081.8} {"step": 2928, "train_loss": 3.868159294128418, "lr": 0.00039622351823321954, "tps": 27076, "wall": 7089.4} {"step": 2929, "train_loss": 3.953967571258545, "lr": 0.00039621961347924414, "tps": 27056, "wall": 7097.0} {"step": 2930, "train_loss": 3.944248676300049, "lr": 0.00039621570672904345, "tps": 27036, "wall": 7104.6} {"step": 2931, "train_loss": 3.9419140815734863, "lr": 0.0003962117979826617, "tps": 27016, "wall": 7112.3} {"step": 2932, "train_loss": 3.963844060897827, "lr": 0.00039620788724014315, "tps": 26996, "wall": 7120.0} {"step": 2933, "train_loss": 3.975667715072632, "lr": 0.0003962039745015321, "tps": 26977, "wall": 7127.6} {"step": 2934, "train_loss": 3.935929298400879, "lr": 0.0003962000597668729, "tps": 26957, "wall": 7135.3} {"step": 2935, "train_loss": 3.8899359703063965, "lr": 0.0003961961430362099, "tps": 26937, "wall": 7143.1} {"step": 2936, "train_loss": 4.012789249420166, "lr": 0.00039619222430958747, "tps": 26917, "wall": 7150.7} {"step": 2937, "train_loss": 4.017292499542236, "lr": 0.00039618830358704993, "tps": 26897, "wall": 7158.4} {"step": 2938, "train_loss": 3.869781017303467, "lr": 0.00039618438086864186, "tps": 26877, "wall": 7166.1} {"step": 2939, "train_loss": 4.110910415649414, "lr": 0.00039618045615440753, "tps": 26858, "wall": 7173.8} {"step": 2940, "train_loss": 3.992321252822876, "lr": 0.0003961765294443915, "tps": 26839, "wall": 7181.3} {"step": 2941, "train_loss": 3.8840112686157227, "lr": 0.0003961726007386382, "tps": 26819, "wall": 7189.0} {"step": 2942, "train_loss": 3.944740056991577, "lr": 0.00039616867003719214, "tps": 26800, "wall": 7196.6} {"step": 2943, "train_loss": 3.931504726409912, "lr": 0.00039616473734009784, "tps": 26780, "wall": 7204.3} {"step": 2944, "train_loss": 3.973820686340332, "lr": 0.0003961608026473999, "tps": 26761, "wall": 7211.9} {"step": 2945, "train_loss": 4.00997257232666, "lr": 0.0003961568659591428, "tps": 26742, "wall": 7219.6} {"step": 2946, "train_loss": 4.015091896057129, "lr": 0.0003961529272753712, "tps": 26723, "wall": 7227.2} {"step": 2947, "train_loss": 3.9139244556427, "lr": 0.0003961489865961298, "tps": 26703, "wall": 7234.9} {"step": 2948, "train_loss": 4.1190595626831055, "lr": 0.000396145043921463, "tps": 26684, "wall": 7242.5} {"step": 2949, "train_loss": 3.9829277992248535, "lr": 0.00039614109925141576, "tps": 26665, "wall": 7250.3} {"step": 2950, "train_loss": 3.9435746669769287, "lr": 0.0003961371525860326, "tps": 26645, "wall": 7258.1} {"step": 2951, "train_loss": 3.9873080253601074, "lr": 0.0003961332039253582, "tps": 26626, "wall": 7265.8} {"step": 2952, "train_loss": 3.8981332778930664, "lr": 0.0003961292532694373, "tps": 26607, "wall": 7273.4} {"step": 2953, "train_loss": 3.9583985805511475, "lr": 0.00039612530061831474, "tps": 26588, "wall": 7281.1} {"step": 2954, "train_loss": 4.0092549324035645, "lr": 0.00039612134597203524, "tps": 26569, "wall": 7288.8} {"step": 2955, "train_loss": 3.915681838989258, "lr": 0.00039611738933064365, "tps": 26550, "wall": 7296.4} {"step": 2956, "train_loss": 3.8391571044921875, "lr": 0.00039611343069418466, "tps": 26532, "wall": 7304.0} {"step": 2957, "train_loss": 3.884122848510742, "lr": 0.0003961094700627033, "tps": 26513, "wall": 7311.7} {"step": 2958, "train_loss": 4.023083209991455, "lr": 0.00039610550743624423, "tps": 26494, "wall": 7319.4} {"step": 2959, "train_loss": 3.862781286239624, "lr": 0.0003961015428148525, "tps": 26475, "wall": 7327.1} {"step": 2960, "train_loss": 3.9018869400024414, "lr": 0.000396097576198573, "tps": 26456, "wall": 7334.7} {"step": 2961, "train_loss": 3.843090057373047, "lr": 0.00039609360758745054, "tps": 26437, "wall": 7342.4} {"step": 2962, "train_loss": 3.8865303993225098, "lr": 0.0003960896369815302, "tps": 26419, "wall": 7350.1} {"step": 2963, "train_loss": 3.940004348754883, "lr": 0.00039608566438085693, "tps": 26400, "wall": 7357.8} {"step": 2964, "train_loss": 3.8825082778930664, "lr": 0.00039608168978547576, "tps": 26382, "wall": 7365.4} {"step": 2965, "train_loss": 3.939793586730957, "lr": 0.00039607771319543164, "tps": 26363, "wall": 7373.0} {"step": 2966, "train_loss": 4.0085062980651855, "lr": 0.00039607373461076966, "tps": 26344, "wall": 7380.8} {"step": 2967, "train_loss": 3.943028688430786, "lr": 0.00039606975403153494, "tps": 26326, "wall": 7388.4} {"step": 2968, "train_loss": 3.9407551288604736, "lr": 0.00039606577145777247, "tps": 26307, "wall": 7396.1} {"step": 2969, "train_loss": 3.9771151542663574, "lr": 0.00039606178688952746, "tps": 26289, "wall": 7403.7} {"step": 2970, "train_loss": 3.8989930152893066, "lr": 0.00039605780032684495, "tps": 26271, "wall": 7411.5} {"step": 2971, "train_loss": 3.999932050704956, "lr": 0.00039605381176977016, "tps": 26253, "wall": 7419.0} {"step": 2972, "train_loss": 3.858532428741455, "lr": 0.0003960498212183483, "tps": 26235, "wall": 7426.7} {"step": 2973, "train_loss": 3.9752941131591797, "lr": 0.0003960458286726246, "tps": 26216, "wall": 7434.3} {"step": 2974, "train_loss": 3.932274103164673, "lr": 0.0003960418341326441, "tps": 26198, "wall": 7442.1} {"step": 2975, "train_loss": 3.936460494995117, "lr": 0.00039603783759845226, "tps": 26180, "wall": 7449.7} {"step": 2976, "train_loss": 3.9269630908966064, "lr": 0.0003960338390700943, "tps": 26162, "wall": 7457.4} {"step": 2977, "train_loss": 4.008119583129883, "lr": 0.0003960298385476154, "tps": 26144, "wall": 7465.0} {"step": 2978, "train_loss": 3.874305248260498, "lr": 0.00039602583603106094, "tps": 26126, "wall": 7472.7} {"step": 2979, "train_loss": 3.964543342590332, "lr": 0.0003960218315204764, "tps": 26107, "wall": 7480.4} {"step": 2980, "train_loss": 3.9204282760620117, "lr": 0.00039601782501590696, "tps": 26090, "wall": 7488.0} {"step": 2981, "train_loss": 3.978801727294922, "lr": 0.00039601381651739815, "tps": 26072, "wall": 7495.7} {"step": 2982, "train_loss": 3.860415458679199, "lr": 0.00039600980602499524, "tps": 26053, "wall": 7503.5} {"step": 2983, "train_loss": 3.9434189796447754, "lr": 0.0003960057935387437, "tps": 26035, "wall": 7511.3} {"step": 2984, "train_loss": 3.9632158279418945, "lr": 0.000396001779058689, "tps": 26017, "wall": 7518.9} {"step": 2985, "train_loss": 3.955526351928711, "lr": 0.0003959977625848767, "tps": 25999, "wall": 7526.6} {"step": 2986, "train_loss": 3.851881504058838, "lr": 0.0003959937441173522, "tps": 25982, "wall": 7534.2} {"step": 2987, "train_loss": 3.844815492630005, "lr": 0.000395989723656161, "tps": 25964, "wall": 7542.0} {"step": 2988, "train_loss": 3.939218044281006, "lr": 0.0003959857012013488, "tps": 25946, "wall": 7549.6} {"step": 2989, "train_loss": 4.016117095947266, "lr": 0.00039598167675296096, "tps": 25928, "wall": 7557.4} {"step": 2990, "train_loss": 3.928412437438965, "lr": 0.00039597765031104324, "tps": 25910, "wall": 7565.1} {"step": 2991, "train_loss": 3.94496750831604, "lr": 0.0003959736218756411, "tps": 25893, "wall": 7572.8} {"step": 2992, "train_loss": 3.9934263229370117, "lr": 0.00039596959144680026, "tps": 25875, "wall": 7580.5} {"step": 2993, "train_loss": 3.961533784866333, "lr": 0.0003959655590245664, "tps": 25858, "wall": 7588.1} {"step": 2994, "train_loss": 3.949096202850342, "lr": 0.00039596152460898517, "tps": 25840, "wall": 7595.8} {"step": 2995, "train_loss": 3.9232444763183594, "lr": 0.00039595748820010226, "tps": 25823, "wall": 7603.5} {"step": 2996, "train_loss": 3.9210987091064453, "lr": 0.00039595344979796336, "tps": 25805, "wall": 7611.3} {"step": 2997, "train_loss": 3.9457955360412598, "lr": 0.0003959494094026143, "tps": 25786, "wall": 7619.3} {"step": 2998, "train_loss": 3.8414132595062256, "lr": 0.0003959453670141008, "tps": 25769, "wall": 7626.9} {"step": 2999, "train_loss": 3.8579039573669434, "lr": 0.0003959413226324687, "tps": 25752, "wall": 7634.6} {"step": 3000, "train_loss": 3.9199941158294678, "lr": 0.0003959372762577638, "tps": 25735, "wall": 7642.2, "val_loss_monitor": 3.964563193072316} {"step": 3001, "train_loss": 3.8936288356781006, "lr": 0.0003959332278900318, "tps": 25557, "wall": 7698.0} {"step": 3002, "train_loss": 3.9827332496643066, "lr": 0.00039592917752931877, "tps": 25539, "wall": 7705.8} {"step": 3003, "train_loss": 3.94065523147583, "lr": 0.0003959251251756705, "tps": 25522, "wall": 7713.6} {"step": 3004, "train_loss": 3.9330313205718994, "lr": 0.00039592107082913285, "tps": 25505, "wall": 7721.4} {"step": 3005, "train_loss": 3.784304618835449, "lr": 0.00039591701448975187, "tps": 25487, "wall": 7729.2} {"step": 3006, "train_loss": 3.910799503326416, "lr": 0.0003959129561575733, "tps": 25470, "wall": 7737.0} {"step": 3007, "train_loss": 3.9766552448272705, "lr": 0.00039590889583264335, "tps": 25453, "wall": 7744.9} {"step": 3008, "train_loss": 4.082178115844727, "lr": 0.0003959048335150079, "tps": 25436, "wall": 7752.7} {"step": 3009, "train_loss": 3.909069061279297, "lr": 0.000395900769204713, "tps": 25419, "wall": 7760.4} {"step": 3010, "train_loss": 3.941740036010742, "lr": 0.0003958967029018046, "tps": 25402, "wall": 7768.2} {"step": 3011, "train_loss": 4.0494489669799805, "lr": 0.0003958926346063288, "tps": 25385, "wall": 7776.0} {"step": 3012, "train_loss": 3.9283437728881836, "lr": 0.0003958885643183318, "tps": 25368, "wall": 7783.7} {"step": 3013, "train_loss": 3.897066116333008, "lr": 0.00039588449203785967, "tps": 25351, "wall": 7791.5} {"step": 3014, "train_loss": 3.9359982013702393, "lr": 0.0003958804177649584, "tps": 25334, "wall": 7799.4} {"step": 3015, "train_loss": 4.021873474121094, "lr": 0.0003958763414996743, "tps": 25317, "wall": 7807.1} {"step": 3016, "train_loss": 3.9484152793884277, "lr": 0.0003958722632420535, "tps": 25300, "wall": 7814.9} {"step": 3017, "train_loss": 3.95963191986084, "lr": 0.0003958681829921421, "tps": 25282, "wall": 7823.2} {"step": 3018, "train_loss": 3.9059267044067383, "lr": 0.00039586410074998654, "tps": 25264, "wall": 7831.2} {"step": 3019, "train_loss": 3.907871961593628, "lr": 0.0003958600165156328, "tps": 25247, "wall": 7839.2} {"step": 3020, "train_loss": 3.955803871154785, "lr": 0.00039585593028912744, "tps": 25230, "wall": 7847.2} {"step": 3021, "train_loss": 4.000230312347412, "lr": 0.00039585184207051647, "tps": 25209, "wall": 7856.3} {"step": 3022, "train_loss": 4.030280590057373, "lr": 0.0003958477518598463, "tps": 25191, "wall": 7864.5} {"step": 3023, "train_loss": 3.885716199874878, "lr": 0.00039584365965716336, "tps": 25174, "wall": 7872.3} {"step": 3024, "train_loss": 4.062997817993164, "lr": 0.00039583956546251393, "tps": 25158, "wall": 7880.0} {"step": 3025, "train_loss": 3.8207170963287354, "lr": 0.0003958354692759443, "tps": 25141, "wall": 7887.8} {"step": 3026, "train_loss": 3.962461471557617, "lr": 0.00039583137109750106, "tps": 25125, "wall": 7895.6} {"step": 3027, "train_loss": 3.94756817817688, "lr": 0.0003958272709272305, "tps": 25108, "wall": 7903.3} {"step": 3028, "train_loss": 3.9235193729400635, "lr": 0.0003958231687651791, "tps": 25092, "wall": 7911.0} {"step": 3029, "train_loss": 3.9723620414733887, "lr": 0.00039581906461139333, "tps": 25075, "wall": 7918.9} {"step": 3030, "train_loss": 4.042577743530273, "lr": 0.00039581495846591967, "tps": 25059, "wall": 7926.7} {"step": 3031, "train_loss": 3.944540023803711, "lr": 0.0003958108503288046, "tps": 25043, "wall": 7934.4} {"step": 3032, "train_loss": 3.9451208114624023, "lr": 0.0003958067402000948, "tps": 25027, "wall": 7942.1} {"step": 3033, "train_loss": 3.9993057250976562, "lr": 0.00039580262807983673, "tps": 25011, "wall": 7949.9} {"step": 3034, "train_loss": 3.8972315788269043, "lr": 0.00039579851396807697, "tps": 24995, "wall": 7957.6} {"step": 3035, "train_loss": 3.968569278717041, "lr": 0.0003957943978648621, "tps": 24979, "wall": 7965.4} {"step": 3036, "train_loss": 4.003903388977051, "lr": 0.00039579027977023874, "tps": 24962, "wall": 7973.1} {"step": 3037, "train_loss": 3.985621452331543, "lr": 0.0003957861596842537, "tps": 24946, "wall": 7981.0} {"step": 3038, "train_loss": 3.999136447906494, "lr": 0.0003957820376069534, "tps": 24930, "wall": 7988.7} {"step": 3039, "train_loss": 3.9514617919921875, "lr": 0.0003957779135383848, "tps": 24914, "wall": 7996.5} {"step": 3040, "train_loss": 3.8961024284362793, "lr": 0.0003957737874785944, "tps": 24898, "wall": 8004.2} {"step": 3041, "train_loss": 3.918217182159424, "lr": 0.0003957696594276291, "tps": 24883, "wall": 8011.9} {"step": 3042, "train_loss": 3.8641977310180664, "lr": 0.0003957655293855355, "tps": 24867, "wall": 8019.6} {"step": 3043, "train_loss": 3.9742937088012695, "lr": 0.00039576139735236055, "tps": 24851, "wall": 8027.2} {"step": 3044, "train_loss": 3.8867926597595215, "lr": 0.0003957572633281509, "tps": 24836, "wall": 8034.9} {"step": 3045, "train_loss": 3.880101442337036, "lr": 0.00039575312731295357, "tps": 24820, "wall": 8042.7} {"step": 3046, "train_loss": 3.8008289337158203, "lr": 0.0003957489893068152, "tps": 24804, "wall": 8050.3} {"step": 3047, "train_loss": 3.9626874923706055, "lr": 0.00039574484930978283, "tps": 24789, "wall": 8058.1} {"step": 3048, "train_loss": 3.9110913276672363, "lr": 0.0003957407073219033, "tps": 24773, "wall": 8065.9} {"step": 3049, "train_loss": 3.9256715774536133, "lr": 0.0003957365633432235, "tps": 24757, "wall": 8073.6} {"step": 3050, "train_loss": 3.920008659362793, "lr": 0.00039573241737379046, "tps": 24742, "wall": 8081.2} {"step": 3051, "train_loss": 3.946322202682495, "lr": 0.000395728269413651, "tps": 24727, "wall": 8088.9} {"step": 3052, "train_loss": 3.919680118560791, "lr": 0.00039572411946285223, "tps": 24712, "wall": 8096.5} {"step": 3053, "train_loss": 3.9894890785217285, "lr": 0.00039571996752144116, "tps": 24696, "wall": 8104.3} {"step": 3054, "train_loss": 4.021892547607422, "lr": 0.0003957158135894647, "tps": 24680, "wall": 8112.0} {"step": 3055, "train_loss": 3.8743607997894287, "lr": 0.0003957116576669702, "tps": 24665, "wall": 8119.8} {"step": 3056, "train_loss": 4.0028581619262695, "lr": 0.00039570749975400437, "tps": 24650, "wall": 8127.5} {"step": 3057, "train_loss": 3.940614700317383, "lr": 0.0003957033398506145, "tps": 24634, "wall": 8135.3} {"step": 3058, "train_loss": 3.9671859741210938, "lr": 0.0003956991779568477, "tps": 24619, "wall": 8143.0} {"step": 3059, "train_loss": 3.9283270835876465, "lr": 0.00039569501407275116, "tps": 24604, "wall": 8150.7} {"step": 3060, "train_loss": 3.9172921180725098, "lr": 0.0003956908481983719, "tps": 24588, "wall": 8158.5} {"step": 3061, "train_loss": 3.8358287811279297, "lr": 0.0003956866803337573, "tps": 24573, "wall": 8166.2} {"step": 3062, "train_loss": 3.9499599933624268, "lr": 0.0003956825104789544, "tps": 24558, "wall": 8173.9} {"step": 3063, "train_loss": 3.8322739601135254, "lr": 0.0003956783386340106, "tps": 24543, "wall": 8181.5} {"step": 3064, "train_loss": 3.90116548538208, "lr": 0.000395674164798973, "tps": 24528, "wall": 8189.2} {"step": 3065, "train_loss": 3.923048973083496, "lr": 0.00039566998897388897, "tps": 24513, "wall": 8196.9} {"step": 3066, "train_loss": 3.89920711517334, "lr": 0.00039566581115880583, "tps": 24498, "wall": 8204.6} {"step": 3067, "train_loss": 3.8791306018829346, "lr": 0.0003956616313537709, "tps": 24483, "wall": 8212.4} {"step": 3068, "train_loss": 4.016050338745117, "lr": 0.0003956574495588315, "tps": 24467, "wall": 8220.1} {"step": 3069, "train_loss": 3.9289684295654297, "lr": 0.00039565326577403493, "tps": 24453, "wall": 8227.8} {"step": 3070, "train_loss": 3.8924827575683594, "lr": 0.00039564907999942877, "tps": 24438, "wall": 8235.5} {"step": 3071, "train_loss": 3.910208225250244, "lr": 0.00039564489223506026, "tps": 24423, "wall": 8243.2} {"step": 3072, "train_loss": 3.8840842247009277, "lr": 0.0003956407024809769, "tps": 24408, "wall": 8250.8} {"step": 3073, "train_loss": 3.863788604736328, "lr": 0.00039563651073722616, "tps": 24393, "wall": 8258.6} {"step": 3074, "train_loss": 3.9163765907287598, "lr": 0.00039563231700385555, "tps": 24379, "wall": 8266.2} {"step": 3075, "train_loss": 3.9246788024902344, "lr": 0.0003956281212809126, "tps": 24364, "wall": 8273.9} {"step": 3076, "train_loss": 3.910825252532959, "lr": 0.0003956239235684447, "tps": 24349, "wall": 8281.7} {"step": 3077, "train_loss": 3.9651482105255127, "lr": 0.00039561972386649956, "tps": 24334, "wall": 8289.4} {"step": 3078, "train_loss": 3.9169952869415283, "lr": 0.00039561552217512463, "tps": 24320, "wall": 8297.1} {"step": 3079, "train_loss": 3.916574001312256, "lr": 0.0003956113184943676, "tps": 24305, "wall": 8304.8} {"step": 3080, "train_loss": 3.8415579795837402, "lr": 0.0003956071128242761, "tps": 24290, "wall": 8312.4} {"step": 3081, "train_loss": 3.8483991622924805, "lr": 0.0003956029051648976, "tps": 24276, "wall": 8320.2} {"step": 3082, "train_loss": 3.795340061187744, "lr": 0.00039559869551628, "tps": 24261, "wall": 8327.8} {"step": 3083, "train_loss": 3.965963840484619, "lr": 0.0003955944838784708, "tps": 24247, "wall": 8335.6} {"step": 3084, "train_loss": 3.931821823120117, "lr": 0.00039559027025151786, "tps": 24231, "wall": 8343.5} {"step": 3085, "train_loss": 3.915756940841675, "lr": 0.00039558605463546885, "tps": 24217, "wall": 8351.1} {"step": 3086, "train_loss": 3.9453248977661133, "lr": 0.00039558183703037144, "tps": 24203, "wall": 8358.9} {"step": 3087, "train_loss": 4.001570701599121, "lr": 0.00039557761743627353, "tps": 24188, "wall": 8366.5} {"step": 3088, "train_loss": 3.8891794681549072, "lr": 0.00039557339585322284, "tps": 24174, "wall": 8374.2} {"step": 3089, "train_loss": 3.94277024269104, "lr": 0.0003955691722812672, "tps": 24159, "wall": 8381.9} {"step": 3090, "train_loss": 4.053829669952393, "lr": 0.0003955649467204546, "tps": 24145, "wall": 8389.7} {"step": 3091, "train_loss": 3.894531488418579, "lr": 0.00039556071917083263, "tps": 24130, "wall": 8397.4} {"step": 3092, "train_loss": 3.9903693199157715, "lr": 0.0003955564896324494, "tps": 24116, "wall": 8405.3} {"step": 3093, "train_loss": 3.8765716552734375, "lr": 0.0003955522581053528, "tps": 24101, "wall": 8413.0} {"step": 3094, "train_loss": 3.940239429473877, "lr": 0.0003955480245895907, "tps": 24087, "wall": 8420.6} {"step": 3095, "train_loss": 3.945378303527832, "lr": 0.00039554378908521106, "tps": 24073, "wall": 8428.3} {"step": 3096, "train_loss": 3.9017391204833984, "lr": 0.00039553955159226187, "tps": 24059, "wall": 8436.0} {"step": 3097, "train_loss": 3.9124948978424072, "lr": 0.0003955353121107912, "tps": 24045, "wall": 8443.7} {"step": 3098, "train_loss": 4.0116801261901855, "lr": 0.0003955310706408469, "tps": 24031, "wall": 8451.4} {"step": 3099, "train_loss": 3.899803638458252, "lr": 0.0003955268271824773, "tps": 24016, "wall": 8459.2} {"step": 3100, "train_loss": 3.9717111587524414, "lr": 0.00039552258173573016, "tps": 24002, "wall": 8466.9} {"step": 3101, "train_loss": 3.8944129943847656, "lr": 0.0003955183343006538, "tps": 23988, "wall": 8474.7} {"step": 3102, "train_loss": 3.747326135635376, "lr": 0.00039551408487729624, "tps": 23974, "wall": 8482.4} {"step": 3103, "train_loss": 3.8624508380889893, "lr": 0.00039550983346570563, "tps": 23960, "wall": 8490.1} {"step": 3104, "train_loss": 3.9138646125793457, "lr": 0.0003955055800659301, "tps": 23946, "wall": 8497.8} {"step": 3105, "train_loss": 3.931368350982666, "lr": 0.0003955013246780179, "tps": 23932, "wall": 8505.5} {"step": 3106, "train_loss": 3.8394429683685303, "lr": 0.0003954970673020172, "tps": 23918, "wall": 8513.2} {"step": 3107, "train_loss": 3.8889732360839844, "lr": 0.00039549280793797623, "tps": 23903, "wall": 8521.1} {"step": 3108, "train_loss": 3.8055901527404785, "lr": 0.0003954885465859432, "tps": 23889, "wall": 8529.0} {"step": 3109, "train_loss": 3.8126325607299805, "lr": 0.0003954842832459665, "tps": 23875, "wall": 8536.6} {"step": 3110, "train_loss": 3.873326539993286, "lr": 0.0003954800179180943, "tps": 23861, "wall": 8544.4} {"step": 3111, "train_loss": 3.9258437156677246, "lr": 0.0003954757506023749, "tps": 23847, "wall": 8552.1} {"step": 3112, "train_loss": 3.8566837310791016, "lr": 0.0003954714812988568, "tps": 23833, "wall": 8559.8} {"step": 3113, "train_loss": 3.8541786670684814, "lr": 0.0003954672100075882, "tps": 23820, "wall": 8567.5} {"step": 3114, "train_loss": 3.8794312477111816, "lr": 0.00039546293672861754, "tps": 23806, "wall": 8575.3} {"step": 3115, "train_loss": 3.9451043605804443, "lr": 0.0003954586614619933, "tps": 23791, "wall": 8583.2} {"step": 3116, "train_loss": 3.9887638092041016, "lr": 0.00039545438420776386, "tps": 23777, "wall": 8591.0} {"step": 3117, "train_loss": 3.952099323272705, "lr": 0.00039545010496597763, "tps": 23764, "wall": 8598.7} {"step": 3118, "train_loss": 3.912614345550537, "lr": 0.0003954458237366831, "tps": 23750, "wall": 8606.5} {"step": 3119, "train_loss": 3.8547592163085938, "lr": 0.0003954415405199288, "tps": 23736, "wall": 8614.1} {"step": 3120, "train_loss": 3.8739967346191406, "lr": 0.00039543725531576327, "tps": 23723, "wall": 8621.9} {"step": 3121, "train_loss": 3.99151349067688, "lr": 0.000395432968124235, "tps": 23709, "wall": 8629.6} {"step": 3122, "train_loss": 3.9350504875183105, "lr": 0.00039542867894539255, "tps": 23695, "wall": 8637.3} {"step": 3123, "train_loss": 4.0321125984191895, "lr": 0.0003954243877792846, "tps": 23682, "wall": 8645.1} {"step": 3124, "train_loss": 3.9725632667541504, "lr": 0.00039542009462595963, "tps": 23668, "wall": 8652.8} {"step": 3125, "train_loss": 4.032615661621094, "lr": 0.00039541579948546636, "tps": 23655, "wall": 8660.5} {"step": 3126, "train_loss": 3.999628782272339, "lr": 0.0003954115023578534, "tps": 23641, "wall": 8668.1} {"step": 3127, "train_loss": 3.963555335998535, "lr": 0.0003954072032431696, "tps": 23628, "wall": 8675.8} {"step": 3128, "train_loss": 3.9332470893859863, "lr": 0.0003954029021414633, "tps": 23615, "wall": 8683.5} {"step": 3129, "train_loss": 3.834731340408325, "lr": 0.00039539859905278355, "tps": 23601, "wall": 8691.2} {"step": 3130, "train_loss": 3.8945374488830566, "lr": 0.000395394293977179, "tps": 23587, "wall": 8699.1} {"step": 3131, "train_loss": 3.856825351715088, "lr": 0.00039538998691469835, "tps": 23574, "wall": 8706.8} {"step": 3132, "train_loss": 4.104612827301025, "lr": 0.0003953856778653904, "tps": 23561, "wall": 8714.4} {"step": 3133, "train_loss": 3.9158010482788086, "lr": 0.00039538136682930406, "tps": 23547, "wall": 8722.2} {"step": 3134, "train_loss": 3.934211492538452, "lr": 0.0003953770538064881, "tps": 23534, "wall": 8729.9} {"step": 3135, "train_loss": 4.046183109283447, "lr": 0.00039537273879699137, "tps": 23521, "wall": 8737.6} {"step": 3136, "train_loss": 3.926082134246826, "lr": 0.0003953684218008628, "tps": 23508, "wall": 8745.3} {"step": 3137, "train_loss": 3.9351673126220703, "lr": 0.00039536410281815123, "tps": 23494, "wall": 8753.1} {"step": 3138, "train_loss": 3.935850143432617, "lr": 0.0003953597818489056, "tps": 23481, "wall": 8760.9} {"step": 3139, "train_loss": 3.809269428253174, "lr": 0.00039535545889317494, "tps": 23468, "wall": 8768.7} {"step": 3140, "train_loss": 3.8913726806640625, "lr": 0.0003953511339510081, "tps": 23454, "wall": 8776.4} {"step": 3141, "train_loss": 3.882728099822998, "lr": 0.00039534680702245416, "tps": 23441, "wall": 8784.1} {"step": 3142, "train_loss": 3.928616523742676, "lr": 0.0003953424781075621, "tps": 23428, "wall": 8791.8} {"step": 3143, "train_loss": 3.8860812187194824, "lr": 0.00039533814720638094, "tps": 23415, "wall": 8799.5} {"step": 3144, "train_loss": 3.9331650733947754, "lr": 0.00039533381431895975, "tps": 23402, "wall": 8807.3} {"step": 3145, "train_loss": 3.9791135787963867, "lr": 0.0003953294794453477, "tps": 23389, "wall": 8815.1} {"step": 3146, "train_loss": 3.9090609550476074, "lr": 0.0003953251425855937, "tps": 23375, "wall": 8822.9} {"step": 3147, "train_loss": 3.9458706378936768, "lr": 0.0003953208037397471, "tps": 23362, "wall": 8830.7} {"step": 3148, "train_loss": 3.897669792175293, "lr": 0.00039531646290785695, "tps": 23349, "wall": 8838.4} {"step": 3149, "train_loss": 3.9781088829040527, "lr": 0.0003953121200899724, "tps": 23336, "wall": 8846.1} {"step": 3150, "train_loss": 3.845742702484131, "lr": 0.0003953077752861427, "tps": 23323, "wall": 8853.9} {"step": 3151, "train_loss": 3.883387565612793, "lr": 0.00039530342849641696, "tps": 23310, "wall": 8861.6} {"step": 3152, "train_loss": 3.8987255096435547, "lr": 0.00039529907972084456, "tps": 23297, "wall": 8869.4} {"step": 3153, "train_loss": 3.9243593215942383, "lr": 0.0003952947289594747, "tps": 23284, "wall": 8877.1} {"step": 3154, "train_loss": 3.9228901863098145, "lr": 0.00039529037621235664, "tps": 23271, "wall": 8884.9} {"step": 3155, "train_loss": 3.9455480575561523, "lr": 0.00039528602147953973, "tps": 23258, "wall": 8892.6} {"step": 3156, "train_loss": 3.93058443069458, "lr": 0.00039528166476107327, "tps": 23245, "wall": 8900.4} {"step": 3157, "train_loss": 3.956653118133545, "lr": 0.0003952773060570066, "tps": 23233, "wall": 8908.1} {"step": 3158, "train_loss": 3.909669876098633, "lr": 0.0003952729453673892, "tps": 23220, "wall": 8915.9} {"step": 3159, "train_loss": 3.8138108253479004, "lr": 0.0003952685826922704, "tps": 23207, "wall": 8923.5} {"step": 3160, "train_loss": 3.9613852500915527, "lr": 0.0003952642180316995, "tps": 23194, "wall": 8931.2} {"step": 3161, "train_loss": 3.8654091358184814, "lr": 0.00039525985138572615, "tps": 23181, "wall": 8939.1} {"step": 3162, "train_loss": 3.989750862121582, "lr": 0.0003952554827543997, "tps": 23169, "wall": 8946.8} {"step": 3163, "train_loss": 3.880213499069214, "lr": 0.00039525111213776967, "tps": 23156, "wall": 8954.6} {"step": 3164, "train_loss": 3.8932299613952637, "lr": 0.0003952467395358856, "tps": 23143, "wall": 8962.3} {"step": 3165, "train_loss": 3.8959898948669434, "lr": 0.0003952423649487969, "tps": 23131, "wall": 8969.9} {"step": 3166, "train_loss": 3.8436403274536133, "lr": 0.00039523798837655323, "tps": 23118, "wall": 8977.6} {"step": 3167, "train_loss": 3.9007723331451416, "lr": 0.0003952336098192042, "tps": 23106, "wall": 8985.3} {"step": 3168, "train_loss": 3.800220489501953, "lr": 0.00039522922927679924, "tps": 23093, "wall": 8993.1} {"step": 3169, "train_loss": 3.899482488632202, "lr": 0.0003952248467493882, "tps": 23081, "wall": 9000.8} {"step": 3170, "train_loss": 3.7943148612976074, "lr": 0.00039522046223702063, "tps": 23068, "wall": 9008.6} {"step": 3171, "train_loss": 3.938354969024658, "lr": 0.0003952160757397461, "tps": 23056, "wall": 9016.3} {"step": 3172, "train_loss": 3.846792697906494, "lr": 0.00039521168725761445, "tps": 23043, "wall": 9024.0} {"step": 3173, "train_loss": 3.9639949798583984, "lr": 0.0003952072967906753, "tps": 23031, "wall": 9031.7} {"step": 3174, "train_loss": 3.9579782485961914, "lr": 0.0003952029043389784, "tps": 23019, "wall": 9039.3} {"step": 3175, "train_loss": 3.879384994506836, "lr": 0.0003951985099025736, "tps": 23006, "wall": 9047.1} {"step": 3176, "train_loss": 3.8903799057006836, "lr": 0.00039519411348151045, "tps": 22994, "wall": 9054.7} {"step": 3177, "train_loss": 3.8721141815185547, "lr": 0.00039518971507583904, "tps": 22981, "wall": 9062.7} {"step": 3178, "train_loss": 3.9016098976135254, "lr": 0.000395185314685609, "tps": 22969, "wall": 9070.3} {"step": 3179, "train_loss": 3.8720221519470215, "lr": 0.00039518091231087026, "tps": 22956, "wall": 9078.1} {"step": 3180, "train_loss": 3.807598114013672, "lr": 0.0003951765079516727, "tps": 22944, "wall": 9085.8} {"step": 3181, "train_loss": 3.9170455932617188, "lr": 0.0003951721016080661, "tps": 22932, "wall": 9093.5} {"step": 3182, "train_loss": 3.8436226844787598, "lr": 0.00039516769328010057, "tps": 22920, "wall": 9101.2} {"step": 3183, "train_loss": 3.8970088958740234, "lr": 0.0003951632829678258, "tps": 22907, "wall": 9108.9} {"step": 3184, "train_loss": 3.8131515979766846, "lr": 0.00039515887067129195, "tps": 22895, "wall": 9116.7} {"step": 3185, "train_loss": 3.833472728729248, "lr": 0.000395154456390549, "tps": 22883, "wall": 9124.5} {"step": 3186, "train_loss": 3.981187343597412, "lr": 0.0003951500401256468, "tps": 22870, "wall": 9132.2} {"step": 3187, "train_loss": 3.888502836227417, "lr": 0.0003951456218766355, "tps": 22858, "wall": 9139.9} {"step": 3188, "train_loss": 3.7516722679138184, "lr": 0.00039514120164356513, "tps": 22846, "wall": 9147.6} {"step": 3189, "train_loss": 4.038402080535889, "lr": 0.0003951367794264857, "tps": 22834, "wall": 9155.4} {"step": 3190, "train_loss": 3.980118751525879, "lr": 0.0003951323552254474, "tps": 22822, "wall": 9163.1} {"step": 3191, "train_loss": 3.8539230823516846, "lr": 0.00039512792904050035, "tps": 22810, "wall": 9170.9} {"step": 3192, "train_loss": 3.845621109008789, "lr": 0.0003951235008716946, "tps": 22797, "wall": 9178.8} {"step": 3193, "train_loss": 3.840841293334961, "lr": 0.00039511907071908037, "tps": 22785, "wall": 9186.5} {"step": 3194, "train_loss": 3.9253087043762207, "lr": 0.0003951146385827078, "tps": 22774, "wall": 9194.1} {"step": 3195, "train_loss": 3.8850510120391846, "lr": 0.0003951102044626271, "tps": 22762, "wall": 9201.9} {"step": 3196, "train_loss": 3.9620800018310547, "lr": 0.0003951057683588886, "tps": 22749, "wall": 9209.7} {"step": 3197, "train_loss": 3.9660425186157227, "lr": 0.0003951013302715425, "tps": 22738, "wall": 9217.3} {"step": 3198, "train_loss": 3.842132806777954, "lr": 0.000395096890200639, "tps": 22726, "wall": 9225.0} {"step": 3199, "train_loss": 4.02589750289917, "lr": 0.00039509244814622845, "tps": 22714, "wall": 9232.7} {"step": 3200, "train_loss": 3.954469919204712, "lr": 0.00039508800410836126, "tps": 22702, "wall": 9240.6} {"step": 3201, "train_loss": 4.015293598175049, "lr": 0.0003950835580870876, "tps": 22690, "wall": 9248.3} {"step": 3202, "train_loss": 3.8583905696868896, "lr": 0.0003950791100824579, "tps": 22678, "wall": 9256.0} {"step": 3203, "train_loss": 3.925485610961914, "lr": 0.0003950746600945227, "tps": 22666, "wall": 9263.7} {"step": 3204, "train_loss": 3.943315267562866, "lr": 0.0003950702081233322, "tps": 22654, "wall": 9271.4} {"step": 3205, "train_loss": 3.962686538696289, "lr": 0.0003950657541689369, "tps": 22643, "wall": 9279.2} {"step": 3206, "train_loss": 3.9092254638671875, "lr": 0.0003950612982313873, "tps": 22631, "wall": 9287.0} {"step": 3207, "train_loss": 3.8951992988586426, "lr": 0.0003950568403107338, "tps": 22619, "wall": 9294.7} {"step": 3208, "train_loss": 3.9657487869262695, "lr": 0.00039505238040702696, "tps": 22607, "wall": 9302.5} {"step": 3209, "train_loss": 3.8700404167175293, "lr": 0.00039504791852031725, "tps": 22595, "wall": 9310.2} {"step": 3210, "train_loss": 3.83651065826416, "lr": 0.0003950434546506553, "tps": 22583, "wall": 9318.0} {"step": 3211, "train_loss": 3.894444227218628, "lr": 0.0003950389887980916, "tps": 22572, "wall": 9325.7} {"step": 3212, "train_loss": 3.8548500537872314, "lr": 0.0003950345209626768, "tps": 22560, "wall": 9333.4} {"step": 3213, "train_loss": 3.900296211242676, "lr": 0.0003950300511444615, "tps": 22549, "wall": 9341.1} {"step": 3214, "train_loss": 3.9385766983032227, "lr": 0.00039502557934349627, "tps": 22537, "wall": 9348.7} {"step": 3215, "train_loss": 3.8833963871002197, "lr": 0.0003950211055598318, "tps": 22526, "wall": 9356.4} {"step": 3216, "train_loss": 3.880891799926758, "lr": 0.00039501662979351876, "tps": 22514, "wall": 9364.3} {"step": 3217, "train_loss": 3.9329404830932617, "lr": 0.0003950121520446079, "tps": 22502, "wall": 9372.0} {"step": 3218, "train_loss": 3.977057456970215, "lr": 0.0003950076723131499, "tps": 22491, "wall": 9379.7} {"step": 3219, "train_loss": 3.8471574783325195, "lr": 0.0003950031905991955, "tps": 22479, "wall": 9387.4} {"step": 3220, "train_loss": 3.882899284362793, "lr": 0.0003949987069027955, "tps": 22468, "wall": 9395.1} {"step": 3221, "train_loss": 3.8991522789001465, "lr": 0.0003949942212240007, "tps": 22456, "wall": 9402.8} {"step": 3222, "train_loss": 3.871216058731079, "lr": 0.0003949897335628619, "tps": 22444, "wall": 9410.9} {"step": 3223, "train_loss": 3.9649887084960938, "lr": 0.00039498524391943, "tps": 22432, "wall": 9418.8} {"step": 3224, "train_loss": 3.9188499450683594, "lr": 0.0003949807522937557, "tps": 22421, "wall": 9426.5} {"step": 3225, "train_loss": 3.9362878799438477, "lr": 0.00039497625868589, "tps": 22409, "wall": 9434.2} {"step": 3226, "train_loss": 3.930210590362549, "lr": 0.0003949717630958837, "tps": 22398, "wall": 9441.9} {"step": 3227, "train_loss": 3.8955135345458984, "lr": 0.0003949672655237879, "tps": 22387, "wall": 9449.6} {"step": 3228, "train_loss": 4.1120991706848145, "lr": 0.0003949627659696534, "tps": 22375, "wall": 9457.3} {"step": 3229, "train_loss": 3.859065532684326, "lr": 0.0003949582644335312, "tps": 22364, "wall": 9465.0} {"step": 3230, "train_loss": 3.9114465713500977, "lr": 0.0003949537609154724, "tps": 22353, "wall": 9472.8} {"step": 3231, "train_loss": 3.849252700805664, "lr": 0.00039494925541552783, "tps": 22341, "wall": 9480.5} {"step": 3232, "train_loss": 3.8815126419067383, "lr": 0.0003949447479337487, "tps": 22330, "wall": 9488.4} {"step": 3233, "train_loss": 3.7815632820129395, "lr": 0.000394940238470186, "tps": 22318, "wall": 9496.1} {"step": 3234, "train_loss": 3.8948521614074707, "lr": 0.0003949357270248908, "tps": 22307, "wall": 9503.8} {"step": 3235, "train_loss": 3.882993221282959, "lr": 0.0003949312135979142, "tps": 22296, "wall": 9511.4} {"step": 3236, "train_loss": 3.9225611686706543, "lr": 0.0003949266981893074, "tps": 22285, "wall": 9519.2} {"step": 3237, "train_loss": 3.937889337539673, "lr": 0.0003949221807991214, "tps": 22274, "wall": 9526.9} {"step": 3238, "train_loss": 3.9730618000030518, "lr": 0.00039491766142740764, "tps": 22263, "wall": 9534.6} {"step": 3239, "train_loss": 3.833256959915161, "lr": 0.00039491314007421703, "tps": 22251, "wall": 9542.5} {"step": 3240, "train_loss": 3.885695457458496, "lr": 0.0003949086167396009, "tps": 22240, "wall": 9550.2} {"step": 3241, "train_loss": 3.87601900100708, "lr": 0.00039490409142361056, "tps": 22229, "wall": 9557.9} {"step": 3242, "train_loss": 3.892289400100708, "lr": 0.00039489956412629715, "tps": 22218, "wall": 9565.6} {"step": 3243, "train_loss": 3.910034656524658, "lr": 0.00039489503484771204, "tps": 22207, "wall": 9573.3} {"step": 3244, "train_loss": 3.9301514625549316, "lr": 0.0003948905035879065, "tps": 22196, "wall": 9581.1} {"step": 3245, "train_loss": 3.9001543521881104, "lr": 0.00039488597034693186, "tps": 22185, "wall": 9588.8} {"step": 3246, "train_loss": 4.044610977172852, "lr": 0.00039488143512483956, "tps": 22174, "wall": 9596.6} {"step": 3247, "train_loss": 4.033587455749512, "lr": 0.0003948768979216808, "tps": 22162, "wall": 9604.4} {"step": 3248, "train_loss": 3.9966044425964355, "lr": 0.00039487235873750714, "tps": 22151, "wall": 9612.1} {"step": 3249, "train_loss": 3.955169200897217, "lr": 0.00039486781757236997, "tps": 22140, "wall": 9619.9} {"step": 3250, "train_loss": 3.8552966117858887, "lr": 0.0003948632744263206, "tps": 22129, "wall": 9627.6} {"step": 3251, "train_loss": 3.9590816497802734, "lr": 0.00039485872929941073, "tps": 22118, "wall": 9635.3} {"step": 3252, "train_loss": 3.9366002082824707, "lr": 0.0003948541821916917, "tps": 22107, "wall": 9643.1} {"step": 3253, "train_loss": 3.910515308380127, "lr": 0.00039484963310321494, "tps": 22097, "wall": 9650.8} {"step": 3254, "train_loss": 3.87451171875, "lr": 0.0003948450820340321, "tps": 22085, "wall": 9658.6} {"step": 3255, "train_loss": 3.9040722846984863, "lr": 0.0003948405289841947, "tps": 22074, "wall": 9666.4} {"step": 3256, "train_loss": 3.861738920211792, "lr": 0.00039483597395375435, "tps": 22064, "wall": 9674.0} {"step": 3257, "train_loss": 3.871776580810547, "lr": 0.00039483141694276265, "tps": 22053, "wall": 9681.8} {"step": 3258, "train_loss": 3.821772813796997, "lr": 0.00039482685795127126, "tps": 22042, "wall": 9689.6} {"step": 3259, "train_loss": 3.9719178676605225, "lr": 0.00039482229697933167, "tps": 22031, "wall": 9697.3} {"step": 3260, "train_loss": 3.8717503547668457, "lr": 0.00039481773402699565, "tps": 22021, "wall": 9704.9} {"step": 3261, "train_loss": 3.916745662689209, "lr": 0.00039481316909431493, "tps": 22010, "wall": 9712.7} {"step": 3262, "train_loss": 3.946927785873413, "lr": 0.0003948086021813411, "tps": 21999, "wall": 9720.5} {"step": 3263, "train_loss": 3.84890079498291, "lr": 0.000394804033288126, "tps": 21988, "wall": 9728.2} {"step": 3264, "train_loss": 3.8593239784240723, "lr": 0.0003947994624147214, "tps": 21977, "wall": 9736.0} {"step": 3265, "train_loss": 3.785857677459717, "lr": 0.000394794889561179, "tps": 21966, "wall": 9743.8} {"step": 3266, "train_loss": 3.8843889236450195, "lr": 0.0003947903147275506, "tps": 21956, "wall": 9751.5} {"step": 3267, "train_loss": 3.8733644485473633, "lr": 0.0003947857379138881, "tps": 21945, "wall": 9759.1} {"step": 3268, "train_loss": 3.7983546257019043, "lr": 0.0003947811591202434, "tps": 21935, "wall": 9766.8} {"step": 3269, "train_loss": 3.8357458114624023, "lr": 0.0003947765783466681, "tps": 21924, "wall": 9774.6} {"step": 3270, "train_loss": 3.9887161254882812, "lr": 0.0003947719955932143, "tps": 21913, "wall": 9782.5} {"step": 3271, "train_loss": 3.8364923000335693, "lr": 0.00039476741085993393, "tps": 21902, "wall": 9790.3} {"step": 3272, "train_loss": 3.8930201530456543, "lr": 0.0003947628241468789, "tps": 21892, "wall": 9797.9} {"step": 3273, "train_loss": 3.921771287918091, "lr": 0.0003947582354541011, "tps": 21881, "wall": 9805.6} {"step": 3274, "train_loss": 3.9248368740081787, "lr": 0.0003947536447816525, "tps": 21871, "wall": 9813.4} {"step": 3275, "train_loss": 3.901127815246582, "lr": 0.0003947490521295852, "tps": 21860, "wall": 9821.0} {"step": 3276, "train_loss": 3.924610137939453, "lr": 0.00039474445749795124, "tps": 21850, "wall": 9828.8} {"step": 3277, "train_loss": 3.9209394454956055, "lr": 0.00039473986088680256, "tps": 21840, "wall": 9836.4} {"step": 3278, "train_loss": 3.962282180786133, "lr": 0.0003947352622961913, "tps": 21829, "wall": 9844.2} {"step": 3279, "train_loss": 3.8608880043029785, "lr": 0.00039473066172616956, "tps": 21819, "wall": 9851.9} {"step": 3280, "train_loss": 3.9605982303619385, "lr": 0.0003947260591767894, "tps": 21808, "wall": 9859.6} {"step": 3281, "train_loss": 3.8003363609313965, "lr": 0.00039472145464810297, "tps": 21798, "wall": 9867.2} {"step": 3282, "train_loss": 3.849304676055908, "lr": 0.00039471684814016246, "tps": 21787, "wall": 9875.0} {"step": 3283, "train_loss": 3.8515002727508545, "lr": 0.00039471223965302006, "tps": 21777, "wall": 9882.7} {"step": 3284, "train_loss": 3.9476308822631836, "lr": 0.00039470762918672795, "tps": 21767, "wall": 9890.4} {"step": 3285, "train_loss": 3.841491222381592, "lr": 0.00039470301674133834, "tps": 21756, "wall": 9898.3} {"step": 3286, "train_loss": 3.9111504554748535, "lr": 0.00039469840231690355, "tps": 21746, "wall": 9906.0} {"step": 3287, "train_loss": 3.8832244873046875, "lr": 0.00039469378591347573, "tps": 21735, "wall": 9914.0} {"step": 3288, "train_loss": 3.8305397033691406, "lr": 0.0003946891675311074, "tps": 21724, "wall": 9921.9} {"step": 3289, "train_loss": 3.917940616607666, "lr": 0.00039468454716985057, "tps": 21713, "wall": 9929.8} {"step": 3290, "train_loss": 3.9463911056518555, "lr": 0.0003946799248297578, "tps": 21703, "wall": 9937.5} {"step": 3291, "train_loss": 3.890465259552002, "lr": 0.00039467530051088146, "tps": 21693, "wall": 9945.3} {"step": 3292, "train_loss": 3.8708653450012207, "lr": 0.0003946706742132738, "tps": 21682, "wall": 9953.1} {"step": 3293, "train_loss": 3.924572229385376, "lr": 0.00039466604593698724, "tps": 21672, "wall": 9960.9} {"step": 3294, "train_loss": 3.898632049560547, "lr": 0.00039466141568207435, "tps": 21661, "wall": 9968.8} {"step": 3295, "train_loss": 3.861926555633545, "lr": 0.0003946567834485875, "tps": 21651, "wall": 9976.7} {"step": 3296, "train_loss": 3.880763530731201, "lr": 0.0003946521492365791, "tps": 21640, "wall": 9984.6} {"step": 3297, "train_loss": 3.916215419769287, "lr": 0.00039464751304610173, "tps": 21630, "wall": 9992.4} {"step": 3298, "train_loss": 3.8717525005340576, "lr": 0.0003946428748772079, "tps": 21620, "wall": 10000.1} {"step": 3299, "train_loss": 3.846519708633423, "lr": 0.0003946382347299501, "tps": 21610, "wall": 10007.7} {"step": 3300, "train_loss": 3.8690199851989746, "lr": 0.00039463359260438096, "tps": 21600, "wall": 10015.5} {"step": 3301, "train_loss": 3.9487104415893555, "lr": 0.000394628948500553, "tps": 21588, "wall": 10024.0} {"step": 3302, "train_loss": 3.7756576538085938, "lr": 0.00039462430241851893, "tps": 21578, "wall": 10031.7} {"step": 3303, "train_loss": 3.916792869567871, "lr": 0.0003946196543583312, "tps": 21567, "wall": 10039.5} {"step": 3304, "train_loss": 3.958852767944336, "lr": 0.0003946150043200427, "tps": 21556, "wall": 10047.7} {"step": 3305, "train_loss": 3.853886127471924, "lr": 0.0003946103523037059, "tps": 21546, "wall": 10055.6} {"step": 3306, "train_loss": 3.8330986499786377, "lr": 0.0003946056983093736, "tps": 21534, "wall": 10064.1} {"step": 3307, "train_loss": 3.9406652450561523, "lr": 0.0003946010423370986, "tps": 21523, "wall": 10072.3} {"step": 3308, "train_loss": 3.886759042739868, "lr": 0.00039459638438693346, "tps": 21512, "wall": 10080.7} {"step": 3309, "train_loss": 3.875157594680786, "lr": 0.000394591724458931, "tps": 21502, "wall": 10088.5} {"step": 3310, "train_loss": 3.904463768005371, "lr": 0.0003945870625531441, "tps": 21492, "wall": 10096.3} {"step": 3311, "train_loss": 3.815535068511963, "lr": 0.0003945823986696255, "tps": 21481, "wall": 10104.1} {"step": 3312, "train_loss": 3.905380964279175, "lr": 0.000394577732808428, "tps": 21471, "wall": 10111.8} {"step": 3313, "train_loss": 3.8449935913085938, "lr": 0.0003945730649696045, "tps": 21462, "wall": 10119.5} {"step": 3314, "train_loss": 3.9068350791931152, "lr": 0.00039456839515320793, "tps": 21451, "wall": 10127.5} {"step": 3315, "train_loss": 3.9520392417907715, "lr": 0.00039456372335929115, "tps": 21441, "wall": 10135.4} {"step": 3316, "train_loss": 3.872354030609131, "lr": 0.000394559049587907, "tps": 21431, "wall": 10143.2} {"step": 3317, "train_loss": 3.987684726715088, "lr": 0.00039455437383910857, "tps": 21421, "wall": 10151.0} {"step": 3318, "train_loss": 3.939164161682129, "lr": 0.00039454969611294865, "tps": 21411, "wall": 10158.7} {"step": 3319, "train_loss": 3.8209097385406494, "lr": 0.00039454501640948043, "tps": 21401, "wall": 10166.6} {"step": 3320, "train_loss": 3.9822921752929688, "lr": 0.00039454033472875673, "tps": 21391, "wall": 10174.3} {"step": 3321, "train_loss": 3.884115219116211, "lr": 0.00039453565107083077, "tps": 21381, "wall": 10182.2} {"step": 3322, "train_loss": 3.949697971343994, "lr": 0.0003945309654357554, "tps": 21371, "wall": 10190.0} {"step": 3323, "train_loss": 3.9541015625, "lr": 0.00039452627782358393, "tps": 21361, "wall": 10197.9} {"step": 3324, "train_loss": 3.832313060760498, "lr": 0.00039452158823436925, "tps": 21351, "wall": 10205.7} {"step": 3325, "train_loss": 3.9223532676696777, "lr": 0.00039451689666816466, "tps": 21341, "wall": 10213.4} {"step": 3326, "train_loss": 3.925356149673462, "lr": 0.00039451220312502317, "tps": 21332, "wall": 10221.1} {"step": 3327, "train_loss": 3.857921600341797, "lr": 0.000394507507604998, "tps": 21322, "wall": 10229.0} {"step": 3328, "train_loss": 3.8534815311431885, "lr": 0.0003945028101081424, "tps": 21312, "wall": 10236.8} {"step": 3329, "train_loss": 4.038730144500732, "lr": 0.00039449811063450944, "tps": 21302, "wall": 10244.5} {"step": 3330, "train_loss": 3.8500688076019287, "lr": 0.0003944934091841525, "tps": 21292, "wall": 10252.3} {"step": 3331, "train_loss": 3.9436845779418945, "lr": 0.00039448870575712475, "tps": 21282, "wall": 10260.1} {"step": 3332, "train_loss": 3.913356304168701, "lr": 0.0003944840003534795, "tps": 21273, "wall": 10267.9} {"step": 3333, "train_loss": 3.877988815307617, "lr": 0.00039447929297327004, "tps": 21263, "wall": 10275.5} {"step": 3334, "train_loss": 3.8200879096984863, "lr": 0.00039447458361654975, "tps": 21254, "wall": 10283.2} {"step": 3335, "train_loss": 3.818875551223755, "lr": 0.00039446987228337194, "tps": 21244, "wall": 10291.0} {"step": 3336, "train_loss": 3.8491530418395996, "lr": 0.00039446515897379, "tps": 21235, "wall": 10298.7} {"step": 3337, "train_loss": 3.897433280944824, "lr": 0.00039446044368785725, "tps": 21225, "wall": 10306.4} {"step": 3338, "train_loss": 3.825654983520508, "lr": 0.00039445572642562716, "tps": 21215, "wall": 10314.4} {"step": 3339, "train_loss": 3.9279625415802, "lr": 0.00039445100718715314, "tps": 21205, "wall": 10322.2} {"step": 3340, "train_loss": 3.7298641204833984, "lr": 0.0003944462859724887, "tps": 21196, "wall": 10330.0} {"step": 3341, "train_loss": 3.9019179344177246, "lr": 0.00039444156278168734, "tps": 21186, "wall": 10337.8} {"step": 3342, "train_loss": 3.9561798572540283, "lr": 0.00039443683761480246, "tps": 21177, "wall": 10345.5} {"step": 3343, "train_loss": 4.018787860870361, "lr": 0.0003944321104718877, "tps": 21167, "wall": 10353.4} {"step": 3344, "train_loss": 3.816636085510254, "lr": 0.0003944273813529965, "tps": 21157, "wall": 10361.1} {"step": 3345, "train_loss": 3.8413190841674805, "lr": 0.00039442265025818254, "tps": 21147, "wall": 10369.1} {"step": 3346, "train_loss": 3.8913283348083496, "lr": 0.0003944179171874994, "tps": 21138, "wall": 10376.8} {"step": 3347, "train_loss": 3.947514057159424, "lr": 0.00039441318214100056, "tps": 21128, "wall": 10384.6} {"step": 3348, "train_loss": 3.84293794631958, "lr": 0.0003944084451187398, "tps": 21119, "wall": 10392.2} {"step": 3349, "train_loss": 3.95913028717041, "lr": 0.00039440370612077067, "tps": 21110, "wall": 10399.9} {"step": 3350, "train_loss": 3.8151941299438477, "lr": 0.000394398965147147, "tps": 21101, "wall": 10407.6} {"step": 3351, "train_loss": 3.972240447998047, "lr": 0.0003943942221979224, "tps": 21091, "wall": 10415.2} {"step": 3352, "train_loss": 3.922130584716797, "lr": 0.0003943894772731506, "tps": 21082, "wall": 10422.9} {"step": 3353, "train_loss": 3.7918641567230225, "lr": 0.0003943847303728854, "tps": 21073, "wall": 10430.6} {"step": 3354, "train_loss": 3.984295606613159, "lr": 0.0003943799814971805, "tps": 21063, "wall": 10438.5} {"step": 3355, "train_loss": 3.8856875896453857, "lr": 0.00039437523064608977, "tps": 21054, "wall": 10446.2} {"step": 3356, "train_loss": 3.8334858417510986, "lr": 0.00039437047781966703, "tps": 21045, "wall": 10453.9} {"step": 3357, "train_loss": 3.8384599685668945, "lr": 0.000394365723017966, "tps": 21035, "wall": 10461.7} {"step": 3358, "train_loss": 3.8131208419799805, "lr": 0.00039436096624104064, "tps": 21024, "wall": 10470.2} {"step": 3359, "train_loss": 3.906055450439453, "lr": 0.00039435620748894487, "tps": 21015, "wall": 10477.9} {"step": 3360, "train_loss": 3.956657886505127, "lr": 0.0003943514467617325, "tps": 21006, "wall": 10485.6} {"step": 3361, "train_loss": 3.892200469970703, "lr": 0.0003943466840594575, "tps": 20997, "wall": 10493.4} {"step": 3362, "train_loss": 3.8703012466430664, "lr": 0.0003943419193821739, "tps": 20987, "wall": 10501.3} {"step": 3363, "train_loss": 3.892207622528076, "lr": 0.0003943371527299356, "tps": 20978, "wall": 10509.0} {"step": 3364, "train_loss": 3.8272061347961426, "lr": 0.00039433238410279656, "tps": 20969, "wall": 10516.7} {"step": 3365, "train_loss": 3.866715908050537, "lr": 0.0003943276135008108, "tps": 20960, "wall": 10524.4} {"step": 3366, "train_loss": 3.9024152755737305, "lr": 0.0003943228409240325, "tps": 20950, "wall": 10532.2} {"step": 3367, "train_loss": 3.8703081607818604, "lr": 0.0003943180663725156, "tps": 20941, "wall": 10539.9} {"step": 3368, "train_loss": 3.954421281814575, "lr": 0.0003943132898463142, "tps": 20932, "wall": 10547.6} {"step": 3369, "train_loss": 3.9005355834960938, "lr": 0.00039430851134548246, "tps": 20923, "wall": 10555.4} {"step": 3370, "train_loss": 3.7989425659179688, "lr": 0.00039430373087007435, "tps": 20913, "wall": 10563.4} {"step": 3371, "train_loss": 3.820932388305664, "lr": 0.00039429894842014424, "tps": 20904, "wall": 10571.2} {"step": 3372, "train_loss": 3.8253705501556396, "lr": 0.00039429416399574624, "tps": 20895, "wall": 10579.0} {"step": 3373, "train_loss": 3.8866899013519287, "lr": 0.0003942893775969345, "tps": 20886, "wall": 10586.7} {"step": 3374, "train_loss": 3.8995203971862793, "lr": 0.0003942845892237632, "tps": 20877, "wall": 10594.4} {"step": 3375, "train_loss": 3.895700454711914, "lr": 0.00039427979887628667, "tps": 20868, "wall": 10602.2} {"step": 3376, "train_loss": 3.8261594772338867, "lr": 0.0003942750065545592, "tps": 20859, "wall": 10609.9} {"step": 3377, "train_loss": 3.8802404403686523, "lr": 0.000394270212258635, "tps": 20850, "wall": 10617.5} {"step": 3378, "train_loss": 3.876192092895508, "lr": 0.0003942654159885684, "tps": 20841, "wall": 10625.4} {"step": 3379, "train_loss": 3.8449816703796387, "lr": 0.0003942606177444138, "tps": 20832, "wall": 10633.2} {"step": 3380, "train_loss": 3.9138214588165283, "lr": 0.00039425581752622536, "tps": 20823, "wall": 10640.9} {"step": 3381, "train_loss": 3.917189359664917, "lr": 0.00039425101533405773, "tps": 20814, "wall": 10648.6} {"step": 3382, "train_loss": 3.835780620574951, "lr": 0.0003942462111679651, "tps": 20805, "wall": 10656.3} {"step": 3383, "train_loss": 3.87648606300354, "lr": 0.00039424140502800195, "tps": 20796, "wall": 10664.1} {"step": 3384, "train_loss": 3.7978880405426025, "lr": 0.00039423659691422276, "tps": 20787, "wall": 10671.8} {"step": 3385, "train_loss": 3.905564546585083, "lr": 0.00039423178682668203, "tps": 20778, "wall": 10679.7} {"step": 3386, "train_loss": 3.923579692840576, "lr": 0.00039422697476543413, "tps": 20769, "wall": 10687.4} {"step": 3387, "train_loss": 3.9828362464904785, "lr": 0.0003942221607305336, "tps": 20760, "wall": 10695.1} {"step": 3388, "train_loss": 3.8230133056640625, "lr": 0.00039421734472203513, "tps": 20751, "wall": 10702.9} {"step": 3389, "train_loss": 3.979836940765381, "lr": 0.00039421252673999305, "tps": 20742, "wall": 10710.5} {"step": 3390, "train_loss": 3.8898468017578125, "lr": 0.000394207706784462, "tps": 20733, "wall": 10718.3} {"step": 3391, "train_loss": 3.904942274093628, "lr": 0.0003942028848554967, "tps": 20725, "wall": 10726.1} {"step": 3392, "train_loss": 3.8685503005981445, "lr": 0.0003941980609531517, "tps": 20716, "wall": 10733.8} {"step": 3393, "train_loss": 3.825270175933838, "lr": 0.00039419323507748166, "tps": 20707, "wall": 10741.6} {"step": 3394, "train_loss": 3.8771917819976807, "lr": 0.0003941884072285412, "tps": 20698, "wall": 10749.3} {"step": 3395, "train_loss": 3.879058361053467, "lr": 0.00039418357740638506, "tps": 20689, "wall": 10757.1} {"step": 3396, "train_loss": 3.8905234336853027, "lr": 0.0003941787456110679, "tps": 20680, "wall": 10764.9} {"step": 3397, "train_loss": 3.8925232887268066, "lr": 0.0003941739118426445, "tps": 20671, "wall": 10772.7} {"step": 3398, "train_loss": 3.8445396423339844, "lr": 0.0003941690761011696, "tps": 20663, "wall": 10780.5} {"step": 3399, "train_loss": 3.846169948577881, "lr": 0.000394164238386698, "tps": 20654, "wall": 10788.2} {"step": 3400, "train_loss": 3.875491142272949, "lr": 0.00039415939869928446, "tps": 20645, "wall": 10795.9} {"step": 3401, "train_loss": 3.8882369995117188, "lr": 0.0003941545570389838, "tps": 20636, "wall": 10803.8} {"step": 3402, "train_loss": 3.8351917266845703, "lr": 0.00039414971340585105, "tps": 20627, "wall": 10811.6} {"step": 3403, "train_loss": 3.908261299133301, "lr": 0.0003941448677999407, "tps": 20619, "wall": 10819.3} {"step": 3404, "train_loss": 3.8411221504211426, "lr": 0.000394140020221308, "tps": 20610, "wall": 10827.0} {"step": 3405, "train_loss": 3.851109743118286, "lr": 0.00039413517067000774, "tps": 20601, "wall": 10834.7} {"step": 3406, "train_loss": 3.7992796897888184, "lr": 0.00039413031914609483, "tps": 20593, "wall": 10842.5} {"step": 3407, "train_loss": 3.8143162727355957, "lr": 0.00039412546564962416, "tps": 20584, "wall": 10850.2} {"step": 3408, "train_loss": 3.9726037979125977, "lr": 0.0003941206101806509, "tps": 20575, "wall": 10858.1} {"step": 3409, "train_loss": 3.864178419113159, "lr": 0.00039411575273922995, "tps": 20567, "wall": 10865.8} {"step": 3410, "train_loss": 3.865711212158203, "lr": 0.0003941108933254163, "tps": 20558, "wall": 10873.5} {"step": 3411, "train_loss": 3.960099220275879, "lr": 0.000394106031939265, "tps": 20549, "wall": 10881.2} {"step": 3412, "train_loss": 3.956360340118408, "lr": 0.0003941011685808312, "tps": 20541, "wall": 10889.0} {"step": 3413, "train_loss": 3.769690990447998, "lr": 0.0003940963032501699, "tps": 20532, "wall": 10896.8} {"step": 3414, "train_loss": 3.9271011352539062, "lr": 0.0003940914359473363, "tps": 20524, "wall": 10904.5} {"step": 3415, "train_loss": 3.827699661254883, "lr": 0.0003940865666723855, "tps": 20515, "wall": 10912.3} {"step": 3416, "train_loss": 3.877622365951538, "lr": 0.00039408169542537257, "tps": 20506, "wall": 10920.1} {"step": 3417, "train_loss": 3.8623759746551514, "lr": 0.0003940768222063529, "tps": 20498, "wall": 10927.8} {"step": 3418, "train_loss": 3.9544260501861572, "lr": 0.0003940719470153815, "tps": 20489, "wall": 10935.5} {"step": 3419, "train_loss": 3.820688009262085, "lr": 0.00039406706985251365, "tps": 20481, "wall": 10943.2} {"step": 3420, "train_loss": 3.8294687271118164, "lr": 0.00039406219071780465, "tps": 20473, "wall": 10950.9} {"step": 3421, "train_loss": 3.8692171573638916, "lr": 0.00039405730961130975, "tps": 20464, "wall": 10958.7} {"step": 3422, "train_loss": 3.855658531188965, "lr": 0.0003940524265330842, "tps": 20456, "wall": 10966.4} {"step": 3423, "train_loss": 3.8097400665283203, "lr": 0.0003940475414831834, "tps": 20447, "wall": 10974.2} {"step": 3424, "train_loss": 3.8059375286102295, "lr": 0.00039404265446166254, "tps": 20438, "wall": 10982.2} {"step": 3425, "train_loss": 3.841127395629883, "lr": 0.0003940377654685771, "tps": 20430, "wall": 10990.0} {"step": 3426, "train_loss": 3.8647897243499756, "lr": 0.00039403287450398246, "tps": 20421, "wall": 10997.7} {"step": 3427, "train_loss": 3.812058925628662, "lr": 0.000394027981567934, "tps": 20413, "wall": 11005.5} {"step": 3428, "train_loss": 3.9328017234802246, "lr": 0.0003940230866604872, "tps": 20404, "wall": 11013.3} {"step": 3429, "train_loss": 3.8318843841552734, "lr": 0.0003940181897816974, "tps": 20396, "wall": 11021.1} {"step": 3430, "train_loss": 3.9559834003448486, "lr": 0.00039401329093162013, "tps": 20387, "wall": 11028.9} {"step": 3431, "train_loss": 3.8517847061157227, "lr": 0.0003940083901103109, "tps": 20379, "wall": 11036.6} {"step": 3432, "train_loss": 3.9212088584899902, "lr": 0.00039400348731782523, "tps": 20370, "wall": 11044.5} {"step": 3433, "train_loss": 3.885706663131714, "lr": 0.00039399858255421863, "tps": 20362, "wall": 11052.3} {"step": 3434, "train_loss": 3.871084690093994, "lr": 0.0003939936758195466, "tps": 20353, "wall": 11060.1} {"step": 3435, "train_loss": 3.8792881965637207, "lr": 0.00039398876711386495, "tps": 20345, "wall": 11067.8} {"step": 3436, "train_loss": 3.872826099395752, "lr": 0.00039398385643722906, "tps": 20337, "wall": 11075.6} {"step": 3437, "train_loss": 3.828347682952881, "lr": 0.00039397894378969463, "tps": 20328, "wall": 11083.3} {"step": 3438, "train_loss": 3.841578960418701, "lr": 0.0003939740291713173, "tps": 20320, "wall": 11091.1} {"step": 3439, "train_loss": 3.7867870330810547, "lr": 0.0003939691125821527, "tps": 20311, "wall": 11099.1} {"step": 3440, "train_loss": 3.8179407119750977, "lr": 0.0003939641940222567, "tps": 20303, "wall": 11107.0} {"step": 3441, "train_loss": 3.656949520111084, "lr": 0.0003939592734916848, "tps": 20295, "wall": 11114.8} {"step": 3442, "train_loss": 3.8529720306396484, "lr": 0.00039395435099049287, "tps": 20286, "wall": 11122.6} {"step": 3443, "train_loss": 3.8522510528564453, "lr": 0.00039394942651873666, "tps": 20278, "wall": 11130.4} {"step": 3444, "train_loss": 3.744391679763794, "lr": 0.00039394450007647195, "tps": 20270, "wall": 11138.2} {"step": 3445, "train_loss": 3.883096218109131, "lr": 0.0003939395716637545, "tps": 20261, "wall": 11146.0} {"step": 3446, "train_loss": 3.8543434143066406, "lr": 0.0003939346412806402, "tps": 20253, "wall": 11153.8} {"step": 3447, "train_loss": 3.897188186645508, "lr": 0.00039392970892718486, "tps": 20245, "wall": 11161.6} {"step": 3448, "train_loss": 3.8735857009887695, "lr": 0.00039392477460344435, "tps": 20236, "wall": 11169.4} {"step": 3449, "train_loss": 3.7278690338134766, "lr": 0.00039391983830947463, "tps": 20228, "wall": 11177.2} {"step": 3450, "train_loss": 3.7973947525024414, "lr": 0.00039391490004533154, "tps": 20220, "wall": 11185.0} {"step": 3451, "train_loss": 3.8643741607666016, "lr": 0.000393909959811071, "tps": 20212, "wall": 11192.8} {"step": 3452, "train_loss": 3.831871509552002, "lr": 0.0003939050176067491, "tps": 20203, "wall": 11200.6} {"step": 3453, "train_loss": 3.836805820465088, "lr": 0.00039390007343242174, "tps": 20194, "wall": 11209.0} {"step": 3454, "train_loss": 3.710348606109619, "lr": 0.000393895127288145, "tps": 20186, "wall": 11216.9} {"step": 3455, "train_loss": 3.898049831390381, "lr": 0.00039389017917397474, "tps": 20177, "wall": 11224.9} {"step": 3456, "train_loss": 3.7767367362976074, "lr": 0.00039388522908996717, "tps": 20169, "wall": 11232.7} {"step": 3457, "train_loss": 3.828258514404297, "lr": 0.00039388027703617833, "tps": 20161, "wall": 11240.6} {"step": 3458, "train_loss": 3.939727306365967, "lr": 0.0003938753230126643, "tps": 20152, "wall": 11248.4} {"step": 3459, "train_loss": 3.920598030090332, "lr": 0.0003938703670194812, "tps": 20144, "wall": 11256.3} {"step": 3460, "train_loss": 3.9195668697357178, "lr": 0.00039386540905668514, "tps": 20136, "wall": 11264.1} {"step": 3461, "train_loss": 3.833181858062744, "lr": 0.0003938604491243324, "tps": 20128, "wall": 11271.9} {"step": 3462, "train_loss": 3.9372899532318115, "lr": 0.000393855487222479, "tps": 20119, "wall": 11280.0} {"step": 3463, "train_loss": 3.812957286834717, "lr": 0.0003938505233511813, "tps": 20111, "wall": 11287.8} {"step": 3464, "train_loss": 3.82550048828125, "lr": 0.00039384555751049543, "tps": 20103, "wall": 11295.6} {"step": 3465, "train_loss": 3.89731502532959, "lr": 0.0003938405897004777, "tps": 20095, "wall": 11303.4} {"step": 3466, "train_loss": 3.914508819580078, "lr": 0.00039383561992118436, "tps": 20087, "wall": 11311.4} {"step": 3467, "train_loss": 3.8559188842773438, "lr": 0.0003938306481726717, "tps": 20077, "wall": 11319.9} {"step": 3468, "train_loss": 3.9699935913085938, "lr": 0.0003938256744549961, "tps": 20069, "wall": 11327.7} {"step": 3469, "train_loss": 3.858731746673584, "lr": 0.0003938206987682138, "tps": 20061, "wall": 11335.5} {"step": 3470, "train_loss": 3.818319320678711, "lr": 0.0003938157211123812, "tps": 20053, "wall": 11343.5} {"step": 3471, "train_loss": 3.8299975395202637, "lr": 0.0003938107414875548, "tps": 20044, "wall": 11351.6} {"step": 3472, "train_loss": 3.8502590656280518, "lr": 0.0003938057598937908, "tps": 20036, "wall": 11359.4} {"step": 3473, "train_loss": 3.7775683403015137, "lr": 0.00039380077633114583, "tps": 20029, "wall": 11367.1} {"step": 3474, "train_loss": 3.927056312561035, "lr": 0.0003937957907996763, "tps": 20020, "wall": 11375.1} {"step": 3475, "train_loss": 3.9566588401794434, "lr": 0.00039379080329943856, "tps": 20012, "wall": 11382.9} {"step": 3476, "train_loss": 3.810537815093994, "lr": 0.00039378581383048923, "tps": 20004, "wall": 11390.7} {"step": 3477, "train_loss": 3.801862955093384, "lr": 0.0003937808223928848, "tps": 19996, "wall": 11398.6} {"step": 3478, "train_loss": 3.934361457824707, "lr": 0.00039377582898668183, "tps": 19987, "wall": 11407.4} {"step": 3479, "train_loss": 3.8863677978515625, "lr": 0.00039377083361193685, "tps": 19977, "wall": 11416.0} {"step": 3480, "train_loss": 3.8062164783477783, "lr": 0.00039376583626870643, "tps": 19968, "wall": 11424.3} {"step": 3481, "train_loss": 3.8232526779174805, "lr": 0.00039376083695704734, "tps": 19960, "wall": 11432.6} {"step": 3482, "train_loss": 3.8102259635925293, "lr": 0.000393755835677016, "tps": 19951, "wall": 11440.9} {"step": 3483, "train_loss": 3.793181896209717, "lr": 0.00039375083242866913, "tps": 19942, "wall": 11449.1} {"step": 3484, "train_loss": 3.787219524383545, "lr": 0.0003937458272120635, "tps": 19934, "wall": 11457.3} {"step": 3485, "train_loss": 3.8420166969299316, "lr": 0.00039374082002725563, "tps": 19925, "wall": 11465.6} {"step": 3486, "train_loss": 3.8101816177368164, "lr": 0.0003937358108743024, "tps": 19917, "wall": 11473.6} {"step": 3487, "train_loss": 3.7558891773223877, "lr": 0.0003937307997532606, "tps": 19908, "wall": 11482.2} {"step": 3488, "train_loss": 3.7652130126953125, "lr": 0.00039372578666418685, "tps": 19899, "wall": 11490.5} {"step": 3489, "train_loss": 3.844294786453247, "lr": 0.0003937207716071379, "tps": 19890, "wall": 11498.9} {"step": 3490, "train_loss": 3.876603364944458, "lr": 0.0003937157545821708, "tps": 19882, "wall": 11507.2} {"step": 3491, "train_loss": 3.8865785598754883, "lr": 0.00039371073558934207, "tps": 19873, "wall": 11515.5} {"step": 3492, "train_loss": 3.760863780975342, "lr": 0.00039370571462870886, "tps": 19864, "wall": 11523.9} {"step": 3493, "train_loss": 3.879446506500244, "lr": 0.0003937006917003279, "tps": 19856, "wall": 11532.1} {"step": 3494, "train_loss": 3.7386038303375244, "lr": 0.000393695666804256, "tps": 19847, "wall": 11540.2} {"step": 3495, "train_loss": 3.887396812438965, "lr": 0.0003936906399405503, "tps": 19839, "wall": 11548.4} {"step": 3496, "train_loss": 3.7653746604919434, "lr": 0.0003936856111092676, "tps": 19831, "wall": 11556.5} {"step": 3497, "train_loss": 3.830463171005249, "lr": 0.00039368058031046487, "tps": 19822, "wall": 11564.8} {"step": 3498, "train_loss": 3.870089292526245, "lr": 0.0003936755475441992, "tps": 19814, "wall": 11573.0} {"step": 3499, "train_loss": 3.8747916221618652, "lr": 0.00039367051281052754, "tps": 19805, "wall": 11581.3} {"step": 3500, "train_loss": 3.701050281524658, "lr": 0.0003936654761095069, "tps": 19797, "wall": 11589.5} {"step": 3501, "train_loss": 3.8273274898529053, "lr": 0.0003936604374411943, "tps": 19788, "wall": 11597.7} {"step": 3502, "train_loss": 3.831494092941284, "lr": 0.00039365539680564685, "tps": 19780, "wall": 11606.1} {"step": 3503, "train_loss": 3.8867549896240234, "lr": 0.0003936503542029217, "tps": 19772, "wall": 11614.2} {"step": 3504, "train_loss": 3.827906847000122, "lr": 0.000393645309633076, "tps": 19763, "wall": 11622.5} {"step": 3505, "train_loss": 3.73399019241333, "lr": 0.00039364026309616677, "tps": 19755, "wall": 11630.8} {"step": 3506, "train_loss": 3.7024354934692383, "lr": 0.00039363521459225123, "tps": 19746, "wall": 11639.2} {"step": 3507, "train_loss": 3.817864179611206, "lr": 0.00039363016412138663, "tps": 19737, "wall": 11647.8} {"step": 3508, "train_loss": 3.8426997661590576, "lr": 0.00039362511168363016, "tps": 19729, "wall": 11656.0} {"step": 3509, "train_loss": 3.906527042388916, "lr": 0.00039362005727903906, "tps": 19721, "wall": 11664.1} {"step": 3510, "train_loss": 3.812481164932251, "lr": 0.00039361500090767047, "tps": 19712, "wall": 11672.4} {"step": 3511, "train_loss": 3.8396847248077393, "lr": 0.0003936099425695818, "tps": 19704, "wall": 11680.5} {"step": 3512, "train_loss": 3.8975887298583984, "lr": 0.00039360488226483024, "tps": 19696, "wall": 11688.8} {"step": 3513, "train_loss": 3.9450674057006836, "lr": 0.00039359981999347325, "tps": 19687, "wall": 11697.2} {"step": 3514, "train_loss": 3.8471670150756836, "lr": 0.00039359475575556814, "tps": 19679, "wall": 11705.5} {"step": 3515, "train_loss": 3.937293767929077, "lr": 0.0003935896895511722, "tps": 19671, "wall": 11713.7} {"step": 3516, "train_loss": 3.837210178375244, "lr": 0.00039358462138034284, "tps": 19663, "wall": 11721.9} {"step": 3517, "train_loss": 3.8772757053375244, "lr": 0.00039357955124313753, "tps": 19655, "wall": 11730.1} {"step": 3518, "train_loss": 3.9272570610046387, "lr": 0.00039357447913961367, "tps": 19646, "wall": 11738.3} {"step": 3519, "train_loss": 3.726320266723633, "lr": 0.0003935694050698287, "tps": 19638, "wall": 11746.4} {"step": 3520, "train_loss": 3.845078945159912, "lr": 0.00039356432903384016, "tps": 19630, "wall": 11754.6} {"step": 3521, "train_loss": 3.953822135925293, "lr": 0.00039355925103170555, "tps": 19622, "wall": 11762.9} {"step": 3522, "train_loss": 3.817247152328491, "lr": 0.00039355417106348223, "tps": 19614, "wall": 11771.1} {"step": 3523, "train_loss": 3.8581910133361816, "lr": 0.00039354908912922796, "tps": 19606, "wall": 11779.4} {"step": 3524, "train_loss": 3.8642494678497314, "lr": 0.0003935440052290002, "tps": 19598, "wall": 11787.5} {"step": 3525, "train_loss": 3.7663912773132324, "lr": 0.00039353891936285654, "tps": 19590, "wall": 11795.6} {"step": 3526, "train_loss": 3.7411129474639893, "lr": 0.0003935338315308547, "tps": 19582, "wall": 11803.9} {"step": 3527, "train_loss": 3.801607370376587, "lr": 0.0003935287417330521, "tps": 19574, "wall": 11812.0} {"step": 3528, "train_loss": 3.8498010635375977, "lr": 0.0003935236499695066, "tps": 19566, "wall": 11820.3} {"step": 3529, "train_loss": 3.930661201477051, "lr": 0.0003935185562402758, "tps": 19557, "wall": 11828.6} {"step": 3530, "train_loss": 3.8831894397735596, "lr": 0.00039351346054541735, "tps": 19549, "wall": 11836.8} {"step": 3531, "train_loss": 3.872298240661621, "lr": 0.00039350836288498913, "tps": 19541, "wall": 11845.1} {"step": 3532, "train_loss": 3.836317539215088, "lr": 0.00039350326325904875, "tps": 19533, "wall": 11853.1} {"step": 3533, "train_loss": 3.8679120540618896, "lr": 0.00039349816166765403, "tps": 19525, "wall": 11861.3} {"step": 3534, "train_loss": 3.7728171348571777, "lr": 0.00039349305811086266, "tps": 19517, "wall": 11869.6} {"step": 3535, "train_loss": 3.86186146736145, "lr": 0.00039348795258873265, "tps": 19509, "wall": 11878.0} {"step": 3536, "train_loss": 3.765118360519409, "lr": 0.0003934828451013216, "tps": 19501, "wall": 11886.1} {"step": 3537, "train_loss": 3.8590705394744873, "lr": 0.0003934777356486877, "tps": 19493, "wall": 11894.4} {"step": 3538, "train_loss": 3.8387250900268555, "lr": 0.0003934726242308884, "tps": 19485, "wall": 11902.6} {"step": 3539, "train_loss": 3.821627616882324, "lr": 0.00039346751084798196, "tps": 19477, "wall": 11910.8} {"step": 3540, "train_loss": 3.787172794342041, "lr": 0.0003934623955000262, "tps": 19469, "wall": 11919.0} {"step": 3541, "train_loss": 3.8091325759887695, "lr": 0.000393457278187079, "tps": 19462, "wall": 11927.1} {"step": 3542, "train_loss": 3.9066998958587646, "lr": 0.0003934521589091983, "tps": 19454, "wall": 11935.4} {"step": 3543, "train_loss": 3.8544487953186035, "lr": 0.00039344703766644223, "tps": 19446, "wall": 11943.6} {"step": 3544, "train_loss": 3.805266857147217, "lr": 0.0003934419144588687, "tps": 19438, "wall": 11951.8} {"step": 3545, "train_loss": 3.8402535915374756, "lr": 0.0003934367892865358, "tps": 19430, "wall": 11959.9} {"step": 3546, "train_loss": 3.8105521202087402, "lr": 0.0003934316621495016, "tps": 19422, "wall": 11968.1} {"step": 3547, "train_loss": 3.8997721672058105, "lr": 0.00039342653304782414, "tps": 19414, "wall": 11976.4} {"step": 3548, "train_loss": 3.8273987770080566, "lr": 0.0003934214019815615, "tps": 19407, "wall": 11984.2} {"step": 3549, "train_loss": 3.9038708209991455, "lr": 0.0003934162689507718, "tps": 19400, "wall": 11992.0} {"step": 3550, "train_loss": 3.893575668334961, "lr": 0.00039341113395551327, "tps": 19393, "wall": 11999.8} {"step": 3551, "train_loss": 3.884068489074707, "lr": 0.00039340599699584406, "tps": 19386, "wall": 12007.5} {"step": 3552, "train_loss": 3.8653018474578857, "lr": 0.0003934008580718223, "tps": 19379, "wall": 12015.1} {"step": 3553, "train_loss": 3.8956704139709473, "lr": 0.00039339571718350626, "tps": 19372, "wall": 12022.8} {"step": 3554, "train_loss": 3.8667497634887695, "lr": 0.0003933905743309541, "tps": 19365, "wall": 12030.6} {"step": 3555, "train_loss": 3.8526344299316406, "lr": 0.0003933854295142242, "tps": 19358, "wall": 12038.3} {"step": 3556, "train_loss": 3.9027082920074463, "lr": 0.0003933802827333748, "tps": 19351, "wall": 12046.1} {"step": 3557, "train_loss": 3.8167500495910645, "lr": 0.00039337513398846405, "tps": 19344, "wall": 12053.9} {"step": 3558, "train_loss": 3.8240649700164795, "lr": 0.0003933699832795505, "tps": 19337, "wall": 12061.7} {"step": 3559, "train_loss": 3.925139904022217, "lr": 0.00039336483060669236, "tps": 19330, "wall": 12069.6} {"step": 3560, "train_loss": 3.7826921939849854, "lr": 0.0003933596759699481, "tps": 19323, "wall": 12077.3} {"step": 3561, "train_loss": 3.788125514984131, "lr": 0.000393354519369376, "tps": 19316, "wall": 12085.1} {"step": 3562, "train_loss": 3.826528549194336, "lr": 0.0003933493608050345, "tps": 19309, "wall": 12092.8} {"step": 3563, "train_loss": 3.747997760772705, "lr": 0.00039334420027698207, "tps": 19302, "wall": 12100.5} {"step": 3564, "train_loss": 3.8807122707366943, "lr": 0.0003933390377852773, "tps": 19295, "wall": 12108.3} {"step": 3565, "train_loss": 3.8953542709350586, "lr": 0.00039333387332997837, "tps": 19288, "wall": 12116.0} {"step": 3566, "train_loss": 3.746516227722168, "lr": 0.00039332870691114396, "tps": 19281, "wall": 12123.9} {"step": 3567, "train_loss": 3.861924171447754, "lr": 0.00039332353852883264, "tps": 19274, "wall": 12131.6} {"step": 3568, "train_loss": 3.8777265548706055, "lr": 0.0003933183681831029, "tps": 19267, "wall": 12139.3} {"step": 3569, "train_loss": 3.8602871894836426, "lr": 0.00039331319587401325, "tps": 19261, "wall": 12147.0} {"step": 3570, "train_loss": 3.782740592956543, "lr": 0.00039330802160162244, "tps": 19254, "wall": 12154.7} {"step": 3571, "train_loss": 3.8580777645111084, "lr": 0.0003933028453659889, "tps": 19247, "wall": 12162.4} {"step": 3572, "train_loss": 3.8671183586120605, "lr": 0.00039329766716717136, "tps": 19240, "wall": 12170.1} {"step": 3573, "train_loss": 3.9178104400634766, "lr": 0.0003932924870052285, "tps": 19233, "wall": 12178.1} {"step": 3574, "train_loss": 3.852503538131714, "lr": 0.0003932873048802189, "tps": 19226, "wall": 12185.9} {"step": 3575, "train_loss": 3.907698392868042, "lr": 0.00039328212079220144, "tps": 19219, "wall": 12193.7} {"step": 3576, "train_loss": 3.9187722206115723, "lr": 0.00039327693474123474, "tps": 19212, "wall": 12201.5} {"step": 3577, "train_loss": 3.8942031860351562, "lr": 0.0003932717467273775, "tps": 19205, "wall": 12209.2} {"step": 3578, "train_loss": 3.838806629180908, "lr": 0.00039326655675068855, "tps": 19197, "wall": 12218.1} {"step": 3579, "train_loss": 3.8088009357452393, "lr": 0.00039326136481122664, "tps": 19190, "wall": 12225.9} {"step": 3580, "train_loss": 3.8582983016967773, "lr": 0.0003932561709090506, "tps": 19180, "wall": 12235.7} {"step": 3581, "train_loss": 3.858590602874756, "lr": 0.00039325097504421935, "tps": 19172, "wall": 12244.3} {"step": 3582, "train_loss": 3.8340823650360107, "lr": 0.00039324577721679165, "tps": 19165, "wall": 12252.0} {"step": 3583, "train_loss": 3.867401599884033, "lr": 0.00039324057742682646, "tps": 19158, "wall": 12260.0} {"step": 3584, "train_loss": 3.871260166168213, "lr": 0.00039323537567438263, "tps": 19151, "wall": 12267.7} {"step": 3585, "train_loss": 3.893995761871338, "lr": 0.00039323017195951905, "tps": 19144, "wall": 12275.4} {"step": 3586, "train_loss": 3.8260817527770996, "lr": 0.0003932249662822947, "tps": 19138, "wall": 12283.1} {"step": 3587, "train_loss": 3.963618755340576, "lr": 0.00039321975864276855, "tps": 19131, "wall": 12290.8} {"step": 3588, "train_loss": 3.843616247177124, "lr": 0.00039321454904099964, "tps": 19124, "wall": 12298.8} {"step": 3589, "train_loss": 3.810948133468628, "lr": 0.00039320933747704695, "tps": 19117, "wall": 12306.7} {"step": 3590, "train_loss": 3.9169535636901855, "lr": 0.0003932041239509695, "tps": 19110, "wall": 12314.4} {"step": 3591, "train_loss": 3.984833240509033, "lr": 0.0003931989084628264, "tps": 19104, "wall": 12322.2} {"step": 3592, "train_loss": 3.8152966499328613, "lr": 0.00039319369101267667, "tps": 19097, "wall": 12330.0} {"step": 3593, "train_loss": 3.8598804473876953, "lr": 0.00039318847160057943, "tps": 19090, "wall": 12337.8} {"step": 3594, "train_loss": 3.8611607551574707, "lr": 0.0003931832502265938, "tps": 19083, "wall": 12345.5} {"step": 3595, "train_loss": 3.8524279594421387, "lr": 0.000393178026890779, "tps": 19077, "wall": 12353.3} {"step": 3596, "train_loss": 3.7786383628845215, "lr": 0.0003931728015931941, "tps": 19070, "wall": 12361.3} {"step": 3597, "train_loss": 3.822195291519165, "lr": 0.0003931675743338983, "tps": 19063, "wall": 12369.1} {"step": 3598, "train_loss": 3.8847649097442627, "lr": 0.0003931623451129509, "tps": 19056, "wall": 12377.0} {"step": 3599, "train_loss": 3.903148651123047, "lr": 0.00039315711393041105, "tps": 19050, "wall": 12384.7} {"step": 3600, "train_loss": 3.9239754676818848, "lr": 0.0003931518807863381, "tps": 19043, "wall": 12392.5} {"step": 3601, "train_loss": 3.83823823928833, "lr": 0.0003931466456807913, "tps": 19036, "wall": 12400.6} {"step": 3602, "train_loss": 3.8853676319122314, "lr": 0.00039314140861382985, "tps": 19029, "wall": 12408.4} {"step": 3603, "train_loss": 3.786452054977417, "lr": 0.0003931361695855132, "tps": 19022, "wall": 12416.2} {"step": 3604, "train_loss": 3.9990644454956055, "lr": 0.0003931309285959006, "tps": 19015, "wall": 12424.2} {"step": 3605, "train_loss": 3.8225619792938232, "lr": 0.0003931256856450515, "tps": 19009, "wall": 12432.0} {"step": 3606, "train_loss": 3.7975125312805176, "lr": 0.0003931204407330253, "tps": 19002, "wall": 12439.7} {"step": 3607, "train_loss": 3.83998441696167, "lr": 0.00039311519385988136, "tps": 18996, "wall": 12447.4} {"step": 3608, "train_loss": 3.8799262046813965, "lr": 0.0003931099450256791, "tps": 18989, "wall": 12455.2} {"step": 3609, "train_loss": 3.755786418914795, "lr": 0.0003931046942304781, "tps": 18983, "wall": 12462.9} {"step": 3610, "train_loss": 3.9210495948791504, "lr": 0.0003930994414743377, "tps": 18976, "wall": 12470.5} {"step": 3611, "train_loss": 3.7663488388061523, "lr": 0.0003930941867573175, "tps": 18969, "wall": 12478.6} {"step": 3612, "train_loss": 3.8241326808929443, "lr": 0.00039308893007947696, "tps": 18963, "wall": 12486.5} {"step": 3613, "train_loss": 3.897409200668335, "lr": 0.0003930836714408757, "tps": 18956, "wall": 12494.3} {"step": 3614, "train_loss": 3.806380271911621, "lr": 0.00039307841084157316, "tps": 18949, "wall": 12502.1} {"step": 3615, "train_loss": 3.7842719554901123, "lr": 0.0003930731482816291, "tps": 18943, "wall": 12509.9} {"step": 3616, "train_loss": 3.730485439300537, "lr": 0.000393067883761103, "tps": 18936, "wall": 12517.5} {"step": 3617, "train_loss": 3.7637112140655518, "lr": 0.00039306261728005456, "tps": 18930, "wall": 12525.2} {"step": 3618, "train_loss": 3.8748934268951416, "lr": 0.00039305734883854354, "tps": 18924, "wall": 12532.9} {"step": 3619, "train_loss": 3.8328592777252197, "lr": 0.00039305207843662933, "tps": 18917, "wall": 12540.6} {"step": 3620, "train_loss": 3.9433822631835938, "lr": 0.0003930468060743719, "tps": 18911, "wall": 12548.2} {"step": 3621, "train_loss": 3.8189144134521484, "lr": 0.00039304153175183094, "tps": 18905, "wall": 12555.8} {"step": 3622, "train_loss": 3.7953453063964844, "lr": 0.000393036255469066, "tps": 18899, "wall": 12563.4} {"step": 3623, "train_loss": 3.7929210662841797, "lr": 0.00039303097722613714, "tps": 18892, "wall": 12571.1} {"step": 3624, "train_loss": 3.794196128845215, "lr": 0.000393025697023104, "tps": 18886, "wall": 12579.0} {"step": 3625, "train_loss": 3.7354907989501953, "lr": 0.0003930204148600264, "tps": 18879, "wall": 12586.6} {"step": 3626, "train_loss": 3.830599069595337, "lr": 0.00039301513073696404, "tps": 18873, "wall": 12594.3} {"step": 3627, "train_loss": 3.9393434524536133, "lr": 0.00039300984465397707, "tps": 18867, "wall": 12602.0} {"step": 3628, "train_loss": 3.856776714324951, "lr": 0.00039300455661112516, "tps": 18861, "wall": 12609.6} {"step": 3629, "train_loss": 3.859529972076416, "lr": 0.0003929992666084683, "tps": 18855, "wall": 12617.1} {"step": 3630, "train_loss": 3.766624689102173, "lr": 0.00039299397464606634, "tps": 18848, "wall": 12624.6} {"step": 3631, "train_loss": 3.863043785095215, "lr": 0.00039298868072397934, "tps": 18842, "wall": 12632.4} {"step": 3632, "train_loss": 3.8715155124664307, "lr": 0.00039298338484226717, "tps": 18835, "wall": 12640.4} {"step": 3633, "train_loss": 3.8399033546447754, "lr": 0.0003929780870009898, "tps": 18829, "wall": 12648.0} {"step": 3634, "train_loss": 3.783750534057617, "lr": 0.0003929727872002074, "tps": 18823, "wall": 12655.6} {"step": 3635, "train_loss": 3.8293840885162354, "lr": 0.0003929674854399799, "tps": 18816, "wall": 12663.5} {"step": 3636, "train_loss": 3.6433544158935547, "lr": 0.00039296218172036733, "tps": 18810, "wall": 12671.1} {"step": 3637, "train_loss": 3.8910155296325684, "lr": 0.0003929568760414298, "tps": 18804, "wall": 12678.7} {"step": 3638, "train_loss": 3.7469663619995117, "lr": 0.0003929515684032275, "tps": 18798, "wall": 12686.3} {"step": 3639, "train_loss": 3.848590850830078, "lr": 0.0003929462588058204, "tps": 18792, "wall": 12694.0} {"step": 3640, "train_loss": 3.8259048461914062, "lr": 0.00039294094724926876, "tps": 18786, "wall": 12701.7} {"step": 3641, "train_loss": 3.8304154872894287, "lr": 0.00039293563373363265, "tps": 18780, "wall": 12709.3} {"step": 3642, "train_loss": 3.8407788276672363, "lr": 0.0003929303182589724, "tps": 18774, "wall": 12716.9} {"step": 3643, "train_loss": 3.806800365447998, "lr": 0.0003929250008253481, "tps": 18767, "wall": 12724.7} {"step": 3644, "train_loss": 3.854816436767578, "lr": 0.0003929196814328201, "tps": 18761, "wall": 12732.3} {"step": 3645, "train_loss": 3.9197113513946533, "lr": 0.0003929143600814485, "tps": 18755, "wall": 12739.9} {"step": 3646, "train_loss": 3.8671627044677734, "lr": 0.00039290903677129373, "tps": 18749, "wall": 12747.6} {"step": 3647, "train_loss": 3.793638229370117, "lr": 0.00039290371150241607, "tps": 18743, "wall": 12755.3} {"step": 3648, "train_loss": 3.8848843574523926, "lr": 0.0003928983842748758, "tps": 18736, "wall": 12763.3} {"step": 3649, "train_loss": 3.8643665313720703, "lr": 0.0003928930550887332, "tps": 18730, "wall": 12771.0} {"step": 3650, "train_loss": 3.9344539642333984, "lr": 0.0003928877239440488, "tps": 18724, "wall": 12778.8} {"step": 3651, "train_loss": 3.9548473358154297, "lr": 0.0003928823908408828, "tps": 18717, "wall": 12786.8} {"step": 3652, "train_loss": 3.8527891635894775, "lr": 0.00039287705577929587, "tps": 18710, "wall": 12795.0} {"step": 3653, "train_loss": 3.912294626235962, "lr": 0.00039287171875934825, "tps": 18704, "wall": 12803.0} {"step": 3654, "train_loss": 3.83811354637146, "lr": 0.0003928663797811004, "tps": 18698, "wall": 12810.7} {"step": 3655, "train_loss": 3.8318843841552734, "lr": 0.0003928610388446129, "tps": 18691, "wall": 12818.7} {"step": 3656, "train_loss": 3.763241767883301, "lr": 0.0003928556959499462, "tps": 18685, "wall": 12826.3} {"step": 3657, "train_loss": 3.748792886734009, "lr": 0.0003928503510971608, "tps": 18679, "wall": 12834.0} {"step": 3658, "train_loss": 3.7687463760375977, "lr": 0.0003928450042863173, "tps": 18673, "wall": 12841.8} {"step": 3659, "train_loss": 3.8467049598693848, "lr": 0.0003928396555174762, "tps": 18666, "wall": 12849.8} {"step": 3660, "train_loss": 3.7377543449401855, "lr": 0.00039283430479069816, "tps": 18660, "wall": 12857.5} {"step": 3661, "train_loss": 3.8644814491271973, "lr": 0.0003928289521060437, "tps": 18654, "wall": 12865.2} {"step": 3662, "train_loss": 3.8954033851623535, "lr": 0.00039282359746357367, "tps": 18648, "wall": 12872.8} {"step": 3663, "train_loss": 3.8791866302490234, "lr": 0.00039281824086334844, "tps": 18642, "wall": 12880.4} {"step": 3664, "train_loss": 3.8229734897613525, "lr": 0.0003928128823054289, "tps": 18636, "wall": 12888.0} {"step": 3665, "train_loss": 3.921062469482422, "lr": 0.0003928075217898756, "tps": 18630, "wall": 12895.6} {"step": 3666, "train_loss": 3.8561480045318604, "lr": 0.0003928021593167494, "tps": 18624, "wall": 12903.5} {"step": 3667, "train_loss": 3.751660108566284, "lr": 0.00039279679488611103, "tps": 18617, "wall": 12912.0} {"step": 3668, "train_loss": 3.872863292694092, "lr": 0.0003927914284980212, "tps": 18611, "wall": 12919.7} {"step": 3669, "train_loss": 3.82346773147583, "lr": 0.00039278606015254067, "tps": 18605, "wall": 12927.3} {"step": 3670, "train_loss": 3.8580124378204346, "lr": 0.0003927806898497303, "tps": 18597, "wall": 12936.5} {"step": 3671, "train_loss": 3.8172833919525146, "lr": 0.000392775317589651, "tps": 18591, "wall": 12944.3} {"step": 3672, "train_loss": 3.8059027194976807, "lr": 0.0003927699433723635, "tps": 18583, "wall": 12953.0} {"step": 3673, "train_loss": 3.795681953430176, "lr": 0.00039276456719792874, "tps": 18576, "wall": 12961.3} {"step": 3674, "train_loss": 3.797293186187744, "lr": 0.00039275918906640767, "tps": 18570, "wall": 12969.0} {"step": 3675, "train_loss": 3.8249361515045166, "lr": 0.00039275380897786107, "tps": 18562, "wall": 12978.1} {"step": 3676, "train_loss": 3.87180757522583, "lr": 0.00039274842693235004, "tps": 18556, "wall": 12985.8} {"step": 3677, "train_loss": 3.714900493621826, "lr": 0.00039274304292993546, "tps": 18548, "wall": 12994.9} {"step": 3678, "train_loss": 3.8742566108703613, "lr": 0.00039273765697067837, "tps": 18542, "wall": 13002.7} {"step": 3679, "train_loss": 3.7719812393188477, "lr": 0.00039273226905463975, "tps": 18535, "wall": 13011.7} {"step": 3680, "train_loss": 3.7307186126708984, "lr": 0.0003927268791818806, "tps": 18528, "wall": 13019.9} {"step": 3681, "train_loss": 3.844820022583008, "lr": 0.00039272148735246205, "tps": 18522, "wall": 13027.9} {"step": 3682, "train_loss": 3.8203415870666504, "lr": 0.00039271609356644516, "tps": 18515, "wall": 13036.2} {"step": 3683, "train_loss": 3.8290746212005615, "lr": 0.00039271069782389096, "tps": 18509, "wall": 13044.0} {"step": 3684, "train_loss": 3.719546318054199, "lr": 0.0003927053001248607, "tps": 18503, "wall": 13051.8} {"step": 3685, "train_loss": 3.8846006393432617, "lr": 0.0003926999004694154, "tps": 18497, "wall": 13059.4} {"step": 3686, "train_loss": 3.8674421310424805, "lr": 0.00039269449885761637, "tps": 18491, "wall": 13067.0} {"step": 3687, "train_loss": 3.8699846267700195, "lr": 0.0003926890952895247, "tps": 18485, "wall": 13074.7} {"step": 3688, "train_loss": 3.8113276958465576, "lr": 0.00039268368976520156, "tps": 18479, "wall": 13082.5} {"step": 3689, "train_loss": 3.842052936553955, "lr": 0.00039267828228470823, "tps": 18474, "wall": 13090.1} {"step": 3690, "train_loss": 3.8515405654907227, "lr": 0.00039267287284810596, "tps": 18468, "wall": 13097.8} {"step": 3691, "train_loss": 3.8322501182556152, "lr": 0.0003926674614554561, "tps": 18462, "wall": 13105.6} {"step": 3692, "train_loss": 3.8749842643737793, "lr": 0.0003926620481068199, "tps": 18456, "wall": 13113.2} {"step": 3693, "train_loss": 3.803699493408203, "lr": 0.0003926566328022587, "tps": 18450, "wall": 13120.9} {"step": 3694, "train_loss": 3.8300373554229736, "lr": 0.0003926512155418338, "tps": 18444, "wall": 13128.6} {"step": 3695, "train_loss": 3.8593244552612305, "lr": 0.00039264579632560654, "tps": 18439, "wall": 13136.2} {"step": 3696, "train_loss": 3.794445514678955, "lr": 0.0003926403751536384, "tps": 18433, "wall": 13144.0} {"step": 3697, "train_loss": 3.870570421218872, "lr": 0.00039263495202599075, "tps": 18427, "wall": 13152.0} {"step": 3698, "train_loss": 3.8752121925354004, "lr": 0.000392629526942725, "tps": 18421, "wall": 13159.7} {"step": 3699, "train_loss": 3.8296051025390625, "lr": 0.00039262409990390264, "tps": 18415, "wall": 13167.3} {"step": 3700, "train_loss": 3.82661509513855, "lr": 0.00039261867090958517, "tps": 18409, "wall": 13174.9} {"step": 3701, "train_loss": 3.78717041015625, "lr": 0.00039261323995983406, "tps": 18404, "wall": 13182.6} {"step": 3702, "train_loss": 3.891712188720703, "lr": 0.00039260780705471077, "tps": 18398, "wall": 13190.3} {"step": 3703, "train_loss": 3.8492794036865234, "lr": 0.00039260237219427695, "tps": 18392, "wall": 13198.2} {"step": 3704, "train_loss": 3.9496614933013916, "lr": 0.0003925969353785941, "tps": 18386, "wall": 13205.8} {"step": 3705, "train_loss": 3.8566231727600098, "lr": 0.0003925914966077238, "tps": 18381, "wall": 13213.4} {"step": 3706, "train_loss": 3.835261821746826, "lr": 0.0003925860558817278, "tps": 18375, "wall": 13221.0} {"step": 3707, "train_loss": 3.756591558456421, "lr": 0.0003925806132006675, "tps": 18369, "wall": 13228.7} {"step": 3708, "train_loss": 3.9105443954467773, "lr": 0.0003925751685646047, "tps": 18363, "wall": 13236.5} {"step": 3709, "train_loss": 3.7642948627471924, "lr": 0.00039256972197360113, "tps": 18358, "wall": 13244.1} {"step": 3710, "train_loss": 3.917750835418701, "lr": 0.0003925642734277184, "tps": 18352, "wall": 13251.7} {"step": 3711, "train_loss": 3.8651375770568848, "lr": 0.00039255882292701813, "tps": 18346, "wall": 13259.5} {"step": 3712, "train_loss": 3.8803179264068604, "lr": 0.0003925533704715623, "tps": 18341, "wall": 13267.2} {"step": 3713, "train_loss": 3.8310060501098633, "lr": 0.0003925479160614125, "tps": 18335, "wall": 13274.9} {"step": 3714, "train_loss": 3.845883846282959, "lr": 0.0003925424596966306, "tps": 18329, "wall": 13282.7} {"step": 3715, "train_loss": 3.7667505741119385, "lr": 0.0003925370013772784, "tps": 18324, "wall": 13290.2} {"step": 3716, "train_loss": 3.7796125411987305, "lr": 0.00039253154110341766, "tps": 18318, "wall": 13298.0} {"step": 3717, "train_loss": 3.759045362472534, "lr": 0.0003925260788751103, "tps": 18312, "wall": 13305.7} {"step": 3718, "train_loss": 3.8501555919647217, "lr": 0.00039252061469241816, "tps": 18306, "wall": 13313.7} {"step": 3719, "train_loss": 3.786534070968628, "lr": 0.00039251514855540324, "tps": 18300, "wall": 13322.1} {"step": 3720, "train_loss": 3.687011241912842, "lr": 0.00039250968046412735, "tps": 18293, "wall": 13330.2} {"step": 3721, "train_loss": 3.7701010704040527, "lr": 0.0003925042104186524, "tps": 18287, "wall": 13338.2} {"step": 3722, "train_loss": 3.8466930389404297, "lr": 0.0003924987384190405, "tps": 18281, "wall": 13346.3} {"step": 3723, "train_loss": 3.7071585655212402, "lr": 0.00039249326446535353, "tps": 18275, "wall": 13354.5} {"step": 3724, "train_loss": 3.9450478553771973, "lr": 0.00039248778855765354, "tps": 18269, "wall": 13362.5} {"step": 3725, "train_loss": 3.680131435394287, "lr": 0.0003924823106960026, "tps": 18262, "wall": 13370.6} {"step": 3726, "train_loss": 3.9342269897460938, "lr": 0.00039247683088046263, "tps": 18256, "wall": 13378.9} {"step": 3727, "train_loss": 3.837026834487915, "lr": 0.0003924713491110958, "tps": 18250, "wall": 13386.9} {"step": 3728, "train_loss": 3.864109516143799, "lr": 0.00039246586538796424, "tps": 18244, "wall": 13395.0} {"step": 3729, "train_loss": 3.794232130050659, "lr": 0.00039246037971113, "tps": 18237, "wall": 13403.3} {"step": 3730, "train_loss": 3.7896370887756348, "lr": 0.00039245489208065526, "tps": 18231, "wall": 13411.6} {"step": 3731, "train_loss": 3.885171413421631, "lr": 0.00039244940249660214, "tps": 18225, "wall": 13419.7} {"step": 3732, "train_loss": 3.8008997440338135, "lr": 0.0003924439109590329, "tps": 18219, "wall": 13427.8} {"step": 3733, "train_loss": 3.9187653064727783, "lr": 0.0003924384174680097, "tps": 18213, "wall": 13435.8} {"step": 3734, "train_loss": 3.8350188732147217, "lr": 0.00039243292202359475, "tps": 18207, "wall": 13444.1} {"step": 3735, "train_loss": 3.856675624847412, "lr": 0.00039242742462585037, "tps": 18200, "wall": 13452.2} {"step": 3736, "train_loss": 3.814497470855713, "lr": 0.00039242192527483874, "tps": 18194, "wall": 13460.2} {"step": 3737, "train_loss": 3.8347578048706055, "lr": 0.00039241642397062226, "tps": 18188, "wall": 13468.4} {"step": 3738, "train_loss": 3.8066163063049316, "lr": 0.00039241092071326327, "tps": 18182, "wall": 13476.5} {"step": 3739, "train_loss": 3.8061909675598145, "lr": 0.0003924054155028239, "tps": 18176, "wall": 13484.7} {"step": 3740, "train_loss": 3.845614433288574, "lr": 0.0003923999083393667, "tps": 18170, "wall": 13492.8} {"step": 3741, "train_loss": 3.8121814727783203, "lr": 0.000392394399222954, "tps": 18164, "wall": 13501.0} {"step": 3742, "train_loss": 3.8153061866760254, "lr": 0.00039238888815364836, "tps": 18158, "wall": 13509.0} {"step": 3743, "train_loss": 3.8290817737579346, "lr": 0.00039238337513151195, "tps": 18152, "wall": 13517.1} {"step": 3744, "train_loss": 3.8260605335235596, "lr": 0.00039237786015660736, "tps": 18146, "wall": 13525.3} {"step": 3745, "train_loss": 3.8595542907714844, "lr": 0.000392372343228997, "tps": 18140, "wall": 13533.4} {"step": 3746, "train_loss": 3.712568759918213, "lr": 0.0003923668243487434, "tps": 18134, "wall": 13541.6} {"step": 3747, "train_loss": 3.855353593826294, "lr": 0.00039236130351590916, "tps": 18127, "wall": 13549.8} {"step": 3748, "train_loss": 3.726313352584839, "lr": 0.0003923557807305567, "tps": 18121, "wall": 13558.0} {"step": 3749, "train_loss": 3.817159652709961, "lr": 0.00039235025599274867, "tps": 18115, "wall": 13566.1} {"step": 3750, "train_loss": 3.804999351501465, "lr": 0.0003923447293025476, "tps": 18109, "wall": 13574.2} {"step": 3751, "train_loss": 3.7868833541870117, "lr": 0.0003923392006600162, "tps": 18103, "wall": 13582.3} {"step": 3752, "train_loss": 3.814140796661377, "lr": 0.0003923336700652168, "tps": 18097, "wall": 13590.5} {"step": 3753, "train_loss": 3.861112594604492, "lr": 0.0003923281375182124, "tps": 18091, "wall": 13598.5} {"step": 3754, "train_loss": 3.9600236415863037, "lr": 0.0003923226030190656, "tps": 18085, "wall": 13606.6} {"step": 3755, "train_loss": 3.8663899898529053, "lr": 0.00039231706656783896, "tps": 18080, "wall": 13614.6} {"step": 3756, "train_loss": 3.801457166671753, "lr": 0.0003923115281645953, "tps": 18074, "wall": 13622.8} {"step": 3757, "train_loss": 3.8102481365203857, "lr": 0.00039230598780939723, "tps": 18068, "wall": 13630.8} {"step": 3758, "train_loss": 3.796670913696289, "lr": 0.0003923004455023076, "tps": 18062, "wall": 13638.9} {"step": 3759, "train_loss": 3.8830106258392334, "lr": 0.00039229490124338933, "tps": 18056, "wall": 13647.0} {"step": 3760, "train_loss": 3.794252872467041, "lr": 0.000392289355032705, "tps": 18050, "wall": 13655.2} {"step": 3761, "train_loss": 3.9097723960876465, "lr": 0.00039228380687031763, "tps": 18044, "wall": 13663.3} {"step": 3762, "train_loss": 3.759256362915039, "lr": 0.00039227825675628987, "tps": 18038, "wall": 13671.3} {"step": 3763, "train_loss": 3.831244468688965, "lr": 0.00039227270469068475, "tps": 18032, "wall": 13679.4} {"step": 3764, "train_loss": 3.831864356994629, "lr": 0.0003922671506735651, "tps": 18026, "wall": 13687.4} {"step": 3765, "train_loss": 3.7729125022888184, "lr": 0.0003922615947049939, "tps": 18021, "wall": 13695.5} {"step": 3766, "train_loss": 3.8703131675720215, "lr": 0.000392256036785034, "tps": 18015, "wall": 13703.5} {"step": 3767, "train_loss": 3.8390889167785645, "lr": 0.00039225047691374837, "tps": 18009, "wall": 13711.6} {"step": 3768, "train_loss": 3.794182300567627, "lr": 0.00039224491509120006, "tps": 18003, "wall": 13719.6} {"step": 3769, "train_loss": 3.8841419219970703, "lr": 0.000392239351317452, "tps": 17997, "wall": 13727.7} {"step": 3770, "train_loss": 3.8337693214416504, "lr": 0.00039223378559256726, "tps": 17992, "wall": 13735.8} {"step": 3771, "train_loss": 3.680678367614746, "lr": 0.00039222821791660886, "tps": 17986, "wall": 13743.9} {"step": 3772, "train_loss": 3.749603748321533, "lr": 0.0003922226482896399, "tps": 17980, "wall": 13751.9} {"step": 3773, "train_loss": 3.8994879722595215, "lr": 0.0003922170767117235, "tps": 17974, "wall": 13760.0} {"step": 3774, "train_loss": 3.7555999755859375, "lr": 0.0003922115031829227, "tps": 17968, "wall": 13768.3} {"step": 3775, "train_loss": 3.8457376956939697, "lr": 0.0003922059277033007, "tps": 17962, "wall": 13776.5} {"step": 3776, "train_loss": 3.7397544384002686, "lr": 0.0003922003502729206, "tps": 17956, "wall": 13784.6} {"step": 3777, "train_loss": 3.80086088180542, "lr": 0.0003921947708918457, "tps": 17951, "wall": 13792.6} {"step": 3778, "train_loss": 3.8080801963806152, "lr": 0.000392189189560139, "tps": 17945, "wall": 13800.4} {"step": 3779, "train_loss": 3.751906394958496, "lr": 0.0003921836062778639, "tps": 17940, "wall": 13808.1} {"step": 3780, "train_loss": 3.699218988418579, "lr": 0.0003921780210450836, "tps": 17935, "wall": 13815.8} {"step": 3781, "train_loss": 3.8840579986572266, "lr": 0.00039217243386186135, "tps": 17930, "wall": 13823.5} {"step": 3782, "train_loss": 3.8283274173736572, "lr": 0.0003921668447282605, "tps": 17924, "wall": 13831.2} {"step": 3783, "train_loss": 3.923525810241699, "lr": 0.0003921612536443442, "tps": 17919, "wall": 13839.0} {"step": 3784, "train_loss": 3.854879379272461, "lr": 0.00039215566061017603, "tps": 17914, "wall": 13846.7} {"step": 3785, "train_loss": 3.8376975059509277, "lr": 0.00039215006562581914, "tps": 17909, "wall": 13854.3} {"step": 3786, "train_loss": 3.6551432609558105, "lr": 0.0003921444686913371, "tps": 17903, "wall": 13862.1} {"step": 3787, "train_loss": 3.8904545307159424, "lr": 0.00039213886980679315, "tps": 17898, "wall": 13869.8} {"step": 3788, "train_loss": 3.8519198894500732, "lr": 0.00039213326897225074, "tps": 17893, "wall": 13877.4} {"step": 3789, "train_loss": 3.8961329460144043, "lr": 0.00039212766618777333, "tps": 17888, "wall": 13885.2} {"step": 3790, "train_loss": 3.7812819480895996, "lr": 0.0003921220614534245, "tps": 17883, "wall": 13892.8} {"step": 3791, "train_loss": 3.875722885131836, "lr": 0.00039211645476926757, "tps": 17878, "wall": 13900.5} {"step": 3792, "train_loss": 3.816645860671997, "lr": 0.00039211084613536613, "tps": 17872, "wall": 13908.3} {"step": 3793, "train_loss": 3.7727627754211426, "lr": 0.00039210523555178377, "tps": 17867, "wall": 13915.9} {"step": 3794, "train_loss": 3.820949077606201, "lr": 0.0003920996230185839, "tps": 17862, "wall": 13923.7} {"step": 3795, "train_loss": 3.913938045501709, "lr": 0.00039209400853583025, "tps": 17857, "wall": 13931.4} {"step": 3796, "train_loss": 3.7743000984191895, "lr": 0.0003920883921035864, "tps": 17851, "wall": 13939.1} {"step": 3797, "train_loss": 3.786830425262451, "lr": 0.00039208277372191583, "tps": 17846, "wall": 13946.8} {"step": 3798, "train_loss": 3.7045822143554688, "lr": 0.00039207715339088236, "tps": 17841, "wall": 13954.4} {"step": 3799, "train_loss": 3.7503509521484375, "lr": 0.00039207153111054955, "tps": 17836, "wall": 13962.2} {"step": 3800, "train_loss": 3.745466709136963, "lr": 0.0003920659068809812, "tps": 17831, "wall": 13969.9} {"step": 3801, "train_loss": 3.7748966217041016, "lr": 0.00039206028070224087, "tps": 17826, "wall": 13977.5} {"step": 3802, "train_loss": 3.8437085151672363, "lr": 0.00039205465257439244, "tps": 17821, "wall": 13985.3} {"step": 3803, "train_loss": 3.748183012008667, "lr": 0.0003920490224974995, "tps": 17815, "wall": 13993.0} {"step": 3804, "train_loss": 3.8947091102600098, "lr": 0.000392043390471626, "tps": 17810, "wall": 14000.7} {"step": 3805, "train_loss": 3.764497995376587, "lr": 0.0003920377564968357, "tps": 17805, "wall": 14008.4} {"step": 3806, "train_loss": 3.8803939819335938, "lr": 0.00039203212057319233, "tps": 17800, "wall": 14016.1} {"step": 3807, "train_loss": 3.8847885131835938, "lr": 0.00039202648270075975, "tps": 17795, "wall": 14023.7} {"step": 3808, "train_loss": 3.7517216205596924, "lr": 0.000392020842879602, "tps": 17790, "wall": 14031.5} {"step": 3809, "train_loss": 3.7969000339508057, "lr": 0.0003920152011097827, "tps": 17784, "wall": 14039.5} {"step": 3810, "train_loss": 3.7768452167510986, "lr": 0.000392009557391366, "tps": 17779, "wall": 14047.2} {"step": 3811, "train_loss": 3.9623780250549316, "lr": 0.0003920039117244156, "tps": 17774, "wall": 14054.8} {"step": 3812, "train_loss": 3.8364391326904297, "lr": 0.00039199826410899564, "tps": 17769, "wall": 14062.5} {"step": 3813, "train_loss": 3.73486065864563, "lr": 0.0003919926145451701, "tps": 17764, "wall": 14070.2} {"step": 3814, "train_loss": 3.7447309494018555, "lr": 0.0003919869630330029, "tps": 17759, "wall": 14077.9} {"step": 3815, "train_loss": 3.8239238262176514, "lr": 0.00039198130957255803, "tps": 17754, "wall": 14085.5} {"step": 3816, "train_loss": 3.873323678970337, "lr": 0.0003919756541638996, "tps": 17749, "wall": 14093.3} {"step": 3817, "train_loss": 3.880002498626709, "lr": 0.00039196999680709166, "tps": 17744, "wall": 14101.1} {"step": 3818, "train_loss": 3.8911428451538086, "lr": 0.0003919643375021983, "tps": 17739, "wall": 14108.8} {"step": 3819, "train_loss": 3.7705605030059814, "lr": 0.00039195867624928365, "tps": 17734, "wall": 14116.6} {"step": 3820, "train_loss": 3.910945177078247, "lr": 0.0003919530130484118, "tps": 17729, "wall": 14124.3} {"step": 3821, "train_loss": 3.862598180770874, "lr": 0.0003919473478996469, "tps": 17724, "wall": 14132.0} {"step": 3822, "train_loss": 3.811413288116455, "lr": 0.0003919416808030531, "tps": 17719, "wall": 14139.7} {"step": 3823, "train_loss": 3.7930707931518555, "lr": 0.00039193601175869467, "tps": 17714, "wall": 14147.4} {"step": 3824, "train_loss": 3.775266170501709, "lr": 0.0003919303407666358, "tps": 17709, "wall": 14155.1} {"step": 3825, "train_loss": 3.7951815128326416, "lr": 0.0003919246678269407, "tps": 17704, "wall": 14162.8} {"step": 3826, "train_loss": 3.853393077850342, "lr": 0.0003919189929396737, "tps": 17699, "wall": 14170.6} {"step": 3827, "train_loss": 3.7563014030456543, "lr": 0.000391913316104899, "tps": 17694, "wall": 14178.3} {"step": 3828, "train_loss": 3.6914799213409424, "lr": 0.000391907637322681, "tps": 17689, "wall": 14186.0} {"step": 3829, "train_loss": 3.801913022994995, "lr": 0.00039190195659308404, "tps": 17684, "wall": 14193.8} {"step": 3830, "train_loss": 3.830571174621582, "lr": 0.0003918962739161723, "tps": 17679, "wall": 14201.4} {"step": 3831, "train_loss": 3.7307841777801514, "lr": 0.00039189058929201036, "tps": 17674, "wall": 14209.1} {"step": 3832, "train_loss": 3.817781925201416, "lr": 0.00039188490272066244, "tps": 17669, "wall": 14216.8} {"step": 3833, "train_loss": 3.896091938018799, "lr": 0.0003918792142021932, "tps": 17664, "wall": 14224.7} {"step": 3834, "train_loss": 3.8862109184265137, "lr": 0.00039187352373666677, "tps": 17659, "wall": 14232.4} {"step": 3835, "train_loss": 3.8482425212860107, "lr": 0.0003918678313241478, "tps": 17654, "wall": 14240.1} {"step": 3836, "train_loss": 3.8601818084716797, "lr": 0.00039186213696470074, "tps": 17649, "wall": 14247.9} {"step": 3837, "train_loss": 3.8028430938720703, "lr": 0.0003918564406583901, "tps": 17644, "wall": 14255.6} {"step": 3838, "train_loss": 3.8623833656311035, "lr": 0.00039185074240528044, "tps": 17639, "wall": 14263.4} {"step": 3839, "train_loss": 3.757819175720215, "lr": 0.00039184504220543624, "tps": 17634, "wall": 14271.2} {"step": 3840, "train_loss": 3.733940601348877, "lr": 0.0003918393400589221, "tps": 17629, "wall": 14278.9} {"step": 3841, "train_loss": 3.865847587585449, "lr": 0.0003918336359658026, "tps": 17624, "wall": 14286.6} {"step": 3842, "train_loss": 3.874586820602417, "lr": 0.0003918279299261424, "tps": 17619, "wall": 14294.3} {"step": 3843, "train_loss": 3.832472801208496, "lr": 0.00039182222194000614, "tps": 17614, "wall": 14302.0} {"step": 3844, "train_loss": 3.7344436645507812, "lr": 0.00039181651200745837, "tps": 17609, "wall": 14309.7} {"step": 3845, "train_loss": 3.894890308380127, "lr": 0.00039181080012856397, "tps": 17604, "wall": 14317.4} {"step": 3846, "train_loss": 3.8711414337158203, "lr": 0.00039180508630338746, "tps": 17599, "wall": 14325.2} {"step": 3847, "train_loss": 3.8075077533721924, "lr": 0.00039179937053199367, "tps": 17594, "wall": 14332.8} {"step": 3848, "train_loss": 3.802290916442871, "lr": 0.0003917936528144473, "tps": 17589, "wall": 14340.7} {"step": 3849, "train_loss": 3.7617859840393066, "lr": 0.0003917879331508131, "tps": 17584, "wall": 14348.5} {"step": 3850, "train_loss": 3.799894094467163, "lr": 0.00039178221154115593, "tps": 17579, "wall": 14356.2} {"step": 3851, "train_loss": 3.8608367443084717, "lr": 0.00039177648798554063, "tps": 17574, "wall": 14363.9} {"step": 3852, "train_loss": 3.769930362701416, "lr": 0.00039177076248403186, "tps": 17570, "wall": 14371.6} {"step": 3853, "train_loss": 3.811945915222168, "lr": 0.00039176503503669466, "tps": 17565, "wall": 14379.2} {"step": 3854, "train_loss": 3.726764678955078, "lr": 0.0003917593056435939, "tps": 17560, "wall": 14386.9} {"step": 3855, "train_loss": 3.8712570667266846, "lr": 0.00039175357430479437, "tps": 17555, "wall": 14394.6} {"step": 3856, "train_loss": 3.87833571434021, "lr": 0.0003917478410203611, "tps": 17550, "wall": 14402.5} {"step": 3857, "train_loss": 3.686898708343506, "lr": 0.000391742105790359, "tps": 17545, "wall": 14410.2} {"step": 3858, "train_loss": 3.739666700363159, "lr": 0.00039173636861485306, "tps": 17540, "wall": 14417.9} {"step": 3859, "train_loss": 3.8815743923187256, "lr": 0.0003917306294939082, "tps": 17536, "wall": 14425.6} {"step": 3860, "train_loss": 3.710808753967285, "lr": 0.00039172488842758945, "tps": 17531, "wall": 14433.3} {"step": 3861, "train_loss": 3.8748202323913574, "lr": 0.00039171914541596194, "tps": 17526, "wall": 14441.1} {"step": 3862, "train_loss": 3.8067550659179688, "lr": 0.0003917134004590906, "tps": 17521, "wall": 14448.8} {"step": 3863, "train_loss": 3.8101260662078857, "lr": 0.0003917076535570406, "tps": 17516, "wall": 14456.4} {"step": 3864, "train_loss": 3.8078601360321045, "lr": 0.000391701904709877, "tps": 17511, "wall": 14464.2} {"step": 3865, "train_loss": 3.7946951389312744, "lr": 0.0003916961539176649, "tps": 17507, "wall": 14472.0} {"step": 3866, "train_loss": 3.700923442840576, "lr": 0.0003916904011804696, "tps": 17502, "wall": 14479.7} {"step": 3867, "train_loss": 3.732245922088623, "lr": 0.00039168464649835604, "tps": 17497, "wall": 14487.4} {"step": 3868, "train_loss": 3.850771903991699, "lr": 0.00039167888987138953, "tps": 17492, "wall": 14495.1} {"step": 3869, "train_loss": 3.72532320022583, "lr": 0.0003916731312996353, "tps": 17487, "wall": 14502.8} {"step": 3870, "train_loss": 3.8465781211853027, "lr": 0.0003916673707831585, "tps": 17483, "wall": 14510.4} {"step": 3871, "train_loss": 3.8055076599121094, "lr": 0.0003916616083220245, "tps": 17478, "wall": 14518.4} {"step": 3872, "train_loss": 3.7353320121765137, "lr": 0.0003916558439162985, "tps": 17473, "wall": 14526.2} {"step": 3873, "train_loss": 3.7391695976257324, "lr": 0.00039165007756604577, "tps": 17468, "wall": 14533.8} {"step": 3874, "train_loss": 3.710294008255005, "lr": 0.0003916443092713317, "tps": 17463, "wall": 14541.6} {"step": 3875, "train_loss": 3.873828887939453, "lr": 0.0003916385390322216, "tps": 17459, "wall": 14549.3} {"step": 3876, "train_loss": 3.707620620727539, "lr": 0.00039163276684878087, "tps": 17454, "wall": 14557.0} {"step": 3877, "train_loss": 3.854790449142456, "lr": 0.00039162699272107484, "tps": 17449, "wall": 14564.8} {"step": 3878, "train_loss": 3.8815596103668213, "lr": 0.00039162121664916897, "tps": 17444, "wall": 14572.6} {"step": 3879, "train_loss": 3.822178840637207, "lr": 0.0003916154386331287, "tps": 17439, "wall": 14580.4} {"step": 3880, "train_loss": 3.818403720855713, "lr": 0.0003916096586730194, "tps": 17435, "wall": 14588.2} {"step": 3881, "train_loss": 3.9080052375793457, "lr": 0.00039160387676890663, "tps": 17430, "wall": 14595.9} {"step": 3882, "train_loss": 3.7776808738708496, "lr": 0.00039159809292085585, "tps": 17425, "wall": 14603.6} {"step": 3883, "train_loss": 3.8232364654541016, "lr": 0.0003915923071289326, "tps": 17420, "wall": 14611.4} {"step": 3884, "train_loss": 3.799823760986328, "lr": 0.00039158651939320247, "tps": 17416, "wall": 14619.1} {"step": 3885, "train_loss": 3.9553232192993164, "lr": 0.0003915807297137309, "tps": 17411, "wall": 14626.8} {"step": 3886, "train_loss": 3.8006553649902344, "lr": 0.00039157493809058357, "tps": 17406, "wall": 14634.5} {"step": 3887, "train_loss": 3.827469825744629, "lr": 0.000391569144523826, "tps": 17401, "wall": 14642.3} {"step": 3888, "train_loss": 3.8688840866088867, "lr": 0.0003915633490135239, "tps": 17397, "wall": 14650.0} {"step": 3889, "train_loss": 3.797745704650879, "lr": 0.0003915575515597429, "tps": 17392, "wall": 14657.6} {"step": 3890, "train_loss": 3.787479877471924, "lr": 0.00039155175216254874, "tps": 17388, "wall": 14665.3} {"step": 3891, "train_loss": 3.7341203689575195, "lr": 0.000391545950822007, "tps": 17383, "wall": 14673.1} {"step": 3892, "train_loss": 3.823392391204834, "lr": 0.0003915401475381835, "tps": 17378, "wall": 14680.8} {"step": 3893, "train_loss": 3.8107235431671143, "lr": 0.00039153434231114386, "tps": 17374, "wall": 14688.4} {"step": 3894, "train_loss": 3.847252130508423, "lr": 0.00039152853514095394, "tps": 17369, "wall": 14696.2} {"step": 3895, "train_loss": 3.8259835243225098, "lr": 0.0003915227260276795, "tps": 17364, "wall": 14704.1} {"step": 3896, "train_loss": 3.9406118392944336, "lr": 0.0003915169149713863, "tps": 17359, "wall": 14711.8} {"step": 3897, "train_loss": 3.7969701290130615, "lr": 0.00039151110197214024, "tps": 17355, "wall": 14719.5} {"step": 3898, "train_loss": 3.740661382675171, "lr": 0.00039150528703000713, "tps": 17350, "wall": 14727.2} {"step": 3899, "train_loss": 3.9030656814575195, "lr": 0.00039149947014505284, "tps": 17345, "wall": 14734.9} {"step": 3900, "train_loss": 3.834014415740967, "lr": 0.00039149365131734335, "tps": 17341, "wall": 14742.6} {"step": 3901, "train_loss": 3.6924798488616943, "lr": 0.0003914878305469444, "tps": 17336, "wall": 14750.3} {"step": 3902, "train_loss": 3.7792317867279053, "lr": 0.00039148200783392206, "tps": 17331, "wall": 14758.1} {"step": 3903, "train_loss": 3.8903799057006836, "lr": 0.0003914761831783423, "tps": 17327, "wall": 14765.9} {"step": 3904, "train_loss": 3.777250289916992, "lr": 0.000391470356580271, "tps": 17322, "wall": 14773.7} {"step": 3905, "train_loss": 3.805835485458374, "lr": 0.0003914645280397743, "tps": 17318, "wall": 14781.3} {"step": 3906, "train_loss": 3.7482619285583496, "lr": 0.00039145869755691806, "tps": 17313, "wall": 14789.0} {"step": 3907, "train_loss": 3.791459321975708, "lr": 0.00039145286513176845, "tps": 17308, "wall": 14796.8} {"step": 3908, "train_loss": 3.803891181945801, "lr": 0.00039144703076439153, "tps": 17304, "wall": 14804.4} {"step": 3909, "train_loss": 3.881301164627075, "lr": 0.0003914411944548534, "tps": 17299, "wall": 14812.2} {"step": 3910, "train_loss": 3.7883620262145996, "lr": 0.00039143535620322006, "tps": 17294, "wall": 14820.1} {"step": 3911, "train_loss": 3.6908700466156006, "lr": 0.0003914295160095578, "tps": 17290, "wall": 14827.8} {"step": 3912, "train_loss": 3.77030611038208, "lr": 0.0003914236738739327, "tps": 17285, "wall": 14835.5} {"step": 3913, "train_loss": 3.874286651611328, "lr": 0.00039141782979641086, "tps": 17281, "wall": 14843.1} {"step": 3914, "train_loss": 3.768798351287842, "lr": 0.00039141198377705866, "tps": 17276, "wall": 14850.8} {"step": 3915, "train_loss": 3.8287904262542725, "lr": 0.0003914061358159423, "tps": 17272, "wall": 14858.5} {"step": 3916, "train_loss": 3.718078136444092, "lr": 0.0003914002859131278, "tps": 17267, "wall": 14866.2} {"step": 3917, "train_loss": 3.772829055786133, "lr": 0.00039139443406868165, "tps": 17263, "wall": 14874.0} {"step": 3918, "train_loss": 3.760927677154541, "lr": 0.0003913885802826701, "tps": 17258, "wall": 14881.8} {"step": 3919, "train_loss": 3.677049160003662, "lr": 0.0003913827245551595, "tps": 17253, "wall": 14889.5} {"step": 3920, "train_loss": 3.7831082344055176, "lr": 0.000391376866886216, "tps": 17249, "wall": 14897.2} {"step": 3921, "train_loss": 3.799168825149536, "lr": 0.00039137100727590617, "tps": 17244, "wall": 14904.9} {"step": 3922, "train_loss": 3.8263189792633057, "lr": 0.00039136514572429625, "tps": 17240, "wall": 14912.6} {"step": 3923, "train_loss": 3.7985377311706543, "lr": 0.0003913592822314527, "tps": 17235, "wall": 14920.3} {"step": 3924, "train_loss": 3.7285537719726562, "lr": 0.000391353416797442, "tps": 17231, "wall": 14927.9} {"step": 3925, "train_loss": 3.661129951477051, "lr": 0.0003913475494223304, "tps": 17226, "wall": 14935.6} {"step": 3926, "train_loss": 3.7101502418518066, "lr": 0.00039134168010618455, "tps": 17222, "wall": 14943.4} {"step": 3927, "train_loss": 3.781893730163574, "lr": 0.00039133580884907087, "tps": 17217, "wall": 14951.0} {"step": 3928, "train_loss": 3.794642448425293, "lr": 0.00039132993565105587, "tps": 17213, "wall": 14958.7} {"step": 3929, "train_loss": 3.8195605278015137, "lr": 0.00039132406051220616, "tps": 17208, "wall": 14966.4} {"step": 3930, "train_loss": 3.8411669731140137, "lr": 0.0003913181834325881, "tps": 17204, "wall": 14974.1} {"step": 3931, "train_loss": 3.775423765182495, "lr": 0.00039131230441226856, "tps": 17200, "wall": 14981.8} {"step": 3932, "train_loss": 3.7305173873901367, "lr": 0.00039130642345131385, "tps": 17195, "wall": 14989.5} {"step": 3933, "train_loss": 3.7928009033203125, "lr": 0.0003913005405497907, "tps": 17191, "wall": 14997.2} {"step": 3934, "train_loss": 3.8994245529174805, "lr": 0.0003912946557077658, "tps": 17186, "wall": 15005.0} {"step": 3935, "train_loss": 3.8449203968048096, "lr": 0.00039128876892530575, "tps": 17182, "wall": 15012.6} {"step": 3936, "train_loss": 3.8010683059692383, "lr": 0.00039128288020247727, "tps": 17177, "wall": 15020.4} {"step": 3937, "train_loss": 3.8467302322387695, "lr": 0.0003912769895393471, "tps": 17173, "wall": 15028.1} {"step": 3938, "train_loss": 3.831700325012207, "lr": 0.00039127109693598187, "tps": 17168, "wall": 15035.8} {"step": 3939, "train_loss": 3.8392863273620605, "lr": 0.00039126520239244836, "tps": 17164, "wall": 15043.4} {"step": 3940, "train_loss": 3.835543632507324, "lr": 0.00039125930590881345, "tps": 17160, "wall": 15051.0} {"step": 3941, "train_loss": 3.7048563957214355, "lr": 0.0003912534074851438, "tps": 17155, "wall": 15058.8} {"step": 3942, "train_loss": 3.7691097259521484, "lr": 0.0003912475071215063, "tps": 17151, "wall": 15066.4} {"step": 3943, "train_loss": 3.7759957313537598, "lr": 0.00039124160481796775, "tps": 17146, "wall": 15074.1} {"step": 3944, "train_loss": 3.7233901023864746, "lr": 0.0003912357005745951, "tps": 17142, "wall": 15081.7} {"step": 3945, "train_loss": 3.7292020320892334, "lr": 0.0003912297943914551, "tps": 17138, "wall": 15089.5} {"step": 3946, "train_loss": 3.772054433822632, "lr": 0.0003912238862686148, "tps": 17133, "wall": 15097.2} {"step": 3947, "train_loss": 3.741518020629883, "lr": 0.00039121797620614095, "tps": 17129, "wall": 15104.8} {"step": 3948, "train_loss": 3.8196818828582764, "lr": 0.00039121206420410074, "tps": 17125, "wall": 15112.5} {"step": 3949, "train_loss": 3.7942018508911133, "lr": 0.0003912061502625609, "tps": 17120, "wall": 15120.3} {"step": 3950, "train_loss": 3.8592031002044678, "lr": 0.00039120023438158865, "tps": 17116, "wall": 15128.0} {"step": 3951, "train_loss": 3.7557568550109863, "lr": 0.0003911943165612507, "tps": 17111, "wall": 15135.6} {"step": 3952, "train_loss": 3.8395614624023438, "lr": 0.0003911883968016144, "tps": 17107, "wall": 15143.3} {"step": 3953, "train_loss": 3.6871418952941895, "lr": 0.00039118247510274665, "tps": 17103, "wall": 15151.1} {"step": 3954, "train_loss": 3.760380268096924, "lr": 0.0003911765514647145, "tps": 17098, "wall": 15158.7} {"step": 3955, "train_loss": 3.7147440910339355, "lr": 0.0003911706258875853, "tps": 17094, "wall": 15166.5} {"step": 3956, "train_loss": 3.75622820854187, "lr": 0.0003911646983714258, "tps": 17090, "wall": 15174.1} {"step": 3957, "train_loss": 3.744842767715454, "lr": 0.00039115876891630336, "tps": 17085, "wall": 15181.9} {"step": 3958, "train_loss": 3.8021810054779053, "lr": 0.0003911528375222852, "tps": 17081, "wall": 15189.6} {"step": 3959, "train_loss": 3.748577833175659, "lr": 0.0003911469041894384, "tps": 17076, "wall": 15197.2} {"step": 3960, "train_loss": 3.7829556465148926, "lr": 0.0003911409689178302, "tps": 17072, "wall": 15204.9} {"step": 3961, "train_loss": 3.7712948322296143, "lr": 0.00039113503170752785, "tps": 17068, "wall": 15212.5} {"step": 3962, "train_loss": 3.881478786468506, "lr": 0.00039112909255859863, "tps": 17064, "wall": 15220.3} {"step": 3963, "train_loss": 3.7414770126342773, "lr": 0.0003911231514711098, "tps": 17059, "wall": 15227.9} {"step": 3964, "train_loss": 3.763709306716919, "lr": 0.00039111720844512863, "tps": 17055, "wall": 15235.5} {"step": 3965, "train_loss": 3.7679240703582764, "lr": 0.0003911112634807224, "tps": 17051, "wall": 15243.4} {"step": 3966, "train_loss": 3.794919490814209, "lr": 0.00039110531657795855, "tps": 17046, "wall": 15251.1} {"step": 3967, "train_loss": 3.791891574859619, "lr": 0.0003910993677369045, "tps": 17042, "wall": 15258.7} {"step": 3968, "train_loss": 3.663433074951172, "lr": 0.00039109341695762746, "tps": 17038, "wall": 15266.5} {"step": 3969, "train_loss": 3.7459137439727783, "lr": 0.00039108746424019504, "tps": 17033, "wall": 15274.1} {"step": 3970, "train_loss": 3.6936416625976562, "lr": 0.00039108150958467447, "tps": 17029, "wall": 15281.7} {"step": 3971, "train_loss": 3.858106851577759, "lr": 0.00039107555299113336, "tps": 17025, "wall": 15289.4} {"step": 3972, "train_loss": 3.718125104904175, "lr": 0.00039106959445963914, "tps": 17021, "wall": 15297.1} {"step": 3973, "train_loss": 3.8942558765411377, "lr": 0.00039106363399025925, "tps": 17016, "wall": 15305.0} {"step": 3974, "train_loss": 3.7766971588134766, "lr": 0.00039105767158306124, "tps": 17012, "wall": 15312.6} {"step": 3975, "train_loss": 3.7934961318969727, "lr": 0.0003910517072381128, "tps": 17008, "wall": 15320.4} {"step": 3976, "train_loss": 3.7959277629852295, "lr": 0.00039104574095548124, "tps": 17003, "wall": 15328.0} {"step": 3977, "train_loss": 3.6949596405029297, "lr": 0.00039103977273523434, "tps": 16999, "wall": 15335.6} {"step": 3978, "train_loss": 3.862700939178467, "lr": 0.00039103380257743956, "tps": 16995, "wall": 15343.3} {"step": 3979, "train_loss": 3.7286276817321777, "lr": 0.0003910278304821647, "tps": 16991, "wall": 15351.0} {"step": 3980, "train_loss": 3.807633399963379, "lr": 0.0003910218564494773, "tps": 16986, "wall": 15358.8} {"step": 3981, "train_loss": 3.7263731956481934, "lr": 0.00039101588047944503, "tps": 16982, "wall": 15366.4} {"step": 3982, "train_loss": 3.829345464706421, "lr": 0.0003910099025721357, "tps": 16978, "wall": 15374.1} {"step": 3983, "train_loss": 3.7601280212402344, "lr": 0.0003910039227276168, "tps": 16974, "wall": 15381.8} {"step": 3984, "train_loss": 3.7335381507873535, "lr": 0.0003909979409459563, "tps": 16970, "wall": 15389.5} {"step": 3985, "train_loss": 3.7560689449310303, "lr": 0.00039099195722722184, "tps": 16965, "wall": 15397.3} {"step": 3986, "train_loss": 3.8508388996124268, "lr": 0.0003909859715714813, "tps": 16961, "wall": 15404.9} {"step": 3987, "train_loss": 3.863706588745117, "lr": 0.00039097998397880237, "tps": 16957, "wall": 15412.6} {"step": 3988, "train_loss": 3.8779542446136475, "lr": 0.000390973994449253, "tps": 16953, "wall": 15420.3} {"step": 3989, "train_loss": 3.838892936706543, "lr": 0.00039096800298290093, "tps": 16949, "wall": 15427.9} {"step": 3990, "train_loss": 3.7178826332092285, "lr": 0.000390962009579814, "tps": 16944, "wall": 15435.6} {"step": 3991, "train_loss": 3.807342767715454, "lr": 0.0003909560142400603, "tps": 16940, "wall": 15443.2} {"step": 3992, "train_loss": 3.752655506134033, "lr": 0.0003909500169637075, "tps": 16936, "wall": 15450.9} {"step": 3993, "train_loss": 3.824871063232422, "lr": 0.0003909440177508237, "tps": 16932, "wall": 15458.7} {"step": 3994, "train_loss": 3.747619152069092, "lr": 0.0003909380166014769, "tps": 16928, "wall": 15466.4} {"step": 3995, "train_loss": 3.7280335426330566, "lr": 0.0003909320135157349, "tps": 16924, "wall": 15474.0} {"step": 3996, "train_loss": 3.852059841156006, "lr": 0.00039092600849366583, "tps": 16919, "wall": 15481.8} {"step": 3997, "train_loss": 3.708841323852539, "lr": 0.0003909200015353377, "tps": 16915, "wall": 15489.6} {"step": 3998, "train_loss": 3.9045515060424805, "lr": 0.00039091399264081856, "tps": 16910, "wall": 15497.6} {"step": 3999, "train_loss": 3.8126556873321533, "lr": 0.00039090798181017647, "tps": 16906, "wall": 15505.3} {"step": 4000, "train_loss": 3.8221633434295654, "lr": 0.0003909019690434795, "tps": 16902, "wall": 15513.0, "val_loss_monitor": 3.8503245350770356} {"step": 4001, "train_loss": 3.6963510513305664, "lr": 0.0003908959543407957, "tps": 16845, "wall": 15569.6} {"step": 4002, "train_loss": 3.7906861305236816, "lr": 0.0003908899377021934, "tps": 16841, "wall": 15577.3} {"step": 4003, "train_loss": 3.7509584426879883, "lr": 0.0003908839191277406, "tps": 16836, "wall": 15585.3} {"step": 4004, "train_loss": 3.8548574447631836, "lr": 0.0003908778986175056, "tps": 16831, "wall": 15594.1} {"step": 4005, "train_loss": 3.781672716140747, "lr": 0.0003908718761715564, "tps": 16826, "wall": 15602.6} {"step": 4006, "train_loss": 3.9302268028259277, "lr": 0.0003908658517899614, "tps": 16821, "wall": 15611.0} {"step": 4007, "train_loss": 3.920055866241455, "lr": 0.0003908598254727888, "tps": 16816, "wall": 15619.4} {"step": 4008, "train_loss": 3.868259906768799, "lr": 0.0003908537972201068, "tps": 16811, "wall": 15627.8} {"step": 4009, "train_loss": 3.813782215118408, "lr": 0.0003908477670319837, "tps": 16807, "wall": 15636.2} {"step": 4010, "train_loss": 3.7655041217803955, "lr": 0.00039084173490848797, "tps": 16802, "wall": 15644.5} {"step": 4011, "train_loss": 3.864326000213623, "lr": 0.0003908357008496877, "tps": 16797, "wall": 15653.0} {"step": 4012, "train_loss": 3.6632261276245117, "lr": 0.00039082966485565147, "tps": 16792, "wall": 15661.4} {"step": 4013, "train_loss": 3.871819019317627, "lr": 0.0003908236269264476, "tps": 16787, "wall": 15669.8} {"step": 4014, "train_loss": 3.819310188293457, "lr": 0.0003908175870621443, "tps": 16782, "wall": 15678.3} {"step": 4015, "train_loss": 3.7558624744415283, "lr": 0.00039081154526281024, "tps": 16778, "wall": 15686.6} {"step": 4016, "train_loss": 3.727457046508789, "lr": 0.00039080550152851374, "tps": 16773, "wall": 15695.0} {"step": 4017, "train_loss": 3.780555486679077, "lr": 0.0003907994558593232, "tps": 16768, "wall": 15703.3} {"step": 4018, "train_loss": 3.7485451698303223, "lr": 0.0003907934082553073, "tps": 16763, "wall": 15711.7} {"step": 4019, "train_loss": 3.8258140087127686, "lr": 0.0003907873587165343, "tps": 16759, "wall": 15720.0} {"step": 4020, "train_loss": 3.8699445724487305, "lr": 0.000390781307243073, "tps": 16754, "wall": 15728.3} {"step": 4021, "train_loss": 3.9731645584106445, "lr": 0.0003907752538349917, "tps": 16749, "wall": 15736.5} {"step": 4022, "train_loss": 3.836729049682617, "lr": 0.00039076919849235917, "tps": 16745, "wall": 15744.7} {"step": 4023, "train_loss": 3.9522817134857178, "lr": 0.00039076314121524384, "tps": 16740, "wall": 15753.3} {"step": 4024, "train_loss": 3.8171746730804443, "lr": 0.00039075708200371446, "tps": 16735, "wall": 15761.7} {"step": 4025, "train_loss": 3.844435930252075, "lr": 0.00039075102085783965, "tps": 16731, "wall": 15770.0} {"step": 4026, "train_loss": 3.8802058696746826, "lr": 0.00039074495777768794, "tps": 16726, "wall": 15778.3} {"step": 4027, "train_loss": 3.8105573654174805, "lr": 0.00039073889276332823, "tps": 16721, "wall": 15786.8} {"step": 4028, "train_loss": 3.799074411392212, "lr": 0.000390732825814829, "tps": 16717, "wall": 15794.9} {"step": 4029, "train_loss": 3.8272852897644043, "lr": 0.0003907267569322591, "tps": 16712, "wall": 15803.2} {"step": 4030, "train_loss": 3.822274923324585, "lr": 0.0003907206861156873, "tps": 16707, "wall": 15811.5} {"step": 4031, "train_loss": 3.819135904312134, "lr": 0.00039071461336518233, "tps": 16703, "wall": 15819.9} {"step": 4032, "train_loss": 3.952249050140381, "lr": 0.000390708538680813, "tps": 16698, "wall": 15828.1} {"step": 4033, "train_loss": 3.8394646644592285, "lr": 0.0003907024620626481, "tps": 16694, "wall": 15836.3} {"step": 4034, "train_loss": 3.793527603149414, "lr": 0.0003906963835107564, "tps": 16689, "wall": 15844.6} {"step": 4035, "train_loss": 3.837918996810913, "lr": 0.0003906903030252069, "tps": 16685, "wall": 15852.6} {"step": 4036, "train_loss": 3.864431142807007, "lr": 0.0003906842206060684, "tps": 16680, "wall": 15860.7} {"step": 4037, "train_loss": 3.7583043575286865, "lr": 0.0003906781362534098, "tps": 16676, "wall": 15868.6} {"step": 4038, "train_loss": 3.8314208984375, "lr": 0.0003906720499673001, "tps": 16672, "wall": 15876.6} {"step": 4039, "train_loss": 3.8332512378692627, "lr": 0.00039066596174780813, "tps": 16668, "wall": 15884.5} {"step": 4040, "train_loss": 3.8299169540405273, "lr": 0.0003906598715950029, "tps": 16663, "wall": 15892.4} {"step": 4041, "train_loss": 3.87069034576416, "lr": 0.00039065377950895345, "tps": 16659, "wall": 15900.5} {"step": 4042, "train_loss": 3.766188383102417, "lr": 0.0003906476854897287, "tps": 16655, "wall": 15908.4} {"step": 4043, "train_loss": 3.832918643951416, "lr": 0.0003906415895373978, "tps": 16651, "wall": 15916.3} {"step": 4044, "train_loss": 3.7294859886169434, "lr": 0.0003906354916520297, "tps": 16647, "wall": 15924.3} {"step": 4045, "train_loss": 3.8724827766418457, "lr": 0.00039062939183369356, "tps": 16642, "wall": 15932.3} {"step": 4046, "train_loss": 3.8310036659240723, "lr": 0.0003906232900824584, "tps": 16638, "wall": 15940.2} {"step": 4047, "train_loss": 3.7942728996276855, "lr": 0.0003906171863983934, "tps": 16634, "wall": 15948.1} {"step": 4048, "train_loss": 3.7895069122314453, "lr": 0.00039061108078156765, "tps": 16630, "wall": 15956.0} {"step": 4049, "train_loss": 3.863524913787842, "lr": 0.0003906049732320504, "tps": 16626, "wall": 15964.1} {"step": 4050, "train_loss": 3.8246190547943115, "lr": 0.00039059886374991076, "tps": 16621, "wall": 15972.1} {"step": 4051, "train_loss": 3.9462103843688965, "lr": 0.000390592752335218, "tps": 16617, "wall": 15980.0} {"step": 4052, "train_loss": 3.8154706954956055, "lr": 0.00039058663898804125, "tps": 16613, "wall": 15988.0} {"step": 4053, "train_loss": 3.8076906204223633, "lr": 0.00039058052370844983, "tps": 16609, "wall": 15995.9} {"step": 4054, "train_loss": 3.8569822311401367, "lr": 0.0003905744064965131, "tps": 16605, "wall": 16003.8} {"step": 4055, "train_loss": 3.831598997116089, "lr": 0.00039056828735230015, "tps": 16601, "wall": 16011.8} {"step": 4056, "train_loss": 3.8747525215148926, "lr": 0.00039056216627588044, "tps": 16596, "wall": 16019.8} {"step": 4057, "train_loss": 3.7103233337402344, "lr": 0.0003905560432673233, "tps": 16592, "wall": 16027.8} {"step": 4058, "train_loss": 3.7909023761749268, "lr": 0.0003905499183266981, "tps": 16588, "wall": 16035.7} {"step": 4059, "train_loss": 3.9249839782714844, "lr": 0.00039054379145407413, "tps": 16584, "wall": 16043.6} {"step": 4060, "train_loss": 3.7768149375915527, "lr": 0.0003905376626495209, "tps": 16580, "wall": 16051.6} {"step": 4061, "train_loss": 3.9070377349853516, "lr": 0.0003905315319131078, "tps": 16576, "wall": 16059.4} {"step": 4062, "train_loss": 3.7085602283477783, "lr": 0.0003905253992449043, "tps": 16572, "wall": 16067.5} {"step": 4063, "train_loss": 3.8399038314819336, "lr": 0.0003905192646449799, "tps": 16568, "wall": 16075.3} {"step": 4064, "train_loss": 3.871220588684082, "lr": 0.00039051312811340394, "tps": 16563, "wall": 16083.4} {"step": 4065, "train_loss": 3.754556655883789, "lr": 0.0003905069896502461, "tps": 16559, "wall": 16091.3} {"step": 4066, "train_loss": 3.878420114517212, "lr": 0.0003905008492555758, "tps": 16555, "wall": 16099.2} {"step": 4067, "train_loss": 3.8662214279174805, "lr": 0.00039049470692946274, "tps": 16551, "wall": 16107.1} {"step": 4068, "train_loss": 3.903707265853882, "lr": 0.0003904885626719764, "tps": 16547, "wall": 16115.0} {"step": 4069, "train_loss": 3.796011447906494, "lr": 0.00039048241648318636, "tps": 16543, "wall": 16122.8} {"step": 4070, "train_loss": 3.884242057800293, "lr": 0.00039047626836316227, "tps": 16539, "wall": 16130.8} {"step": 4071, "train_loss": 3.911736488342285, "lr": 0.00039047011831197385, "tps": 16535, "wall": 16139.1} {"step": 4072, "train_loss": 3.806602954864502, "lr": 0.00039046396632969066, "tps": 16531, "wall": 16147.0} {"step": 4073, "train_loss": 3.8505141735076904, "lr": 0.00039045781241638246, "tps": 16527, "wall": 16155.0} {"step": 4074, "train_loss": 3.89908766746521, "lr": 0.00039045165657211893, "tps": 16523, "wall": 16162.9} {"step": 4075, "train_loss": 3.8142824172973633, "lr": 0.0003904454987969698, "tps": 16518, "wall": 16170.9} {"step": 4076, "train_loss": 3.819235324859619, "lr": 0.0003904393390910048, "tps": 16514, "wall": 16178.9} {"step": 4077, "train_loss": 3.7706973552703857, "lr": 0.00039043317745429386, "tps": 16510, "wall": 16186.8} {"step": 4078, "train_loss": 3.967418670654297, "lr": 0.0003904270138869066, "tps": 16506, "wall": 16194.7} {"step": 4079, "train_loss": 3.815131664276123, "lr": 0.00039042084838891293, "tps": 16502, "wall": 16202.7} {"step": 4080, "train_loss": 3.7949507236480713, "lr": 0.00039041468096038265, "tps": 16498, "wall": 16210.7} {"step": 4081, "train_loss": 3.8682689666748047, "lr": 0.0003904085116013856, "tps": 16493, "wall": 16219.5} {"step": 4082, "train_loss": 3.776878595352173, "lr": 0.0003904023403119918, "tps": 16489, "wall": 16227.8} {"step": 4083, "train_loss": 3.793891429901123, "lr": 0.000390396167092271, "tps": 16484, "wall": 16236.2} {"step": 4084, "train_loss": 3.882045269012451, "lr": 0.0003903899919422932, "tps": 16480, "wall": 16244.7} {"step": 4085, "train_loss": 3.822899341583252, "lr": 0.0003903838148621284, "tps": 16475, "wall": 16253.1} {"step": 4086, "train_loss": 3.813667058944702, "lr": 0.00039037763585184656, "tps": 16471, "wall": 16261.5} {"step": 4087, "train_loss": 3.7048912048339844, "lr": 0.00039037145491151756, "tps": 16466, "wall": 16270.0} {"step": 4088, "train_loss": 3.891808032989502, "lr": 0.0003903652720412115, "tps": 16462, "wall": 16278.4} {"step": 4089, "train_loss": 3.9002184867858887, "lr": 0.0003903590872409985, "tps": 16457, "wall": 16286.8} {"step": 4090, "train_loss": 3.818803548812866, "lr": 0.0003903529005109485, "tps": 16453, "wall": 16295.2} {"step": 4091, "train_loss": 3.8083953857421875, "lr": 0.00039034671185113166, "tps": 16448, "wall": 16303.6} {"step": 4092, "train_loss": 3.938343048095703, "lr": 0.000390340521261618, "tps": 16444, "wall": 16312.0} {"step": 4093, "train_loss": 3.808651924133301, "lr": 0.00039033432874247773, "tps": 16439, "wall": 16320.5} {"step": 4094, "train_loss": 3.8475818634033203, "lr": 0.0003903281342937809, "tps": 16435, "wall": 16328.9} {"step": 4095, "train_loss": 3.8910586833953857, "lr": 0.00039032193791559784, "tps": 16430, "wall": 16337.3} {"step": 4096, "train_loss": 3.830324649810791, "lr": 0.00039031573960799867, "tps": 16426, "wall": 16345.9} {"step": 4097, "train_loss": 3.8204152584075928, "lr": 0.0003903095393710535, "tps": 16421, "wall": 16354.3} {"step": 4098, "train_loss": 3.8954451084136963, "lr": 0.0003903033372048327, "tps": 16417, "wall": 16362.7} {"step": 4099, "train_loss": 3.7538585662841797, "lr": 0.0003902971331094065, "tps": 16412, "wall": 16371.0} {"step": 4100, "train_loss": 3.8140156269073486, "lr": 0.0003902909270848451, "tps": 16408, "wall": 16379.5} {"step": 4101, "train_loss": 3.8215715885162354, "lr": 0.00039028471913121895, "tps": 16404, "wall": 16387.9} {"step": 4102, "train_loss": 3.854360580444336, "lr": 0.0003902785092485982, "tps": 16399, "wall": 16396.3} {"step": 4103, "train_loss": 3.833674907684326, "lr": 0.00039027229743705333, "tps": 16395, "wall": 16404.6} {"step": 4104, "train_loss": 3.798051357269287, "lr": 0.0003902660836966547, "tps": 16390, "wall": 16413.3} {"step": 4105, "train_loss": 3.8609423637390137, "lr": 0.0003902598680274726, "tps": 16386, "wall": 16421.4} {"step": 4106, "train_loss": 3.8064510822296143, "lr": 0.0003902536504295775, "tps": 16382, "wall": 16429.5} {"step": 4107, "train_loss": 3.712092876434326, "lr": 0.0003902474309030399, "tps": 16378, "wall": 16437.6} {"step": 4108, "train_loss": 3.736056327819824, "lr": 0.00039024120944793013, "tps": 16374, "wall": 16445.8} {"step": 4109, "train_loss": 3.8584136962890625, "lr": 0.0003902349860643188, "tps": 16370, "wall": 16453.9} {"step": 4110, "train_loss": 3.8565874099731445, "lr": 0.00039022876075227634, "tps": 16366, "wall": 16461.9} {"step": 4111, "train_loss": 3.760010242462158, "lr": 0.00039022253351187315, "tps": 16362, "wall": 16469.8} {"step": 4112, "train_loss": 3.821749210357666, "lr": 0.00039021630434318, "tps": 16358, "wall": 16477.9} {"step": 4113, "train_loss": 3.8587920665740967, "lr": 0.00039021007324626733, "tps": 16354, "wall": 16485.9} {"step": 4114, "train_loss": 3.782261610031128, "lr": 0.00039020384022120575, "tps": 16350, "wall": 16493.8} {"step": 4115, "train_loss": 3.8856821060180664, "lr": 0.0003901976052680658, "tps": 16346, "wall": 16501.9} {"step": 4116, "train_loss": 3.757507801055908, "lr": 0.0003901913683869182, "tps": 16342, "wall": 16510.0} {"step": 4117, "train_loss": 3.8192970752716064, "lr": 0.0003901851295778336, "tps": 16338, "wall": 16518.1} {"step": 4118, "train_loss": 3.96632719039917, "lr": 0.0003901788888408826, "tps": 16334, "wall": 16526.1} {"step": 4119, "train_loss": 3.7692296504974365, "lr": 0.00039017264617613597, "tps": 16330, "wall": 16534.2} {"step": 4120, "train_loss": 3.8694000244140625, "lr": 0.00039016640158366444, "tps": 16326, "wall": 16542.2} {"step": 4121, "train_loss": 3.837261438369751, "lr": 0.00039016015506353863, "tps": 16322, "wall": 16550.2} {"step": 4122, "train_loss": 3.7008368968963623, "lr": 0.00039015390661582936, "tps": 16318, "wall": 16558.5} {"step": 4123, "train_loss": 3.8060731887817383, "lr": 0.0003901476562406075, "tps": 16314, "wall": 16566.6} {"step": 4124, "train_loss": 3.8117148876190186, "lr": 0.00039014140393794374, "tps": 16308, "wall": 16575.9} {"step": 4125, "train_loss": 3.831986427307129, "lr": 0.000390135149707909, "tps": 16304, "wall": 16584.6} {"step": 4126, "train_loss": 3.822129011154175, "lr": 0.0003901288935505741, "tps": 16299, "wall": 16593.2} {"step": 4127, "train_loss": 3.815967321395874, "lr": 0.0003901226354660098, "tps": 16295, "wall": 16601.8} {"step": 4128, "train_loss": 3.832463264465332, "lr": 0.0003901163754542871, "tps": 16290, "wall": 16610.6} {"step": 4129, "train_loss": 3.789712905883789, "lr": 0.00039011011351547696, "tps": 16286, "wall": 16619.1} {"step": 4130, "train_loss": 3.864856719970703, "lr": 0.00039010384964965027, "tps": 16281, "wall": 16627.8} {"step": 4131, "train_loss": 3.873537063598633, "lr": 0.00039009758385687783, "tps": 16277, "wall": 16636.2} {"step": 4132, "train_loss": 3.831143379211426, "lr": 0.0003900913161372309, "tps": 16272, "wall": 16645.0} {"step": 4133, "train_loss": 3.7196693420410156, "lr": 0.0003900850464907802, "tps": 16268, "wall": 16653.6} {"step": 4134, "train_loss": 3.7979912757873535, "lr": 0.000390078774917597, "tps": 16264, "wall": 16662.0} {"step": 4135, "train_loss": 3.840373992919922, "lr": 0.00039007250141775225, "tps": 16259, "wall": 16670.5} {"step": 4136, "train_loss": 3.8116915225982666, "lr": 0.00039006622599131697, "tps": 16255, "wall": 16678.9} {"step": 4137, "train_loss": 3.939821720123291, "lr": 0.0003900599486383622, "tps": 16250, "wall": 16687.5} {"step": 4138, "train_loss": 3.913048505783081, "lr": 0.0003900536693589592, "tps": 16246, "wall": 16696.3} {"step": 4139, "train_loss": 3.8566226959228516, "lr": 0.00039004738815317906, "tps": 16242, "wall": 16704.7} {"step": 4140, "train_loss": 3.7667369842529297, "lr": 0.0003900411050210929, "tps": 16237, "wall": 16713.3} {"step": 4141, "train_loss": 3.7406888008117676, "lr": 0.0003900348199627719, "tps": 16233, "wall": 16721.8} {"step": 4142, "train_loss": 3.812361478805542, "lr": 0.00039002853297828726, "tps": 16228, "wall": 16730.3} {"step": 4143, "train_loss": 3.7719674110412598, "lr": 0.0003900222440677102, "tps": 16224, "wall": 16738.9} {"step": 4144, "train_loss": 3.8756463527679443, "lr": 0.00039001595323111195, "tps": 16220, "wall": 16747.4} {"step": 4145, "train_loss": 3.810986042022705, "lr": 0.00039000966046856376, "tps": 16215, "wall": 16755.8} {"step": 4146, "train_loss": 3.8617348670959473, "lr": 0.00039000336578013696, "tps": 16211, "wall": 16764.4} {"step": 4147, "train_loss": 3.9727416038513184, "lr": 0.0003899970691659029, "tps": 16207, "wall": 16773.0} {"step": 4148, "train_loss": 3.8657336235046387, "lr": 0.00038999077062593275, "tps": 16202, "wall": 16781.6} {"step": 4149, "train_loss": 3.8066420555114746, "lr": 0.000389984470160298, "tps": 16198, "wall": 16790.2} {"step": 4150, "train_loss": 3.813694477081299, "lr": 0.00038997816776906993, "tps": 16194, "wall": 16798.6} {"step": 4151, "train_loss": 3.7358555793762207, "lr": 0.00038997186345232003, "tps": 16189, "wall": 16807.1} {"step": 4152, "train_loss": 3.859323024749756, "lr": 0.00038996555721011966, "tps": 16185, "wall": 16815.7} {"step": 4153, "train_loss": 3.8297314643859863, "lr": 0.0003899592490425402, "tps": 16181, "wall": 16824.2} {"step": 4154, "train_loss": 3.901468515396118, "lr": 0.00038995293894965327, "tps": 16176, "wall": 16832.7} {"step": 4155, "train_loss": 3.8068485260009766, "lr": 0.0003899466269315302, "tps": 16172, "wall": 16840.9} {"step": 4156, "train_loss": 3.8441238403320312, "lr": 0.00038994031298824255, "tps": 16168, "wall": 16849.2} {"step": 4157, "train_loss": 3.836503744125366, "lr": 0.00038993399711986185, "tps": 16164, "wall": 16857.3} {"step": 4158, "train_loss": 3.745574474334717, "lr": 0.00038992767932645965, "tps": 16160, "wall": 16865.8} {"step": 4159, "train_loss": 3.8307228088378906, "lr": 0.00038992135960810745, "tps": 16156, "wall": 16873.9} {"step": 4160, "train_loss": 3.8024322986602783, "lr": 0.00038991503796487697, "tps": 16152, "wall": 16882.2} {"step": 4161, "train_loss": 3.8899269104003906, "lr": 0.0003899087143968397, "tps": 16148, "wall": 16890.4} {"step": 4162, "train_loss": 3.7944281101226807, "lr": 0.00038990238890406734, "tps": 16144, "wall": 16898.6} {"step": 4163, "train_loss": 3.8271355628967285, "lr": 0.00038989606148663147, "tps": 16140, "wall": 16907.2} {"step": 4164, "train_loss": 3.807729721069336, "lr": 0.00038988973214460393, "tps": 16136, "wall": 16915.3} {"step": 4165, "train_loss": 3.8267335891723633, "lr": 0.0003898834008780562, "tps": 16132, "wall": 16923.5} {"step": 4166, "train_loss": 3.8506546020507812, "lr": 0.0003898770676870602, "tps": 16128, "wall": 16931.7} {"step": 4167, "train_loss": 3.7475202083587646, "lr": 0.00038987073257168756, "tps": 16124, "wall": 16940.0} {"step": 4168, "train_loss": 3.784467935562134, "lr": 0.0003898643955320101, "tps": 16121, "wall": 16948.0} {"step": 4169, "train_loss": 3.7587890625, "lr": 0.0003898580565680995, "tps": 16117, "wall": 16956.0} {"step": 4170, "train_loss": 3.7723617553710938, "lr": 0.0003898517156800277, "tps": 16113, "wall": 16964.1} {"step": 4171, "train_loss": 3.877772092819214, "lr": 0.0003898453728678665, "tps": 16109, "wall": 16972.2} {"step": 4172, "train_loss": 3.831752300262451, "lr": 0.0003898390281316877, "tps": 16105, "wall": 16980.4} {"step": 4173, "train_loss": 3.7823104858398438, "lr": 0.00038983268147156316, "tps": 16101, "wall": 16988.4} {"step": 4174, "train_loss": 3.8932583332061768, "lr": 0.00038982633288756486, "tps": 16098, "wall": 16996.4} {"step": 4175, "train_loss": 3.759284257888794, "lr": 0.0003898199823797647, "tps": 16094, "wall": 17004.4} {"step": 4176, "train_loss": 3.8539481163024902, "lr": 0.00038981362994823456, "tps": 16090, "wall": 17012.6} {"step": 4177, "train_loss": 3.86202335357666, "lr": 0.0003898072755930464, "tps": 16086, "wall": 17020.8} {"step": 4178, "train_loss": 3.782118320465088, "lr": 0.0003898009193142723, "tps": 16082, "wall": 17029.1} {"step": 4179, "train_loss": 3.8482000827789307, "lr": 0.00038979456111198414, "tps": 16078, "wall": 17037.2} {"step": 4180, "train_loss": 3.8281021118164062, "lr": 0.0003897882009862541, "tps": 16075, "wall": 17045.5} {"step": 4181, "train_loss": 3.7875375747680664, "lr": 0.000389781838937154, "tps": 16071, "wall": 17053.6} {"step": 4182, "train_loss": 3.814450740814209, "lr": 0.00038977547496475614, "tps": 16066, "wall": 17062.1} {"step": 4183, "train_loss": 3.76267409324646, "lr": 0.0003897691090691325, "tps": 16063, "wall": 17070.3} {"step": 4184, "train_loss": 3.8387503623962402, "lr": 0.0003897627412503552, "tps": 16059, "wall": 17078.4} {"step": 4185, "train_loss": 3.846515417098999, "lr": 0.00038975637150849633, "tps": 16055, "wall": 17086.5} {"step": 4186, "train_loss": 3.834362268447876, "lr": 0.0003897499998436282, "tps": 16051, "wall": 17094.6} {"step": 4187, "train_loss": 3.7291946411132812, "lr": 0.0003897436262558229, "tps": 16047, "wall": 17102.9} {"step": 4188, "train_loss": 3.805532932281494, "lr": 0.0003897372507451525, "tps": 16043, "wall": 17111.1} {"step": 4189, "train_loss": 3.8691344261169434, "lr": 0.0003897308733116894, "tps": 16040, "wall": 17119.2} {"step": 4190, "train_loss": 3.8193540573120117, "lr": 0.00038972449395550577, "tps": 16036, "wall": 17127.2} {"step": 4191, "train_loss": 3.814300298690796, "lr": 0.00038971811267667387, "tps": 16032, "wall": 17135.3} {"step": 4192, "train_loss": 3.849402666091919, "lr": 0.00038971172947526605, "tps": 16028, "wall": 17143.5} {"step": 4193, "train_loss": 3.8592140674591064, "lr": 0.00038970534435135457, "tps": 16025, "wall": 17151.6} {"step": 4194, "train_loss": 3.844531536102295, "lr": 0.0003896989573050118, "tps": 16021, "wall": 17159.8} {"step": 4195, "train_loss": 3.770709753036499, "lr": 0.00038969256833631, "tps": 16017, "wall": 17167.9} {"step": 4196, "train_loss": 3.798616886138916, "lr": 0.00038968617744532166, "tps": 16013, "wall": 17176.0} {"step": 4197, "train_loss": 3.881218433380127, "lr": 0.000389679784632119, "tps": 16010, "wall": 17184.1} {"step": 4198, "train_loss": 3.7694199085235596, "lr": 0.00038967338989677475, "tps": 16006, "wall": 17192.3} {"step": 4199, "train_loss": 3.8721330165863037, "lr": 0.00038966699323936103, "tps": 16002, "wall": 17200.3} {"step": 4200, "train_loss": 3.7560408115386963, "lr": 0.00038966059465995047, "tps": 15999, "wall": 17208.4} {"step": 4201, "train_loss": 3.8355917930603027, "lr": 0.00038965419415861553, "tps": 15995, "wall": 17216.3} {"step": 4202, "train_loss": 3.8721675872802734, "lr": 0.0003896477917354287, "tps": 15991, "wall": 17224.5} {"step": 4203, "train_loss": 3.834998607635498, "lr": 0.0003896413873904624, "tps": 15987, "wall": 17232.6} {"step": 4204, "train_loss": 3.824993371963501, "lr": 0.00038963498112378945, "tps": 15984, "wall": 17240.6} {"step": 4205, "train_loss": 3.8234896659851074, "lr": 0.0003896285729354822, "tps": 15980, "wall": 17248.6} {"step": 4206, "train_loss": 3.8212978839874268, "lr": 0.0003896221628256133, "tps": 15977, "wall": 17256.6} {"step": 4207, "train_loss": 3.802569627761841, "lr": 0.0003896157507942553, "tps": 15973, "wall": 17264.6} {"step": 4208, "train_loss": 3.7751235961914062, "lr": 0.0003896093368414809, "tps": 15969, "wall": 17272.6} {"step": 4209, "train_loss": 3.7894446849823, "lr": 0.0003896029209673628, "tps": 15966, "wall": 17280.7} {"step": 4210, "train_loss": 3.7996575832366943, "lr": 0.0003895965031719737, "tps": 15962, "wall": 17288.8} {"step": 4211, "train_loss": 3.756405830383301, "lr": 0.00038959008345538614, "tps": 15958, "wall": 17296.8} {"step": 4212, "train_loss": 3.8309011459350586, "lr": 0.00038958366181767297, "tps": 15955, "wall": 17304.9} {"step": 4213, "train_loss": 3.868762254714966, "lr": 0.0003895772382589069, "tps": 15951, "wall": 17313.0} {"step": 4001, "train_loss": 3.727938413619995, "lr": 0.0003908959543407957, "tps": 42904491, "wall": 6.1} {"step": 4002, "train_loss": 3.7839834690093994, "lr": 0.0003908899377021934, "tps": 22558577, "wall": 11.6} {"step": 4003, "train_loss": 3.734053134918213, "lr": 0.0003908839191277406, "tps": 15027178, "wall": 17.5} {"step": 4004, "train_loss": 3.8813095092773438, "lr": 0.0003908778986175056, "tps": 11224458, "wall": 23.4} {"step": 4005, "train_loss": 3.7319507598876953, "lr": 0.0003908718761715564, "tps": 8941119, "wall": 29.4} {"step": 4006, "train_loss": 3.7829408645629883, "lr": 0.0003908658517899614, "tps": 7431213, "wall": 35.3} {"step": 4007, "train_loss": 3.7427492141723633, "lr": 0.0003908598254727888, "tps": 6340288, "wall": 41.4} {"step": 4008, "train_loss": 3.852626323699951, "lr": 0.0003908537972201068, "tps": 5536275, "wall": 47.5} {"step": 4009, "train_loss": 3.827688217163086, "lr": 0.0003908477670319837, "tps": 4860594, "wall": 54.1} {"step": 4010, "train_loss": 3.832693338394165, "lr": 0.00039084173490848797, "tps": 4339299, "wall": 60.6} {"step": 4011, "train_loss": 3.737051248550415, "lr": 0.0003908357008496877, "tps": 3911235, "wall": 67.2} {"step": 4012, "train_loss": 3.8287177085876465, "lr": 0.00039082966485565147, "tps": 3558366, "wall": 73.9} {"step": 4013, "train_loss": 3.715824604034424, "lr": 0.0003908236269264476, "tps": 3262493, "wall": 80.6} {"step": 4014, "train_loss": 3.7506203651428223, "lr": 0.0003908175870621443, "tps": 3003116, "wall": 87.6} {"step": 4015, "train_loss": 3.9137251377105713, "lr": 0.00039081154526281024, "tps": 2780663, "wall": 94.7} {"step": 4016, "train_loss": 3.768568515777588, "lr": 0.00039080550152851374, "tps": 2582538, "wall": 101.9} {"step": 4017, "train_loss": 3.73010516166687, "lr": 0.0003907994558593232, "tps": 2412788, "wall": 109.1} {"step": 4018, "train_loss": 3.8485989570617676, "lr": 0.0003907934082553073, "tps": 2260736, "wall": 116.5} {"step": 4019, "train_loss": 3.819888114929199, "lr": 0.0003907873587165343, "tps": 2126036, "wall": 123.9} {"step": 4020, "train_loss": 3.807063341140747, "lr": 0.000390781307243073, "tps": 2003772, "wall": 131.5} {"step": 4021, "train_loss": 3.8666205406188965, "lr": 0.0003907752538349917, "tps": 1892204, "wall": 139.3} {"step": 4022, "train_loss": 3.8449957370758057, "lr": 0.00039076919849235917, "tps": 1789690, "wall": 147.3} {"step": 4023, "train_loss": 3.7870097160339355, "lr": 0.00039076314121524384, "tps": 1698952, "wall": 155.2} {"step": 4024, "train_loss": 3.7169265747070312, "lr": 0.00039075708200371446, "tps": 1613831, "wall": 163.5} {"step": 4025, "train_loss": 3.7747294902801514, "lr": 0.00039075102085783965, "tps": 1537455, "wall": 171.6} {"step": 4026, "train_loss": 3.6910133361816406, "lr": 0.00039074495777768794, "tps": 1466767, "wall": 179.9} {"step": 4027, "train_loss": 3.7794437408447266, "lr": 0.00039073889276332823, "tps": 1401624, "wall": 188.3} {"step": 4028, "train_loss": 3.8900017738342285, "lr": 0.000390732825814829, "tps": 1341739, "wall": 196.8} {"step": 4029, "train_loss": 3.7719287872314453, "lr": 0.0003907267569322591, "tps": 1285643, "wall": 205.4} {"step": 4030, "train_loss": 3.815431594848633, "lr": 0.0003907206861156873, "tps": 1234055, "wall": 214.1} {"step": 4031, "train_loss": 3.7638118267059326, "lr": 0.00039071461336518233, "tps": 1185170, "wall": 223.0} {"step": 4032, "train_loss": 3.8038580417633057, "lr": 0.000390708538680813, "tps": 1140100, "wall": 231.8} {"step": 4033, "train_loss": 3.8083415031433105, "lr": 0.0003907024620626481, "tps": 1098355, "wall": 240.7} {"step": 4034, "train_loss": 3.6590800285339355, "lr": 0.0003906963835107564, "tps": 1059351, "wall": 249.6} {"step": 4035, "train_loss": 3.8170862197875977, "lr": 0.0003906903030252069, "tps": 1023251, "wall": 258.5} {"step": 4036, "train_loss": 3.787785291671753, "lr": 0.0003906842206060684, "tps": 988438, "wall": 267.7} {"step": 4037, "train_loss": 3.8054566383361816, "lr": 0.0003906781362534098, "tps": 956881, "wall": 276.6} {"step": 4038, "train_loss": 3.774383068084717, "lr": 0.0003906720499673001, "tps": 926742, "wall": 285.6} {"step": 4039, "train_loss": 3.7061190605163574, "lr": 0.00039066596174780813, "tps": 898701, "wall": 294.6} {"step": 4040, "train_loss": 3.7770540714263916, "lr": 0.0003906598715950029, "tps": 872030, "wall": 303.7} {"step": 4041, "train_loss": 3.7180862426757812, "lr": 0.00039065377950895345, "tps": 843495, "wall": 314.0} {"step": 4042, "train_loss": 3.8519608974456787, "lr": 0.0003906476854897287, "tps": 818890, "wall": 323.6} {"step": 4043, "train_loss": 3.6745212078094482, "lr": 0.0003906415895373978, "tps": 796605, "wall": 332.7} {"step": 4044, "train_loss": 3.8519415855407715, "lr": 0.0003906354916520297, "tps": 775484, "wall": 341.8} {"step": 4045, "train_loss": 3.669888973236084, "lr": 0.00039062939183369356, "tps": 755914, "wall": 350.8} {"step": 4046, "train_loss": 3.838967800140381, "lr": 0.0003906232900824584, "tps": 737659, "wall": 359.5} {"step": 4047, "train_loss": 3.641915798187256, "lr": 0.0003906171863983934, "tps": 719681, "wall": 368.6} {"step": 4048, "train_loss": 3.8245797157287598, "lr": 0.00039061108078156765, "tps": 702942, "wall": 377.5} {"step": 4049, "train_loss": 3.85318922996521, "lr": 0.0003906049732320504, "tps": 686889, "wall": 386.4} {"step": 4050, "train_loss": 3.771474838256836, "lr": 0.00039059886374991076, "tps": 671901, "wall": 395.1} {"step": 4051, "train_loss": 3.7078959941864014, "lr": 0.000390592752335218, "tps": 657151, "wall": 404.1} {"step": 4052, "train_loss": 3.8093273639678955, "lr": 0.00039058663898804125, "tps": 643519, "wall": 412.8} {"step": 4053, "train_loss": 3.8451151847839355, "lr": 0.00039058052370844983, "tps": 630486, "wall": 421.4} {"step": 4054, "train_loss": 3.786651849746704, "lr": 0.0003905744064965131, "tps": 617962, "wall": 430.0} {"step": 4055, "train_loss": 3.752595901489258, "lr": 0.00039056828735230015, "tps": 605912, "wall": 438.7} {"step": 4056, "train_loss": 3.727027177810669, "lr": 0.00039056216627588044, "tps": 594268, "wall": 447.4} {"step": 4057, "train_loss": 3.8021607398986816, "lr": 0.0003905560432673233, "tps": 583302, "wall": 455.9} {"step": 4058, "train_loss": 3.792170286178589, "lr": 0.0003905499183266981, "tps": 572384, "wall": 464.7} {"step": 4059, "train_loss": 3.787151336669922, "lr": 0.00039054379145407413, "tps": 562328, "wall": 473.2} {"step": 4060, "train_loss": 3.8934359550476074, "lr": 0.0003905376626495209, "tps": 552479, "wall": 481.7} {"step": 4061, "train_loss": 3.828723192214966, "lr": 0.0003905315319131078, "tps": 543119, "wall": 490.1} {"step": 4062, "train_loss": 3.781069755554199, "lr": 0.0003905253992449043, "tps": 534149, "wall": 498.5} {"step": 4063, "train_loss": 3.8396754264831543, "lr": 0.0003905192646449799, "tps": 525292, "wall": 507.0} {"step": 4064, "train_loss": 3.7513773441314697, "lr": 0.00039051312811340394, "tps": 516928, "wall": 515.4} {"step": 4065, "train_loss": 3.753267765045166, "lr": 0.0003905069896502461, "tps": 508667, "wall": 523.9} {"step": 4066, "train_loss": 3.8376760482788086, "lr": 0.0003905008492555758, "tps": 500901, "wall": 532.1} {"step": 4067, "train_loss": 3.871647834777832, "lr": 0.00039049470692946274, "tps": 493340, "wall": 540.4} {"step": 4068, "train_loss": 3.7478981018066406, "lr": 0.0003904885626719764, "tps": 485879, "wall": 548.8} {"step": 4069, "train_loss": 3.707456588745117, "lr": 0.00039048241648318636, "tps": 478753, "wall": 557.1} {"step": 4070, "train_loss": 3.8694887161254883, "lr": 0.00039047626836316227, "tps": 471788, "wall": 565.5} {"step": 4071, "train_loss": 3.808114767074585, "lr": 0.00039047011831197385, "tps": 465205, "wall": 573.6} {"step": 4072, "train_loss": 3.7521491050720215, "lr": 0.00039046396632969066, "tps": 458597, "wall": 582.1} {"step": 4073, "train_loss": 3.7940139770507812, "lr": 0.00039045781241638246, "tps": 452372, "wall": 590.2} {"step": 4074, "train_loss": 3.7015459537506104, "lr": 0.00039045165657211893, "tps": 446247, "wall": 598.5} {"step": 4075, "train_loss": 3.806851625442505, "lr": 0.0003904454987969698, "tps": 440362, "wall": 606.6} {"step": 4076, "train_loss": 3.8488552570343018, "lr": 0.0003904393390910048, "tps": 434569, "wall": 614.8} {"step": 4077, "train_loss": 3.804722309112549, "lr": 0.00039043317745429386, "tps": 428899, "wall": 623.1} {"step": 4078, "train_loss": 3.857072353363037, "lr": 0.0003904270138869066, "tps": 423428, "wall": 631.3} {"step": 4079, "train_loss": 3.9006004333496094, "lr": 0.00039042084838891293, "tps": 418117, "wall": 639.5} {"step": 4080, "train_loss": 3.7251288890838623, "lr": 0.00039041468096038265, "tps": 412903, "wall": 647.7} {"step": 4081, "train_loss": 3.7927961349487305, "lr": 0.0003904085116013856, "tps": 407869, "wall": 655.9} {"step": 4082, "train_loss": 3.763289213180542, "lr": 0.0003904023403119918, "tps": 402973, "wall": 664.0} {"step": 4083, "train_loss": 3.773845672607422, "lr": 0.000390396167092271, "tps": 398132, "wall": 672.3} {"step": 4084, "train_loss": 3.7749722003936768, "lr": 0.0003903899919422932, "tps": 393522, "wall": 680.3} {"step": 4085, "train_loss": 3.832110643386841, "lr": 0.0003903838148621284, "tps": 388943, "wall": 688.5} {"step": 4086, "train_loss": 3.8037338256835938, "lr": 0.00039037763585184656, "tps": 384547, "wall": 696.5} {"step": 4087, "train_loss": 3.748713493347168, "lr": 0.00039037145491151756, "tps": 380160, "wall": 704.7} {"step": 4088, "train_loss": 3.797224521636963, "lr": 0.0003903652720412115, "tps": 375929, "wall": 712.8} {"step": 4089, "train_loss": 3.7989983558654785, "lr": 0.0003903590872409985, "tps": 371789, "wall": 721.0} {"step": 4090, "train_loss": 3.7556183338165283, "lr": 0.0003903529005109485, "tps": 367702, "wall": 729.1} {"step": 4091, "train_loss": 3.713550090789795, "lr": 0.00039034671185113166, "tps": 363728, "wall": 737.3} {"step": 4092, "train_loss": 3.8039751052856445, "lr": 0.000390340521261618, "tps": 359850, "wall": 745.4} {"step": 4093, "train_loss": 3.793614387512207, "lr": 0.00039033432874247773, "tps": 356128, "wall": 753.4} {"step": 4094, "train_loss": 3.8198463916778564, "lr": 0.0003903281342937809, "tps": 352376, "wall": 761.6} {"step": 4095, "train_loss": 3.741115093231201, "lr": 0.00039032193791559784, "tps": 348789, "wall": 769.6} {"step": 4096, "train_loss": 3.767925500869751, "lr": 0.00039031573960799867, "tps": 345217, "wall": 777.8} {"step": 4097, "train_loss": 3.741726875305176, "lr": 0.0003903095393710535, "tps": 341729, "wall": 785.9} {"step": 4098, "train_loss": 3.8303050994873047, "lr": 0.0003903033372048327, "tps": 338355, "wall": 793.9} {"step": 4099, "train_loss": 3.8450944423675537, "lr": 0.0003902971331094065, "tps": 334989, "wall": 802.1} {"step": 4100, "train_loss": 3.791241407394409, "lr": 0.0003902909270848451, "tps": 331705, "wall": 810.2} {"step": 4101, "train_loss": 3.6499876976013184, "lr": 0.00039028471913121895, "tps": 328524, "wall": 818.3} {"step": 4102, "train_loss": 3.7382380962371826, "lr": 0.0003902785092485982, "tps": 325363, "wall": 826.4} {"step": 4103, "train_loss": 3.7100112438201904, "lr": 0.00039027229743705333, "tps": 322303, "wall": 834.5} {"step": 4104, "train_loss": 3.7002453804016113, "lr": 0.0003902660836966547, "tps": 319295, "wall": 842.6} {"step": 4105, "train_loss": 3.763469696044922, "lr": 0.0003902598680274726, "tps": 316360, "wall": 850.6} {"step": 4106, "train_loss": 3.821157932281494, "lr": 0.0003902536504295775, "tps": 313434, "wall": 858.7} {"step": 4107, "train_loss": 3.7209391593933105, "lr": 0.0003902474309030399, "tps": 310564, "wall": 866.9} {"step": 4108, "train_loss": 3.8345770835876465, "lr": 0.00039024120944793013, "tps": 307817, "wall": 874.8} {"step": 4109, "train_loss": 3.748867988586426, "lr": 0.0003902349860643188, "tps": 305024, "wall": 883.1} {"step": 4110, "train_loss": 3.7632763385772705, "lr": 0.00039022876075227634, "tps": 302372, "wall": 891.0} {"step": 4111, "train_loss": 3.728541612625122, "lr": 0.00039022253351187315, "tps": 299711, "wall": 899.1} {"step": 4112, "train_loss": 3.761855125427246, "lr": 0.00039021630434318, "tps": 297120, "wall": 907.2} {"step": 4113, "train_loss": 3.8038833141326904, "lr": 0.00039021007324626733, "tps": 294557, "wall": 915.3} {"step": 4114, "train_loss": 3.7411892414093018, "lr": 0.00039020384022120575, "tps": 292042, "wall": 923.4} {"step": 4115, "train_loss": 3.765439987182617, "lr": 0.0003901976052680658, "tps": 289557, "wall": 931.6} {"step": 4116, "train_loss": 3.7536091804504395, "lr": 0.0003901913683869182, "tps": 287173, "wall": 939.5} {"step": 4117, "train_loss": 3.792820453643799, "lr": 0.0003901851295778336, "tps": 284800, "wall": 947.6} {"step": 4118, "train_loss": 3.7425785064697266, "lr": 0.0003901788888408826, "tps": 282465, "wall": 955.7} {"step": 4119, "train_loss": 3.8426451683044434, "lr": 0.00039017264617613597, "tps": 280187, "wall": 963.7} {"step": 4120, "train_loss": 3.843163013458252, "lr": 0.00039016640158366444, "tps": 277938, "wall": 971.7} {"step": 4121, "train_loss": 3.7725584506988525, "lr": 0.00039016015506353863, "tps": 275700, "wall": 979.8} {"step": 4122, "train_loss": 3.810164451599121, "lr": 0.00039015390661582936, "tps": 273493, "wall": 988.0} {"step": 4123, "train_loss": 3.774228572845459, "lr": 0.0003901476562406075, "tps": 271381, "wall": 995.9} {"step": 4124, "train_loss": 3.771585702896118, "lr": 0.00039014140393794374, "tps": 269221, "wall": 1004.1} {"step": 4125, "train_loss": 3.7774770259857178, "lr": 0.000390135149707909, "tps": 267192, "wall": 1012.0} {"step": 4126, "train_loss": 3.7327122688293457, "lr": 0.0003901288935505741, "tps": 265138, "wall": 1020.1} {"step": 4127, "train_loss": 3.814797878265381, "lr": 0.0003901226354660098, "tps": 263137, "wall": 1028.1} {"step": 4128, "train_loss": 3.7658796310424805, "lr": 0.0003901163754542871, "tps": 261162, "wall": 1036.1} {"step": 4129, "train_loss": 3.79545521736145, "lr": 0.00039011011351547696, "tps": 259224, "wall": 1044.1} {"step": 4130, "train_loss": 3.793917179107666, "lr": 0.00039010384964965027, "tps": 257285, "wall": 1052.3} {"step": 4131, "train_loss": 3.749912738800049, "lr": 0.00039009758385687783, "tps": 255398, "wall": 1060.3} {"step": 4132, "train_loss": 3.87534761428833, "lr": 0.0003900913161372309, "tps": 253546, "wall": 1068.3} {"step": 4133, "train_loss": 3.6864070892333984, "lr": 0.0003900850464907802, "tps": 251748, "wall": 1076.2} {"step": 4134, "train_loss": 3.6483726501464844, "lr": 0.000390078774917597, "tps": 249966, "wall": 1084.1} {"step": 4135, "train_loss": 3.665095329284668, "lr": 0.00039007250141775225, "tps": 248207, "wall": 1092.1} {"step": 4136, "train_loss": 3.9341769218444824, "lr": 0.00039006622599131697, "tps": 246461, "wall": 1100.1} {"step": 4137, "train_loss": 3.809877395629883, "lr": 0.0003900599486383622, "tps": 244727, "wall": 1108.1} {"step": 4138, "train_loss": 3.693164825439453, "lr": 0.0003900536693589592, "tps": 243022, "wall": 1116.2} {"step": 4139, "train_loss": 3.895174980163574, "lr": 0.00039004738815317906, "tps": 241303, "wall": 1124.4} {"step": 4140, "train_loss": 3.6777095794677734, "lr": 0.0003900411050210929, "tps": 239661, "wall": 1132.4} {"step": 4141, "train_loss": 3.8043713569641113, "lr": 0.0003900348199627719, "tps": 237997, "wall": 1140.6} {"step": 4142, "train_loss": 3.7609927654266357, "lr": 0.00039002853297828726, "tps": 236428, "wall": 1148.4} {"step": 4143, "train_loss": 3.867011070251465, "lr": 0.0003900222440677102, "tps": 234848, "wall": 1156.4} {"step": 4144, "train_loss": 3.885101795196533, "lr": 0.00039001595323111195, "tps": 233285, "wall": 1164.4} {"step": 4145, "train_loss": 3.788882255554199, "lr": 0.00039000966046856376, "tps": 231760, "wall": 1172.4} {"step": 4146, "train_loss": 3.6986629962921143, "lr": 0.00039000336578013696, "tps": 230236, "wall": 1180.4} {"step": 4147, "train_loss": 3.725734233856201, "lr": 0.0003899970691659029, "tps": 228745, "wall": 1188.4} {"step": 4148, "train_loss": 3.7829484939575195, "lr": 0.00038999077062593275, "tps": 227282, "wall": 1196.3} {"step": 4149, "train_loss": 3.761876106262207, "lr": 0.000389984470160298, "tps": 225820, "wall": 1204.4} {"step": 4150, "train_loss": 3.6319689750671387, "lr": 0.00038997816776906993, "tps": 224411, "wall": 1212.2} {"step": 4151, "train_loss": 3.747579574584961, "lr": 0.00038997186345232003, "tps": 222983, "wall": 1220.3} {"step": 4152, "train_loss": 3.772141456604004, "lr": 0.00038996555721011966, "tps": 221578, "wall": 1228.3} {"step": 4153, "train_loss": 3.8160245418548584, "lr": 0.0003899592490425402, "tps": 220200, "wall": 1236.3} {"step": 4154, "train_loss": 3.7602336406707764, "lr": 0.00038995293894965327, "tps": 218826, "wall": 1244.4} {"step": 4155, "train_loss": 3.687045097351074, "lr": 0.0003899466269315302, "tps": 217494, "wall": 1252.3} {"step": 4156, "train_loss": 3.754984140396118, "lr": 0.00038994031298824255, "tps": 216186, "wall": 1260.2} {"step": 4157, "train_loss": 3.7338154315948486, "lr": 0.00038993399711986185, "tps": 214886, "wall": 1268.1} {"step": 4158, "train_loss": 3.833014488220215, "lr": 0.00038992767932645965, "tps": 213615, "wall": 1276.0} {"step": 4159, "train_loss": 3.718531370162964, "lr": 0.00038992135960810745, "tps": 212335, "wall": 1284.0} {"step": 4160, "train_loss": 3.7827820777893066, "lr": 0.00038991503796487697, "tps": 211088, "wall": 1291.9} {"step": 4161, "train_loss": 3.9131522178649902, "lr": 0.0003899087143968397, "tps": 209855, "wall": 1299.8} {"step": 4162, "train_loss": 3.6813197135925293, "lr": 0.00038990238890406734, "tps": 208611, "wall": 1307.8} {"step": 4163, "train_loss": 3.7831385135650635, "lr": 0.00038989606148663147, "tps": 207409, "wall": 1315.7} {"step": 4164, "train_loss": 3.6865625381469727, "lr": 0.00038988973214460393, "tps": 206211, "wall": 1323.7} {"step": 4165, "train_loss": 3.75007700920105, "lr": 0.0003898834008780562, "tps": 205042, "wall": 1331.5} {"step": 4166, "train_loss": 3.9075214862823486, "lr": 0.0003898770676870602, "tps": 203858, "wall": 1339.6} {"step": 4167, "train_loss": 3.6664586067199707, "lr": 0.00038987073257168756, "tps": 202703, "wall": 1347.6} {"step": 4168, "train_loss": 3.6974520683288574, "lr": 0.0003898643955320101, "tps": 201566, "wall": 1355.5} {"step": 4169, "train_loss": 3.716806411743164, "lr": 0.0003898580565680995, "tps": 200422, "wall": 1363.5} {"step": 4170, "train_loss": 3.819033145904541, "lr": 0.0003898517156800277, "tps": 199310, "wall": 1371.5} {"step": 4171, "train_loss": 3.777205467224121, "lr": 0.0003898453728678665, "tps": 198212, "wall": 1379.4} {"step": 4172, "train_loss": 3.8271734714508057, "lr": 0.0003898390281316877, "tps": 197101, "wall": 1387.5} {"step": 4173, "train_loss": 3.638101100921631, "lr": 0.00038983268147156316, "tps": 196043, "wall": 1395.3} {"step": 4174, "train_loss": 3.752654552459717, "lr": 0.00038982633288756486, "tps": 194962, "wall": 1403.4} {"step": 4175, "train_loss": 3.8633596897125244, "lr": 0.0003898199823797647, "tps": 193919, "wall": 1411.3} {"step": 4176, "train_loss": 3.7486629486083984, "lr": 0.00038981362994823456, "tps": 192890, "wall": 1419.2} {"step": 4177, "train_loss": 3.768718719482422, "lr": 0.0003898072755930464, "tps": 191861, "wall": 1427.1} {"step": 4178, "train_loss": 3.7652902603149414, "lr": 0.0003898009193142723, "tps": 190847, "wall": 1435.0} {"step": 4179, "train_loss": 3.761492967605591, "lr": 0.00038979456111198414, "tps": 189855, "wall": 1442.9} {"step": 4180, "train_loss": 3.6531310081481934, "lr": 0.0003897882009862541, "tps": 188866, "wall": 1450.8} {"step": 4181, "train_loss": 3.834636688232422, "lr": 0.000389781838937154, "tps": 187882, "wall": 1458.7} {"step": 4182, "train_loss": 3.7246241569519043, "lr": 0.00038977547496475614, "tps": 186893, "wall": 1466.8} {"step": 4183, "train_loss": 3.8167080879211426, "lr": 0.0003897691090691325, "tps": 185932, "wall": 1474.7} {"step": 4184, "train_loss": 3.7605652809143066, "lr": 0.0003897627412503552, "tps": 184978, "wall": 1482.7} {"step": 4185, "train_loss": 3.809971332550049, "lr": 0.00038975637150849633, "tps": 184032, "wall": 1490.7} {"step": 4186, "train_loss": 3.858999252319336, "lr": 0.0003897499998436282, "tps": 183109, "wall": 1498.6} {"step": 4187, "train_loss": 3.8178021907806396, "lr": 0.0003897436262558229, "tps": 182179, "wall": 1506.6} {"step": 4188, "train_loss": 3.810750722885132, "lr": 0.0003897372507451525, "tps": 181281, "wall": 1514.4} {"step": 4189, "train_loss": 3.8022608757019043, "lr": 0.0003897308733116894, "tps": 180374, "wall": 1522.4} {"step": 4190, "train_loss": 3.6420798301696777, "lr": 0.00038972449395550577, "tps": 179477, "wall": 1530.3} {"step": 4191, "train_loss": 3.9045538902282715, "lr": 0.00038971811267667387, "tps": 178598, "wall": 1538.2} {"step": 4192, "train_loss": 3.6543967723846436, "lr": 0.00038971172947526605, "tps": 177714, "wall": 1546.3} {"step": 4193, "train_loss": 3.6306748390197754, "lr": 0.00038970534435135457, "tps": 176848, "wall": 1554.2} {"step": 4194, "train_loss": 3.750793933868408, "lr": 0.0003896989573050118, "tps": 175992, "wall": 1562.1} {"step": 4195, "train_loss": 3.7323124408721924, "lr": 0.00038969256833631, "tps": 175155, "wall": 1570.0} {"step": 4196, "train_loss": 3.805561065673828, "lr": 0.00038968617744532166, "tps": 174317, "wall": 1577.9} {"step": 4197, "train_loss": 3.680878162384033, "lr": 0.000389679784632119, "tps": 173481, "wall": 1585.9} {"step": 4198, "train_loss": 3.7767062187194824, "lr": 0.00038967338989677475, "tps": 172663, "wall": 1593.8} {"step": 4199, "train_loss": 3.822920560836792, "lr": 0.00038966699323936103, "tps": 171841, "wall": 1601.8} {"step": 4200, "train_loss": 3.8288114070892334, "lr": 0.00038966059465995047, "tps": 171042, "wall": 1609.6} {"step": 4201, "train_loss": 3.84359073638916, "lr": 0.00038965419415861553, "tps": 170242, "wall": 1617.6} {"step": 4202, "train_loss": 3.803675413131714, "lr": 0.0003896477917354287, "tps": 169452, "wall": 1625.5} {"step": 4203, "train_loss": 3.772768020629883, "lr": 0.0003896413873904624, "tps": 168677, "wall": 1633.4} {"step": 4204, "train_loss": 3.6752912998199463, "lr": 0.00038963498112378945, "tps": 167900, "wall": 1641.3} {"step": 4205, "train_loss": 3.7152724266052246, "lr": 0.0003896285729354822, "tps": 167120, "wall": 1649.4} {"step": 4206, "train_loss": 3.777891159057617, "lr": 0.0003896221628256133, "tps": 166362, "wall": 1657.3} {"step": 4207, "train_loss": 3.7168049812316895, "lr": 0.0003896157507942553, "tps": 165610, "wall": 1665.2} {"step": 4208, "train_loss": 3.6990408897399902, "lr": 0.0003896093368414809, "tps": 164868, "wall": 1673.1} {"step": 4209, "train_loss": 3.7822022438049316, "lr": 0.0003896029209673628, "tps": 164130, "wall": 1681.0} {"step": 4210, "train_loss": 3.6767992973327637, "lr": 0.0003895965031719737, "tps": 163401, "wall": 1688.9} {"step": 4211, "train_loss": 3.7136073112487793, "lr": 0.00038959008345538614, "tps": 162682, "wall": 1696.8} {"step": 4212, "train_loss": 3.6915433406829834, "lr": 0.00038958366181767297, "tps": 161963, "wall": 1704.7} {"step": 4213, "train_loss": 3.7529921531677246, "lr": 0.0003895772382589069, "tps": 161258, "wall": 1712.6} {"step": 4214, "train_loss": 3.708038330078125, "lr": 0.0003895708127791607, "tps": 160530, "wall": 1720.8} {"step": 4215, "train_loss": 3.8152015209198, "lr": 0.0003895643853785072, "tps": 159851, "wall": 1728.5} {"step": 4216, "train_loss": 3.781764030456543, "lr": 0.0003895579560570192, "tps": 159164, "wall": 1736.4} {"step": 4217, "train_loss": 3.7386481761932373, "lr": 0.00038955152481476936, "tps": 158485, "wall": 1744.2} {"step": 4218, "train_loss": 3.756552219390869, "lr": 0.0003895450916518308, "tps": 157804, "wall": 1752.1} {"step": 4219, "train_loss": 3.7340612411499023, "lr": 0.0003895386565682762, "tps": 157141, "wall": 1760.0} {"step": 4220, "train_loss": 3.802577495574951, "lr": 0.0003895322195641785, "tps": 156468, "wall": 1767.9} {"step": 4221, "train_loss": 3.761579990386963, "lr": 0.0003895257806396108, "tps": 155814, "wall": 1775.8} {"step": 4222, "train_loss": 3.834009885787964, "lr": 0.0003895193397946457, "tps": 155143, "wall": 1783.9} {"step": 4223, "train_loss": 3.7751121520996094, "lr": 0.00038951289702935646, "tps": 154506, "wall": 1791.7} {"step": 4224, "train_loss": 3.8202154636383057, "lr": 0.0003895064523438159, "tps": 153867, "wall": 1799.5} {"step": 4225, "train_loss": 3.851381778717041, "lr": 0.0003895000057380971, "tps": 153228, "wall": 1807.5} {"step": 4226, "train_loss": 3.760122299194336, "lr": 0.00038949355721227305, "tps": 152601, "wall": 1815.3} {"step": 4227, "train_loss": 3.654188632965088, "lr": 0.0003894871067664169, "tps": 151963, "wall": 1823.4} {"step": 4228, "train_loss": 3.7854788303375244, "lr": 0.0003894806544006015, "tps": 151341, "wall": 1831.3} {"step": 4229, "train_loss": 3.829312801361084, "lr": 0.00038947420011490013, "tps": 150723, "wall": 1839.2} {"step": 4230, "train_loss": 3.6947412490844727, "lr": 0.0003894677439093859, "tps": 150114, "wall": 1847.1} {"step": 4231, "train_loss": 3.753330945968628, "lr": 0.00038946128578413184, "tps": 149508, "wall": 1855.1} {"step": 4232, "train_loss": 3.6810059547424316, "lr": 0.00038945482573921124, "tps": 148906, "wall": 1863.0} {"step": 4233, "train_loss": 3.749966859817505, "lr": 0.00038944836377469714, "tps": 148308, "wall": 1871.0} {"step": 4234, "train_loss": 3.8497204780578613, "lr": 0.00038944189989066283, "tps": 147714, "wall": 1878.9} {"step": 4235, "train_loss": 3.718139171600342, "lr": 0.00038943543408718155, "tps": 147122, "wall": 1886.9} {"step": 4236, "train_loss": 3.7319326400756836, "lr": 0.0003894289663643264, "tps": 146557, "wall": 1894.7} {"step": 4237, "train_loss": 3.8140246868133545, "lr": 0.00038942249672217083, "tps": 145960, "wall": 1902.9} {"step": 4238, "train_loss": 3.820209503173828, "lr": 0.00038941602516078796, "tps": 145400, "wall": 1910.6} {"step": 4239, "train_loss": 3.6994619369506836, "lr": 0.00038940955168025135, "tps": 144830, "wall": 1918.6} {"step": 4240, "train_loss": 3.7750184535980225, "lr": 0.00038940307628063407, "tps": 144267, "wall": 1926.5} {"step": 4241, "train_loss": 3.7347002029418945, "lr": 0.00038939659896200957, "tps": 143711, "wall": 1934.5} {"step": 4242, "train_loss": 3.757828950881958, "lr": 0.0003893901197244513, "tps": 143155, "wall": 1942.4} {"step": 4243, "train_loss": 3.783205986022949, "lr": 0.0003893836385680325, "tps": 142602, "wall": 1950.4} {"step": 4244, "train_loss": 3.726018190383911, "lr": 0.0003893771554928268, "tps": 142063, "wall": 1958.3} {"step": 4245, "train_loss": 3.7860093116760254, "lr": 0.0003893706704989074, "tps": 141515, "wall": 1966.3} {"step": 4246, "train_loss": 3.7408764362335205, "lr": 0.00038936418358634795, "tps": 140985, "wall": 1974.2} {"step": 4247, "train_loss": 3.796428680419922, "lr": 0.00038935769475522184, "tps": 140446, "wall": 1982.2} {"step": 4248, "train_loss": 3.739295244216919, "lr": 0.00038935120400560263, "tps": 139924, "wall": 1990.1} {"step": 4249, "train_loss": 3.8178510665893555, "lr": 0.0003893447113375638, "tps": 139409, "wall": 1997.9} {"step": 4250, "train_loss": 3.7939388751983643, "lr": 0.0003893382167511789, "tps": 138882, "wall": 2006.0} {"step": 4251, "train_loss": 3.7005815505981445, "lr": 0.0003893317202465215, "tps": 138375, "wall": 2013.8} {"step": 4252, "train_loss": 3.6729018688201904, "lr": 0.0003893252218236653, "tps": 137862, "wall": 2021.8} {"step": 4253, "train_loss": 3.7398974895477295, "lr": 0.00038931872148268375, "tps": 137361, "wall": 2029.6} {"step": 4254, "train_loss": 3.8444976806640625, "lr": 0.0003893122192236506, "tps": 136856, "wall": 2037.6} {"step": 4255, "train_loss": 3.8159098625183105, "lr": 0.00038930571504663947, "tps": 136361, "wall": 2045.5} {"step": 4256, "train_loss": 3.801236629486084, "lr": 0.000389299208951724, "tps": 135862, "wall": 2053.4} {"step": 4257, "train_loss": 3.6810548305511475, "lr": 0.00038929270093897804, "tps": 135371, "wall": 2061.4} {"step": 4258, "train_loss": 3.7790284156799316, "lr": 0.00038928619100847507, "tps": 134883, "wall": 2069.3} {"step": 4259, "train_loss": 3.8111982345581055, "lr": 0.00038927967916028907, "tps": 134409, "wall": 2077.1} {"step": 4260, "train_loss": 3.637880802154541, "lr": 0.0003892731653944936, "tps": 133923, "wall": 2085.1} {"step": 4261, "train_loss": 3.71065354347229, "lr": 0.0003892666497111627, "tps": 133456, "wall": 2092.9} {"step": 4262, "train_loss": 3.8019323348999023, "lr": 0.00038926013211036995, "tps": 132983, "wall": 2100.9} {"step": 4263, "train_loss": 3.846144676208496, "lr": 0.00038925361259218926, "tps": 132513, "wall": 2108.8} {"step": 4264, "train_loss": 3.799398422241211, "lr": 0.0003892470911566945, "tps": 132051, "wall": 2116.7} {"step": 4265, "train_loss": 3.605344772338867, "lr": 0.0003892405678039595, "tps": 131593, "wall": 2124.6} {"step": 4266, "train_loss": 3.6863362789154053, "lr": 0.0003892340425340583, "tps": 131139, "wall": 2132.4} {"step": 4267, "train_loss": 3.7510013580322266, "lr": 0.0003892275153470646, "tps": 130684, "wall": 2140.3} {"step": 4268, "train_loss": 3.785032272338867, "lr": 0.00038922098624305247, "tps": 130234, "wall": 2148.2} {"step": 4269, "train_loss": 3.7092695236206055, "lr": 0.0003892144552220959, "tps": 129793, "wall": 2156.0} {"step": 4270, "train_loss": 3.7673745155334473, "lr": 0.0003892079222842688, "tps": 129343, "wall": 2164.0} {"step": 4271, "train_loss": 3.759956121444702, "lr": 0.00038920138742964516, "tps": 128904, "wall": 2171.9} {"step": 4272, "train_loss": 3.769726276397705, "lr": 0.00038919485065829916, "tps": 128471, "wall": 2179.8} {"step": 4273, "train_loss": 3.696168899536133, "lr": 0.0003891883119703046, "tps": 128028, "wall": 2187.8} {"step": 4274, "train_loss": 3.8438730239868164, "lr": 0.00038918177136573577, "tps": 127604, "wall": 2195.6} {"step": 4275, "train_loss": 3.7318947315216064, "lr": 0.0003891752288446667, "tps": 127173, "wall": 2203.5} {"step": 4276, "train_loss": 3.7444090843200684, "lr": 0.00038916868440717146, "tps": 126753, "wall": 2211.4} {"step": 4277, "train_loss": 3.793337106704712, "lr": 0.0003891621380533242, "tps": 126333, "wall": 2219.2} {"step": 4278, "train_loss": 3.7540926933288574, "lr": 0.0003891555897831991, "tps": 125917, "wall": 2227.1} {"step": 4279, "train_loss": 3.805790901184082, "lr": 0.00038914903959687036, "tps": 125502, "wall": 2235.0} {"step": 4280, "train_loss": 3.8541228771209717, "lr": 0.00038914248749441206, "tps": 125079, "wall": 2243.0} {"step": 4281, "train_loss": 3.7219338417053223, "lr": 0.0003891359334758986, "tps": 124676, "wall": 2250.8} {"step": 4282, "train_loss": 3.7452073097229004, "lr": 0.00038912937754140406, "tps": 124274, "wall": 2258.6} {"step": 4283, "train_loss": 3.689669609069824, "lr": 0.00038912281969100284, "tps": 123871, "wall": 2266.5} {"step": 4284, "train_loss": 3.7900147438049316, "lr": 0.00038911625992476916, "tps": 123471, "wall": 2274.4} {"step": 4285, "train_loss": 3.7823452949523926, "lr": 0.0003891096982427773, "tps": 123070, "wall": 2282.3} {"step": 4286, "train_loss": 3.791311264038086, "lr": 0.0003891031346451017, "tps": 122676, "wall": 2290.2} {"step": 4287, "train_loss": 3.772310495376587, "lr": 0.0003890965691318166, "tps": 122285, "wall": 2298.0} {"step": 4288, "train_loss": 3.738253593444824, "lr": 0.0003890900017029964, "tps": 121889, "wall": 2306.1} {"step": 4289, "train_loss": 3.696291446685791, "lr": 0.00038908343235871554, "tps": 121499, "wall": 2314.0} {"step": 4290, "train_loss": 3.7915897369384766, "lr": 0.0003890768610990484, "tps": 121116, "wall": 2321.9} {"step": 4291, "train_loss": 3.848870277404785, "lr": 0.00038907028792406945, "tps": 120739, "wall": 2329.7} {"step": 4292, "train_loss": 3.723252534866333, "lr": 0.00038906371283385313, "tps": 120358, "wall": 2337.6} {"step": 4293, "train_loss": 3.768374443054199, "lr": 0.00038905713582847385, "tps": 119985, "wall": 2345.4} {"step": 4294, "train_loss": 3.7741775512695312, "lr": 0.0003890505569080063, "tps": 119611, "wall": 2353.3} {"step": 4295, "train_loss": 3.729954481124878, "lr": 0.00038904397607252483, "tps": 119237, "wall": 2361.2} {"step": 4296, "train_loss": 3.7536563873291016, "lr": 0.00038903739332210406, "tps": 118860, "wall": 2369.2} {"step": 4297, "train_loss": 3.778562307357788, "lr": 0.0003890308086568186, "tps": 118497, "wall": 2377.0} {"step": 4298, "train_loss": 3.838477849960327, "lr": 0.0003890242220767429, "tps": 118122, "wall": 2385.1} {"step": 4299, "train_loss": 3.831998109817505, "lr": 0.00038901763358195173, "tps": 117760, "wall": 2393.0} {"step": 4300, "train_loss": 3.653717279434204, "lr": 0.0003890110431725197, "tps": 117403, "wall": 2400.9} {"step": 4301, "train_loss": 3.8237247467041016, "lr": 0.0003890044508485214, "tps": 117047, "wall": 2408.7} {"step": 4302, "train_loss": 3.7267565727233887, "lr": 0.00038899785661003147, "tps": 116693, "wall": 2416.6} {"step": 4303, "train_loss": 3.72482967376709, "lr": 0.0003889912604571247, "tps": 116340, "wall": 2424.5} {"step": 4304, "train_loss": 3.70322847366333, "lr": 0.0003889846623898759, "tps": 115988, "wall": 2432.4} {"step": 4305, "train_loss": 3.7220516204833984, "lr": 0.0003889780624083596, "tps": 115638, "wall": 2440.3} {"step": 4306, "train_loss": 3.7316503524780273, "lr": 0.0003889714605126507, "tps": 115289, "wall": 2448.3} {"step": 4307, "train_loss": 3.6889753341674805, "lr": 0.00038896485670282397, "tps": 114946, "wall": 2456.2} {"step": 4308, "train_loss": 3.78391170501709, "lr": 0.00038895825097895416, "tps": 114606, "wall": 2464.0} {"step": 4309, "train_loss": 3.7240262031555176, "lr": 0.0003889516433411162, "tps": 114270, "wall": 2471.9} {"step": 4310, "train_loss": 3.6322126388549805, "lr": 0.00038894503378938483, "tps": 113931, "wall": 2479.8} {"step": 4311, "train_loss": 3.7613601684570312, "lr": 0.000388938422323835, "tps": 113595, "wall": 2487.7} {"step": 4312, "train_loss": 3.767754554748535, "lr": 0.00038893180894454153, "tps": 113266, "wall": 2495.5} {"step": 4313, "train_loss": 3.826201915740967, "lr": 0.00038892519365157945, "tps": 112929, "wall": 2503.5} {"step": 4314, "train_loss": 3.830122947692871, "lr": 0.00038891857644502364, "tps": 112602, "wall": 2511.4} {"step": 4315, "train_loss": 3.765526533126831, "lr": 0.00038891195732494905, "tps": 112278, "wall": 2519.2} {"step": 4316, "train_loss": 3.6832447052001953, "lr": 0.0003889053362914306, "tps": 111951, "wall": 2527.1} {"step": 4317, "train_loss": 3.7868001461029053, "lr": 0.00038889871334454347, "tps": 111633, "wall": 2534.9} {"step": 4318, "train_loss": 3.6702914237976074, "lr": 0.0003888920884843625, "tps": 111312, "wall": 2542.8} {"step": 4319, "train_loss": 3.7586560249328613, "lr": 0.00038888546171096287, "tps": 110992, "wall": 2550.8} {"step": 4320, "train_loss": 3.6661267280578613, "lr": 0.00038887883302441957, "tps": 110680, "wall": 2558.6} {"step": 4321, "train_loss": 3.8228983879089355, "lr": 0.0003888722024248078, "tps": 110359, "wall": 2566.6} {"step": 4322, "train_loss": 3.749070167541504, "lr": 0.00038886556991220246, "tps": 110048, "wall": 2574.4} {"step": 4323, "train_loss": 3.698093891143799, "lr": 0.0003888589354866788, "tps": 109738, "wall": 2582.3} {"step": 4324, "train_loss": 3.626011848449707, "lr": 0.00038885229914831205, "tps": 109435, "wall": 2590.0} {"step": 4325, "train_loss": 3.709319591522217, "lr": 0.0003888456608971773, "tps": 109129, "wall": 2597.9} {"step": 4326, "train_loss": 3.792875051498413, "lr": 0.00038883902073334975, "tps": 108819, "wall": 2605.9} {"step": 4327, "train_loss": 3.867826461791992, "lr": 0.0003888323786569047, "tps": 108517, "wall": 2613.8} {"step": 4328, "train_loss": 3.7318010330200195, "lr": 0.00038882573466791725, "tps": 108213, "wall": 2621.7} {"step": 4329, "train_loss": 3.6707653999328613, "lr": 0.0003888190887664628, "tps": 107914, "wall": 2629.6} {"step": 4330, "train_loss": 3.6909611225128174, "lr": 0.00038881244095261653, "tps": 107623, "wall": 2637.3} {"step": 4331, "train_loss": 3.824936866760254, "lr": 0.00038880579122645386, "tps": 107329, "wall": 2645.2} {"step": 4332, "train_loss": 3.6699366569519043, "lr": 0.00038879913958805, "tps": 107040, "wall": 2652.9} {"step": 4333, "train_loss": 3.7336878776550293, "lr": 0.0003887924860374804, "tps": 106746, "wall": 2660.8} {"step": 4334, "train_loss": 3.6562275886535645, "lr": 0.0003887858305748204, "tps": 106453, "wall": 2668.8} {"step": 4335, "train_loss": 3.8379547595977783, "lr": 0.0003887791732001453, "tps": 106166, "wall": 2676.6} {"step": 4336, "train_loss": 3.72868013381958, "lr": 0.00038877251391353067, "tps": 105874, "wall": 2684.6} {"step": 4337, "train_loss": 3.762576103210449, "lr": 0.0003887658527150518, "tps": 105589, "wall": 2692.5} {"step": 4338, "train_loss": 3.7929024696350098, "lr": 0.00038875918960478426, "tps": 105307, "wall": 2700.3} {"step": 4339, "train_loss": 3.676025390625, "lr": 0.00038875252458280354, "tps": 105027, "wall": 2708.1} {"step": 4340, "train_loss": 3.7024481296539307, "lr": 0.00038874585764918503, "tps": 104746, "wall": 2716.0} {"step": 4341, "train_loss": 3.712066650390625, "lr": 0.00038873918880400437, "tps": 104466, "wall": 2723.9} {"step": 4342, "train_loss": 3.988030433654785, "lr": 0.000388732518047337, "tps": 104185, "wall": 2731.9} {"step": 4343, "train_loss": 3.7635817527770996, "lr": 0.0003887258453792585, "tps": 103910, "wall": 2739.7} {"step": 4344, "train_loss": 3.7197933197021484, "lr": 0.0003887191707998445, "tps": 103630, "wall": 2747.8} {"step": 4345, "train_loss": 3.738395929336548, "lr": 0.00038871249430917073, "tps": 103356, "wall": 2755.7} {"step": 4346, "train_loss": 3.7306137084960938, "lr": 0.00038870581590731267, "tps": 103086, "wall": 2763.6} {"step": 4347, "train_loss": 3.7550461292266846, "lr": 0.0003886991355943459, "tps": 102819, "wall": 2771.4} {"step": 4348, "train_loss": 3.6848859786987305, "lr": 0.00038869245337034625, "tps": 102547, "wall": 2779.4} {"step": 4349, "train_loss": 3.7207818031311035, "lr": 0.00038868576923538936, "tps": 102279, "wall": 2787.3} {"step": 4350, "train_loss": 3.666609525680542, "lr": 0.00038867908318955096, "tps": 102014, "wall": 2795.2} {"step": 4351, "train_loss": 3.820509910583496, "lr": 0.00038867239523290674, "tps": 101746, "wall": 2803.2} {"step": 4352, "train_loss": 3.705656051635742, "lr": 0.00038866570536553254, "tps": 101486, "wall": 2811.0} {"step": 4353, "train_loss": 3.817910671234131, "lr": 0.0003886590135875041, "tps": 101226, "wall": 2818.9} {"step": 4354, "train_loss": 3.784071922302246, "lr": 0.0003886523198988972, "tps": 100968, "wall": 2826.7} {"step": 4355, "train_loss": 3.8083763122558594, "lr": 0.00038864562429978777, "tps": 100716, "wall": 2834.4} {"step": 4356, "train_loss": 3.6979823112487793, "lr": 0.0003886389267902515, "tps": 100457, "wall": 2842.4} {"step": 4357, "train_loss": 3.7344045639038086, "lr": 0.0003886322273703644, "tps": 100208, "wall": 2850.1} {"step": 4358, "train_loss": 3.733896255493164, "lr": 0.00038862552604020226, "tps": 99954, "wall": 2858.0} {"step": 4359, "train_loss": 3.719350814819336, "lr": 0.00038861882279984104, "tps": 99698, "wall": 2866.0} {"step": 4360, "train_loss": 3.713601589202881, "lr": 0.0003886121176493567, "tps": 99448, "wall": 2873.9} {"step": 4361, "train_loss": 3.6923282146453857, "lr": 0.00038860541058882524, "tps": 99204, "wall": 2881.6} {"step": 4362, "train_loss": 3.8057610988616943, "lr": 0.0003885987016183225, "tps": 98959, "wall": 2889.4} {"step": 4363, "train_loss": 3.6730480194091797, "lr": 0.00038859199073792446, "tps": 98713, "wall": 2897.3} {"step": 4364, "train_loss": 3.6909141540527344, "lr": 0.0003885852779477073, "tps": 98463, "wall": 2905.3} {"step": 4365, "train_loss": 3.7632710933685303, "lr": 0.000388578563247747, "tps": 98225, "wall": 2913.0} {"step": 4366, "train_loss": 3.6919121742248535, "lr": 0.0003885718466381197, "tps": 97979, "wall": 2921.0} {"step": 4367, "train_loss": 3.8537800312042236, "lr": 0.00038856512811890123, "tps": 97739, "wall": 2928.8} {"step": 4368, "train_loss": 3.5790891647338867, "lr": 0.000388558407690168, "tps": 97497, "wall": 2936.7} {"step": 4369, "train_loss": 3.6865737438201904, "lr": 0.0003885516853519959, "tps": 97261, "wall": 2944.6} {"step": 4370, "train_loss": 3.6099853515625, "lr": 0.0003885449611044613, "tps": 97026, "wall": 2952.4} {"step": 4371, "train_loss": 3.6839842796325684, "lr": 0.0003885382349476402, "tps": 96793, "wall": 2960.1} {"step": 4372, "train_loss": 3.616824150085449, "lr": 0.0003885315068816089, "tps": 96558, "wall": 2968.0} {"step": 4373, "train_loss": 3.7502353191375732, "lr": 0.00038852477690644354, "tps": 96327, "wall": 2975.8} {"step": 4374, "train_loss": 3.645742416381836, "lr": 0.0003885180450222204, "tps": 96092, "wall": 2983.8} {"step": 4375, "train_loss": 3.617216110229492, "lr": 0.0003885113112290157, "tps": 95862, "wall": 2991.6} {"step": 4376, "train_loss": 3.783780813217163, "lr": 0.0003885045755269058, "tps": 95635, "wall": 2999.4} {"step": 4377, "train_loss": 3.7957210540771484, "lr": 0.0003884978379159669, "tps": 95403, "wall": 3007.4} {"step": 4378, "train_loss": 3.8140110969543457, "lr": 0.0003884910983962755, "tps": 95178, "wall": 3015.2} {"step": 4379, "train_loss": 3.766633987426758, "lr": 0.0003884843569679077, "tps": 94951, "wall": 3023.1} {"step": 4380, "train_loss": 3.8499436378479004, "lr": 0.0003884776136309399, "tps": 94726, "wall": 3031.0} {"step": 4381, "train_loss": 3.664309024810791, "lr": 0.00038847086838544875, "tps": 94506, "wall": 3038.7} {"step": 4382, "train_loss": 3.7448883056640625, "lr": 0.00038846412123151044, "tps": 94279, "wall": 3046.7} {"step": 4383, "train_loss": 3.76628041267395, "lr": 0.0003884573721692015, "tps": 94057, "wall": 3054.6} {"step": 4384, "train_loss": 3.7722103595733643, "lr": 0.00038845062119859824, "tps": 93838, "wall": 3062.4} {"step": 4385, "train_loss": 3.6382265090942383, "lr": 0.0003884438683197773, "tps": 93621, "wall": 3070.2} {"step": 4386, "train_loss": 3.752364158630371, "lr": 0.00038843711353281503, "tps": 93403, "wall": 3078.1} {"step": 4387, "train_loss": 3.7282803058624268, "lr": 0.00038843035683778804, "tps": 93185, "wall": 3086.0} {"step": 4388, "train_loss": 3.7607414722442627, "lr": 0.00038842359823477296, "tps": 92972, "wall": 3093.8} {"step": 4389, "train_loss": 3.6600639820098877, "lr": 0.0003884168377238461, "tps": 92754, "wall": 3101.8} {"step": 4390, "train_loss": 3.8322157859802246, "lr": 0.00038841007530508433, "tps": 92543, "wall": 3109.6} {"step": 4391, "train_loss": 3.834108352661133, "lr": 0.000388403310978564, "tps": 92331, "wall": 3117.4} {"step": 4392, "train_loss": 3.7897114753723145, "lr": 0.000388396544744362, "tps": 92121, "wall": 3125.2} {"step": 4393, "train_loss": 3.66384220123291, "lr": 0.00038838977660255467, "tps": 91910, "wall": 3133.1} {"step": 4394, "train_loss": 3.7235584259033203, "lr": 0.0003883830065532189, "tps": 91700, "wall": 3141.0} {"step": 4395, "train_loss": 3.802313804626465, "lr": 0.0003883762345964314, "tps": 91490, "wall": 3148.9} {"step": 4396, "train_loss": 3.7142257690429688, "lr": 0.0003883694607322687, "tps": 91284, "wall": 3156.8} {"step": 4397, "train_loss": 3.771681547164917, "lr": 0.0003883626849608076, "tps": 91074, "wall": 3164.7} {"step": 4398, "train_loss": 3.7495603561401367, "lr": 0.00038835590728212503, "tps": 90868, "wall": 3172.6} {"step": 4399, "train_loss": 3.7684900760650635, "lr": 0.00038834912769629756, "tps": 90665, "wall": 3180.5} {"step": 4400, "train_loss": 3.6569106578826904, "lr": 0.0003883423462034021, "tps": 90460, "wall": 3188.4} {"step": 4401, "train_loss": 3.706787347793579, "lr": 0.0003883355628035154, "tps": 90260, "wall": 3196.2} {"step": 4402, "train_loss": 3.7434749603271484, "lr": 0.0003883287774967143, "tps": 90058, "wall": 3204.1} {"step": 4403, "train_loss": 3.7623579502105713, "lr": 0.0003883219902830758, "tps": 89858, "wall": 3211.9} {"step": 4404, "train_loss": 3.844965696334839, "lr": 0.00038831520116267666, "tps": 89661, "wall": 3219.7} {"step": 4405, "train_loss": 3.713740348815918, "lr": 0.0003883084101355938, "tps": 89459, "wall": 3227.7} {"step": 4406, "train_loss": 3.8054122924804688, "lr": 0.0003883016172019042, "tps": 89260, "wall": 3235.7} {"step": 4407, "train_loss": 3.6844189167022705, "lr": 0.0003882948223616847, "tps": 89062, "wall": 3243.6} {"step": 4408, "train_loss": 3.7655844688415527, "lr": 0.00038828802561501237, "tps": 88870, "wall": 3251.4} {"step": 4409, "train_loss": 3.8162503242492676, "lr": 0.00038828122696196423, "tps": 88675, "wall": 3259.2} {"step": 4410, "train_loss": 3.7182211875915527, "lr": 0.00038827442640261724, "tps": 88478, "wall": 3267.2} {"step": 4411, "train_loss": 3.720277786254883, "lr": 0.00038826762393704843, "tps": 88288, "wall": 3275.0} {"step": 4412, "train_loss": 3.6331257820129395, "lr": 0.00038826081956533484, "tps": 88094, "wall": 3283.0} {"step": 4413, "train_loss": 3.685999870300293, "lr": 0.00038825401328755355, "tps": 87906, "wall": 3290.7} {"step": 4414, "train_loss": 3.7192580699920654, "lr": 0.0003882472051037818, "tps": 87716, "wall": 3298.6} {"step": 4415, "train_loss": 3.866056442260742, "lr": 0.0003882403950140965, "tps": 87529, "wall": 3306.4} {"step": 4416, "train_loss": 3.793942451477051, "lr": 0.000388233583018575, "tps": 87342, "wall": 3314.2} {"step": 4417, "train_loss": 3.6603384017944336, "lr": 0.00038822676911729435, "tps": 87153, "wall": 3322.2} {"step": 4418, "train_loss": 3.6495347023010254, "lr": 0.0003882199533103317, "tps": 86966, "wall": 3330.1} {"step": 4419, "train_loss": 3.780365467071533, "lr": 0.0003882131355977644, "tps": 86783, "wall": 3337.8} {"step": 4420, "train_loss": 3.652557849884033, "lr": 0.0003882063159796695, "tps": 86594, "wall": 3345.9} {"step": 4421, "train_loss": 3.7373273372650146, "lr": 0.00038819949445612447, "tps": 86412, "wall": 3353.7} {"step": 4422, "train_loss": 3.733764886856079, "lr": 0.0003881926710272064, "tps": 86232, "wall": 3361.5} {"step": 4423, "train_loss": 3.7001864910125732, "lr": 0.00038818584569299267, "tps": 86051, "wall": 3369.3} {"step": 4424, "train_loss": 3.787825584411621, "lr": 0.00038817901845356056, "tps": 85867, "wall": 3377.3} {"step": 4425, "train_loss": 3.6240689754486084, "lr": 0.00038817218930898743, "tps": 85687, "wall": 3385.1} {"step": 4426, "train_loss": 3.754920244216919, "lr": 0.0003881653582593507, "tps": 85508, "wall": 3393.0} {"step": 4427, "train_loss": 3.81884765625, "lr": 0.0003881585253047276, "tps": 85327, "wall": 3400.9} {"step": 4428, "train_loss": 3.792419910430908, "lr": 0.0003881516904451957, "tps": 85154, "wall": 3408.6} {"step": 4429, "train_loss": 3.7791972160339355, "lr": 0.00038814485368083234, "tps": 84974, "wall": 3416.6} {"step": 4430, "train_loss": 3.7868189811706543, "lr": 0.000388138015011715, "tps": 84799, "wall": 3424.4} {"step": 4431, "train_loss": 3.7193603515625, "lr": 0.0003881311744379211, "tps": 84625, "wall": 3432.3} {"step": 4432, "train_loss": 3.6916465759277344, "lr": 0.00038812433195952817, "tps": 84447, "wall": 3440.2} {"step": 4433, "train_loss": 3.7790374755859375, "lr": 0.0003881174875766137, "tps": 84271, "wall": 3448.2} {"step": 4434, "train_loss": 3.8423848152160645, "lr": 0.0003881106412892552, "tps": 84101, "wall": 3456.0} {"step": 4435, "train_loss": 3.7964587211608887, "lr": 0.0003881037930975303, "tps": 83927, "wall": 3463.9} {"step": 4436, "train_loss": 3.7451729774475098, "lr": 0.0003880969430015166, "tps": 83757, "wall": 3471.7} {"step": 4437, "train_loss": 3.7645392417907715, "lr": 0.0003880900910012915, "tps": 83585, "wall": 3479.6} {"step": 4438, "train_loss": 3.752035140991211, "lr": 0.00038808323709693286, "tps": 83417, "wall": 3487.5} {"step": 4439, "train_loss": 3.695913791656494, "lr": 0.0003880763812885182, "tps": 83248, "wall": 3495.3} {"step": 4440, "train_loss": 3.6890060901641846, "lr": 0.0003880695235761252, "tps": 83079, "wall": 3503.2} {"step": 4441, "train_loss": 3.763516426086426, "lr": 0.0003880626639598315, "tps": 82910, "wall": 3511.1} {"step": 4442, "train_loss": 3.635338306427002, "lr": 0.00038805580243971493, "tps": 82747, "wall": 3518.8} {"step": 4443, "train_loss": 3.7371280193328857, "lr": 0.000388048939015853, "tps": 82579, "wall": 3526.8} {"step": 4444, "train_loss": 3.759164333343506, "lr": 0.0003880420736883238, "tps": 82414, "wall": 3534.7} {"step": 4445, "train_loss": 3.6711766719818115, "lr": 0.00038803520645720475, "tps": 82247, "wall": 3542.6} {"step": 4446, "train_loss": 3.7684762477874756, "lr": 0.00038802833732257385, "tps": 82087, "wall": 3550.3} {"step": 4447, "train_loss": 3.7226786613464355, "lr": 0.0003880214662845088, "tps": 81924, "wall": 3558.2} {"step": 4448, "train_loss": 3.8159799575805664, "lr": 0.0003880145933430875, "tps": 81760, "wall": 3566.2} {"step": 4449, "train_loss": 3.7496538162231445, "lr": 0.00038800771849838785, "tps": 81597, "wall": 3574.1} {"step": 4450, "train_loss": 3.70455002784729, "lr": 0.0003880008417504876, "tps": 81435, "wall": 3582.0} {"step": 4451, "train_loss": 3.8612163066864014, "lr": 0.00038799396309946487, "tps": 81276, "wall": 3589.8} {"step": 4452, "train_loss": 3.794822931289673, "lr": 0.0003879870825453973, "tps": 81118, "wall": 3597.6} {"step": 4453, "train_loss": 3.748264789581299, "lr": 0.000387980200088363, "tps": 80960, "wall": 3605.4} {"step": 4454, "train_loss": 3.7543797492980957, "lr": 0.00038797331572843993, "tps": 80803, "wall": 3613.3} {"step": 4455, "train_loss": 3.859415292739868, "lr": 0.000387966429465706, "tps": 80644, "wall": 3621.2} {"step": 4456, "train_loss": 3.7408554553985596, "lr": 0.00038795954130023934, "tps": 80482, "wall": 3629.3} {"step": 4457, "train_loss": 3.753329277038574, "lr": 0.0003879526512321179, "tps": 80328, "wall": 3637.1} {"step": 4458, "train_loss": 3.6849112510681152, "lr": 0.0003879457592614197, "tps": 80172, "wall": 3644.9} {"step": 4459, "train_loss": 3.6776318550109863, "lr": 0.0003879388653882229, "tps": 80018, "wall": 3652.8} {"step": 4460, "train_loss": 3.6780500411987305, "lr": 0.0003879319696126055, "tps": 79867, "wall": 3660.5} {"step": 4461, "train_loss": 3.7192015647888184, "lr": 0.00038792507193464564, "tps": 79711, "wall": 3668.5} {"step": 4462, "train_loss": 3.657252788543701, "lr": 0.0003879181723544216, "tps": 79560, "wall": 3676.3} {"step": 4463, "train_loss": 3.7082085609436035, "lr": 0.00038791127087201135, "tps": 79409, "wall": 3684.1} {"step": 4464, "train_loss": 3.6439907550811768, "lr": 0.0003879043674874931, "tps": 79256, "wall": 3692.0} {"step": 4465, "train_loss": 3.737908124923706, "lr": 0.00038789746220094516, "tps": 79107, "wall": 3699.8} {"step": 4466, "train_loss": 3.723048210144043, "lr": 0.0003878905550124456, "tps": 78956, "wall": 3707.7} {"step": 4467, "train_loss": 3.728154182434082, "lr": 0.0003878836459220728, "tps": 78808, "wall": 3715.5} {"step": 4468, "train_loss": 3.775217294692993, "lr": 0.00038787673492990496, "tps": 78659, "wall": 3723.4} {"step": 4469, "train_loss": 3.7287912368774414, "lr": 0.00038786982203602047, "tps": 78513, "wall": 3731.2} {"step": 4470, "train_loss": 3.767385721206665, "lr": 0.00038786290724049746, "tps": 78365, "wall": 3739.0} {"step": 4471, "train_loss": 3.673046112060547, "lr": 0.0003878559905434144, "tps": 78217, "wall": 3747.0} {"step": 4472, "train_loss": 3.8195300102233887, "lr": 0.00038784907194484955, "tps": 78072, "wall": 3754.8} {"step": 4473, "train_loss": 3.7317845821380615, "lr": 0.0003878421514448813, "tps": 77923, "wall": 3762.8} {"step": 4474, "train_loss": 3.712785243988037, "lr": 0.0003878352290435882, "tps": 77780, "wall": 3770.5} {"step": 4475, "train_loss": 3.6918482780456543, "lr": 0.0003878283047410485, "tps": 77636, "wall": 3778.3} {"step": 4476, "train_loss": 3.783754825592041, "lr": 0.0003878213785373407, "tps": 77494, "wall": 3786.2} {"step": 4477, "train_loss": 3.7612967491149902, "lr": 0.00038781445043254315, "tps": 77354, "wall": 3793.9} {"step": 4478, "train_loss": 3.6924214363098145, "lr": 0.00038780752042673447, "tps": 77212, "wall": 3801.7} {"step": 4479, "train_loss": 3.790283441543579, "lr": 0.00038780058851999315, "tps": 77070, "wall": 3809.5} {"step": 4480, "train_loss": 3.7002525329589844, "lr": 0.0003877936547123977, "tps": 76930, "wall": 3817.3} {"step": 4481, "train_loss": 3.6900508403778076, "lr": 0.00038778671900402666, "tps": 76787, "wall": 3825.3} {"step": 4482, "train_loss": 3.6757314205169678, "lr": 0.00038777978139495855, "tps": 76648, "wall": 3833.0} {"step": 4483, "train_loss": 3.830221176147461, "lr": 0.000387772841885272, "tps": 76508, "wall": 3840.9} {"step": 4484, "train_loss": 3.6973166465759277, "lr": 0.00038776590047504564, "tps": 76371, "wall": 3848.7} {"step": 4485, "train_loss": 3.6258745193481445, "lr": 0.0003877589571643581, "tps": 76234, "wall": 3856.5} {"step": 4486, "train_loss": 3.7493085861206055, "lr": 0.00038775201195328797, "tps": 76095, "wall": 3864.3} {"step": 4487, "train_loss": 3.7615790367126465, "lr": 0.000387745064841914, "tps": 75959, "wall": 3872.1} {"step": 4488, "train_loss": 3.7944674491882324, "lr": 0.0003877381158303149, "tps": 75824, "wall": 3879.9} {"step": 4489, "train_loss": 3.8384766578674316, "lr": 0.00038773116491856924, "tps": 75685, "wall": 3887.9} {"step": 4490, "train_loss": 3.716411828994751, "lr": 0.000387724212106756, "tps": 75552, "wall": 3895.6} {"step": 4491, "train_loss": 3.755406379699707, "lr": 0.0003877172573949537, "tps": 75418, "wall": 3903.4} {"step": 4492, "train_loss": 3.7820332050323486, "lr": 0.0003877103007832413, "tps": 75287, "wall": 3911.0} {"step": 4493, "train_loss": 3.7056007385253906, "lr": 0.0003877033422716975, "tps": 75154, "wall": 3918.8} {"step": 4494, "train_loss": 3.78700590133667, "lr": 0.00038769638186040125, "tps": 75021, "wall": 3926.7} {"step": 4495, "train_loss": 3.7025790214538574, "lr": 0.0003876894195494312, "tps": 74888, "wall": 3934.5} {"step": 4496, "train_loss": 3.7521779537200928, "lr": 0.0003876824553388664, "tps": 74754, "wall": 3942.5} {"step": 4497, "train_loss": 3.7630228996276855, "lr": 0.00038767548922878566, "tps": 74624, "wall": 3950.2} {"step": 4498, "train_loss": 3.668144464492798, "lr": 0.00038766852121926786, "tps": 74494, "wall": 3958.0} {"step": 4499, "train_loss": 3.7299764156341553, "lr": 0.00038766155131039206, "tps": 74365, "wall": 3965.7} {"step": 4500, "train_loss": 3.7430059909820557, "lr": 0.0003876545795022371, "tps": 74237, "wall": 3973.4} {"step": 4501, "train_loss": 3.8200106620788574, "lr": 0.000387647605794882, "tps": 74109, "wall": 3981.2} {"step": 4502, "train_loss": 3.6918740272521973, "lr": 0.00038764063018840577, "tps": 73977, "wall": 3989.2} {"step": 4503, "train_loss": 3.647477865219116, "lr": 0.00038763365268288736, "tps": 73848, "wall": 3997.0} {"step": 4504, "train_loss": 3.7116503715515137, "lr": 0.0003876266732784059, "tps": 73719, "wall": 4004.9} {"step": 4505, "train_loss": 3.792417526245117, "lr": 0.00038761969197504044, "tps": 73592, "wall": 4012.7} {"step": 4506, "train_loss": 3.660872459411621, "lr": 0.00038761270877287, "tps": 73466, "wall": 4020.5} {"step": 4507, "train_loss": 3.6405107975006104, "lr": 0.0003876057236719737, "tps": 73341, "wall": 4028.2} {"step": 4508, "train_loss": 3.5338551998138428, "lr": 0.00038759873667243075, "tps": 73215, "wall": 4036.0} {"step": 4509, "train_loss": 3.7718825340270996, "lr": 0.00038759174777432023, "tps": 73090, "wall": 4043.9} {"step": 4510, "train_loss": 3.7503223419189453, "lr": 0.00038758475697772134, "tps": 72965, "wall": 4051.7} {"step": 4511, "train_loss": 3.663828134536743, "lr": 0.00038757776428271324, "tps": 72842, "wall": 4059.4} {"step": 4512, "train_loss": 3.6884164810180664, "lr": 0.0003875707696893752, "tps": 72716, "wall": 4067.4} {"step": 4513, "train_loss": 3.854156494140625, "lr": 0.00038756377319778634, "tps": 72591, "wall": 4075.2} {"step": 4514, "train_loss": 3.7346341609954834, "lr": 0.000387556774808026, "tps": 72469, "wall": 4083.0} {"step": 4515, "train_loss": 3.6947762966156006, "lr": 0.0003875497745201735, "tps": 72349, "wall": 4090.7} {"step": 4516, "train_loss": 3.8407397270202637, "lr": 0.0003875427723343081, "tps": 72226, "wall": 4098.6} {"step": 4517, "train_loss": 3.7057361602783203, "lr": 0.00038753576825050905, "tps": 72102, "wall": 4106.5} {"step": 4518, "train_loss": 3.7487282752990723, "lr": 0.0003875287622688558, "tps": 71980, "wall": 4114.4} {"step": 4519, "train_loss": 3.7030436992645264, "lr": 0.00038752175438942765, "tps": 71860, "wall": 4122.2} {"step": 4520, "train_loss": 3.6644177436828613, "lr": 0.000387514744612304, "tps": 71740, "wall": 4130.0} {"step": 4521, "train_loss": 3.7150461673736572, "lr": 0.00038750773293756425, "tps": 71621, "wall": 4137.7} {"step": 4522, "train_loss": 3.6735501289367676, "lr": 0.00038750071936528786, "tps": 71503, "wall": 4145.5} {"step": 4523, "train_loss": 3.754599094390869, "lr": 0.00038749370389555424, "tps": 71384, "wall": 4153.3} {"step": 4524, "train_loss": 3.7384040355682373, "lr": 0.00038748668652844296, "tps": 71264, "wall": 4161.3} {"step": 4525, "train_loss": 3.701436996459961, "lr": 0.00038747966726403334, "tps": 71145, "wall": 4169.2} {"step": 4526, "train_loss": 3.6318187713623047, "lr": 0.000387472646102405, "tps": 71029, "wall": 4176.9} {"step": 4527, "train_loss": 3.731062412261963, "lr": 0.0003874656230436375, "tps": 70910, "wall": 4184.8} {"step": 4528, "train_loss": 3.6025445461273193, "lr": 0.00038745859808781037, "tps": 70794, "wall": 4192.6} {"step": 4529, "train_loss": 3.623286724090576, "lr": 0.0003874515712350031, "tps": 70680, "wall": 4200.3} {"step": 4530, "train_loss": 3.751781463623047, "lr": 0.0003874445424852954, "tps": 70565, "wall": 4208.1} {"step": 4531, "train_loss": 3.7127461433410645, "lr": 0.0003874375118387669, "tps": 70450, "wall": 4215.9} {"step": 4532, "train_loss": 3.7192885875701904, "lr": 0.00038743047929549725, "tps": 70332, "wall": 4223.8} {"step": 4533, "train_loss": 3.7889881134033203, "lr": 0.00038742344485556603, "tps": 70220, "wall": 4231.6} {"step": 4534, "train_loss": 3.689516544342041, "lr": 0.00038741640851905297, "tps": 70106, "wall": 4239.4} {"step": 4535, "train_loss": 3.75771164894104, "lr": 0.0003874093702860378, "tps": 69991, "wall": 4247.2} {"step": 4536, "train_loss": 3.6998956203460693, "lr": 0.00038740233015660015, "tps": 69877, "wall": 4255.1} {"step": 4537, "train_loss": 3.7990059852600098, "lr": 0.0003873952881308199, "tps": 69765, "wall": 4262.9} {"step": 4538, "train_loss": 3.6555981636047363, "lr": 0.00038738824420877675, "tps": 69653, "wall": 4270.7} {"step": 4539, "train_loss": 3.746326446533203, "lr": 0.0003873811983905506, "tps": 69541, "wall": 4278.5} {"step": 4540, "train_loss": 3.795356035232544, "lr": 0.0003873741506762211, "tps": 69426, "wall": 4286.6} {"step": 4541, "train_loss": 3.6072397232055664, "lr": 0.00038736710106586814, "tps": 69316, "wall": 4294.3} {"step": 4542, "train_loss": 3.6719276905059814, "lr": 0.0003873600495595716, "tps": 69204, "wall": 4302.2} {"step": 4543, "train_loss": 3.8180294036865234, "lr": 0.00038735299615741143, "tps": 69096, "wall": 4309.9} {"step": 4544, "train_loss": 3.712301254272461, "lr": 0.00038734594085946747, "tps": 68986, "wall": 4317.7} {"step": 4545, "train_loss": 3.761119842529297, "lr": 0.0003873388836658196, "tps": 68876, "wall": 4325.5} {"step": 4546, "train_loss": 3.790817975997925, "lr": 0.00038733182457654776, "tps": 68768, "wall": 4333.3} {"step": 4547, "train_loss": 3.723938465118408, "lr": 0.00038732476359173203, "tps": 68659, "wall": 4341.1} {"step": 4548, "train_loss": 3.717442274093628, "lr": 0.00038731770071145233, "tps": 68549, "wall": 4349.1} {"step": 4549, "train_loss": 3.66943097114563, "lr": 0.0003873106359357886, "tps": 68440, "wall": 4356.9} {"step": 4550, "train_loss": 3.707890510559082, "lr": 0.000387303569264821, "tps": 68332, "wall": 4364.8} {"step": 4551, "train_loss": 3.665663719177246, "lr": 0.0003872965006986295, "tps": 68225, "wall": 4372.5} {"step": 4552, "train_loss": 3.762596845626831, "lr": 0.00038728943023729417, "tps": 68118, "wall": 4380.4} {"step": 4553, "train_loss": 3.702465534210205, "lr": 0.00038728235788089514, "tps": 68012, "wall": 4388.2} {"step": 4554, "train_loss": 3.65484881401062, "lr": 0.00038727528362951253, "tps": 67907, "wall": 4395.9} {"step": 4555, "train_loss": 3.7213730812072754, "lr": 0.0003872682074832264, "tps": 67800, "wall": 4403.8} {"step": 4556, "train_loss": 3.7667675018310547, "lr": 0.00038726112944211704, "tps": 67697, "wall": 4411.5} {"step": 4557, "train_loss": 3.606114387512207, "lr": 0.0003872540495062645, "tps": 67593, "wall": 4419.2} {"step": 4558, "train_loss": 3.588498115539551, "lr": 0.00038724696767574905, "tps": 67486, "wall": 4427.2} {"step": 4559, "train_loss": 3.743767738342285, "lr": 0.0003872398839506509, "tps": 67382, "wall": 4435.0} {"step": 4560, "train_loss": 3.6257877349853516, "lr": 0.0003872327983310503, "tps": 67279, "wall": 4442.8} {"step": 4561, "train_loss": 3.737191677093506, "lr": 0.0003872257108170275, "tps": 67175, "wall": 4450.7} {"step": 4562, "train_loss": 3.664066791534424, "lr": 0.00038721862140866285, "tps": 67072, "wall": 4458.5} {"step": 4563, "train_loss": 3.6578710079193115, "lr": 0.00038721153010603664, "tps": 66968, "wall": 4466.4} {"step": 4564, "train_loss": 3.775850296020508, "lr": 0.0003872044369092291, "tps": 66868, "wall": 4474.0} {"step": 4565, "train_loss": 3.6771202087402344, "lr": 0.0003871973418183206, "tps": 66764, "wall": 4482.0} {"step": 4566, "train_loss": 3.6441359519958496, "lr": 0.00038719024483339166, "tps": 66664, "wall": 4489.7} {"step": 4567, "train_loss": 3.6242287158966064, "lr": 0.00038718314595452254, "tps": 66562, "wall": 4497.5} {"step": 4568, "train_loss": 3.829296112060547, "lr": 0.00038717604518179367, "tps": 66462, "wall": 4505.3} {"step": 4569, "train_loss": 3.626461982727051, "lr": 0.0003871689425152856, "tps": 66363, "wall": 4513.0} {"step": 4570, "train_loss": 3.7819910049438477, "lr": 0.00038716183795507866, "tps": 66263, "wall": 4520.8} {"step": 4571, "train_loss": 3.582988739013672, "lr": 0.00038715473150125336, "tps": 66161, "wall": 4528.8} {"step": 4572, "train_loss": 3.633727550506592, "lr": 0.00038714762315389026, "tps": 66063, "wall": 4536.5} {"step": 4573, "train_loss": 3.585513114929199, "lr": 0.00038714051291306983, "tps": 65963, "wall": 4544.4} {"step": 4574, "train_loss": 3.7995247840881348, "lr": 0.0003871334007788726, "tps": 65864, "wall": 4552.2} {"step": 4575, "train_loss": 3.695127010345459, "lr": 0.0003871262867513792, "tps": 65767, "wall": 4559.9} {"step": 4576, "train_loss": 3.700745105743408, "lr": 0.00038711917083067014, "tps": 65670, "wall": 4567.7} {"step": 4577, "train_loss": 3.7805981636047363, "lr": 0.0003871120530168261, "tps": 65571, "wall": 4575.5} {"step": 4578, "train_loss": 3.6199288368225098, "lr": 0.0003871049333099277, "tps": 65475, "wall": 4583.3} {"step": 4579, "train_loss": 3.726889133453369, "lr": 0.00038709781171005555, "tps": 65378, "wall": 4591.1} {"step": 4580, "train_loss": 3.747875452041626, "lr": 0.0003870906882172903, "tps": 65280, "wall": 4598.9} {"step": 4581, "train_loss": 3.7322354316711426, "lr": 0.0003870835628317128, "tps": 65183, "wall": 4606.8} {"step": 4582, "train_loss": 3.8213586807250977, "lr": 0.0003870764355534036, "tps": 65087, "wall": 4614.6} {"step": 4583, "train_loss": 3.698352575302124, "lr": 0.0003870693063824435, "tps": 64992, "wall": 4622.3} {"step": 4584, "train_loss": 3.790231227874756, "lr": 0.0003870621753189132, "tps": 64897, "wall": 4630.1} {"step": 4585, "train_loss": 3.6817915439605713, "lr": 0.0003870550423628937, "tps": 64802, "wall": 4637.9} {"step": 4586, "train_loss": 3.6852927207946777, "lr": 0.00038704790751446555, "tps": 64707, "wall": 4645.7} {"step": 4587, "train_loss": 3.755183696746826, "lr": 0.0003870407707737097, "tps": 64613, "wall": 4653.5} {"step": 4588, "train_loss": 3.5970458984375, "lr": 0.00038703363214070686, "tps": 64517, "wall": 4661.5} {"step": 4589, "train_loss": 3.6762678623199463, "lr": 0.0003870264916155381, "tps": 64424, "wall": 4669.2} {"step": 4590, "train_loss": 3.7002387046813965, "lr": 0.00038701934919828417, "tps": 64329, "wall": 4677.1} {"step": 4591, "train_loss": 3.591660737991333, "lr": 0.000387012204889026, "tps": 64236, "wall": 4684.9} {"step": 4592, "train_loss": 3.7159230709075928, "lr": 0.0003870050586878445, "tps": 64144, "wall": 4692.6} {"step": 4593, "train_loss": 3.6443958282470703, "lr": 0.00038699791059482083, "tps": 64053, "wall": 4700.4} {"step": 4594, "train_loss": 3.81541109085083, "lr": 0.0003869907606100356, "tps": 63959, "wall": 4708.3} {"step": 4595, "train_loss": 3.7483508586883545, "lr": 0.0003869836087335701, "tps": 63869, "wall": 4715.9} {"step": 4596, "train_loss": 3.6710519790649414, "lr": 0.0003869764549655053, "tps": 63776, "wall": 4723.8} {"step": 4597, "train_loss": 3.6098155975341797, "lr": 0.00038696929930592203, "tps": 63686, "wall": 4731.5} {"step": 4598, "train_loss": 3.7432994842529297, "lr": 0.0003869621417549016, "tps": 63594, "wall": 4739.4} {"step": 4599, "train_loss": 3.809366226196289, "lr": 0.000386954982312525, "tps": 63503, "wall": 4747.2} {"step": 4600, "train_loss": 3.634835720062256, "lr": 0.0003869478209788733, "tps": 63413, "wall": 4755.0} {"step": 4601, "train_loss": 3.81449294090271, "lr": 0.0003869406577540277, "tps": 63323, "wall": 4762.8} {"step": 4602, "train_loss": 3.7184042930603027, "lr": 0.0003869334926380693, "tps": 63232, "wall": 4770.7} {"step": 4603, "train_loss": 3.7984468936920166, "lr": 0.0003869263256310792, "tps": 63144, "wall": 4778.4} {"step": 4604, "train_loss": 3.6371474266052246, "lr": 0.0003869191567331386, "tps": 63053, "wall": 4786.3} {"step": 4605, "train_loss": 3.6765401363372803, "lr": 0.0003869119859443289, "tps": 62965, "wall": 4794.0} {"step": 4606, "train_loss": 3.722637891769409, "lr": 0.0003869048132647311, "tps": 62877, "wall": 4801.8} {"step": 4607, "train_loss": 3.680281639099121, "lr": 0.0003868976386944266, "tps": 62790, "wall": 4809.5} {"step": 4608, "train_loss": 3.667968273162842, "lr": 0.00038689046223349657, "tps": 62702, "wall": 4817.3} {"step": 4609, "train_loss": 3.801103115081787, "lr": 0.0003868832838820224, "tps": 62614, "wall": 4825.1} {"step": 4610, "train_loss": 3.547684669494629, "lr": 0.00038687610364008537, "tps": 62528, "wall": 4832.8} {"step": 4611, "train_loss": 3.6774728298187256, "lr": 0.00038686892150776675, "tps": 62441, "wall": 4840.5} {"step": 4612, "train_loss": 3.6734187602996826, "lr": 0.00038686173748514805, "tps": 62355, "wall": 4848.3} {"step": 4613, "train_loss": 3.7080881595611572, "lr": 0.0003868545515723105, "tps": 62269, "wall": 4856.0} {"step": 4614, "train_loss": 3.7555389404296875, "lr": 0.00038684736376933557, "tps": 62183, "wall": 4863.8} {"step": 4615, "train_loss": 3.6534790992736816, "lr": 0.00038684017407630464, "tps": 62098, "wall": 4871.5} {"step": 4616, "train_loss": 3.7955799102783203, "lr": 0.00038683298249329927, "tps": 62011, "wall": 4879.4} {"step": 4617, "train_loss": 3.7416720390319824, "lr": 0.0003868257890204008, "tps": 61924, "wall": 4887.3} {"step": 4618, "train_loss": 3.7424917221069336, "lr": 0.00038681859365769075, "tps": 61841, "wall": 4894.9} {"step": 4619, "train_loss": 3.7164762020111084, "lr": 0.0003868113964052507, "tps": 61756, "wall": 4902.8} {"step": 4620, "train_loss": 3.7358291149139404, "lr": 0.0003868041972631621, "tps": 61672, "wall": 4910.5} {"step": 4621, "train_loss": 3.7935619354248047, "lr": 0.00038679699623150654, "tps": 61588, "wall": 4918.3} {"step": 4622, "train_loss": 3.728600025177002, "lr": 0.00038678979331036555, "tps": 61505, "wall": 4926.0} {"step": 4623, "train_loss": 3.6525659561157227, "lr": 0.0003867825884998208, "tps": 61421, "wall": 4933.7} {"step": 4624, "train_loss": 3.6921231746673584, "lr": 0.00038677538179995386, "tps": 61338, "wall": 4941.5} {"step": 4625, "train_loss": 3.727935314178467, "lr": 0.00038676817321084634, "tps": 61254, "wall": 4949.4} {"step": 4626, "train_loss": 3.72086501121521, "lr": 0.00038676096273257995, "tps": 61172, "wall": 4957.0} {"step": 4627, "train_loss": 3.648104667663574, "lr": 0.00038675375036523635, "tps": 61088, "wall": 4964.9} {"step": 4628, "train_loss": 3.794428825378418, "lr": 0.0003867465361088973, "tps": 61007, "wall": 4972.6} {"step": 4629, "train_loss": 3.7142889499664307, "lr": 0.0003867393199636444, "tps": 60924, "wall": 4980.4} {"step": 4630, "train_loss": 3.729398250579834, "lr": 0.0003867321019295594, "tps": 60842, "wall": 4988.2} {"step": 4631, "train_loss": 3.7701096534729004, "lr": 0.00038672488200672424, "tps": 60759, "wall": 4996.1} {"step": 4632, "train_loss": 3.7056989669799805, "lr": 0.00038671766019522056, "tps": 60679, "wall": 5003.8} {"step": 4633, "train_loss": 3.6680054664611816, "lr": 0.0003867104364951302, "tps": 60597, "wall": 5011.7} {"step": 4634, "train_loss": 3.671036958694458, "lr": 0.00038670321090653503, "tps": 60517, "wall": 5019.4} {"step": 4635, "train_loss": 3.6909258365631104, "lr": 0.00038669598342951685, "tps": 60435, "wall": 5027.3} {"step": 4636, "train_loss": 3.778730869293213, "lr": 0.0003866887540641575, "tps": 60355, "wall": 5035.0} {"step": 4637, "train_loss": 3.7093687057495117, "lr": 0.000386681522810539, "tps": 60274, "wall": 5042.9} {"step": 4638, "train_loss": 3.719783067703247, "lr": 0.0003866742896687432, "tps": 60196, "wall": 5050.5} {"step": 4639, "train_loss": 3.650693893432617, "lr": 0.00038666705463885197, "tps": 60117, "wall": 5058.2} {"step": 4640, "train_loss": 3.844923973083496, "lr": 0.00038665981772094735, "tps": 60035, "wall": 5066.2} {"step": 4641, "train_loss": 3.616694450378418, "lr": 0.00038665257891511135, "tps": 59957, "wall": 5073.9} {"step": 4642, "train_loss": 3.5669307708740234, "lr": 0.0003866453382214259, "tps": 59877, "wall": 5081.7} {"step": 4643, "train_loss": 3.696925640106201, "lr": 0.0003866380956399729, "tps": 59799, "wall": 5089.5} {"step": 4644, "train_loss": 3.738846778869629, "lr": 0.00038663085117083477, "tps": 59721, "wall": 5097.3} {"step": 4645, "train_loss": 3.700253486633301, "lr": 0.00038662360481409323, "tps": 59643, "wall": 5105.0} {"step": 4646, "train_loss": 3.71771240234375, "lr": 0.0003866163565698304, "tps": 59564, "wall": 5112.9} {"step": 4647, "train_loss": 3.656790256500244, "lr": 0.0003866091064381286, "tps": 59487, "wall": 5120.6} {"step": 4648, "train_loss": 3.7706081867218018, "lr": 0.00038660185441906976, "tps": 59408, "wall": 5128.5} {"step": 4649, "train_loss": 3.725864887237549, "lr": 0.0003865946005127361, "tps": 59331, "wall": 5136.3} {"step": 4650, "train_loss": 3.6172049045562744, "lr": 0.0003865873447192098, "tps": 59253, "wall": 5144.2} {"step": 4651, "train_loss": 3.7513527870178223, "lr": 0.00038658008703857305, "tps": 59176, "wall": 5152.0} {"step": 4652, "train_loss": 3.7078166007995605, "lr": 0.0003865728274709081, "tps": 59099, "wall": 5159.7} {"step": 4653, "train_loss": 3.74572491645813, "lr": 0.00038656556601629716, "tps": 59024, "wall": 5167.4} {"step": 4654, "train_loss": 3.784355640411377, "lr": 0.0003865583026748224, "tps": 58949, "wall": 5175.1} {"step": 4655, "train_loss": 3.766429901123047, "lr": 0.0003865510374465662, "tps": 58873, "wall": 5182.9} {"step": 4656, "train_loss": 3.757887363433838, "lr": 0.0003865437703316109, "tps": 58796, "wall": 5190.8} {"step": 4657, "train_loss": 3.749032497406006, "lr": 0.0003865365013300386, "tps": 58723, "wall": 5198.4} {"step": 4658, "train_loss": 3.661874771118164, "lr": 0.00038652923044193196, "tps": 58646, "wall": 5206.3} {"step": 4659, "train_loss": 3.6998684406280518, "lr": 0.00038652195766737316, "tps": 58572, "wall": 5214.0} {"step": 4660, "train_loss": 3.614462375640869, "lr": 0.00038651468300644455, "tps": 58497, "wall": 5221.8} {"step": 4661, "train_loss": 3.653785228729248, "lr": 0.00038650740645922865, "tps": 58425, "wall": 5229.4} {"step": 4662, "train_loss": 3.6816399097442627, "lr": 0.00038650012802580785, "tps": 58351, "wall": 5237.1} {"step": 4663, "train_loss": 3.662285327911377, "lr": 0.00038649284770626456, "tps": 58277, "wall": 5244.9} {"step": 4664, "train_loss": 3.7096927165985107, "lr": 0.0003864855655006813, "tps": 58203, "wall": 5252.7} {"step": 4665, "train_loss": 3.6912622451782227, "lr": 0.00038647828140914056, "tps": 58131, "wall": 5260.4} {"step": 4666, "train_loss": 3.655883312225342, "lr": 0.0003864709954317249, "tps": 58057, "wall": 5268.1} {"step": 4667, "train_loss": 3.7424511909484863, "lr": 0.00038646370756851667, "tps": 57984, "wall": 5275.9} {"step": 4668, "train_loss": 3.799088478088379, "lr": 0.0003864564178195986, "tps": 57912, "wall": 5283.6} {"step": 4669, "train_loss": 3.6750059127807617, "lr": 0.00038644912618505326, "tps": 57841, "wall": 5291.3} {"step": 4670, "train_loss": 3.6579623222351074, "lr": 0.0003864418326649632, "tps": 57769, "wall": 5299.0} {"step": 4671, "train_loss": 3.730553150177002, "lr": 0.00038643453725941107, "tps": 57696, "wall": 5306.8} {"step": 4672, "train_loss": 3.6671502590179443, "lr": 0.0003864272399684795, "tps": 57625, "wall": 5314.5} {"step": 4673, "train_loss": 3.6580617427825928, "lr": 0.00038641994079225106, "tps": 57552, "wall": 5322.4} {"step": 4674, "train_loss": 3.7362797260284424, "lr": 0.0003864126397308086, "tps": 57481, "wall": 5330.0} {"step": 4675, "train_loss": 3.682988166809082, "lr": 0.00038640533678423476, "tps": 57410, "wall": 5337.8} {"step": 4676, "train_loss": 3.691586971282959, "lr": 0.0003863980319526123, "tps": 57340, "wall": 5345.4} {"step": 4677, "train_loss": 3.6445255279541016, "lr": 0.00038639072523602387, "tps": 57270, "wall": 5353.1} {"step": 4678, "train_loss": 3.680771827697754, "lr": 0.0003863834166345523, "tps": 57199, "wall": 5360.9} {"step": 4679, "train_loss": 3.7611846923828125, "lr": 0.0003863761061482804, "tps": 57128, "wall": 5368.7} {"step": 4680, "train_loss": 3.728705406188965, "lr": 0.000386368793777291, "tps": 57059, "wall": 5376.4} {"step": 4681, "train_loss": 3.8150851726531982, "lr": 0.0003863614795216669, "tps": 56988, "wall": 5384.3} {"step": 4682, "train_loss": 3.753227949142456, "lr": 0.0003863541633814909, "tps": 56918, "wall": 5392.0} {"step": 4683, "train_loss": 3.6355700492858887, "lr": 0.000386346845356846, "tps": 56850, "wall": 5399.7} {"step": 4684, "train_loss": 3.6057679653167725, "lr": 0.000386339525447815, "tps": 56780, "wall": 5407.4} {"step": 4685, "train_loss": 3.698610305786133, "lr": 0.0003863322036544809, "tps": 56711, "wall": 5415.2} {"step": 4686, "train_loss": 3.745274305343628, "lr": 0.00038632487997692657, "tps": 56640, "wall": 5423.1} {"step": 4687, "train_loss": 3.7950406074523926, "lr": 0.00038631755441523503, "tps": 56570, "wall": 5430.9} {"step": 4688, "train_loss": 3.730637550354004, "lr": 0.00038631022696948916, "tps": 56501, "wall": 5438.7} {"step": 4689, "train_loss": 3.63193941116333, "lr": 0.00038630289763977207, "tps": 56432, "wall": 5446.6} {"step": 4690, "train_loss": 3.723392963409424, "lr": 0.00038629556642616675, "tps": 56364, "wall": 5454.3} {"step": 4691, "train_loss": 3.609515905380249, "lr": 0.0003862882333287563, "tps": 56296, "wall": 5462.0} {"step": 4692, "train_loss": 3.7498996257781982, "lr": 0.00038628089834762374, "tps": 56230, "wall": 5469.6} {"step": 4693, "train_loss": 3.6850898265838623, "lr": 0.00038627356148285215, "tps": 56162, "wall": 5477.4} {"step": 4694, "train_loss": 3.7104334831237793, "lr": 0.00038626622273452464, "tps": 56094, "wall": 5485.3} {"step": 4695, "train_loss": 3.69781494140625, "lr": 0.0003862588821027244, "tps": 56026, "wall": 5493.0} {"step": 4696, "train_loss": 3.777663469314575, "lr": 0.0003862515395875346, "tps": 55960, "wall": 5500.8} {"step": 4697, "train_loss": 3.647017240524292, "lr": 0.00038624419518903827, "tps": 55892, "wall": 5508.6} {"step": 4698, "train_loss": 3.6301016807556152, "lr": 0.00038623684890731877, "tps": 55825, "wall": 5516.3} {"step": 4699, "train_loss": 3.7418105602264404, "lr": 0.0003862295007424592, "tps": 55758, "wall": 5524.2} {"step": 4700, "train_loss": 3.728372573852539, "lr": 0.00038622215069454287, "tps": 55691, "wall": 5532.0} {"step": 4701, "train_loss": 3.729532480239868, "lr": 0.00038621479876365305, "tps": 55625, "wall": 5539.8} {"step": 4702, "train_loss": 3.7171146869659424, "lr": 0.0003862074449498729, "tps": 55557, "wall": 5547.7} {"step": 4703, "train_loss": 3.7494864463806152, "lr": 0.0003862000892532859, "tps": 55492, "wall": 5555.3} {"step": 4704, "train_loss": 3.65736985206604, "lr": 0.00038619273167397536, "tps": 55425, "wall": 5563.3} {"step": 4705, "train_loss": 3.6839399337768555, "lr": 0.0003861853722120245, "tps": 55360, "wall": 5571.0} {"step": 4706, "train_loss": 3.7964258193969727, "lr": 0.0003861780108675167, "tps": 55294, "wall": 5578.8} {"step": 4707, "train_loss": 3.6542468070983887, "lr": 0.0003861706476405355, "tps": 55228, "wall": 5586.7} {"step": 4708, "train_loss": 3.743203639984131, "lr": 0.0003861632825311642, "tps": 55164, "wall": 5594.4} {"step": 4709, "train_loss": 3.5880846977233887, "lr": 0.0003861559155394862, "tps": 55098, "wall": 5602.2} {"step": 4710, "train_loss": 3.7443697452545166, "lr": 0.000386148546665585, "tps": 55033, "wall": 5610.0} {"step": 4711, "train_loss": 3.7144947052001953, "lr": 0.0003861411759095441, "tps": 54968, "wall": 5617.9} {"step": 4712, "train_loss": 3.7444944381713867, "lr": 0.00038613380327144696, "tps": 54902, "wall": 5625.9} {"step": 4713, "train_loss": 3.6350347995758057, "lr": 0.0003861264287513771, "tps": 54837, "wall": 5633.6} {"step": 4714, "train_loss": 3.688565254211426, "lr": 0.000386119052349418, "tps": 54774, "wall": 5641.3} {"step": 4715, "train_loss": 3.799856185913086, "lr": 0.00038611167406565346, "tps": 54710, "wall": 5649.2} {"step": 4716, "train_loss": 3.7655482292175293, "lr": 0.0003861042939001668, "tps": 54647, "wall": 5656.9} {"step": 4717, "train_loss": 3.649493932723999, "lr": 0.0003860969118530417, "tps": 54583, "wall": 5664.7} {"step": 4718, "train_loss": 3.7359185218811035, "lr": 0.0003860895279243618, "tps": 54521, "wall": 5672.3} {"step": 4719, "train_loss": 3.6262259483337402, "lr": 0.00038608214211421075, "tps": 54458, "wall": 5680.2} {"step": 4720, "train_loss": 3.7077338695526123, "lr": 0.00038607475442267215, "tps": 54394, "wall": 5687.9} {"step": 4721, "train_loss": 3.76212215423584, "lr": 0.00038606736484982985, "tps": 54332, "wall": 5695.7} {"step": 4722, "train_loss": 3.725363254547119, "lr": 0.00038605997339576743, "tps": 54269, "wall": 5703.5} {"step": 4723, "train_loss": 3.6670165061950684, "lr": 0.00038605258006056865, "tps": 54208, "wall": 5711.1} {"step": 4724, "train_loss": 3.7275242805480957, "lr": 0.00038604518484431716, "tps": 54146, "wall": 5718.9} {"step": 4725, "train_loss": 3.684122323989868, "lr": 0.000386037787747097, "tps": 54083, "wall": 5726.8} {"step": 4726, "train_loss": 3.7638349533081055, "lr": 0.00038603038876899165, "tps": 54022, "wall": 5734.4} {"step": 4727, "train_loss": 3.7302443981170654, "lr": 0.00038602298791008514, "tps": 53961, "wall": 5742.1} {"step": 4728, "train_loss": 3.680393934249878, "lr": 0.00038601558517046126, "tps": 53900, "wall": 5749.8} {"step": 4729, "train_loss": 3.716834306716919, "lr": 0.00038600818055020377, "tps": 53839, "wall": 5757.6} {"step": 4730, "train_loss": 3.7076919078826904, "lr": 0.00038600077404939674, "tps": 53777, "wall": 5765.4} {"step": 4731, "train_loss": 3.623967170715332, "lr": 0.0003859933656681239, "tps": 53717, "wall": 5773.1} {"step": 4732, "train_loss": 3.718038320541382, "lr": 0.00038598595540646926, "tps": 53657, "wall": 5780.8} {"step": 4733, "train_loss": 3.641768455505371, "lr": 0.0003859785432645167, "tps": 53596, "wall": 5788.6} {"step": 4734, "train_loss": 3.702488422393799, "lr": 0.00038597112924235026, "tps": 53536, "wall": 5796.3} {"step": 4735, "train_loss": 3.710236072540283, "lr": 0.0003859637133400539, "tps": 53474, "wall": 5804.2} {"step": 4736, "train_loss": 3.7695093154907227, "lr": 0.0003859562955577115, "tps": 53415, "wall": 5811.8} {"step": 4737, "train_loss": 3.6962194442749023, "lr": 0.0003859488758954073, "tps": 53356, "wall": 5819.6} {"step": 4738, "train_loss": 3.650503158569336, "lr": 0.0003859414543532253, "tps": 53297, "wall": 5827.2} {"step": 4739, "train_loss": 3.7245357036590576, "lr": 0.0003859340309312495, "tps": 53238, "wall": 5834.9} {"step": 4740, "train_loss": 3.7512168884277344, "lr": 0.000385926605629564, "tps": 53178, "wall": 5842.7} {"step": 4741, "train_loss": 3.5775094032287598, "lr": 0.0003859191784482529, "tps": 53119, "wall": 5850.4} {"step": 4742, "train_loss": 3.682567596435547, "lr": 0.00038591174938740034, "tps": 53061, "wall": 5858.1} {"step": 4743, "train_loss": 3.7139925956726074, "lr": 0.0003859043184470906, "tps": 53000, "wall": 5866.0} {"step": 4744, "train_loss": 3.699319362640381, "lr": 0.0003858968856274078, "tps": 52941, "wall": 5873.8} {"step": 4745, "train_loss": 3.7953805923461914, "lr": 0.000385889450928436, "tps": 52883, "wall": 5881.5} {"step": 4746, "train_loss": 3.5896692276000977, "lr": 0.0003858820143502595, "tps": 52824, "wall": 5889.4} {"step": 4747, "train_loss": 3.7054083347320557, "lr": 0.0003858745758929627, "tps": 52766, "wall": 5897.0} {"step": 4748, "train_loss": 3.830291748046875, "lr": 0.0003858671355566297, "tps": 52707, "wall": 5904.9} {"step": 4749, "train_loss": 3.7013683319091797, "lr": 0.0003858596933413447, "tps": 52649, "wall": 5912.6} {"step": 4750, "train_loss": 3.684056282043457, "lr": 0.0003858522492471922, "tps": 52591, "wall": 5920.4} {"step": 4751, "train_loss": 3.729393243789673, "lr": 0.0003858448032742565, "tps": 52533, "wall": 5928.2} {"step": 4752, "train_loss": 3.640819787979126, "lr": 0.0003858373554226218, "tps": 52475, "wall": 5935.9} {"step": 4753, "train_loss": 3.6355481147766113, "lr": 0.00038582990569237263, "tps": 52418, "wall": 5943.7} {"step": 4754, "train_loss": 3.635979652404785, "lr": 0.0003858224540835933, "tps": 52362, "wall": 5951.3} {"step": 4755, "train_loss": 3.6007940769195557, "lr": 0.0003858150005963682, "tps": 52305, "wall": 5959.1} {"step": 4756, "train_loss": 3.823568344116211, "lr": 0.0003858075452307819, "tps": 52247, "wall": 5966.8} {"step": 4757, "train_loss": 3.680302619934082, "lr": 0.0003858000879869187, "tps": 52192, "wall": 5974.5} {"step": 4758, "train_loss": 3.6779234409332275, "lr": 0.00038579262886486316, "tps": 52134, "wall": 5982.3} {"step": 4759, "train_loss": 3.7336134910583496, "lr": 0.00038578516786469966, "tps": 52078, "wall": 5990.1} {"step": 4760, "train_loss": 3.6630544662475586, "lr": 0.0003857777049865129, "tps": 52022, "wall": 5997.8} {"step": 4761, "train_loss": 3.705615758895874, "lr": 0.0003857702402303873, "tps": 51965, "wall": 6005.6} {"step": 4762, "train_loss": 3.720158100128174, "lr": 0.0003857627735964074, "tps": 51910, "wall": 6013.2} {"step": 4763, "train_loss": 3.7284951210021973, "lr": 0.00038575530508465794, "tps": 51853, "wall": 6021.1} {"step": 4764, "train_loss": 3.563683271408081, "lr": 0.00038574783469522334, "tps": 51797, "wall": 6028.9} {"step": 4765, "train_loss": 3.672447919845581, "lr": 0.0003857403624281883, "tps": 51742, "wall": 6036.5} {"step": 4766, "train_loss": 3.7260968685150146, "lr": 0.0003857328882836375, "tps": 51687, "wall": 6044.2} {"step": 4767, "train_loss": 3.666264533996582, "lr": 0.00038572541226165554, "tps": 51632, "wall": 6051.9} {"step": 4768, "train_loss": 3.693422317504883, "lr": 0.0003857179343623272, "tps": 51577, "wall": 6059.6} {"step": 4769, "train_loss": 3.74263334274292, "lr": 0.0003857104545857371, "tps": 51522, "wall": 6067.4} {"step": 4770, "train_loss": 3.6475000381469727, "lr": 0.00038570297293197, "tps": 51467, "wall": 6075.1} {"step": 4771, "train_loss": 3.6721243858337402, "lr": 0.00038569548940111065, "tps": 51413, "wall": 6082.8} {"step": 4772, "train_loss": 3.7166223526000977, "lr": 0.00038568800399324386, "tps": 51358, "wall": 6090.6} {"step": 4773, "train_loss": 3.6716411113739014, "lr": 0.00038568051670845435, "tps": 51304, "wall": 6098.2} {"step": 4774, "train_loss": 3.639235258102417, "lr": 0.0003856730275468271, "tps": 51250, "wall": 6106.0} {"step": 4775, "train_loss": 3.7473583221435547, "lr": 0.0003856655365084467, "tps": 51196, "wall": 6113.7} {"step": 4776, "train_loss": 3.797199249267578, "lr": 0.00038565804359339825, "tps": 51142, "wall": 6121.5} {"step": 4777, "train_loss": 3.7375988960266113, "lr": 0.0003856505488017665, "tps": 51089, "wall": 6129.1} {"step": 4778, "train_loss": 3.7810959815979004, "lr": 0.0003856430521336363, "tps": 51034, "wall": 6137.0} {"step": 4779, "train_loss": 3.6347038745880127, "lr": 0.00038563555358909265, "tps": 50980, "wall": 6144.7} {"step": 4780, "train_loss": 3.5975918769836426, "lr": 0.00038562805316822053, "tps": 50927, "wall": 6152.4} {"step": 4781, "train_loss": 3.657193183898926, "lr": 0.00038562055087110485, "tps": 50874, "wall": 6160.1} {"step": 4782, "train_loss": 3.7156591415405273, "lr": 0.00038561304669783064, "tps": 50820, "wall": 6167.9} {"step": 4783, "train_loss": 3.606229066848755, "lr": 0.0003856055406484828, "tps": 50768, "wall": 6175.6} {"step": 4784, "train_loss": 3.7484593391418457, "lr": 0.0003855980327231465, "tps": 50714, "wall": 6183.4} {"step": 4785, "train_loss": 3.627588987350464, "lr": 0.0003855905229219067, "tps": 50662, "wall": 6191.1} {"step": 4786, "train_loss": 3.8561413288116455, "lr": 0.00038558301124484853, "tps": 50609, "wall": 6198.8} {"step": 4787, "train_loss": 3.6639771461486816, "lr": 0.00038557549769205703, "tps": 50556, "wall": 6206.6} {"step": 4788, "train_loss": 3.7677066326141357, "lr": 0.00038556798226361736, "tps": 50505, "wall": 6214.2} {"step": 4789, "train_loss": 3.709810256958008, "lr": 0.00038556046495961455, "tps": 50452, "wall": 6222.1} {"step": 4790, "train_loss": 3.70784068107605, "lr": 0.0003855529457801339, "tps": 50400, "wall": 6229.7} {"step": 4791, "train_loss": 3.7418816089630127, "lr": 0.0003855454247252605, "tps": 50349, "wall": 6237.4} {"step": 4792, "train_loss": 3.7259955406188965, "lr": 0.0003855379017950796, "tps": 50297, "wall": 6245.1} {"step": 4793, "train_loss": 3.6779372692108154, "lr": 0.0003855303769896764, "tps": 50246, "wall": 6252.8} {"step": 4794, "train_loss": 3.725877285003662, "lr": 0.0003855228503091361, "tps": 50195, "wall": 6260.4} {"step": 4795, "train_loss": 3.7452170848846436, "lr": 0.000385515321753544, "tps": 50143, "wall": 6268.2} {"step": 4796, "train_loss": 3.634427309036255, "lr": 0.00038550779132298543, "tps": 50093, "wall": 6275.8} {"step": 4797, "train_loss": 3.7944116592407227, "lr": 0.00038550025901754563, "tps": 50041, "wall": 6283.7} {"step": 4798, "train_loss": 3.6465654373168945, "lr": 0.0003854927248373099, "tps": 49991, "wall": 6291.2} {"step": 4799, "train_loss": 3.760282516479492, "lr": 0.00038548518878236363, "tps": 49940, "wall": 6299.0} {"step": 4800, "train_loss": 3.5903592109680176, "lr": 0.00038547765085279224, "tps": 49889, "wall": 6306.7} {"step": 4801, "train_loss": 3.732675075531006, "lr": 0.000385470111048681, "tps": 49839, "wall": 6314.4} {"step": 4802, "train_loss": 3.680654525756836, "lr": 0.00038546256937011544, "tps": 49788, "wall": 6322.2} {"step": 4803, "train_loss": 3.775066614151001, "lr": 0.00038545502581718096, "tps": 49736, "wall": 6330.0} {"step": 4804, "train_loss": 3.745706558227539, "lr": 0.00038544748038996297, "tps": 49687, "wall": 6337.6} {"step": 4805, "train_loss": 3.69085431098938, "lr": 0.0003854399330885469, "tps": 49636, "wall": 6345.4} {"step": 4806, "train_loss": 3.7386274337768555, "lr": 0.00038543238391301846, "tps": 49587, "wall": 6353.1} {"step": 4807, "train_loss": 3.6278605461120605, "lr": 0.0003854248328634629, "tps": 49537, "wall": 6360.8} {"step": 4808, "train_loss": 3.6654670238494873, "lr": 0.00038541727993996594, "tps": 49487, "wall": 6368.5} {"step": 4809, "train_loss": 3.703002691268921, "lr": 0.00038540972514261313, "tps": 49437, "wall": 6376.3} {"step": 4810, "train_loss": 3.7173500061035156, "lr": 0.00038540216847149, "tps": 49388, "wall": 6383.9} {"step": 4811, "train_loss": 3.6627509593963623, "lr": 0.000385394609926682, "tps": 49338, "wall": 6391.7} {"step": 4812, "train_loss": 3.622547149658203, "lr": 0.0003853870495082751, "tps": 49290, "wall": 6399.3} {"step": 4813, "train_loss": 3.56101655960083, "lr": 0.00038537948721635465, "tps": 49239, "wall": 6407.2} {"step": 4814, "train_loss": 3.660905599594116, "lr": 0.0003853719230510064, "tps": 49191, "wall": 6414.9} {"step": 4815, "train_loss": 3.7171294689178467, "lr": 0.00038536435701231616, "tps": 49141, "wall": 6422.7} {"step": 4816, "train_loss": 3.6643590927124023, "lr": 0.0003853567891003695, "tps": 49092, "wall": 6430.4} {"step": 4817, "train_loss": 3.7202532291412354, "lr": 0.00038534921931525216, "tps": 49044, "wall": 6438.1} {"step": 4818, "train_loss": 3.6843502521514893, "lr": 0.00038534164765705, "tps": 48994, "wall": 6446.0} {"step": 4819, "train_loss": 3.7459139823913574, "lr": 0.0003853340741258486, "tps": 48946, "wall": 6453.7} {"step": 4820, "train_loss": 3.693781614303589, "lr": 0.0003853264987217339, "tps": 48896, "wall": 6461.5} {"step": 4821, "train_loss": 3.729419231414795, "lr": 0.00038531892144479167, "tps": 48848, "wall": 6469.3} {"step": 4822, "train_loss": 3.758554458618164, "lr": 0.0003853113422951078, "tps": 48800, "wall": 6477.0} {"step": 4823, "train_loss": 3.7121520042419434, "lr": 0.00038530376127276806, "tps": 48751, "wall": 6484.8} {"step": 4824, "train_loss": 3.8336281776428223, "lr": 0.0003852961783778584, "tps": 48704, "wall": 6492.4} {"step": 4825, "train_loss": 3.7276854515075684, "lr": 0.00038528859361046467, "tps": 48656, "wall": 6500.2} {"step": 4826, "train_loss": 3.619785785675049, "lr": 0.00038528100697067286, "tps": 48608, "wall": 6508.0} {"step": 4827, "train_loss": 3.6153347492218018, "lr": 0.0003852734184585688, "tps": 48560, "wall": 6515.7} {"step": 4828, "train_loss": 3.720736265182495, "lr": 0.0003852658280742385, "tps": 48511, "wall": 6523.6} {"step": 4829, "train_loss": 3.8267412185668945, "lr": 0.000385258235817768, "tps": 48463, "wall": 6531.4} {"step": 4830, "train_loss": 3.75486159324646, "lr": 0.0003852506416892432, "tps": 48415, "wall": 6539.3} {"step": 4831, "train_loss": 3.7314963340759277, "lr": 0.00038524304568875027, "tps": 48368, "wall": 6547.1} {"step": 4832, "train_loss": 3.6336841583251953, "lr": 0.0003852354478163752, "tps": 48320, "wall": 6554.9} {"step": 4833, "train_loss": 3.6903622150421143, "lr": 0.0003852278480722039, "tps": 48272, "wall": 6562.7} {"step": 4834, "train_loss": 3.784402847290039, "lr": 0.0003852202464563227, "tps": 48225, "wall": 6570.5} {"step": 4835, "train_loss": 3.695143222808838, "lr": 0.00038521264296881763, "tps": 48178, "wall": 6578.2} {"step": 4836, "train_loss": 3.696653127670288, "lr": 0.0003852050376097748, "tps": 48131, "wall": 6586.1} {"step": 4837, "train_loss": 3.6638753414154053, "lr": 0.0003851974303792803, "tps": 48084, "wall": 6593.9} {"step": 4838, "train_loss": 3.6816649436950684, "lr": 0.0003851898212774204, "tps": 48036, "wall": 6601.8} {"step": 4839, "train_loss": 3.8489394187927246, "lr": 0.00038518221030428134, "tps": 47990, "wall": 6609.6} {"step": 4840, "train_loss": 3.7122879028320312, "lr": 0.00038517459745994914, "tps": 47943, "wall": 6617.3} {"step": 4841, "train_loss": 3.748680591583252, "lr": 0.00038516698274451027, "tps": 47896, "wall": 6625.2} {"step": 4842, "train_loss": 3.615919589996338, "lr": 0.0003851593661580508, "tps": 47849, "wall": 6633.0} {"step": 4843, "train_loss": 3.604661464691162, "lr": 0.00038515174770065717, "tps": 47802, "wall": 6640.9} {"step": 4844, "train_loss": 3.6742708683013916, "lr": 0.00038514412737241554, "tps": 47755, "wall": 6648.8} {"step": 4845, "train_loss": 3.622654914855957, "lr": 0.0003851365051734124, "tps": 47710, "wall": 6656.6} {"step": 4846, "train_loss": 3.644395112991333, "lr": 0.00038512888110373385, "tps": 47664, "wall": 6664.4} {"step": 4847, "train_loss": 3.7125582695007324, "lr": 0.0003851212551634665, "tps": 47619, "wall": 6672.0} {"step": 4848, "train_loss": 3.7255618572235107, "lr": 0.00038511362735269667, "tps": 47573, "wall": 6679.8} {"step": 4849, "train_loss": 3.6972737312316895, "lr": 0.0003851059976715107, "tps": 47526, "wall": 6687.8} {"step": 4850, "train_loss": 3.6912665367126465, "lr": 0.000385098366119995, "tps": 47480, "wall": 6695.6} {"step": 4851, "train_loss": 3.5988311767578125, "lr": 0.0003850907326982361, "tps": 47434, "wall": 6703.5} {"step": 4852, "train_loss": 3.6934173107147217, "lr": 0.0003850830974063205, "tps": 47389, "wall": 6711.4} {"step": 4853, "train_loss": 3.771167039871216, "lr": 0.0003850754602443346, "tps": 47344, "wall": 6719.1} {"step": 4854, "train_loss": 3.805467128753662, "lr": 0.00038506782121236493, "tps": 47298, "wall": 6726.9} {"step": 4855, "train_loss": 3.69738507270813, "lr": 0.0003850601803104981, "tps": 47255, "wall": 6734.6} {"step": 4856, "train_loss": 3.6983859539031982, "lr": 0.0003850525375388206, "tps": 47209, "wall": 6742.5} {"step": 4857, "train_loss": 3.785520076751709, "lr": 0.00038504489289741906, "tps": 47163, "wall": 6750.4} {"step": 4858, "train_loss": 3.7128705978393555, "lr": 0.00038503724638638, "tps": 47119, "wall": 6758.1} {"step": 4859, "train_loss": 3.7500548362731934, "lr": 0.0003850295980057901, "tps": 47073, "wall": 6766.1} {"step": 4860, "train_loss": 3.7357239723205566, "lr": 0.000385021947755736, "tps": 47029, "wall": 6773.9} {"step": 4861, "train_loss": 3.664450168609619, "lr": 0.0003850142956363043, "tps": 46985, "wall": 6781.6} {"step": 4862, "train_loss": 3.635549306869507, "lr": 0.0003850066416475818, "tps": 46941, "wall": 6789.4} {"step": 4863, "train_loss": 3.6970982551574707, "lr": 0.0003849989857896551, "tps": 46896, "wall": 6797.2} {"step": 4864, "train_loss": 3.725486993789673, "lr": 0.00038499132806261093, "tps": 46851, "wall": 6805.2} {"step": 4865, "train_loss": 3.6712393760681152, "lr": 0.0003849836684665362, "tps": 46807, "wall": 6812.9} {"step": 4866, "train_loss": 3.8079299926757812, "lr": 0.0003849760070015174, "tps": 46763, "wall": 6820.7} {"step": 4867, "train_loss": 3.627457618713379, "lr": 0.00038496834366764156, "tps": 46719, "wall": 6828.6} {"step": 4868, "train_loss": 3.7330241203308105, "lr": 0.0003849606784649954, "tps": 46675, "wall": 6836.4} {"step": 4869, "train_loss": 3.7008378505706787, "lr": 0.0003849530113936656, "tps": 46632, "wall": 6844.2} {"step": 4870, "train_loss": 3.672581434249878, "lr": 0.0003849453424537393, "tps": 46589, "wall": 6851.9} {"step": 4871, "train_loss": 3.6800973415374756, "lr": 0.0003849376716453032, "tps": 46546, "wall": 6859.7} {"step": 4872, "train_loss": 3.6934165954589844, "lr": 0.00038492999896844426, "tps": 46501, "wall": 6867.6} {"step": 4873, "train_loss": 3.6666808128356934, "lr": 0.00038492232442324933, "tps": 46457, "wall": 6875.5} {"step": 4874, "train_loss": 3.763577938079834, "lr": 0.0003849146480098054, "tps": 46413, "wall": 6883.5} {"step": 4875, "train_loss": 3.65529727935791, "lr": 0.0003849069697281994, "tps": 46370, "wall": 6891.4} {"step": 4876, "train_loss": 3.7291979789733887, "lr": 0.0003848992895785184, "tps": 46327, "wall": 6899.2} {"step": 4877, "train_loss": 3.666862964630127, "lr": 0.0003848916075608493, "tps": 46284, "wall": 6907.0} {"step": 4878, "train_loss": 3.7054872512817383, "lr": 0.0003848839236752791, "tps": 46242, "wall": 6914.7} {"step": 4879, "train_loss": 3.6145925521850586, "lr": 0.0003848762379218949, "tps": 46198, "wall": 6922.6} {"step": 4880, "train_loss": 3.6246917247772217, "lr": 0.00038486855030078385, "tps": 46155, "wall": 6930.5} {"step": 4881, "train_loss": 3.687915325164795, "lr": 0.0003848608608120328, "tps": 46113, "wall": 6938.3} {"step": 4882, "train_loss": 3.604038715362549, "lr": 0.0003848531694557291, "tps": 46070, "wall": 6946.2} {"step": 4883, "train_loss": 3.766785144805908, "lr": 0.0003848454762319597, "tps": 46028, "wall": 6954.0} {"step": 4884, "train_loss": 3.7252416610717773, "lr": 0.00038483778114081193, "tps": 45986, "wall": 6961.7} {"step": 4885, "train_loss": 3.729215145111084, "lr": 0.00038483008418237273, "tps": 45943, "wall": 6969.6} {"step": 4886, "train_loss": 3.669107437133789, "lr": 0.00038482238535672954, "tps": 45901, "wall": 6977.4} {"step": 4887, "train_loss": 3.6998159885406494, "lr": 0.0003848146846639694, "tps": 45858, "wall": 6985.4} {"step": 4888, "train_loss": 3.618520736694336, "lr": 0.00038480698210417957, "tps": 45817, "wall": 6993.1} {"step": 4889, "train_loss": 3.6090927124023438, "lr": 0.0003847992776774474, "tps": 45774, "wall": 7001.0} {"step": 4890, "train_loss": 3.6736931800842285, "lr": 0.00038479157138386004, "tps": 45734, "wall": 7008.7} {"step": 4891, "train_loss": 3.8783040046691895, "lr": 0.00038478386322350486, "tps": 45692, "wall": 7016.6} {"step": 4892, "train_loss": 3.624476909637451, "lr": 0.00038477615319646916, "tps": 45651, "wall": 7024.2} {"step": 4893, "train_loss": 3.637388229370117, "lr": 0.0003847684413028403, "tps": 45610, "wall": 7031.9} {"step": 4894, "train_loss": 3.7275593280792236, "lr": 0.0003847607275427056, "tps": 45569, "wall": 7039.8} {"step": 4895, "train_loss": 3.6307523250579834, "lr": 0.00038475301191615247, "tps": 45527, "wall": 7047.7} {"step": 4896, "train_loss": 3.787675380706787, "lr": 0.00038474529442326835, "tps": 45487, "wall": 7055.4} {"step": 4897, "train_loss": 3.797549247741699, "lr": 0.0003847375750641406, "tps": 45444, "wall": 7063.4} {"step": 4898, "train_loss": 3.686189651489258, "lr": 0.0003847298538388566, "tps": 45404, "wall": 7071.1} {"step": 4899, "train_loss": 3.688969135284424, "lr": 0.000384722130747504, "tps": 45363, "wall": 7079.0} {"step": 4900, "train_loss": 3.6931023597717285, "lr": 0.00038471440579017016, "tps": 45323, "wall": 7086.7} {"step": 4901, "train_loss": 3.684563398361206, "lr": 0.00038470667896694263, "tps": 45282, "wall": 7094.5} {"step": 4902, "train_loss": 3.749886989593506, "lr": 0.00038469895027790893, "tps": 45241, "wall": 7102.4} {"step": 4903, "train_loss": 3.7426562309265137, "lr": 0.0003846912197231566, "tps": 45201, "wall": 7110.2} {"step": 4904, "train_loss": 3.7407898902893066, "lr": 0.00038468348730277325, "tps": 45160, "wall": 7118.0} {"step": 4905, "train_loss": 3.7108774185180664, "lr": 0.0003846757530168464, "tps": 45120, "wall": 7125.8} {"step": 4906, "train_loss": 3.66745924949646, "lr": 0.0003846680168654638, "tps": 45080, "wall": 7133.5} {"step": 4907, "train_loss": 3.636695384979248, "lr": 0.00038466027884871294, "tps": 45041, "wall": 7141.3} {"step": 4908, "train_loss": 3.663886547088623, "lr": 0.0003846525389666815, "tps": 45001, "wall": 7149.0} {"step": 4909, "train_loss": 3.677015781402588, "lr": 0.0003846447972194572, "tps": 44961, "wall": 7156.9} {"step": 4910, "train_loss": 3.6747961044311523, "lr": 0.00038463705360712775, "tps": 44921, "wall": 7164.7} {"step": 4911, "train_loss": 3.653123378753662, "lr": 0.00038462930812978085, "tps": 44881, "wall": 7172.5} {"step": 4912, "train_loss": 3.653810977935791, "lr": 0.00038462156078750425, "tps": 44842, "wall": 7180.2} {"step": 4913, "train_loss": 3.7333273887634277, "lr": 0.0003846138115803857, "tps": 44802, "wall": 7188.1} {"step": 4914, "train_loss": 3.7208142280578613, "lr": 0.000384606060508513, "tps": 44762, "wall": 7196.0} {"step": 4915, "train_loss": 3.6702029705047607, "lr": 0.0003845983075719739, "tps": 44722, "wall": 7203.8} {"step": 4916, "train_loss": 3.6847991943359375, "lr": 0.0003845905527708563, "tps": 44683, "wall": 7211.7} {"step": 4917, "train_loss": 3.7071828842163086, "lr": 0.00038458279610524803, "tps": 44644, "wall": 7219.4} {"step": 4918, "train_loss": 3.743062973022461, "lr": 0.0003845750375752369, "tps": 44604, "wall": 7227.4} {"step": 4919, "train_loss": 3.619966983795166, "lr": 0.0003845672771809108, "tps": 44564, "wall": 7235.2} {"step": 4920, "train_loss": 3.663395404815674, "lr": 0.00038455951492235777, "tps": 44525, "wall": 7243.2} {"step": 4921, "train_loss": 3.6458184719085693, "lr": 0.00038455175079966567, "tps": 44486, "wall": 7251.0} {"step": 4922, "train_loss": 3.65750789642334, "lr": 0.0003845439848129224, "tps": 44447, "wall": 7258.8} {"step": 4923, "train_loss": 3.631101131439209, "lr": 0.00038453621696221587, "tps": 44408, "wall": 7266.6} {"step": 4924, "train_loss": 3.7306923866271973, "lr": 0.0003845284472476343, "tps": 44370, "wall": 7274.4} {"step": 4925, "train_loss": 3.7559633255004883, "lr": 0.00038452067566926556, "tps": 44330, "wall": 7282.3} {"step": 4926, "train_loss": 3.6781136989593506, "lr": 0.0003845129022271976, "tps": 44291, "wall": 7290.2} {"step": 4927, "train_loss": 3.7692155838012695, "lr": 0.0003845051269215187, "tps": 44253, "wall": 7297.9} {"step": 4928, "train_loss": 3.5839579105377197, "lr": 0.0003844973497523168, "tps": 44214, "wall": 7305.8} {"step": 4929, "train_loss": 3.6899802684783936, "lr": 0.00038448957071968, "tps": 44176, "wall": 7313.7} {"step": 4930, "train_loss": 3.677961826324463, "lr": 0.0003844817898236965, "tps": 44138, "wall": 7321.5} {"step": 4931, "train_loss": 3.6630969047546387, "lr": 0.00038447400706445427, "tps": 44099, "wall": 7329.4} {"step": 4932, "train_loss": 3.681159496307373, "lr": 0.00038446622244204165, "tps": 44061, "wall": 7337.2} {"step": 4933, "train_loss": 3.693300724029541, "lr": 0.0003844584359565468, "tps": 44023, "wall": 7345.1} {"step": 4934, "train_loss": 3.6661417484283447, "lr": 0.0003844506476080579, "tps": 43985, "wall": 7352.9} {"step": 4935, "train_loss": 3.608255386352539, "lr": 0.0003844428573966631, "tps": 43947, "wall": 7360.8} {"step": 4936, "train_loss": 3.7447142601013184, "lr": 0.0003844350653224508, "tps": 43908, "wall": 7368.7} {"step": 4937, "train_loss": 3.753587245941162, "lr": 0.0003844272713855091, "tps": 43870, "wall": 7376.6} {"step": 4938, "train_loss": 3.599719285964966, "lr": 0.00038441947558592643, "tps": 43832, "wall": 7384.5} {"step": 4939, "train_loss": 3.8404693603515625, "lr": 0.000384411677923791, "tps": 43795, "wall": 7392.3} {"step": 4940, "train_loss": 3.710096597671509, "lr": 0.00038440387839919123, "tps": 43757, "wall": 7400.3} {"step": 4941, "train_loss": 3.6256532669067383, "lr": 0.0003843960770122154, "tps": 43719, "wall": 7408.1} {"step": 4942, "train_loss": 3.6691460609436035, "lr": 0.0003843882737629519, "tps": 43682, "wall": 7415.9} {"step": 4943, "train_loss": 3.650299310684204, "lr": 0.00038438046865148923, "tps": 43644, "wall": 7423.8} {"step": 4944, "train_loss": 3.7092175483703613, "lr": 0.0003843726616779156, "tps": 43607, "wall": 7431.6} {"step": 4945, "train_loss": 3.735966920852661, "lr": 0.00038436485284231965, "tps": 43570, "wall": 7439.5} {"step": 4946, "train_loss": 3.7360734939575195, "lr": 0.0003843570421447897, "tps": 43533, "wall": 7447.3} {"step": 4947, "train_loss": 3.634901523590088, "lr": 0.00038434922958541435, "tps": 43496, "wall": 7455.1} {"step": 4948, "train_loss": 3.842900514602661, "lr": 0.000384341415164282, "tps": 43459, "wall": 7463.0} {"step": 4949, "train_loss": 3.7068324089050293, "lr": 0.00038433359888148124, "tps": 43422, "wall": 7470.8} {"step": 4950, "train_loss": 3.6761229038238525, "lr": 0.00038432578073710054, "tps": 43386, "wall": 7478.6} {"step": 4951, "train_loss": 3.733193874359131, "lr": 0.00038431796073122847, "tps": 43350, "wall": 7486.4} {"step": 4952, "train_loss": 3.6294045448303223, "lr": 0.0003843101388639537, "tps": 43313, "wall": 7494.3} {"step": 4953, "train_loss": 3.681396722793579, "lr": 0.0003843023151353648, "tps": 43276, "wall": 7502.0} {"step": 4954, "train_loss": 3.7166733741760254, "lr": 0.00038429448954555045, "tps": 43241, "wall": 7509.8} {"step": 4955, "train_loss": 3.6323416233062744, "lr": 0.0003842866620945991, "tps": 43204, "wall": 7517.7} {"step": 4956, "train_loss": 3.577866554260254, "lr": 0.0003842788327825996, "tps": 43167, "wall": 7525.6} {"step": 4957, "train_loss": 3.614238739013672, "lr": 0.0003842710016096406, "tps": 43131, "wall": 7533.4} {"step": 4958, "train_loss": 3.755011796951294, "lr": 0.00038426316857581084, "tps": 43093, "wall": 7541.5} {"step": 4959, "train_loss": 3.5913968086242676, "lr": 0.00038425533368119895, "tps": 43058, "wall": 7549.3} {"step": 4960, "train_loss": 3.6336865425109863, "lr": 0.00038424749692589377, "tps": 43022, "wall": 7557.1} {"step": 4961, "train_loss": 3.5736727714538574, "lr": 0.0003842396583099842, "tps": 42986, "wall": 7565.0} {"step": 4962, "train_loss": 3.603888750076294, "lr": 0.0003842318178335587, "tps": 42950, "wall": 7572.8} {"step": 4963, "train_loss": 3.6662280559539795, "lr": 0.0003842239754967064, "tps": 42914, "wall": 7580.6} {"step": 4964, "train_loss": 3.614208221435547, "lr": 0.00038421613129951596, "tps": 42878, "wall": 7588.5} {"step": 4965, "train_loss": 3.677483558654785, "lr": 0.00038420828524207636, "tps": 42843, "wall": 7596.2} {"step": 4966, "train_loss": 3.72212553024292, "lr": 0.00038420043732447634, "tps": 42807, "wall": 7604.3} {"step": 4967, "train_loss": 3.664964199066162, "lr": 0.00038419258754680493, "tps": 42772, "wall": 7611.9} {"step": 4968, "train_loss": 3.6636598110198975, "lr": 0.000384184735909151, "tps": 42736, "wall": 7619.9} {"step": 4969, "train_loss": 3.699437379837036, "lr": 0.00038417688241160355, "tps": 42701, "wall": 7627.6} {"step": 4970, "train_loss": 3.6250035762786865, "lr": 0.00038416902705425143, "tps": 42666, "wall": 7635.5} {"step": 4971, "train_loss": 3.7279438972473145, "lr": 0.0003841611698371837, "tps": 42630, "wall": 7643.4} {"step": 4972, "train_loss": 3.5907492637634277, "lr": 0.00038415331076048937, "tps": 42595, "wall": 7651.3} {"step": 4973, "train_loss": 3.708785057067871, "lr": 0.0003841454498242574, "tps": 42560, "wall": 7659.1} {"step": 4974, "train_loss": 3.66874361038208, "lr": 0.000384137587028577, "tps": 42525, "wall": 7667.0} {"step": 4975, "train_loss": 3.6670875549316406, "lr": 0.0003841297223735371, "tps": 42490, "wall": 7674.7} {"step": 4976, "train_loss": 3.6514482498168945, "lr": 0.00038412185585922677, "tps": 42455, "wall": 7682.6} {"step": 4977, "train_loss": 3.72731351852417, "lr": 0.0003841139874857352, "tps": 42421, "wall": 7690.4} {"step": 4978, "train_loss": 3.6077563762664795, "lr": 0.0003841061172531516, "tps": 42386, "wall": 7698.3} {"step": 4979, "train_loss": 3.6910481452941895, "lr": 0.0003840982451615649, "tps": 42351, "wall": 7706.2} {"step": 4980, "train_loss": 3.644716501235962, "lr": 0.0003840903712110644, "tps": 42317, "wall": 7714.0} {"step": 4981, "train_loss": 3.704507350921631, "lr": 0.0003840824954017394, "tps": 42282, "wall": 7721.9} {"step": 4982, "train_loss": 3.591508388519287, "lr": 0.0003840746177336789, "tps": 42248, "wall": 7729.6} {"step": 4983, "train_loss": 3.669525146484375, "lr": 0.0003840667382069723, "tps": 42214, "wall": 7737.4} {"step": 4984, "train_loss": 3.69504451751709, "lr": 0.00038405885682170885, "tps": 42180, "wall": 7745.3} {"step": 4985, "train_loss": 3.692202091217041, "lr": 0.00038405097357797777, "tps": 42146, "wall": 7753.0} {"step": 4986, "train_loss": 3.582650899887085, "lr": 0.0003840430884758684, "tps": 42112, "wall": 7760.8} {"step": 4987, "train_loss": 3.564199447631836, "lr": 0.00038403520151547, "tps": 42077, "wall": 7768.8} {"step": 4988, "train_loss": 3.670703172683716, "lr": 0.000384027312696872, "tps": 42043, "wall": 7776.6} {"step": 4989, "train_loss": 3.7432761192321777, "lr": 0.00038401942202016375, "tps": 42009, "wall": 7784.6} {"step": 4990, "train_loss": 3.655498504638672, "lr": 0.0003840115294854346, "tps": 41975, "wall": 7792.4} {"step": 4991, "train_loss": 3.673490524291992, "lr": 0.0003840036350927739, "tps": 41941, "wall": 7800.3} {"step": 4992, "train_loss": 3.7205710411071777, "lr": 0.00038399573884227126, "tps": 41907, "wall": 7808.1} {"step": 4993, "train_loss": 3.6850688457489014, "lr": 0.00038398784073401596, "tps": 41874, "wall": 7815.9} {"step": 4994, "train_loss": 3.684891939163208, "lr": 0.0003839799407680975, "tps": 41841, "wall": 7823.6} {"step": 4995, "train_loss": 3.660020589828491, "lr": 0.00038397203894460546, "tps": 41807, "wall": 7831.6} {"step": 4996, "train_loss": 3.6457245349884033, "lr": 0.0003839641352636293, "tps": 41774, "wall": 7839.3} {"step": 4997, "train_loss": 3.6720848083496094, "lr": 0.0003839562297252585, "tps": 41740, "wall": 7847.3} {"step": 4998, "train_loss": 3.580430030822754, "lr": 0.0003839483223295826, "tps": 41707, "wall": 7855.0} {"step": 4999, "train_loss": 3.6008644104003906, "lr": 0.00038394041307669133, "tps": 41673, "wall": 7862.9} {"step": 5000, "train_loss": 3.6535093784332275, "lr": 0.0003839325019666742, "tps": 41641, "wall": 7870.6, "val_loss_monitor": 3.7811833840919737, "val_loss_full": 3.796828411974315} {"step": 5001, "train_loss": 3.6265721321105957, "lr": 0.0003839245889996208, "tps": 40717, "wall": 8050.8} {"step": 5002, "train_loss": 3.716299533843994, "lr": 0.0003839166741756208, "tps": 40684, "wall": 8059.1} {"step": 5003, "train_loss": 3.6751723289489746, "lr": 0.00038390875749476377, "tps": 40650, "wall": 8067.4} {"step": 5004, "train_loss": 3.6706695556640625, "lr": 0.00038390083895713955, "tps": 40616, "wall": 8075.7} {"step": 5005, "train_loss": 3.5187668800354004, "lr": 0.0003838929185628377, "tps": 40582, "wall": 8084.1} {"step": 5006, "train_loss": 3.6540369987487793, "lr": 0.000383884996311948, "tps": 40550, "wall": 8092.2} {"step": 5007, "train_loss": 3.710749626159668, "lr": 0.0003838770722045603, "tps": 40517, "wall": 8100.2} {"step": 5008, "train_loss": 3.815861225128174, "lr": 0.00038386914624076413, "tps": 40485, "wall": 8108.3} {"step": 5009, "train_loss": 3.6411190032958984, "lr": 0.0003838612184206495, "tps": 40453, "wall": 8116.3} {"step": 5010, "train_loss": 3.666351795196533, "lr": 0.00038385328874430605, "tps": 40421, "wall": 8124.4} {"step": 5011, "train_loss": 3.778414249420166, "lr": 0.0003838453572118237, "tps": 40389, "wall": 8132.5} {"step": 5012, "train_loss": 3.6622238159179688, "lr": 0.0003838374238232923, "tps": 40357, "wall": 8140.5} {"step": 5013, "train_loss": 3.6282639503479004, "lr": 0.00038382948857880174, "tps": 40325, "wall": 8148.6} {"step": 5014, "train_loss": 3.6821906566619873, "lr": 0.0003838215514784418, "tps": 40294, "wall": 8156.6} {"step": 5015, "train_loss": 3.7584362030029297, "lr": 0.00038381361252230257, "tps": 40263, "wall": 8164.5} {"step": 5016, "train_loss": 3.690145969390869, "lr": 0.00038380567171047373, "tps": 40232, "wall": 8172.4} {"step": 5017, "train_loss": 3.702259063720703, "lr": 0.0003837977290430455, "tps": 40200, "wall": 8180.4} {"step": 5018, "train_loss": 3.6452860832214355, "lr": 0.0003837897845201076, "tps": 40169, "wall": 8188.5} {"step": 5019, "train_loss": 3.6550180912017822, "lr": 0.00038378183814175026, "tps": 40138, "wall": 8196.5} {"step": 5020, "train_loss": 3.7038066387176514, "lr": 0.00038377388990806343, "tps": 40107, "wall": 8204.4} {"step": 5021, "train_loss": 3.7213611602783203, "lr": 0.00038376593981913706, "tps": 40077, "wall": 8212.2} {"step": 5022, "train_loss": 3.7612414360046387, "lr": 0.00038375798787506125, "tps": 40047, "wall": 8220.0} {"step": 5023, "train_loss": 3.608187198638916, "lr": 0.00038375003407592614, "tps": 40016, "wall": 8228.0} {"step": 5024, "train_loss": 3.815046787261963, "lr": 0.00038374207842182173, "tps": 39985, "wall": 8235.9} {"step": 5025, "train_loss": 3.5379812717437744, "lr": 0.00038373412091283817, "tps": 39954, "wall": 8243.9} {"step": 5026, "train_loss": 3.6955859661102295, "lr": 0.00038372616154906566, "tps": 39924, "wall": 8251.7} {"step": 5027, "train_loss": 3.673609733581543, "lr": 0.0003837182003305944, "tps": 39895, "wall": 8259.5} {"step": 5028, "train_loss": 3.6644561290740967, "lr": 0.00038371023725751447, "tps": 39864, "wall": 8267.5} {"step": 5029, "train_loss": 3.7037835121154785, "lr": 0.0003837022723299161, "tps": 39835, "wall": 8275.3} {"step": 5030, "train_loss": 3.785292625427246, "lr": 0.0003836943055478896, "tps": 39805, "wall": 8283.1} {"step": 5031, "train_loss": 3.6747117042541504, "lr": 0.0003836863369115251, "tps": 39775, "wall": 8290.9} {"step": 5032, "train_loss": 3.6639721393585205, "lr": 0.00038367836642091285, "tps": 39746, "wall": 8298.7} {"step": 5033, "train_loss": 3.7435362339019775, "lr": 0.0003836703940761433, "tps": 39716, "wall": 8306.5} {"step": 5034, "train_loss": 3.633490562438965, "lr": 0.00038366241987730664, "tps": 39688, "wall": 8314.2} {"step": 5035, "train_loss": 3.70361065864563, "lr": 0.0003836544438244933, "tps": 39658, "wall": 8322.0} {"step": 5036, "train_loss": 3.73233699798584, "lr": 0.00038364646591779346, "tps": 39629, "wall": 8329.8} {"step": 5037, "train_loss": 3.719320774078369, "lr": 0.00038363848615729763, "tps": 39600, "wall": 8337.5} {"step": 5038, "train_loss": 3.742025375366211, "lr": 0.0003836305045430962, "tps": 39571, "wall": 8345.2} {"step": 5039, "train_loss": 3.6829323768615723, "lr": 0.00038362252107527957, "tps": 39543, "wall": 8352.9} {"step": 5040, "train_loss": 3.6278297901153564, "lr": 0.0003836145357539382, "tps": 39514, "wall": 8360.7} {"step": 5041, "train_loss": 3.651021957397461, "lr": 0.00038360654857916244, "tps": 39485, "wall": 8368.5} {"step": 5042, "train_loss": 3.599189519882202, "lr": 0.0003835985595510429, "tps": 39456, "wall": 8376.2} {"step": 5043, "train_loss": 3.7096056938171387, "lr": 0.00038359056866967, "tps": 39427, "wall": 8384.1} {"step": 5044, "train_loss": 3.623137950897217, "lr": 0.00038358257593513426, "tps": 39398, "wall": 8391.9} {"step": 5045, "train_loss": 3.632903575897217, "lr": 0.0003835745813475263, "tps": 39370, "wall": 8399.6} {"step": 5046, "train_loss": 3.5384535789489746, "lr": 0.00038356658490693664, "tps": 39341, "wall": 8407.5} {"step": 5047, "train_loss": 3.701991558074951, "lr": 0.0003835585866134558, "tps": 39312, "wall": 8415.2} {"step": 5048, "train_loss": 3.6428122520446777, "lr": 0.0003835505864671745, "tps": 39284, "wall": 8423.0} {"step": 5049, "train_loss": 3.6727981567382812, "lr": 0.00038354258446818333, "tps": 39255, "wall": 8430.8} {"step": 5050, "train_loss": 3.663576602935791, "lr": 0.0003835345806165728, "tps": 39227, "wall": 8438.5} {"step": 5051, "train_loss": 3.686591148376465, "lr": 0.0003835265749124338, "tps": 39198, "wall": 8446.4} {"step": 5052, "train_loss": 3.6518478393554688, "lr": 0.00038351856735585686, "tps": 39170, "wall": 8454.2} {"step": 5053, "train_loss": 3.7280962467193604, "lr": 0.0003835105579469328, "tps": 39141, "wall": 8462.0} {"step": 5054, "train_loss": 3.7561798095703125, "lr": 0.0003835025466857523, "tps": 39113, "wall": 8469.8} {"step": 5055, "train_loss": 3.6199684143066406, "lr": 0.000383494533572406, "tps": 39085, "wall": 8477.6} {"step": 5056, "train_loss": 3.7250566482543945, "lr": 0.0003834865186069849, "tps": 39057, "wall": 8485.4} {"step": 5057, "train_loss": 3.6741323471069336, "lr": 0.0003834785017895796, "tps": 39029, "wall": 8493.1} {"step": 5058, "train_loss": 3.7083959579467773, "lr": 0.000383470483120281, "tps": 39001, "wall": 8500.9} {"step": 5059, "train_loss": 3.6777517795562744, "lr": 0.00038346246259917993, "tps": 38973, "wall": 8508.8} {"step": 5060, "train_loss": 3.6521177291870117, "lr": 0.0003834544402263672, "tps": 38944, "wall": 8516.6} {"step": 5061, "train_loss": 3.5767135620117188, "lr": 0.00038344641600193376, "tps": 38916, "wall": 8524.5} {"step": 5062, "train_loss": 3.6835756301879883, "lr": 0.0003834383899259705, "tps": 38888, "wall": 8532.3} {"step": 5063, "train_loss": 3.560814142227173, "lr": 0.00038343036199856825, "tps": 38861, "wall": 8540.0} {"step": 5064, "train_loss": 3.62968111038208, "lr": 0.0003834223322198181, "tps": 38832, "wall": 8548.0} {"step": 5065, "train_loss": 3.668095111846924, "lr": 0.0003834143005898109, "tps": 38805, "wall": 8555.7} {"step": 5066, "train_loss": 3.643695116043091, "lr": 0.00038340626710863765, "tps": 38776, "wall": 8563.7} {"step": 5067, "train_loss": 3.616807460784912, "lr": 0.00038339823177638944, "tps": 38749, "wall": 8571.3} {"step": 5068, "train_loss": 3.754974365234375, "lr": 0.0003833901945931571, "tps": 38721, "wall": 8579.2} {"step": 5069, "train_loss": 3.6610074043273926, "lr": 0.00038338215555903184, "tps": 38694, "wall": 8586.9} {"step": 5070, "train_loss": 3.6326417922973633, "lr": 0.00038337411467410476, "tps": 38667, "wall": 8594.7} {"step": 5071, "train_loss": 3.653641700744629, "lr": 0.00038336607193846674, "tps": 38639, "wall": 8602.5} {"step": 5072, "train_loss": 3.629042625427246, "lr": 0.00038335802735220913, "tps": 38612, "wall": 8610.3} {"step": 5073, "train_loss": 3.6129307746887207, "lr": 0.0003833499809154229, "tps": 38585, "wall": 8618.1} {"step": 5074, "train_loss": 3.648468494415283, "lr": 0.00038334193262819927, "tps": 38557, "wall": 8625.9} {"step": 5075, "train_loss": 3.6617681980133057, "lr": 0.0003833338824906293, "tps": 38530, "wall": 8633.8} {"step": 5076, "train_loss": 3.6441640853881836, "lr": 0.0003833258305028044, "tps": 38503, "wall": 8641.5} {"step": 5077, "train_loss": 3.699920892715454, "lr": 0.00038331777666481557, "tps": 38476, "wall": 8649.3} {"step": 5078, "train_loss": 3.670595645904541, "lr": 0.0003833097209767542, "tps": 38448, "wall": 8657.2} {"step": 5079, "train_loss": 3.6578822135925293, "lr": 0.0003833016634387114, "tps": 38421, "wall": 8665.1} {"step": 5080, "train_loss": 3.5808701515197754, "lr": 0.00038329360405077857, "tps": 38394, "wall": 8672.8} {"step": 5081, "train_loss": 3.593242883682251, "lr": 0.0003832855428130469, "tps": 38367, "wall": 8680.6} {"step": 5082, "train_loss": 3.5194308757781982, "lr": 0.0003832774797256079, "tps": 38340, "wall": 8688.4} {"step": 5083, "train_loss": 3.6922197341918945, "lr": 0.00038326941478855273, "tps": 38313, "wall": 8696.3} {"step": 5084, "train_loss": 3.6729087829589844, "lr": 0.0003832613480019727, "tps": 38287, "wall": 8704.0} {"step": 5085, "train_loss": 3.6654715538024902, "lr": 0.00038325327936595936, "tps": 38260, "wall": 8711.8} {"step": 5086, "train_loss": 3.6888575553894043, "lr": 0.000383245208880604, "tps": 38233, "wall": 8719.6} {"step": 5087, "train_loss": 3.7421135902404785, "lr": 0.0003832371365459981, "tps": 38206, "wall": 8727.5} {"step": 5088, "train_loss": 3.6306331157684326, "lr": 0.0003832290623622331, "tps": 38180, "wall": 8735.2} {"step": 5089, "train_loss": 3.679778575897217, "lr": 0.00038322098632940046, "tps": 38153, "wall": 8743.1} {"step": 5090, "train_loss": 3.793349266052246, "lr": 0.0003832129084475917, "tps": 38127, "wall": 8750.8} {"step": 5091, "train_loss": 3.644835948944092, "lr": 0.0003832048287168982, "tps": 38100, "wall": 8758.6} {"step": 5092, "train_loss": 3.7359423637390137, "lr": 0.00038319674713741154, "tps": 38074, "wall": 8766.4} {"step": 5093, "train_loss": 3.634963035583496, "lr": 0.0003831886637092234, "tps": 38048, "wall": 8774.2} {"step": 5094, "train_loss": 3.6952292919158936, "lr": 0.0003831805784324252, "tps": 38021, "wall": 8782.0} {"step": 5095, "train_loss": 3.6851766109466553, "lr": 0.0003831724913071086, "tps": 37994, "wall": 8789.9} {"step": 5096, "train_loss": 3.6500039100646973, "lr": 0.0003831644023333652, "tps": 37969, "wall": 8797.6} {"step": 5097, "train_loss": 3.6590657234191895, "lr": 0.00038315631151128655, "tps": 37942, "wall": 8805.6} {"step": 5098, "train_loss": 3.7547078132629395, "lr": 0.0003831482188409645, "tps": 37916, "wall": 8813.3} {"step": 5099, "train_loss": 3.6433544158935547, "lr": 0.0003831401243224905, "tps": 37890, "wall": 8821.1} {"step": 5100, "train_loss": 3.7041828632354736, "lr": 0.00038313202795595635, "tps": 37864, "wall": 8828.9} {"step": 5101, "train_loss": 3.6411936283111572, "lr": 0.00038312392974145377, "tps": 37837, "wall": 8836.7} {"step": 5102, "train_loss": 3.485339641571045, "lr": 0.00038311582967907453, "tps": 37811, "wall": 8844.6} {"step": 5103, "train_loss": 3.614041566848755, "lr": 0.0003831077277689103, "tps": 37786, "wall": 8852.4} {"step": 5104, "train_loss": 3.646813154220581, "lr": 0.000383099624011053, "tps": 37760, "wall": 8860.1} {"step": 5105, "train_loss": 3.675834894180298, "lr": 0.00038309151840559423, "tps": 37734, "wall": 8867.9} {"step": 5106, "train_loss": 3.5873026847839355, "lr": 0.0003830834109526259, "tps": 37708, "wall": 8875.7} {"step": 5107, "train_loss": 3.6338436603546143, "lr": 0.00038307530165223994, "tps": 37682, "wall": 8883.6} {"step": 5108, "train_loss": 3.5357718467712402, "lr": 0.0003830671905045281, "tps": 37657, "wall": 8891.3} {"step": 5109, "train_loss": 3.5543527603149414, "lr": 0.0003830590775095823, "tps": 37631, "wall": 8899.1} {"step": 5110, "train_loss": 3.6208462715148926, "lr": 0.0003830509626674945, "tps": 37605, "wall": 8907.1} {"step": 5111, "train_loss": 3.6664938926696777, "lr": 0.0003830428459783566, "tps": 37580, "wall": 8914.8} {"step": 5112, "train_loss": 3.5994157791137695, "lr": 0.00038303472744226043, "tps": 37554, "wall": 8922.7} {"step": 5113, "train_loss": 3.590020179748535, "lr": 0.00038302660705929814, "tps": 37528, "wall": 8930.5} {"step": 5114, "train_loss": 3.618887424468994, "lr": 0.00038301848482956153, "tps": 37503, "wall": 8938.3} {"step": 5115, "train_loss": 3.7002663612365723, "lr": 0.0003830103607531428, "tps": 37478, "wall": 8946.1} {"step": 5116, "train_loss": 3.7403035163879395, "lr": 0.00038300223483013376, "tps": 37452, "wall": 8953.9} {"step": 5117, "train_loss": 3.7025575637817383, "lr": 0.00038299410706062664, "tps": 37427, "wall": 8961.6} {"step": 5118, "train_loss": 3.639881134033203, "lr": 0.0003829859774447135, "tps": 37401, "wall": 8969.6} {"step": 5119, "train_loss": 3.594878673553467, "lr": 0.0003829778459824864, "tps": 37376, "wall": 8977.3} {"step": 5120, "train_loss": 3.613961696624756, "lr": 0.0003829697126740374, "tps": 37351, "wall": 8985.2} {"step": 5121, "train_loss": 3.7352263927459717, "lr": 0.00038296157751945866, "tps": 37326, "wall": 8993.0} {"step": 5122, "train_loss": 3.682422637939453, "lr": 0.0003829534405188424, "tps": 37301, "wall": 9000.9} {"step": 5123, "train_loss": 3.772404670715332, "lr": 0.00038294530167228073, "tps": 37276, "wall": 9008.6} {"step": 5124, "train_loss": 3.703373432159424, "lr": 0.0003829371609798658, "tps": 37251, "wall": 9016.4} {"step": 5125, "train_loss": 3.7767274379730225, "lr": 0.00038292901844169, "tps": 37226, "wall": 9024.3} {"step": 5126, "train_loss": 3.735534191131592, "lr": 0.00038292087405784544, "tps": 37200, "wall": 9032.2} {"step": 5127, "train_loss": 3.714817523956299, "lr": 0.0003829127278284244, "tps": 37175, "wall": 9039.9} {"step": 5128, "train_loss": 3.679321765899658, "lr": 0.0003829045797535191, "tps": 37150, "wall": 9047.8} {"step": 5129, "train_loss": 3.5887656211853027, "lr": 0.000382896429833222, "tps": 37126, "wall": 9055.6} {"step": 5130, "train_loss": 3.643430233001709, "lr": 0.0003828882780676253, "tps": 37101, "wall": 9063.4} {"step": 5131, "train_loss": 3.6045081615448, "lr": 0.0003828801244568213, "tps": 37077, "wall": 9071.0} {"step": 5132, "train_loss": 3.833157539367676, "lr": 0.0003828719690009026, "tps": 37052, "wall": 9078.9} {"step": 5133, "train_loss": 3.671330213546753, "lr": 0.0003828638116999613, "tps": 37027, "wall": 9086.7} {"step": 5134, "train_loss": 3.6810386180877686, "lr": 0.00038285565255408995, "tps": 37003, "wall": 9094.5} {"step": 5135, "train_loss": 3.796201705932617, "lr": 0.000382847491563381, "tps": 36978, "wall": 9102.5} {"step": 5136, "train_loss": 3.670487403869629, "lr": 0.00038283932872792677, "tps": 36953, "wall": 9110.3} {"step": 5137, "train_loss": 3.674989700317383, "lr": 0.0003828311640478199, "tps": 36929, "wall": 9118.1} {"step": 5138, "train_loss": 3.6723790168762207, "lr": 0.0003828229975231528, "tps": 36904, "wall": 9126.0} {"step": 5139, "train_loss": 3.5586533546447754, "lr": 0.0003828148291540179, "tps": 36879, "wall": 9133.9} {"step": 5140, "train_loss": 3.6319024562835693, "lr": 0.00038280665894050786, "tps": 36855, "wall": 9141.6} {"step": 5141, "train_loss": 3.636608600616455, "lr": 0.00038279848688271514, "tps": 36830, "wall": 9149.6} {"step": 5142, "train_loss": 3.676220655441284, "lr": 0.0003827903129807324, "tps": 36806, "wall": 9157.4} {"step": 5143, "train_loss": 3.6079986095428467, "lr": 0.00038278213723465216, "tps": 36781, "wall": 9165.3} {"step": 5144, "train_loss": 3.674039602279663, "lr": 0.00038277395964456703, "tps": 36757, "wall": 9173.1} {"step": 5145, "train_loss": 3.7327513694763184, "lr": 0.00038276578021056973, "tps": 36733, "wall": 9180.9} {"step": 5146, "train_loss": 3.6599338054656982, "lr": 0.00038275759893275296, "tps": 36709, "wall": 9188.7} {"step": 5147, "train_loss": 3.6762914657592773, "lr": 0.00038274941581120913, "tps": 36685, "wall": 9196.4} {"step": 5148, "train_loss": 3.6440625190734863, "lr": 0.0003827412308460312, "tps": 36661, "wall": 9204.3} {"step": 5149, "train_loss": 3.736295223236084, "lr": 0.0003827330440373118, "tps": 36637, "wall": 9212.2} {"step": 5150, "train_loss": 3.5912492275238037, "lr": 0.00038272485538514366, "tps": 36614, "wall": 9219.8} {"step": 5151, "train_loss": 3.629605293273926, "lr": 0.0003827166648896195, "tps": 36589, "wall": 9227.8} {"step": 5152, "train_loss": 3.6480495929718018, "lr": 0.00038270847255083223, "tps": 36566, "wall": 9235.4} {"step": 5153, "train_loss": 3.67720365524292, "lr": 0.0003827002783688746, "tps": 36542, "wall": 9243.4} {"step": 5154, "train_loss": 3.671234607696533, "lr": 0.00038269208234383934, "tps": 36518, "wall": 9251.0} {"step": 5155, "train_loss": 3.687065839767456, "lr": 0.00038268388447581944, "tps": 36495, "wall": 9258.8} {"step": 5156, "train_loss": 3.6740429401397705, "lr": 0.00038267568476490766, "tps": 36471, "wall": 9266.7} {"step": 5157, "train_loss": 3.710099697113037, "lr": 0.0003826674832111969, "tps": 36447, "wall": 9274.5} {"step": 5158, "train_loss": 3.649907350540161, "lr": 0.00038265927981478016, "tps": 36424, "wall": 9282.2} {"step": 5159, "train_loss": 3.562100410461426, "lr": 0.00038265107457575027, "tps": 36401, "wall": 9290.0} {"step": 5160, "train_loss": 3.711589813232422, "lr": 0.0003826428674942001, "tps": 36378, "wall": 9297.7} {"step": 5161, "train_loss": 3.6043615341186523, "lr": 0.00038263465857022285, "tps": 36354, "wall": 9305.6} {"step": 5162, "train_loss": 3.7352354526519775, "lr": 0.0003826264478039114, "tps": 36331, "wall": 9313.2} {"step": 5163, "train_loss": 3.6356382369995117, "lr": 0.0003826182351953587, "tps": 36308, "wall": 9321.0} {"step": 5164, "train_loss": 3.6524949073791504, "lr": 0.0003826100207446578, "tps": 36284, "wall": 9328.9} {"step": 5165, "train_loss": 3.6439552307128906, "lr": 0.00038260180445190184, "tps": 36261, "wall": 9336.7} {"step": 5166, "train_loss": 3.5776185989379883, "lr": 0.00038259358631718385, "tps": 36237, "wall": 9344.6} {"step": 5167, "train_loss": 3.6318507194519043, "lr": 0.0003825853663405969, "tps": 36214, "wall": 9352.3} {"step": 5168, "train_loss": 3.554426431655884, "lr": 0.0003825771445222341, "tps": 36191, "wall": 9360.1} {"step": 5169, "train_loss": 3.6459784507751465, "lr": 0.0003825689208621887, "tps": 36168, "wall": 9367.8} {"step": 5170, "train_loss": 3.548469305038452, "lr": 0.0003825606953605537, "tps": 36145, "wall": 9375.5} {"step": 5171, "train_loss": 3.6789965629577637, "lr": 0.0003825524680174224, "tps": 36122, "wall": 9383.4} {"step": 5172, "train_loss": 3.598906993865967, "lr": 0.00038254423883288784, "tps": 36099, "wall": 9391.2} {"step": 5173, "train_loss": 3.7183609008789062, "lr": 0.0003825360078070434, "tps": 36076, "wall": 9398.9} {"step": 5174, "train_loss": 3.7171409130096436, "lr": 0.00038252777493998227, "tps": 36053, "wall": 9406.9} {"step": 5175, "train_loss": 3.6291749477386475, "lr": 0.0003825195402317977, "tps": 36030, "wall": 9414.6} {"step": 5176, "train_loss": 3.62894868850708, "lr": 0.0003825113036825831, "tps": 36008, "wall": 9422.2} {"step": 5177, "train_loss": 3.616001844406128, "lr": 0.0003825030652924316, "tps": 35985, "wall": 9429.9} {"step": 5178, "train_loss": 3.6514101028442383, "lr": 0.0003824948250614365, "tps": 35963, "wall": 9437.7} {"step": 5179, "train_loss": 3.610917091369629, "lr": 0.0003824865829896913, "tps": 35939, "wall": 9445.7} {"step": 5180, "train_loss": 3.557832956314087, "lr": 0.0003824783390772893, "tps": 35917, "wall": 9453.3} {"step": 5181, "train_loss": 3.668325901031494, "lr": 0.0003824700933243239, "tps": 35894, "wall": 9461.2} {"step": 5182, "train_loss": 3.592268943786621, "lr": 0.00038246184573088843, "tps": 35872, "wall": 9469.0} {"step": 5183, "train_loss": 3.6517748832702637, "lr": 0.0003824535962970765, "tps": 35849, "wall": 9476.8} {"step": 5184, "train_loss": 3.554941177368164, "lr": 0.0003824453450229813, "tps": 35826, "wall": 9484.6} {"step": 5185, "train_loss": 3.568695545196533, "lr": 0.0003824370919086965, "tps": 35804, "wall": 9492.3} {"step": 5186, "train_loss": 3.7246956825256348, "lr": 0.00038242883695431556, "tps": 35782, "wall": 9500.1} {"step": 5187, "train_loss": 3.630518913269043, "lr": 0.0003824205801599319, "tps": 35759, "wall": 9508.0} {"step": 5188, "train_loss": 3.5142879486083984, "lr": 0.00038241232152563917, "tps": 35737, "wall": 9515.7} {"step": 5189, "train_loss": 3.789238929748535, "lr": 0.0003824040610515309, "tps": 35714, "wall": 9523.6} {"step": 5190, "train_loss": 3.720458507537842, "lr": 0.0003823957987377006, "tps": 35692, "wall": 9531.3} {"step": 5191, "train_loss": 3.604940414428711, "lr": 0.00038238753458424193, "tps": 35670, "wall": 9539.1} {"step": 5192, "train_loss": 3.5898654460906982, "lr": 0.00038237926859124844, "tps": 35647, "wall": 9546.9} {"step": 5193, "train_loss": 3.6021242141723633, "lr": 0.00038237100075881386, "tps": 35626, "wall": 9554.6} {"step": 5194, "train_loss": 3.681065559387207, "lr": 0.0003823627310870318, "tps": 35604, "wall": 9562.4} {"step": 5195, "train_loss": 3.642810344696045, "lr": 0.0003823544595759959, "tps": 35581, "wall": 9570.2} {"step": 5196, "train_loss": 3.6908798217773438, "lr": 0.00038234618622579996, "tps": 35559, "wall": 9578.0} {"step": 5197, "train_loss": 3.7242438793182373, "lr": 0.0003823379110365376, "tps": 35537, "wall": 9585.8} {"step": 5198, "train_loss": 3.597292423248291, "lr": 0.0003823296340083026, "tps": 35515, "wall": 9593.6} {"step": 5199, "train_loss": 3.773406505584717, "lr": 0.00038232135514118873, "tps": 35493, "wall": 9601.4} {"step": 5200, "train_loss": 3.7101902961730957, "lr": 0.00038231307443528976, "tps": 35471, "wall": 9609.3} {"step": 5201, "train_loss": 3.761551856994629, "lr": 0.0003823047918906995, "tps": 35449, "wall": 9617.0} {"step": 5202, "train_loss": 3.6161229610443115, "lr": 0.0003822965075075118, "tps": 35427, "wall": 9624.9} {"step": 5203, "train_loss": 3.6785409450531006, "lr": 0.00038228822128582045, "tps": 35405, "wall": 9632.7} {"step": 5204, "train_loss": 3.6993274688720703, "lr": 0.0003822799332257194, "tps": 35383, "wall": 9640.5} {"step": 5205, "train_loss": 3.712097644805908, "lr": 0.0003822716433273024, "tps": 35361, "wall": 9648.4} {"step": 5206, "train_loss": 3.6658709049224854, "lr": 0.0003822633515906635, "tps": 35339, "wall": 9656.1} {"step": 5207, "train_loss": 3.6402158737182617, "lr": 0.0003822550580158966, "tps": 35318, "wall": 9663.9} {"step": 5208, "train_loss": 3.711775302886963, "lr": 0.00038224676260309557, "tps": 35296, "wall": 9671.7} {"step": 5209, "train_loss": 3.611516237258911, "lr": 0.00038223846535235444, "tps": 35275, "wall": 9679.4} {"step": 5210, "train_loss": 3.5879783630371094, "lr": 0.00038223016626376724, "tps": 35253, "wall": 9687.3} {"step": 5211, "train_loss": 3.645395278930664, "lr": 0.000382221865337428, "tps": 35231, "wall": 9695.0} {"step": 5212, "train_loss": 3.6193008422851562, "lr": 0.00038221356257343056, "tps": 35210, "wall": 9702.9} {"step": 5213, "train_loss": 3.6610794067382812, "lr": 0.00038220525797186917, "tps": 35188, "wall": 9710.6} {"step": 5214, "train_loss": 3.694345235824585, "lr": 0.00038219695153283783, "tps": 35167, "wall": 9718.3} {"step": 5215, "train_loss": 3.6379001140594482, "lr": 0.00038218864325643065, "tps": 35146, "wall": 9726.1} {"step": 5216, "train_loss": 3.6371328830718994, "lr": 0.0003821803331427418, "tps": 35124, "wall": 9733.9} {"step": 5217, "train_loss": 3.677734851837158, "lr": 0.0003821720211918652, "tps": 35103, "wall": 9741.6} {"step": 5218, "train_loss": 3.7164578437805176, "lr": 0.0003821637074038953, "tps": 35082, "wall": 9749.5} {"step": 5219, "train_loss": 3.600066661834717, "lr": 0.00038215539177892616, "tps": 35060, "wall": 9757.3} {"step": 5220, "train_loss": 3.625575304031372, "lr": 0.00038214707431705197, "tps": 35039, "wall": 9765.2} {"step": 5221, "train_loss": 3.652523994445801, "lr": 0.0003821387550183669, "tps": 35018, "wall": 9772.9} {"step": 5222, "train_loss": 3.6244444847106934, "lr": 0.0003821304338829653, "tps": 34997, "wall": 9780.6} {"step": 5223, "train_loss": 3.706936836242676, "lr": 0.00038212211091094133, "tps": 34975, "wall": 9788.4} {"step": 5224, "train_loss": 3.6778340339660645, "lr": 0.0003821137861023893, "tps": 34955, "wall": 9796.2} {"step": 5225, "train_loss": 3.6933674812316895, "lr": 0.00038210545945740353, "tps": 34934, "wall": 9803.9} {"step": 5226, "train_loss": 3.677981376647949, "lr": 0.0003820971309760784, "tps": 34913, "wall": 9811.6} {"step": 5227, "train_loss": 3.652006149291992, "lr": 0.0003820888006585082, "tps": 34892, "wall": 9819.5} {"step": 5228, "train_loss": 3.867964267730713, "lr": 0.0003820804685047873, "tps": 34870, "wall": 9827.3} {"step": 5229, "train_loss": 3.611886501312256, "lr": 0.00038207213451501, "tps": 34849, "wall": 9835.2} {"step": 5230, "train_loss": 3.671786308288574, "lr": 0.00038206379868927084, "tps": 34828, "wall": 9843.0} {"step": 5231, "train_loss": 3.599062919616699, "lr": 0.0003820554610276642, "tps": 34808, "wall": 9850.7} {"step": 5232, "train_loss": 3.6396594047546387, "lr": 0.00038204712153028453, "tps": 34787, "wall": 9858.5} {"step": 5233, "train_loss": 3.5370397567749023, "lr": 0.0003820387801972263, "tps": 34766, "wall": 9866.3} {"step": 5234, "train_loss": 3.658181667327881, "lr": 0.000382030437028584, "tps": 34745, "wall": 9874.0} {"step": 5235, "train_loss": 3.648810386657715, "lr": 0.00038202209202445217, "tps": 34724, "wall": 9881.9} {"step": 5236, "train_loss": 3.6775643825531006, "lr": 0.00038201374518492527, "tps": 34703, "wall": 9889.7} {"step": 5237, "train_loss": 3.692155122756958, "lr": 0.00038200539651009796, "tps": 34683, "wall": 9897.6} {"step": 5238, "train_loss": 3.739135265350342, "lr": 0.00038199704600006473, "tps": 34662, "wall": 9905.3} {"step": 5239, "train_loss": 3.58243989944458, "lr": 0.00038198869365492017, "tps": 34641, "wall": 9913.1} {"step": 5240, "train_loss": 3.65038800239563, "lr": 0.000381980339474759, "tps": 34621, "wall": 9920.8} {"step": 5241, "train_loss": 3.637338876724243, "lr": 0.00038197198345967567, "tps": 34600, "wall": 9928.8} {"step": 5242, "train_loss": 3.6639978885650635, "lr": 0.00038196362560976503, "tps": 34580, "wall": 9936.5} {"step": 5243, "train_loss": 3.6677136421203613, "lr": 0.0003819552659251216, "tps": 34559, "wall": 9944.4} {"step": 5244, "train_loss": 3.6884875297546387, "lr": 0.0003819469044058403, "tps": 34538, "wall": 9952.2} {"step": 5245, "train_loss": 3.647615432739258, "lr": 0.0003819385410520156, "tps": 34518, "wall": 9959.8} {"step": 5246, "train_loss": 3.789626121520996, "lr": 0.0003819301758637423, "tps": 34498, "wall": 9967.6} {"step": 5247, "train_loss": 3.79341983795166, "lr": 0.0003819218088411153, "tps": 34478, "wall": 9975.4} {"step": 5248, "train_loss": 3.76643443107605, "lr": 0.0003819134399842293, "tps": 34457, "wall": 9983.2} {"step": 5249, "train_loss": 3.7128305435180664, "lr": 0.00038190506929317903, "tps": 34437, "wall": 9991.0} {"step": 5250, "train_loss": 3.619741678237915, "lr": 0.0003818966967680594, "tps": 34417, "wall": 9998.6} {"step": 5251, "train_loss": 3.7210025787353516, "lr": 0.0003818883224089652, "tps": 34397, "wall": 10006.5} {"step": 5252, "train_loss": 3.7043614387512207, "lr": 0.00038187994621599136, "tps": 34376, "wall": 10014.3} {"step": 5253, "train_loss": 3.6703786849975586, "lr": 0.00038187156818923274, "tps": 34356, "wall": 10022.1} {"step": 5254, "train_loss": 3.6235408782958984, "lr": 0.00038186318832878423, "tps": 34336, "wall": 10029.8} {"step": 5255, "train_loss": 3.6528267860412598, "lr": 0.0003818548066347407, "tps": 34316, "wall": 10037.6} {"step": 5256, "train_loss": 3.6196582317352295, "lr": 0.00038184642310719726, "tps": 34296, "wall": 10045.4} {"step": 5257, "train_loss": 3.6384689807891846, "lr": 0.00038183803774624874, "tps": 34277, "wall": 10053.0} {"step": 5258, "train_loss": 3.5729968547821045, "lr": 0.0003818296505519902, "tps": 34257, "wall": 10060.8} {"step": 5259, "train_loss": 3.73046612739563, "lr": 0.00038182126152451663, "tps": 34236, "wall": 10068.7} {"step": 5260, "train_loss": 3.632859706878662, "lr": 0.000381812870663923, "tps": 34217, "wall": 10076.4} {"step": 5261, "train_loss": 3.6704859733581543, "lr": 0.00038180447797030447, "tps": 34197, "wall": 10084.1} {"step": 5262, "train_loss": 3.6962735652923584, "lr": 0.000381796083443756, "tps": 34177, "wall": 10091.9} {"step": 5263, "train_loss": 3.5978598594665527, "lr": 0.0003817876870843728, "tps": 34158, "wall": 10099.5} {"step": 5264, "train_loss": 3.6178081035614014, "lr": 0.00038177928889224986, "tps": 34138, "wall": 10107.3} {"step": 5265, "train_loss": 3.5286121368408203, "lr": 0.0003817708888674824, "tps": 34119, "wall": 10114.9} {"step": 5266, "train_loss": 3.643082857131958, "lr": 0.0003817624870101656, "tps": 34099, "wall": 10122.8} {"step": 5267, "train_loss": 3.6254115104675293, "lr": 0.0003817540833203947, "tps": 34079, "wall": 10130.4} {"step": 5268, "train_loss": 3.5489706993103027, "lr": 0.0003817456777982646, "tps": 34060, "wall": 10138.2} {"step": 5269, "train_loss": 3.582228660583496, "lr": 0.0003817372704438708, "tps": 34041, "wall": 10145.8} {"step": 5270, "train_loss": 3.7287607192993164, "lr": 0.00038172886125730843, "tps": 34021, "wall": 10153.5} {"step": 5271, "train_loss": 3.5834202766418457, "lr": 0.00038172045023867284, "tps": 34002, "wall": 10161.2} {"step": 5272, "train_loss": 3.6411032676696777, "lr": 0.00038171203738805915, "tps": 33982, "wall": 10169.0} {"step": 5273, "train_loss": 3.6734204292297363, "lr": 0.0003817036227055628, "tps": 33963, "wall": 10176.6} {"step": 5274, "train_loss": 3.6841673851013184, "lr": 0.00038169520619127904, "tps": 33943, "wall": 10184.5} {"step": 5275, "train_loss": 3.663829803466797, "lr": 0.00038168678784530327, "tps": 33925, "wall": 10192.1} {"step": 5276, "train_loss": 3.6778383255004883, "lr": 0.0003816783676677307, "tps": 33905, "wall": 10199.9} {"step": 5277, "train_loss": 3.674808979034424, "lr": 0.00038166994565865697, "tps": 33886, "wall": 10207.5} {"step": 5278, "train_loss": 3.7254652976989746, "lr": 0.00038166152181817736, "tps": 33867, "wall": 10215.2} {"step": 5279, "train_loss": 3.6104788780212402, "lr": 0.0003816530961463872, "tps": 33848, "wall": 10222.9} {"step": 5280, "train_loss": 3.724807024002075, "lr": 0.0003816446686433821, "tps": 33829, "wall": 10230.6} {"step": 5281, "train_loss": 3.5633962154388428, "lr": 0.0003816362393092574, "tps": 33810, "wall": 10238.3} {"step": 5282, "train_loss": 3.606015682220459, "lr": 0.0003816278081441086, "tps": 33791, "wall": 10246.1} {"step": 5283, "train_loss": 3.617067813873291, "lr": 0.0003816193751480313, "tps": 33772, "wall": 10253.7} {"step": 5284, "train_loss": 3.7039036750793457, "lr": 0.000381610940321121, "tps": 33753, "wall": 10261.4} {"step": 5285, "train_loss": 3.583219051361084, "lr": 0.00038160250366347316, "tps": 33734, "wall": 10269.1} {"step": 5286, "train_loss": 3.6813011169433594, "lr": 0.0003815940651751834, "tps": 33715, "wall": 10276.8} {"step": 5287, "train_loss": 3.636704921722412, "lr": 0.00038158562485634737, "tps": 33696, "wall": 10284.6} {"step": 5288, "train_loss": 3.5927772521972656, "lr": 0.0003815771827070607, "tps": 33677, "wall": 10292.3} {"step": 5289, "train_loss": 3.6785190105438232, "lr": 0.0003815687387274189, "tps": 33659, "wall": 10299.9} {"step": 5290, "train_loss": 3.700005054473877, "lr": 0.0003815602929175177, "tps": 33640, "wall": 10307.6} {"step": 5291, "train_loss": 3.6367111206054688, "lr": 0.00038155184527745273, "tps": 33621, "wall": 10315.4} {"step": 5292, "train_loss": 3.609321117401123, "lr": 0.00038154339580731973, "tps": 33602, "wall": 10323.1} {"step": 5293, "train_loss": 3.6759676933288574, "lr": 0.0003815349445072144, "tps": 33583, "wall": 10330.8} {"step": 5294, "train_loss": 3.661313772201538, "lr": 0.0003815264913772325, "tps": 33565, "wall": 10338.4} {"step": 5295, "train_loss": 3.6212151050567627, "lr": 0.00038151803641746975, "tps": 33546, "wall": 10346.2} {"step": 5296, "train_loss": 3.6352391242980957, "lr": 0.00038150957962802194, "tps": 33528, "wall": 10353.8} {"step": 5297, "train_loss": 3.6648690700531006, "lr": 0.0003815011210089849, "tps": 33509, "wall": 10361.5} {"step": 5298, "train_loss": 3.622398614883423, "lr": 0.0003814926605604544, "tps": 33491, "wall": 10369.1} {"step": 5299, "train_loss": 3.6002492904663086, "lr": 0.0003814841982825264, "tps": 33473, "wall": 10376.7} {"step": 5300, "train_loss": 3.6334643363952637, "lr": 0.00038147573417529656, "tps": 33454, "wall": 10384.3} {"step": 5301, "train_loss": 3.7096784114837646, "lr": 0.0003814672682388609, "tps": 33436, "wall": 10392.0} {"step": 5302, "train_loss": 3.5281553268432617, "lr": 0.0003814588004733153, "tps": 33418, "wall": 10399.6} {"step": 5303, "train_loss": 3.6736111640930176, "lr": 0.0003814503308787556, "tps": 33400, "wall": 10407.2} {"step": 5304, "train_loss": 3.731389045715332, "lr": 0.0003814418594552779, "tps": 33381, "wall": 10415.0} {"step": 5305, "train_loss": 3.6201603412628174, "lr": 0.00038143338620297805, "tps": 33362, "wall": 10422.7} {"step": 5306, "train_loss": 3.5958399772644043, "lr": 0.00038142491112195203, "tps": 33344, "wall": 10430.4} {"step": 5307, "train_loss": 3.7064907550811768, "lr": 0.000381416434212296, "tps": 33327, "wall": 10437.9} {"step": 5308, "train_loss": 3.6560776233673096, "lr": 0.0003814079554741057, "tps": 33308, "wall": 10445.6} {"step": 5309, "train_loss": 3.640470027923584, "lr": 0.0003813994749074775, "tps": 33290, "wall": 10453.2} {"step": 5310, "train_loss": 3.6563591957092285, "lr": 0.00038139099251250725, "tps": 33272, "wall": 10460.8} {"step": 5311, "train_loss": 3.5695900917053223, "lr": 0.0003813825082892911, "tps": 33254, "wall": 10468.6} {"step": 5312, "train_loss": 3.6714067459106445, "lr": 0.00038137402223792523, "tps": 33236, "wall": 10476.2} {"step": 5313, "train_loss": 3.615294933319092, "lr": 0.0003813655343585056, "tps": 33218, "wall": 10483.9} {"step": 5314, "train_loss": 3.6665942668914795, "lr": 0.0003813570446511286, "tps": 33200, "wall": 10491.6} {"step": 5315, "train_loss": 3.723727226257324, "lr": 0.0003813485531158902, "tps": 33182, "wall": 10499.2} {"step": 5316, "train_loss": 3.616818904876709, "lr": 0.00038134005975288664, "tps": 33164, "wall": 10506.9} {"step": 5317, "train_loss": 3.7430601119995117, "lr": 0.00038133156456221414, "tps": 33146, "wall": 10514.5} {"step": 5318, "train_loss": 3.7021548748016357, "lr": 0.00038132306754396893, "tps": 33128, "wall": 10522.1} {"step": 5319, "train_loss": 3.584247589111328, "lr": 0.00038131456869824735, "tps": 33110, "wall": 10529.9} {"step": 5320, "train_loss": 3.7538766860961914, "lr": 0.0003813060680251456, "tps": 33093, "wall": 10537.5} {"step": 5321, "train_loss": 3.657989501953125, "lr": 0.00038129756552476, "tps": 33075, "wall": 10545.2} {"step": 5322, "train_loss": 3.7056167125701904, "lr": 0.00038128906119718685, "tps": 33057, "wall": 10552.8} {"step": 5323, "train_loss": 3.7155745029449463, "lr": 0.0003812805550425225, "tps": 33040, "wall": 10560.3} {"step": 5324, "train_loss": 3.6053292751312256, "lr": 0.0003812720470608632, "tps": 33022, "wall": 10567.9} {"step": 5325, "train_loss": 3.6720635890960693, "lr": 0.00038126353725230554, "tps": 33005, "wall": 10575.5} {"step": 5326, "train_loss": 3.6954755783081055, "lr": 0.0003812550256169458, "tps": 32987, "wall": 10583.2} {"step": 5327, "train_loss": 3.6197972297668457, "lr": 0.00038124651215488026, "tps": 32969, "wall": 10590.9} {"step": 5328, "train_loss": 3.621900796890259, "lr": 0.00038123799686620567, "tps": 32952, "wall": 10598.5} {"step": 5329, "train_loss": 3.7969532012939453, "lr": 0.0003812294797510183, "tps": 32934, "wall": 10606.3} {"step": 5330, "train_loss": 3.6095199584960938, "lr": 0.0003812209608094146, "tps": 32916, "wall": 10613.9} {"step": 5331, "train_loss": 3.7169668674468994, "lr": 0.0003812124400414911, "tps": 32898, "wall": 10621.5} {"step": 5332, "train_loss": 3.685333013534546, "lr": 0.0003812039174473445, "tps": 32881, "wall": 10629.1} {"step": 5333, "train_loss": 3.6415657997131348, "lr": 0.0003811953930270711, "tps": 32864, "wall": 10636.8} {"step": 5334, "train_loss": 3.5914556980133057, "lr": 0.0003811868667807676, "tps": 32846, "wall": 10644.5} {"step": 5335, "train_loss": 3.5708789825439453, "lr": 0.00038117833870853054, "tps": 32828, "wall": 10652.2} {"step": 5336, "train_loss": 3.6115498542785645, "lr": 0.00038116980881045654, "tps": 32811, "wall": 10659.7} {"step": 5337, "train_loss": 3.65480375289917, "lr": 0.00038116127708664224, "tps": 32794, "wall": 10667.5} {"step": 5338, "train_loss": 3.6030123233795166, "lr": 0.00038115274353718424, "tps": 32777, "wall": 10675.1} {"step": 5339, "train_loss": 3.682286024093628, "lr": 0.00038114420816217926, "tps": 32759, "wall": 10682.7} {"step": 5340, "train_loss": 3.4988207817077637, "lr": 0.000381135670961724, "tps": 32742, "wall": 10690.3} {"step": 5341, "train_loss": 3.6561412811279297, "lr": 0.0003811271319359151, "tps": 32725, "wall": 10698.0} {"step": 5342, "train_loss": 3.7297816276550293, "lr": 0.00038111859108484937, "tps": 32707, "wall": 10705.8} {"step": 5343, "train_loss": 3.7748279571533203, "lr": 0.0003811100484086235, "tps": 32690, "wall": 10713.4} {"step": 5344, "train_loss": 3.5778160095214844, "lr": 0.0003811015039073343, "tps": 32672, "wall": 10721.1} {"step": 5345, "train_loss": 3.603888511657715, "lr": 0.0003810929575810786, "tps": 32655, "wall": 10728.8} {"step": 5346, "train_loss": 3.652996301651001, "lr": 0.00038108440942995306, "tps": 32638, "wall": 10736.5} {"step": 5347, "train_loss": 3.7000465393066406, "lr": 0.00038107585945405467, "tps": 32621, "wall": 10744.0} {"step": 5348, "train_loss": 3.6100378036499023, "lr": 0.00038106730765348024, "tps": 32604, "wall": 10751.6} {"step": 5349, "train_loss": 3.726916790008545, "lr": 0.0003810587540283266, "tps": 32587, "wall": 10759.2} {"step": 5350, "train_loss": 3.5739352703094482, "lr": 0.0003810501985786907, "tps": 32570, "wall": 10766.9} {"step": 5351, "train_loss": 3.7339730262756348, "lr": 0.0003810416413046694, "tps": 32553, "wall": 10774.4} {"step": 5352, "train_loss": 3.6902356147766113, "lr": 0.00038103308220635974, "tps": 32536, "wall": 10782.1} {"step": 5353, "train_loss": 3.5511045455932617, "lr": 0.00038102452128385857, "tps": 32519, "wall": 10789.8} {"step": 5354, "train_loss": 3.7497787475585938, "lr": 0.0003810159585372629, "tps": 32502, "wall": 10797.3} {"step": 5355, "train_loss": 3.65334153175354, "lr": 0.0003810073939666698, "tps": 32485, "wall": 10805.0} {"step": 5356, "train_loss": 3.587190866470337, "lr": 0.0003809988275721762, "tps": 32469, "wall": 10812.6} {"step": 5357, "train_loss": 3.6044182777404785, "lr": 0.00038099025935387914, "tps": 32452, "wall": 10820.2} {"step": 5358, "train_loss": 3.5804238319396973, "lr": 0.00038098168931187577, "tps": 32435, "wall": 10827.9} {"step": 5359, "train_loss": 3.653715133666992, "lr": 0.00038097311744626306, "tps": 32418, "wall": 10835.7} {"step": 5360, "train_loss": 3.7218422889709473, "lr": 0.00038096454375713824, "tps": 32401, "wall": 10843.4} {"step": 5361, "train_loss": 3.6609044075012207, "lr": 0.00038095596824459826, "tps": 32384, "wall": 10851.1} {"step": 5362, "train_loss": 3.6299543380737305, "lr": 0.0003809473909087404, "tps": 32367, "wall": 10858.7} {"step": 5363, "train_loss": 3.657602310180664, "lr": 0.00038093881174966184, "tps": 32350, "wall": 10866.3} {"step": 5364, "train_loss": 3.592090368270874, "lr": 0.00038093023076745964, "tps": 32334, "wall": 10873.9} {"step": 5365, "train_loss": 3.63455867767334, "lr": 0.0003809216479622312, "tps": 32317, "wall": 10881.5} {"step": 5366, "train_loss": 3.672055721282959, "lr": 0.0003809130633340735, "tps": 32300, "wall": 10889.3} {"step": 5367, "train_loss": 3.6335880756378174, "lr": 0.00038090447688308396, "tps": 32284, "wall": 10896.9} {"step": 5368, "train_loss": 3.71271014213562, "lr": 0.00038089588860935983, "tps": 32267, "wall": 10904.5} {"step": 5369, "train_loss": 3.67568039894104, "lr": 0.00038088729851299834, "tps": 32251, "wall": 10912.1} {"step": 5370, "train_loss": 3.554455280303955, "lr": 0.0003808787065940968, "tps": 32234, "wall": 10919.7} {"step": 5371, "train_loss": 3.581902027130127, "lr": 0.00038087011285275265, "tps": 32217, "wall": 10927.4} {"step": 5372, "train_loss": 3.590322494506836, "lr": 0.00038086151728906306, "tps": 32201, "wall": 10935.0} {"step": 5373, "train_loss": 3.6518754959106445, "lr": 0.0003808529199031255, "tps": 32184, "wall": 10942.8} {"step": 5374, "train_loss": 3.667973756790161, "lr": 0.00038084432069503745, "tps": 32168, "wall": 10950.4} {"step": 5375, "train_loss": 3.6659679412841797, "lr": 0.0003808357196648962, "tps": 32151, "wall": 10958.1} {"step": 5376, "train_loss": 3.589907169342041, "lr": 0.00038082711681279916, "tps": 32135, "wall": 10965.8} {"step": 5377, "train_loss": 3.6436448097229004, "lr": 0.0003808185121388439, "tps": 32118, "wall": 10973.5} {"step": 5378, "train_loss": 3.6468288898468018, "lr": 0.0003808099056431278, "tps": 32102, "wall": 10981.0} {"step": 5379, "train_loss": 3.605659008026123, "lr": 0.00038080129732574844, "tps": 32086, "wall": 10988.7} {"step": 5380, "train_loss": 3.673478126525879, "lr": 0.00038079268718680325, "tps": 32069, "wall": 10996.3} {"step": 5381, "train_loss": 3.6857690811157227, "lr": 0.0003807840752263898, "tps": 32053, "wall": 11003.9} {"step": 5382, "train_loss": 3.591075897216797, "lr": 0.00038077546144460564, "tps": 32037, "wall": 11011.6} {"step": 5383, "train_loss": 3.652590274810791, "lr": 0.0003807668458415484, "tps": 32020, "wall": 11019.3} {"step": 5384, "train_loss": 3.566214084625244, "lr": 0.00038075822841731553, "tps": 32004, "wall": 11027.1} {"step": 5385, "train_loss": 3.6719398498535156, "lr": 0.0003807496091720049, "tps": 31987, "wall": 11034.8} {"step": 5386, "train_loss": 3.689815044403076, "lr": 0.00038074098810571386, "tps": 31971, "wall": 11042.4} {"step": 5387, "train_loss": 3.7507576942443848, "lr": 0.0003807323652185403, "tps": 31955, "wall": 11050.0} {"step": 5388, "train_loss": 3.599008798599243, "lr": 0.00038072374051058175, "tps": 31939, "wall": 11057.6} {"step": 5389, "train_loss": 3.741947650909424, "lr": 0.00038071511398193603, "tps": 31922, "wall": 11065.4} {"step": 5390, "train_loss": 3.655609130859375, "lr": 0.0003807064856327008, "tps": 31907, "wall": 11072.9} {"step": 5391, "train_loss": 3.6620378494262695, "lr": 0.0003806978554629738, "tps": 31891, "wall": 11080.5} {"step": 5392, "train_loss": 3.631173849105835, "lr": 0.0003806892234728527, "tps": 31875, "wall": 11088.1} {"step": 5393, "train_loss": 3.5902814865112305, "lr": 0.00038068058966243557, "tps": 31858, "wall": 11095.8} {"step": 5394, "train_loss": 3.6369595527648926, "lr": 0.0003806719540318199, "tps": 31843, "wall": 11103.4} {"step": 5395, "train_loss": 3.65616774559021, "lr": 0.00038066331658110367, "tps": 31827, "wall": 11111.0} {"step": 5396, "train_loss": 3.670620918273926, "lr": 0.0003806546773103847, "tps": 31811, "wall": 11118.6} {"step": 5397, "train_loss": 3.6599183082580566, "lr": 0.0003806460362197609, "tps": 31794, "wall": 11126.4} {"step": 5398, "train_loss": 3.6119375228881836, "lr": 0.00038063739330933, "tps": 31778, "wall": 11134.1} {"step": 5399, "train_loss": 3.606905221939087, "lr": 0.0003806287485791901, "tps": 31762, "wall": 11141.9} {"step": 5400, "train_loss": 3.639070749282837, "lr": 0.00038062010202943907, "tps": 31746, "wall": 11149.5} {"step": 5401, "train_loss": 3.661288261413574, "lr": 0.00038061145366017474, "tps": 31730, "wall": 11157.1} {"step": 5402, "train_loss": 3.6009082794189453, "lr": 0.00038060280347149524, "tps": 31715, "wall": 11164.7} {"step": 5403, "train_loss": 3.6771302223205566, "lr": 0.0003805941514634985, "tps": 31699, "wall": 11172.3} {"step": 5404, "train_loss": 3.614835500717163, "lr": 0.0003805854976362825, "tps": 31683, "wall": 11179.9} {"step": 5405, "train_loss": 3.619248390197754, "lr": 0.0003805768419899453, "tps": 31667, "wall": 11187.6} {"step": 5406, "train_loss": 3.5742075443267822, "lr": 0.0003805681845245849, "tps": 31652, "wall": 11195.1} {"step": 5407, "train_loss": 3.5886752605438232, "lr": 0.00038055952524029954, "tps": 31636, "wall": 11202.8} {"step": 5408, "train_loss": 3.7360754013061523, "lr": 0.0003805508641371871, "tps": 31621, "wall": 11210.4} {"step": 5409, "train_loss": 3.6390724182128906, "lr": 0.0003805422012153458, "tps": 31605, "wall": 11218.0} {"step": 5410, "train_loss": 3.6274795532226562, "lr": 0.0003805335364748738, "tps": 31590, "wall": 11225.6} {"step": 5411, "train_loss": 3.72878098487854, "lr": 0.00038052486991586913, "tps": 31574, "wall": 11233.1} {"step": 5412, "train_loss": 3.713815450668335, "lr": 0.0003805162015384301, "tps": 31558, "wall": 11240.9} {"step": 5413, "train_loss": 3.5411415100097656, "lr": 0.0003805075313426549, "tps": 31543, "wall": 11248.5} {"step": 5414, "train_loss": 3.695603370666504, "lr": 0.0003804988593286416, "tps": 31527, "wall": 11256.1} {"step": 5415, "train_loss": 3.588304281234741, "lr": 0.0003804901854964886, "tps": 31511, "wall": 11263.8} {"step": 5416, "train_loss": 3.641371726989746, "lr": 0.0003804815098462941, "tps": 31496, "wall": 11271.4} {"step": 5417, "train_loss": 3.6281015872955322, "lr": 0.0003804728323781564, "tps": 31480, "wall": 11279.1} {"step": 5418, "train_loss": 3.72756290435791, "lr": 0.0003804641530921737, "tps": 31465, "wall": 11286.7} {"step": 5419, "train_loss": 3.5797300338745117, "lr": 0.0003804554719884444, "tps": 31450, "wall": 11294.3} {"step": 5420, "train_loss": 3.594162702560425, "lr": 0.0003804467890670669, "tps": 31434, "wall": 11301.8} {"step": 5421, "train_loss": 3.6364071369171143, "lr": 0.0003804381043281394, "tps": 31419, "wall": 11309.6} {"step": 5422, "train_loss": 3.6212100982666016, "lr": 0.0003804294177717605, "tps": 31403, "wall": 11317.1} {"step": 5423, "train_loss": 3.5777053833007812, "lr": 0.0003804207293980284, "tps": 31388, "wall": 11324.9} {"step": 5424, "train_loss": 3.578671455383301, "lr": 0.0003804120392070416, "tps": 31373, "wall": 11332.4} {"step": 5425, "train_loss": 3.609909772872925, "lr": 0.00038040334719889856, "tps": 31357, "wall": 11340.0} {"step": 5426, "train_loss": 3.629422664642334, "lr": 0.0003803946533736977, "tps": 31342, "wall": 11347.6} {"step": 5427, "train_loss": 3.575164794921875, "lr": 0.00038038595773153753, "tps": 31327, "wall": 11355.2} {"step": 5428, "train_loss": 3.697680711746216, "lr": 0.0003803772602725166, "tps": 31311, "wall": 11362.9} {"step": 5429, "train_loss": 3.607180595397949, "lr": 0.00038036856099673335, "tps": 31296, "wall": 11370.5} {"step": 5430, "train_loss": 3.719393014907837, "lr": 0.0003803598599042864, "tps": 31281, "wall": 11378.0} {"step": 5431, "train_loss": 3.6325442790985107, "lr": 0.0003803511569952742, "tps": 31266, "wall": 11385.8} {"step": 5432, "train_loss": 3.6933271884918213, "lr": 0.00038034245226979544, "tps": 31251, "wall": 11393.4} {"step": 5433, "train_loss": 3.6297202110290527, "lr": 0.0003803337457279488, "tps": 31235, "wall": 11401.1} {"step": 5434, "train_loss": 3.6514182090759277, "lr": 0.00038032503736983275, "tps": 31220, "wall": 11408.6} {"step": 5435, "train_loss": 3.6435048580169678, "lr": 0.00038031632719554595, "tps": 31205, "wall": 11416.3} {"step": 5436, "train_loss": 3.6385302543640137, "lr": 0.0003803076152051872, "tps": 31190, "wall": 11424.0} {"step": 5437, "train_loss": 3.6017580032348633, "lr": 0.00038029890139885513, "tps": 31175, "wall": 11431.6} {"step": 5438, "train_loss": 3.613198757171631, "lr": 0.0003802901857766484, "tps": 31160, "wall": 11439.2} {"step": 5439, "train_loss": 3.557257652282715, "lr": 0.00038028146833866575, "tps": 31145, "wall": 11446.9} {"step": 5440, "train_loss": 3.5907821655273438, "lr": 0.00038027274908500596, "tps": 31130, "wall": 11454.5} {"step": 5441, "train_loss": 3.4219655990600586, "lr": 0.00038026402801576777, "tps": 31115, "wall": 11462.1} {"step": 5442, "train_loss": 3.628936767578125, "lr": 0.00038025530513105006, "tps": 31100, "wall": 11469.7} {"step": 5443, "train_loss": 3.6280274391174316, "lr": 0.00038024658043095156, "tps": 31085, "wall": 11477.3} {"step": 5444, "train_loss": 3.5118048191070557, "lr": 0.0003802378539155712, "tps": 31070, "wall": 11485.0} {"step": 5445, "train_loss": 3.656568765640259, "lr": 0.00038022912558500767, "tps": 31055, "wall": 11492.6} {"step": 5446, "train_loss": 3.6215004920959473, "lr": 0.00038022039543935993, "tps": 31040, "wall": 11500.2} {"step": 5447, "train_loss": 3.654984712600708, "lr": 0.00038021166347872696, "tps": 31025, "wall": 11507.9} {"step": 5448, "train_loss": 3.649651050567627, "lr": 0.00038020292970320754, "tps": 31010, "wall": 11515.5} {"step": 5449, "train_loss": 3.4969520568847656, "lr": 0.00038019419411290065, "tps": 30996, "wall": 11523.0} {"step": 5450, "train_loss": 3.573866367340088, "lr": 0.00038018545670790533, "tps": 30981, "wall": 11530.6} {"step": 5451, "train_loss": 3.6411705017089844, "lr": 0.00038017671748832047, "tps": 30966, "wall": 11538.2} {"step": 5452, "train_loss": 3.599547863006592, "lr": 0.00038016797645424504, "tps": 30950, "wall": 11546.3} {"step": 5453, "train_loss": 3.6178817749023438, "lr": 0.00038015923360577814, "tps": 30934, "wall": 11554.5} {"step": 5454, "train_loss": 3.481262683868408, "lr": 0.0003801504889430187, "tps": 30919, "wall": 11562.2} {"step": 5455, "train_loss": 3.669614791870117, "lr": 0.000380141742466066, "tps": 30905, "wall": 11569.8} {"step": 5456, "train_loss": 3.536609172821045, "lr": 0.00038013299417501893, "tps": 30890, "wall": 11577.5} {"step": 5457, "train_loss": 3.5882060527801514, "lr": 0.00038012424406997654, "tps": 30875, "wall": 11585.0} {"step": 5458, "train_loss": 3.717212438583374, "lr": 0.0003801154921510382, "tps": 30861, "wall": 11592.6} {"step": 5459, "train_loss": 3.6903939247131348, "lr": 0.0003801067384183028, "tps": 30846, "wall": 11600.2} {"step": 5460, "train_loss": 3.7044644355773926, "lr": 0.00038009798287186964, "tps": 30831, "wall": 11607.9} {"step": 5461, "train_loss": 3.615434169769287, "lr": 0.0003800892255118379, "tps": 30817, "wall": 11615.5} {"step": 5462, "train_loss": 3.706608295440674, "lr": 0.0003800804663383067, "tps": 30802, "wall": 11623.4} {"step": 5463, "train_loss": 3.583646774291992, "lr": 0.00038007170535137534, "tps": 30787, "wall": 11631.0} {"step": 5464, "train_loss": 3.590513229370117, "lr": 0.00038006294255114306, "tps": 30772, "wall": 11638.6} {"step": 5465, "train_loss": 3.661423683166504, "lr": 0.0003800541779377091, "tps": 30758, "wall": 11646.3} {"step": 5466, "train_loss": 3.680818557739258, "lr": 0.0003800454115111727, "tps": 30743, "wall": 11653.9} {"step": 5467, "train_loss": 3.6268792152404785, "lr": 0.00038003664327163327, "tps": 30729, "wall": 11661.5} {"step": 5468, "train_loss": 3.7278847694396973, "lr": 0.0003800278732191901, "tps": 30714, "wall": 11669.2} {"step": 5469, "train_loss": 3.6515674591064453, "lr": 0.0003800191013539425, "tps": 30700, "wall": 11676.9} {"step": 5470, "train_loss": 3.594451427459717, "lr": 0.0003800103276759899, "tps": 30685, "wall": 11684.7} {"step": 5471, "train_loss": 3.6043434143066406, "lr": 0.0003800015521854316, "tps": 30670, "wall": 11692.3} {"step": 5472, "train_loss": 3.613956928253174, "lr": 0.00037999277488236704, "tps": 30656, "wall": 11700.0} {"step": 5473, "train_loss": 3.539255142211914, "lr": 0.0003799839957668957, "tps": 30642, "wall": 11707.5} {"step": 5474, "train_loss": 3.696786403656006, "lr": 0.00037997521483911704, "tps": 30627, "wall": 11715.3} {"step": 5475, "train_loss": 3.7322750091552734, "lr": 0.0003799664320991305, "tps": 30612, "wall": 11723.0} {"step": 5476, "train_loss": 3.5836713314056396, "lr": 0.00037995764754703546, "tps": 30598, "wall": 11730.7} {"step": 5477, "train_loss": 3.567084550857544, "lr": 0.0003799488611829316, "tps": 30583, "wall": 11738.4} {"step": 5478, "train_loss": 3.7045350074768066, "lr": 0.0003799400730069184, "tps": 30569, "wall": 11746.2} {"step": 5479, "train_loss": 3.673949956893921, "lr": 0.0003799312830190954, "tps": 30554, "wall": 11753.9} {"step": 5480, "train_loss": 3.5769219398498535, "lr": 0.00037992249121956214, "tps": 30540, "wall": 11761.6} {"step": 5481, "train_loss": 3.5930423736572266, "lr": 0.0003799136976084183, "tps": 30526, "wall": 11769.2} {"step": 5482, "train_loss": 3.573772430419922, "lr": 0.00037990490218576335, "tps": 30511, "wall": 11777.1} {"step": 5483, "train_loss": 3.5553338527679443, "lr": 0.00037989610495169714, "tps": 30496, "wall": 11784.9} {"step": 5484, "train_loss": 3.5506784915924072, "lr": 0.00037988730590631913, "tps": 30481, "wall": 11792.8} {"step": 5485, "train_loss": 3.6055872440338135, "lr": 0.0003798785050497291, "tps": 30467, "wall": 11800.5} {"step": 5486, "train_loss": 3.5844874382019043, "lr": 0.0003798697023820267, "tps": 30452, "wall": 11808.3} {"step": 5487, "train_loss": 3.5296759605407715, "lr": 0.0003798608979033117, "tps": 30437, "wall": 11816.2} {"step": 5488, "train_loss": 3.5336976051330566, "lr": 0.0003798520916136837, "tps": 30423, "wall": 11823.9} {"step": 5489, "train_loss": 3.625441074371338, "lr": 0.0003798432835132426, "tps": 30409, "wall": 11831.7} {"step": 5490, "train_loss": 3.6452696323394775, "lr": 0.00037983447360208817, "tps": 30394, "wall": 11839.5} {"step": 5491, "train_loss": 3.656449317932129, "lr": 0.00037982566188032017, "tps": 30380, "wall": 11847.4} {"step": 5492, "train_loss": 3.5292601585388184, "lr": 0.0003798168483480384, "tps": 30365, "wall": 11855.2} {"step": 5493, "train_loss": 3.6575024127960205, "lr": 0.00037980803300534274, "tps": 30350, "wall": 11863.1} {"step": 5494, "train_loss": 3.5185461044311523, "lr": 0.000379799215852333, "tps": 30336, "wall": 11870.8} {"step": 5495, "train_loss": 3.660715103149414, "lr": 0.0003797903968891092, "tps": 30321, "wall": 11878.8} {"step": 5496, "train_loss": 3.531561851501465, "lr": 0.0003797815761157711, "tps": 30307, "wall": 11886.5} {"step": 5497, "train_loss": 3.602933406829834, "lr": 0.0003797727535324186, "tps": 30293, "wall": 11894.3} {"step": 5498, "train_loss": 3.6454572677612305, "lr": 0.00037976392913915177, "tps": 30278, "wall": 11902.1} {"step": 5499, "train_loss": 3.6507554054260254, "lr": 0.0003797551029360705, "tps": 30264, "wall": 11910.1} {"step": 5500, "train_loss": 3.4688618183135986, "lr": 0.00037974627492327477, "tps": 30249, "wall": 11917.9} {"step": 5501, "train_loss": 3.6138200759887695, "lr": 0.00037973744510086453, "tps": 30235, "wall": 11925.8} {"step": 5502, "train_loss": 3.602597713470459, "lr": 0.00037972861346893995, "tps": 30220, "wall": 11933.7} {"step": 5503, "train_loss": 3.6744723320007324, "lr": 0.000379719780027601, "tps": 30206, "wall": 11941.6} {"step": 5504, "train_loss": 3.609560966491699, "lr": 0.00037971094477694766, "tps": 30192, "wall": 11949.3} {"step": 5505, "train_loss": 3.5135397911071777, "lr": 0.0003797021077170802, "tps": 30177, "wall": 11957.3} {"step": 5506, "train_loss": 3.4939217567443848, "lr": 0.0003796932688480986, "tps": 30163, "wall": 11965.2} {"step": 5507, "train_loss": 3.5998096466064453, "lr": 0.0003796844281701029, "tps": 30148, "wall": 11973.1} {"step": 5508, "train_loss": 3.613412857055664, "lr": 0.0003796755856831935, "tps": 30134, "wall": 11980.9} {"step": 5509, "train_loss": 3.690185785293579, "lr": 0.0003796667413874703, "tps": 30119, "wall": 11989.0} {"step": 5510, "train_loss": 3.592769145965576, "lr": 0.00037965789528303373, "tps": 30105, "wall": 11997.0} {"step": 5511, "train_loss": 3.6273787021636963, "lr": 0.0003796490473699839, "tps": 30090, "wall": 12004.8} {"step": 5512, "train_loss": 3.6711366176605225, "lr": 0.00037964019764842095, "tps": 30076, "wall": 12012.7} {"step": 5513, "train_loss": 3.730806827545166, "lr": 0.0003796313461184452, "tps": 30062, "wall": 12020.6} {"step": 5514, "train_loss": 3.6321916580200195, "lr": 0.00037962249278015694, "tps": 30047, "wall": 12028.7} {"step": 5515, "train_loss": 3.691823720932007, "lr": 0.00037961363763365643, "tps": 30033, "wall": 12036.5} {"step": 5516, "train_loss": 3.6119630336761475, "lr": 0.00037960478067904405, "tps": 30018, "wall": 12044.6} {"step": 5517, "train_loss": 3.646541118621826, "lr": 0.00037959592191642004, "tps": 30004, "wall": 12052.6} {"step": 5518, "train_loss": 3.705954074859619, "lr": 0.00037958706134588483, "tps": 29990, "wall": 12060.4} {"step": 5519, "train_loss": 3.5082132816314697, "lr": 0.0003795781989675387, "tps": 29975, "wall": 12068.3} {"step": 5520, "train_loss": 3.63278865814209, "lr": 0.00037956933478148217, "tps": 29961, "wall": 12076.3} {"step": 5521, "train_loss": 3.721367835998535, "lr": 0.00037956046878781556, "tps": 29947, "wall": 12084.2} {"step": 5522, "train_loss": 3.5963821411132812, "lr": 0.0003795516009866393, "tps": 29932, "wall": 12092.2} {"step": 5523, "train_loss": 3.6326167583465576, "lr": 0.00037954273137805384, "tps": 29918, "wall": 12100.1} {"step": 5524, "train_loss": 3.651418924331665, "lr": 0.00037953385996215974, "tps": 29904, "wall": 12108.1} {"step": 5525, "train_loss": 3.528780937194824, "lr": 0.00037952498673905744, "tps": 29890, "wall": 12116.1} {"step": 5526, "train_loss": 3.5131402015686035, "lr": 0.0003795161117088475, "tps": 29876, "wall": 12124.0} {"step": 5527, "train_loss": 3.5657958984375, "lr": 0.0003795072348716304, "tps": 29861, "wall": 12132.0} {"step": 5528, "train_loss": 3.6198434829711914, "lr": 0.0003794983562275066, "tps": 29847, "wall": 12139.9} {"step": 5529, "train_loss": 3.707801580429077, "lr": 0.0003794894757765769, "tps": 29833, "wall": 12147.9} {"step": 5530, "train_loss": 3.659989356994629, "lr": 0.00037948059351894175, "tps": 29819, "wall": 12155.9} {"step": 5531, "train_loss": 3.6499505043029785, "lr": 0.00037947170945470184, "tps": 29804, "wall": 12164.0} {"step": 5532, "train_loss": 3.6097018718719482, "lr": 0.00037946282358395777, "tps": 29790, "wall": 12172.0} {"step": 5533, "train_loss": 3.6358232498168945, "lr": 0.00037945393590681025, "tps": 29776, "wall": 12180.0} {"step": 5534, "train_loss": 3.5518741607666016, "lr": 0.00037944504642335985, "tps": 29762, "wall": 12188.0} {"step": 5535, "train_loss": 3.6574933528900146, "lr": 0.0003794361551337073, "tps": 29748, "wall": 12196.0} {"step": 5536, "train_loss": 3.5428435802459717, "lr": 0.00037942726203795345, "tps": 29734, "wall": 12204.0} {"step": 5537, "train_loss": 3.6151959896087646, "lr": 0.0003794183671361989, "tps": 29719, "wall": 12212.1} {"step": 5538, "train_loss": 3.6270432472229004, "lr": 0.0003794094704285445, "tps": 29705, "wall": 12220.0} {"step": 5539, "train_loss": 3.598228931427002, "lr": 0.000379400571915091, "tps": 29691, "wall": 12228.2} {"step": 5540, "train_loss": 3.5576651096343994, "lr": 0.00037939167159593915, "tps": 29677, "wall": 12236.2} {"step": 5541, "train_loss": 3.5892372131347656, "lr": 0.00037938276947118983, "tps": 29663, "wall": 12244.2} {"step": 5542, "train_loss": 3.6876189708709717, "lr": 0.0003793738655409439, "tps": 29649, "wall": 12252.2} {"step": 5543, "train_loss": 3.6289567947387695, "lr": 0.00037936495980530217, "tps": 29634, "wall": 12260.3} {"step": 5544, "train_loss": 3.583808660507202, "lr": 0.0003793560522643656, "tps": 29620, "wall": 12268.2} {"step": 5545, "train_loss": 3.630066156387329, "lr": 0.000379347142918235, "tps": 29606, "wall": 12276.3} {"step": 5546, "train_loss": 3.5788040161132812, "lr": 0.0003793382317670114, "tps": 29592, "wall": 12284.4} {"step": 5547, "train_loss": 3.675048828125, "lr": 0.0003793293188107956, "tps": 29578, "wall": 12292.5} {"step": 5548, "train_loss": 3.608091115951538, "lr": 0.0003793204040496888, "tps": 29564, "wall": 12300.6} {"step": 5549, "train_loss": 3.6875851154327393, "lr": 0.0003793114874837917, "tps": 29550, "wall": 12308.6} {"step": 5550, "train_loss": 3.679307460784912, "lr": 0.0003793025691132055, "tps": 29536, "wall": 12316.7} {"step": 5551, "train_loss": 3.6611132621765137, "lr": 0.0003792936489380312, "tps": 29522, "wall": 12324.8} {"step": 5552, "train_loss": 3.651412010192871, "lr": 0.0003792847269583698, "tps": 29508, "wall": 12332.9} {"step": 5553, "train_loss": 3.6670520305633545, "lr": 0.00037927580317432245, "tps": 29494, "wall": 12340.9} {"step": 5554, "train_loss": 3.6452231407165527, "lr": 0.0003792668775859901, "tps": 29480, "wall": 12349.0} {"step": 5555, "train_loss": 3.6418685913085938, "lr": 0.000379257950193474, "tps": 29466, "wall": 12357.1} {"step": 5556, "train_loss": 3.6965579986572266, "lr": 0.0003792490209968752, "tps": 29452, "wall": 12365.1} {"step": 5557, "train_loss": 3.60295033454895, "lr": 0.0003792400899962949, "tps": 29438, "wall": 12373.2} {"step": 5558, "train_loss": 3.6084656715393066, "lr": 0.0003792311571918343, "tps": 29424, "wall": 12381.3} {"step": 5559, "train_loss": 3.6868929862976074, "lr": 0.00037922222258359443, "tps": 29410, "wall": 12389.3} {"step": 5560, "train_loss": 3.5729053020477295, "lr": 0.0003792132861716767, "tps": 29396, "wall": 12397.5} {"step": 5561, "train_loss": 3.5621848106384277, "lr": 0.00037920434795618216, "tps": 29382, "wall": 12405.6} {"step": 5562, "train_loss": 3.6095926761627197, "lr": 0.0003791954079372122, "tps": 29368, "wall": 12413.8} {"step": 5563, "train_loss": 3.5202486515045166, "lr": 0.00037918646611486805, "tps": 29354, "wall": 12421.8} {"step": 5564, "train_loss": 3.6568827629089355, "lr": 0.00037917752248925094, "tps": 29341, "wall": 12429.9} {"step": 5565, "train_loss": 3.666490077972412, "lr": 0.00037916857706046233, "tps": 29327, "wall": 12438.0} {"step": 5566, "train_loss": 3.5255885124206543, "lr": 0.00037915962982860345, "tps": 29313, "wall": 12446.2} {"step": 5567, "train_loss": 3.643771171569824, "lr": 0.00037915068079377566, "tps": 29299, "wall": 12454.3} {"step": 5568, "train_loss": 3.65759015083313, "lr": 0.00037914172995608033, "tps": 29285, "wall": 12462.4} {"step": 5569, "train_loss": 3.6421284675598145, "lr": 0.0003791327773156189, "tps": 29271, "wall": 12470.5} {"step": 5570, "train_loss": 3.5595552921295166, "lr": 0.00037912382287249273, "tps": 29258, "wall": 12478.6} {"step": 5571, "train_loss": 3.636603832244873, "lr": 0.0003791148666268033, "tps": 29244, "wall": 12486.7} {"step": 5572, "train_loss": 3.6558730602264404, "lr": 0.00037910590857865206, "tps": 29230, "wall": 12494.8} {"step": 5573, "train_loss": 3.679626941680908, "lr": 0.00037909694872814047, "tps": 29216, "wall": 12502.9} {"step": 5574, "train_loss": 3.622776985168457, "lr": 0.0003790879870753701, "tps": 29203, "wall": 12511.1} {"step": 5575, "train_loss": 3.689361095428467, "lr": 0.0003790790236204423, "tps": 29189, "wall": 12519.2} {"step": 5576, "train_loss": 3.6998813152313232, "lr": 0.0003790700583634588, "tps": 29175, "wall": 12527.4} {"step": 5577, "train_loss": 3.6746773719787598, "lr": 0.00037906109130452105, "tps": 29161, "wall": 12535.5} {"step": 5578, "train_loss": 3.621406078338623, "lr": 0.0003790521224437306, "tps": 29148, "wall": 12543.7} {"step": 5579, "train_loss": 3.592609405517578, "lr": 0.0003790431517811892, "tps": 29134, "wall": 12551.7} {"step": 5580, "train_loss": 3.6379246711730957, "lr": 0.0003790341793169983, "tps": 29120, "wall": 12560.0} {"step": 5581, "train_loss": 3.6367764472961426, "lr": 0.00037902520505125957, "tps": 29107, "wall": 12568.1} {"step": 5582, "train_loss": 3.6111392974853516, "lr": 0.0003790162289840748, "tps": 29093, "wall": 12576.3} {"step": 5583, "train_loss": 3.634580135345459, "lr": 0.00037900725111554557, "tps": 29079, "wall": 12584.5} {"step": 5584, "train_loss": 3.661968231201172, "lr": 0.0003789982714457736, "tps": 29066, "wall": 12592.6} {"step": 5585, "train_loss": 3.6615564823150635, "lr": 0.0003789892899748606, "tps": 29052, "wall": 12600.8} {"step": 5586, "train_loss": 3.6137208938598633, "lr": 0.0003789803067029083, "tps": 29038, "wall": 12608.9} {"step": 5587, "train_loss": 3.742616653442383, "lr": 0.00037897132163001854, "tps": 29025, "wall": 12617.1} {"step": 5588, "train_loss": 3.631291389465332, "lr": 0.000378962334756293, "tps": 29011, "wall": 12625.3} {"step": 5589, "train_loss": 3.580397129058838, "lr": 0.0003789533460818335, "tps": 28997, "wall": 12633.6} {"step": 5590, "train_loss": 3.681136131286621, "lr": 0.00037894435560674195, "tps": 28983, "wall": 12641.9} {"step": 5591, "train_loss": 3.7589993476867676, "lr": 0.00037893536333112013, "tps": 28970, "wall": 12650.1} {"step": 5592, "train_loss": 3.601461887359619, "lr": 0.0003789263692550699, "tps": 28956, "wall": 12658.3} {"step": 5593, "train_loss": 3.6464290618896484, "lr": 0.0003789173733786932, "tps": 28942, "wall": 12666.6} {"step": 5594, "train_loss": 3.6346659660339355, "lr": 0.0003789083757020919, "tps": 28929, "wall": 12674.9} {"step": 5595, "train_loss": 3.6351349353790283, "lr": 0.0003788993762253679, "tps": 28915, "wall": 12683.0} {"step": 5596, "train_loss": 3.5543251037597656, "lr": 0.00037889037494862315, "tps": 28902, "wall": 12691.2} {"step": 5597, "train_loss": 3.5972447395324707, "lr": 0.0003788813718719597, "tps": 28888, "wall": 12699.3} {"step": 5598, "train_loss": 3.673265218734741, "lr": 0.0003788723669954794, "tps": 28875, "wall": 12707.6} {"step": 5599, "train_loss": 3.6812479496002197, "lr": 0.0003788633603192844, "tps": 28861, "wall": 12715.8} {"step": 5600, "train_loss": 3.7148537635803223, "lr": 0.00037885435184347664, "tps": 28848, "wall": 12723.9} {"step": 5601, "train_loss": 3.618610382080078, "lr": 0.0003788453415681581, "tps": 28835, "wall": 12732.1} {"step": 5602, "train_loss": 3.657684564590454, "lr": 0.000378836329493431, "tps": 28822, "wall": 12740.2} {"step": 5603, "train_loss": 3.5774192810058594, "lr": 0.0003788273156193974, "tps": 28808, "wall": 12748.4} {"step": 5604, "train_loss": 3.7644386291503906, "lr": 0.00037881829994615933, "tps": 28795, "wall": 12756.5} {"step": 5605, "train_loss": 3.596283435821533, "lr": 0.000378809282473819, "tps": 28782, "wall": 12764.7} {"step": 5606, "train_loss": 3.5804057121276855, "lr": 0.0003788002632024785, "tps": 28768, "wall": 12772.8} {"step": 5607, "train_loss": 3.6031975746154785, "lr": 0.00037879124213224, "tps": 28756, "wall": 12780.8} {"step": 5608, "train_loss": 3.662716865539551, "lr": 0.00037878221926320577, "tps": 28742, "wall": 12788.9} {"step": 5609, "train_loss": 3.5406081676483154, "lr": 0.000378773194595478, "tps": 28729, "wall": 12797.0} {"step": 5610, "train_loss": 3.7047314643859863, "lr": 0.0003787641681291588, "tps": 28716, "wall": 12805.2} {"step": 5611, "train_loss": 3.549154281616211, "lr": 0.0003787551398643506, "tps": 28703, "wall": 12813.4} {"step": 5612, "train_loss": 3.614828586578369, "lr": 0.00037874610980115554, "tps": 28690, "wall": 12821.6} {"step": 5613, "train_loss": 3.6717329025268555, "lr": 0.000378737077939676, "tps": 28677, "wall": 12829.6} {"step": 5614, "train_loss": 3.586958646774292, "lr": 0.0003787280442800142, "tps": 28664, "wall": 12837.8} {"step": 5615, "train_loss": 3.5695247650146484, "lr": 0.00037871900882227263, "tps": 28651, "wall": 12845.9} {"step": 5616, "train_loss": 3.521641731262207, "lr": 0.0003787099715665534, "tps": 28638, "wall": 12854.0} {"step": 5617, "train_loss": 3.552712917327881, "lr": 0.0003787009325129591, "tps": 28625, "wall": 12862.1} {"step": 5618, "train_loss": 3.6604743003845215, "lr": 0.00037869189166159207, "tps": 28612, "wall": 12870.3} {"step": 5619, "train_loss": 3.613386392593384, "lr": 0.0003786828490125547, "tps": 28599, "wall": 12878.5} {"step": 5620, "train_loss": 3.72467303276062, "lr": 0.0003786738045659494, "tps": 28586, "wall": 12886.6} {"step": 5621, "train_loss": 3.6186418533325195, "lr": 0.0003786647583218786, "tps": 28573, "wall": 12894.7} {"step": 5622, "train_loss": 3.5781216621398926, "lr": 0.0003786557102804449, "tps": 28560, "wall": 12902.7} {"step": 5623, "train_loss": 3.5839591026306152, "lr": 0.0003786466604417508, "tps": 28547, "wall": 12910.8} {"step": 5624, "train_loss": 3.5750794410705566, "lr": 0.0003786376088058987, "tps": 28534, "wall": 12919.0} {"step": 5625, "train_loss": 3.51031494140625, "lr": 0.00037862855537299113, "tps": 28521, "wall": 12927.1} {"step": 5626, "train_loss": 3.612387180328369, "lr": 0.00037861950014313076, "tps": 28509, "wall": 12935.2} {"step": 5627, "train_loss": 3.732961654663086, "lr": 0.00037861044311642006, "tps": 28496, "wall": 12943.4} {"step": 5628, "train_loss": 3.631923198699951, "lr": 0.00037860138429296177, "tps": 28483, "wall": 12951.5} {"step": 5629, "train_loss": 3.644939661026001, "lr": 0.0003785923236728583, "tps": 28470, "wall": 12959.7} {"step": 5630, "train_loss": 3.5548365116119385, "lr": 0.00037858326125621245, "tps": 28457, "wall": 12967.7} {"step": 5631, "train_loss": 3.659853219985962, "lr": 0.0003785741970431269, "tps": 28445, "wall": 12975.8} {"step": 5632, "train_loss": 3.660745620727539, "lr": 0.00037856513103370416, "tps": 28432, "wall": 12983.9} {"step": 5633, "train_loss": 3.621049642562866, "lr": 0.00037855606322804715, "tps": 28419, "wall": 12992.0} {"step": 5634, "train_loss": 3.570706367492676, "lr": 0.0003785469936262584, "tps": 28407, "wall": 13000.0} {"step": 5635, "train_loss": 3.615015983581543, "lr": 0.0003785379222284407, "tps": 28394, "wall": 13008.1} {"step": 5636, "train_loss": 3.427732229232788, "lr": 0.000378528849034697, "tps": 28381, "wall": 13016.2} {"step": 5637, "train_loss": 3.666562557220459, "lr": 0.00037851977404512976, "tps": 28369, "wall": 13024.1} {"step": 5638, "train_loss": 3.5450525283813477, "lr": 0.000378510697259842, "tps": 28357, "wall": 13032.2} {"step": 5639, "train_loss": 3.6383554935455322, "lr": 0.00037850161867893653, "tps": 28344, "wall": 13040.2} {"step": 5640, "train_loss": 3.6244492530822754, "lr": 0.0003784925383025161, "tps": 28332, "wall": 13048.3} {"step": 5641, "train_loss": 3.6210780143737793, "lr": 0.0003784834561306836, "tps": 28320, "wall": 13056.3} {"step": 5642, "train_loss": 3.632518768310547, "lr": 0.00037847437216354196, "tps": 28307, "wall": 13064.4} {"step": 5643, "train_loss": 3.6022958755493164, "lr": 0.0003784652864011941, "tps": 28295, "wall": 13072.4} {"step": 5644, "train_loss": 3.6379616260528564, "lr": 0.0003784561988437428, "tps": 28282, "wall": 13080.5} {"step": 5645, "train_loss": 3.695418357849121, "lr": 0.0003784471094912912, "tps": 28270, "wall": 13088.4} {"step": 5646, "train_loss": 3.6419858932495117, "lr": 0.0003784380183439421, "tps": 28258, "wall": 13096.5} {"step": 5647, "train_loss": 3.579413652420044, "lr": 0.00037842892540179864, "tps": 28245, "wall": 13104.5} {"step": 5648, "train_loss": 3.67228364944458, "lr": 0.00037841983066496374, "tps": 28233, "wall": 13112.5} {"step": 5649, "train_loss": 3.651153564453125, "lr": 0.00037841073413354034, "tps": 28221, "wall": 13120.4} {"step": 5650, "train_loss": 3.7186903953552246, "lr": 0.00037840163580763164, "tps": 28209, "wall": 13128.4} {"step": 5651, "train_loss": 3.744746208190918, "lr": 0.00037839253568734064, "tps": 28197, "wall": 13136.4} {"step": 5652, "train_loss": 3.6326115131378174, "lr": 0.0003783834337727704, "tps": 28185, "wall": 13144.4} {"step": 5653, "train_loss": 3.6960017681121826, "lr": 0.00037837433006402413, "tps": 28172, "wall": 13152.4} {"step": 5654, "train_loss": 3.6246702671051025, "lr": 0.0003783652245612048, "tps": 28160, "wall": 13160.4} {"step": 5655, "train_loss": 3.6087892055511475, "lr": 0.0003783561172644157, "tps": 28148, "wall": 13168.5} {"step": 5656, "train_loss": 3.5411877632141113, "lr": 0.0003783470081737598, "tps": 28136, "wall": 13176.4} {"step": 5657, "train_loss": 3.5352184772491455, "lr": 0.00037833789728934056, "tps": 28124, "wall": 13184.5} {"step": 5658, "train_loss": 3.558140754699707, "lr": 0.000378328784611261, "tps": 28112, "wall": 13192.5} {"step": 5659, "train_loss": 3.6294329166412354, "lr": 0.00037831967013962436, "tps": 28099, "wall": 13200.5} {"step": 5660, "train_loss": 3.533437728881836, "lr": 0.00037831055387453405, "tps": 28088, "wall": 13208.3} {"step": 5661, "train_loss": 3.6442384719848633, "lr": 0.0003783014358160931, "tps": 28076, "wall": 13216.4} {"step": 5662, "train_loss": 3.6818079948425293, "lr": 0.000378292315964405, "tps": 28064, "wall": 13224.4} {"step": 5663, "train_loss": 3.67592453956604, "lr": 0.00037828319431957295, "tps": 28052, "wall": 13232.2} {"step": 5664, "train_loss": 3.601902484893799, "lr": 0.0003782740708817003, "tps": 28040, "wall": 13240.2} {"step": 5665, "train_loss": 3.714648723602295, "lr": 0.0003782649456508905, "tps": 28028, "wall": 13248.2} {"step": 5666, "train_loss": 3.6402878761291504, "lr": 0.00037825581862724675, "tps": 28016, "wall": 13256.4} {"step": 5667, "train_loss": 3.545349597930908, "lr": 0.00037824668981087254, "tps": 28004, "wall": 13264.2} {"step": 5668, "train_loss": 3.663954257965088, "lr": 0.00037823755920187124, "tps": 27992, "wall": 13272.3} {"step": 5669, "train_loss": 3.6047699451446533, "lr": 0.00037822842680034635, "tps": 27980, "wall": 13280.2} {"step": 5670, "train_loss": 3.6574435234069824, "lr": 0.0003782192926064013, "tps": 27968, "wall": 13288.2} {"step": 5671, "train_loss": 3.5997982025146484, "lr": 0.00037821015662013946, "tps": 27956, "wall": 13296.1} {"step": 5672, "train_loss": 3.59757137298584, "lr": 0.0003782010188416645, "tps": 27945, "wall": 13304.2} {"step": 5673, "train_loss": 3.577167272567749, "lr": 0.00037819187927107977, "tps": 27933, "wall": 13312.0} {"step": 5674, "train_loss": 3.5787084102630615, "lr": 0.00037818273790848894, "tps": 27921, "wall": 13320.1} {"step": 5675, "train_loss": 3.6105499267578125, "lr": 0.00037817359475399544, "tps": 27909, "wall": 13328.0} {"step": 5676, "train_loss": 3.6593103408813477, "lr": 0.0003781644498077029, "tps": 27897, "wall": 13336.0} {"step": 5677, "train_loss": 3.509385347366333, "lr": 0.00037815530306971497, "tps": 27886, "wall": 13343.9} {"step": 5678, "train_loss": 3.658963680267334, "lr": 0.0003781461545401352, "tps": 27874, "wall": 13351.9} {"step": 5679, "train_loss": 3.556715726852417, "lr": 0.00037813700421906717, "tps": 27862, "wall": 13359.8} {"step": 5680, "train_loss": 3.5023880004882812, "lr": 0.00037812785210661467, "tps": 27851, "wall": 13367.9} {"step": 5681, "train_loss": 3.6385016441345215, "lr": 0.00037811869820288124, "tps": 27839, "wall": 13375.8} {"step": 5682, "train_loss": 3.601496696472168, "lr": 0.00037810954250797074, "tps": 27827, "wall": 13383.7} {"step": 5683, "train_loss": 3.609771251678467, "lr": 0.0003781003850219867, "tps": 27816, "wall": 13391.6} {"step": 5684, "train_loss": 3.515425443649292, "lr": 0.000378091225745033, "tps": 27804, "wall": 13399.6} {"step": 5685, "train_loss": 3.6669936180114746, "lr": 0.0003780820646772133, "tps": 27793, "wall": 13407.5} {"step": 5686, "train_loss": 3.651935577392578, "lr": 0.00037807290181863146, "tps": 27781, "wall": 13415.5} {"step": 5687, "train_loss": 3.6597259044647217, "lr": 0.0003780637371693912, "tps": 27769, "wall": 13423.6} {"step": 5688, "train_loss": 3.6116652488708496, "lr": 0.0003780545707295964, "tps": 27758, "wall": 13431.4} {"step": 5689, "train_loss": 3.6308858394622803, "lr": 0.0003780454024993509, "tps": 27746, "wall": 13439.5} {"step": 5690, "train_loss": 3.641822099685669, "lr": 0.0003780362324787584, "tps": 27735, "wall": 13447.3} {"step": 5691, "train_loss": 3.6179299354553223, "lr": 0.000378027060667923, "tps": 27723, "wall": 13455.4} {"step": 5692, "train_loss": 3.6539907455444336, "lr": 0.00037801788706694857, "tps": 27712, "wall": 13463.2} {"step": 5693, "train_loss": 3.593477725982666, "lr": 0.0003780087116759389, "tps": 27700, "wall": 13471.2} {"step": 5694, "train_loss": 3.61842679977417, "lr": 0.000377999534494998, "tps": 27689, "wall": 13479.1} {"step": 5695, "train_loss": 3.6474077701568604, "lr": 0.0003779903555242299, "tps": 27677, "wall": 13487.1} {"step": 5696, "train_loss": 3.588197708129883, "lr": 0.00037798117476373836, "tps": 27666, "wall": 13495.0} {"step": 5697, "train_loss": 3.664839744567871, "lr": 0.00037797199221362767, "tps": 27655, "wall": 13502.8} {"step": 5698, "train_loss": 3.666133403778076, "lr": 0.00037796280787400155, "tps": 27644, "wall": 13510.6} {"step": 5699, "train_loss": 3.627872943878174, "lr": 0.00037795362174496437, "tps": 27632, "wall": 13518.5} {"step": 5700, "train_loss": 3.6054649353027344, "lr": 0.0003779444338266199, "tps": 27621, "wall": 13526.4} {"step": 5701, "train_loss": 3.5787715911865234, "lr": 0.0003779352441190724, "tps": 27610, "wall": 13534.4} {"step": 5702, "train_loss": 3.673490524291992, "lr": 0.00037792605262242584, "tps": 27598, "wall": 13542.3} {"step": 5703, "train_loss": 3.6439743041992188, "lr": 0.00037791685933678446, "tps": 27587, "wall": 13550.2} {"step": 5704, "train_loss": 3.7273497581481934, "lr": 0.0003779076642622523, "tps": 27576, "wall": 13558.2} {"step": 5705, "train_loss": 3.6607348918914795, "lr": 0.0003778984673989336, "tps": 27564, "wall": 13566.1} {"step": 5706, "train_loss": 3.6238436698913574, "lr": 0.0003778892687469326, "tps": 27553, "wall": 13573.9} {"step": 5707, "train_loss": 3.549351692199707, "lr": 0.00037788006830635334, "tps": 27543, "wall": 13581.7} {"step": 5708, "train_loss": 3.7031848430633545, "lr": 0.0003778708660773002, "tps": 27531, "wall": 13589.6} {"step": 5709, "train_loss": 3.545445680618286, "lr": 0.00037786166205987725, "tps": 27520, "wall": 13597.4} {"step": 5710, "train_loss": 3.7088136672973633, "lr": 0.0003778524562541889, "tps": 27509, "wall": 13605.3} {"step": 5711, "train_loss": 3.650675058364868, "lr": 0.0003778432486603394, "tps": 27498, "wall": 13613.2} {"step": 5712, "train_loss": 3.668598175048828, "lr": 0.000377834039278433, "tps": 27487, "wall": 13621.1} {"step": 5713, "train_loss": 3.6225273609161377, "lr": 0.00037782482810857414, "tps": 27476, "wall": 13628.9} {"step": 5714, "train_loss": 3.643685817718506, "lr": 0.000377815615150867, "tps": 27465, "wall": 13636.9} {"step": 5715, "train_loss": 3.5574116706848145, "lr": 0.00037780640040541613, "tps": 27454, "wall": 13644.8} {"step": 5716, "train_loss": 3.571439504623413, "lr": 0.0003777971838723257, "tps": 27442, "wall": 13652.8} {"step": 5717, "train_loss": 3.5378642082214355, "lr": 0.00037778796555170037, "tps": 27431, "wall": 13660.6} {"step": 5718, "train_loss": 3.6294565200805664, "lr": 0.0003777787454436443, "tps": 27420, "wall": 13668.6} {"step": 5719, "train_loss": 3.575697183609009, "lr": 0.0003777695235482621, "tps": 27409, "wall": 13676.5} {"step": 5720, "train_loss": 3.480388641357422, "lr": 0.0003777602998656583, "tps": 27398, "wall": 13684.2} {"step": 5721, "train_loss": 3.56490159034729, "lr": 0.0003777510743959372, "tps": 27387, "wall": 13692.1} {"step": 5722, "train_loss": 3.642904281616211, "lr": 0.0003777418471392034, "tps": 27376, "wall": 13700.0} {"step": 5723, "train_loss": 3.494149923324585, "lr": 0.00037773261809556137, "tps": 27365, "wall": 13707.9} {"step": 5724, "train_loss": 3.737826108932495, "lr": 0.0003777233872651158, "tps": 27355, "wall": 13715.7} {"step": 5725, "train_loss": 3.4585578441619873, "lr": 0.00037771415464797116, "tps": 27343, "wall": 13723.7} {"step": 5726, "train_loss": 3.7302567958831787, "lr": 0.00037770492024423203, "tps": 27332, "wall": 13731.6} {"step": 5727, "train_loss": 3.626842498779297, "lr": 0.000377695684054003, "tps": 27322, "wall": 13739.5} {"step": 5728, "train_loss": 3.6431710720062256, "lr": 0.00037768644607738875, "tps": 27311, "wall": 13747.3} {"step": 5729, "train_loss": 3.589444160461426, "lr": 0.0003776772063144939, "tps": 27300, "wall": 13755.1} {"step": 5730, "train_loss": 3.574352264404297, "lr": 0.00037766796476542314, "tps": 27289, "wall": 13763.0} {"step": 5731, "train_loss": 3.6742844581604004, "lr": 0.00037765872143028114, "tps": 27278, "wall": 13770.9} {"step": 5732, "train_loss": 3.5974819660186768, "lr": 0.0003776494763091726, "tps": 27268, "wall": 13778.6} {"step": 5733, "train_loss": 3.713054656982422, "lr": 0.0003776402294022023, "tps": 27257, "wall": 13786.5} {"step": 5734, "train_loss": 3.6227164268493652, "lr": 0.00037763098070947495, "tps": 27246, "wall": 13794.3} {"step": 5735, "train_loss": 3.6562910079956055, "lr": 0.0003776217302310953, "tps": 27236, "wall": 13802.1} {"step": 5736, "train_loss": 3.6032419204711914, "lr": 0.00037761247796716817, "tps": 27225, "wall": 13809.8} {"step": 5737, "train_loss": 3.620302677154541, "lr": 0.0003776032239177984, "tps": 27214, "wall": 13817.6} {"step": 5738, "train_loss": 3.591791868209839, "lr": 0.00037759396808309065, "tps": 27204, "wall": 13825.4} {"step": 5739, "train_loss": 3.607235908508301, "lr": 0.00037758471046315004, "tps": 27193, "wall": 13833.3} {"step": 5740, "train_loss": 3.6314985752105713, "lr": 0.00037757545105808124, "tps": 27183, "wall": 13841.0} {"step": 5741, "train_loss": 3.5984160900115967, "lr": 0.00037756618986798925, "tps": 27172, "wall": 13848.9} {"step": 5742, "train_loss": 3.608966112136841, "lr": 0.0003775569268929789, "tps": 27161, "wall": 13856.8} {"step": 5743, "train_loss": 3.614917755126953, "lr": 0.0003775476621331552, "tps": 27151, "wall": 13864.6} {"step": 5744, "train_loss": 3.612851619720459, "lr": 0.000377538395588623, "tps": 27140, "wall": 13872.4} {"step": 5745, "train_loss": 3.6326136589050293, "lr": 0.00037752912725948744, "tps": 27129, "wall": 13880.3} {"step": 5746, "train_loss": 3.5050148963928223, "lr": 0.0003775198571458533, "tps": 27119, "wall": 13888.1} {"step": 5747, "train_loss": 3.6386077404022217, "lr": 0.00037751058524782574, "tps": 27109, "wall": 13895.8} {"step": 5748, "train_loss": 3.5138466358184814, "lr": 0.0003775013115655097, "tps": 27098, "wall": 13903.6} {"step": 5749, "train_loss": 3.6102373600006104, "lr": 0.00037749203609901033, "tps": 27088, "wall": 13911.4} {"step": 5750, "train_loss": 3.6020607948303223, "lr": 0.00037748275884843266, "tps": 27077, "wall": 13919.2} {"step": 5751, "train_loss": 3.569490909576416, "lr": 0.00037747347981388174, "tps": 27066, "wall": 13927.1} {"step": 5752, "train_loss": 3.6080851554870605, "lr": 0.0003774641989954628, "tps": 27056, "wall": 13934.9} {"step": 5753, "train_loss": 3.656036376953125, "lr": 0.0003774549163932808, "tps": 27046, "wall": 13942.6} {"step": 5754, "train_loss": 3.741459369659424, "lr": 0.000377445632007441, "tps": 27035, "wall": 13950.4} {"step": 5755, "train_loss": 3.659640312194824, "lr": 0.0003774363458380486, "tps": 27025, "wall": 13958.1} {"step": 5756, "train_loss": 3.5830631256103516, "lr": 0.00037742705788520873, "tps": 27015, "wall": 13965.9} {"step": 5757, "train_loss": 3.605175495147705, "lr": 0.00037741776814902665, "tps": 27004, "wall": 13973.8} {"step": 5758, "train_loss": 3.5882904529571533, "lr": 0.0003774084766296076, "tps": 26994, "wall": 13981.5} {"step": 5759, "train_loss": 3.6679201126098633, "lr": 0.0003773991833270568, "tps": 26984, "wall": 13989.2} {"step": 5760, "train_loss": 3.583991050720215, "lr": 0.0003773898882414795, "tps": 26973, "wall": 13997.0} {"step": 5761, "train_loss": 3.698692560195923, "lr": 0.00037738059137298104, "tps": 26963, "wall": 14004.9} {"step": 5762, "train_loss": 3.558060884475708, "lr": 0.0003773712927216667, "tps": 26953, "wall": 14012.6} {"step": 5763, "train_loss": 3.6258888244628906, "lr": 0.00037736199228764197, "tps": 26942, "wall": 14020.4} {"step": 5764, "train_loss": 3.614957571029663, "lr": 0.00037735269007101196, "tps": 26932, "wall": 14028.2} {"step": 5765, "train_loss": 3.5663001537323, "lr": 0.00037734338607188213, "tps": 26921, "wall": 14036.1} {"step": 5766, "train_loss": 3.6703453063964844, "lr": 0.00037733408029035797, "tps": 26911, "wall": 14043.8} {"step": 5767, "train_loss": 3.632972478866577, "lr": 0.00037732477272654487, "tps": 26901, "wall": 14051.6} {"step": 5768, "train_loss": 3.5846433639526367, "lr": 0.00037731546338054826, "tps": 26891, "wall": 14059.4} {"step": 5769, "train_loss": 3.6735806465148926, "lr": 0.00037730615225247354, "tps": 26881, "wall": 14067.2} {"step": 5770, "train_loss": 3.6286165714263916, "lr": 0.00037729683934242613, "tps": 26870, "wall": 14075.0} {"step": 5771, "train_loss": 3.47170352935791, "lr": 0.0003772875246505117, "tps": 26860, "wall": 14082.9} {"step": 5772, "train_loss": 3.538083076477051, "lr": 0.0003772782081768357, "tps": 26850, "wall": 14090.5} {"step": 5773, "train_loss": 3.6888580322265625, "lr": 0.00037726888992150356, "tps": 26840, "wall": 14098.4} {"step": 5774, "train_loss": 3.542562484741211, "lr": 0.000377259569884621, "tps": 26830, "wall": 14106.1} {"step": 5775, "train_loss": 3.6363253593444824, "lr": 0.00037725024806629345, "tps": 26820, "wall": 14113.8} {"step": 5776, "train_loss": 3.533189296722412, "lr": 0.00037724092446662666, "tps": 26810, "wall": 14121.5} {"step": 5777, "train_loss": 3.5962448120117188, "lr": 0.0003772315990857262, "tps": 26800, "wall": 14129.3} {"step": 5778, "train_loss": 3.605372428894043, "lr": 0.0003772222719236976, "tps": 26789, "wall": 14137.1} {"step": 5779, "train_loss": 3.5339620113372803, "lr": 0.00037721294298064656, "tps": 26779, "wall": 14144.9} {"step": 5780, "train_loss": 3.5022971630096436, "lr": 0.0003772036122566789, "tps": 26769, "wall": 14152.6} {"step": 5781, "train_loss": 3.6767754554748535, "lr": 0.00037719427975190016, "tps": 26759, "wall": 14160.3} {"step": 5782, "train_loss": 3.6203300952911377, "lr": 0.0003771849454664162, "tps": 26749, "wall": 14168.0} {"step": 5783, "train_loss": 3.7198128700256348, "lr": 0.00037717560940033254, "tps": 26740, "wall": 14175.8} {"step": 5784, "train_loss": 3.647588014602661, "lr": 0.0003771662715537552, "tps": 26729, "wall": 14183.6} {"step": 5785, "train_loss": 3.628603935241699, "lr": 0.0003771569319267897, "tps": 26719, "wall": 14191.4} {"step": 5786, "train_loss": 3.455618381500244, "lr": 0.00037714759051954205, "tps": 26709, "wall": 14199.2} {"step": 5787, "train_loss": 3.6796786785125732, "lr": 0.00037713824733211795, "tps": 26699, "wall": 14206.9} {"step": 5788, "train_loss": 3.64212703704834, "lr": 0.00037712890236462336, "tps": 26689, "wall": 14214.8} {"step": 5789, "train_loss": 3.688373565673828, "lr": 0.00037711955561716407, "tps": 26679, "wall": 14222.5} {"step": 5790, "train_loss": 3.5732903480529785, "lr": 0.0003771102070898458, "tps": 26669, "wall": 14230.3} {"step": 5791, "train_loss": 3.666783571243286, "lr": 0.0003771008567827748, "tps": 26659, "wall": 14238.0} {"step": 5792, "train_loss": 3.6088221073150635, "lr": 0.0003770915046960567, "tps": 26649, "wall": 14245.9} {"step": 5793, "train_loss": 3.577932357788086, "lr": 0.00037708215082979754, "tps": 26639, "wall": 14253.6} {"step": 5794, "train_loss": 3.6190876960754395, "lr": 0.00037707279518410324, "tps": 26630, "wall": 14261.3} {"step": 5795, "train_loss": 3.706400156021118, "lr": 0.0003770634377590799, "tps": 26620, "wall": 14269.1} {"step": 5796, "train_loss": 3.563145637512207, "lr": 0.00037705407855483336, "tps": 26610, "wall": 14276.8} {"step": 5797, "train_loss": 3.581005573272705, "lr": 0.0003770447175714698, "tps": 26600, "wall": 14284.5} {"step": 5798, "train_loss": 3.4978325366973877, "lr": 0.00037703535480909515, "tps": 26590, "wall": 14292.2} {"step": 5799, "train_loss": 3.5473074913024902, "lr": 0.00037702599026781546, "tps": 26581, "wall": 14300.0} {"step": 5800, "train_loss": 3.5346291065216064, "lr": 0.00037701662394773694, "tps": 26571, "wall": 14307.7} {"step": 5801, "train_loss": 3.5726571083068848, "lr": 0.0003770072558489655, "tps": 26561, "wall": 14315.5} {"step": 5802, "train_loss": 3.6406235694885254, "lr": 0.00037699788597160745, "tps": 26551, "wall": 14323.4} {"step": 5803, "train_loss": 3.53780460357666, "lr": 0.0003769885143157689, "tps": 26541, "wall": 14331.1} {"step": 5804, "train_loss": 3.6955318450927734, "lr": 0.00037697914088155593, "tps": 26531, "wall": 14338.8} {"step": 5805, "train_loss": 3.5719943046569824, "lr": 0.0003769697656690747, "tps": 26522, "wall": 14346.4} {"step": 5806, "train_loss": 3.662454128265381, "lr": 0.00037696038867843153, "tps": 26512, "wall": 14354.1} {"step": 5807, "train_loss": 3.671973705291748, "lr": 0.00037695100990973253, "tps": 26503, "wall": 14361.8} {"step": 5808, "train_loss": 3.5518271923065186, "lr": 0.00037694162936308405, "tps": 26493, "wall": 14369.6} {"step": 5809, "train_loss": 3.593519687652588, "lr": 0.0003769322470385923, "tps": 26483, "wall": 14377.3} {"step": 5810, "train_loss": 3.572709560394287, "lr": 0.00037692286293636355, "tps": 26473, "wall": 14385.2} {"step": 5811, "train_loss": 3.7426419258117676, "lr": 0.0003769134770565041, "tps": 26464, "wall": 14392.9} {"step": 5812, "train_loss": 3.6283864974975586, "lr": 0.0003769040893991203, "tps": 26454, "wall": 14400.6} {"step": 5813, "train_loss": 3.5311741828918457, "lr": 0.00037689469996431856, "tps": 26445, "wall": 14408.2} {"step": 5814, "train_loss": 3.524834394454956, "lr": 0.00037688530875220504, "tps": 26435, "wall": 14416.0} {"step": 5815, "train_loss": 3.619640350341797, "lr": 0.00037687591576288635, "tps": 26425, "wall": 14423.8} {"step": 5816, "train_loss": 3.667358875274658, "lr": 0.0003768665209964688, "tps": 26415, "wall": 14431.9} {"step": 5817, "train_loss": 3.675950050354004, "lr": 0.0003768571244530588, "tps": 26405, "wall": 14439.7} {"step": 5818, "train_loss": 3.693824291229248, "lr": 0.0003768477261327628, "tps": 26395, "wall": 14447.5} {"step": 5819, "train_loss": 3.561530113220215, "lr": 0.0003768383260356872, "tps": 26386, "wall": 14455.3} {"step": 5820, "train_loss": 3.7021596431732178, "lr": 0.0003768289241619387, "tps": 26376, "wall": 14463.0} {"step": 5821, "train_loss": 3.6638081073760986, "lr": 0.00037681952051162363, "tps": 26367, "wall": 14470.7} {"step": 5822, "train_loss": 3.602325916290283, "lr": 0.0003768101150848485, "tps": 26357, "wall": 14478.4} {"step": 5823, "train_loss": 3.5788259506225586, "lr": 0.00037680070788171987, "tps": 26348, "wall": 14486.1} {"step": 5824, "train_loss": 3.574237108230591, "lr": 0.0003767912989023444, "tps": 26338, "wall": 14493.9} {"step": 5825, "train_loss": 3.579655170440674, "lr": 0.00037678188814682857, "tps": 26328, "wall": 14501.7} {"step": 5826, "train_loss": 3.6546883583068848, "lr": 0.0003767724756152791, "tps": 26319, "wall": 14509.4} {"step": 5827, "train_loss": 3.549893379211426, "lr": 0.0003767630613078025, "tps": 26309, "wall": 14517.2} {"step": 5828, "train_loss": 3.46972393989563, "lr": 0.0003767536452245054, "tps": 26300, "wall": 14524.9} {"step": 5829, "train_loss": 3.5953996181488037, "lr": 0.00037674422736549463, "tps": 26290, "wall": 14532.6} {"step": 5830, "train_loss": 3.6186065673828125, "lr": 0.00037673480773087675, "tps": 26281, "wall": 14540.4} {"step": 5831, "train_loss": 3.517331123352051, "lr": 0.0003767253863207585, "tps": 26271, "wall": 14548.2} {"step": 5832, "train_loss": 3.6129977703094482, "lr": 0.0003767159631352465, "tps": 26262, "wall": 14556.0} {"step": 5833, "train_loss": 3.6824746131896973, "lr": 0.0003767065381744477, "tps": 26252, "wall": 14563.8} {"step": 5834, "train_loss": 3.681713342666626, "lr": 0.0003766971114384687, "tps": 26243, "wall": 14571.5} {"step": 5835, "train_loss": 3.639646291732788, "lr": 0.00037668768292741634, "tps": 26233, "wall": 14579.2} {"step": 5836, "train_loss": 3.659205198287964, "lr": 0.00037667825264139747, "tps": 26224, "wall": 14586.9} {"step": 5837, "train_loss": 3.595900058746338, "lr": 0.0003766688205805188, "tps": 26214, "wall": 14594.8} {"step": 5838, "train_loss": 3.667078971862793, "lr": 0.00037665938674488736, "tps": 26205, "wall": 14602.4} {"step": 5839, "train_loss": 3.5416412353515625, "lr": 0.0003766499511346099, "tps": 26196, "wall": 14610.1} {"step": 5840, "train_loss": 3.5346388816833496, "lr": 0.0003766405137497933, "tps": 26186, "wall": 14617.9} {"step": 5841, "train_loss": 3.666175365447998, "lr": 0.00037663107459054445, "tps": 26177, "wall": 14625.7} {"step": 5842, "train_loss": 3.6682987213134766, "lr": 0.0003766216336569703, "tps": 26168, "wall": 14633.4} {"step": 5843, "train_loss": 3.6110105514526367, "lr": 0.0003766121909491779, "tps": 26158, "wall": 14641.1} {"step": 5844, "train_loss": 3.5290751457214355, "lr": 0.00037660274646727403, "tps": 26149, "wall": 14648.8} {"step": 5845, "train_loss": 3.6933441162109375, "lr": 0.00037659330021136585, "tps": 26140, "wall": 14656.6} {"step": 5846, "train_loss": 3.6705515384674072, "lr": 0.00037658385218156023, "tps": 26130, "wall": 14664.3} {"step": 5847, "train_loss": 3.604807138442993, "lr": 0.0003765744023779643, "tps": 26121, "wall": 14672.0} {"step": 5848, "train_loss": 3.599661111831665, "lr": 0.00037656495080068506, "tps": 26112, "wall": 14679.8} {"step": 5849, "train_loss": 3.545595169067383, "lr": 0.00037655549744982964, "tps": 26102, "wall": 14687.6} {"step": 5850, "train_loss": 3.590541362762451, "lr": 0.000376546042325505, "tps": 26093, "wall": 14695.4} {"step": 5851, "train_loss": 3.6566197872161865, "lr": 0.0003765365854278183, "tps": 26084, "wall": 14703.1} {"step": 5852, "train_loss": 3.569040298461914, "lr": 0.0003765271267568768, "tps": 26074, "wall": 14710.7} {"step": 5853, "train_loss": 3.598355293273926, "lr": 0.0003765176663127875, "tps": 26065, "wall": 14718.4} {"step": 5854, "train_loss": 3.529339075088501, "lr": 0.0003765082040956576, "tps": 26056, "wall": 14726.2} {"step": 5855, "train_loss": 3.666600465774536, "lr": 0.00037649874010559423, "tps": 26047, "wall": 14733.9} {"step": 5856, "train_loss": 3.681105613708496, "lr": 0.00037648927434270473, "tps": 26037, "wall": 14741.7} {"step": 5857, "train_loss": 3.478668689727783, "lr": 0.00037647980680709627, "tps": 26028, "wall": 14749.5} {"step": 5858, "train_loss": 3.534679412841797, "lr": 0.0003764703374988761, "tps": 26019, "wall": 14757.3} {"step": 5859, "train_loss": 3.6808671951293945, "lr": 0.00037646086641815143, "tps": 26010, "wall": 14765.0} {"step": 5860, "train_loss": 3.5040032863616943, "lr": 0.0003764513935650296, "tps": 26001, "wall": 14772.7} {"step": 5861, "train_loss": 3.6701927185058594, "lr": 0.00037644191893961796, "tps": 25992, "wall": 14780.4} {"step": 5862, "train_loss": 3.606407642364502, "lr": 0.0003764324425420238, "tps": 25982, "wall": 14788.2} {"step": 5863, "train_loss": 3.6141228675842285, "lr": 0.0003764229643723545, "tps": 25973, "wall": 14795.9} {"step": 5864, "train_loss": 3.59847092628479, "lr": 0.0003764134844307173, "tps": 25964, "wall": 14803.8} {"step": 5865, "train_loss": 3.5890402793884277, "lr": 0.0003764040027172198, "tps": 25955, "wall": 14811.5} {"step": 5866, "train_loss": 3.493436813354492, "lr": 0.00037639451923196927, "tps": 25945, "wall": 14819.3} {"step": 5867, "train_loss": 3.5226142406463623, "lr": 0.00037638503397507305, "tps": 25937, "wall": 14826.8} {"step": 5868, "train_loss": 3.6517772674560547, "lr": 0.00037637554694663883, "tps": 25928, "wall": 14834.6} {"step": 5869, "train_loss": 3.508338451385498, "lr": 0.0003763660581467739, "tps": 25919, "wall": 14842.1} {"step": 5870, "train_loss": 3.6302974224090576, "lr": 0.0003763565675755858, "tps": 25909, "wall": 14849.9} {"step": 5871, "train_loss": 3.5993971824645996, "lr": 0.00037634707523318206, "tps": 25901, "wall": 14857.6} {"step": 5872, "train_loss": 3.534863233566284, "lr": 0.00037633758111967026, "tps": 25891, "wall": 14865.5} {"step": 5873, "train_loss": 3.53108286857605, "lr": 0.0003763280852351578, "tps": 25882, "wall": 14873.2} {"step": 5874, "train_loss": 3.514500617980957, "lr": 0.0003763185875797523, "tps": 25873, "wall": 14881.0} {"step": 5875, "train_loss": 3.667506694793701, "lr": 0.00037630908815356145, "tps": 25864, "wall": 14888.6} {"step": 5876, "train_loss": 3.517928123474121, "lr": 0.0003762995869566928, "tps": 25855, "wall": 14896.4} {"step": 5877, "train_loss": 3.659395694732666, "lr": 0.00037629008398925396, "tps": 25846, "wall": 14904.1} {"step": 5878, "train_loss": 3.680314064025879, "lr": 0.0003762805792513526, "tps": 25837, "wall": 14911.8} {"step": 5879, "train_loss": 3.6170549392700195, "lr": 0.00037627107274309634, "tps": 25828, "wall": 14919.5} {"step": 5880, "train_loss": 3.616563320159912, "lr": 0.00037626156446459293, "tps": 25819, "wall": 14927.4} {"step": 5881, "train_loss": 3.71105694770813, "lr": 0.0003762520544159501, "tps": 25810, "wall": 14935.1} {"step": 5882, "train_loss": 3.5795180797576904, "lr": 0.00037624254259727553, "tps": 25801, "wall": 14942.8} {"step": 5883, "train_loss": 3.6185812950134277, "lr": 0.000376233029008677, "tps": 25792, "wall": 14950.5} {"step": 5884, "train_loss": 3.60599684715271, "lr": 0.0003762235136502622, "tps": 25783, "wall": 14958.3} {"step": 5885, "train_loss": 3.7494747638702393, "lr": 0.00037621399652213903, "tps": 25774, "wall": 14966.1} {"step": 5886, "train_loss": 3.5867679119110107, "lr": 0.00037620447762441527, "tps": 25765, "wall": 14973.9} {"step": 5887, "train_loss": 3.622213840484619, "lr": 0.0003761949569571987, "tps": 25756, "wall": 14981.7} {"step": 5888, "train_loss": 3.6759285926818848, "lr": 0.0003761854345205972, "tps": 25747, "wall": 14989.5} {"step": 5889, "train_loss": 3.5906310081481934, "lr": 0.0003761759103147187, "tps": 25738, "wall": 14997.3} {"step": 5890, "train_loss": 3.580749988555908, "lr": 0.000376166384339671, "tps": 25729, "wall": 15005.1} {"step": 5891, "train_loss": 3.521713972091675, "lr": 0.00037615685659556205, "tps": 25720, "wall": 15012.8} {"step": 5892, "train_loss": 3.6177821159362793, "lr": 0.0003761473270824998, "tps": 25711, "wall": 15020.6} {"step": 5893, "train_loss": 3.607006311416626, "lr": 0.00037613779580059217, "tps": 25702, "wall": 15028.5} {"step": 5894, "train_loss": 3.641685724258423, "lr": 0.00037612826274994717, "tps": 25693, "wall": 15036.3} {"step": 5895, "train_loss": 3.6252808570861816, "lr": 0.00037611872793067276, "tps": 25684, "wall": 15044.2} {"step": 5896, "train_loss": 3.743892192840576, "lr": 0.00037610919134287694, "tps": 25675, "wall": 15051.9} {"step": 5897, "train_loss": 3.606167793273926, "lr": 0.00037609965298666774, "tps": 25666, "wall": 15059.6} {"step": 5898, "train_loss": 3.538832426071167, "lr": 0.00037609011286215326, "tps": 25657, "wall": 15067.3} {"step": 5899, "train_loss": 3.7008962631225586, "lr": 0.0003760805709694415, "tps": 25648, "wall": 15075.2} {"step": 5900, "train_loss": 3.637589931488037, "lr": 0.00037607102730864066, "tps": 25640, "wall": 15083.0} {"step": 5901, "train_loss": 3.487436056137085, "lr": 0.0003760614818798587, "tps": 25631, "wall": 15090.8} {"step": 5902, "train_loss": 3.576279640197754, "lr": 0.00037605193468320385, "tps": 25622, "wall": 15098.6} {"step": 5903, "train_loss": 3.6907477378845215, "lr": 0.0003760423857187842, "tps": 25613, "wall": 15106.4} {"step": 5904, "train_loss": 3.579709529876709, "lr": 0.000376032834986708, "tps": 25604, "wall": 15114.3} {"step": 5905, "train_loss": 3.5964579582214355, "lr": 0.00037602328248708344, "tps": 25595, "wall": 15122.0} {"step": 5906, "train_loss": 3.5517101287841797, "lr": 0.00037601372822001865, "tps": 25586, "wall": 15129.9} {"step": 5907, "train_loss": 3.59802508354187, "lr": 0.0003760041721856219, "tps": 25577, "wall": 15137.7} {"step": 5908, "train_loss": 3.6072211265563965, "lr": 0.0003759946143840015, "tps": 25568, "wall": 15145.7} {"step": 5909, "train_loss": 3.6805241107940674, "lr": 0.0003759850548152656, "tps": 25559, "wall": 15153.5} {"step": 5910, "train_loss": 3.5854101181030273, "lr": 0.0003759754934795226, "tps": 25550, "wall": 15161.3} {"step": 5911, "train_loss": 3.499516010284424, "lr": 0.0003759659303768808, "tps": 25541, "wall": 15169.1} {"step": 5912, "train_loss": 3.572863817214966, "lr": 0.0003759563655074485, "tps": 25533, "wall": 15177.0} {"step": 5913, "train_loss": 3.6835174560546875, "lr": 0.00037594679887133404, "tps": 25524, "wall": 15184.9} {"step": 5914, "train_loss": 3.5657882690429688, "lr": 0.0003759372304686458, "tps": 25515, "wall": 15192.6} {"step": 5915, "train_loss": 3.6284756660461426, "lr": 0.00037592766029949213, "tps": 25506, "wall": 15200.6} {"step": 5916, "train_loss": 3.5233209133148193, "lr": 0.00037591808836398154, "tps": 25497, "wall": 15208.4} {"step": 5917, "train_loss": 3.560502529144287, "lr": 0.0003759085146622224, "tps": 25488, "wall": 15216.4} {"step": 5918, "train_loss": 3.5631027221679688, "lr": 0.0003758989391943232, "tps": 25479, "wall": 15224.3} {"step": 5919, "train_loss": 3.4822607040405273, "lr": 0.00037588936196039234, "tps": 25470, "wall": 15232.1} {"step": 5920, "train_loss": 3.5877904891967773, "lr": 0.0003758797829605384, "tps": 25461, "wall": 15240.0} {"step": 5921, "train_loss": 3.6080238819122314, "lr": 0.0003758702021948698, "tps": 25452, "wall": 15247.9} {"step": 5922, "train_loss": 3.625993251800537, "lr": 0.00037586061966349515, "tps": 25444, "wall": 15255.8} {"step": 5923, "train_loss": 3.591538906097412, "lr": 0.00037585103536652293, "tps": 25435, "wall": 15263.8} {"step": 5924, "train_loss": 3.5310792922973633, "lr": 0.00037584144930406175, "tps": 25426, "wall": 15271.7} {"step": 5925, "train_loss": 3.467923164367676, "lr": 0.00037583186147622025, "tps": 25417, "wall": 15279.7} {"step": 5926, "train_loss": 3.5140554904937744, "lr": 0.00037582227188310695, "tps": 25408, "wall": 15287.6} {"step": 5927, "train_loss": 3.5640640258789062, "lr": 0.00037581268052483055, "tps": 25399, "wall": 15295.5} {"step": 5928, "train_loss": 3.582291603088379, "lr": 0.00037580308740149963, "tps": 25390, "wall": 15303.4} {"step": 5929, "train_loss": 3.6309494972229004, "lr": 0.000375793492513223, "tps": 25381, "wall": 15311.2} {"step": 5930, "train_loss": 3.6428794860839844, "lr": 0.00037578389586010916, "tps": 25372, "wall": 15319.3} {"step": 5931, "train_loss": 3.574429512023926, "lr": 0.000375774297442267, "tps": 25363, "wall": 15327.2} {"step": 5932, "train_loss": 3.5314416885375977, "lr": 0.00037576469725980507, "tps": 25354, "wall": 15335.3} {"step": 5933, "train_loss": 3.5894556045532227, "lr": 0.0003757550953128323, "tps": 25346, "wall": 15343.2} {"step": 5934, "train_loss": 3.6984481811523438, "lr": 0.00037574549160145743, "tps": 25337, "wall": 15351.1} {"step": 5935, "train_loss": 3.649547576904297, "lr": 0.0003757358861257891, "tps": 25328, "wall": 15359.1} {"step": 5936, "train_loss": 3.594731569290161, "lr": 0.00037572627888593626, "tps": 25319, "wall": 15367.1} {"step": 5937, "train_loss": 3.6499290466308594, "lr": 0.0003757166698820077, "tps": 25310, "wall": 15375.0} {"step": 5938, "train_loss": 3.6304237842559814, "lr": 0.00037570705911411234, "tps": 25301, "wall": 15382.9} {"step": 5939, "train_loss": 3.6394283771514893, "lr": 0.00037569744658235896, "tps": 25293, "wall": 15390.8} {"step": 5940, "train_loss": 3.6250321865081787, "lr": 0.00037568783228685644, "tps": 25284, "wall": 15398.8} {"step": 5941, "train_loss": 3.512234687805176, "lr": 0.0003756782162277138, "tps": 25275, "wall": 15406.8} {"step": 5942, "train_loss": 3.571336269378662, "lr": 0.00037566859840503983, "tps": 25266, "wall": 15414.8} {"step": 5943, "train_loss": 3.580247163772583, "lr": 0.0003756589788189436, "tps": 25258, "wall": 15422.6} {"step": 5944, "train_loss": 3.5224318504333496, "lr": 0.00037564935746953404, "tps": 25249, "wall": 15430.6} {"step": 5945, "train_loss": 3.531651496887207, "lr": 0.00037563973435692015, "tps": 25240, "wall": 15438.5} {"step": 5946, "train_loss": 3.5740292072296143, "lr": 0.0003756301094812109, "tps": 25231, "wall": 15446.7} {"step": 5947, "train_loss": 3.5287575721740723, "lr": 0.00037562048284251533, "tps": 25222, "wall": 15454.7} {"step": 5948, "train_loss": 3.617424488067627, "lr": 0.0003756108544409426, "tps": 25213, "wall": 15462.8} {"step": 5949, "train_loss": 3.58862566947937, "lr": 0.0003756012242766016, "tps": 25204, "wall": 15470.8} {"step": 5950, "train_loss": 3.6641011238098145, "lr": 0.0003755915923496016, "tps": 25196, "wall": 15478.8} {"step": 5951, "train_loss": 3.5574257373809814, "lr": 0.0003755819586600515, "tps": 25187, "wall": 15486.8} {"step": 5952, "train_loss": 3.64121150970459, "lr": 0.00037557232320806065, "tps": 25178, "wall": 15494.8} {"step": 5953, "train_loss": 3.4919400215148926, "lr": 0.00037556268599373807, "tps": 25169, "wall": 15502.8} {"step": 5954, "train_loss": 3.570838451385498, "lr": 0.00037555304701719297, "tps": 25160, "wall": 15510.9} {"step": 5955, "train_loss": 3.5259594917297363, "lr": 0.0003755434062785346, "tps": 25151, "wall": 15519.0} {"step": 5956, "train_loss": 3.5692005157470703, "lr": 0.00037553376377787205, "tps": 25143, "wall": 15527.1} {"step": 5957, "train_loss": 3.5424134731292725, "lr": 0.0003755241195153146, "tps": 25134, "wall": 15535.1} {"step": 5958, "train_loss": 3.6026101112365723, "lr": 0.00037551447349097155, "tps": 25125, "wall": 15543.1} {"step": 5959, "train_loss": 3.5494606494903564, "lr": 0.0003755048257049521, "tps": 25116, "wall": 15551.1} {"step": 5960, "train_loss": 3.5943641662597656, "lr": 0.00037549517615736555, "tps": 25107, "wall": 15559.2} {"step": 5961, "train_loss": 3.573394775390625, "lr": 0.00037548552484832127, "tps": 25098, "wall": 15567.4} {"step": 5962, "train_loss": 3.683046817779541, "lr": 0.00037547587177792855, "tps": 25090, "wall": 15575.5} {"step": 5963, "train_loss": 3.542926549911499, "lr": 0.0003754662169462968, "tps": 25081, "wall": 15583.6} {"step": 5964, "train_loss": 3.5771360397338867, "lr": 0.00037545656035353525, "tps": 25072, "wall": 15591.5} {"step": 5965, "train_loss": 3.5668349266052246, "lr": 0.0003754469019997534, "tps": 25063, "wall": 15599.6} {"step": 5966, "train_loss": 3.5983314514160156, "lr": 0.00037543724188506065, "tps": 25055, "wall": 15607.8} {"step": 5967, "train_loss": 3.601184368133545, "lr": 0.00037542758000956637, "tps": 25046, "wall": 15615.9} {"step": 5968, "train_loss": 3.462167739868164, "lr": 0.00037541791637338013, "tps": 25037, "wall": 15624.0} {"step": 5969, "train_loss": 3.554108142852783, "lr": 0.0003754082509766113, "tps": 25028, "wall": 15632.1} {"step": 5970, "train_loss": 3.504603624343872, "lr": 0.00037539858381936935, "tps": 25019, "wall": 15640.2} {"step": 5971, "train_loss": 3.6655218601226807, "lr": 0.0003753889149017638, "tps": 25010, "wall": 15648.4} {"step": 5972, "train_loss": 3.5169119834899902, "lr": 0.0003753792442239043, "tps": 25002, "wall": 15656.5} {"step": 5973, "train_loss": 3.708944797515869, "lr": 0.0003753695717859003, "tps": 24993, "wall": 15664.5} {"step": 5974, "train_loss": 3.5896010398864746, "lr": 0.0003753598975878614, "tps": 24984, "wall": 15672.6} {"step": 5975, "train_loss": 3.6037073135375977, "lr": 0.0003753502216298971, "tps": 24976, "wall": 15680.7} {"step": 5976, "train_loss": 3.5978481769561768, "lr": 0.0003753405439121171, "tps": 24967, "wall": 15688.8} {"step": 5977, "train_loss": 3.5037999153137207, "lr": 0.00037533086443463113, "tps": 24958, "wall": 15696.8} {"step": 5978, "train_loss": 3.666531801223755, "lr": 0.0003753211831975486, "tps": 24949, "wall": 15705.0} {"step": 5979, "train_loss": 3.5374910831451416, "lr": 0.00037531150020097935, "tps": 24941, "wall": 15713.1} {"step": 5980, "train_loss": 3.6086437702178955, "lr": 0.000375301815445033, "tps": 24932, "wall": 15721.2} {"step": 5981, "train_loss": 3.5421853065490723, "lr": 0.00037529212892981935, "tps": 24923, "wall": 15729.3} {"step": 5982, "train_loss": 3.629678726196289, "lr": 0.000375282440655448, "tps": 24915, "wall": 15737.4} {"step": 5983, "train_loss": 3.55831241607666, "lr": 0.0003752727506220288, "tps": 24906, "wall": 15745.5} {"step": 5984, "train_loss": 3.534626007080078, "lr": 0.00037526305882967147, "tps": 24898, "wall": 15753.5} {"step": 5985, "train_loss": 3.5557494163513184, "lr": 0.0003752533652784858, "tps": 24889, "wall": 15761.6} {"step": 5986, "train_loss": 3.655561923980713, "lr": 0.00037524366996858163, "tps": 24880, "wall": 15769.7} {"step": 5987, "train_loss": 3.6661548614501953, "lr": 0.0003752339729000687, "tps": 24872, "wall": 15777.8} {"step": 5988, "train_loss": 3.6745822429656982, "lr": 0.00037522427407305696, "tps": 24863, "wall": 15785.9} {"step": 5989, "train_loss": 3.6446971893310547, "lr": 0.00037521457348765625, "tps": 24854, "wall": 15794.0} {"step": 5990, "train_loss": 3.52624249458313, "lr": 0.0003752048711439765, "tps": 24846, "wall": 15802.1} {"step": 5991, "train_loss": 3.6099581718444824, "lr": 0.0003751951670421275, "tps": 24837, "wall": 15810.2} {"step": 5992, "train_loss": 3.550973653793335, "lr": 0.00037518546118221936, "tps": 24829, "wall": 15818.4} {"step": 5993, "train_loss": 3.6225783824920654, "lr": 0.0003751757535643618, "tps": 24820, "wall": 15826.6} {"step": 5994, "train_loss": 3.5448434352874756, "lr": 0.00037516604418866495, "tps": 24811, "wall": 15834.8} {"step": 5995, "train_loss": 3.5358290672302246, "lr": 0.00037515633305523874, "tps": 24803, "wall": 15842.8} {"step": 5996, "train_loss": 3.664551019668579, "lr": 0.00037514662016419325, "tps": 24794, "wall": 15851.0} {"step": 5997, "train_loss": 3.517090320587158, "lr": 0.00037513690551563847, "tps": 24785, "wall": 15859.2} {"step": 5998, "train_loss": 3.6995248794555664, "lr": 0.00037512718910968435, "tps": 24777, "wall": 15867.3} {"step": 5999, "train_loss": 3.606438159942627, "lr": 0.00037511747094644114, "tps": 24768, "wall": 15875.4} {"step": 6000, "train_loss": 3.621567487716675, "lr": 0.0003751077510260188, "tps": 24760, "wall": 15883.6, "val_loss_monitor": 3.74153195579318} {"step": 6001, "train_loss": 3.603851318359375, "lr": 0.00037509802934852733, "tps": 24672, "wall": 15942.5} {"step": 6002, "train_loss": 3.6606571674346924, "lr": 0.0003750883059140771, "tps": 24664, "wall": 15950.7} {"step": 6003, "train_loss": 3.621049404144287, "lr": 0.0003750785807227782, "tps": 24655, "wall": 15959.2} {"step": 6004, "train_loss": 3.733952283859253, "lr": 0.0003750688537747407, "tps": 24646, "wall": 15967.6} {"step": 6005, "train_loss": 3.654545545578003, "lr": 0.0003750591250700748, "tps": 24637, "wall": 15976.1} {"step": 6006, "train_loss": 3.816570281982422, "lr": 0.0003750493946088907, "tps": 24628, "wall": 15984.6} {"step": 6007, "train_loss": 3.8029699325561523, "lr": 0.00037503966239129874, "tps": 24619, "wall": 15993.1} {"step": 6008, "train_loss": 3.7495832443237305, "lr": 0.0003750299284174091, "tps": 24610, "wall": 16001.3} {"step": 6009, "train_loss": 3.6934189796447754, "lr": 0.0003750201926873321, "tps": 24601, "wall": 16009.8} {"step": 6010, "train_loss": 3.633999824523926, "lr": 0.0003750104552011779, "tps": 24593, "wall": 16018.2} {"step": 6011, "train_loss": 3.738189220428467, "lr": 0.00037500071595905686, "tps": 24584, "wall": 16026.4} {"step": 6012, "train_loss": 3.5264077186584473, "lr": 0.00037499097496107933, "tps": 24575, "wall": 16034.7} {"step": 6013, "train_loss": 3.7432003021240234, "lr": 0.0003749812322073557, "tps": 24567, "wall": 16043.0} {"step": 6014, "train_loss": 3.69685697555542, "lr": 0.0003749714876979963, "tps": 24558, "wall": 16051.3} {"step": 6015, "train_loss": 3.63826322555542, "lr": 0.0003749617414331114, "tps": 24550, "wall": 16059.5} {"step": 6016, "train_loss": 3.60563325881958, "lr": 0.0003749519934128116, "tps": 24541, "wall": 16067.9} {"step": 6017, "train_loss": 3.666912078857422, "lr": 0.00037494224363720716, "tps": 24532, "wall": 16076.2} {"step": 6018, "train_loss": 3.624910354614258, "lr": 0.0003749324921064087, "tps": 24524, "wall": 16084.4} {"step": 6019, "train_loss": 3.703615188598633, "lr": 0.00037492273882052654, "tps": 24516, "wall": 16092.6} {"step": 6020, "train_loss": 3.7435073852539062, "lr": 0.00037491298377967115, "tps": 24507, "wall": 16100.7} {"step": 6021, "train_loss": 3.859344005584717, "lr": 0.0003749032269839532, "tps": 24499, "wall": 16109.1} {"step": 6022, "train_loss": 3.720757484436035, "lr": 0.0003748934684334831, "tps": 24490, "wall": 16117.4} {"step": 6023, "train_loss": 3.8365702629089355, "lr": 0.0003748837081283714, "tps": 24481, "wall": 16125.7} {"step": 6024, "train_loss": 3.696643829345703, "lr": 0.00037487394606872863, "tps": 24473, "wall": 16134.0} {"step": 6025, "train_loss": 3.7170562744140625, "lr": 0.00037486418225466544, "tps": 24465, "wall": 16142.1} {"step": 6026, "train_loss": 3.7643041610717773, "lr": 0.00037485441668629244, "tps": 24456, "wall": 16150.3} {"step": 6027, "train_loss": 3.6893117427825928, "lr": 0.0003748446493637202, "tps": 24448, "wall": 16158.5} {"step": 6028, "train_loss": 3.681215286254883, "lr": 0.00037483488028705944, "tps": 24440, "wall": 16166.7} {"step": 6029, "train_loss": 3.7046916484832764, "lr": 0.0003748251094564207, "tps": 24431, "wall": 16175.1} {"step": 6030, "train_loss": 3.6986474990844727, "lr": 0.0003748153368719149, "tps": 24423, "wall": 16183.2} {"step": 6031, "train_loss": 3.6943273544311523, "lr": 0.0003748055625336524, "tps": 24415, "wall": 16191.3} {"step": 6032, "train_loss": 3.833064079284668, "lr": 0.0003747957864417442, "tps": 24406, "wall": 16199.5} {"step": 6033, "train_loss": 3.714179515838623, "lr": 0.00037478600859630097, "tps": 24398, "wall": 16207.5} {"step": 6034, "train_loss": 3.6634113788604736, "lr": 0.00037477622899743343, "tps": 24390, "wall": 16215.6} {"step": 6035, "train_loss": 3.7155566215515137, "lr": 0.0003747664476452524, "tps": 24382, "wall": 16223.7} {"step": 6036, "train_loss": 3.7457871437072754, "lr": 0.00037475666453986873, "tps": 24374, "wall": 16231.8} {"step": 6037, "train_loss": 3.6281442642211914, "lr": 0.0003747468796813931, "tps": 24366, "wall": 16240.0} {"step": 6038, "train_loss": 3.7021846771240234, "lr": 0.00037473709306993656, "tps": 24357, "wall": 16248.4} {"step": 6039, "train_loss": 3.70365309715271, "lr": 0.00037472730470560975, "tps": 24349, "wall": 16256.3} {"step": 6040, "train_loss": 3.698559045791626, "lr": 0.00037471751458852375, "tps": 24341, "wall": 16264.4} {"step": 6041, "train_loss": 3.748187303543091, "lr": 0.00037470772271878933, "tps": 24333, "wall": 16272.3} {"step": 6042, "train_loss": 3.6468467712402344, "lr": 0.00037469792909651745, "tps": 24325, "wall": 16280.5} {"step": 6043, "train_loss": 3.715010166168213, "lr": 0.0003746881337218191, "tps": 24317, "wall": 16288.6} {"step": 6044, "train_loss": 3.6075439453125, "lr": 0.0003746783365948051, "tps": 24309, "wall": 16296.7} {"step": 6045, "train_loss": 3.7450921535491943, "lr": 0.0003746685377155866, "tps": 24301, "wall": 16304.8} {"step": 6046, "train_loss": 3.7110188007354736, "lr": 0.0003746587370842746, "tps": 24293, "wall": 16312.7} {"step": 6047, "train_loss": 3.668334722518921, "lr": 0.00037464893470097997, "tps": 24285, "wall": 16320.9} {"step": 6048, "train_loss": 3.6677193641662598, "lr": 0.0003746391305658139, "tps": 24277, "wall": 16328.9} {"step": 6049, "train_loss": 3.7425122261047363, "lr": 0.0003746293246788873, "tps": 24269, "wall": 16336.9} {"step": 6050, "train_loss": 3.6878767013549805, "lr": 0.00037461951704031147, "tps": 24261, "wall": 16345.0} {"step": 6051, "train_loss": 3.8247506618499756, "lr": 0.0003746097076501973, "tps": 24253, "wall": 16353.0} {"step": 6052, "train_loss": 3.6952619552612305, "lr": 0.00037459989650865603, "tps": 24245, "wall": 16361.0} {"step": 6053, "train_loss": 3.6817429065704346, "lr": 0.00037459008361579875, "tps": 24238, "wall": 16369.1} {"step": 6054, "train_loss": 3.7197225093841553, "lr": 0.00037458026897173666, "tps": 24230, "wall": 16377.2} {"step": 6055, "train_loss": 3.70709228515625, "lr": 0.00037457045257658093, "tps": 24222, "wall": 16385.2} {"step": 6056, "train_loss": 3.7608561515808105, "lr": 0.0003745606344304427, "tps": 24214, "wall": 16393.3} {"step": 6057, "train_loss": 3.5816800594329834, "lr": 0.0003745508145334333, "tps": 24206, "wall": 16401.3} {"step": 6058, "train_loss": 3.669806718826294, "lr": 0.0003745409928856639, "tps": 24198, "wall": 16409.4} {"step": 6059, "train_loss": 3.799984931945801, "lr": 0.00037453116948724574, "tps": 24190, "wall": 16417.4} {"step": 6060, "train_loss": 3.6562113761901855, "lr": 0.0003745213443382902, "tps": 24182, "wall": 16425.5} {"step": 6061, "train_loss": 3.7830405235290527, "lr": 0.00037451151743890846, "tps": 24174, "wall": 16433.6} {"step": 6062, "train_loss": 3.59411358833313, "lr": 0.0003745016887892119, "tps": 24167, "wall": 16441.6} {"step": 6063, "train_loss": 3.7201523780822754, "lr": 0.0003744918583893118, "tps": 24159, "wall": 16449.6} {"step": 6064, "train_loss": 3.7465217113494873, "lr": 0.0003744820262393196, "tps": 24151, "wall": 16457.8} {"step": 6065, "train_loss": 3.6344223022460938, "lr": 0.0003744721923393467, "tps": 24143, "wall": 16465.9} {"step": 6066, "train_loss": 3.7613770961761475, "lr": 0.0003744623566895044, "tps": 24135, "wall": 16473.9} {"step": 6067, "train_loss": 3.742359161376953, "lr": 0.00037445251928990415, "tps": 24127, "wall": 16482.0} {"step": 6068, "train_loss": 3.7812552452087402, "lr": 0.0003744426801406575, "tps": 24119, "wall": 16490.0} {"step": 6069, "train_loss": 3.6706645488739014, "lr": 0.00037443283924187576, "tps": 24112, "wall": 16498.0} {"step": 6070, "train_loss": 3.7640151977539062, "lr": 0.00037442299659367045, "tps": 24104, "wall": 16506.0} {"step": 6071, "train_loss": 3.7881455421447754, "lr": 0.00037441315219615307, "tps": 24096, "wall": 16514.0} {"step": 6072, "train_loss": 3.689671516418457, "lr": 0.0003744033060494352, "tps": 24089, "wall": 16521.9} {"step": 6073, "train_loss": 3.7253544330596924, "lr": 0.00037439345815362825, "tps": 24081, "wall": 16529.9} {"step": 6074, "train_loss": 3.7679331302642822, "lr": 0.0003743836085088439, "tps": 24073, "wall": 16537.9} {"step": 6075, "train_loss": 3.6854147911071777, "lr": 0.0003743737571151936, "tps": 24066, "wall": 16545.9} {"step": 6076, "train_loss": 3.6981160640716553, "lr": 0.00037436390397278915, "tps": 24058, "wall": 16554.0} {"step": 6077, "train_loss": 3.649904251098633, "lr": 0.000374354049081742, "tps": 24050, "wall": 16561.8} {"step": 6078, "train_loss": 3.8490982055664062, "lr": 0.00037434419244216385, "tps": 24043, "wall": 16569.8} {"step": 6079, "train_loss": 3.6883764266967773, "lr": 0.0003743343340541663, "tps": 24035, "wall": 16577.8} {"step": 6080, "train_loss": 3.6664822101593018, "lr": 0.0003743244739178611, "tps": 24027, "wall": 16585.9} {"step": 6081, "train_loss": 3.7415761947631836, "lr": 0.00037431461203335986, "tps": 24020, "wall": 16593.7} {"step": 6082, "train_loss": 3.643444538116455, "lr": 0.0003743047484007744, "tps": 24013, "wall": 16601.5} {"step": 6083, "train_loss": 3.663975715637207, "lr": 0.00037429488302021636, "tps": 24005, "wall": 16609.6} {"step": 6084, "train_loss": 3.757111072540283, "lr": 0.00037428501589179756, "tps": 23997, "wall": 16617.6} {"step": 6085, "train_loss": 3.69924259185791, "lr": 0.00037427514701562974, "tps": 23990, "wall": 16625.5} {"step": 6086, "train_loss": 3.6894748210906982, "lr": 0.0003742652763918248, "tps": 23982, "wall": 16633.5} {"step": 6087, "train_loss": 3.57592511177063, "lr": 0.00037425540402049435, "tps": 23975, "wall": 16641.5} {"step": 6088, "train_loss": 3.774648427963257, "lr": 0.00037424552990175035, "tps": 23967, "wall": 16649.6} {"step": 6089, "train_loss": 3.782683849334717, "lr": 0.00037423565403570466, "tps": 23960, "wall": 16657.5} {"step": 6090, "train_loss": 3.6950278282165527, "lr": 0.0003742257764224691, "tps": 23952, "wall": 16665.4} {"step": 6091, "train_loss": 3.685462713241577, "lr": 0.0003742158970621557, "tps": 23945, "wall": 16673.3} {"step": 6092, "train_loss": 3.8219051361083984, "lr": 0.00037420601595487623, "tps": 23937, "wall": 16681.2} {"step": 6093, "train_loss": 3.687093496322632, "lr": 0.00037419613310074265, "tps": 23930, "wall": 16689.1} {"step": 6094, "train_loss": 3.726156234741211, "lr": 0.00037418624849986694, "tps": 23922, "wall": 16697.0} {"step": 6095, "train_loss": 3.764296531677246, "lr": 0.00037417636215236104, "tps": 23915, "wall": 16705.0} {"step": 6096, "train_loss": 3.7144064903259277, "lr": 0.000374166474058337, "tps": 23907, "wall": 16713.0} {"step": 6097, "train_loss": 3.701169490814209, "lr": 0.0003741565842179068, "tps": 23900, "wall": 16720.9} {"step": 6098, "train_loss": 3.7612810134887695, "lr": 0.00037414669263118245, "tps": 23893, "wall": 16728.8} {"step": 6099, "train_loss": 3.637129783630371, "lr": 0.0003741367992982761, "tps": 23885, "wall": 16736.8} {"step": 6100, "train_loss": 3.693912982940674, "lr": 0.00037412690421929966, "tps": 23878, "wall": 16744.7} {"step": 6101, "train_loss": 3.698726177215576, "lr": 0.0003741170073943653, "tps": 23871, "wall": 16752.5} {"step": 6102, "train_loss": 3.736393451690674, "lr": 0.0003741071088235852, "tps": 23863, "wall": 16760.4} {"step": 6103, "train_loss": 3.7169532775878906, "lr": 0.00037409720850707146, "tps": 23856, "wall": 16768.3} {"step": 6104, "train_loss": 3.675623893737793, "lr": 0.00037408730644493616, "tps": 23848, "wall": 16776.3} {"step": 6105, "train_loss": 3.73854923248291, "lr": 0.0003740774026372915, "tps": 23841, "wall": 16784.3} {"step": 6106, "train_loss": 3.679080009460449, "lr": 0.00037406749708424975, "tps": 23834, "wall": 16792.2} {"step": 6107, "train_loss": 3.585287570953369, "lr": 0.000374057589785923, "tps": 23826, "wall": 16800.1} {"step": 6108, "train_loss": 3.604107618331909, "lr": 0.0003740476807424236, "tps": 23819, "wall": 16807.9} {"step": 6109, "train_loss": 3.733762741088867, "lr": 0.00037403776995386366, "tps": 23812, "wall": 16815.9} {"step": 6110, "train_loss": 3.74164080619812, "lr": 0.00037402785742035556, "tps": 23805, "wall": 16823.8} {"step": 6111, "train_loss": 3.6350979804992676, "lr": 0.00037401794314201157, "tps": 23797, "wall": 16831.7} {"step": 6112, "train_loss": 3.697904586791992, "lr": 0.000374008027118944, "tps": 23790, "wall": 16839.7} {"step": 6113, "train_loss": 3.7361392974853516, "lr": 0.00037399810935126514, "tps": 23782, "wall": 16847.6} {"step": 6114, "train_loss": 3.663752794265747, "lr": 0.00037398818983908733, "tps": 23775, "wall": 16855.5} {"step": 6115, "train_loss": 3.7603447437286377, "lr": 0.00037397826858252305, "tps": 23768, "wall": 16863.4} {"step": 6116, "train_loss": 3.63108491897583, "lr": 0.0003739683455816846, "tps": 23761, "wall": 16871.3} {"step": 6117, "train_loss": 3.6993660926818848, "lr": 0.0003739584208366844, "tps": 23753, "wall": 16879.2} {"step": 6118, "train_loss": 3.8462934494018555, "lr": 0.00037394849434763485, "tps": 23746, "wall": 16887.1} {"step": 6119, "train_loss": 3.6403331756591797, "lr": 0.00037393856611464847, "tps": 23739, "wall": 16895.1} {"step": 6120, "train_loss": 3.7504658699035645, "lr": 0.00037392863613783765, "tps": 23732, "wall": 16903.0} {"step": 6121, "train_loss": 3.71425199508667, "lr": 0.0003739187044173149, "tps": 23725, "wall": 16910.8} {"step": 6122, "train_loss": 3.5744268894195557, "lr": 0.0003739087709531928, "tps": 23717, "wall": 16918.8} {"step": 6123, "train_loss": 3.6794185638427734, "lr": 0.00037389883574558374, "tps": 23710, "wall": 16926.5} {"step": 6124, "train_loss": 3.6920735836029053, "lr": 0.0003738888987946004, "tps": 23703, "wall": 16934.4} {"step": 6125, "train_loss": 3.706827163696289, "lr": 0.00037387896010035524, "tps": 23696, "wall": 16942.2} {"step": 6126, "train_loss": 3.7008237838745117, "lr": 0.0003738690196629609, "tps": 23689, "wall": 16950.1} {"step": 6127, "train_loss": 3.6990151405334473, "lr": 0.00037385907748253004, "tps": 23682, "wall": 16958.1} {"step": 6128, "train_loss": 3.7071614265441895, "lr": 0.00037384913355917516, "tps": 23674, "wall": 16966.1} {"step": 6129, "train_loss": 3.6640236377716064, "lr": 0.00037383918789300904, "tps": 23667, "wall": 16974.0} {"step": 6130, "train_loss": 3.739959478378296, "lr": 0.0003738292404841442, "tps": 23660, "wall": 16981.8} {"step": 6131, "train_loss": 3.7587502002716064, "lr": 0.00037381929133269344, "tps": 23653, "wall": 16989.7} {"step": 6132, "train_loss": 3.707183361053467, "lr": 0.00037380934043876947, "tps": 23646, "wall": 16997.5} {"step": 6133, "train_loss": 3.5961222648620605, "lr": 0.0003737993878024849, "tps": 23639, "wall": 17005.5} {"step": 6134, "train_loss": 3.6706008911132812, "lr": 0.00037378943342395257, "tps": 23632, "wall": 17013.3} {"step": 6135, "train_loss": 3.722693920135498, "lr": 0.0003737794773032852, "tps": 23625, "wall": 17021.2} {"step": 6136, "train_loss": 3.698007822036743, "lr": 0.00037376951944059566, "tps": 23618, "wall": 17029.0} {"step": 6137, "train_loss": 3.823040008544922, "lr": 0.00037375955983599666, "tps": 23611, "wall": 17036.9} {"step": 6138, "train_loss": 3.7908108234405518, "lr": 0.00037374959848960097, "tps": 23604, "wall": 17044.7} {"step": 6139, "train_loss": 3.727555274963379, "lr": 0.00037373963540152165, "tps": 23597, "wall": 17052.5} {"step": 6140, "train_loss": 3.643345355987549, "lr": 0.0003737296705718713, "tps": 23590, "wall": 17060.3} {"step": 6141, "train_loss": 3.6238608360290527, "lr": 0.000373719704000763, "tps": 23583, "wall": 17068.3} {"step": 6142, "train_loss": 3.6949713230133057, "lr": 0.0003737097356883095, "tps": 23576, "wall": 17076.1} {"step": 6143, "train_loss": 3.6521284580230713, "lr": 0.00037369976563462386, "tps": 23568, "wall": 17084.1} {"step": 6144, "train_loss": 3.74466872215271, "lr": 0.0003736897938398189, "tps": 23561, "wall": 17091.9} {"step": 6145, "train_loss": 3.686047077178955, "lr": 0.00037367982030400774, "tps": 23554, "wall": 17099.8} {"step": 6146, "train_loss": 3.737962484359741, "lr": 0.0003736698450273032, "tps": 23548, "wall": 17107.6} {"step": 6147, "train_loss": 3.849553346633911, "lr": 0.0003736598680098183, "tps": 23541, "wall": 17115.5} {"step": 6148, "train_loss": 3.7395951747894287, "lr": 0.00037364988925166616, "tps": 23534, "wall": 17123.3} {"step": 6149, "train_loss": 3.6829330921173096, "lr": 0.00037363990875295976, "tps": 23526, "wall": 17131.3} {"step": 6150, "train_loss": 3.6923675537109375, "lr": 0.0003736299265138122, "tps": 23520, "wall": 17139.1} {"step": 6151, "train_loss": 3.619074821472168, "lr": 0.00037361994253433644, "tps": 23512, "wall": 17147.1} {"step": 6152, "train_loss": 3.74129581451416, "lr": 0.0003736099568146457, "tps": 23505, "wall": 17154.9} {"step": 6153, "train_loss": 3.718740224838257, "lr": 0.000373599969354853, "tps": 23499, "wall": 17162.6} {"step": 6154, "train_loss": 3.780646324157715, "lr": 0.00037358998015507165, "tps": 23492, "wall": 17170.5} {"step": 6155, "train_loss": 3.6803767681121826, "lr": 0.0003735799892154146, "tps": 23485, "wall": 17178.3} {"step": 6156, "train_loss": 3.729592800140381, "lr": 0.00037356999653599514, "tps": 23478, "wall": 17186.2} {"step": 6157, "train_loss": 3.7106337547302246, "lr": 0.0003735600021169265, "tps": 23471, "wall": 17193.9} {"step": 6158, "train_loss": 3.6119208335876465, "lr": 0.00037355000595832183, "tps": 23464, "wall": 17201.6} {"step": 6159, "train_loss": 3.7131948471069336, "lr": 0.00037354000806029435, "tps": 23458, "wall": 17209.5} {"step": 6160, "train_loss": 3.6808459758758545, "lr": 0.0003735300084229574, "tps": 23451, "wall": 17217.4} {"step": 6161, "train_loss": 3.7687811851501465, "lr": 0.00037352000704642417, "tps": 23444, "wall": 17225.3} {"step": 6162, "train_loss": 3.673433303833008, "lr": 0.000373510003930808, "tps": 23437, "wall": 17233.1} {"step": 6163, "train_loss": 3.702920436859131, "lr": 0.0003734999990762222, "tps": 23430, "wall": 17240.9} {"step": 6164, "train_loss": 3.686293840408325, "lr": 0.00037348999248278017, "tps": 23423, "wall": 17248.8} {"step": 6165, "train_loss": 3.7050018310546875, "lr": 0.00037347998415059513, "tps": 23416, "wall": 17256.7} {"step": 6166, "train_loss": 3.729715585708618, "lr": 0.00037346997407978057, "tps": 23409, "wall": 17264.5} {"step": 6167, "train_loss": 3.6339523792266846, "lr": 0.0003734599622704498, "tps": 23403, "wall": 17272.3} {"step": 6168, "train_loss": 3.6666712760925293, "lr": 0.00037344994872271625, "tps": 23396, "wall": 17280.1} {"step": 6169, "train_loss": 3.6391990184783936, "lr": 0.00037343993343669343, "tps": 23389, "wall": 17287.9} {"step": 6170, "train_loss": 3.640474796295166, "lr": 0.0003734299164124947, "tps": 23382, "wall": 17295.7} {"step": 6171, "train_loss": 3.7597756385803223, "lr": 0.00037341989765023366, "tps": 23376, "wall": 17303.5} {"step": 6172, "train_loss": 3.7137534618377686, "lr": 0.0003734098771500237, "tps": 23369, "wall": 17311.3} {"step": 6173, "train_loss": 3.6495237350463867, "lr": 0.0003733998549119783, "tps": 23362, "wall": 17319.1} {"step": 6174, "train_loss": 3.7604260444641113, "lr": 0.00037338983093621107, "tps": 23355, "wall": 17327.0} {"step": 6175, "train_loss": 3.656972646713257, "lr": 0.00037337980522283553, "tps": 23348, "wall": 17334.9} {"step": 6176, "train_loss": 3.7348363399505615, "lr": 0.0003733697777719653, "tps": 23342, "wall": 17342.6} {"step": 6177, "train_loss": 3.7405879497528076, "lr": 0.00037335974858371387, "tps": 23335, "wall": 17350.4} {"step": 6178, "train_loss": 3.665888786315918, "lr": 0.00037334971765819495, "tps": 23328, "wall": 17358.2} {"step": 6179, "train_loss": 3.7277631759643555, "lr": 0.0003733396849955221, "tps": 23322, "wall": 17366.1} {"step": 6180, "train_loss": 3.7079432010650635, "lr": 0.000373329650595809, "tps": 23315, "wall": 17374.0} {"step": 6181, "train_loss": 3.6604957580566406, "lr": 0.00037331961445916936, "tps": 23308, "wall": 17381.7} {"step": 6182, "train_loss": 3.6887216567993164, "lr": 0.00037330957658571683, "tps": 23301, "wall": 17389.6} {"step": 6183, "train_loss": 3.6380774974823, "lr": 0.0003732995369755651, "tps": 23295, "wall": 17397.5} {"step": 6184, "train_loss": 3.721127510070801, "lr": 0.00037328949562882787, "tps": 23288, "wall": 17405.2} {"step": 6185, "train_loss": 3.73319411277771, "lr": 0.0003732794525456191, "tps": 23281, "wall": 17413.0} {"step": 6186, "train_loss": 3.7167866230010986, "lr": 0.00037326940772605227, "tps": 23275, "wall": 17420.7} {"step": 6187, "train_loss": 3.604114294052124, "lr": 0.0003732593611702413, "tps": 23268, "wall": 17428.6} {"step": 6188, "train_loss": 3.691431760787964, "lr": 0.00037324931287830007, "tps": 23261, "wall": 17436.4} {"step": 6189, "train_loss": 3.752437114715576, "lr": 0.0003732392628503422, "tps": 23255, "wall": 17444.3} {"step": 6190, "train_loss": 3.7039506435394287, "lr": 0.00037322921108648183, "tps": 23248, "wall": 17452.0} {"step": 6191, "train_loss": 3.691892147064209, "lr": 0.00037321915758683257, "tps": 23241, "wall": 17459.8} {"step": 6192, "train_loss": 3.737848997116089, "lr": 0.00037320910235150845, "tps": 23235, "wall": 17467.6} {"step": 6193, "train_loss": 3.740574598312378, "lr": 0.00037319904538062336, "tps": 23228, "wall": 17475.4} {"step": 6194, "train_loss": 3.7253570556640625, "lr": 0.0003731889866742911, "tps": 23222, "wall": 17483.2} {"step": 6195, "train_loss": 3.6501200199127197, "lr": 0.00037317892623262575, "tps": 23215, "wall": 17491.1} {"step": 6196, "train_loss": 3.678812026977539, "lr": 0.00037316886405574124, "tps": 23208, "wall": 17498.9} {"step": 6197, "train_loss": 3.761849880218506, "lr": 0.0003731588001437515, "tps": 23201, "wall": 17506.8} {"step": 6198, "train_loss": 3.650730848312378, "lr": 0.00037314873449677065, "tps": 23195, "wall": 17514.6} {"step": 6199, "train_loss": 3.756917953491211, "lr": 0.00037313866711491265, "tps": 23188, "wall": 17522.4} {"step": 6200, "train_loss": 3.6429848670959473, "lr": 0.0003731285979982916, "tps": 23182, "wall": 17530.1} {"step": 6201, "train_loss": 3.7158141136169434, "lr": 0.0003731185271470214, "tps": 23175, "wall": 17538.0} {"step": 6202, "train_loss": 3.7520639896392822, "lr": 0.0003731084545612163, "tps": 23169, "wall": 17545.8} {"step": 6203, "train_loss": 3.7148244380950928, "lr": 0.0003730983802409903, "tps": 23162, "wall": 17553.6} {"step": 6204, "train_loss": 3.6999974250793457, "lr": 0.0003730883041864576, "tps": 23156, "wall": 17561.4} {"step": 6205, "train_loss": 3.697991371154785, "lr": 0.00037307822639773226, "tps": 23149, "wall": 17569.2} {"step": 6206, "train_loss": 3.7003908157348633, "lr": 0.00037306814687492856, "tps": 23142, "wall": 17577.0} {"step": 6207, "train_loss": 3.6776695251464844, "lr": 0.0003730580656181606, "tps": 23136, "wall": 17584.8} {"step": 6208, "train_loss": 3.652022361755371, "lr": 0.00037304798262754253, "tps": 23129, "wall": 17592.5} {"step": 6209, "train_loss": 3.671776294708252, "lr": 0.0003730378979031887, "tps": 23123, "wall": 17600.3} {"step": 6210, "train_loss": 3.679682493209839, "lr": 0.00037302781144521333, "tps": 23116, "wall": 17608.2} {"step": 6211, "train_loss": 3.640392303466797, "lr": 0.00037301772325373057, "tps": 23110, "wall": 17615.9} {"step": 6212, "train_loss": 3.71091365814209, "lr": 0.0003730076333288547, "tps": 23103, "wall": 17623.7} {"step": 6213, "train_loss": 3.748579740524292, "lr": 0.0003729975416707002, "tps": 23097, "wall": 17631.4} {"step": 6214, "train_loss": 3.6512861251831055, "lr": 0.00037298744827938114, "tps": 23090, "wall": 17639.3} {"step": 6215, "train_loss": 3.6785707473754883, "lr": 0.0003729773531550121, "tps": 23084, "wall": 17647.0} {"step": 6216, "train_loss": 3.7393250465393066, "lr": 0.00037296725629770727, "tps": 23077, "wall": 17654.8} {"step": 6217, "train_loss": 3.6697349548339844, "lr": 0.0003729571577075811, "tps": 23071, "wall": 17662.6} {"step": 6218, "train_loss": 3.7081360816955566, "lr": 0.000372947057384748, "tps": 23065, "wall": 17670.3} {"step": 6219, "train_loss": 3.632183074951172, "lr": 0.0003729369553293223, "tps": 23058, "wall": 17678.1} {"step": 6220, "train_loss": 3.658459186553955, "lr": 0.00037292685154141853, "tps": 23052, "wall": 17685.9} {"step": 6221, "train_loss": 3.767827033996582, "lr": 0.0003729167460211511, "tps": 23045, "wall": 17693.6} {"step": 6222, "train_loss": 3.6313514709472656, "lr": 0.00037290663876863455, "tps": 23039, "wall": 17701.4} {"step": 6223, "train_loss": 3.5090346336364746, "lr": 0.0003728965297839833, "tps": 23033, "wall": 17709.1} {"step": 6224, "train_loss": 3.6284425258636475, "lr": 0.00037288641906731184, "tps": 23026, "wall": 17716.9} {"step": 6225, "train_loss": 3.6553168296813965, "lr": 0.0003728763066187348, "tps": 23020, "wall": 17724.6} {"step": 6226, "train_loss": 3.738194465637207, "lr": 0.0003728661924383667, "tps": 23013, "wall": 17732.4} {"step": 6227, "train_loss": 3.630974054336548, "lr": 0.00037285607652632203, "tps": 23007, "wall": 17740.1} {"step": 6228, "train_loss": 3.846118927001953, "lr": 0.00037284595888271554, "tps": 23001, "wall": 17748.0} {"step": 6229, "train_loss": 3.6489691734313965, "lr": 0.0003728358395076617, "tps": 22994, "wall": 17755.8} {"step": 6230, "train_loss": 3.6536989212036133, "lr": 0.0003728257184012753, "tps": 22988, "wall": 17763.5} {"step": 6231, "train_loss": 3.635493755340576, "lr": 0.00037281559556367073, "tps": 22982, "wall": 17771.1} {"step": 6232, "train_loss": 3.5922775268554688, "lr": 0.00037280547099496295, "tps": 22975, "wall": 17778.9} {"step": 6233, "train_loss": 3.5446012020111084, "lr": 0.0003727953446952665, "tps": 22969, "wall": 17786.7} {"step": 6234, "train_loss": 3.7380988597869873, "lr": 0.0003727852166646961, "tps": 22963, "wall": 17794.5} {"step": 6235, "train_loss": 3.7265467643737793, "lr": 0.0003727750869033665, "tps": 22956, "wall": 17802.3} {"step": 6236, "train_loss": 3.6518588066101074, "lr": 0.00037276495541139245, "tps": 22950, "wall": 17810.0} {"step": 6237, "train_loss": 3.7747249603271484, "lr": 0.0003727548221888888, "tps": 22944, "wall": 17817.9} {"step": 6238, "train_loss": 3.7520108222961426, "lr": 0.00037274468723597017, "tps": 22937, "wall": 17825.6} {"step": 6239, "train_loss": 3.7445483207702637, "lr": 0.00037273455055275155, "tps": 22931, "wall": 17833.4} {"step": 6240, "train_loss": 3.764915704727173, "lr": 0.00037272441213934756, "tps": 22925, "wall": 17841.2} {"step": 6241, "train_loss": 3.6802122592926025, "lr": 0.0003727142719958732, "tps": 22918, "wall": 17848.9} {"step": 6242, "train_loss": 3.70963978767395, "lr": 0.0003727041301224433, "tps": 22912, "wall": 17856.7} {"step": 6243, "train_loss": 3.766648769378662, "lr": 0.0003726939865191728, "tps": 22906, "wall": 17864.5} {"step": 6244, "train_loss": 3.728788137435913, "lr": 0.0003726838411861766, "tps": 22899, "wall": 17872.3} {"step": 6245, "train_loss": 3.6426780223846436, "lr": 0.00037267369412356946, "tps": 22893, "wall": 17880.0} {"step": 6246, "train_loss": 3.6753368377685547, "lr": 0.0003726635453314665, "tps": 22887, "wall": 17887.6} {"step": 6247, "train_loss": 3.7348363399505615, "lr": 0.0003726533948099827, "tps": 22881, "wall": 17895.3} {"step": 6248, "train_loss": 3.6539783477783203, "lr": 0.00037264324255923293, "tps": 22875, "wall": 17903.1} {"step": 6249, "train_loss": 3.718778133392334, "lr": 0.00037263308857933227, "tps": 22868, "wall": 17910.8} {"step": 6250, "train_loss": 3.633805274963379, "lr": 0.00037262293287039576, "tps": 22862, "wall": 17918.6} {"step": 6251, "train_loss": 3.724261999130249, "lr": 0.00037261277543253836, "tps": 22856, "wall": 17926.3} {"step": 6252, "train_loss": 3.5269384384155273, "lr": 0.0003726026162658752, "tps": 22850, "wall": 17934.2} {"step": 6253, "train_loss": 3.641785144805908, "lr": 0.00037259245537052133, "tps": 22843, "wall": 17941.8} {"step": 6254, "train_loss": 3.774770736694336, "lr": 0.0003725822927465918, "tps": 22837, "wall": 17949.6} {"step": 6255, "train_loss": 3.7635085582733154, "lr": 0.00037257212839420195, "tps": 22831, "wall": 17957.4} {"step": 6256, "train_loss": 3.7258214950561523, "lr": 0.0003725619623134667, "tps": 22825, "wall": 17965.1} {"step": 6257, "train_loss": 3.5899033546447754, "lr": 0.0003725517945045013, "tps": 22819, "wall": 17972.9} {"step": 6258, "train_loss": 3.752384662628174, "lr": 0.0003725416249674209, "tps": 22813, "wall": 17980.5} {"step": 6259, "train_loss": 3.6965560913085938, "lr": 0.0003725314537023407, "tps": 22806, "wall": 17988.4} {"step": 6260, "train_loss": 3.559757709503174, "lr": 0.00037252128070937605, "tps": 22800, "wall": 17996.1} {"step": 6261, "train_loss": 3.652143716812134, "lr": 0.00037251110598864203, "tps": 22794, "wall": 18003.8} {"step": 6262, "train_loss": 3.6923112869262695, "lr": 0.0003725009295402539, "tps": 22788, "wall": 18011.4} {"step": 6263, "train_loss": 3.6924400329589844, "lr": 0.00037249075136432705, "tps": 22782, "wall": 18019.2} {"step": 6264, "train_loss": 3.7905027866363525, "lr": 0.00037248057146097664, "tps": 22776, "wall": 18027.0} {"step": 6265, "train_loss": 3.6884076595306396, "lr": 0.0003724703898303181, "tps": 22769, "wall": 18034.8} {"step": 6266, "train_loss": 3.6481165885925293, "lr": 0.0003724602064724668, "tps": 22763, "wall": 18042.7} {"step": 6267, "train_loss": 3.683448076248169, "lr": 0.000372450021387538, "tps": 22757, "wall": 18050.4} {"step": 6268, "train_loss": 3.735907554626465, "lr": 0.00037243983457564705, "tps": 22751, "wall": 18058.2} {"step": 6269, "train_loss": 3.6793723106384277, "lr": 0.00037242964603690943, "tps": 22745, "wall": 18066.0} {"step": 6270, "train_loss": 3.7804503440856934, "lr": 0.0003724194557714406, "tps": 22738, "wall": 18073.8} {"step": 6271, "train_loss": 3.74882435798645, "lr": 0.00037240926377935587, "tps": 22732, "wall": 18081.6} {"step": 6272, "train_loss": 3.649352550506592, "lr": 0.00037239907006077075, "tps": 22726, "wall": 18089.3} {"step": 6273, "train_loss": 3.7123336791992188, "lr": 0.00037238887461580076, "tps": 22720, "wall": 18097.4} {"step": 6274, "train_loss": 3.716052532196045, "lr": 0.0003723786774445613, "tps": 22713, "wall": 18105.2} {"step": 6275, "train_loss": 3.6183037757873535, "lr": 0.000372368478547168, "tps": 22707, "wall": 18113.0} {"step": 6276, "train_loss": 3.600421190261841, "lr": 0.0003723582779237363, "tps": 22701, "wall": 18120.7} {"step": 6277, "train_loss": 3.725212812423706, "lr": 0.00037234807557438176, "tps": 22695, "wall": 18128.4} {"step": 6278, "train_loss": 3.6055102348327637, "lr": 0.00037233787149922, "tps": 22689, "wall": 18136.2} {"step": 6279, "train_loss": 3.730358123779297, "lr": 0.0003723276656983666, "tps": 22683, "wall": 18144.1} {"step": 6280, "train_loss": 3.6731014251708984, "lr": 0.0003723174581719372, "tps": 22677, "wall": 18151.8} {"step": 6281, "train_loss": 3.6114554405212402, "lr": 0.00037230724892004733, "tps": 22670, "wall": 18159.7} {"step": 6282, "train_loss": 3.6999926567077637, "lr": 0.0003722970379428127, "tps": 22664, "wall": 18167.5} {"step": 6283, "train_loss": 3.6825127601623535, "lr": 0.00037228682524034903, "tps": 22658, "wall": 18175.4} {"step": 6284, "train_loss": 3.6555283069610596, "lr": 0.000372276610812772, "tps": 22652, "wall": 18183.1} {"step": 6285, "train_loss": 3.759352207183838, "lr": 0.0003722663946601972, "tps": 22646, "wall": 18190.9} {"step": 6286, "train_loss": 3.6881275177001953, "lr": 0.0003722561767827405, "tps": 22640, "wall": 18198.7} {"step": 6287, "train_loss": 3.6606833934783936, "lr": 0.0003722459571805175, "tps": 22634, "wall": 18206.6} {"step": 6288, "train_loss": 3.74106502532959, "lr": 0.0003722357358536442, "tps": 22627, "wall": 18214.4} {"step": 6289, "train_loss": 3.6292853355407715, "lr": 0.0003722255128022361, "tps": 22621, "wall": 18222.4} {"step": 6290, "train_loss": 3.5726680755615234, "lr": 0.00037221528802640927, "tps": 22615, "wall": 18230.1} {"step": 6291, "train_loss": 3.609713077545166, "lr": 0.00037220506152627937, "tps": 22609, "wall": 18237.9} {"step": 6292, "train_loss": 3.7225327491760254, "lr": 0.0003721948333019623, "tps": 22603, "wall": 18245.8} {"step": 6293, "train_loss": 3.649380683898926, "lr": 0.00037218460335357393, "tps": 22597, "wall": 18253.6} {"step": 6294, "train_loss": 3.697911024093628, "lr": 0.0003721743716812302, "tps": 22591, "wall": 18261.4} {"step": 6295, "train_loss": 3.7176451683044434, "lr": 0.0003721641382850469, "tps": 22585, "wall": 18269.4} {"step": 6296, "train_loss": 3.646639347076416, "lr": 0.00037215390316514, "tps": 22578, "wall": 18277.2} {"step": 6297, "train_loss": 3.7078709602355957, "lr": 0.0003721436663216255, "tps": 22572, "wall": 18285.2} {"step": 6298, "train_loss": 3.7203369140625, "lr": 0.00037213342775461924, "tps": 22566, "wall": 18293.0} {"step": 6299, "train_loss": 3.7149453163146973, "lr": 0.00037212318746423736, "tps": 22560, "wall": 18300.8} {"step": 6300, "train_loss": 3.709035873413086, "lr": 0.00037211294545059576, "tps": 22554, "wall": 18308.6} {"step": 6301, "train_loss": 3.647005081176758, "lr": 0.00037210270171381045, "tps": 22548, "wall": 18316.4} {"step": 6302, "train_loss": 3.6075496673583984, "lr": 0.00037209245625399756, "tps": 22542, "wall": 18324.4} {"step": 6303, "train_loss": 3.6836585998535156, "lr": 0.000372082209071273, "tps": 22536, "wall": 18332.2} {"step": 6304, "train_loss": 3.628068447113037, "lr": 0.000372071960165753, "tps": 22529, "wall": 18340.2} {"step": 6305, "train_loss": 3.7391979694366455, "lr": 0.0003720617095375537, "tps": 22522, "wall": 18349.2} {"step": 6306, "train_loss": 3.710756778717041, "lr": 0.000372051457186791, "tps": 22515, "wall": 18357.8} {"step": 6307, "train_loss": 3.687621593475342, "lr": 0.0003720412031135812, "tps": 22509, "wall": 18365.7} {"step": 6308, "train_loss": 3.6467933654785156, "lr": 0.00037203094731804045, "tps": 22503, "wall": 18373.6} {"step": 6309, "train_loss": 3.784541606903076, "lr": 0.0003720206898002849, "tps": 22497, "wall": 18381.4} {"step": 6310, "train_loss": 3.6568799018859863, "lr": 0.00037201043056043077, "tps": 22491, "wall": 18389.4} {"step": 6311, "train_loss": 3.659208297729492, "lr": 0.0003720001695985942, "tps": 22484, "wall": 18397.4} {"step": 6312, "train_loss": 3.6437931060791016, "lr": 0.0003719899069148915, "tps": 22478, "wall": 18405.5} {"step": 6313, "train_loss": 3.6707324981689453, "lr": 0.000371979642509439, "tps": 22472, "wall": 18413.4} {"step": 6314, "train_loss": 3.693836212158203, "lr": 0.0003719693763823528, "tps": 22466, "wall": 18421.3} {"step": 6315, "train_loss": 3.7393126487731934, "lr": 0.0003719591085337493, "tps": 22460, "wall": 18429.2} {"step": 6316, "train_loss": 3.746164560317993, "lr": 0.0003719488389637448, "tps": 22454, "wall": 18437.0} {"step": 6317, "train_loss": 3.64973783493042, "lr": 0.00037193856767245563, "tps": 22448, "wall": 18445.0} {"step": 6318, "train_loss": 3.7439041137695312, "lr": 0.00037192829465999816, "tps": 22442, "wall": 18452.9} {"step": 6319, "train_loss": 3.734525680541992, "lr": 0.00037191801992648873, "tps": 22436, "wall": 18460.8} {"step": 6320, "train_loss": 3.5969557762145996, "lr": 0.0003719077434720438, "tps": 22429, "wall": 18468.9} {"step": 6321, "train_loss": 3.6666994094848633, "lr": 0.00037189746529677967, "tps": 22423, "wall": 18476.8} {"step": 6322, "train_loss": 3.739610195159912, "lr": 0.00037188718540081286, "tps": 22417, "wall": 18484.7} {"step": 6323, "train_loss": 3.669550895690918, "lr": 0.0003718769037842598, "tps": 22411, "wall": 18492.6} {"step": 6324, "train_loss": 3.727912425994873, "lr": 0.000371866620447237, "tps": 22405, "wall": 18500.5} {"step": 6325, "train_loss": 3.675119638442993, "lr": 0.0003718563353898608, "tps": 22399, "wall": 18508.5} {"step": 6326, "train_loss": 3.7305424213409424, "lr": 0.00037184604861224786, "tps": 22393, "wall": 18516.5} {"step": 6327, "train_loss": 3.6194820404052734, "lr": 0.0003718357601145148, "tps": 22387, "wall": 18524.6} {"step": 6328, "train_loss": 3.701814651489258, "lr": 0.0003718254698967779, "tps": 22381, "wall": 18532.5} {"step": 6329, "train_loss": 3.7498648166656494, "lr": 0.0003718151779591538, "tps": 22374, "wall": 18540.6} {"step": 6330, "train_loss": 3.6544289588928223, "lr": 0.0003718048843017593, "tps": 22368, "wall": 18548.5} {"step": 6331, "train_loss": 3.6497554779052734, "lr": 0.0003717945889247108, "tps": 22362, "wall": 18556.5} {"step": 6332, "train_loss": 3.694885730743408, "lr": 0.00037178429182812493, "tps": 22356, "wall": 18564.5} {"step": 6333, "train_loss": 3.66559100151062, "lr": 0.00037177399301211844, "tps": 22350, "wall": 18572.4} {"step": 6334, "train_loss": 3.6404433250427246, "lr": 0.000371763692476808, "tps": 22344, "wall": 18580.5} {"step": 6335, "train_loss": 3.603884220123291, "lr": 0.0003717533902223102, "tps": 22338, "wall": 18588.6} {"step": 6336, "train_loss": 3.6543843746185303, "lr": 0.00037174308624874177, "tps": 22332, "wall": 18596.6} {"step": 6337, "train_loss": 3.6879286766052246, "lr": 0.00037173278055621943, "tps": 22326, "wall": 18604.6} {"step": 6338, "train_loss": 3.670260190963745, "lr": 0.00037172247314486, "tps": 22320, "wall": 18612.6} {"step": 6339, "train_loss": 3.737076759338379, "lr": 0.0003717121640147801, "tps": 22313, "wall": 18620.6} {"step": 6340, "train_loss": 3.7189135551452637, "lr": 0.0003717018531660967, "tps": 22307, "wall": 18628.7} {"step": 6341, "train_loss": 3.5861616134643555, "lr": 0.0003716915405989264, "tps": 22301, "wall": 18636.7} {"step": 6342, "train_loss": 3.6503775119781494, "lr": 0.0003716812263133862, "tps": 22295, "wall": 18644.9} {"step": 6343, "train_loss": 3.6633455753326416, "lr": 0.0003716709103095929, "tps": 22289, "wall": 18653.0} {"step": 6344, "train_loss": 3.756260395050049, "lr": 0.00037166059258766324, "tps": 22283, "wall": 18661.1} {"step": 6345, "train_loss": 3.746331214904785, "lr": 0.0003716502731477142, "tps": 22277, "wall": 18669.1} {"step": 6346, "train_loss": 3.7174148559570312, "lr": 0.0003716399519898626, "tps": 22270, "wall": 18677.2} {"step": 6347, "train_loss": 3.6036152839660645, "lr": 0.0003716296291142255, "tps": 22264, "wall": 18685.2} {"step": 6348, "train_loss": 3.7055420875549316, "lr": 0.00037161930452091977, "tps": 22258, "wall": 18693.3} {"step": 6349, "train_loss": 3.6986212730407715, "lr": 0.0003716089782100623, "tps": 22252, "wall": 18701.3} {"step": 6350, "train_loss": 3.693042039871216, "lr": 0.00037159865018177013, "tps": 22246, "wall": 18709.5} {"step": 6351, "train_loss": 3.6397218704223633, "lr": 0.0003715883204361603, "tps": 22240, "wall": 18717.6} {"step": 6352, "train_loss": 3.704437732696533, "lr": 0.00037157798897334977, "tps": 22234, "wall": 18725.5} {"step": 6353, "train_loss": 3.605922222137451, "lr": 0.0003715676557934555, "tps": 22228, "wall": 18733.6} {"step": 6354, "train_loss": 3.690107583999634, "lr": 0.00037155732089659473, "tps": 22222, "wall": 18741.7} {"step": 6355, "train_loss": 3.6995389461517334, "lr": 0.0003715469842828844, "tps": 22216, "wall": 18749.7} {"step": 6356, "train_loss": 3.6941003799438477, "lr": 0.00037153664595244155, "tps": 22210, "wall": 18757.7} {"step": 6357, "train_loss": 3.595676898956299, "lr": 0.00037152630590538344, "tps": 22203, "wall": 18766.0} {"step": 6358, "train_loss": 3.6974728107452393, "lr": 0.0003715159641418272, "tps": 22197, "wall": 18774.1} {"step": 6359, "train_loss": 3.608112335205078, "lr": 0.0003715056206618899, "tps": 22191, "wall": 18782.1} {"step": 6360, "train_loss": 3.811981678009033, "lr": 0.0003714952754656887, "tps": 22185, "wall": 18790.1} {"step": 6361, "train_loss": 3.576638698577881, "lr": 0.0003714849285533407, "tps": 22179, "wall": 18798.3} {"step": 6362, "train_loss": 3.631775140762329, "lr": 0.0003714745799249634, "tps": 22173, "wall": 18806.4} {"step": 6363, "train_loss": 3.6072585582733154, "lr": 0.0003714642295806738, "tps": 22167, "wall": 18814.5} {"step": 6364, "train_loss": 3.702159881591797, "lr": 0.0003714538775205893, "tps": 22161, "wall": 18822.7} {"step": 6365, "train_loss": 3.6794464588165283, "lr": 0.00037144352374482697, "tps": 22155, "wall": 18830.7} {"step": 6366, "train_loss": 3.6596922874450684, "lr": 0.00037143316825350423, "tps": 22149, "wall": 18838.9} {"step": 6367, "train_loss": 3.7799572944641113, "lr": 0.0003714228110467384, "tps": 22143, "wall": 18846.9} {"step": 6368, "train_loss": 3.69572114944458, "lr": 0.0003714124521246468, "tps": 22137, "wall": 18855.0} {"step": 6369, "train_loss": 3.6071882247924805, "lr": 0.00037140209148734673, "tps": 22131, "wall": 18863.3} {"step": 6370, "train_loss": 3.614717721939087, "lr": 0.00037139172913495553, "tps": 22125, "wall": 18871.4} {"step": 6371, "train_loss": 3.7575223445892334, "lr": 0.0003713813650675907, "tps": 22118, "wall": 18879.5} {"step": 6372, "train_loss": 3.735867977142334, "lr": 0.00037137099928536945, "tps": 22112, "wall": 18887.8} {"step": 6373, "train_loss": 3.7925541400909424, "lr": 0.0003713606317884095, "tps": 22106, "wall": 18895.8} {"step": 6374, "train_loss": 3.609785795211792, "lr": 0.000371350262576828, "tps": 22100, "wall": 18903.9} {"step": 6375, "train_loss": 3.7266297340393066, "lr": 0.00037133989165074265, "tps": 22094, "wall": 18912.0} {"step": 6376, "train_loss": 3.588202714920044, "lr": 0.00037132951901027074, "tps": 22089, "wall": 18919.9} {"step": 6377, "train_loss": 3.719773530960083, "lr": 0.00037131914465552985, "tps": 22082, "wall": 18928.1} {"step": 6378, "train_loss": 3.697033405303955, "lr": 0.0003713087685866375, "tps": 22076, "wall": 18936.3} {"step": 6379, "train_loss": 3.631443977355957, "lr": 0.00037129839080371127, "tps": 22070, "wall": 18944.5} {"step": 6380, "train_loss": 3.7094943523406982, "lr": 0.0003712880113068687, "tps": 22064, "wall": 18952.7} {"step": 6381, "train_loss": 3.752362012863159, "lr": 0.0003712776300962273, "tps": 22058, "wall": 18960.7} {"step": 6382, "train_loss": 3.7671961784362793, "lr": 0.00037126724717190474, "tps": 22052, "wall": 18968.9} {"step": 6383, "train_loss": 3.7012863159179688, "lr": 0.00037125686253401864, "tps": 22046, "wall": 18977.0} {"step": 6384, "train_loss": 3.732819080352783, "lr": 0.0003712464761826866, "tps": 22040, "wall": 18985.0} {"step": 6385, "train_loss": 3.7502665519714355, "lr": 0.0003712360881180263, "tps": 22034, "wall": 18993.3} {"step": 6386, "train_loss": 3.73518967628479, "lr": 0.0003712256983401554, "tps": 22028, "wall": 19001.3} {"step": 6387, "train_loss": 3.647979736328125, "lr": 0.00037121530684919155, "tps": 22022, "wall": 19009.6} {"step": 6388, "train_loss": 3.684236526489258, "lr": 0.0003712049136452527, "tps": 22016, "wall": 19017.8} {"step": 6389, "train_loss": 3.641327381134033, "lr": 0.0003711945187284563, "tps": 22010, "wall": 19025.9} {"step": 6390, "train_loss": 3.707556962966919, "lr": 0.00037118412209892016, "tps": 22004, "wall": 19034.0} {"step": 6391, "train_loss": 3.74428391456604, "lr": 0.0003711737237567622, "tps": 21998, "wall": 19042.2} {"step": 6392, "train_loss": 3.8348259925842285, "lr": 0.00037116332370210005, "tps": 21992, "wall": 19050.4} {"step": 6393, "train_loss": 3.6846258640289307, "lr": 0.0003711529219350516, "tps": 21986, "wall": 19058.6} {"step": 6394, "train_loss": 3.5916833877563477, "lr": 0.00037114251845573465, "tps": 21980, "wall": 19066.8} {"step": 6395, "train_loss": 3.768960952758789, "lr": 0.00037113211326426714, "tps": 21974, "wall": 19075.0} {"step": 6396, "train_loss": 3.6386892795562744, "lr": 0.0003711217063607669, "tps": 21968, "wall": 19083.1} {"step": 6397, "train_loss": 3.681279420852661, "lr": 0.0003711112977453517, "tps": 21962, "wall": 19091.2} {"step": 6398, "train_loss": 3.642597198486328, "lr": 0.0003711008874181396, "tps": 21957, "wall": 19099.4} {"step": 6399, "train_loss": 3.562556266784668, "lr": 0.00037109047537924847, "tps": 21951, "wall": 19107.5} {"step": 6400, "train_loss": 3.614596366882324, "lr": 0.00037108006162879623, "tps": 21945, "wall": 19115.7} {"step": 6401, "train_loss": 3.7881712913513184, "lr": 0.00037106964616690093, "tps": 21938, "wall": 19124.0} {"step": 6402, "train_loss": 3.711599826812744, "lr": 0.0003710592289936805, "tps": 21933, "wall": 19132.2} {"step": 6403, "train_loss": 3.7013046741485596, "lr": 0.0003710488101092529, "tps": 21927, "wall": 19140.3} {"step": 6404, "train_loss": 3.662174701690674, "lr": 0.0003710383895137363, "tps": 21921, "wall": 19148.5} {"step": 6405, "train_loss": 3.788205862045288, "lr": 0.00037102796720724855, "tps": 21915, "wall": 19156.8} {"step": 6406, "train_loss": 3.6123785972595215, "lr": 0.00037101754318990784, "tps": 21909, "wall": 19164.9} {"step": 6407, "train_loss": 3.706721305847168, "lr": 0.0003710071174618323, "tps": 21903, "wall": 19173.1} {"step": 6408, "train_loss": 3.7369892597198486, "lr": 0.0003709966900231399, "tps": 21897, "wall": 19181.1} {"step": 6409, "train_loss": 3.7123522758483887, "lr": 0.0003709862608739488, "tps": 21891, "wall": 19189.3} {"step": 6410, "train_loss": 3.6632437705993652, "lr": 0.00037097583001437717, "tps": 21885, "wall": 19197.4} {"step": 6411, "train_loss": 3.68867564201355, "lr": 0.0003709653974445432, "tps": 21880, "wall": 19205.5} {"step": 6412, "train_loss": 3.563560962677002, "lr": 0.0003709549631645651, "tps": 21874, "wall": 19213.6} {"step": 6413, "train_loss": 3.547886371612549, "lr": 0.00037094452717456095, "tps": 21868, "wall": 19221.7} {"step": 6414, "train_loss": 3.646171808242798, "lr": 0.00037093408947464905, "tps": 21862, "wall": 19229.9} {"step": 6415, "train_loss": 3.8025169372558594, "lr": 0.00037092365006494756, "tps": 21856, "wall": 19237.9} {"step": 6416, "train_loss": 3.7316629886627197, "lr": 0.0003709132089455749, "tps": 21850, "wall": 19246.2} {"step": 6417, "train_loss": 3.6893503665924072, "lr": 0.0003709027661166491, "tps": 21844, "wall": 19254.4} {"step": 6418, "train_loss": 3.707263946533203, "lr": 0.0003708923215782888, "tps": 21839, "wall": 19262.5} {"step": 6419, "train_loss": 3.586909770965576, "lr": 0.00037088187533061196, "tps": 21833, "wall": 19270.5} {"step": 6420, "train_loss": 3.625033378601074, "lr": 0.00037087142737373714, "tps": 21827, "wall": 19278.6} {"step": 6421, "train_loss": 3.650496482849121, "lr": 0.0003708609777077826, "tps": 21821, "wall": 19286.8} {"step": 6422, "train_loss": 3.7594618797302246, "lr": 0.00037085052633286676, "tps": 21816, "wall": 19294.8} {"step": 6423, "train_loss": 3.837307929992676, "lr": 0.000370840073249108, "tps": 21810, "wall": 19303.0} {"step": 6424, "train_loss": 3.7357020378112793, "lr": 0.0003708296184566247, "tps": 21804, "wall": 19311.0} {"step": 6425, "train_loss": 3.655097484588623, "lr": 0.00037081916195553534, "tps": 21798, "wall": 19319.2} {"step": 6426, "train_loss": 3.64803409576416, "lr": 0.00037080870374595835, "tps": 21793, "wall": 19327.3} {"step": 6427, "train_loss": 3.768967866897583, "lr": 0.00037079824382801223, "tps": 21787, "wall": 19335.4} {"step": 6428, "train_loss": 3.7150216102600098, "lr": 0.0003707877822018154, "tps": 21781, "wall": 19343.5} {"step": 6429, "train_loss": 3.664517879486084, "lr": 0.0003707773188674865, "tps": 21775, "wall": 19351.5} {"step": 6430, "train_loss": 3.613910675048828, "lr": 0.0003707668538251439, "tps": 21770, "wall": 19359.6} {"step": 6431, "train_loss": 3.692880153656006, "lr": 0.0003707563870749062, "tps": 21764, "wall": 19367.8} {"step": 6432, "train_loss": 3.656327486038208, "lr": 0.0003707459186168921, "tps": 21758, "wall": 19375.9} {"step": 6433, "train_loss": 3.714230537414551, "lr": 0.00037073544845121997, "tps": 21752, "wall": 19384.0} {"step": 6434, "train_loss": 3.6623482704162598, "lr": 0.00037072497657800863, "tps": 21747, "wall": 19391.9} {"step": 6435, "train_loss": 3.7255301475524902, "lr": 0.00037071450299737646, "tps": 21741, "wall": 19400.1} {"step": 6436, "train_loss": 3.57096004486084, "lr": 0.00037070402770944235, "tps": 21735, "wall": 19408.2} {"step": 6437, "train_loss": 3.7001943588256836, "lr": 0.00037069355071432485, "tps": 21730, "wall": 19416.2} {"step": 6438, "train_loss": 3.744572877883911, "lr": 0.00037068307201214263, "tps": 21724, "wall": 19424.4} {"step": 6439, "train_loss": 3.712158679962158, "lr": 0.00037067259160301447, "tps": 21719, "wall": 19432.4} {"step": 6440, "train_loss": 3.619626998901367, "lr": 0.00037066210948705897, "tps": 21713, "wall": 19440.4} {"step": 6441, "train_loss": 3.720846176147461, "lr": 0.00037065162566439497, "tps": 21707, "wall": 19448.5} {"step": 6442, "train_loss": 3.656475782394409, "lr": 0.0003706411401351412, "tps": 21702, "wall": 19456.5} {"step": 6443, "train_loss": 3.6967334747314453, "lr": 0.0003706306528994165, "tps": 21696, "wall": 19464.6} {"step": 6444, "train_loss": 3.753683567047119, "lr": 0.00037062016395733957, "tps": 21691, "wall": 19472.5} {"step": 6445, "train_loss": 3.6062185764312744, "lr": 0.00037060967330902923, "tps": 21685, "wall": 19480.7} {"step": 6446, "train_loss": 3.7164852619171143, "lr": 0.00037059918095460443, "tps": 21679, "wall": 19488.6} {"step": 6447, "train_loss": 3.712299346923828, "lr": 0.00037058868689418393, "tps": 21674, "wall": 19496.9} {"step": 6448, "train_loss": 3.713407039642334, "lr": 0.0003705781911278866, "tps": 21668, "wall": 19504.8} {"step": 6449, "train_loss": 3.768888473510742, "lr": 0.0003705676936558315, "tps": 21663, "wall": 19512.8} {"step": 6450, "train_loss": 3.5871329307556152, "lr": 0.0003705571944781373, "tps": 21657, "wall": 19520.9} {"step": 6451, "train_loss": 3.696796417236328, "lr": 0.0003705466935949231, "tps": 21651, "wall": 19529.0} {"step": 6452, "train_loss": 3.63441801071167, "lr": 0.0003705361910063078, "tps": 21646, "wall": 19537.0} {"step": 6453, "train_loss": 3.665618419647217, "lr": 0.0003705256867124104, "tps": 21640, "wall": 19545.1} {"step": 6454, "train_loss": 3.72184419631958, "lr": 0.00037051518071334986, "tps": 21635, "wall": 19553.2} {"step": 6455, "train_loss": 3.6369926929473877, "lr": 0.00037050467300924525, "tps": 21629, "wall": 19561.1} {"step": 6456, "train_loss": 3.6728878021240234, "lr": 0.00037049416360021554, "tps": 21624, "wall": 19569.1} {"step": 6457, "train_loss": 3.6448049545288086, "lr": 0.00037048365248637977, "tps": 21618, "wall": 19577.1} {"step": 6458, "train_loss": 3.7583327293395996, "lr": 0.0003704731396678571, "tps": 21613, "wall": 19585.1} {"step": 6459, "train_loss": 3.763641119003296, "lr": 0.00037046262514476647, "tps": 21607, "wall": 19593.1} {"step": 6460, "train_loss": 3.625126838684082, "lr": 0.0003704521089172272, "tps": 21602, "wall": 19601.1} {"step": 6461, "train_loss": 3.669189453125, "lr": 0.00037044159098535825, "tps": 21596, "wall": 19609.1} {"step": 6462, "train_loss": 3.6619131565093994, "lr": 0.0003704310713492788, "tps": 21591, "wall": 19617.3} {"step": 6463, "train_loss": 3.6029319763183594, "lr": 0.000370420550009108, "tps": 21585, "wall": 19625.2} {"step": 6464, "train_loss": 3.7425005435943604, "lr": 0.00037041002696496514, "tps": 21580, "wall": 19633.2} {"step": 6465, "train_loss": 3.7394826412200928, "lr": 0.0003703995022169694, "tps": 21574, "wall": 19641.2} {"step": 6466, "train_loss": 3.6632606983184814, "lr": 0.00037038897576523985, "tps": 21569, "wall": 19649.2} {"step": 6467, "train_loss": 3.653104066848755, "lr": 0.0003703784476098959, "tps": 21563, "wall": 19657.2} {"step": 6468, "train_loss": 3.6961984634399414, "lr": 0.0003703679177510568, "tps": 21558, "wall": 19665.2} {"step": 6469, "train_loss": 3.7497339248657227, "lr": 0.00037035738618884173, "tps": 21553, "wall": 19673.2} {"step": 6470, "train_loss": 3.7730937004089355, "lr": 0.0003703468529233701, "tps": 21547, "wall": 19681.2} {"step": 6471, "train_loss": 3.7573208808898926, "lr": 0.0003703363179547611, "tps": 21542, "wall": 19689.1} {"step": 6472, "train_loss": 3.808112621307373, "lr": 0.0003703257812831343, "tps": 21537, "wall": 19697.0} {"step": 6473, "train_loss": 3.660214900970459, "lr": 0.0003703152429086088, "tps": 21531, "wall": 19704.9} {"step": 6474, "train_loss": 3.722531318664551, "lr": 0.0003703047028313042, "tps": 21526, "wall": 19712.9} {"step": 6475, "train_loss": 3.6899642944335938, "lr": 0.0003702941610513397, "tps": 21520, "wall": 19720.9} {"step": 6476, "train_loss": 3.6832776069641113, "lr": 0.0003702836175688348, "tps": 21515, "wall": 19728.9} {"step": 6477, "train_loss": 3.7350237369537354, "lr": 0.00037027307238390894, "tps": 21510, "wall": 19736.9} {"step": 6478, "train_loss": 3.747352361679077, "lr": 0.0003702625254966817, "tps": 21504, "wall": 19744.8} {"step": 6479, "train_loss": 3.692978858947754, "lr": 0.00037025197690727235, "tps": 21499, "wall": 19752.7} {"step": 6480, "train_loss": 3.6334941387176514, "lr": 0.0003702414266158005, "tps": 21494, "wall": 19760.7} {"step": 6481, "train_loss": 3.724369764328003, "lr": 0.0003702308746223857, "tps": 21488, "wall": 19768.7} {"step": 6482, "train_loss": 3.6922881603240967, "lr": 0.00037022032092714737, "tps": 21483, "wall": 19776.6} {"step": 6483, "train_loss": 3.6417551040649414, "lr": 0.00037020976553020507, "tps": 21478, "wall": 19784.6} {"step": 6484, "train_loss": 3.5520577430725098, "lr": 0.0003701992084316785, "tps": 21472, "wall": 19792.6} {"step": 6485, "train_loss": 3.7157325744628906, "lr": 0.0003701886496316871, "tps": 21467, "wall": 19800.5} {"step": 6486, "train_loss": 3.721999168395996, "lr": 0.0003701780891303506, "tps": 21462, "wall": 19808.4} {"step": 6487, "train_loss": 3.6537094116210938, "lr": 0.00037016752692778864, "tps": 21456, "wall": 19816.3} {"step": 6488, "train_loss": 3.750913619995117, "lr": 0.0003701569630241207, "tps": 21451, "wall": 19824.2} {"step": 6489, "train_loss": 3.583083391189575, "lr": 0.0003701463974194666, "tps": 21446, "wall": 19832.3} {"step": 6490, "train_loss": 3.546966075897217, "lr": 0.000370135830113946, "tps": 21441, "wall": 19840.2} {"step": 6491, "train_loss": 3.657453775405884, "lr": 0.0003701252611076786, "tps": 21435, "wall": 19848.2} {"step": 6492, "train_loss": 3.6355628967285156, "lr": 0.00037011469040078407, "tps": 21430, "wall": 19856.1} {"step": 6493, "train_loss": 3.6760709285736084, "lr": 0.00037010411799338227, "tps": 21425, "wall": 19864.0} {"step": 6494, "train_loss": 3.699766159057617, "lr": 0.0003700935438855929, "tps": 21420, "wall": 19871.9} {"step": 6495, "train_loss": 3.6381518840789795, "lr": 0.0003700829680775357, "tps": 21414, "wall": 19879.8} {"step": 6496, "train_loss": 3.6052730083465576, "lr": 0.00037007239056933056, "tps": 21409, "wall": 19887.9} {"step": 6497, "train_loss": 3.622555732727051, "lr": 0.0003700618113610972, "tps": 21404, "wall": 19895.8} {"step": 6498, "train_loss": 3.697524070739746, "lr": 0.0003700512304529556, "tps": 21398, "wall": 19903.9} {"step": 6499, "train_loss": 3.673072576522827, "lr": 0.0003700406478450255, "tps": 21393, "wall": 19911.8} {"step": 6500, "train_loss": 3.687246799468994, "lr": 0.0003700300635374268, "tps": 21388, "wall": 19919.6} {"step": 6501, "train_loss": 3.6162772178649902, "lr": 0.0003700194775302795, "tps": 21383, "wall": 19927.6} {"step": 6502, "train_loss": 3.7169666290283203, "lr": 0.0003700088898237034, "tps": 21377, "wall": 19935.5} {"step": 6503, "train_loss": 3.6987414360046387, "lr": 0.00036999830041781846, "tps": 21372, "wall": 19943.4} {"step": 6504, "train_loss": 3.682373523712158, "lr": 0.00036998770931274467, "tps": 21367, "wall": 19951.4} {"step": 6505, "train_loss": 3.6960041522979736, "lr": 0.00036997711650860204, "tps": 21362, "wall": 19959.2} {"step": 6506, "train_loss": 3.725614309310913, "lr": 0.00036996652200551043, "tps": 21357, "wall": 19967.3} {"step": 6507, "train_loss": 3.691530704498291, "lr": 0.00036995592580359003, "tps": 21351, "wall": 19975.2} {"step": 6508, "train_loss": 3.5766680240631104, "lr": 0.00036994532790296075, "tps": 21346, "wall": 19983.0} {"step": 6509, "train_loss": 3.7744874954223633, "lr": 0.0003699347283037427, "tps": 21341, "wall": 19990.9} {"step": 6510, "train_loss": 3.6857500076293945, "lr": 0.0003699241270060559, "tps": 21336, "wall": 19998.8} {"step": 6511, "train_loss": 3.6557583808898926, "lr": 0.0003699135240100205, "tps": 21331, "wall": 20006.7} {"step": 6512, "train_loss": 3.7374699115753174, "lr": 0.00036990291931575663, "tps": 21326, "wall": 20014.5} {"step": 6513, "train_loss": 3.640310764312744, "lr": 0.00036989231292338434, "tps": 21321, "wall": 20022.6} {"step": 6514, "train_loss": 3.578317403793335, "lr": 0.0003698817048330238, "tps": 21316, "wall": 20030.3} {"step": 6515, "train_loss": 3.688349723815918, "lr": 0.00036987109504479525, "tps": 21310, "wall": 20038.3} {"step": 6516, "train_loss": 3.689603567123413, "lr": 0.00036986048355881876, "tps": 21305, "wall": 20046.1} {"step": 6517, "train_loss": 3.6501851081848145, "lr": 0.0003698498703752146, "tps": 21300, "wall": 20054.0} {"step": 6518, "train_loss": 3.6396877765655518, "lr": 0.0003698392554941031, "tps": 21295, "wall": 20061.8} {"step": 6519, "train_loss": 3.7321362495422363, "lr": 0.0003698286389156044, "tps": 21290, "wall": 20069.8} {"step": 6520, "train_loss": 3.6375327110290527, "lr": 0.0003698180206398387, "tps": 21285, "wall": 20077.6} {"step": 6521, "train_loss": 3.6568093299865723, "lr": 0.0003698074006669264, "tps": 21280, "wall": 20085.6} {"step": 6522, "train_loss": 3.691141128540039, "lr": 0.0003697967789969877, "tps": 21275, "wall": 20093.5} {"step": 6523, "train_loss": 3.711139678955078, "lr": 0.00036978615563014304, "tps": 21269, "wall": 20101.4} {"step": 6524, "train_loss": 3.716198444366455, "lr": 0.00036977553056651274, "tps": 21265, "wall": 20109.1} {"step": 6525, "train_loss": 3.706547737121582, "lr": 0.00036976490380621706, "tps": 21259, "wall": 20117.1} {"step": 6526, "train_loss": 3.678812026977539, "lr": 0.0003697542753493764, "tps": 21254, "wall": 20125.0} {"step": 6527, "train_loss": 3.6972548961639404, "lr": 0.00036974364519611134, "tps": 21249, "wall": 20132.8} {"step": 6528, "train_loss": 3.7563576698303223, "lr": 0.00036973301334654204, "tps": 21244, "wall": 20140.7} {"step": 6529, "train_loss": 3.6146254539489746, "lr": 0.0003697223798007892, "tps": 21239, "wall": 20148.7} {"step": 6530, "train_loss": 3.7178215980529785, "lr": 0.00036971174455897307, "tps": 21234, "wall": 20156.6} {"step": 6531, "train_loss": 3.715210199356079, "lr": 0.0003697011076212142, "tps": 21229, "wall": 20164.4} {"step": 6532, "train_loss": 3.671670436859131, "lr": 0.00036969046898763306, "tps": 21224, "wall": 20172.2} {"step": 6533, "train_loss": 3.5803754329681396, "lr": 0.0003696798286583502, "tps": 21219, "wall": 20179.9} {"step": 6534, "train_loss": 3.6677134037017822, "lr": 0.00036966918663348616, "tps": 21214, "wall": 20187.9} {"step": 6535, "train_loss": 3.6475815773010254, "lr": 0.0003696585429131615, "tps": 21209, "wall": 20195.8} {"step": 6536, "train_loss": 3.6816630363464355, "lr": 0.0003696478974974967, "tps": 21204, "wall": 20203.7} {"step": 6537, "train_loss": 3.7388925552368164, "lr": 0.0003696372503866125, "tps": 21199, "wall": 20211.5} {"step": 6538, "train_loss": 3.715642213821411, "lr": 0.0003696266015806294, "tps": 21194, "wall": 20219.4} {"step": 6539, "train_loss": 3.6318955421447754, "lr": 0.00036961595107966804, "tps": 21189, "wall": 20227.1} {"step": 6540, "train_loss": 3.681250810623169, "lr": 0.0003696052988838491, "tps": 21184, "wall": 20235.0} {"step": 6541, "train_loss": 3.561337471008301, "lr": 0.00036959464499329326, "tps": 21179, "wall": 20242.6} {"step": 6542, "train_loss": 3.666518211364746, "lr": 0.00036958398940812123, "tps": 21174, "wall": 20250.6} {"step": 6543, "train_loss": 3.7647671699523926, "lr": 0.0003695733321284536, "tps": 21169, "wall": 20258.4} {"step": 6544, "train_loss": 3.747568130493164, "lr": 0.0003695626731544112, "tps": 21164, "wall": 20266.3} {"step": 6545, "train_loss": 3.790125846862793, "lr": 0.0003695520124861147, "tps": 21159, "wall": 20274.1} {"step": 6546, "train_loss": 3.601548433303833, "lr": 0.00036954135012368496, "tps": 21155, "wall": 20281.9} {"step": 6547, "train_loss": 3.7405004501342773, "lr": 0.00036953068606724275, "tps": 21150, "wall": 20289.7} {"step": 6548, "train_loss": 3.599761486053467, "lr": 0.0003695200203169088, "tps": 21145, "wall": 20297.6} {"step": 6549, "train_loss": 3.7651844024658203, "lr": 0.00036950935287280396, "tps": 21140, "wall": 20305.4} {"step": 6550, "train_loss": 3.6866588592529297, "lr": 0.0003694986837350491, "tps": 21135, "wall": 20313.3} {"step": 6551, "train_loss": 3.5911474227905273, "lr": 0.00036948801290376504, "tps": 21130, "wall": 20321.1} {"step": 6552, "train_loss": 3.739121913909912, "lr": 0.00036947734037907275, "tps": 21125, "wall": 20329.0} {"step": 6553, "train_loss": 3.6330983638763428, "lr": 0.000369466666161093, "tps": 21120, "wall": 20336.8} {"step": 6554, "train_loss": 3.747437000274658, "lr": 0.00036945599024994674, "tps": 21115, "wall": 20344.6} {"step": 6555, "train_loss": 3.718153476715088, "lr": 0.000369445312645755, "tps": 21110, "wall": 20352.4} {"step": 6556, "train_loss": 3.6470870971679688, "lr": 0.00036943463334863864, "tps": 21105, "wall": 20360.2} {"step": 6557, "train_loss": 3.6590476036071777, "lr": 0.0003694239523587187, "tps": 21100, "wall": 20368.0} {"step": 6558, "train_loss": 3.6456775665283203, "lr": 0.0003694132696761161, "tps": 21096, "wall": 20375.8} {"step": 6559, "train_loss": 3.5920820236206055, "lr": 0.000369402585300952, "tps": 21091, "wall": 20383.7} {"step": 6560, "train_loss": 3.6233885288238525, "lr": 0.0003693918992333472, "tps": 21086, "wall": 20391.5} {"step": 6561, "train_loss": 3.670858383178711, "lr": 0.0003693812114734229, "tps": 21081, "wall": 20399.3} {"step": 6562, "train_loss": 3.7522709369659424, "lr": 0.00036937052202130026, "tps": 21076, "wall": 20407.0} {"step": 6563, "train_loss": 3.657794713973999, "lr": 0.0003693598308771002, "tps": 21071, "wall": 20414.9} {"step": 6564, "train_loss": 3.683515787124634, "lr": 0.0003693491380409439, "tps": 21067, "wall": 20422.6} {"step": 6565, "train_loss": 3.698932409286499, "lr": 0.0003693384435129524, "tps": 21062, "wall": 20430.5} {"step": 6566, "train_loss": 3.7167131900787354, "lr": 0.0003693277472932471, "tps": 21057, "wall": 20438.3} {"step": 6567, "train_loss": 3.690180540084839, "lr": 0.00036931704938194886, "tps": 21052, "wall": 20446.2} {"step": 6568, "train_loss": 3.7389070987701416, "lr": 0.000369306349779179, "tps": 21047, "wall": 20454.1} {"step": 6569, "train_loss": 3.7025599479675293, "lr": 0.00036929564848505884, "tps": 21042, "wall": 20461.8} {"step": 6570, "train_loss": 3.6538052558898926, "lr": 0.00036928494549970945, "tps": 21037, "wall": 20469.6} {"step": 6571, "train_loss": 3.710932970046997, "lr": 0.00036927424082325213, "tps": 21033, "wall": 20477.4} {"step": 6572, "train_loss": 3.6214890480041504, "lr": 0.0003692635344558081, "tps": 21028, "wall": 20485.2} {"step": 6573, "train_loss": 3.772099733352661, "lr": 0.0003692528263974987, "tps": 21023, "wall": 20493.0} {"step": 6574, "train_loss": 3.6959667205810547, "lr": 0.0003692421166484453, "tps": 21018, "wall": 20500.7} {"step": 6575, "train_loss": 3.658036708831787, "lr": 0.000369231405208769, "tps": 21013, "wall": 20508.7} {"step": 6576, "train_loss": 3.631319046020508, "lr": 0.0003692206920785913, "tps": 21009, "wall": 20516.5} {"step": 6577, "train_loss": 3.6307625770568848, "lr": 0.0003692099772580335, "tps": 21004, "wall": 20524.2} {"step": 6578, "train_loss": 3.6385748386383057, "lr": 0.00036919926074721707, "tps": 20999, "wall": 20532.0} {"step": 6579, "train_loss": 3.6372318267822266, "lr": 0.0003691885425462633, "tps": 20994, "wall": 20539.8} {"step": 6580, "train_loss": 3.61846923828125, "lr": 0.00036917782265529365, "tps": 20989, "wall": 20547.6} {"step": 6581, "train_loss": 3.683180332183838, "lr": 0.0003691671010744296, "tps": 20985, "wall": 20555.4} {"step": 6582, "train_loss": 3.738105297088623, "lr": 0.00036915637780379247, "tps": 20980, "wall": 20563.3} {"step": 6583, "train_loss": 3.732172727584839, "lr": 0.0003691456528435039, "tps": 20975, "wall": 20571.1} {"step": 6584, "train_loss": 3.696896553039551, "lr": 0.00036913492619368524, "tps": 20970, "wall": 20578.9} {"step": 6585, "train_loss": 3.6561856269836426, "lr": 0.00036912419785445816, "tps": 20965, "wall": 20586.7} {"step": 6586, "train_loss": 3.682190418243408, "lr": 0.00036911346782594407, "tps": 20961, "wall": 20594.5} {"step": 6587, "train_loss": 3.6005663871765137, "lr": 0.0003691027361082645, "tps": 20956, "wall": 20602.3} {"step": 6588, "train_loss": 3.6651511192321777, "lr": 0.0003690920027015411, "tps": 20951, "wall": 20610.1} {"step": 6589, "train_loss": 3.642432689666748, "lr": 0.0003690812676058954, "tps": 20947, "wall": 20617.8} {"step": 6590, "train_loss": 3.786301851272583, "lr": 0.00036907053082144907, "tps": 20942, "wall": 20625.7} {"step": 6591, "train_loss": 3.7012014389038086, "lr": 0.0003690597923483237, "tps": 20937, "wall": 20633.5} {"step": 6592, "train_loss": 3.6018331050872803, "lr": 0.00036904905218664095, "tps": 20932, "wall": 20641.3} {"step": 6593, "train_loss": 3.7412667274475098, "lr": 0.00036903831033652246, "tps": 20928, "wall": 20649.1} {"step": 6594, "train_loss": 3.6548068523406982, "lr": 0.00036902756679808987, "tps": 20923, "wall": 20656.9} {"step": 6595, "train_loss": 3.5602118968963623, "lr": 0.000369016821571465, "tps": 20918, "wall": 20664.8} {"step": 6596, "train_loss": 3.6704893112182617, "lr": 0.00036900607465676955, "tps": 20913, "wall": 20672.5} {"step": 6597, "train_loss": 3.7633652687072754, "lr": 0.00036899532605412516, "tps": 20909, "wall": 20680.4} {"step": 6598, "train_loss": 3.773406744003296, "lr": 0.0003689845757636537, "tps": 20904, "wall": 20688.2} {"step": 6599, "train_loss": 3.691494941711426, "lr": 0.00036897382378547693, "tps": 20899, "wall": 20696.0} {"step": 6600, "train_loss": 3.728447914123535, "lr": 0.00036896307011971655, "tps": 20894, "wall": 20703.7} {"step": 6601, "train_loss": 3.684386730194092, "lr": 0.0003689523147664944, "tps": 20890, "wall": 20711.4} {"step": 6602, "train_loss": 3.658656120300293, "lr": 0.0003689415577259325, "tps": 20885, "wall": 20719.2} {"step": 6603, "train_loss": 3.612240791320801, "lr": 0.00036893079899815253, "tps": 20880, "wall": 20727.1} {"step": 6604, "train_loss": 3.744492530822754, "lr": 0.0003689200385832764, "tps": 20876, "wall": 20735.0} {"step": 6605, "train_loss": 3.725139617919922, "lr": 0.0003689092764814261, "tps": 20871, "wall": 20742.8} {"step": 6606, "train_loss": 3.727273464202881, "lr": 0.00036889851269272334, "tps": 20866, "wall": 20750.6} {"step": 6607, "train_loss": 3.6926796436309814, "lr": 0.00036888774721729025, "tps": 20861, "wall": 20758.4} {"step": 6608, "train_loss": 3.7583465576171875, "lr": 0.0003688769800552487, "tps": 20857, "wall": 20766.2} {"step": 6609, "train_loss": 3.6086320877075195, "lr": 0.0003688662112067206, "tps": 20852, "wall": 20773.9} {"step": 6610, "train_loss": 3.6049602031707764, "lr": 0.00036885544067182804, "tps": 20848, "wall": 20781.7} {"step": 6611, "train_loss": 3.6544852256774902, "lr": 0.000368844668450693, "tps": 20843, "wall": 20789.5} {"step": 6612, "train_loss": 3.612292766571045, "lr": 0.00036883389454343753, "tps": 20838, "wall": 20797.4} {"step": 6613, "train_loss": 3.7120141983032227, "lr": 0.00036882311895018364, "tps": 20833, "wall": 20805.2} {"step": 6614, "train_loss": 3.6904430389404297, "lr": 0.00036881234167105337, "tps": 20829, "wall": 20813.0} {"step": 6615, "train_loss": 3.6578807830810547, "lr": 0.0003688015627061689, "tps": 20824, "wall": 20820.8} {"step": 6616, "train_loss": 3.605215549468994, "lr": 0.0003687907820556522, "tps": 20820, "wall": 20828.5} {"step": 6617, "train_loss": 3.6014766693115234, "lr": 0.0003687799997196255, "tps": 20815, "wall": 20836.4} {"step": 6618, "train_loss": 3.682542085647583, "lr": 0.00036876921569821094, "tps": 20810, "wall": 20844.2} {"step": 6619, "train_loss": 3.745368719100952, "lr": 0.0003687584299915306, "tps": 20806, "wall": 20852.0} {"step": 6620, "train_loss": 3.803173303604126, "lr": 0.0003687476425997068, "tps": 20801, "wall": 20859.8} {"step": 6621, "train_loss": 3.6545250415802, "lr": 0.00036873685352286164, "tps": 20796, "wall": 20867.6} {"step": 6622, "train_loss": 3.633291721343994, "lr": 0.00036872606276111737, "tps": 20792, "wall": 20875.5} {"step": 6623, "train_loss": 3.6476168632507324, "lr": 0.0003687152703145962, "tps": 20787, "wall": 20883.2} {"step": 6624, "train_loss": 3.5695576667785645, "lr": 0.0003687044761834203, "tps": 20782, "wall": 20890.9} {"step": 6625, "train_loss": 3.6791367530822754, "lr": 0.0003686936803677122, "tps": 20778, "wall": 20898.7} {"step": 6626, "train_loss": 3.575237274169922, "lr": 0.0003686828828675939, "tps": 20773, "wall": 20906.6} {"step": 6627, "train_loss": 3.652315855026245, "lr": 0.000368672083683188, "tps": 20768, "wall": 20914.5} {"step": 6628, "train_loss": 3.6802210807800293, "lr": 0.0003686612828146166, "tps": 20764, "wall": 20922.3} {"step": 6629, "train_loss": 3.696256160736084, "lr": 0.0003686504802620022, "tps": 20759, "wall": 20930.1} {"step": 6630, "train_loss": 3.6209828853607178, "lr": 0.00036863967602546714, "tps": 20755, "wall": 20938.0} {"step": 6631, "train_loss": 3.6779892444610596, "lr": 0.0003686288701051337, "tps": 20750, "wall": 20945.7} {"step": 6632, "train_loss": 3.6572060585021973, "lr": 0.0003686180625011245, "tps": 20745, "wall": 20953.5} {"step": 6633, "train_loss": 3.6026551723480225, "lr": 0.0003686072532135617, "tps": 20741, "wall": 20961.2} {"step": 6634, "train_loss": 3.6041903495788574, "lr": 0.000368596442242568, "tps": 20736, "wall": 20969.2} {"step": 6635, "train_loss": 3.7181167602539062, "lr": 0.00036858562958826574, "tps": 20732, "wall": 20977.0} {"step": 6636, "train_loss": 3.5481317043304443, "lr": 0.0003685748152507774, "tps": 20727, "wall": 20985.0} {"step": 6637, "train_loss": 3.701314926147461, "lr": 0.0003685639992302255, "tps": 20722, "wall": 20992.7} {"step": 6638, "train_loss": 3.6370763778686523, "lr": 0.00036855318152673264, "tps": 20718, "wall": 21000.6} {"step": 6639, "train_loss": 3.8052477836608887, "lr": 0.00036854236214042124, "tps": 20713, "wall": 21008.3} {"step": 6640, "train_loss": 3.5915942192077637, "lr": 0.000368531541071414, "tps": 20708, "wall": 21016.3} {"step": 6641, "train_loss": 3.722102642059326, "lr": 0.0003685207183198334, "tps": 20704, "wall": 21024.1} {"step": 6642, "train_loss": 3.5462119579315186, "lr": 0.000368509893885802, "tps": 20699, "wall": 21031.8} {"step": 6643, "train_loss": 3.583007335662842, "lr": 0.00036849906776944256, "tps": 20695, "wall": 21039.7} {"step": 6644, "train_loss": 3.6912693977355957, "lr": 0.0003684882399708777, "tps": 20690, "wall": 21047.6} {"step": 6645, "train_loss": 3.6550958156585693, "lr": 0.00036847741049022994, "tps": 20685, "wall": 21055.5} {"step": 6646, "train_loss": 3.5883984565734863, "lr": 0.000368466579327622, "tps": 20681, "wall": 21063.4} {"step": 6647, "train_loss": 3.654735565185547, "lr": 0.0003684557464831767, "tps": 20676, "wall": 21071.2} {"step": 6648, "train_loss": 3.5844717025756836, "lr": 0.0003684449119570167, "tps": 20672, "wall": 21079.1} {"step": 6649, "train_loss": 3.676560401916504, "lr": 0.0003684340757492646, "tps": 20667, "wall": 21087.1} {"step": 6650, "train_loss": 3.681630849838257, "lr": 0.00036842323786004334, "tps": 20662, "wall": 21094.9} {"step": 6651, "train_loss": 3.790402412414551, "lr": 0.0003684123982894756, "tps": 20658, "wall": 21103.0} {"step": 6652, "train_loss": 3.6370537281036377, "lr": 0.0003684015570376842, "tps": 20653, "wall": 21110.8} {"step": 6653, "train_loss": 3.5878615379333496, "lr": 0.00036839071410479186, "tps": 20648, "wall": 21118.8} {"step": 6654, "train_loss": 3.702080726623535, "lr": 0.00036837986949092154, "tps": 20644, "wall": 21126.6} {"step": 6655, "train_loss": 3.613990306854248, "lr": 0.000368369023196196, "tps": 20639, "wall": 21134.6} {"step": 6656, "train_loss": 3.629934310913086, "lr": 0.00036835817522073815, "tps": 20634, "wall": 21142.6} {"step": 6657, "train_loss": 3.6377625465393066, "lr": 0.0003683473255646709, "tps": 20630, "wall": 21150.5} {"step": 6658, "train_loss": 3.7597646713256836, "lr": 0.0003683364742281171, "tps": 20625, "wall": 21158.3} {"step": 6659, "train_loss": 3.6441264152526855, "lr": 0.0003683256212111997, "tps": 20620, "wall": 21166.4} {"step": 6660, "train_loss": 3.6079516410827637, "lr": 0.0003683147665140416, "tps": 20616, "wall": 21174.3} {"step": 6661, "train_loss": 3.6754343509674072, "lr": 0.00036830391013676587, "tps": 20611, "wall": 21182.1} {"step": 6662, "train_loss": 3.6887471675872803, "lr": 0.00036829305207949534, "tps": 20607, "wall": 21190.1} {"step": 6663, "train_loss": 3.625973701477051, "lr": 0.00036828219234235314, "tps": 20602, "wall": 21198.1} {"step": 6664, "train_loss": 3.583625555038452, "lr": 0.0003682713309254622, "tps": 20597, "wall": 21206.2} {"step": 6665, "train_loss": 3.6477837562561035, "lr": 0.0003682604678289457, "tps": 20593, "wall": 21214.1} {"step": 6666, "train_loss": 3.7085177898406982, "lr": 0.00036824960305292646, "tps": 20588, "wall": 21222.1} {"step": 6667, "train_loss": 3.7317543029785156, "lr": 0.0003682387365975278, "tps": 20583, "wall": 21230.2} {"step": 6668, "train_loss": 3.7009196281433105, "lr": 0.0003682278684628727, "tps": 20578, "wall": 21238.2} {"step": 6669, "train_loss": 3.5745840072631836, "lr": 0.0003682169986490843, "tps": 20574, "wall": 21246.2} {"step": 6670, "train_loss": 3.6444501876831055, "lr": 0.0003682061271562857, "tps": 20569, "wall": 21254.3} {"step": 6671, "train_loss": 3.7457375526428223, "lr": 0.00036819525398460004, "tps": 20564, "wall": 21262.2} {"step": 6672, "train_loss": 3.7369606494903564, "lr": 0.0003681843791341506, "tps": 20560, "wall": 21270.2} {"step": 6673, "train_loss": 3.730137825012207, "lr": 0.00036817350260506045, "tps": 20555, "wall": 21278.2} {"step": 6674, "train_loss": 3.8072915077209473, "lr": 0.0003681626243974528, "tps": 20550, "wall": 21286.3} {"step": 6675, "train_loss": 3.684009552001953, "lr": 0.00036815174451145096, "tps": 20546, "wall": 21294.2} {"step": 6676, "train_loss": 3.64186692237854, "lr": 0.0003681408629471782, "tps": 20541, "wall": 21302.2} {"step": 6677, "train_loss": 3.6922879219055176, "lr": 0.00036812997970475767, "tps": 20537, "wall": 21310.1} {"step": 6678, "train_loss": 3.565220832824707, "lr": 0.00036811909478431275, "tps": 20532, "wall": 21318.2} {"step": 6679, "train_loss": 3.674398899078369, "lr": 0.0003681082081859667, "tps": 20527, "wall": 21326.2} {"step": 6680, "train_loss": 3.651531219482422, "lr": 0.0003680973199098428, "tps": 20523, "wall": 21334.2} {"step": 6681, "train_loss": 3.733268976211548, "lr": 0.0003680864299560645, "tps": 20518, "wall": 21342.3} {"step": 6682, "train_loss": 3.701843023300171, "lr": 0.00036807553832475515, "tps": 20513, "wall": 21350.3} {"step": 6683, "train_loss": 3.6803781986236572, "lr": 0.000368064645016038, "tps": 20509, "wall": 21358.4} {"step": 6684, "train_loss": 3.7434604167938232, "lr": 0.00036805375003003663, "tps": 20504, "wall": 21366.4} {"step": 6685, "train_loss": 3.654477119445801, "lr": 0.0003680428533668743, "tps": 20499, "wall": 21374.4} {"step": 6686, "train_loss": 3.6568613052368164, "lr": 0.00036803195502667455, "tps": 20495, "wall": 21382.4} {"step": 6687, "train_loss": 3.5618674755096436, "lr": 0.0003680210550095609, "tps": 20490, "wall": 21390.5} {"step": 6688, "train_loss": 3.7639379501342773, "lr": 0.0003680101533156566, "tps": 20486, "wall": 21398.5} {"step": 6689, "train_loss": 3.6762046813964844, "lr": 0.0003679992499450853, "tps": 20481, "wall": 21406.7} {"step": 6690, "train_loss": 3.793242931365967, "lr": 0.0003679883448979705, "tps": 20476, "wall": 21414.7} {"step": 6691, "train_loss": 3.719564914703369, "lr": 0.00036797743817443566, "tps": 20472, "wall": 21422.6} {"step": 6692, "train_loss": 3.786855697631836, "lr": 0.0003679665297746045, "tps": 20467, "wall": 21430.6} {"step": 6693, "train_loss": 3.7147061824798584, "lr": 0.00036795561969860043, "tps": 20462, "wall": 21438.7} {"step": 6694, "train_loss": 3.654242515563965, "lr": 0.00036794470794654713, "tps": 20458, "wall": 21446.8} {"step": 6695, "train_loss": 3.7282228469848633, "lr": 0.00036793379451856815, "tps": 20453, "wall": 21454.9} {"step": 6696, "train_loss": 3.7644295692443848, "lr": 0.00036792287941478716, "tps": 20448, "wall": 21463.1} {"step": 6697, "train_loss": 3.576040744781494, "lr": 0.00036791196263532774, "tps": 20444, "wall": 21471.1} {"step": 6698, "train_loss": 3.6483447551727295, "lr": 0.00036790104418031366, "tps": 20439, "wall": 21479.3} {"step": 6699, "train_loss": 3.689883232116699, "lr": 0.00036789012404986847, "tps": 20434, "wall": 21487.3} {"step": 6700, "train_loss": 3.682346820831299, "lr": 0.0003678792022441161, "tps": 20430, "wall": 21495.5} {"step": 6701, "train_loss": 3.6202645301818848, "lr": 0.00036786827876318006, "tps": 20425, "wall": 21503.5} {"step": 6702, "train_loss": 3.6651601791381836, "lr": 0.0003678573536071841, "tps": 20420, "wall": 21511.7} {"step": 6703, "train_loss": 3.6281962394714355, "lr": 0.0003678464267762521, "tps": 20416, "wall": 21519.7} {"step": 6704, "train_loss": 3.6988120079040527, "lr": 0.00036783549827050776, "tps": 20411, "wall": 21528.0} {"step": 6705, "train_loss": 3.6733522415161133, "lr": 0.00036782456809007487, "tps": 20406, "wall": 21536.1} {"step": 6706, "train_loss": 3.56227707862854, "lr": 0.0003678136362350773, "tps": 20402, "wall": 21544.1} {"step": 6707, "train_loss": 3.7670164108276367, "lr": 0.0003678027027056389, "tps": 20397, "wall": 21552.1} {"step": 6708, "train_loss": 3.6403310298919678, "lr": 0.00036779176750188346, "tps": 20393, "wall": 21560.2} {"step": 6709, "train_loss": 3.652925491333008, "lr": 0.0003677808306239349, "tps": 20388, "wall": 21568.3} {"step": 6710, "train_loss": 3.6422550678253174, "lr": 0.00036776989207191704, "tps": 20383, "wall": 21576.4} {"step": 6711, "train_loss": 3.7178969383239746, "lr": 0.0003677589518459539, "tps": 20379, "wall": 21584.6} {"step": 6712, "train_loss": 3.6968376636505127, "lr": 0.0003677480099461693, "tps": 20374, "wall": 21592.7} {"step": 6713, "train_loss": 3.6815271377563477, "lr": 0.0003677370663726873, "tps": 20369, "wall": 21600.9} {"step": 6714, "train_loss": 3.6922097206115723, "lr": 0.0003677261211256318, "tps": 20365, "wall": 21608.9} {"step": 6715, "train_loss": 3.579272747039795, "lr": 0.00036771517420512684, "tps": 20360, "wall": 21617.0} {"step": 6716, "train_loss": 3.6793041229248047, "lr": 0.00036770422561129636, "tps": 20356, "wall": 21625.1} {"step": 6717, "train_loss": 3.773571014404297, "lr": 0.00036769327534426447, "tps": 20351, "wall": 21633.3} {"step": 6718, "train_loss": 3.688021659851074, "lr": 0.0003676823234041551, "tps": 20346, "wall": 21641.5} {"step": 6719, "train_loss": 3.5949792861938477, "lr": 0.0003676713697910924, "tps": 20342, "wall": 21649.8} {"step": 6720, "train_loss": 3.6977646350860596, "lr": 0.00036766041450520047, "tps": 20337, "wall": 21658.1} {"step": 6721, "train_loss": 3.5909507274627686, "lr": 0.0003676494575466033, "tps": 20332, "wall": 21666.2} {"step": 6722, "train_loss": 3.6210854053497314, "lr": 0.0003676384989154252, "tps": 20328, "wall": 21674.3} {"step": 6723, "train_loss": 3.7154698371887207, "lr": 0.00036762753861179013, "tps": 20323, "wall": 21682.3} {"step": 6724, "train_loss": 3.672823429107666, "lr": 0.0003676165766358223, "tps": 20318, "wall": 21690.5} {"step": 6725, "train_loss": 3.6903061866760254, "lr": 0.00036760561298764596, "tps": 20314, "wall": 21698.7} {"step": 6726, "train_loss": 3.6126465797424316, "lr": 0.00036759464766738517, "tps": 20309, "wall": 21707.0} {"step": 6727, "train_loss": 3.6655750274658203, "lr": 0.0003675836806751643, "tps": 20305, "wall": 21715.1} {"step": 6728, "train_loss": 3.6566123962402344, "lr": 0.0003675727120111075, "tps": 20300, "wall": 21723.3} {"step": 6729, "train_loss": 3.615201473236084, "lr": 0.00036756174167533906, "tps": 20295, "wall": 21731.3} {"step": 6730, "train_loss": 3.6385459899902344, "lr": 0.0003675507696679831, "tps": 20291, "wall": 21739.5} {"step": 6731, "train_loss": 3.7301411628723145, "lr": 0.0003675397959891642, "tps": 20286, "wall": 21747.7} {"step": 6732, "train_loss": 3.7119083404541016, "lr": 0.00036752882063900645, "tps": 20282, "wall": 21755.9} {"step": 6733, "train_loss": 3.6966052055358887, "lr": 0.0003675178436176342, "tps": 20277, "wall": 21763.9} {"step": 6734, "train_loss": 3.6571762561798096, "lr": 0.0003675068649251718, "tps": 20272, "wall": 21772.1} {"step": 6735, "train_loss": 3.6750903129577637, "lr": 0.00036749588456174375, "tps": 20268, "wall": 21780.2} {"step": 6736, "train_loss": 3.6797475814819336, "lr": 0.0003674849025274743, "tps": 20263, "wall": 21788.4} {"step": 6737, "train_loss": 3.6515800952911377, "lr": 0.00036747391882248787, "tps": 20259, "wall": 21796.5} {"step": 6738, "train_loss": 3.588568687438965, "lr": 0.00036746293344690906, "tps": 20254, "wall": 21804.7} {"step": 6739, "train_loss": 3.5974156856536865, "lr": 0.000367451946400862, "tps": 20250, "wall": 21812.8} {"step": 6740, "train_loss": 3.687748670578003, "lr": 0.0003674409576844713, "tps": 20245, "wall": 21820.8} {"step": 6741, "train_loss": 3.7598352432250977, "lr": 0.00036742996729786156, "tps": 20241, "wall": 21829.1} {"step": 6742, "train_loss": 3.7015762329101562, "lr": 0.0003674189752411571, "tps": 20236, "wall": 21837.3} {"step": 6743, "train_loss": 3.6477274894714355, "lr": 0.0003674079815144826, "tps": 20231, "wall": 21845.4} {"step": 6744, "train_loss": 3.696796417236328, "lr": 0.00036739698611796244, "tps": 20227, "wall": 21853.4} {"step": 6745, "train_loss": 3.626832962036133, "lr": 0.00036738598905172124, "tps": 20222, "wall": 21861.6} {"step": 6746, "train_loss": 3.7198843955993652, "lr": 0.00036737499031588356, "tps": 20218, "wall": 21869.7} {"step": 6747, "train_loss": 3.645893096923828, "lr": 0.0003673639899105741, "tps": 20213, "wall": 21877.8} {"step": 6748, "train_loss": 3.6697707176208496, "lr": 0.00036735298783591733, "tps": 20209, "wall": 21886.0} {"step": 6749, "train_loss": 3.59982967376709, "lr": 0.0003673419840920379, "tps": 20204, "wall": 21894.2} {"step": 6750, "train_loss": 3.5770387649536133, "lr": 0.0003673309786790606, "tps": 20200, "wall": 21902.4} {"step": 6751, "train_loss": 3.64381742477417, "lr": 0.00036731997159710996, "tps": 20195, "wall": 21910.5} {"step": 6752, "train_loss": 3.645385265350342, "lr": 0.00036730896284631077, "tps": 20191, "wall": 21918.7} {"step": 6753, "train_loss": 3.632418394088745, "lr": 0.0003672979524267876, "tps": 20186, "wall": 21926.8} {"step": 6754, "train_loss": 3.5895638465881348, "lr": 0.00036728694033866526, "tps": 20182, "wall": 21934.9} {"step": 6755, "train_loss": 3.680821180343628, "lr": 0.00036727592658206853, "tps": 20177, "wall": 21943.3} {"step": 6756, "train_loss": 3.7307636737823486, "lr": 0.0003672649111571221, "tps": 20173, "wall": 21951.3} {"step": 6757, "train_loss": 3.568296432495117, "lr": 0.0003672538940639508, "tps": 20168, "wall": 21959.6} {"step": 6758, "train_loss": 3.7249348163604736, "lr": 0.0003672428753026795, "tps": 20164, "wall": 21967.7} {"step": 6759, "train_loss": 3.65276837348938, "lr": 0.0003672318548734329, "tps": 20159, "wall": 21975.9} {"step": 6760, "train_loss": 3.610229969024658, "lr": 0.0003672208327763358, "tps": 20155, "wall": 21984.1} {"step": 6761, "train_loss": 3.6955909729003906, "lr": 0.00036720980901151323, "tps": 20150, "wall": 21992.3} {"step": 6762, "train_loss": 3.704545736312866, "lr": 0.00036719878357908996, "tps": 20146, "wall": 22000.3} {"step": 6763, "train_loss": 3.564098358154297, "lr": 0.00036718775647919086, "tps": 20141, "wall": 22008.6} {"step": 6764, "train_loss": 3.6537437438964844, "lr": 0.00036717672771194093, "tps": 20136, "wall": 22016.8} {"step": 6765, "train_loss": 3.6593546867370605, "lr": 0.00036716569727746507, "tps": 20132, "wall": 22024.9} {"step": 6766, "train_loss": 3.65592098236084, "lr": 0.00036715466517588824, "tps": 20128, "wall": 22033.1} {"step": 6767, "train_loss": 3.6983587741851807, "lr": 0.0003671436314073354, "tps": 20123, "wall": 22041.3} {"step": 6768, "train_loss": 3.6465721130371094, "lr": 0.0003671325959719315, "tps": 20119, "wall": 22049.4} {"step": 6769, "train_loss": 3.668382167816162, "lr": 0.0003671215588698016, "tps": 20114, "wall": 22057.5} {"step": 6770, "train_loss": 3.595690965652466, "lr": 0.00036711052010107075, "tps": 20110, "wall": 22065.6} {"step": 6771, "train_loss": 3.800626277923584, "lr": 0.00036709947966586396, "tps": 20105, "wall": 22073.9} {"step": 6772, "train_loss": 3.598951578140259, "lr": 0.00036708843756430635, "tps": 20101, "wall": 22081.9} {"step": 6773, "train_loss": 3.571662425994873, "lr": 0.00036707739379652295, "tps": 20096, "wall": 22090.1} {"step": 6774, "train_loss": 3.6156907081604004, "lr": 0.0003670663483626388, "tps": 20092, "wall": 22098.1} {"step": 6775, "train_loss": 3.589348316192627, "lr": 0.00036705530126277913, "tps": 20087, "wall": 22106.4} {"step": 6776, "train_loss": 3.6071603298187256, "lr": 0.0003670442524970691, "tps": 20083, "wall": 22114.4} {"step": 6777, "train_loss": 3.6872687339782715, "lr": 0.00036703320206563376, "tps": 20079, "wall": 22122.5} {"step": 6778, "train_loss": 3.7231287956237793, "lr": 0.0003670221499685984, "tps": 20074, "wall": 22130.8} {"step": 6779, "train_loss": 3.6883010864257812, "lr": 0.0003670110962060882, "tps": 20070, "wall": 22139.1} {"step": 6780, "train_loss": 3.5700736045837402, "lr": 0.00036700004077822826, "tps": 20065, "wall": 22147.2} {"step": 6781, "train_loss": 3.706141948699951, "lr": 0.0003669889836851439, "tps": 20061, "wall": 22155.3} {"step": 6782, "train_loss": 3.7129428386688232, "lr": 0.00036697792492696054, "tps": 20056, "wall": 22163.5} {"step": 6783, "train_loss": 3.5352635383605957, "lr": 0.00036696686450380316, "tps": 20052, "wall": 22171.8} {"step": 6784, "train_loss": 3.7245912551879883, "lr": 0.0003669558024157972, "tps": 20047, "wall": 22179.9} {"step": 6785, "train_loss": 3.707686424255371, "lr": 0.000366944738663068, "tps": 20043, "wall": 22188.1} {"step": 6786, "train_loss": 3.7931761741638184, "lr": 0.0003669336732457408, "tps": 20038, "wall": 22196.5} {"step": 6787, "train_loss": 3.6114695072174072, "lr": 0.0003669226061639411, "tps": 20034, "wall": 22204.5} {"step": 6788, "train_loss": 3.775282621383667, "lr": 0.00036691153741779406, "tps": 20030, "wall": 22212.7} {"step": 6789, "train_loss": 3.7223730087280273, "lr": 0.00036690046700742516, "tps": 20025, "wall": 22220.8} {"step": 6790, "train_loss": 3.5646042823791504, "lr": 0.0003668893949329599, "tps": 20021, "wall": 22229.1} {"step": 6791, "train_loss": 3.5525364875793457, "lr": 0.0003668783211945236, "tps": 20016, "wall": 22237.3} {"step": 6792, "train_loss": 3.6901397705078125, "lr": 0.00036686724579224175, "tps": 20012, "wall": 22245.5} {"step": 6793, "train_loss": 3.715266227722168, "lr": 0.0003668561687262398, "tps": 20008, "wall": 22253.7} {"step": 6794, "train_loss": 3.671905517578125, "lr": 0.0003668450899966432, "tps": 20003, "wall": 22261.7} {"step": 6795, "train_loss": 3.6135447025299072, "lr": 0.0003668340096035775, "tps": 19999, "wall": 22269.8} {"step": 6796, "train_loss": 3.6860532760620117, "lr": 0.00036682292754716813, "tps": 19995, "wall": 22277.9} {"step": 6797, "train_loss": 3.59588885307312, "lr": 0.00036681184382754076, "tps": 19990, "wall": 22286.0} {"step": 6798, "train_loss": 3.6083154678344727, "lr": 0.00036680075844482086, "tps": 19986, "wall": 22294.0} {"step": 6799, "train_loss": 3.657773494720459, "lr": 0.000366789671399134, "tps": 19982, "wall": 22302.2} {"step": 6800, "train_loss": 3.6654038429260254, "lr": 0.00036677858269060584, "tps": 19977, "wall": 22310.4} {"step": 6801, "train_loss": 3.6176300048828125, "lr": 0.000366767492319362, "tps": 19973, "wall": 22318.5} {"step": 6802, "train_loss": 3.6101722717285156, "lr": 0.00036675640028552796, "tps": 19969, "wall": 22326.6} {"step": 6803, "train_loss": 3.5860366821289062, "lr": 0.0003667453065892295, "tps": 19964, "wall": 22334.8} {"step": 6804, "train_loss": 3.631406784057617, "lr": 0.00036673421123059233, "tps": 19960, "wall": 22342.8} {"step": 6805, "train_loss": 3.7614455223083496, "lr": 0.0003667231142097421, "tps": 19956, "wall": 22350.9} {"step": 6806, "train_loss": 3.5541443824768066, "lr": 0.00036671201552680434, "tps": 19951, "wall": 22359.1} {"step": 6807, "train_loss": 3.7156221866607666, "lr": 0.00036670091518190505, "tps": 19947, "wall": 22367.2} {"step": 6808, "train_loss": 3.5296664237976074, "lr": 0.00036668981317516985, "tps": 19943, "wall": 22375.4} {"step": 6809, "train_loss": 3.705824136734009, "lr": 0.00036667870950672453, "tps": 19938, "wall": 22383.4} {"step": 6810, "train_loss": 3.695974826812744, "lr": 0.0003666676041766948, "tps": 19934, "wall": 22391.6} {"step": 6811, "train_loss": 3.636597156524658, "lr": 0.00036665649718520656, "tps": 19930, "wall": 22399.6} {"step": 6812, "train_loss": 3.6517419815063477, "lr": 0.0003666453885323855, "tps": 19926, "wall": 22407.7} {"step": 6813, "train_loss": 3.7313716411590576, "lr": 0.0003666342782183576, "tps": 19921, "wall": 22415.8} {"step": 6814, "train_loss": 3.7834653854370117, "lr": 0.0003666231662432487, "tps": 19917, "wall": 22423.9} {"step": 6815, "train_loss": 3.570213794708252, "lr": 0.0003666120526071846, "tps": 19913, "wall": 22431.9} {"step": 6816, "train_loss": 3.6920595169067383, "lr": 0.00036660093731029125, "tps": 19909, "wall": 22440.0} {"step": 6817, "train_loss": 3.611278533935547, "lr": 0.00036658982035269453, "tps": 19904, "wall": 22448.0} {"step": 6818, "train_loss": 3.661283493041992, "lr": 0.0003665787017345204, "tps": 19900, "wall": 22456.1} {"step": 6819, "train_loss": 3.6890881061553955, "lr": 0.00036656758145589487, "tps": 19896, "wall": 22464.1} {"step": 6820, "train_loss": 3.6145942211151123, "lr": 0.00036655645951694384, "tps": 19892, "wall": 22472.1} {"step": 6821, "train_loss": 3.810605764389038, "lr": 0.0003665453359177932, "tps": 19887, "wall": 22480.2} {"step": 6822, "train_loss": 3.6839871406555176, "lr": 0.00036653421065856916, "tps": 19883, "wall": 22488.2} {"step": 6823, "train_loss": 3.7115535736083984, "lr": 0.00036652308373939763, "tps": 19879, "wall": 22496.3} {"step": 6824, "train_loss": 3.6365582942962646, "lr": 0.00036651195516040463, "tps": 19875, "wall": 22504.2} {"step": 6825, "train_loss": 3.558361053466797, "lr": 0.00036650082492171635, "tps": 19871, "wall": 22512.3} {"step": 6826, "train_loss": 3.6963725090026855, "lr": 0.0003664896930234587, "tps": 19867, "wall": 22520.3} {"step": 6827, "train_loss": 3.6431562900543213, "lr": 0.00036647855946575806, "tps": 19863, "wall": 22528.3} {"step": 6828, "train_loss": 3.6380481719970703, "lr": 0.0003664674242487402, "tps": 19858, "wall": 22536.4} {"step": 6829, "train_loss": 3.7099740505218506, "lr": 0.00036645628737253156, "tps": 19854, "wall": 22544.5} {"step": 6830, "train_loss": 3.654550552368164, "lr": 0.0003664451488372581, "tps": 19850, "wall": 22552.4} {"step": 6831, "train_loss": 3.69602108001709, "lr": 0.0003664340086430461, "tps": 19846, "wall": 22560.5} {"step": 6832, "train_loss": 3.687196731567383, "lr": 0.00036642286679002174, "tps": 19842, "wall": 22568.4} {"step": 6833, "train_loss": 3.5827622413635254, "lr": 0.00036641172327831124, "tps": 19837, "wall": 22576.5} {"step": 6834, "train_loss": 3.6725099086761475, "lr": 0.0003664005781080407, "tps": 19833, "wall": 22584.6} {"step": 6835, "train_loss": 3.735311508178711, "lr": 0.00036638943127933663, "tps": 19829, "wall": 22592.6} {"step": 6836, "train_loss": 3.750284433364868, "lr": 0.00036637828279232503, "tps": 19825, "wall": 22600.7} {"step": 6837, "train_loss": 3.654923915863037, "lr": 0.0003663671326471324, "tps": 19821, "wall": 22608.8} {"step": 6838, "train_loss": 3.653987407684326, "lr": 0.00036635598084388497, "tps": 19817, "wall": 22617.0} {"step": 6839, "train_loss": 3.6845521926879883, "lr": 0.00036634482738270906, "tps": 19812, "wall": 22624.9} {"step": 6840, "train_loss": 3.6656394004821777, "lr": 0.00036633367226373106, "tps": 19808, "wall": 22632.9} {"step": 6841, "train_loss": 3.638275623321533, "lr": 0.00036632251548707727, "tps": 19804, "wall": 22640.9} {"step": 6842, "train_loss": 3.8069310188293457, "lr": 0.00036631135705287416, "tps": 19800, "wall": 22649.1} {"step": 6843, "train_loss": 3.60551381111145, "lr": 0.00036630019696124805, "tps": 19796, "wall": 22657.1} {"step": 6844, "train_loss": 3.6360318660736084, "lr": 0.0003662890352123254, "tps": 19792, "wall": 22665.2} {"step": 6845, "train_loss": 3.638155460357666, "lr": 0.0003662778718062326, "tps": 19788, "wall": 22673.1} {"step": 6846, "train_loss": 3.673152446746826, "lr": 0.0003662667067430962, "tps": 19784, "wall": 22681.1} {"step": 6847, "train_loss": 3.666407823562622, "lr": 0.0003662555400230426, "tps": 19779, "wall": 22689.1} {"step": 6848, "train_loss": 3.654080629348755, "lr": 0.00036624437164619835, "tps": 19775, "wall": 22697.1} {"step": 6849, "train_loss": 3.6987898349761963, "lr": 0.00036623320161268996, "tps": 19771, "wall": 22705.2} {"step": 6850, "train_loss": 3.615119457244873, "lr": 0.00036622202992264393, "tps": 19767, "wall": 22713.1} {"step": 6851, "train_loss": 3.661823272705078, "lr": 0.00036621085657618683, "tps": 19763, "wall": 22721.1} {"step": 6852, "train_loss": 3.6514906883239746, "lr": 0.0003661996815734453, "tps": 19759, "wall": 22729.2} {"step": 6853, "train_loss": 3.6368680000305176, "lr": 0.0003661885049145458, "tps": 19755, "wall": 22737.2} {"step": 6854, "train_loss": 3.634000778198242, "lr": 0.000366177326599615, "tps": 19751, "wall": 22745.2} {"step": 6855, "train_loss": 3.640929937362671, "lr": 0.00036616614662877956, "tps": 19747, "wall": 22753.1} {"step": 6856, "train_loss": 3.6348073482513428, "lr": 0.0003661549650021661, "tps": 19743, "wall": 22761.1} {"step": 6857, "train_loss": 3.6152050495147705, "lr": 0.00036614378171990136, "tps": 19739, "wall": 22769.2} {"step": 6858, "train_loss": 3.6184701919555664, "lr": 0.00036613259678211187, "tps": 19735, "wall": 22777.1} {"step": 6859, "train_loss": 3.630235195159912, "lr": 0.0003661214101889244, "tps": 19731, "wall": 22785.1} {"step": 6860, "train_loss": 3.6198666095733643, "lr": 0.00036611022194046574, "tps": 19727, "wall": 22793.1} {"step": 6861, "train_loss": 3.6908493041992188, "lr": 0.0003660990320368626, "tps": 19723, "wall": 22801.2} {"step": 6862, "train_loss": 3.6959445476531982, "lr": 0.00036608784047824166, "tps": 19719, "wall": 22809.1} {"step": 6863, "train_loss": 3.5715620517730713, "lr": 0.00036607664726472983, "tps": 19715, "wall": 22817.1} {"step": 6864, "train_loss": 3.6511545181274414, "lr": 0.00036606545239645374, "tps": 19711, "wall": 22825.0} {"step": 6865, "train_loss": 3.6241676807403564, "lr": 0.0003660542558735404, "tps": 19706, "wall": 22833.1} {"step": 6866, "train_loss": 3.6280951499938965, "lr": 0.00036604305769611647, "tps": 19702, "wall": 22841.0} {"step": 6867, "train_loss": 3.697892189025879, "lr": 0.000366031857864309, "tps": 19698, "wall": 22849.0} {"step": 6868, "train_loss": 3.72792387008667, "lr": 0.0003660206563782446, "tps": 19694, "wall": 22857.0} {"step": 6869, "train_loss": 3.598301887512207, "lr": 0.00036600945323805043, "tps": 19690, "wall": 22865.0} {"step": 6870, "train_loss": 3.6164469718933105, "lr": 0.00036599824844385314, "tps": 19687, "wall": 22872.9} {"step": 6871, "train_loss": 3.6196017265319824, "lr": 0.00036598704199577986, "tps": 19683, "wall": 22880.7} {"step": 6872, "train_loss": 3.727928638458252, "lr": 0.0003659758338939575, "tps": 19679, "wall": 22888.7} {"step": 6873, "train_loss": 3.6348226070404053, "lr": 0.000365964624138513, "tps": 19675, "wall": 22896.7} {"step": 6874, "train_loss": 3.7042365074157715, "lr": 0.0003659534127295733, "tps": 19671, "wall": 22904.7} {"step": 6875, "train_loss": 3.629845380783081, "lr": 0.00036594219966726543, "tps": 19667, "wall": 22912.5} {"step": 6876, "train_loss": 3.5967109203338623, "lr": 0.00036593098495171653, "tps": 19663, "wall": 22920.5} {"step": 6877, "train_loss": 3.6247076988220215, "lr": 0.00036591976858305346, "tps": 19659, "wall": 22928.4} {"step": 6878, "train_loss": 3.655517101287842, "lr": 0.0003659085505614033, "tps": 19655, "wall": 22936.3} {"step": 6879, "train_loss": 3.7389683723449707, "lr": 0.0003658973308868933, "tps": 19651, "wall": 22944.1} {"step": 6880, "train_loss": 3.604222297668457, "lr": 0.0003658861095596503, "tps": 19647, "wall": 22952.1} {"step": 6881, "train_loss": 3.652705192565918, "lr": 0.0003658748865798017, "tps": 19643, "wall": 22960.1} {"step": 6882, "train_loss": 3.81777024269104, "lr": 0.00036586366194747444, "tps": 19639, "wall": 22968.2} {"step": 6883, "train_loss": 3.7021689414978027, "lr": 0.0003658524356627957, "tps": 19635, "wall": 22976.2} {"step": 6884, "train_loss": 3.686588764190674, "lr": 0.00036584120772589274, "tps": 19631, "wall": 22984.1} {"step": 6885, "train_loss": 3.640829086303711, "lr": 0.00036582997813689263, "tps": 19627, "wall": 22991.9} {"step": 6886, "train_loss": 3.6182875633239746, "lr": 0.00036581874689592273, "tps": 19623, "wall": 22999.8} {"step": 6887, "train_loss": 3.644571304321289, "lr": 0.0003658075140031101, "tps": 19619, "wall": 23007.8} {"step": 6888, "train_loss": 3.669762134552002, "lr": 0.00036579627945858203, "tps": 19615, "wall": 23015.8} {"step": 6889, "train_loss": 3.697334051132202, "lr": 0.00036578504326246586, "tps": 19611, "wall": 23023.9} {"step": 6890, "train_loss": 3.6122894287109375, "lr": 0.00036577380541488887, "tps": 19608, "wall": 23031.8} {"step": 6891, "train_loss": 3.6122093200683594, "lr": 0.0003657625659159783, "tps": 19604, "wall": 23039.7} {"step": 6892, "train_loss": 3.7145473957061768, "lr": 0.00036575132476586144, "tps": 19600, "wall": 23047.6} {"step": 6893, "train_loss": 3.701415777206421, "lr": 0.0003657400819646658, "tps": 19596, "wall": 23055.4} {"step": 6894, "train_loss": 3.6707444190979004, "lr": 0.00036572883751251854, "tps": 19592, "wall": 23063.4} {"step": 6895, "train_loss": 3.60768461227417, "lr": 0.00036571759140954714, "tps": 19588, "wall": 23071.3} {"step": 6896, "train_loss": 3.625415802001953, "lr": 0.000365706343655879, "tps": 19584, "wall": 23079.2} {"step": 6897, "train_loss": 3.66334867477417, "lr": 0.0003656950942516415, "tps": 19580, "wall": 23087.2} {"step": 6898, "train_loss": 3.7011075019836426, "lr": 0.0003656838431969621, "tps": 19576, "wall": 23095.2} {"step": 6899, "train_loss": 3.6276633739471436, "lr": 0.00036567259049196825, "tps": 19573, "wall": 23103.0} {"step": 6900, "train_loss": 3.7089109420776367, "lr": 0.00036566133613678744, "tps": 19569, "wall": 23110.8} {"step": 6901, "train_loss": 3.6738076210021973, "lr": 0.0003656500801315471, "tps": 19565, "wall": 23118.8} {"step": 6902, "train_loss": 3.67539381980896, "lr": 0.0003656388224763747, "tps": 19561, "wall": 23126.7} {"step": 6903, "train_loss": 3.6530604362487793, "lr": 0.00036562756317139796, "tps": 19557, "wall": 23134.5} {"step": 6904, "train_loss": 3.689999580383301, "lr": 0.00036561630221674423, "tps": 19554, "wall": 23142.4} {"step": 6905, "train_loss": 3.645627021789551, "lr": 0.0003656050396125412, "tps": 19550, "wall": 23150.4} {"step": 6906, "train_loss": 3.590200424194336, "lr": 0.0003655937753589164, "tps": 19546, "wall": 23158.3} {"step": 6907, "train_loss": 3.6815645694732666, "lr": 0.00036558250945599745, "tps": 19542, "wall": 23166.2} {"step": 6908, "train_loss": 3.647307872772217, "lr": 0.00036557124190391186, "tps": 19538, "wall": 23174.1} {"step": 6909, "train_loss": 3.533891201019287, "lr": 0.0003655599727027875, "tps": 19534, "wall": 23181.9} {"step": 6910, "train_loss": 3.7311787605285645, "lr": 0.0003655487018527518, "tps": 19530, "wall": 23190.0} {"step": 6911, "train_loss": 3.5938327312469482, "lr": 0.00036553742935393254, "tps": 19527, "wall": 23197.8} {"step": 6912, "train_loss": 3.6257622241973877, "lr": 0.00036552615520645746, "tps": 19523, "wall": 23205.6} {"step": 6913, "train_loss": 3.82141375541687, "lr": 0.0003655148794104541, "tps": 19519, "wall": 23213.6} {"step": 6914, "train_loss": 3.6242127418518066, "lr": 0.00036550360196605045, "tps": 19515, "wall": 23221.5} {"step": 6915, "train_loss": 3.6131768226623535, "lr": 0.000365492322873374, "tps": 19511, "wall": 23229.2} {"step": 6916, "train_loss": 3.619520902633667, "lr": 0.00036548104213255284, "tps": 19508, "wall": 23237.2} {"step": 6917, "train_loss": 3.677443742752075, "lr": 0.0003654697597437144, "tps": 19504, "wall": 23245.1} {"step": 6918, "train_loss": 3.6651623249053955, "lr": 0.00036545847570698675, "tps": 19500, "wall": 23252.9} {"step": 6919, "train_loss": 3.5792019367218018, "lr": 0.00036544719002249755, "tps": 19496, "wall": 23260.8} {"step": 6920, "train_loss": 3.6369552612304688, "lr": 0.0003654359026903747, "tps": 19492, "wall": 23268.8} {"step": 6921, "train_loss": 3.548482656478882, "lr": 0.0003654246137107461, "tps": 19489, "wall": 23276.7} {"step": 6922, "train_loss": 3.7402024269104004, "lr": 0.0003654133230837396, "tps": 19485, "wall": 23284.6} {"step": 6923, "train_loss": 3.639800786972046, "lr": 0.00036540203080948313, "tps": 19481, "wall": 23292.4} {"step": 6924, "train_loss": 3.693615674972534, "lr": 0.0003653907368881046, "tps": 19477, "wall": 23300.3} {"step": 6925, "train_loss": 3.5581281185150146, "lr": 0.00036537944131973194, "tps": 19473, "wall": 23308.2} {"step": 6926, "train_loss": 3.683631420135498, "lr": 0.00036536814410449307, "tps": 19470, "wall": 23316.0} {"step": 6927, "train_loss": 3.6612191200256348, "lr": 0.00036535684524251596, "tps": 19466, "wall": 23324.0} {"step": 6928, "train_loss": 3.686615467071533, "lr": 0.00036534554473392875, "tps": 19462, "wall": 23331.9} {"step": 6929, "train_loss": 3.752819776535034, "lr": 0.0003653342425788592, "tps": 19458, "wall": 23339.8} {"step": 6930, "train_loss": 3.673020362854004, "lr": 0.0003653229387774356, "tps": 19454, "wall": 23347.8} {"step": 6931, "train_loss": 3.6641969680786133, "lr": 0.0003653116333297859, "tps": 19451, "wall": 23355.7} {"step": 6932, "train_loss": 3.638719320297241, "lr": 0.0003653003262360381, "tps": 19447, "wall": 23363.7} {"step": 6933, "train_loss": 3.696444034576416, "lr": 0.00036528901749632045, "tps": 19443, "wall": 23371.5} {"step": 6934, "train_loss": 3.6626205444335938, "lr": 0.00036527770711076085, "tps": 19439, "wall": 23379.4} {"step": 6935, "train_loss": 3.585139751434326, "lr": 0.0003652663950794875, "tps": 19436, "wall": 23387.3} {"step": 6936, "train_loss": 3.6074273586273193, "lr": 0.00036525508140262865, "tps": 19432, "wall": 23395.3} {"step": 6937, "train_loss": 3.6367292404174805, "lr": 0.0003652437660803123, "tps": 19428, "wall": 23403.1} {"step": 6938, "train_loss": 3.646955966949463, "lr": 0.00036523244911266676, "tps": 19424, "wall": 23410.9} {"step": 6939, "train_loss": 3.646684408187866, "lr": 0.00036522113049982014, "tps": 19421, "wall": 23418.8} {"step": 6940, "train_loss": 3.686594009399414, "lr": 0.0003652098102419008, "tps": 19417, "wall": 23426.7} {"step": 6941, "train_loss": 3.631779432296753, "lr": 0.00036519848833903675, "tps": 19413, "wall": 23434.7} {"step": 6942, "train_loss": 3.6455202102661133, "lr": 0.0003651871647913564, "tps": 19409, "wall": 23442.5} {"step": 6943, "train_loss": 3.579475164413452, "lr": 0.000365175839598988, "tps": 19406, "wall": 23450.4} {"step": 6944, "train_loss": 3.699767589569092, "lr": 0.0003651645127620598, "tps": 19402, "wall": 23458.3} {"step": 6945, "train_loss": 3.6330790519714355, "lr": 0.0003651531842807003, "tps": 19398, "wall": 23466.2} {"step": 6946, "train_loss": 3.729097366333008, "lr": 0.00036514185415503753, "tps": 19394, "wall": 23474.1} {"step": 6947, "train_loss": 3.6428518295288086, "lr": 0.0003651305223852, "tps": 19391, "wall": 23481.9} {"step": 6948, "train_loss": 3.5563807487487793, "lr": 0.0003651191889713161, "tps": 19387, "wall": 23489.8} {"step": 6949, "train_loss": 3.63912034034729, "lr": 0.00036510785391351416, "tps": 19383, "wall": 23497.7} {"step": 6950, "train_loss": 3.65519380569458, "lr": 0.0003650965172119226, "tps": 19380, "wall": 23505.5} {"step": 6951, "train_loss": 3.638138771057129, "lr": 0.00036508517886666987, "tps": 19376, "wall": 23513.4} {"step": 6952, "train_loss": 3.664369583129883, "lr": 0.00036507383887788436, "tps": 19372, "wall": 23521.3} {"step": 6953, "train_loss": 3.672069549560547, "lr": 0.0003650624972456945, "tps": 19369, "wall": 23529.1} {"step": 6954, "train_loss": 3.6918792724609375, "lr": 0.0003650511539702289, "tps": 19365, "wall": 23536.9} {"step": 6955, "train_loss": 3.6046204566955566, "lr": 0.00036503980905161596, "tps": 19361, "wall": 23544.7} {"step": 6956, "train_loss": 3.6234853267669678, "lr": 0.00036502846248998423, "tps": 19358, "wall": 23552.6} {"step": 6957, "train_loss": 3.5955810546875, "lr": 0.00036501711428546226, "tps": 19354, "wall": 23560.5} {"step": 6958, "train_loss": 3.6116058826446533, "lr": 0.0003650057644381785, "tps": 19350, "wall": 23568.4} {"step": 6959, "train_loss": 3.7029783725738525, "lr": 0.00036499441294826157, "tps": 19346, "wall": 23576.3} {"step": 6960, "train_loss": 3.673654556274414, "lr": 0.0003649830598158402, "tps": 19343, "wall": 23584.1} {"step": 6961, "train_loss": 3.7608306407928467, "lr": 0.0003649717050410428, "tps": 19339, "wall": 23591.9} {"step": 6962, "train_loss": 3.649453639984131, "lr": 0.0003649603486239981, "tps": 19336, "wall": 23599.7} {"step": 6963, "train_loss": 3.6115496158599854, "lr": 0.0003649489905648348, "tps": 19332, "wall": 23607.7} {"step": 6964, "train_loss": 3.681130886077881, "lr": 0.00036493763086368136, "tps": 19328, "wall": 23615.5} {"step": 6965, "train_loss": 3.6554336547851562, "lr": 0.0003649262695206667, "tps": 19324, "wall": 23623.5} {"step": 6966, "train_loss": 3.642169952392578, "lr": 0.0003649149065359194, "tps": 19321, "wall": 23631.2} {"step": 6967, "train_loss": 3.6029374599456787, "lr": 0.00036490354190956814, "tps": 19317, "wall": 23639.0} {"step": 6968, "train_loss": 3.668337345123291, "lr": 0.0003648921756417418, "tps": 19314, "wall": 23646.8} {"step": 6969, "train_loss": 3.55822491645813, "lr": 0.000364880807732569, "tps": 19310, "wall": 23654.8} {"step": 6970, "train_loss": 3.6652231216430664, "lr": 0.0003648694381821786, "tps": 19306, "wall": 23662.6} {"step": 6971, "train_loss": 3.663727045059204, "lr": 0.00036485806699069936, "tps": 19303, "wall": 23670.4} {"step": 6972, "train_loss": 3.780482530593872, "lr": 0.0003648466941582601, "tps": 19299, "wall": 23678.3} {"step": 6973, "train_loss": 3.5429000854492188, "lr": 0.0003648353196849897, "tps": 19295, "wall": 23686.2} {"step": 6974, "train_loss": 3.6269450187683105, "lr": 0.00036482394357101685, "tps": 19292, "wall": 23694.1} {"step": 6975, "train_loss": 3.7979612350463867, "lr": 0.0003648125658164706, "tps": 19288, "wall": 23701.8} {"step": 6976, "train_loss": 3.5978498458862305, "lr": 0.0003648011864214798, "tps": 19285, "wall": 23709.7} {"step": 6977, "train_loss": 3.6958823204040527, "lr": 0.00036478980538617325, "tps": 19281, "wall": 23717.5} {"step": 6978, "train_loss": 3.6135377883911133, "lr": 0.00036477842271068005, "tps": 19277, "wall": 23725.4} {"step": 6979, "train_loss": 3.5577902793884277, "lr": 0.000364767038395129, "tps": 19274, "wall": 23733.1} {"step": 6980, "train_loss": 3.6694459915161133, "lr": 0.00036475565243964905, "tps": 19270, "wall": 23741.1} {"step": 6981, "train_loss": 3.7375941276550293, "lr": 0.0003647442648443693, "tps": 19267, "wall": 23748.9} {"step": 6982, "train_loss": 3.7346060276031494, "lr": 0.0003647328756094186, "tps": 19263, "wall": 23756.7} {"step": 6983, "train_loss": 3.6267290115356445, "lr": 0.0003647214847349262, "tps": 19259, "wall": 23764.5} {"step": 6984, "train_loss": 3.6371538639068604, "lr": 0.0003647100922210209, "tps": 19256, "wall": 23772.4} {"step": 6985, "train_loss": 3.620845079421997, "lr": 0.0003646986980678319, "tps": 19252, "wall": 23780.2} {"step": 6986, "train_loss": 3.7457737922668457, "lr": 0.00036468730227548815, "tps": 19249, "wall": 23788.2} {"step": 6987, "train_loss": 3.653672695159912, "lr": 0.00036467590484411886, "tps": 19245, "wall": 23796.0} {"step": 6988, "train_loss": 3.6746835708618164, "lr": 0.00036466450577385303, "tps": 19241, "wall": 23804.1} {"step": 6989, "train_loss": 3.673196792602539, "lr": 0.00036465310506481996, "tps": 19238, "wall": 23811.8} {"step": 6990, "train_loss": 3.6307268142700195, "lr": 0.00036464170271714865, "tps": 19234, "wall": 23819.6} {"step": 6991, "train_loss": 3.6856980323791504, "lr": 0.00036463029873096825, "tps": 19231, "wall": 23827.4} {"step": 6992, "train_loss": 3.723646640777588, "lr": 0.00036461889310640804, "tps": 19227, "wall": 23835.3} {"step": 6993, "train_loss": 3.7110209465026855, "lr": 0.0003646074858435972, "tps": 19223, "wall": 23843.2} {"step": 6994, "train_loss": 3.6089563369750977, "lr": 0.00036459607694266493, "tps": 19220, "wall": 23851.1} {"step": 6995, "train_loss": 3.6371312141418457, "lr": 0.0003645846664037405, "tps": 19216, "wall": 23858.9} {"step": 6996, "train_loss": 3.5787556171417236, "lr": 0.0003645732542269531, "tps": 19212, "wall": 23867.0} {"step": 6997, "train_loss": 3.577626943588257, "lr": 0.0003645618404124321, "tps": 19209, "wall": 23875.0} {"step": 6998, "train_loss": 3.5624256134033203, "lr": 0.0003645504249603067, "tps": 19205, "wall": 23882.8} {"step": 6999, "train_loss": 3.6420774459838867, "lr": 0.0003645390078707063, "tps": 19202, "wall": 23890.7} {"step": 7000, "train_loss": 3.6802563667297363, "lr": 0.0003645275891437602, "tps": 19198, "wall": 23898.6, "val_loss_monitor": 3.6700399161117225} {"step": 7001, "train_loss": 3.6346817016601562, "lr": 0.0003645161687795978, "tps": 19155, "wall": 23955.9} {"step": 7002, "train_loss": 3.6252903938293457, "lr": 0.0003645047467783483, "tps": 19151, "wall": 23964.0} {"step": 7003, "train_loss": 3.5818934440612793, "lr": 0.00036449332314014124, "tps": 19147, "wall": 23972.2} {"step": 7004, "train_loss": 3.515336036682129, "lr": 0.00036448189786510604, "tps": 19143, "wall": 23980.4} {"step": 7005, "train_loss": 3.622802734375, "lr": 0.0003644704709533721, "tps": 19139, "wall": 23988.8} {"step": 7006, "train_loss": 3.6247544288635254, "lr": 0.00036445904240506885, "tps": 19136, "wall": 23997.0} {"step": 7007, "train_loss": 3.680034637451172, "lr": 0.0003644476122203257, "tps": 19132, "wall": 24005.0} {"step": 7008, "train_loss": 3.543510675430298, "lr": 0.00036443618039927217, "tps": 19128, "wall": 24013.3} {"step": 7009, "train_loss": 3.7021100521087646, "lr": 0.00036442474694203786, "tps": 19124, "wall": 24021.3} {"step": 7010, "train_loss": 3.6293914318084717, "lr": 0.0003644133118487522, "tps": 19121, "wall": 24029.6} {"step": 7011, "train_loss": 3.5751161575317383, "lr": 0.00036440187511954463, "tps": 19117, "wall": 24037.7} {"step": 7012, "train_loss": 3.599163055419922, "lr": 0.0003643904367545449, "tps": 19113, "wall": 24045.9} {"step": 7013, "train_loss": 3.650193929672241, "lr": 0.00036437899675388245, "tps": 19109, "wall": 24054.1} {"step": 7014, "train_loss": 3.609687328338623, "lr": 0.00036436755511768694, "tps": 19106, "wall": 24062.2} {"step": 7015, "train_loss": 3.6211352348327637, "lr": 0.000364356111846088, "tps": 19102, "wall": 24070.3} {"step": 7016, "train_loss": 3.5958619117736816, "lr": 0.00036434466693921507, "tps": 19098, "wall": 24078.5} {"step": 7017, "train_loss": 3.6610093116760254, "lr": 0.00036433322039719805, "tps": 19094, "wall": 24086.8} {"step": 7018, "train_loss": 3.6936540603637695, "lr": 0.00036432177222016647, "tps": 19091, "wall": 24094.8} {"step": 7019, "train_loss": 3.6246931552886963, "lr": 0.0003643103224082501, "tps": 19087, "wall": 24103.1} {"step": 7020, "train_loss": 3.604872226715088, "lr": 0.00036429887096157856, "tps": 19083, "wall": 24111.1} {"step": 7021, "train_loss": 3.7655444145202637, "lr": 0.00036428741788028157, "tps": 19079, "wall": 24119.3} {"step": 7022, "train_loss": 3.7263617515563965, "lr": 0.0003642759631644889, "tps": 19076, "wall": 24127.3} {"step": 7023, "train_loss": 3.6038732528686523, "lr": 0.0003642645068143304, "tps": 19072, "wall": 24135.3} {"step": 7024, "train_loss": 3.6763622760772705, "lr": 0.00036425304882993563, "tps": 19068, "wall": 24143.4} {"step": 7025, "train_loss": 3.6070704460144043, "lr": 0.00036424158921143465, "tps": 19065, "wall": 24151.6} {"step": 7026, "train_loss": 3.643301248550415, "lr": 0.0003642301279589571, "tps": 19061, "wall": 24159.6} {"step": 7027, "train_loss": 3.6768088340759277, "lr": 0.0003642186650726328, "tps": 19057, "wall": 24167.9} {"step": 7028, "train_loss": 3.625361442565918, "lr": 0.0003642072005525917, "tps": 19054, "wall": 24176.1} {"step": 7029, "train_loss": 3.4993317127227783, "lr": 0.0003641957343989636, "tps": 19050, "wall": 24184.2} {"step": 7030, "train_loss": 3.5897254943847656, "lr": 0.0003641842666118785, "tps": 19046, "wall": 24192.1} {"step": 7031, "train_loss": 3.6514203548431396, "lr": 0.00036417279719146617, "tps": 19043, "wall": 24200.3} {"step": 7032, "train_loss": 3.6063897609710693, "lr": 0.00036416132613785663, "tps": 19039, "wall": 24208.4} {"step": 7033, "train_loss": 3.6175432205200195, "lr": 0.0003641498534511797, "tps": 19035, "wall": 24216.6} {"step": 7034, "train_loss": 3.7592594623565674, "lr": 0.00036413837913156557, "tps": 19031, "wall": 24224.8} {"step": 7035, "train_loss": 3.663712501525879, "lr": 0.000364126903179144, "tps": 19028, "wall": 24232.8} {"step": 7036, "train_loss": 3.627817153930664, "lr": 0.00036411542559404507, "tps": 19024, "wall": 24240.9} {"step": 7037, "train_loss": 3.6253232955932617, "lr": 0.0003641039463763988, "tps": 19021, "wall": 24248.9} {"step": 7038, "train_loss": 3.616452693939209, "lr": 0.00036409246552633525, "tps": 19017, "wall": 24257.0} {"step": 7039, "train_loss": 3.5891270637512207, "lr": 0.0003640809830439845, "tps": 19013, "wall": 24265.0} {"step": 7040, "train_loss": 3.7208921909332275, "lr": 0.00036406949892947647, "tps": 19010, "wall": 24273.1} {"step": 7041, "train_loss": 3.718669891357422, "lr": 0.0003640580131829414, "tps": 19006, "wall": 24281.1} {"step": 7042, "train_loss": 3.7027106285095215, "lr": 0.0003640465258045094, "tps": 19002, "wall": 24289.4} {"step": 7043, "train_loss": 3.6281566619873047, "lr": 0.0003640350367943105, "tps": 18999, "wall": 24297.4} {"step": 7044, "train_loss": 3.6931395530700684, "lr": 0.000364023546152475, "tps": 18995, "wall": 24305.5} {"step": 7045, "train_loss": 3.6584391593933105, "lr": 0.000364012053879133, "tps": 18992, "wall": 24313.5} {"step": 7046, "train_loss": 3.541919708251953, "lr": 0.0003640005599744146, "tps": 18988, "wall": 24321.7} {"step": 7047, "train_loss": 3.5752241611480713, "lr": 0.00036398906443845, "tps": 18984, "wall": 24329.8} {"step": 7048, "train_loss": 3.680185079574585, "lr": 0.00036397756727136956, "tps": 18981, "wall": 24337.9} {"step": 7049, "train_loss": 3.5880703926086426, "lr": 0.00036396606847330343, "tps": 18977, "wall": 24346.2} {"step": 7050, "train_loss": 3.6517691612243652, "lr": 0.0003639545680443819, "tps": 18973, "wall": 24354.2} {"step": 7051, "train_loss": 3.696723699569702, "lr": 0.0003639430659847353, "tps": 18970, "wall": 24362.3} {"step": 7052, "train_loss": 3.6018033027648926, "lr": 0.0003639315622944938, "tps": 18966, "wall": 24370.4} {"step": 7053, "train_loss": 3.6755542755126953, "lr": 0.0003639200569737877, "tps": 18963, "wall": 24378.4} {"step": 7054, "train_loss": 3.7301712036132812, "lr": 0.00036390855002274753, "tps": 18959, "wall": 24386.5} {"step": 7055, "train_loss": 3.6097211837768555, "lr": 0.00036389704144150346, "tps": 18955, "wall": 24394.6} {"step": 7056, "train_loss": 3.6503920555114746, "lr": 0.00036388553123018597, "tps": 18952, "wall": 24402.6} {"step": 7057, "train_loss": 3.6239748001098633, "lr": 0.00036387401938892534, "tps": 18948, "wall": 24410.8} {"step": 7058, "train_loss": 3.6189286708831787, "lr": 0.00036386250591785205, "tps": 18945, "wall": 24418.9} {"step": 7059, "train_loss": 3.766946792602539, "lr": 0.0003638509908170965, "tps": 18941, "wall": 24427.0} {"step": 7060, "train_loss": 3.596437931060791, "lr": 0.00036383947408678916, "tps": 18937, "wall": 24435.1} {"step": 7061, "train_loss": 3.615854501724243, "lr": 0.00036382795572706053, "tps": 18934, "wall": 24443.2} {"step": 7062, "train_loss": 3.6704294681549072, "lr": 0.0003638164357380409, "tps": 18930, "wall": 24451.3} {"step": 7063, "train_loss": 3.695402145385742, "lr": 0.00036380491411986104, "tps": 18927, "wall": 24459.4} {"step": 7064, "train_loss": 3.5956573486328125, "lr": 0.00036379339087265125, "tps": 18923, "wall": 24467.6} {"step": 7065, "train_loss": 3.6353414058685303, "lr": 0.0003637818659965422, "tps": 18919, "wall": 24475.8} {"step": 7066, "train_loss": 3.5966880321502686, "lr": 0.00036377033949166435, "tps": 18916, "wall": 24483.8} {"step": 7067, "train_loss": 3.656334400177002, "lr": 0.00036375881135814836, "tps": 18912, "wall": 24491.9} {"step": 7068, "train_loss": 3.733581066131592, "lr": 0.00036374728159612477, "tps": 18909, "wall": 24500.0} {"step": 7069, "train_loss": 3.6145761013031006, "lr": 0.0003637357502057242, "tps": 18905, "wall": 24508.0} {"step": 7070, "train_loss": 3.580061197280884, "lr": 0.0003637242171870772, "tps": 18902, "wall": 24516.1} {"step": 7071, "train_loss": 3.6660830974578857, "lr": 0.00036371268254031455, "tps": 18898, "wall": 24524.2} {"step": 7072, "train_loss": 3.747859477996826, "lr": 0.0003637011462655669, "tps": 18894, "wall": 24532.3} {"step": 7073, "train_loss": 3.6481845378875732, "lr": 0.0003636896083629648, "tps": 18891, "wall": 24540.4} {"step": 7074, "train_loss": 3.5663208961486816, "lr": 0.00036367806883263917, "tps": 18887, "wall": 24548.5} {"step": 7075, "train_loss": 3.5796947479248047, "lr": 0.00036366652767472044, "tps": 18884, "wall": 24556.6} {"step": 7076, "train_loss": 3.703507661819458, "lr": 0.0003636549848893396, "tps": 18880, "wall": 24564.7} {"step": 7077, "train_loss": 3.655391216278076, "lr": 0.00036364344047662737, "tps": 18877, "wall": 24572.8} {"step": 7078, "train_loss": 3.659616470336914, "lr": 0.0003636318944367144, "tps": 18873, "wall": 24580.8} {"step": 7079, "train_loss": 3.683971643447876, "lr": 0.0003636203467697316, "tps": 18869, "wall": 24589.1} {"step": 7080, "train_loss": 3.600548028945923, "lr": 0.00036360879747580975, "tps": 18866, "wall": 24597.1} {"step": 7081, "train_loss": 3.6135547161102295, "lr": 0.0003635972465550796, "tps": 18862, "wall": 24605.1} {"step": 7082, "train_loss": 3.7027626037597656, "lr": 0.0003635856940076721, "tps": 18859, "wall": 24613.1} {"step": 7083, "train_loss": 3.6343483924865723, "lr": 0.00036357413983371814, "tps": 18855, "wall": 24621.3} {"step": 7084, "train_loss": 3.5783095359802246, "lr": 0.0003635625840333486, "tps": 18852, "wall": 24629.4} {"step": 7085, "train_loss": 3.7700297832489014, "lr": 0.0003635510266066942, "tps": 18848, "wall": 24637.5} {"step": 7086, "train_loss": 3.5516796112060547, "lr": 0.0003635394675538861, "tps": 18845, "wall": 24645.6} {"step": 7087, "train_loss": 3.664212465286255, "lr": 0.00036352790687505513, "tps": 18841, "wall": 24653.5} {"step": 7088, "train_loss": 3.686100959777832, "lr": 0.0003635163445703322, "tps": 18838, "wall": 24661.6} {"step": 7089, "train_loss": 3.6547791957855225, "lr": 0.00036350478063984845, "tps": 18834, "wall": 24669.6} {"step": 7090, "train_loss": 3.584672212600708, "lr": 0.0003634932150837348, "tps": 18831, "wall": 24677.6} {"step": 7091, "train_loss": 3.7473251819610596, "lr": 0.0003634816479021221, "tps": 18827, "wall": 24685.8} {"step": 7092, "train_loss": 3.613588333129883, "lr": 0.00036347007909514164, "tps": 18824, "wall": 24693.8} {"step": 7093, "train_loss": 3.7054495811462402, "lr": 0.0003634585086629244, "tps": 18821, "wall": 24701.8} {"step": 7094, "train_loss": 3.612116813659668, "lr": 0.0003634469366056013, "tps": 18817, "wall": 24709.9} {"step": 7095, "train_loss": 3.659882068634033, "lr": 0.0003634353629233036, "tps": 18813, "wall": 24718.0} {"step": 7096, "train_loss": 3.8189034461975098, "lr": 0.0003634237876161623, "tps": 18810, "wall": 24726.0} {"step": 7097, "train_loss": 3.7172727584838867, "lr": 0.0003634122106843087, "tps": 18807, "wall": 24734.1} {"step": 7098, "train_loss": 3.608025550842285, "lr": 0.0003634006321278737, "tps": 18803, "wall": 24742.0} {"step": 7099, "train_loss": 3.5797698497772217, "lr": 0.00036338905194698863, "tps": 18800, "wall": 24750.1} {"step": 7100, "train_loss": 3.655895233154297, "lr": 0.0003633774701417846, "tps": 18796, "wall": 24758.0} {"step": 7101, "train_loss": 3.6548709869384766, "lr": 0.00036336588671239284, "tps": 18793, "wall": 24766.0} {"step": 7102, "train_loss": 3.5998213291168213, "lr": 0.0003633543016589446, "tps": 18789, "wall": 24774.2} {"step": 7103, "train_loss": 3.655834197998047, "lr": 0.000363342714981571, "tps": 18786, "wall": 24782.2} {"step": 7104, "train_loss": 3.5759847164154053, "lr": 0.00036333112668040347, "tps": 18782, "wall": 24790.2} {"step": 7105, "train_loss": 3.61704421043396, "lr": 0.0003633195367555731, "tps": 18779, "wall": 24798.3} {"step": 7106, "train_loss": 3.6059422492980957, "lr": 0.0003633079452072113, "tps": 18775, "wall": 24806.4} {"step": 7107, "train_loss": 3.6020588874816895, "lr": 0.00036329635203544933, "tps": 18772, "wall": 24814.4} {"step": 7108, "train_loss": 3.5647356510162354, "lr": 0.00036328475724041855, "tps": 18769, "wall": 24822.4} {"step": 7109, "train_loss": 3.659440517425537, "lr": 0.00036327316082225027, "tps": 18765, "wall": 24830.4} {"step": 7110, "train_loss": 3.7073657512664795, "lr": 0.00036326156278107584, "tps": 18762, "wall": 24838.4} {"step": 7111, "train_loss": 3.6823716163635254, "lr": 0.00036324996311702673, "tps": 18759, "wall": 24846.3} {"step": 7112, "train_loss": 3.61057186126709, "lr": 0.0003632383618302343, "tps": 18755, "wall": 24854.4} {"step": 7113, "train_loss": 3.5666537284851074, "lr": 0.0003632267589208299, "tps": 18752, "wall": 24862.4} {"step": 7114, "train_loss": 3.5727715492248535, "lr": 0.00036321515438894505, "tps": 18748, "wall": 24870.3} {"step": 7115, "train_loss": 3.651686191558838, "lr": 0.0003632035482347112, "tps": 18745, "wall": 24878.4} {"step": 7116, "train_loss": 3.6688899993896484, "lr": 0.0003631919404582598, "tps": 18741, "wall": 24886.4} {"step": 7117, "train_loss": 3.61647891998291, "lr": 0.00036318033105972234, "tps": 18738, "wall": 24894.5} {"step": 7118, "train_loss": 3.6777334213256836, "lr": 0.0003631687200392303, "tps": 18735, "wall": 24902.4} {"step": 7119, "train_loss": 3.530195951461792, "lr": 0.00036315710739691533, "tps": 18731, "wall": 24910.4} {"step": 7120, "train_loss": 3.533473014831543, "lr": 0.0003631454931329089, "tps": 18728, "wall": 24918.4} {"step": 7121, "train_loss": 3.577982187271118, "lr": 0.0003631338772473425, "tps": 18724, "wall": 24926.5} {"step": 7122, "train_loss": 3.7245004177093506, "lr": 0.0003631222597403479, "tps": 18721, "wall": 24934.4} {"step": 7123, "train_loss": 3.635488986968994, "lr": 0.00036311064061205655, "tps": 18718, "wall": 24942.4} {"step": 7124, "train_loss": 3.6775710582733154, "lr": 0.00036309901986260015, "tps": 18714, "wall": 24950.4} {"step": 7125, "train_loss": 3.574711799621582, "lr": 0.00036308739749211025, "tps": 18711, "wall": 24958.4} {"step": 7126, "train_loss": 3.726212501525879, "lr": 0.0003630757735007186, "tps": 18708, "wall": 24966.3} {"step": 7127, "train_loss": 3.643740653991699, "lr": 0.00036306414788855683, "tps": 18704, "wall": 24974.3} {"step": 7128, "train_loss": 3.7623167037963867, "lr": 0.0003630525206557567, "tps": 18701, "wall": 24982.3} {"step": 7129, "train_loss": 3.6906626224517822, "lr": 0.00036304089180244983, "tps": 18698, "wall": 24990.2} {"step": 7130, "train_loss": 3.720674514770508, "lr": 0.00036302926132876804, "tps": 18694, "wall": 24998.3} {"step": 7131, "train_loss": 3.740830421447754, "lr": 0.00036301762923484303, "tps": 18691, "wall": 25006.3} {"step": 7132, "train_loss": 3.606724500656128, "lr": 0.0003630059955208066, "tps": 18688, "wall": 25014.2} {"step": 7133, "train_loss": 3.6408941745758057, "lr": 0.0003629943601867904, "tps": 18684, "wall": 25022.1} {"step": 7134, "train_loss": 3.6020593643188477, "lr": 0.0003629827232329265, "tps": 18681, "wall": 25030.0} {"step": 7135, "train_loss": 3.650871753692627, "lr": 0.00036297108465934655, "tps": 18678, "wall": 25038.0} {"step": 7136, "train_loss": 3.724658966064453, "lr": 0.0003629594444661824, "tps": 18674, "wall": 25045.9} {"step": 7137, "train_loss": 3.6996092796325684, "lr": 0.00036294780265356587, "tps": 18671, "wall": 25053.7} {"step": 7138, "train_loss": 3.630312442779541, "lr": 0.00036293615922162895, "tps": 18668, "wall": 25061.8} {"step": 7139, "train_loss": 3.683706283569336, "lr": 0.00036292451417050347, "tps": 18665, "wall": 25069.7} {"step": 7140, "train_loss": 3.685699939727783, "lr": 0.00036291286750032137, "tps": 18661, "wall": 25077.8} {"step": 7141, "train_loss": 3.550567150115967, "lr": 0.00036290121921121456, "tps": 18658, "wall": 25085.7} {"step": 7142, "train_loss": 3.624816417694092, "lr": 0.000362889569303315, "tps": 18655, "wall": 25093.6} {"step": 7143, "train_loss": 3.7049992084503174, "lr": 0.0003628779177767547, "tps": 18651, "wall": 25101.5} {"step": 7144, "train_loss": 3.576162099838257, "lr": 0.00036286626463166564, "tps": 18648, "wall": 25109.5} {"step": 7145, "train_loss": 3.67425537109375, "lr": 0.00036285460986817974, "tps": 18645, "wall": 25117.5} {"step": 7146, "train_loss": 3.659290313720703, "lr": 0.0003628429534864292, "tps": 18641, "wall": 25125.5} {"step": 7147, "train_loss": 3.663083553314209, "lr": 0.00036283129548654575, "tps": 18638, "wall": 25133.4} {"step": 7148, "train_loss": 3.748565196990967, "lr": 0.0003628196358686618, "tps": 18635, "wall": 25141.4} {"step": 7149, "train_loss": 3.6118712425231934, "lr": 0.00036280797463290936, "tps": 18632, "wall": 25149.2} {"step": 7150, "train_loss": 3.613668918609619, "lr": 0.00036279631177942034, "tps": 18628, "wall": 25157.1} {"step": 7151, "train_loss": 3.5388236045837402, "lr": 0.00036278464730832706, "tps": 18625, "wall": 25165.1} {"step": 7152, "train_loss": 3.546015739440918, "lr": 0.00036277298121976145, "tps": 18622, "wall": 25172.9} {"step": 7153, "train_loss": 3.6570258140563965, "lr": 0.00036276131351385585, "tps": 18619, "wall": 25181.0} {"step": 7154, "train_loss": 3.6370034217834473, "lr": 0.00036274964419074235, "tps": 18615, "wall": 25188.8} {"step": 7155, "train_loss": 3.6291823387145996, "lr": 0.00036273797325055325, "tps": 18612, "wall": 25196.8} {"step": 7156, "train_loss": 3.6749651432037354, "lr": 0.0003627263006934206, "tps": 18609, "wall": 25204.7} {"step": 7157, "train_loss": 3.5539205074310303, "lr": 0.00036271462651947664, "tps": 18606, "wall": 25212.6} {"step": 7158, "train_loss": 3.736978530883789, "lr": 0.00036270295072885373, "tps": 18602, "wall": 25220.5} {"step": 7159, "train_loss": 3.7133398056030273, "lr": 0.0003626912733216841, "tps": 18599, "wall": 25228.5} {"step": 7160, "train_loss": 3.7649221420288086, "lr": 0.0003626795942980999, "tps": 18596, "wall": 25236.4} {"step": 7161, "train_loss": 3.5354058742523193, "lr": 0.0003626679136582337, "tps": 18592, "wall": 25244.5} {"step": 7162, "train_loss": 3.750929355621338, "lr": 0.00036265623140221753, "tps": 18589, "wall": 25252.4} {"step": 7163, "train_loss": 3.8118410110473633, "lr": 0.00036264454753018386, "tps": 18586, "wall": 25260.4} {"step": 7164, "train_loss": 3.674922466278076, "lr": 0.0003626328620422651, "tps": 18583, "wall": 25268.3} {"step": 7165, "train_loss": 3.6672518253326416, "lr": 0.00036262117493859354, "tps": 18579, "wall": 25276.2} {"step": 7166, "train_loss": 3.628110885620117, "lr": 0.0003626094862193015, "tps": 18576, "wall": 25284.2} {"step": 7167, "train_loss": 3.6214962005615234, "lr": 0.00036259779588452163, "tps": 18573, "wall": 25292.1} {"step": 7168, "train_loss": 3.6277191638946533, "lr": 0.00036258610393438614, "tps": 18570, "wall": 25300.1} {"step": 7169, "train_loss": 3.6636016368865967, "lr": 0.00036257441036902755, "tps": 18566, "wall": 25308.0} {"step": 7170, "train_loss": 3.6923837661743164, "lr": 0.00036256271518857837, "tps": 18563, "wall": 25316.0} {"step": 7171, "train_loss": 3.5720884799957275, "lr": 0.00036255101839317096, "tps": 18560, "wall": 25323.9} {"step": 7172, "train_loss": 3.615377187728882, "lr": 0.000362539319982938, "tps": 18557, "wall": 25331.7} {"step": 7173, "train_loss": 3.6771068572998047, "lr": 0.0003625276199580118, "tps": 18554, "wall": 25339.7} {"step": 7174, "train_loss": 3.5945796966552734, "lr": 0.00036251591831852506, "tps": 18550, "wall": 25347.7} {"step": 7175, "train_loss": 3.7140231132507324, "lr": 0.00036250421506461036, "tps": 18547, "wall": 25355.6} {"step": 7176, "train_loss": 3.6510121822357178, "lr": 0.0003624925101964001, "tps": 18544, "wall": 25363.7} {"step": 7177, "train_loss": 3.6406733989715576, "lr": 0.00036248080371402707, "tps": 18541, "wall": 25371.5} {"step": 7178, "train_loss": 3.6556572914123535, "lr": 0.00036246909561762366, "tps": 18537, "wall": 25379.5} {"step": 7179, "train_loss": 3.641291856765747, "lr": 0.00036245738590732276, "tps": 18534, "wall": 25387.4} {"step": 7180, "train_loss": 3.699446678161621, "lr": 0.0003624456745832568, "tps": 18531, "wall": 25395.3} {"step": 7181, "train_loss": 3.6592934131622314, "lr": 0.0003624339616455586, "tps": 18528, "wall": 25403.2} {"step": 7182, "train_loss": 3.5213124752044678, "lr": 0.00036242224709436075, "tps": 18525, "wall": 25411.1} {"step": 7183, "train_loss": 3.612424373626709, "lr": 0.0003624105309297959, "tps": 18522, "wall": 25419.0} {"step": 7184, "train_loss": 3.65341854095459, "lr": 0.000362398813151997, "tps": 18518, "wall": 25427.0} {"step": 7185, "train_loss": 3.6744613647460938, "lr": 0.00036238709376109653, "tps": 18515, "wall": 25434.9} {"step": 7186, "train_loss": 3.6810030937194824, "lr": 0.0003623753727572274, "tps": 18512, "wall": 25442.8} {"step": 7187, "train_loss": 3.6707069873809814, "lr": 0.0003623636501405223, "tps": 18509, "wall": 25450.6} {"step": 7188, "train_loss": 3.551737070083618, "lr": 0.0003623519259111141, "tps": 18506, "wall": 25458.5} {"step": 7189, "train_loss": 3.660494089126587, "lr": 0.0003623402000691356, "tps": 18503, "wall": 25466.3} {"step": 7190, "train_loss": 3.6018660068511963, "lr": 0.0003623284726147196, "tps": 18499, "wall": 25474.3} {"step": 7191, "train_loss": 3.68516206741333, "lr": 0.00036231674354799895, "tps": 18496, "wall": 25482.2} {"step": 7192, "train_loss": 3.6109249591827393, "lr": 0.00036230501286910655, "tps": 18493, "wall": 25490.1} {"step": 7193, "train_loss": 3.6145942211151123, "lr": 0.00036229328057817525, "tps": 18490, "wall": 25498.0} {"step": 7194, "train_loss": 3.5591158866882324, "lr": 0.00036228154667533797, "tps": 18487, "wall": 25505.9} {"step": 7195, "train_loss": 3.5724740028381348, "lr": 0.00036226981116072764, "tps": 18484, "wall": 25513.7} {"step": 7196, "train_loss": 3.7009575366973877, "lr": 0.0003622580740344772, "tps": 18480, "wall": 25521.6} {"step": 7197, "train_loss": 3.7456178665161133, "lr": 0.0003622463352967196, "tps": 18477, "wall": 25529.6} {"step": 7198, "train_loss": 3.676807403564453, "lr": 0.0003622345949475878, "tps": 18474, "wall": 25537.4} {"step": 7199, "train_loss": 3.577744960784912, "lr": 0.0003622228529872148, "tps": 18471, "wall": 25545.3} {"step": 7200, "train_loss": 3.616770029067993, "lr": 0.0003622111094157337, "tps": 18468, "wall": 25553.2} {"step": 7201, "train_loss": 3.585205078125, "lr": 0.0003621993642332774, "tps": 18465, "wall": 25561.3} {"step": 7202, "train_loss": 3.6699488162994385, "lr": 0.000362187617439979, "tps": 18461, "wall": 25569.1} {"step": 7203, "train_loss": 3.5646886825561523, "lr": 0.0003621758690359716, "tps": 18458, "wall": 25577.1} {"step": 7204, "train_loss": 3.6079838275909424, "lr": 0.0003621641190213883, "tps": 18455, "wall": 25585.1} {"step": 7205, "train_loss": 3.675001859664917, "lr": 0.0003621523673963621, "tps": 18452, "wall": 25593.1} {"step": 7206, "train_loss": 3.6871800422668457, "lr": 0.00036214061416102623, "tps": 18449, "wall": 25600.8} {"step": 7207, "train_loss": 3.6548266410827637, "lr": 0.0003621288593155138, "tps": 18446, "wall": 25608.9} {"step": 7208, "train_loss": 3.6690049171447754, "lr": 0.0003621171028599579, "tps": 18442, "wall": 25616.8} {"step": 7209, "train_loss": 3.624077796936035, "lr": 0.00036210534479449183, "tps": 18439, "wall": 25624.5} {"step": 7210, "train_loss": 3.5793213844299316, "lr": 0.0003620935851192487, "tps": 18436, "wall": 25632.4} {"step": 7211, "train_loss": 3.693361759185791, "lr": 0.00036208182383436183, "tps": 18433, "wall": 25640.2} {"step": 7212, "train_loss": 3.658684492111206, "lr": 0.0003620700609399642, "tps": 18430, "wall": 25648.1} {"step": 7213, "train_loss": 3.519493818283081, "lr": 0.0003620582964361894, "tps": 18427, "wall": 25655.9} {"step": 7214, "train_loss": 3.707876205444336, "lr": 0.00036204653032317045, "tps": 18424, "wall": 25664.0} {"step": 7215, "train_loss": 3.573812246322632, "lr": 0.0003620347626010408, "tps": 18421, "wall": 25671.8} {"step": 7216, "train_loss": 3.619821786880493, "lr": 0.00036202299326993357, "tps": 18418, "wall": 25679.7} {"step": 7217, "train_loss": 3.738222599029541, "lr": 0.00036201122232998225, "tps": 18415, "wall": 25687.6} {"step": 7218, "train_loss": 3.5644888877868652, "lr": 0.0003619994497813201, "tps": 18412, "wall": 25695.4} {"step": 7219, "train_loss": 3.625520944595337, "lr": 0.0003619876756240805, "tps": 18408, "wall": 25703.3} {"step": 7220, "train_loss": 3.64743971824646, "lr": 0.0003619758998583969, "tps": 18405, "wall": 25711.0} {"step": 7221, "train_loss": 3.698664426803589, "lr": 0.00036196412248440255, "tps": 18402, "wall": 25718.8} {"step": 7222, "train_loss": 3.73600435256958, "lr": 0.00036195234350223097, "tps": 18399, "wall": 25726.8} {"step": 7223, "train_loss": 3.6454458236694336, "lr": 0.0003619405629120155, "tps": 18396, "wall": 25734.6} {"step": 7224, "train_loss": 3.682185173034668, "lr": 0.0003619287807138897, "tps": 18393, "wall": 25742.5} {"step": 7225, "train_loss": 3.5788826942443848, "lr": 0.00036191699690798704, "tps": 18390, "wall": 25750.3} {"step": 7226, "train_loss": 3.6187641620635986, "lr": 0.0003619052114944409, "tps": 18387, "wall": 25758.1} {"step": 7227, "train_loss": 3.6295838356018066, "lr": 0.00036189342447338484, "tps": 18384, "wall": 25766.0} {"step": 7228, "train_loss": 3.6214523315429688, "lr": 0.00036188163584495247, "tps": 18381, "wall": 25773.8} {"step": 7229, "train_loss": 3.7599997520446777, "lr": 0.00036186984560927717, "tps": 18378, "wall": 25781.6} {"step": 7230, "train_loss": 3.6595749855041504, "lr": 0.0003618580537664926, "tps": 18375, "wall": 25789.7} {"step": 7231, "train_loss": 3.5634121894836426, "lr": 0.00036184626031673234, "tps": 18372, "wall": 25797.6} {"step": 7232, "train_loss": 3.6300430297851562, "lr": 0.00036183446526012996, "tps": 18369, "wall": 25805.4} {"step": 7233, "train_loss": 3.661649227142334, "lr": 0.0003618226685968191, "tps": 18366, "wall": 25813.2} {"step": 7234, "train_loss": 3.6724963188171387, "lr": 0.00036181087032693336, "tps": 18363, "wall": 25821.0} {"step": 7235, "train_loss": 3.6922695636749268, "lr": 0.0003617990704506064, "tps": 18359, "wall": 25828.9} {"step": 7236, "train_loss": 3.630035400390625, "lr": 0.00036178726896797194, "tps": 18356, "wall": 25836.7} {"step": 7237, "train_loss": 3.6511409282684326, "lr": 0.00036177546587916364, "tps": 18353, "wall": 25844.8} {"step": 7238, "train_loss": 3.7836384773254395, "lr": 0.00036176366118431517, "tps": 18350, "wall": 25852.5} {"step": 7239, "train_loss": 3.614319086074829, "lr": 0.0003617518548835602, "tps": 18347, "wall": 25860.4} {"step": 7240, "train_loss": 3.6734838485717773, "lr": 0.00036174004697703266, "tps": 18344, "wall": 25868.2} {"step": 7241, "train_loss": 3.5538182258605957, "lr": 0.00036172823746486615, "tps": 18341, "wall": 25876.1} {"step": 7242, "train_loss": 3.5861129760742188, "lr": 0.00036171642634719446, "tps": 18338, "wall": 25883.9} {"step": 7243, "train_loss": 3.6299328804016113, "lr": 0.00036170461362415146, "tps": 18335, "wall": 25891.8} {"step": 7244, "train_loss": 3.625641345977783, "lr": 0.00036169279929587096, "tps": 18332, "wall": 25899.5} {"step": 7245, "train_loss": 3.598599910736084, "lr": 0.00036168098336248673, "tps": 18329, "wall": 25907.5} {"step": 7246, "train_loss": 3.5111517906188965, "lr": 0.0003616691658241327, "tps": 18326, "wall": 25915.4} {"step": 7247, "train_loss": 3.566781520843506, "lr": 0.00036165734668094267, "tps": 18323, "wall": 25923.2} {"step": 7248, "train_loss": 3.588834285736084, "lr": 0.00036164552593305054, "tps": 18320, "wall": 25931.0} {"step": 7249, "train_loss": 3.591860055923462, "lr": 0.00036163370358059015, "tps": 18317, "wall": 25938.7} {"step": 7250, "train_loss": 3.628127098083496, "lr": 0.00036162187962369567, "tps": 18314, "wall": 25946.7} {"step": 7251, "train_loss": 3.624323844909668, "lr": 0.0003616100540625008, "tps": 18311, "wall": 25954.5} {"step": 7252, "train_loss": 3.5804176330566406, "lr": 0.00036159822689713956, "tps": 18308, "wall": 25962.4} {"step": 7253, "train_loss": 3.6064565181732178, "lr": 0.0003615863981277459, "tps": 18305, "wall": 25970.3} {"step": 7254, "train_loss": 3.784574031829834, "lr": 0.00036157456775445394, "tps": 18302, "wall": 25978.1} {"step": 7255, "train_loss": 3.684894323348999, "lr": 0.00036156273577739756, "tps": 18299, "wall": 25986.0} {"step": 7256, "train_loss": 3.594226837158203, "lr": 0.0003615509021967109, "tps": 18296, "wall": 25993.9} {"step": 7257, "train_loss": 3.6385576725006104, "lr": 0.00036153906701252793, "tps": 18293, "wall": 26001.7} {"step": 7258, "train_loss": 3.664987325668335, "lr": 0.00036152723022498285, "tps": 18290, "wall": 26009.6} {"step": 7259, "train_loss": 3.644186019897461, "lr": 0.0003615153918342095, "tps": 18287, "wall": 26017.4} {"step": 7260, "train_loss": 3.6684069633483887, "lr": 0.00036150355184034225, "tps": 18284, "wall": 26025.3} {"step": 7261, "train_loss": 3.573354959487915, "lr": 0.00036149171024351507, "tps": 18281, "wall": 26033.1} {"step": 7262, "train_loss": 3.756014347076416, "lr": 0.0003614798670438621, "tps": 18278, "wall": 26041.0} {"step": 7263, "train_loss": 3.6817402839660645, "lr": 0.0003614680222415176, "tps": 18275, "wall": 26048.8} {"step": 7264, "train_loss": 3.600442886352539, "lr": 0.0003614561758366157, "tps": 18272, "wall": 26056.6} {"step": 7265, "train_loss": 3.7066426277160645, "lr": 0.00036144432782929056, "tps": 18269, "wall": 26064.5} {"step": 7266, "train_loss": 3.7114241123199463, "lr": 0.0003614324782196764, "tps": 18266, "wall": 26072.3} {"step": 7267, "train_loss": 3.631193161010742, "lr": 0.00036142062700790745, "tps": 18263, "wall": 26080.0} {"step": 7268, "train_loss": 3.609300374984741, "lr": 0.000361408774194118, "tps": 18260, "wall": 26087.9} {"step": 7269, "train_loss": 3.736908197402954, "lr": 0.0003613969197784424, "tps": 18257, "wall": 26095.8} {"step": 7270, "train_loss": 3.6657063961029053, "lr": 0.0003613850637610148, "tps": 18254, "wall": 26103.7} {"step": 7271, "train_loss": 3.668729305267334, "lr": 0.00036137320614196955, "tps": 18251, "wall": 26111.5} {"step": 7272, "train_loss": 3.582136392593384, "lr": 0.0003613613469214409, "tps": 18248, "wall": 26119.2} {"step": 7273, "train_loss": 3.632645845413208, "lr": 0.00036134948609956334, "tps": 18245, "wall": 26127.1} {"step": 7274, "train_loss": 3.6316962242126465, "lr": 0.00036133762367647113, "tps": 18242, "wall": 26135.1} {"step": 7275, "train_loss": 3.6361169815063477, "lr": 0.00036132575965229865, "tps": 18239, "wall": 26142.8} {"step": 7276, "train_loss": 3.6518282890319824, "lr": 0.00036131389402718035, "tps": 18236, "wall": 26150.7} {"step": 7277, "train_loss": 3.6116397380828857, "lr": 0.00036130202680125065, "tps": 18233, "wall": 26158.6} {"step": 7278, "train_loss": 3.607748508453369, "lr": 0.00036129015797464384, "tps": 18230, "wall": 26166.4} {"step": 7279, "train_loss": 3.62526798248291, "lr": 0.0003612782875474946, "tps": 18227, "wall": 26174.2} {"step": 7280, "train_loss": 3.665088653564453, "lr": 0.00036126641551993715, "tps": 18224, "wall": 26182.1} {"step": 7281, "train_loss": 3.670468330383301, "lr": 0.0003612545418921062, "tps": 18221, "wall": 26190.0} {"step": 7282, "train_loss": 3.5356626510620117, "lr": 0.0003612426666641361, "tps": 18218, "wall": 26197.9} {"step": 7283, "train_loss": 3.655522346496582, "lr": 0.0003612307898361615, "tps": 18215, "wall": 26205.9} {"step": 7284, "train_loss": 3.61972975730896, "lr": 0.0003612189114083168, "tps": 18212, "wall": 26213.8} {"step": 7285, "train_loss": 3.7451672554016113, "lr": 0.00036120703138073666, "tps": 18210, "wall": 26221.5} {"step": 7286, "train_loss": 3.6418514251708984, "lr": 0.00036119514975355567, "tps": 18207, "wall": 26229.3} {"step": 7287, "train_loss": 3.7079739570617676, "lr": 0.0003611832665269083, "tps": 18204, "wall": 26237.1} {"step": 7288, "train_loss": 3.600782632827759, "lr": 0.0003611713817009293, "tps": 18201, "wall": 26245.0} {"step": 7289, "train_loss": 3.6129581928253174, "lr": 0.00036115949527575325, "tps": 18198, "wall": 26252.8} {"step": 7290, "train_loss": 3.733010768890381, "lr": 0.0003611476072515148, "tps": 18195, "wall": 26260.5} {"step": 7291, "train_loss": 3.5863897800445557, "lr": 0.00036113571762834857, "tps": 18192, "wall": 26268.5} {"step": 7292, "train_loss": 3.7955384254455566, "lr": 0.0003611238264063894, "tps": 18189, "wall": 26276.2} {"step": 7293, "train_loss": 3.5863919258117676, "lr": 0.00036111193358577185, "tps": 18186, "wall": 26284.1} {"step": 7294, "train_loss": 3.6178250312805176, "lr": 0.0003611000391666306, "tps": 18183, "wall": 26291.9} {"step": 7295, "train_loss": 3.5655603408813477, "lr": 0.0003610881431491005, "tps": 18180, "wall": 26299.7} {"step": 7296, "train_loss": 3.5465927124023438, "lr": 0.00036107624553331633, "tps": 18177, "wall": 26307.6} {"step": 7297, "train_loss": 3.6267974376678467, "lr": 0.00036106434631941284, "tps": 18175, "wall": 26315.3} {"step": 7298, "train_loss": 3.6461241245269775, "lr": 0.00036105244550752475, "tps": 18171, "wall": 26323.3} {"step": 7299, "train_loss": 3.6398096084594727, "lr": 0.000361040543097787, "tps": 18169, "wall": 26331.1} {"step": 7300, "train_loss": 3.5297718048095703, "lr": 0.00036102863909033426, "tps": 18166, "wall": 26338.9} {"step": 7301, "train_loss": 3.559868574142456, "lr": 0.0003610167334853015, "tps": 18163, "wall": 26346.8} {"step": 7302, "train_loss": 3.6164653301239014, "lr": 0.0003610048262828235, "tps": 18160, "wall": 26354.5} {"step": 7303, "train_loss": 3.5872230529785156, "lr": 0.00036099291748303527, "tps": 18157, "wall": 26362.3} {"step": 7304, "train_loss": 3.623053789138794, "lr": 0.0003609810070860717, "tps": 18154, "wall": 26370.1} {"step": 7305, "train_loss": 3.6381824016571045, "lr": 0.0003609690950920675, "tps": 18151, "wall": 26377.9} {"step": 7306, "train_loss": 3.598078489303589, "lr": 0.00036095718150115793, "tps": 18148, "wall": 26385.8} {"step": 7307, "train_loss": 3.5330445766448975, "lr": 0.0003609452663134776, "tps": 18145, "wall": 26393.7} {"step": 7308, "train_loss": 3.6949782371520996, "lr": 0.0003609333495291618, "tps": 18143, "wall": 26401.5} {"step": 7309, "train_loss": 3.6271591186523438, "lr": 0.00036092143114834543, "tps": 18140, "wall": 26409.3} {"step": 7310, "train_loss": 3.6455135345458984, "lr": 0.00036090951117116336, "tps": 18137, "wall": 26417.1} {"step": 7311, "train_loss": 3.8019509315490723, "lr": 0.0003608975895977508, "tps": 18134, "wall": 26424.9} {"step": 7312, "train_loss": 3.5635385513305664, "lr": 0.00036088566642824264, "tps": 18131, "wall": 26432.7} {"step": 7313, "train_loss": 3.63458251953125, "lr": 0.00036087374166277405, "tps": 18128, "wall": 26440.5} {"step": 7314, "train_loss": 3.6764373779296875, "lr": 0.0003608618153014801, "tps": 18125, "wall": 26448.4} {"step": 7315, "train_loss": 3.631129503250122, "lr": 0.0003608498873444959, "tps": 18122, "wall": 26456.2} {"step": 7316, "train_loss": 3.645866870880127, "lr": 0.0003608379577919566, "tps": 18119, "wall": 26464.0} {"step": 7317, "train_loss": 3.587111711502075, "lr": 0.0003608260266439972, "tps": 18117, "wall": 26471.7} {"step": 7318, "train_loss": 3.631740093231201, "lr": 0.000360814093900753, "tps": 18114, "wall": 26479.5} {"step": 7319, "train_loss": 3.5930304527282715, "lr": 0.00036080215956235917, "tps": 18111, "wall": 26487.3} {"step": 7320, "train_loss": 3.791588306427002, "lr": 0.0003607902236289508, "tps": 18108, "wall": 26495.2} {"step": 7321, "train_loss": 3.711299419403076, "lr": 0.00036077828610066315, "tps": 18105, "wall": 26503.1} {"step": 7322, "train_loss": 3.634242057800293, "lr": 0.0003607663469776315, "tps": 18102, "wall": 26511.0} {"step": 7323, "train_loss": 3.5667929649353027, "lr": 0.000360754406259991, "tps": 18099, "wall": 26518.8} {"step": 7324, "train_loss": 3.6685070991516113, "lr": 0.0003607424639478771, "tps": 18096, "wall": 26526.6} {"step": 7325, "train_loss": 3.7059402465820312, "lr": 0.00036073052004142477, "tps": 18094, "wall": 26534.3} {"step": 7326, "train_loss": 3.634803295135498, "lr": 0.00036071857454076967, "tps": 18091, "wall": 26542.2} {"step": 7327, "train_loss": 3.572701930999756, "lr": 0.00036070662744604686, "tps": 18088, "wall": 26550.1} {"step": 7328, "train_loss": 3.7240891456604004, "lr": 0.0003606946787573917, "tps": 18085, "wall": 26557.8} {"step": 7329, "train_loss": 3.6181211471557617, "lr": 0.0003606827284749397, "tps": 18082, "wall": 26565.7} {"step": 7330, "train_loss": 3.6693100929260254, "lr": 0.0003606707765988261, "tps": 18079, "wall": 26573.6} {"step": 7331, "train_loss": 3.630521774291992, "lr": 0.0003606588231291864, "tps": 18076, "wall": 26581.4} {"step": 7332, "train_loss": 3.64357852935791, "lr": 0.0003606468680661559, "tps": 18074, "wall": 26589.3} {"step": 7333, "train_loss": 3.5713324546813965, "lr": 0.0003606349114098701, "tps": 18071, "wall": 26597.1} {"step": 7334, "train_loss": 3.6418306827545166, "lr": 0.0003606229531604643, "tps": 18068, "wall": 26605.0} {"step": 7335, "train_loss": 3.700064182281494, "lr": 0.0003606109933180742, "tps": 18065, "wall": 26612.8} {"step": 7336, "train_loss": 3.666450262069702, "lr": 0.0003605990318828351, "tps": 18062, "wall": 26620.7} {"step": 7337, "train_loss": 3.5787811279296875, "lr": 0.00036058706885488257, "tps": 18059, "wall": 26628.6} {"step": 7338, "train_loss": 3.718928337097168, "lr": 0.0003605751042343521, "tps": 18056, "wall": 26636.4} {"step": 7339, "train_loss": 3.6362810134887695, "lr": 0.00036056313802137926, "tps": 18053, "wall": 26644.2} {"step": 7340, "train_loss": 3.583495855331421, "lr": 0.0003605511702160996, "tps": 18051, "wall": 26651.9} {"step": 7341, "train_loss": 3.6505930423736572, "lr": 0.0003605392008186487, "tps": 18048, "wall": 26659.8} {"step": 7342, "train_loss": 3.6523308753967285, "lr": 0.00036052722982916213, "tps": 18045, "wall": 26667.6} {"step": 7343, "train_loss": 3.6001734733581543, "lr": 0.0003605152572477755, "tps": 18042, "wall": 26675.4} {"step": 7344, "train_loss": 3.727348804473877, "lr": 0.0003605032830746244, "tps": 18039, "wall": 26683.4} {"step": 7345, "train_loss": 3.6891753673553467, "lr": 0.0003604913073098445, "tps": 18036, "wall": 26691.1} {"step": 7346, "train_loss": 3.5542266368865967, "lr": 0.0003604793299535715, "tps": 18034, "wall": 26699.0} {"step": 7347, "train_loss": 3.6605923175811768, "lr": 0.00036046735100594106, "tps": 18031, "wall": 26706.8} {"step": 7348, "train_loss": 3.6093528270721436, "lr": 0.00036045537046708884, "tps": 18028, "wall": 26714.6} {"step": 7349, "train_loss": 3.625051498413086, "lr": 0.0003604433883371506, "tps": 18025, "wall": 26722.4} {"step": 7350, "train_loss": 3.6667048931121826, "lr": 0.0003604314046162621, "tps": 18022, "wall": 26730.3} {"step": 7351, "train_loss": 3.7772576808929443, "lr": 0.00036041941930455896, "tps": 18020, "wall": 26738.0} {"step": 7352, "train_loss": 3.6513166427612305, "lr": 0.0003604074324021771, "tps": 18017, "wall": 26746.0} {"step": 7353, "train_loss": 3.6118431091308594, "lr": 0.0003603954439092522, "tps": 18014, "wall": 26753.8} {"step": 7354, "train_loss": 3.6675305366516113, "lr": 0.00036038345382592013, "tps": 18011, "wall": 26761.5} {"step": 7355, "train_loss": 3.6611528396606445, "lr": 0.0003603714621523168, "tps": 18008, "wall": 26769.3} {"step": 7356, "train_loss": 3.5950136184692383, "lr": 0.00036035946888857785, "tps": 18005, "wall": 26777.2} {"step": 7357, "train_loss": 3.527600049972534, "lr": 0.0003603474740348392, "tps": 18003, "wall": 26785.0} {"step": 7358, "train_loss": 3.767549514770508, "lr": 0.0003603354775912369, "tps": 18000, "wall": 26792.7} {"step": 7359, "train_loss": 3.5671162605285645, "lr": 0.00036032347955790664, "tps": 17997, "wall": 26800.5} {"step": 7360, "train_loss": 3.6381733417510986, "lr": 0.00036031147993498443, "tps": 17994, "wall": 26808.4} {"step": 7361, "train_loss": 3.6372203826904297, "lr": 0.00036029947872260617, "tps": 17991, "wall": 26816.2} {"step": 7362, "train_loss": 3.6396145820617676, "lr": 0.0003602874759209078, "tps": 17989, "wall": 26824.0} {"step": 7363, "train_loss": 3.651858329772949, "lr": 0.0003602754715300254, "tps": 17986, "wall": 26831.8} {"step": 7364, "train_loss": 3.6494009494781494, "lr": 0.00036026346555009483, "tps": 17983, "wall": 26839.6} {"step": 7365, "train_loss": 3.5079264640808105, "lr": 0.0003602514579812521, "tps": 17980, "wall": 26847.4} {"step": 7366, "train_loss": 3.593064308166504, "lr": 0.0003602394488236333, "tps": 17978, "wall": 26855.2} {"step": 7367, "train_loss": 3.579315185546875, "lr": 0.0003602274380773744, "tps": 17975, "wall": 26863.0} {"step": 7368, "train_loss": 3.609328508377075, "lr": 0.0003602154257426115, "tps": 17972, "wall": 26870.8} {"step": 7369, "train_loss": 3.5956268310546875, "lr": 0.00036020341181948077, "tps": 17969, "wall": 26878.7} {"step": 7370, "train_loss": 3.7025532722473145, "lr": 0.00036019139630811815, "tps": 17966, "wall": 26886.5} {"step": 7371, "train_loss": 3.648935556411743, "lr": 0.0003601793792086598, "tps": 17964, "wall": 26894.3} {"step": 7372, "train_loss": 3.6167361736297607, "lr": 0.0003601673605212418, "tps": 17961, "wall": 26902.3} {"step": 7373, "train_loss": 3.6451268196105957, "lr": 0.0003601553402460004, "tps": 17958, "wall": 26910.3} {"step": 7374, "train_loss": 3.6719577312469482, "lr": 0.0003601433183830717, "tps": 17955, "wall": 26918.2} {"step": 7375, "train_loss": 3.619309902191162, "lr": 0.000360131294932592, "tps": 17952, "wall": 26926.3} {"step": 7376, "train_loss": 3.619528293609619, "lr": 0.0003601192698946973, "tps": 17949, "wall": 26934.1} {"step": 7377, "train_loss": 3.669965982437134, "lr": 0.000360107243269524, "tps": 17946, "wall": 26941.9} {"step": 7378, "train_loss": 3.669433832168579, "lr": 0.00036009521505720826, "tps": 17944, "wall": 26949.7} {"step": 7379, "train_loss": 3.56355619430542, "lr": 0.0003600831852578863, "tps": 17941, "wall": 26957.5} {"step": 7380, "train_loss": 3.528042793273926, "lr": 0.0003600711538716945, "tps": 17938, "wall": 26965.3} {"step": 7381, "train_loss": 3.5751616954803467, "lr": 0.00036005912089876905, "tps": 17935, "wall": 26973.0} {"step": 7382, "train_loss": 3.6300759315490723, "lr": 0.00036004708633924636, "tps": 17933, "wall": 26980.8} {"step": 7383, "train_loss": 3.6259560585021973, "lr": 0.0003600350501932626, "tps": 17930, "wall": 26988.8} {"step": 7384, "train_loss": 3.7289509773254395, "lr": 0.0003600230124609543, "tps": 17927, "wall": 26996.6} {"step": 7385, "train_loss": 3.6185386180877686, "lr": 0.00036001097314245775, "tps": 17924, "wall": 27004.4} {"step": 7386, "train_loss": 3.5611038208007812, "lr": 0.00035999893223790926, "tps": 17922, "wall": 27012.2} {"step": 7387, "train_loss": 3.549769878387451, "lr": 0.0003599868897474453, "tps": 17919, "wall": 27019.9} {"step": 7388, "train_loss": 3.7383694648742676, "lr": 0.0003599748456712023, "tps": 17916, "wall": 27027.8} {"step": 7389, "train_loss": 3.5684244632720947, "lr": 0.0003599628000093166, "tps": 17913, "wall": 27035.7} {"step": 7390, "train_loss": 3.7255349159240723, "lr": 0.00035995075276192484, "tps": 17910, "wall": 27043.7} {"step": 7391, "train_loss": 3.649352550506592, "lr": 0.00035993870392916335, "tps": 17907, "wall": 27051.9} {"step": 7392, "train_loss": 3.6018970012664795, "lr": 0.0003599266535111686, "tps": 17904, "wall": 27060.0} {"step": 7393, "train_loss": 3.665337085723877, "lr": 0.0003599146015080772, "tps": 17902, "wall": 27068.0} {"step": 7394, "train_loss": 3.5398356914520264, "lr": 0.00035990254792002565, "tps": 17899, "wall": 27075.8} {"step": 7395, "train_loss": 3.606290817260742, "lr": 0.00035989049274715045, "tps": 17896, "wall": 27083.7} {"step": 7396, "train_loss": 3.6797802448272705, "lr": 0.00035987843598958813, "tps": 17893, "wall": 27091.4} {"step": 7397, "train_loss": 3.646533489227295, "lr": 0.0003598663776474754, "tps": 17891, "wall": 27099.3} {"step": 7398, "train_loss": 3.6297059059143066, "lr": 0.00035985431772094867, "tps": 17888, "wall": 27107.2} {"step": 7399, "train_loss": 3.6009469032287598, "lr": 0.0003598422562101447, "tps": 17885, "wall": 27115.1} {"step": 7400, "train_loss": 3.652876853942871, "lr": 0.00035983019311520016, "tps": 17882, "wall": 27122.9} {"step": 7401, "train_loss": 3.661825180053711, "lr": 0.0003598181284362516, "tps": 17880, "wall": 27130.7} {"step": 7402, "train_loss": 3.6765553951263428, "lr": 0.0003598060621734356, "tps": 17877, "wall": 27138.6} {"step": 7403, "train_loss": 3.6406350135803223, "lr": 0.00035979399432688907, "tps": 17874, "wall": 27146.3} {"step": 7404, "train_loss": 3.6008834838867188, "lr": 0.00035978192489674864, "tps": 17871, "wall": 27154.0} {"step": 7405, "train_loss": 3.653790235519409, "lr": 0.000359769853883151, "tps": 17869, "wall": 27161.8} {"step": 7406, "train_loss": 3.6769113540649414, "lr": 0.00035975778128623286, "tps": 17866, "wall": 27169.7} {"step": 7407, "train_loss": 3.682903289794922, "lr": 0.00035974570710613094, "tps": 17863, "wall": 27177.5} {"step": 7408, "train_loss": 3.546010971069336, "lr": 0.00035973363134298217, "tps": 17860, "wall": 27185.3} {"step": 7409, "train_loss": 3.6239871978759766, "lr": 0.0003597215539969232, "tps": 17858, "wall": 27193.1} {"step": 7410, "train_loss": 3.613737106323242, "lr": 0.00035970947506809103, "tps": 17855, "wall": 27200.9} {"step": 7411, "train_loss": 3.5995852947235107, "lr": 0.00035969739455662226, "tps": 17852, "wall": 27208.7} {"step": 7412, "train_loss": 3.7033329010009766, "lr": 0.00035968531246265395, "tps": 17850, "wall": 27216.6} {"step": 7413, "train_loss": 3.678008794784546, "lr": 0.0003596732287863228, "tps": 17847, "wall": 27224.5} {"step": 7414, "train_loss": 3.679428815841675, "lr": 0.0003596611435277657, "tps": 17844, "wall": 27232.2} {"step": 7415, "train_loss": 3.571178436279297, "lr": 0.00035964905668711965, "tps": 17841, "wall": 27240.0} {"step": 7416, "train_loss": 3.560598134994507, "lr": 0.0003596369682645216, "tps": 17839, "wall": 27247.8} {"step": 7417, "train_loss": 3.6314172744750977, "lr": 0.0003596248782601083, "tps": 17836, "wall": 27255.7} {"step": 7418, "train_loss": 3.729551315307617, "lr": 0.00035961278667401693, "tps": 17833, "wall": 27263.6} {"step": 7419, "train_loss": 3.5464322566986084, "lr": 0.00035960069350638433, "tps": 17830, "wall": 27271.5} {"step": 7420, "train_loss": 3.624850034713745, "lr": 0.0003595885987573475, "tps": 17828, "wall": 27279.2} {"step": 7421, "train_loss": 3.651533603668213, "lr": 0.0003595765024270435, "tps": 17825, "wall": 27287.0} {"step": 7422, "train_loss": 3.563241958618164, "lr": 0.0003595644045156093, "tps": 17822, "wall": 27294.8} {"step": 7423, "train_loss": 3.656532049179077, "lr": 0.000359552305023182, "tps": 17820, "wall": 27302.6} {"step": 7424, "train_loss": 3.797470808029175, "lr": 0.0003595402039498986, "tps": 17817, "wall": 27310.4} {"step": 7425, "train_loss": 3.526031970977783, "lr": 0.0003595281012958962, "tps": 17814, "wall": 27318.2} {"step": 7426, "train_loss": 3.5211429595947266, "lr": 0.00035951599706131207, "tps": 17812, "wall": 27326.0} {"step": 7427, "train_loss": 3.673363447189331, "lr": 0.00035950389124628305, "tps": 17809, "wall": 27333.8} {"step": 7428, "train_loss": 3.597456932067871, "lr": 0.0003594917838509464, "tps": 17806, "wall": 27341.5} {"step": 7429, "train_loss": 3.599024534225464, "lr": 0.00035947967487543934, "tps": 17804, "wall": 27349.4} {"step": 7430, "train_loss": 3.6441051959991455, "lr": 0.00035946756431989895, "tps": 17801, "wall": 27357.2} {"step": 7431, "train_loss": 3.5563740730285645, "lr": 0.00035945545218446246, "tps": 17798, "wall": 27365.0} {"step": 7432, "train_loss": 3.596097469329834, "lr": 0.000359443338469267, "tps": 17796, "wall": 27372.8} {"step": 7433, "train_loss": 3.646732807159424, "lr": 0.0003594312231744499, "tps": 17793, "wall": 27380.6} {"step": 7434, "train_loss": 3.6040139198303223, "lr": 0.0003594191063001484, "tps": 17790, "wall": 27388.5} {"step": 7435, "train_loss": 3.5915660858154297, "lr": 0.0003594069878464997, "tps": 17788, "wall": 27396.3} {"step": 7436, "train_loss": 3.7294299602508545, "lr": 0.00035939486781364107, "tps": 17785, "wall": 27404.2} {"step": 7437, "train_loss": 3.626112937927246, "lr": 0.00035938274620170985, "tps": 17782, "wall": 27411.9} {"step": 7438, "train_loss": 3.5938572883605957, "lr": 0.00035937062301084335, "tps": 17780, "wall": 27419.7} {"step": 7439, "train_loss": 3.6659388542175293, "lr": 0.00035935849824117883, "tps": 17777, "wall": 27427.4} {"step": 7440, "train_loss": 3.490727186203003, "lr": 0.0003593463718928538, "tps": 17774, "wall": 27435.2} {"step": 7441, "train_loss": 3.6564486026763916, "lr": 0.0003593342439660055, "tps": 17772, "wall": 27443.1} {"step": 7442, "train_loss": 3.6147048473358154, "lr": 0.0003593221144607713, "tps": 17769, "wall": 27450.9} {"step": 7443, "train_loss": 3.566269874572754, "lr": 0.00035930998337728866, "tps": 17766, "wall": 27458.6} {"step": 7444, "train_loss": 3.5757155418395996, "lr": 0.00035929785071569506, "tps": 17763, "wall": 27466.7} {"step": 7445, "train_loss": 3.638162612915039, "lr": 0.0003592857164761278, "tps": 17761, "wall": 27474.4} {"step": 7446, "train_loss": 3.610713005065918, "lr": 0.00035927358065872446, "tps": 17758, "wall": 27482.2} {"step": 7447, "train_loss": 3.654266834259033, "lr": 0.00035926144326362246, "tps": 17756, "wall": 27489.9} {"step": 7448, "train_loss": 3.6668834686279297, "lr": 0.00035924930429095925, "tps": 17753, "wall": 27497.7} {"step": 7449, "train_loss": 3.6133837699890137, "lr": 0.0003592371637408724, "tps": 17750, "wall": 27505.5} {"step": 7450, "train_loss": 3.5989744663238525, "lr": 0.0003592250216134994, "tps": 17748, "wall": 27513.3} {"step": 7451, "train_loss": 3.6312742233276367, "lr": 0.0003592128779089779, "tps": 17745, "wall": 27521.0} {"step": 7452, "train_loss": 3.591127634048462, "lr": 0.0003592007326274454, "tps": 17742, "wall": 27529.0} {"step": 7453, "train_loss": 3.5825419425964355, "lr": 0.0003591885857690394, "tps": 17740, "wall": 27536.7} {"step": 7454, "train_loss": 3.6470839977264404, "lr": 0.00035917643733389756, "tps": 17737, "wall": 27544.5} {"step": 7455, "train_loss": 3.5990684032440186, "lr": 0.0003591642873221575, "tps": 17734, "wall": 27552.3} {"step": 7456, "train_loss": 3.7258191108703613, "lr": 0.00035915213573395696, "tps": 17732, "wall": 27560.0} {"step": 7457, "train_loss": 3.641153335571289, "lr": 0.00035913998256943344, "tps": 17729, "wall": 27567.9} {"step": 7458, "train_loss": 3.546752691268921, "lr": 0.0003591278278287246, "tps": 17726, "wall": 27575.7} {"step": 7459, "train_loss": 3.6696131229400635, "lr": 0.00035911567151196834, "tps": 17724, "wall": 27583.6} {"step": 7460, "train_loss": 3.565269947052002, "lr": 0.0003591035136193022, "tps": 17721, "wall": 27591.3} {"step": 7461, "train_loss": 3.669351577758789, "lr": 0.0003590913541508639, "tps": 17719, "wall": 27599.2} {"step": 7462, "train_loss": 3.6289913654327393, "lr": 0.0003590791931067912, "tps": 17716, "wall": 27607.0} {"step": 7463, "train_loss": 3.5815019607543945, "lr": 0.0003590670304872218, "tps": 17713, "wall": 27614.8} {"step": 7464, "train_loss": 3.6300511360168457, "lr": 0.0003590548662922937, "tps": 17711, "wall": 27622.5} {"step": 7465, "train_loss": 3.5943350791931152, "lr": 0.0003590427005221445, "tps": 17708, "wall": 27630.3} {"step": 7466, "train_loss": 3.607478141784668, "lr": 0.000359030533176912, "tps": 17705, "wall": 27638.1} {"step": 7467, "train_loss": 3.695162296295166, "lr": 0.00035901836425673416, "tps": 17703, "wall": 27646.0} {"step": 7468, "train_loss": 3.658237934112549, "lr": 0.0003590061937617488, "tps": 17700, "wall": 27653.8} {"step": 7469, "train_loss": 3.641535997390747, "lr": 0.0003589940216920937, "tps": 17697, "wall": 27661.7} {"step": 7470, "train_loss": 3.736098289489746, "lr": 0.0003589818480479068, "tps": 17695, "wall": 27669.4} {"step": 7471, "train_loss": 3.6188371181488037, "lr": 0.00035896967282932605, "tps": 17692, "wall": 27677.2} {"step": 7472, "train_loss": 3.721681594848633, "lr": 0.00035895749603648936, "tps": 17690, "wall": 27685.1} {"step": 7473, "train_loss": 3.640530586242676, "lr": 0.00035894531766953456, "tps": 17687, "wall": 27692.8} {"step": 7474, "train_loss": 3.7183284759521484, "lr": 0.0003589331377285997, "tps": 17684, "wall": 27700.6} {"step": 7475, "train_loss": 3.5882768630981445, "lr": 0.0003589209562138228, "tps": 17682, "wall": 27708.5} {"step": 7476, "train_loss": 3.6949687004089355, "lr": 0.0003589087731253417, "tps": 17679, "wall": 27716.2} {"step": 7477, "train_loss": 3.5725557804107666, "lr": 0.0003588965884632946, "tps": 17677, "wall": 27724.0} {"step": 7478, "train_loss": 3.6902661323547363, "lr": 0.0003588844022278193, "tps": 17674, "wall": 27731.7} {"step": 7479, "train_loss": 3.6325573921203613, "lr": 0.00035887221441905406, "tps": 17671, "wall": 27739.5} {"step": 7480, "train_loss": 3.7180285453796387, "lr": 0.0003588600250371369, "tps": 17669, "wall": 27747.3} {"step": 7481, "train_loss": 3.659073829650879, "lr": 0.00035884783408220584, "tps": 17666, "wall": 27755.1} {"step": 7482, "train_loss": 3.7156639099121094, "lr": 0.00035883564155439896, "tps": 17664, "wall": 27762.8} {"step": 7483, "train_loss": 3.680858612060547, "lr": 0.0003588234474538545, "tps": 17661, "wall": 27770.8} {"step": 7484, "train_loss": 3.589841604232788, "lr": 0.00035881125178071043, "tps": 17658, "wall": 27778.5} {"step": 7485, "train_loss": 3.5948758125305176, "lr": 0.00035879905453510503, "tps": 17656, "wall": 27786.3} {"step": 7486, "train_loss": 3.6220245361328125, "lr": 0.0003587868557171764, "tps": 17653, "wall": 27794.0} {"step": 7487, "train_loss": 3.647714138031006, "lr": 0.0003587746553270628, "tps": 17651, "wall": 27801.9} {"step": 7488, "train_loss": 3.5910253524780273, "lr": 0.00035876245336490236, "tps": 17648, "wall": 27809.7} {"step": 7489, "train_loss": 3.6224915981292725, "lr": 0.0003587502498308334, "tps": 17645, "wall": 27817.5} {"step": 7490, "train_loss": 3.5244147777557373, "lr": 0.0003587380447249941, "tps": 17643, "wall": 27825.5} {"step": 7491, "train_loss": 3.6327526569366455, "lr": 0.00035872583804752266, "tps": 17640, "wall": 27833.3} {"step": 7492, "train_loss": 3.6886754035949707, "lr": 0.0003587136297985574, "tps": 17638, "wall": 27841.0} {"step": 7493, "train_loss": 3.808931350708008, "lr": 0.00035870141997823676, "tps": 17635, "wall": 27848.8} {"step": 7494, "train_loss": 3.6799280643463135, "lr": 0.00035868920858669884, "tps": 17632, "wall": 27856.6} {"step": 7495, "train_loss": 3.6173105239868164, "lr": 0.0003586769956240821, "tps": 17630, "wall": 27864.4} {"step": 7496, "train_loss": 3.6277482509613037, "lr": 0.0003586647810905248, "tps": 17627, "wall": 27872.1} {"step": 7497, "train_loss": 3.4845824241638184, "lr": 0.0003586525649861654, "tps": 17625, "wall": 27879.9} {"step": 7498, "train_loss": 3.6832642555236816, "lr": 0.00035864034731114227, "tps": 17622, "wall": 27887.9} {"step": 7499, "train_loss": 3.5320308208465576, "lr": 0.00035862812806559377, "tps": 17619, "wall": 27895.7} {"step": 7500, "train_loss": 3.661119222640991, "lr": 0.0003586159072496583, "tps": 17617, "wall": 27903.7} {"step": 7501, "train_loss": 3.6679017543792725, "lr": 0.00035860368486347434, "tps": 17614, "wall": 27911.5} {"step": 7502, "train_loss": 3.6183571815490723, "lr": 0.0003585914609071804, "tps": 17612, "wall": 27919.4} {"step": 7503, "train_loss": 3.6556034088134766, "lr": 0.0003585792353809148, "tps": 17609, "wall": 27927.2} {"step": 7504, "train_loss": 3.6033363342285156, "lr": 0.00035856700828481615, "tps": 17606, "wall": 27935.0} {"step": 7505, "train_loss": 3.525649070739746, "lr": 0.000358554779619023, "tps": 17604, "wall": 27942.8} {"step": 7506, "train_loss": 3.6111154556274414, "lr": 0.00035854254938367375, "tps": 17601, "wall": 27950.7} {"step": 7507, "train_loss": 3.745205879211426, "lr": 0.00035853031757890704, "tps": 17599, "wall": 27958.5} {"step": 7508, "train_loss": 3.534681558609009, "lr": 0.00035851808420486134, "tps": 17596, "wall": 27966.3} {"step": 7509, "train_loss": 3.5770037174224854, "lr": 0.0003585058492616753, "tps": 17593, "wall": 27974.1} {"step": 7510, "train_loss": 3.551220417022705, "lr": 0.0003584936127494876, "tps": 17591, "wall": 27981.9} {"step": 7511, "train_loss": 3.5231192111968994, "lr": 0.00035848137466843664, "tps": 17588, "wall": 27989.8} {"step": 7512, "train_loss": 3.550044059753418, "lr": 0.0003584691350186613, "tps": 17586, "wall": 27997.5} {"step": 7513, "train_loss": 3.633953094482422, "lr": 0.0003584568938003, "tps": 17583, "wall": 28005.4} {"step": 7514, "train_loss": 3.656869888305664, "lr": 0.00035844465101349157, "tps": 17581, "wall": 28013.2} {"step": 7515, "train_loss": 3.6058754920959473, "lr": 0.0003584324066583746, "tps": 17578, "wall": 28020.9} {"step": 7516, "train_loss": 3.6315016746520996, "lr": 0.00035842016073508786, "tps": 17576, "wall": 28028.8} {"step": 7517, "train_loss": 3.554183006286621, "lr": 0.0003584079132437701, "tps": 17573, "wall": 28036.7} {"step": 7518, "train_loss": 3.6632397174835205, "lr": 0.00035839566418455996, "tps": 17570, "wall": 28044.8} {"step": 7519, "train_loss": 3.665470600128174, "lr": 0.00035838341355759625, "tps": 17568, "wall": 28052.6} {"step": 7520, "train_loss": 3.5926265716552734, "lr": 0.00035837116136301774, "tps": 17565, "wall": 28060.7} {"step": 7521, "train_loss": 3.62587308883667, "lr": 0.00035835890760096327, "tps": 17562, "wall": 28068.9} {"step": 7522, "train_loss": 3.6226084232330322, "lr": 0.00035834665227157155, "tps": 17559, "wall": 28076.9} {"step": 7523, "train_loss": 3.6594293117523193, "lr": 0.0003583343953749815, "tps": 17557, "wall": 28084.8} {"step": 7524, "train_loss": 3.695439338684082, "lr": 0.00035832213691133194, "tps": 17554, "wall": 28092.8} {"step": 7525, "train_loss": 3.6250905990600586, "lr": 0.0003583098768807617, "tps": 17551, "wall": 28100.7} {"step": 7526, "train_loss": 3.638251543045044, "lr": 0.00035829761528340977, "tps": 17549, "wall": 28108.7} {"step": 7527, "train_loss": 3.5837721824645996, "lr": 0.0003582853521194149, "tps": 17546, "wall": 28116.5} {"step": 7528, "train_loss": 3.7770323753356934, "lr": 0.0003582730873889161, "tps": 17544, "wall": 28124.5} {"step": 7529, "train_loss": 3.6585779190063477, "lr": 0.0003582608210920523, "tps": 17541, "wall": 28132.4} {"step": 7530, "train_loss": 3.6082000732421875, "lr": 0.0003582485532289624, "tps": 17538, "wall": 28140.3} {"step": 7531, "train_loss": 3.519138813018799, "lr": 0.0003582362837997855, "tps": 17536, "wall": 28148.2} {"step": 7532, "train_loss": 3.6652579307556152, "lr": 0.0003582240128046604, "tps": 17533, "wall": 28156.1} {"step": 7533, "train_loss": 3.5199811458587646, "lr": 0.00035821174024372617, "tps": 17531, "wall": 28164.1} {"step": 7534, "train_loss": 3.56782865524292, "lr": 0.00035819946611712197, "tps": 17528, "wall": 28172.0} {"step": 7535, "train_loss": 3.5181989669799805, "lr": 0.0003581871904249867, "tps": 17525, "wall": 28180.1} {"step": 7536, "train_loss": 3.591038227081299, "lr": 0.0003581749131674595, "tps": 17523, "wall": 28188.4} {"step": 7537, "train_loss": 3.6541402339935303, "lr": 0.0003581626343446794, "tps": 17520, "wall": 28196.4} {"step": 7538, "train_loss": 3.6869702339172363, "lr": 0.00035815035395678544, "tps": 17517, "wall": 28204.5} {"step": 7539, "train_loss": 3.66292667388916, "lr": 0.00035813807200391686, "tps": 17514, "wall": 28212.5} {"step": 7540, "train_loss": 3.747738838195801, "lr": 0.0003581257884862127, "tps": 17512, "wall": 28220.6} {"step": 7541, "train_loss": 3.719750165939331, "lr": 0.00035811350340381214, "tps": 17509, "wall": 28228.8} {"step": 7542, "train_loss": 3.630769968032837, "lr": 0.0003581012167568544, "tps": 17506, "wall": 28236.8} {"step": 7543, "train_loss": 3.639584541320801, "lr": 0.00035808892854547847, "tps": 17504, "wall": 28245.0} {"step": 7544, "train_loss": 3.600537061691284, "lr": 0.0003580766387698238, "tps": 17501, "wall": 28252.9} {"step": 7545, "train_loss": 3.5659828186035156, "lr": 0.0003580643474300294, "tps": 17498, "wall": 28260.8} {"step": 7546, "train_loss": 3.5850889682769775, "lr": 0.0003580520545262347, "tps": 17496, "wall": 28268.8} {"step": 7547, "train_loss": 3.6224398612976074, "lr": 0.0003580397600585788, "tps": 17493, "wall": 28276.7} {"step": 7548, "train_loss": 3.441692352294922, "lr": 0.00035802746402720107, "tps": 17491, "wall": 28284.9} {"step": 7549, "train_loss": 3.6279940605163574, "lr": 0.00035801516643224076, "tps": 17488, "wall": 28292.8} {"step": 7550, "train_loss": 3.4759421348571777, "lr": 0.00035800286727383717, "tps": 17485, "wall": 28300.9} {"step": 7551, "train_loss": 3.711512327194214, "lr": 0.0003579905665521296, "tps": 17483, "wall": 28309.0} {"step": 7552, "train_loss": 3.6198854446411133, "lr": 0.00035797826426725744, "tps": 17480, "wall": 28317.2} {"step": 7553, "train_loss": 3.5934603214263916, "lr": 0.00035796596041936005, "tps": 17477, "wall": 28325.1} {"step": 7554, "train_loss": 3.63407301902771, "lr": 0.00035795365500857683, "tps": 17475, "wall": 28333.2} {"step": 7555, "train_loss": 3.6539549827575684, "lr": 0.00035794134803504715, "tps": 17472, "wall": 28341.0} {"step": 7556, "train_loss": 3.574568033218384, "lr": 0.0003579290394989103, "tps": 17469, "wall": 28349.0} {"step": 7557, "train_loss": 3.593031883239746, "lr": 0.00035791672940030595, "tps": 17467, "wall": 28356.9} {"step": 7558, "train_loss": 3.58811354637146, "lr": 0.00035790441773937335, "tps": 17464, "wall": 28365.0} {"step": 7559, "train_loss": 3.657111883163452, "lr": 0.0003578921045162521, "tps": 17462, "wall": 28372.8} {"step": 7560, "train_loss": 3.612706422805786, "lr": 0.0003578797897310816, "tps": 17459, "wall": 28380.7} {"step": 7561, "train_loss": 3.6889681816101074, "lr": 0.0003578674733840014, "tps": 17457, "wall": 28388.7} {"step": 7562, "train_loss": 3.63747501373291, "lr": 0.000357855155475151, "tps": 17454, "wall": 28396.7} {"step": 7563, "train_loss": 3.6453609466552734, "lr": 0.00035784283600466993, "tps": 17451, "wall": 28404.6} {"step": 7564, "train_loss": 3.660395622253418, "lr": 0.0003578305149726978, "tps": 17449, "wall": 28412.4} {"step": 7565, "train_loss": 3.5596585273742676, "lr": 0.0003578181923793741, "tps": 17446, "wall": 28420.3} {"step": 7566, "train_loss": 3.653770923614502, "lr": 0.0003578058682248384, "tps": 17444, "wall": 28428.3} {"step": 7567, "train_loss": 3.5728909969329834, "lr": 0.00035779354250923043, "tps": 17441, "wall": 28436.1} {"step": 7568, "train_loss": 3.5602002143859863, "lr": 0.0003577812152326898, "tps": 17439, "wall": 28443.9} {"step": 7569, "train_loss": 3.725269317626953, "lr": 0.00035776888639535605, "tps": 17436, "wall": 28451.7} {"step": 7570, "train_loss": 3.5584568977355957, "lr": 0.00035775655599736895, "tps": 17434, "wall": 28459.6} {"step": 7571, "train_loss": 3.5902295112609863, "lr": 0.0003577442240388681, "tps": 17431, "wall": 28467.4} {"step": 7572, "train_loss": 3.634084939956665, "lr": 0.0003577318905199932, "tps": 17429, "wall": 28475.2} {"step": 7573, "train_loss": 3.591625690460205, "lr": 0.000357719555440884, "tps": 17426, "wall": 28483.0} {"step": 7574, "train_loss": 3.537351608276367, "lr": 0.0003577072188016803, "tps": 17424, "wall": 28490.8} {"step": 7575, "train_loss": 3.708987236022949, "lr": 0.0003576948806025217, "tps": 17421, "wall": 28498.7} {"step": 7576, "train_loss": 3.5798568725585938, "lr": 0.000357682540843548, "tps": 17419, "wall": 28506.4} {"step": 7577, "train_loss": 3.547922134399414, "lr": 0.0003576701995248992, "tps": 17417, "wall": 28514.2} {"step": 7578, "train_loss": 3.5770840644836426, "lr": 0.00035765785664671477, "tps": 17414, "wall": 28522.0} {"step": 7579, "train_loss": 3.6919007301330566, "lr": 0.00035764551220913483, "tps": 17412, "wall": 28529.8} {"step": 7580, "train_loss": 3.5466198921203613, "lr": 0.00035763316621229897, "tps": 17409, "wall": 28537.5} {"step": 7581, "train_loss": 3.5880889892578125, "lr": 0.00035762081865634715, "tps": 17407, "wall": 28545.5} {"step": 7582, "train_loss": 3.6101040840148926, "lr": 0.0003576084695414193, "tps": 17404, "wall": 28553.2} {"step": 7583, "train_loss": 3.5051350593566895, "lr": 0.0003575961188676552, "tps": 17402, "wall": 28561.0} {"step": 7584, "train_loss": 3.6299643516540527, "lr": 0.0003575837666351949, "tps": 17399, "wall": 28568.8} {"step": 7585, "train_loss": 3.5844297409057617, "lr": 0.00035757141284417827, "tps": 17397, "wall": 28576.7} {"step": 7586, "train_loss": 3.5650434494018555, "lr": 0.00035755905749474515, "tps": 17394, "wall": 28584.4} {"step": 7587, "train_loss": 3.631563663482666, "lr": 0.00035754670058703563, "tps": 17392, "wall": 28592.2} {"step": 7588, "train_loss": 3.5667500495910645, "lr": 0.0003575343421211896, "tps": 17390, "wall": 28599.9} {"step": 7589, "train_loss": 3.676582098007202, "lr": 0.00035752198209734715, "tps": 17387, "wall": 28607.8} {"step": 7590, "train_loss": 3.5453691482543945, "lr": 0.00035750962051564825, "tps": 17385, "wall": 28615.6} {"step": 7591, "train_loss": 3.6036384105682373, "lr": 0.0003574972573762329, "tps": 17382, "wall": 28623.3} {"step": 7592, "train_loss": 3.6869897842407227, "lr": 0.0003574848926792412, "tps": 17380, "wall": 28631.0} {"step": 7593, "train_loss": 3.602562189102173, "lr": 0.0003574725264248132, "tps": 17377, "wall": 28638.8} {"step": 7594, "train_loss": 3.6871659755706787, "lr": 0.00035746015861308895, "tps": 17375, "wall": 28646.6} {"step": 7595, "train_loss": 3.6226491928100586, "lr": 0.00035744778924420867, "tps": 17373, "wall": 28654.2} {"step": 7596, "train_loss": 3.611771821975708, "lr": 0.0003574354183183123, "tps": 17370, "wall": 28662.0} {"step": 7597, "train_loss": 3.6501245498657227, "lr": 0.0003574230458355401, "tps": 17368, "wall": 28669.8} {"step": 7598, "train_loss": 3.6096529960632324, "lr": 0.0003574106717960322, "tps": 17365, "wall": 28677.6} {"step": 7599, "train_loss": 3.6164865493774414, "lr": 0.00035739829619992877, "tps": 17363, "wall": 28685.4} {"step": 7600, "train_loss": 3.5378456115722656, "lr": 0.0003573859190473701, "tps": 17360, "wall": 28693.2} {"step": 7601, "train_loss": 3.668489933013916, "lr": 0.00035737354033849625, "tps": 17358, "wall": 28700.8} {"step": 7602, "train_loss": 3.6351189613342285, "lr": 0.00035736116007344755, "tps": 17356, "wall": 28708.7} {"step": 7603, "train_loss": 3.559685707092285, "lr": 0.00035734877825236404, "tps": 17353, "wall": 28716.4} {"step": 7604, "train_loss": 3.6535801887512207, "lr": 0.0003573363948753863, "tps": 17351, "wall": 28724.3} {"step": 7605, "train_loss": 3.544384479522705, "lr": 0.00035732400994265435, "tps": 17348, "wall": 28732.0} {"step": 7606, "train_loss": 3.6152377128601074, "lr": 0.0003573116234543086, "tps": 17346, "wall": 28739.9} {"step": 7607, "train_loss": 3.51613450050354, "lr": 0.0003572992354104894, "tps": 17344, "wall": 28747.5} {"step": 7608, "train_loss": 3.7214434146881104, "lr": 0.00035728684581133705, "tps": 17341, "wall": 28755.3} {"step": 7609, "train_loss": 3.586768388748169, "lr": 0.00035727445465699183, "tps": 17339, "wall": 28763.0} {"step": 7610, "train_loss": 3.7086920738220215, "lr": 0.00035726206194759414, "tps": 17336, "wall": 28770.9} {"step": 7611, "train_loss": 3.6103742122650146, "lr": 0.00035724966768328444, "tps": 17334, "wall": 28778.5} {"step": 7612, "train_loss": 3.6489195823669434, "lr": 0.000357237271864203, "tps": 17331, "wall": 28786.4} {"step": 7613, "train_loss": 3.6423957347869873, "lr": 0.00035722487449049045, "tps": 17329, "wall": 28794.2} {"step": 7614, "train_loss": 3.593278646469116, "lr": 0.000357212475562287, "tps": 17327, "wall": 28802.0} {"step": 7615, "train_loss": 3.6093764305114746, "lr": 0.0003572000750797332, "tps": 17324, "wall": 28809.8} {"step": 7616, "train_loss": 3.675307512283325, "lr": 0.00035718767304296963, "tps": 17322, "wall": 28817.6} {"step": 7617, "train_loss": 3.5921630859375, "lr": 0.00035717526945213654, "tps": 17319, "wall": 28825.6} {"step": 7618, "train_loss": 3.578461170196533, "lr": 0.00035716286430737465, "tps": 17317, "wall": 28833.8} {"step": 7619, "train_loss": 3.6613874435424805, "lr": 0.00035715045760882446, "tps": 17314, "wall": 28841.5} {"step": 7620, "train_loss": 3.691744804382324, "lr": 0.0003571380493566264, "tps": 17312, "wall": 28849.5} {"step": 7621, "train_loss": 3.4541378021240234, "lr": 0.0003571256395509211, "tps": 17309, "wall": 28857.3} {"step": 7622, "train_loss": 3.5973494052886963, "lr": 0.00035711322819184915, "tps": 17307, "wall": 28865.2} {"step": 7623, "train_loss": 3.5292441844940186, "lr": 0.0003571008152795511, "tps": 17305, "wall": 28872.9} {"step": 7624, "train_loss": 3.6999990940093994, "lr": 0.00035708840081416764, "tps": 17302, "wall": 28880.6} {"step": 7625, "train_loss": 3.6077370643615723, "lr": 0.0003570759847958393, "tps": 17300, "wall": 28888.5} {"step": 7626, "train_loss": 3.617220878601074, "lr": 0.0003570635672247069, "tps": 17297, "wall": 28896.2} {"step": 7627, "train_loss": 3.6305956840515137, "lr": 0.0003570511481009109, "tps": 17295, "wall": 28904.1} {"step": 7628, "train_loss": 3.661008358001709, "lr": 0.0003570387274245921, "tps": 17293, "wall": 28911.9} {"step": 7629, "train_loss": 3.602173328399658, "lr": 0.0003570263051958912, "tps": 17290, "wall": 28919.7} {"step": 7630, "train_loss": 3.5395374298095703, "lr": 0.0003570138814149489, "tps": 17288, "wall": 28927.5} {"step": 7631, "train_loss": 3.6436920166015625, "lr": 0.00035700145608190593, "tps": 17285, "wall": 28935.3} {"step": 7632, "train_loss": 3.58337140083313, "lr": 0.0003569890291969031, "tps": 17283, "wall": 28943.0} {"step": 7633, "train_loss": 3.508669853210449, "lr": 0.000356976600760081, "tps": 17281, "wall": 28950.9} {"step": 7634, "train_loss": 3.5457375049591064, "lr": 0.0003569641707715807, "tps": 17278, "wall": 28958.6} {"step": 7635, "train_loss": 3.62321138381958, "lr": 0.00035695173923154283, "tps": 17276, "wall": 28966.5} {"step": 7636, "train_loss": 3.541560173034668, "lr": 0.00035693930614010824, "tps": 17273, "wall": 28974.4} {"step": 7637, "train_loss": 3.552717447280884, "lr": 0.0003569268714974178, "tps": 17271, "wall": 28982.2} {"step": 7638, "train_loss": 3.5572216510772705, "lr": 0.0003569144353036123, "tps": 17269, "wall": 28989.9} {"step": 7639, "train_loss": 3.6206164360046387, "lr": 0.0003569019975588327, "tps": 17266, "wall": 28997.8} {"step": 7640, "train_loss": 3.6442623138427734, "lr": 0.0003568895582632199, "tps": 17264, "wall": 29005.5} {"step": 7641, "train_loss": 3.6053614616394043, "lr": 0.0003568771174169147, "tps": 17261, "wall": 29013.3} {"step": 7642, "train_loss": 3.6339874267578125, "lr": 0.00035686467502005816, "tps": 17259, "wall": 29021.0} {"step": 7643, "train_loss": 3.6748414039611816, "lr": 0.0003568522310727911, "tps": 17257, "wall": 29028.8} {"step": 7644, "train_loss": 3.5887808799743652, "lr": 0.00035683978557525466, "tps": 17254, "wall": 29036.7} {"step": 7645, "train_loss": 3.6349902153015137, "lr": 0.00035682733852758974, "tps": 17252, "wall": 29044.5} {"step": 7646, "train_loss": 3.7176496982574463, "lr": 0.00035681488992993725, "tps": 17250, "wall": 29052.2} {"step": 7647, "train_loss": 3.635929822921753, "lr": 0.0003568024397824383, "tps": 17247, "wall": 29060.0} {"step": 7648, "train_loss": 3.6639678478240967, "lr": 0.00035678998808523396, "tps": 17245, "wall": 29067.8} {"step": 7649, "train_loss": 3.6292953491210938, "lr": 0.00035677753483846514, "tps": 17243, "wall": 29075.4} {"step": 7650, "train_loss": 3.747720718383789, "lr": 0.00035676508004227315, "tps": 17240, "wall": 29083.1} {"step": 7651, "train_loss": 3.646289348602295, "lr": 0.00035675262369679885, "tps": 17238, "wall": 29091.1} {"step": 7652, "train_loss": 3.688523769378662, "lr": 0.0003567401658021834, "tps": 17235, "wall": 29098.9} {"step": 7653, "train_loss": 3.66715931892395, "lr": 0.00035672770635856803, "tps": 17233, "wall": 29106.7} {"step": 7654, "train_loss": 3.5683388710021973, "lr": 0.0003567152453660938, "tps": 17231, "wall": 29114.4} {"step": 7655, "train_loss": 3.727269411087036, "lr": 0.00035670278282490177, "tps": 17228, "wall": 29122.3} {"step": 7656, "train_loss": 3.627816915512085, "lr": 0.00035669031873513334, "tps": 17226, "wall": 29130.0} {"step": 7657, "train_loss": 3.599079132080078, "lr": 0.0003566778530969295, "tps": 17224, "wall": 29137.8} {"step": 7658, "train_loss": 3.581040143966675, "lr": 0.0003566653859104316, "tps": 17221, "wall": 29145.6} {"step": 7659, "train_loss": 3.632169246673584, "lr": 0.00035665291717578074, "tps": 17219, "wall": 29153.4} {"step": 7660, "train_loss": 3.578183650970459, "lr": 0.00035664044689311835, "tps": 17217, "wall": 29161.1} {"step": 7661, "train_loss": 3.581754446029663, "lr": 0.0003566279750625855, "tps": 17214, "wall": 29168.8} {"step": 7662, "train_loss": 3.5602633953094482, "lr": 0.00035661550168432355, "tps": 17212, "wall": 29176.6} {"step": 7663, "train_loss": 3.523822069168091, "lr": 0.0003566030267584739, "tps": 17210, "wall": 29184.3} {"step": 7664, "train_loss": 3.6113908290863037, "lr": 0.0003565905502851777, "tps": 17207, "wall": 29192.1} {"step": 7665, "train_loss": 3.653637170791626, "lr": 0.00035657807226457635, "tps": 17205, "wall": 29199.8} {"step": 7666, "train_loss": 3.7475342750549316, "lr": 0.00035656559269681127, "tps": 17203, "wall": 29207.7} {"step": 7667, "train_loss": 3.5008509159088135, "lr": 0.00035655311158202374, "tps": 17200, "wall": 29215.4} {"step": 7668, "train_loss": 3.53997802734375, "lr": 0.0003565406289203551, "tps": 17198, "wall": 29223.1} {"step": 7669, "train_loss": 3.6419174671173096, "lr": 0.0003565281447119469, "tps": 17196, "wall": 29230.8} {"step": 7670, "train_loss": 3.7189183235168457, "lr": 0.0003565156589569405, "tps": 17193, "wall": 29238.6} {"step": 7671, "train_loss": 3.6493091583251953, "lr": 0.0003565031716554773, "tps": 17191, "wall": 29246.4} {"step": 7672, "train_loss": 3.5606915950775146, "lr": 0.00035649068280769883, "tps": 17189, "wall": 29254.1} {"step": 7673, "train_loss": 3.602202892303467, "lr": 0.0003564781924137465, "tps": 17187, "wall": 29261.8} {"step": 7674, "train_loss": 3.613532304763794, "lr": 0.0003564657004737618, "tps": 17184, "wall": 29269.7} {"step": 7675, "train_loss": 3.577152967453003, "lr": 0.0003564532069878863, "tps": 17182, "wall": 29277.5} {"step": 7676, "train_loss": 3.6299610137939453, "lr": 0.00035644071195626144, "tps": 17180, "wall": 29285.2} {"step": 7677, "train_loss": 3.7580997943878174, "lr": 0.00035642821537902884, "tps": 17177, "wall": 29292.8} {"step": 7678, "train_loss": 3.6220650672912598, "lr": 0.00035641571725633, "tps": 17175, "wall": 29300.6} {"step": 7679, "train_loss": 3.6373138427734375, "lr": 0.0003564032175883066, "tps": 17173, "wall": 29308.3} {"step": 7680, "train_loss": 3.5929172039031982, "lr": 0.0003563907163751002, "tps": 17170, "wall": 29316.0} {"step": 7681, "train_loss": 3.560544013977051, "lr": 0.0003563782136168523, "tps": 17168, "wall": 29323.9} {"step": 7682, "train_loss": 3.6469850540161133, "lr": 0.0003563657093137047, "tps": 17166, "wall": 29331.7} {"step": 7683, "train_loss": 3.559173107147217, "lr": 0.00035635320346579885, "tps": 17163, "wall": 29339.4} {"step": 7684, "train_loss": 3.570693254470825, "lr": 0.0003563406960732766, "tps": 17161, "wall": 29347.1} {"step": 7685, "train_loss": 3.531996488571167, "lr": 0.00035632818713627956, "tps": 17159, "wall": 29354.9} {"step": 7686, "train_loss": 3.5831189155578613, "lr": 0.00035631567665494947, "tps": 17157, "wall": 29362.6} {"step": 7687, "train_loss": 3.550153970718384, "lr": 0.000356303164629428, "tps": 17154, "wall": 29370.3} {"step": 7688, "train_loss": 3.533832550048828, "lr": 0.0003562906510598569, "tps": 17152, "wall": 29378.1} {"step": 7689, "train_loss": 3.5450916290283203, "lr": 0.000356278135946378, "tps": 17150, "wall": 29385.9} {"step": 7690, "train_loss": 3.7086358070373535, "lr": 0.0003562656192891329, "tps": 17147, "wall": 29393.7} {"step": 7691, "train_loss": 3.609701156616211, "lr": 0.0003562531010882635, "tps": 17145, "wall": 29401.3} {"step": 7692, "train_loss": 3.6498007774353027, "lr": 0.00035624058134391167, "tps": 17143, "wall": 29409.1} {"step": 7693, "train_loss": 3.592782974243164, "lr": 0.0003562280600562191, "tps": 17141, "wall": 29416.8} {"step": 7694, "train_loss": 3.633202075958252, "lr": 0.00035621553722532776, "tps": 17138, "wall": 29424.7} {"step": 7695, "train_loss": 3.5239744186401367, "lr": 0.0003562030128513794, "tps": 17136, "wall": 29432.4} {"step": 7696, "train_loss": 3.5460972785949707, "lr": 0.000356190486934516, "tps": 17134, "wall": 29440.0} {"step": 7697, "train_loss": 3.5546693801879883, "lr": 0.0003561779594748793, "tps": 17131, "wall": 29447.9} {"step": 7698, "train_loss": 3.641355037689209, "lr": 0.00035616543047261136, "tps": 17129, "wall": 29455.6} {"step": 7699, "train_loss": 3.7099051475524902, "lr": 0.00035615289992785407, "tps": 17127, "wall": 29463.3} {"step": 7700, "train_loss": 3.6164002418518066, "lr": 0.00035614036784074936, "tps": 17125, "wall": 29471.0} {"step": 7701, "train_loss": 3.653252601623535, "lr": 0.00035612783421143916, "tps": 17122, "wall": 29478.7} {"step": 7702, "train_loss": 3.528992176055908, "lr": 0.00035611529904006555, "tps": 17120, "wall": 29486.6} {"step": 7703, "train_loss": 3.697087287902832, "lr": 0.0003561027623267704, "tps": 17118, "wall": 29494.3} {"step": 7704, "train_loss": 3.605681896209717, "lr": 0.00035609022407169586, "tps": 17115, "wall": 29502.0} {"step": 7705, "train_loss": 3.468100070953369, "lr": 0.00035607768427498384, "tps": 17113, "wall": 29509.8} {"step": 7706, "train_loss": 3.555408477783203, "lr": 0.0003560651429367765, "tps": 17111, "wall": 29517.6} {"step": 7707, "train_loss": 3.591939687728882, "lr": 0.0003560526000572158, "tps": 17109, "wall": 29525.3} {"step": 7708, "train_loss": 3.617677688598633, "lr": 0.000356040055636444, "tps": 17106, "wall": 29532.9} {"step": 7709, "train_loss": 3.5181403160095215, "lr": 0.00035602750967460295, "tps": 17104, "wall": 29540.7} {"step": 7710, "train_loss": 3.7004756927490234, "lr": 0.000356014962171835, "tps": 17102, "wall": 29548.5} {"step": 7711, "train_loss": 3.4922327995300293, "lr": 0.00035600241312828214, "tps": 17100, "wall": 29556.1} {"step": 7712, "train_loss": 3.5387887954711914, "lr": 0.00035598986254408663, "tps": 17097, "wall": 29564.1} {"step": 7713, "train_loss": 3.5759730339050293, "lr": 0.0003559773104193906, "tps": 17095, "wall": 29571.8} {"step": 7714, "train_loss": 3.55574369430542, "lr": 0.0003559647567543363, "tps": 17093, "wall": 29579.5} {"step": 7715, "train_loss": 3.5834531784057617, "lr": 0.0003559522015490658, "tps": 17090, "wall": 29587.4} {"step": 7716, "train_loss": 3.570488929748535, "lr": 0.00035593964480372137, "tps": 17088, "wall": 29595.0} {"step": 7717, "train_loss": 3.657331943511963, "lr": 0.0003559270865184453, "tps": 17086, "wall": 29602.9} {"step": 7718, "train_loss": 3.643883228302002, "lr": 0.00035591452669337997, "tps": 17084, "wall": 29610.7} {"step": 7719, "train_loss": 3.567077159881592, "lr": 0.0003559019653286674, "tps": 17081, "wall": 29618.4} {"step": 7720, "train_loss": 3.590524435043335, "lr": 0.00035588940242445, "tps": 17079, "wall": 29626.3} {"step": 7721, "train_loss": 3.6549012660980225, "lr": 0.0003558768379808702, "tps": 17077, "wall": 29634.1} {"step": 7722, "train_loss": 3.666407346725464, "lr": 0.0003558642719980702, "tps": 17075, "wall": 29641.8} {"step": 7723, "train_loss": 3.7163243293762207, "lr": 0.00035585170447619235, "tps": 17072, "wall": 29649.6} {"step": 7724, "train_loss": 3.668914556503296, "lr": 0.0003558391354153791, "tps": 17070, "wall": 29657.3} {"step": 7725, "train_loss": 3.5768308639526367, "lr": 0.00035582656481577266, "tps": 17068, "wall": 29665.0} {"step": 7726, "train_loss": 3.6490159034729004, "lr": 0.0003558139926775156, "tps": 17066, "wall": 29672.7} {"step": 7727, "train_loss": 3.599691390991211, "lr": 0.0003558014190007503, "tps": 17063, "wall": 29680.5} {"step": 7728, "train_loss": 3.566211223602295, "lr": 0.00035578884378561923, "tps": 17061, "wall": 29688.4} {"step": 7729, "train_loss": 3.7524776458740234, "lr": 0.00035577626703226466, "tps": 17059, "wall": 29696.2} {"step": 7730, "train_loss": 3.60319447517395, "lr": 0.00035576368874082933, "tps": 17056, "wall": 29703.9} {"step": 7731, "train_loss": 3.7516613006591797, "lr": 0.00035575110891145555, "tps": 17054, "wall": 29711.7} {"step": 7732, "train_loss": 3.759169816970825, "lr": 0.0003557385275442858, "tps": 17052, "wall": 29719.5} {"step": 7733, "train_loss": 3.6202383041381836, "lr": 0.00035572594463946267, "tps": 17050, "wall": 29727.3} {"step": 7734, "train_loss": 3.525686740875244, "lr": 0.00035571336019712876, "tps": 17047, "wall": 29735.0} {"step": 7735, "train_loss": 3.6860923767089844, "lr": 0.0003557007742174265, "tps": 17045, "wall": 29742.7} {"step": 7736, "train_loss": 3.5737624168395996, "lr": 0.00035568818670049865, "tps": 17043, "wall": 29750.5} {"step": 7737, "train_loss": 3.52851939201355, "lr": 0.00035567559764648754, "tps": 17041, "wall": 29758.4} {"step": 7738, "train_loss": 3.607664108276367, "lr": 0.000355663007055536, "tps": 17038, "wall": 29766.1} {"step": 7739, "train_loss": 3.5929253101348877, "lr": 0.00035565041492778657, "tps": 17036, "wall": 29773.9} {"step": 7740, "train_loss": 3.575416326522827, "lr": 0.00035563782126338186, "tps": 17034, "wall": 29781.7} {"step": 7741, "train_loss": 3.560540199279785, "lr": 0.0003556252260624646, "tps": 17032, "wall": 29789.5} {"step": 7742, "train_loss": 3.6363883018493652, "lr": 0.00035561262932517747, "tps": 17029, "wall": 29797.2} {"step": 7743, "train_loss": 3.638728618621826, "lr": 0.0003556000310516631, "tps": 17027, "wall": 29805.1} {"step": 7744, "train_loss": 3.613668918609619, "lr": 0.00035558743124206423, "tps": 17025, "wall": 29812.8} {"step": 7745, "train_loss": 3.5846924781799316, "lr": 0.0003555748298965236, "tps": 17023, "wall": 29820.6} {"step": 7746, "train_loss": 3.5753731727600098, "lr": 0.00035556222701518396, "tps": 17020, "wall": 29828.4} {"step": 7747, "train_loss": 3.7417593002319336, "lr": 0.00035554962259818815, "tps": 17018, "wall": 29836.2} {"step": 7748, "train_loss": 3.533545970916748, "lr": 0.0003555370166456788, "tps": 17016, "wall": 29843.9} {"step": 7749, "train_loss": 3.5562527179718018, "lr": 0.00035552440915779886, "tps": 17014, "wall": 29851.6} {"step": 7750, "train_loss": 3.574399709701538, "lr": 0.00035551180013469107, "tps": 17012, "wall": 29859.2} {"step": 7751, "train_loss": 3.6668953895568848, "lr": 0.0003554991895764982, "tps": 17009, "wall": 29867.2} {"step": 7752, "train_loss": 3.644606113433838, "lr": 0.0003554865774833633, "tps": 17007, "wall": 29874.9} {"step": 7753, "train_loss": 3.502775192260742, "lr": 0.00035547396385542904, "tps": 17005, "wall": 29882.7} {"step": 7754, "train_loss": 3.6191530227661133, "lr": 0.0003554613486928384, "tps": 17003, "wall": 29890.5} {"step": 7755, "train_loss": 3.615574836730957, "lr": 0.0003554487319957342, "tps": 17000, "wall": 29898.3} {"step": 7756, "train_loss": 3.5587499141693115, "lr": 0.0003554361137642596, "tps": 16998, "wall": 29906.1} {"step": 7757, "train_loss": 3.612793207168579, "lr": 0.00035542349399855723, "tps": 16996, "wall": 29913.8} {"step": 7758, "train_loss": 3.587881565093994, "lr": 0.0003554108726987703, "tps": 16994, "wall": 29921.6} {"step": 7759, "train_loss": 3.5865519046783447, "lr": 0.0003553982498650416, "tps": 16991, "wall": 29929.4} {"step": 7760, "train_loss": 3.5858817100524902, "lr": 0.00035538562549751424, "tps": 16989, "wall": 29937.3} {"step": 7761, "train_loss": 3.5500035285949707, "lr": 0.00035537299959633123, "tps": 16987, "wall": 29945.1} {"step": 7762, "train_loss": 3.549501657485962, "lr": 0.0003553603721616355, "tps": 16985, "wall": 29952.8} {"step": 7763, "train_loss": 3.5159988403320312, "lr": 0.00035534774319357016, "tps": 16983, "wall": 29960.5} {"step": 7764, "train_loss": 3.607356071472168, "lr": 0.0003553351126922783, "tps": 16980, "wall": 29968.3} {"step": 7765, "train_loss": 3.6300888061523438, "lr": 0.0003553224806579029, "tps": 16978, "wall": 29976.0} {"step": 7766, "train_loss": 3.502753496170044, "lr": 0.0003553098470905872, "tps": 16976, "wall": 29984.0} {"step": 7767, "train_loss": 3.552365303039551, "lr": 0.0003552972119904741, "tps": 16974, "wall": 29991.6} {"step": 7768, "train_loss": 3.719442844390869, "lr": 0.00035528457535770693, "tps": 16971, "wall": 29999.4} {"step": 7769, "train_loss": 3.5935466289520264, "lr": 0.0003552719371924288, "tps": 16969, "wall": 30007.1} {"step": 7770, "train_loss": 3.601384401321411, "lr": 0.00035525929749478284, "tps": 16967, "wall": 30014.9} {"step": 7771, "train_loss": 3.5694403648376465, "lr": 0.0003552466562649123, "tps": 16965, "wall": 30022.6} {"step": 7772, "train_loss": 3.459928035736084, "lr": 0.00035523401350296026, "tps": 16963, "wall": 30030.4} {"step": 7773, "train_loss": 3.5792694091796875, "lr": 0.0003552213692090699, "tps": 16961, "wall": 30038.0} {"step": 7774, "train_loss": 3.596806764602661, "lr": 0.0003552087233833847, "tps": 16958, "wall": 30045.8} {"step": 7775, "train_loss": 3.5494394302368164, "lr": 0.0003551960760260477, "tps": 16956, "wall": 30053.5} {"step": 7776, "train_loss": 3.6729180812835693, "lr": 0.00035518342713720225, "tps": 16954, "wall": 30061.4} {"step": 7777, "train_loss": 3.6225085258483887, "lr": 0.0003551707767169916, "tps": 16952, "wall": 30069.1} {"step": 7778, "train_loss": 3.6098904609680176, "lr": 0.0003551581247655591, "tps": 16950, "wall": 30076.8} {"step": 7779, "train_loss": 3.6969730854034424, "lr": 0.00035514547128304814, "tps": 16947, "wall": 30084.6} {"step": 7780, "train_loss": 3.5873849391937256, "lr": 0.00035513281626960185, "tps": 16945, "wall": 30092.3} {"step": 7781, "train_loss": 3.541917324066162, "lr": 0.00035512015972536374, "tps": 16943, "wall": 30100.0} {"step": 7782, "train_loss": 3.6219699382781982, "lr": 0.0003551075016504771, "tps": 16941, "wall": 30107.8} {"step": 7783, "train_loss": 3.633876323699951, "lr": 0.00035509484204508543, "tps": 16939, "wall": 30115.5} {"step": 7784, "train_loss": 3.514892101287842, "lr": 0.00035508218090933206, "tps": 16937, "wall": 30123.2} {"step": 7785, "train_loss": 3.6232211589813232, "lr": 0.00035506951824336046, "tps": 16934, "wall": 30131.0} {"step": 7786, "train_loss": 3.4952399730682373, "lr": 0.000355056854047314, "tps": 16932, "wall": 30138.7} {"step": 7787, "train_loss": 3.5928304195404053, "lr": 0.0003550441883213363, "tps": 16930, "wall": 30146.5} {"step": 7788, "train_loss": 3.6952831745147705, "lr": 0.0003550315210655707, "tps": 16928, "wall": 30154.2} {"step": 7789, "train_loss": 3.6301066875457764, "lr": 0.00035501885228016064, "tps": 16926, "wall": 30161.8} {"step": 7790, "train_loss": 3.607822895050049, "lr": 0.0003550061819652498, "tps": 16923, "wall": 30169.8} {"step": 7791, "train_loss": 3.5407867431640625, "lr": 0.00035499351012098154, "tps": 16921, "wall": 30177.5} {"step": 7792, "train_loss": 3.5311622619628906, "lr": 0.00035498083674749954, "tps": 16919, "wall": 30185.3} {"step": 7793, "train_loss": 3.5823183059692383, "lr": 0.0003549681618449473, "tps": 16917, "wall": 30192.9} {"step": 7794, "train_loss": 3.678670883178711, "lr": 0.0003549554854134685, "tps": 16915, "wall": 30200.7} {"step": 7795, "train_loss": 3.6622307300567627, "lr": 0.0003549428074532066, "tps": 16913, "wall": 30208.5} {"step": 7796, "train_loss": 3.5438852310180664, "lr": 0.00035493012796430527, "tps": 16910, "wall": 30216.2} {"step": 7797, "train_loss": 3.5530812740325928, "lr": 0.00035491744694690814, "tps": 16908, "wall": 30224.1} {"step": 7798, "train_loss": 3.523934841156006, "lr": 0.0003549047644011589, "tps": 16906, "wall": 30231.7} {"step": 7799, "train_loss": 3.5505282878875732, "lr": 0.0003548920803272012, "tps": 16904, "wall": 30239.4} {"step": 7800, "train_loss": 3.6391549110412598, "lr": 0.0003548793947251787, "tps": 16902, "wall": 30247.2} {"step": 7801, "train_loss": 3.625408411026001, "lr": 0.00035486670759523513, "tps": 16900, "wall": 30254.9} {"step": 7802, "train_loss": 3.581749200820923, "lr": 0.00035485401893751414, "tps": 16897, "wall": 30262.7} {"step": 7803, "train_loss": 3.570099115371704, "lr": 0.0003548413287521596, "tps": 16895, "wall": 30270.4} {"step": 7804, "train_loss": 3.603900671005249, "lr": 0.0003548286370393152, "tps": 16893, "wall": 30278.0} {"step": 7805, "train_loss": 3.476003646850586, "lr": 0.00035481594379912465, "tps": 16891, "wall": 30285.9} {"step": 7806, "train_loss": 3.57684588432312, "lr": 0.00035480324903173187, "tps": 16889, "wall": 30293.6} {"step": 7807, "train_loss": 3.5408530235290527, "lr": 0.00035479055273728054, "tps": 16887, "wall": 30301.4} {"step": 7808, "train_loss": 3.6594552993774414, "lr": 0.00035477785491591456, "tps": 16885, "wall": 30309.2} {"step": 7809, "train_loss": 3.58935546875, "lr": 0.0003547651555677777, "tps": 16882, "wall": 30316.9} {"step": 7810, "train_loss": 3.665003538131714, "lr": 0.0003547524546930139, "tps": 16880, "wall": 30324.6} {"step": 7811, "train_loss": 3.6100687980651855, "lr": 0.000354739752291767, "tps": 16878, "wall": 30332.4} {"step": 7812, "train_loss": 3.6408369541168213, "lr": 0.00035472704836418087, "tps": 16876, "wall": 30340.0} {"step": 7813, "train_loss": 3.630992889404297, "lr": 0.00035471434291039946, "tps": 16874, "wall": 30348.0} {"step": 7814, "train_loss": 3.6258018016815186, "lr": 0.00035470163593056674, "tps": 16872, "wall": 30355.6} {"step": 7815, "train_loss": 3.6743531227111816, "lr": 0.00035468892742482653, "tps": 16870, "wall": 30363.3} {"step": 7816, "train_loss": 3.533989667892456, "lr": 0.0003546762173933229, "tps": 16867, "wall": 30371.0} {"step": 7817, "train_loss": 3.5759308338165283, "lr": 0.00035466350583619977, "tps": 16865, "wall": 30378.7} {"step": 7818, "train_loss": 3.613651990890503, "lr": 0.00035465079275360124, "tps": 16863, "wall": 30386.4} {"step": 7819, "train_loss": 3.7093849182128906, "lr": 0.00035463807814567114, "tps": 16861, "wall": 30394.1} {"step": 7820, "train_loss": 3.592745304107666, "lr": 0.00035462536201255363, "tps": 16859, "wall": 30401.8} {"step": 7821, "train_loss": 3.6946403980255127, "lr": 0.0003546126443543928, "tps": 16857, "wall": 30409.6} {"step": 7822, "train_loss": 3.5914034843444824, "lr": 0.0003545999251713326, "tps": 16855, "wall": 30417.3} {"step": 7823, "train_loss": 3.6295478343963623, "lr": 0.0003545872044635172, "tps": 16852, "wall": 30425.1} {"step": 7824, "train_loss": 3.602966785430908, "lr": 0.00035457448223109064, "tps": 16850, "wall": 30432.7} {"step": 7825, "train_loss": 3.6807422637939453, "lr": 0.000354561758474197, "tps": 16848, "wall": 30440.5} {"step": 7826, "train_loss": 3.6384057998657227, "lr": 0.00035454903319298055, "tps": 16846, "wall": 30448.2} {"step": 7827, "train_loss": 3.5033459663391113, "lr": 0.0003545363063875854, "tps": 16844, "wall": 30455.9} {"step": 7828, "train_loss": 3.693627119064331, "lr": 0.0003545235780581557, "tps": 16842, "wall": 30463.8} {"step": 7829, "train_loss": 3.7465620040893555, "lr": 0.00035451084820483557, "tps": 16840, "wall": 30471.5} {"step": 7830, "train_loss": 3.665698528289795, "lr": 0.0003544981168277693, "tps": 16838, "wall": 30479.3} {"step": 7831, "train_loss": 3.504871368408203, "lr": 0.0003544853839271011, "tps": 16835, "wall": 30487.0} {"step": 7832, "train_loss": 3.6301374435424805, "lr": 0.00035447264950297516, "tps": 16833, "wall": 30494.7} {"step": 7833, "train_loss": 3.6314468383789062, "lr": 0.00035445991355553575, "tps": 16831, "wall": 30502.5} {"step": 7834, "train_loss": 3.604126453399658, "lr": 0.0003544471760849272, "tps": 16829, "wall": 30510.2} {"step": 7835, "train_loss": 3.5643250942230225, "lr": 0.0003544344370912938, "tps": 16827, "wall": 30517.9} {"step": 7836, "train_loss": 3.5860977172851562, "lr": 0.0003544216965747798, "tps": 16825, "wall": 30525.8} {"step": 7837, "train_loss": 3.6288676261901855, "lr": 0.0003544089545355295, "tps": 16823, "wall": 30533.6} {"step": 7838, "train_loss": 3.6411850452423096, "lr": 0.00035439621097368735, "tps": 16821, "wall": 30541.3} {"step": 7839, "train_loss": 3.6662254333496094, "lr": 0.0003543834658893977, "tps": 16818, "wall": 30549.0} {"step": 7840, "train_loss": 3.630958080291748, "lr": 0.00035437071928280477, "tps": 16816, "wall": 30556.9} {"step": 7841, "train_loss": 3.5876803398132324, "lr": 0.00035435797115405314, "tps": 16814, "wall": 30564.7} {"step": 7842, "train_loss": 3.6629953384399414, "lr": 0.0003543452215032871, "tps": 16812, "wall": 30572.5} {"step": 7843, "train_loss": 3.5567121505737305, "lr": 0.0003543324703306511, "tps": 16810, "wall": 30580.3} {"step": 7844, "train_loss": 3.557013511657715, "lr": 0.00035431971763628966, "tps": 16808, "wall": 30588.2} {"step": 7845, "train_loss": 3.652278423309326, "lr": 0.0003543069634203472, "tps": 16805, "wall": 30596.0} {"step": 7846, "train_loss": 3.622018814086914, "lr": 0.00035429420768296816, "tps": 16803, "wall": 30603.8} {"step": 7847, "train_loss": 3.6915693283081055, "lr": 0.0003542814504242971, "tps": 16801, "wall": 30611.5} {"step": 7848, "train_loss": 3.601247787475586, "lr": 0.00035426869164447843, "tps": 16799, "wall": 30619.3} {"step": 7849, "train_loss": 3.5293819904327393, "lr": 0.00035425593134365686, "tps": 16797, "wall": 30627.1} {"step": 7850, "train_loss": 3.461635112762451, "lr": 0.00035424316952197677, "tps": 16795, "wall": 30635.0} {"step": 7851, "train_loss": 3.536604642868042, "lr": 0.00035423040617958284, "tps": 16793, "wall": 30642.9} {"step": 7852, "train_loss": 3.579934597015381, "lr": 0.0003542176413166196, "tps": 16790, "wall": 30650.7} {"step": 7853, "train_loss": 3.651810884475708, "lr": 0.0003542048749332316, "tps": 16788, "wall": 30658.5} {"step": 7854, "train_loss": 3.686110734939575, "lr": 0.0003541921070295635, "tps": 16786, "wall": 30666.2} {"step": 7855, "train_loss": 3.6926937103271484, "lr": 0.00035417933760576006, "tps": 16784, "wall": 30673.9} {"step": 7856, "train_loss": 3.6251230239868164, "lr": 0.0003541665666619658, "tps": 16782, "wall": 30681.7} {"step": 7857, "train_loss": 3.6882002353668213, "lr": 0.0003541537941983254, "tps": 16780, "wall": 30689.5} {"step": 7858, "train_loss": 3.6127374172210693, "lr": 0.00035414102021498353, "tps": 16778, "wall": 30697.2} {"step": 7859, "train_loss": 3.6035847663879395, "lr": 0.0003541282447120849, "tps": 16776, "wall": 30705.1} {"step": 7860, "train_loss": 3.6018943786621094, "lr": 0.0003541154676897743, "tps": 16773, "wall": 30713.0} {"step": 7861, "train_loss": 3.5485072135925293, "lr": 0.00035410268914819643, "tps": 16771, "wall": 30720.7} {"step": 7862, "train_loss": 3.6127233505249023, "lr": 0.00035408990908749607, "tps": 16769, "wall": 30728.4} {"step": 7863, "train_loss": 3.625298023223877, "lr": 0.0003540771275078179, "tps": 16767, "wall": 30736.1} {"step": 7864, "train_loss": 3.5761914253234863, "lr": 0.0003540643444093068, "tps": 16765, "wall": 30743.9} {"step": 7865, "train_loss": 3.5547938346862793, "lr": 0.0003540515597921076, "tps": 16763, "wall": 30751.6} {"step": 7866, "train_loss": 3.62148380279541, "lr": 0.00035403877365636503, "tps": 16761, "wall": 30759.3} {"step": 7867, "train_loss": 3.5747060775756836, "lr": 0.000354025986002224, "tps": 16759, "wall": 30767.2} {"step": 7868, "train_loss": 3.6427927017211914, "lr": 0.0003540131968298293, "tps": 16757, "wall": 30774.9} {"step": 7869, "train_loss": 3.67741322517395, "lr": 0.000354000406139326, "tps": 16755, "wall": 30782.7} {"step": 7870, "train_loss": 3.5844640731811523, "lr": 0.0003539876139308587, "tps": 16753, "wall": 30790.5} {"step": 7871, "train_loss": 3.619516134262085, "lr": 0.0003539748202045725, "tps": 16750, "wall": 30798.1} {"step": 7872, "train_loss": 3.609416961669922, "lr": 0.00035396202496061234, "tps": 16748, "wall": 30805.9} {"step": 7873, "train_loss": 3.626826286315918, "lr": 0.00035394922819912306, "tps": 16746, "wall": 30813.6} {"step": 7874, "train_loss": 3.587505578994751, "lr": 0.00035393642992024964, "tps": 16744, "wall": 30821.4} {"step": 7875, "train_loss": 3.585695266723633, "lr": 0.0003539236301241372, "tps": 16742, "wall": 30829.2} {"step": 7876, "train_loss": 3.587475299835205, "lr": 0.0003539108288109305, "tps": 16740, "wall": 30837.0} {"step": 7877, "train_loss": 3.6026644706726074, "lr": 0.0003538980259807748, "tps": 16738, "wall": 30844.6} {"step": 7878, "train_loss": 3.49204158782959, "lr": 0.00035388522163381494, "tps": 16736, "wall": 30852.4} {"step": 7879, "train_loss": 3.659374237060547, "lr": 0.00035387241577019613, "tps": 16734, "wall": 30860.1} {"step": 7880, "train_loss": 3.62518310546875, "lr": 0.00035385960839006336, "tps": 16732, "wall": 30868.0} {"step": 7881, "train_loss": 3.6347193717956543, "lr": 0.00035384679949356163, "tps": 16730, "wall": 30875.6} {"step": 7882, "train_loss": 3.6993558406829834, "lr": 0.0003538339890808361, "tps": 16728, "wall": 30883.3} {"step": 7883, "train_loss": 3.5730981826782227, "lr": 0.00035382117715203196, "tps": 16725, "wall": 30891.2} {"step": 7884, "train_loss": 3.6095657348632812, "lr": 0.00035380836370729426, "tps": 16723, "wall": 30899.0} {"step": 7885, "train_loss": 3.6006717681884766, "lr": 0.00035379554874676814, "tps": 16721, "wall": 30906.8} {"step": 7886, "train_loss": 3.570164918899536, "lr": 0.00035378273227059894, "tps": 16719, "wall": 30914.4} {"step": 7887, "train_loss": 3.4847545623779297, "lr": 0.0003537699142789316, "tps": 16717, "wall": 30922.2} {"step": 7888, "train_loss": 3.6162376403808594, "lr": 0.00035375709477191146, "tps": 16715, "wall": 30929.9} {"step": 7889, "train_loss": 3.7047617435455322, "lr": 0.00035374427374968364, "tps": 16713, "wall": 30937.5} {"step": 7890, "train_loss": 3.650113344192505, "lr": 0.00035373145121239354, "tps": 16711, "wall": 30945.4} {"step": 7891, "train_loss": 3.6747570037841797, "lr": 0.00035371862716018635, "tps": 16709, "wall": 30953.1} {"step": 7892, "train_loss": 3.6333506107330322, "lr": 0.0003537058015932073, "tps": 16707, "wall": 30960.8} {"step": 7893, "train_loss": 3.6044743061065674, "lr": 0.00035369297451160164, "tps": 16705, "wall": 30968.6} {"step": 7894, "train_loss": 3.590768814086914, "lr": 0.00035368014591551474, "tps": 16703, "wall": 30976.3} {"step": 7895, "train_loss": 3.563821315765381, "lr": 0.000353667315805092, "tps": 16701, "wall": 30984.2} {"step": 7896, "train_loss": 3.674417495727539, "lr": 0.00035365448418047855, "tps": 16699, "wall": 30991.8} {"step": 7897, "train_loss": 3.629761219024658, "lr": 0.0003536416510418199, "tps": 16697, "wall": 30999.5} {"step": 7898, "train_loss": 3.570934534072876, "lr": 0.0003536288163892615, "tps": 16695, "wall": 31007.3} {"step": 7899, "train_loss": 3.5580224990844727, "lr": 0.00035361598022294854, "tps": 16693, "wall": 31015.0} {"step": 7900, "train_loss": 3.634488821029663, "lr": 0.00035360314254302656, "tps": 16691, "wall": 31022.5} {"step": 7901, "train_loss": 3.5269317626953125, "lr": 0.00035359030334964096, "tps": 16689, "wall": 31030.3} {"step": 7902, "train_loss": 3.5713019371032715, "lr": 0.0003535774626429372, "tps": 16687, "wall": 31038.0} {"step": 7903, "train_loss": 3.4254493713378906, "lr": 0.00035356462042306064, "tps": 16684, "wall": 31045.8} {"step": 7904, "train_loss": 3.6069881916046143, "lr": 0.0003535517766901569, "tps": 16682, "wall": 31053.4} {"step": 7905, "train_loss": 3.5667905807495117, "lr": 0.0003535389314443714, "tps": 16680, "wall": 31061.1} {"step": 7906, "train_loss": 3.6206185817718506, "lr": 0.00035352608468584964, "tps": 16678, "wall": 31068.9} {"step": 7907, "train_loss": 3.5955214500427246, "lr": 0.0003535132364147372, "tps": 16676, "wall": 31076.8} {"step": 7908, "train_loss": 3.5524370670318604, "lr": 0.0003535003866311796, "tps": 16674, "wall": 31084.4} {"step": 7909, "train_loss": 3.7403972148895264, "lr": 0.00035348753533532233, "tps": 16672, "wall": 31092.2} {"step": 7910, "train_loss": 3.575270652770996, "lr": 0.0003534746825273111, "tps": 16670, "wall": 31099.9} {"step": 7911, "train_loss": 3.689725875854492, "lr": 0.0003534618282072914, "tps": 16668, "wall": 31107.6} {"step": 7912, "train_loss": 3.6469767093658447, "lr": 0.0003534489723754089, "tps": 16666, "wall": 31115.3} {"step": 7913, "train_loss": 3.6120615005493164, "lr": 0.00035343611503180927, "tps": 16664, "wall": 31123.0} {"step": 7914, "train_loss": 3.5595011711120605, "lr": 0.00035342325617663807, "tps": 16662, "wall": 31130.8} {"step": 7915, "train_loss": 3.576463222503662, "lr": 0.000353410395810041, "tps": 16660, "wall": 31138.5} {"step": 7916, "train_loss": 3.6216392517089844, "lr": 0.00035339753393216376, "tps": 16658, "wall": 31146.2} {"step": 7917, "train_loss": 3.776042938232422, "lr": 0.000353384670543152, "tps": 16656, "wall": 31153.9} {"step": 7918, "train_loss": 3.582702159881592, "lr": 0.00035337180564315153, "tps": 16654, "wall": 31161.7} {"step": 7919, "train_loss": 3.6850509643554688, "lr": 0.00035335893923230804, "tps": 16652, "wall": 31169.4} {"step": 7920, "train_loss": 3.5824997425079346, "lr": 0.00035334607131076723, "tps": 16650, "wall": 31177.1} {"step": 7921, "train_loss": 3.6786773204803467, "lr": 0.0003533332018786749, "tps": 16648, "wall": 31184.9} {"step": 7922, "train_loss": 3.6795477867126465, "lr": 0.0003533203309361769, "tps": 16646, "wall": 31192.6} {"step": 7923, "train_loss": 3.634652614593506, "lr": 0.00035330745848341895, "tps": 16644, "wall": 31200.4} {"step": 7924, "train_loss": 3.5065431594848633, "lr": 0.00035329458452054696, "tps": 16642, "wall": 31208.2} {"step": 7925, "train_loss": 3.624619483947754, "lr": 0.0003532817090477066, "tps": 16640, "wall": 31215.9} {"step": 7926, "train_loss": 3.7192301750183105, "lr": 0.0003532688320650439, "tps": 16638, "wall": 31223.6} {"step": 7927, "train_loss": 3.6540379524230957, "lr": 0.00035325595357270465, "tps": 16636, "wall": 31231.3} {"step": 7928, "train_loss": 3.4928810596466064, "lr": 0.0003532430735708347, "tps": 16634, "wall": 31239.1} {"step": 7929, "train_loss": 3.5342931747436523, "lr": 0.00035323019205958005, "tps": 16632, "wall": 31246.9} {"step": 7930, "train_loss": 3.7175965309143066, "lr": 0.0003532173090390866, "tps": 16630, "wall": 31254.5} {"step": 7931, "train_loss": 3.625117063522339, "lr": 0.00035320442450950017, "tps": 16628, "wall": 31262.3} {"step": 7932, "train_loss": 3.554934501647949, "lr": 0.0003531915384709669, "tps": 16626, "wall": 31269.9} {"step": 7933, "train_loss": 3.5350260734558105, "lr": 0.00035317865092363265, "tps": 16624, "wall": 31277.8} {"step": 7934, "train_loss": 3.6314902305603027, "lr": 0.0003531657618676434, "tps": 16622, "wall": 31285.5} {"step": 7935, "train_loss": 3.505357265472412, "lr": 0.00035315287130314527, "tps": 16620, "wall": 31293.2} {"step": 7936, "train_loss": 3.6538374423980713, "lr": 0.0003531399792302842, "tps": 16618, "wall": 31300.8} {"step": 7937, "train_loss": 3.5526561737060547, "lr": 0.00035312708564920627, "tps": 16615, "wall": 31308.7} {"step": 7938, "train_loss": 3.513665199279785, "lr": 0.0003531141905600574, "tps": 16614, "wall": 31316.4} {"step": 7939, "train_loss": 3.664762020111084, "lr": 0.00035310129396298387, "tps": 16612, "wall": 31324.1} {"step": 7940, "train_loss": 3.589339256286621, "lr": 0.00035308839585813164, "tps": 16609, "wall": 31331.8} {"step": 7941, "train_loss": 3.61627197265625, "lr": 0.00035307549624564685, "tps": 16607, "wall": 31339.6} {"step": 7942, "train_loss": 3.4744462966918945, "lr": 0.00035306259512567564, "tps": 16605, "wall": 31347.3} {"step": 7943, "train_loss": 3.534862518310547, "lr": 0.00035304969249836424, "tps": 16604, "wall": 31354.9} {"step": 7944, "train_loss": 3.5967178344726562, "lr": 0.0003530367883638586, "tps": 16602, "wall": 31362.6} {"step": 7945, "train_loss": 3.5291991233825684, "lr": 0.0003530238827223051, "tps": 16600, "wall": 31370.3} {"step": 7946, "train_loss": 3.558861255645752, "lr": 0.00035301097557384985, "tps": 16598, "wall": 31378.0} {"step": 7947, "train_loss": 3.540090560913086, "lr": 0.00035299806691863907, "tps": 16596, "wall": 31385.7} {"step": 7948, "train_loss": 3.56565523147583, "lr": 0.000352985156756819, "tps": 16594, "wall": 31393.3} {"step": 7949, "train_loss": 3.619843006134033, "lr": 0.00035297224508853585, "tps": 16592, "wall": 31401.0} {"step": 7950, "train_loss": 3.6356046199798584, "lr": 0.0003529593319139359, "tps": 16590, "wall": 31408.7} {"step": 7951, "train_loss": 3.655163049697876, "lr": 0.00035294641723316553, "tps": 16588, "wall": 31416.4} {"step": 7952, "train_loss": 3.537696361541748, "lr": 0.0003529335010463709, "tps": 16586, "wall": 31424.2} {"step": 7953, "train_loss": 3.6748111248016357, "lr": 0.00035292058335369836, "tps": 16584, "wall": 31431.8} {"step": 7954, "train_loss": 3.5591793060302734, "lr": 0.0003529076641552943, "tps": 16582, "wall": 31439.4} {"step": 7955, "train_loss": 3.6392338275909424, "lr": 0.00035289474345130505, "tps": 16580, "wall": 31447.0} {"step": 7956, "train_loss": 3.598173141479492, "lr": 0.0003528818212418769, "tps": 16578, "wall": 31454.8} {"step": 7957, "train_loss": 3.5397286415100098, "lr": 0.0003528688975271563, "tps": 16576, "wall": 31462.5} {"step": 7958, "train_loss": 3.6385886669158936, "lr": 0.0003528559723072897, "tps": 16574, "wall": 31470.3} {"step": 7959, "train_loss": 3.529012441635132, "lr": 0.0003528430455824234, "tps": 16572, "wall": 31477.9} {"step": 7960, "train_loss": 3.5841259956359863, "lr": 0.0003528301173527039, "tps": 16570, "wall": 31485.7} {"step": 7961, "train_loss": 3.491957187652588, "lr": 0.00035281718761827764, "tps": 16568, "wall": 31493.3} {"step": 7962, "train_loss": 3.509204387664795, "lr": 0.000352804256379291, "tps": 16566, "wall": 31501.1} {"step": 7963, "train_loss": 3.616621255874634, "lr": 0.00035279132363589074, "tps": 16564, "wall": 31508.8} {"step": 7964, "train_loss": 3.6015658378601074, "lr": 0.0003527783893882231, "tps": 16562, "wall": 31516.5} {"step": 7965, "train_loss": 3.691871404647827, "lr": 0.0003527654536364346, "tps": 16560, "wall": 31524.2} {"step": 7966, "train_loss": 3.662963628768921, "lr": 0.000352752516380672, "tps": 16558, "wall": 31532.0} {"step": 7967, "train_loss": 3.481675863265991, "lr": 0.0003527395776210817, "tps": 16556, "wall": 31539.6} {"step": 7968, "train_loss": 3.519008159637451, "lr": 0.0003527266373578102, "tps": 16554, "wall": 31547.5} {"step": 7969, "train_loss": 3.4952688217163086, "lr": 0.0003527136955910042, "tps": 16552, "wall": 31555.2} {"step": 7970, "train_loss": 3.6322407722473145, "lr": 0.00035270075232081026, "tps": 16550, "wall": 31562.8} {"step": 7971, "train_loss": 3.5903186798095703, "lr": 0.0003526878075473751, "tps": 16548, "wall": 31570.5} {"step": 7972, "train_loss": 3.6295928955078125, "lr": 0.00035267486127084515, "tps": 16546, "wall": 31578.2} {"step": 7973, "train_loss": 3.687418222427368, "lr": 0.0003526619134913673, "tps": 16544, "wall": 31586.0} {"step": 7974, "train_loss": 3.5261688232421875, "lr": 0.00035264896420908806, "tps": 16542, "wall": 31593.7} {"step": 7975, "train_loss": 3.516463279724121, "lr": 0.00035263601342415423, "tps": 16540, "wall": 31601.4} {"step": 7976, "train_loss": 3.7375621795654297, "lr": 0.0003526230611367125, "tps": 16538, "wall": 31609.3} {"step": 7977, "train_loss": 3.5922999382019043, "lr": 0.0003526101073469094, "tps": 16536, "wall": 31617.0} {"step": 7978, "train_loss": 3.611499309539795, "lr": 0.00035259715205489196, "tps": 16534, "wall": 31624.8} {"step": 7979, "train_loss": 3.7336483001708984, "lr": 0.0003525841952608068, "tps": 16532, "wall": 31632.6} {"step": 7980, "train_loss": 3.5788066387176514, "lr": 0.00035257123696480063, "tps": 16530, "wall": 31640.3} {"step": 7981, "train_loss": 3.531954526901245, "lr": 0.0003525582771670204, "tps": 16528, "wall": 31648.1} {"step": 7982, "train_loss": 3.6597604751586914, "lr": 0.0003525453158676128, "tps": 16526, "wall": 31655.8} {"step": 7983, "train_loss": 3.5692059993743896, "lr": 0.00035253235306672464, "tps": 16525, "wall": 31663.5} {"step": 7984, "train_loss": 3.6446542739868164, "lr": 0.0003525193887645029, "tps": 16523, "wall": 31671.3} {"step": 7985, "train_loss": 3.5261144638061523, "lr": 0.0003525064229610943, "tps": 16521, "wall": 31679.0} {"step": 7986, "train_loss": 3.650818109512329, "lr": 0.0003524934556566458, "tps": 16519, "wall": 31686.9} {"step": 7987, "train_loss": 3.518028497695923, "lr": 0.00035248048685130424, "tps": 16517, "wall": 31694.5} {"step": 7988, "train_loss": 3.6063263416290283, "lr": 0.00035246751654521656, "tps": 16515, "wall": 31702.3} {"step": 7989, "train_loss": 3.6379055976867676, "lr": 0.00035245454473852966, "tps": 16513, "wall": 31710.1} {"step": 7990, "train_loss": 3.6513671875, "lr": 0.00035244157143139065, "tps": 16511, "wall": 31717.9} {"step": 7991, "train_loss": 3.6407675743103027, "lr": 0.00035242859662394616, "tps": 16509, "wall": 31725.8} {"step": 7992, "train_loss": 3.585167407989502, "lr": 0.0003524156203163435, "tps": 16507, "wall": 31733.5} {"step": 7993, "train_loss": 3.5179991722106934, "lr": 0.0003524026425087295, "tps": 16505, "wall": 31741.3} {"step": 7994, "train_loss": 3.5924015045166016, "lr": 0.0003523896632012512, "tps": 16503, "wall": 31749.0} {"step": 7995, "train_loss": 3.639881134033203, "lr": 0.0003523766823940556, "tps": 16501, "wall": 31756.8} {"step": 7996, "train_loss": 3.5730597972869873, "lr": 0.0003523637000872898, "tps": 16499, "wall": 31764.6} {"step": 7997, "train_loss": 3.5777747631073, "lr": 0.00035235071628110086, "tps": 16497, "wall": 31772.3} {"step": 7998, "train_loss": 3.6615068912506104, "lr": 0.00035233773097563585, "tps": 16495, "wall": 31780.1} {"step": 7999, "train_loss": 3.619729995727539, "lr": 0.00035232474417104184, "tps": 16493, "wall": 31788.0} {"step": 8000, "train_loss": 3.5504002571105957, "lr": 0.00035231175586746596, "tps": 16491, "wall": 31795.7, "val_loss_monitor": 3.6223373518019395} {"step": 8001, "train_loss": 3.5418004989624023, "lr": 0.0003522987660650554, "tps": 16464, "wall": 31852.2} {"step": 8002, "train_loss": 3.854471445083618, "lr": 0.0003522857747639572, "tps": 16462, "wall": 31860.0} {"step": 8003, "train_loss": 3.468259811401367, "lr": 0.0003522727819643186, "tps": 16460, "wall": 31868.1} {"step": 8004, "train_loss": 3.6454248428344727, "lr": 0.0003522597876662868, "tps": 16457, "wall": 31876.1} {"step": 8005, "train_loss": 3.5889768600463867, "lr": 0.000352246791870009, "tps": 16455, "wall": 31884.2} {"step": 8006, "train_loss": 3.579149007797241, "lr": 0.0003522337945756323, "tps": 16453, "wall": 31892.3} {"step": 8007, "train_loss": 3.550433397293091, "lr": 0.0003522207957833041, "tps": 16451, "wall": 31900.2} {"step": 8008, "train_loss": 3.6073713302612305, "lr": 0.0003522077954931715, "tps": 16449, "wall": 31908.3} {"step": 8009, "train_loss": 3.692185878753662, "lr": 0.0003521947937053819, "tps": 16447, "wall": 31916.1} {"step": 8010, "train_loss": 3.6197292804718018, "lr": 0.0003521817904200825, "tps": 16445, "wall": 31924.1} {"step": 8011, "train_loss": 3.604243516921997, "lr": 0.00035216878563742066, "tps": 16443, "wall": 31931.8} {"step": 8012, "train_loss": 3.731710433959961, "lr": 0.0003521557793575436, "tps": 16441, "wall": 31940.0} {"step": 8013, "train_loss": 3.554744243621826, "lr": 0.0003521427715805988, "tps": 16439, "wall": 31948.1} {"step": 8014, "train_loss": 3.5811638832092285, "lr": 0.0003521297623067335, "tps": 16437, "wall": 31956.0} {"step": 8015, "train_loss": 3.578256130218506, "lr": 0.00035211675153609505, "tps": 16435, "wall": 31964.0} {"step": 8016, "train_loss": 3.6278443336486816, "lr": 0.0003521037392688309, "tps": 16433, "wall": 31972.0} {"step": 8017, "train_loss": 3.586338758468628, "lr": 0.0003520907255050885, "tps": 16431, "wall": 31979.9} {"step": 8018, "train_loss": 3.6315555572509766, "lr": 0.0003520777102450152, "tps": 16429, "wall": 31987.8} {"step": 8019, "train_loss": 3.6810142993927, "lr": 0.00035206469348875847, "tps": 16427, "wall": 31995.6} {"step": 8020, "train_loss": 3.60850191116333, "lr": 0.00035205167523646573, "tps": 16425, "wall": 32003.6} {"step": 8021, "train_loss": 3.5305070877075195, "lr": 0.0003520386554882845, "tps": 16423, "wall": 32011.5} {"step": 8022, "train_loss": 3.58127498626709, "lr": 0.00035202563424436217, "tps": 16421, "wall": 32019.3} {"step": 8023, "train_loss": 3.564070224761963, "lr": 0.00035201261150484634, "tps": 16419, "wall": 32027.2} {"step": 8024, "train_loss": 3.4738917350769043, "lr": 0.0003519995872698846, "tps": 16417, "wall": 32035.1} {"step": 8025, "train_loss": 3.63338041305542, "lr": 0.00035198656153962425, "tps": 16415, "wall": 32042.8} {"step": 8026, "train_loss": 3.6450369358062744, "lr": 0.00035197353431421305, "tps": 16413, "wall": 32050.6} {"step": 8027, "train_loss": 3.5603766441345215, "lr": 0.0003519605055937985, "tps": 16411, "wall": 32058.4} {"step": 8028, "train_loss": 3.665454864501953, "lr": 0.00035194747537852823, "tps": 16409, "wall": 32066.3} {"step": 8029, "train_loss": 3.664257049560547, "lr": 0.0003519344436685498, "tps": 16407, "wall": 32074.2} {"step": 8030, "train_loss": 3.6713294982910156, "lr": 0.0003519214104640109, "tps": 16405, "wall": 32081.9} {"step": 8031, "train_loss": 3.60137939453125, "lr": 0.00035190837576505905, "tps": 16403, "wall": 32089.8} {"step": 8032, "train_loss": 3.624018430709839, "lr": 0.00035189533957184207, "tps": 16401, "wall": 32097.6} {"step": 8033, "train_loss": 3.4773006439208984, "lr": 0.0003518823018845075, "tps": 16399, "wall": 32105.5} {"step": 8034, "train_loss": 3.651245594024658, "lr": 0.00035186926270320304, "tps": 16397, "wall": 32113.3} {"step": 8035, "train_loss": 3.689990520477295, "lr": 0.0003518562220280765, "tps": 16395, "wall": 32121.1} {"step": 8036, "train_loss": 3.6017818450927734, "lr": 0.00035184317985927554, "tps": 16393, "wall": 32129.0} {"step": 8037, "train_loss": 3.5926718711853027, "lr": 0.00035183013619694784, "tps": 16391, "wall": 32136.7} {"step": 8038, "train_loss": 3.568113327026367, "lr": 0.00035181709104124126, "tps": 16389, "wall": 32144.5} {"step": 8039, "train_loss": 3.587888717651367, "lr": 0.00035180404439230363, "tps": 16387, "wall": 32152.4} {"step": 8040, "train_loss": 3.5851621627807617, "lr": 0.0003517909962502825, "tps": 16385, "wall": 32160.1} {"step": 8041, "train_loss": 3.5598320960998535, "lr": 0.00035177794661532595, "tps": 16384, "wall": 32167.9} {"step": 8042, "train_loss": 3.609473466873169, "lr": 0.0003517648954875816, "tps": 16382, "wall": 32175.8} {"step": 8043, "train_loss": 3.564270257949829, "lr": 0.0003517518428671975, "tps": 16380, "wall": 32183.5} {"step": 8044, "train_loss": 3.5389204025268555, "lr": 0.0003517387887543213, "tps": 16378, "wall": 32191.3} {"step": 8045, "train_loss": 3.6191060543060303, "lr": 0.000351725733149101, "tps": 16376, "wall": 32199.0} {"step": 8046, "train_loss": 3.6066582202911377, "lr": 0.00035171267605168453, "tps": 16374, "wall": 32207.0} {"step": 8047, "train_loss": 3.637462854385376, "lr": 0.00035169961746221967, "tps": 16372, "wall": 32214.7} {"step": 8048, "train_loss": 3.6539852619171143, "lr": 0.00035168655738085445, "tps": 16370, "wall": 32222.5} {"step": 8049, "train_loss": 3.723524570465088, "lr": 0.00035167349580773676, "tps": 16368, "wall": 32230.3} {"step": 8050, "train_loss": 3.5478575229644775, "lr": 0.0003516604327430146, "tps": 16366, "wall": 32237.9} {"step": 8051, "train_loss": 3.5067954063415527, "lr": 0.0003516473681868359, "tps": 16364, "wall": 32245.8} {"step": 8052, "train_loss": 3.593069553375244, "lr": 0.0003516343021393488, "tps": 16362, "wall": 32253.5} {"step": 8053, "train_loss": 3.56974720954895, "lr": 0.00035162123460070105, "tps": 16361, "wall": 32261.3} {"step": 8054, "train_loss": 3.5643577575683594, "lr": 0.0003516081655710409, "tps": 16359, "wall": 32269.2} {"step": 8055, "train_loss": 3.59725284576416, "lr": 0.00035159509505051635, "tps": 16357, "wall": 32276.9} {"step": 8056, "train_loss": 3.610797882080078, "lr": 0.0003515820230392755, "tps": 16355, "wall": 32284.7} {"step": 8057, "train_loss": 3.60300874710083, "lr": 0.00035156894953746625, "tps": 16353, "wall": 32292.4} {"step": 8058, "train_loss": 3.6303038597106934, "lr": 0.00035155587454523693, "tps": 16351, "wall": 32300.1} {"step": 8059, "train_loss": 3.580850124359131, "lr": 0.0003515427980627355, "tps": 16349, "wall": 32307.9} {"step": 8060, "train_loss": 3.5107598304748535, "lr": 0.0003515297200901101, "tps": 16347, "wall": 32315.7} {"step": 8061, "train_loss": 3.692861318588257, "lr": 0.00035151664062750895, "tps": 16345, "wall": 32323.4} {"step": 8062, "train_loss": 3.575997829437256, "lr": 0.0003515035596750802, "tps": 16343, "wall": 32331.3} {"step": 8063, "train_loss": 3.495558738708496, "lr": 0.000351490477232972, "tps": 16341, "wall": 32339.1} {"step": 8064, "train_loss": 3.597966194152832, "lr": 0.0003514773933013326, "tps": 16340, "wall": 32346.8} {"step": 8065, "train_loss": 3.650113821029663, "lr": 0.00035146430788031007, "tps": 16338, "wall": 32354.6} {"step": 8066, "train_loss": 3.476868152618408, "lr": 0.0003514512209700529, "tps": 16336, "wall": 32362.3} {"step": 8067, "train_loss": 3.6731510162353516, "lr": 0.000351438132570709, "tps": 16334, "wall": 32370.2} {"step": 8068, "train_loss": 3.548478603363037, "lr": 0.0003514250426824269, "tps": 16332, "wall": 32377.9} {"step": 8069, "train_loss": 3.6291098594665527, "lr": 0.00035141195130535484, "tps": 16330, "wall": 32385.9} {"step": 8070, "train_loss": 3.61102032661438, "lr": 0.0003513988584396411, "tps": 16328, "wall": 32393.7} {"step": 8071, "train_loss": 3.5510506629943848, "lr": 0.000351385764085434, "tps": 16326, "wall": 32401.5} {"step": 8072, "train_loss": 3.4738569259643555, "lr": 0.00035137266824288173, "tps": 16324, "wall": 32409.3} {"step": 8073, "train_loss": 3.711179733276367, "lr": 0.00035135957091213287, "tps": 16322, "wall": 32417.0} {"step": 8074, "train_loss": 3.476482629776001, "lr": 0.00035134647209333566, "tps": 16320, "wall": 32424.9} {"step": 8075, "train_loss": 3.6371076107025146, "lr": 0.00035133337178663854, "tps": 16318, "wall": 32432.7} {"step": 8076, "train_loss": 3.573028326034546, "lr": 0.0003513202699921898, "tps": 16317, "wall": 32440.4} {"step": 8077, "train_loss": 3.6069529056549072, "lr": 0.000351307166710138, "tps": 16315, "wall": 32448.3} {"step": 8078, "train_loss": 3.601318836212158, "lr": 0.0003512940619406315, "tps": 16313, "wall": 32456.0} {"step": 8079, "train_loss": 3.6159400939941406, "lr": 0.0003512809556838188, "tps": 16311, "wall": 32463.7} {"step": 8080, "train_loss": 3.565316677093506, "lr": 0.00035126784793984827, "tps": 16309, "wall": 32471.5} {"step": 8081, "train_loss": 3.569880723953247, "lr": 0.0003512547387088685, "tps": 16307, "wall": 32479.2} {"step": 8082, "train_loss": 3.632228374481201, "lr": 0.0003512416279910279, "tps": 16305, "wall": 32487.1} {"step": 8083, "train_loss": 3.59740948677063, "lr": 0.0003512285157864751, "tps": 16303, "wall": 32494.7} {"step": 8084, "train_loss": 3.644965648651123, "lr": 0.0003512154020953586, "tps": 16302, "wall": 32502.5} {"step": 8085, "train_loss": 3.543793201446533, "lr": 0.0003512022869178268, "tps": 16300, "wall": 32510.4} {"step": 8086, "train_loss": 3.50710391998291, "lr": 0.00035118917025402845, "tps": 16298, "wall": 32518.2} {"step": 8087, "train_loss": 3.5518035888671875, "lr": 0.0003511760521041121, "tps": 16296, "wall": 32526.0} {"step": 8088, "train_loss": 3.5218350887298584, "lr": 0.0003511629324682263, "tps": 16294, "wall": 32533.8} {"step": 8089, "train_loss": 3.571539878845215, "lr": 0.0003511498113465198, "tps": 16292, "wall": 32541.7} {"step": 8090, "train_loss": 3.5944783687591553, "lr": 0.00035113668873914107, "tps": 16290, "wall": 32549.5} {"step": 8091, "train_loss": 3.5577478408813477, "lr": 0.00035112356464623884, "tps": 16288, "wall": 32557.2} {"step": 8092, "train_loss": 3.3980870246887207, "lr": 0.00035111043906796175, "tps": 16286, "wall": 32565.1} {"step": 8093, "train_loss": 3.580389976501465, "lr": 0.00035109731200445854, "tps": 16284, "wall": 32572.9} {"step": 8094, "train_loss": 3.559453010559082, "lr": 0.0003510841834558779, "tps": 16283, "wall": 32580.7} {"step": 8095, "train_loss": 3.539475440979004, "lr": 0.0003510710534223685, "tps": 16281, "wall": 32588.4} {"step": 8096, "train_loss": 3.605029821395874, "lr": 0.00035105792190407917, "tps": 16279, "wall": 32596.2} {"step": 8097, "train_loss": 3.443507432937622, "lr": 0.00035104478890115866, "tps": 16277, "wall": 32604.1} {"step": 8098, "train_loss": 3.6622743606567383, "lr": 0.0003510316544137556, "tps": 16275, "wall": 32611.9} {"step": 8099, "train_loss": 3.5686893463134766, "lr": 0.00035101851844201884, "tps": 16273, "wall": 32619.6} {"step": 8100, "train_loss": 3.555734157562256, "lr": 0.00035100538098609726, "tps": 16271, "wall": 32627.5} {"step": 8101, "train_loss": 3.565079689025879, "lr": 0.00035099224204613964, "tps": 16269, "wall": 32635.1} {"step": 8102, "train_loss": 3.694735288619995, "lr": 0.00035097910162229485, "tps": 16268, "wall": 32642.9} {"step": 8103, "train_loss": 3.542454719543457, "lr": 0.00035096595971471163, "tps": 16266, "wall": 32650.7} {"step": 8104, "train_loss": 3.618626117706299, "lr": 0.000350952816323539, "tps": 16264, "wall": 32658.5} {"step": 8105, "train_loss": 3.5594775676727295, "lr": 0.0003509396714489258, "tps": 16262, "wall": 32666.3} {"step": 8106, "train_loss": 3.5743236541748047, "lr": 0.00035092652509102084, "tps": 16260, "wall": 32674.0} {"step": 8107, "train_loss": 3.5714597702026367, "lr": 0.00035091337724997324, "tps": 16258, "wall": 32681.7} {"step": 8108, "train_loss": 3.714246988296509, "lr": 0.0003509002279259317, "tps": 16256, "wall": 32689.6} {"step": 8109, "train_loss": 3.546025276184082, "lr": 0.00035088707711904534, "tps": 16255, "wall": 32697.4} {"step": 8110, "train_loss": 3.680388927459717, "lr": 0.0003508739248294631, "tps": 16253, "wall": 32705.2} {"step": 8111, "train_loss": 3.5929408073425293, "lr": 0.00035086077105733396, "tps": 16251, "wall": 32713.0} {"step": 8112, "train_loss": 3.6099722385406494, "lr": 0.0003508476158028069, "tps": 16249, "wall": 32720.8} {"step": 8113, "train_loss": 3.6313977241516113, "lr": 0.00035083445906603097, "tps": 16247, "wall": 32728.6} {"step": 8114, "train_loss": 3.5241973400115967, "lr": 0.0003508213008471552, "tps": 16245, "wall": 32736.3} {"step": 8115, "train_loss": 3.5983855724334717, "lr": 0.0003508081411463287, "tps": 16243, "wall": 32744.3} {"step": 8116, "train_loss": 3.573423147201538, "lr": 0.0003507949799637005, "tps": 16241, "wall": 32751.9} {"step": 8117, "train_loss": 3.6901443004608154, "lr": 0.00035078181729941964, "tps": 16240, "wall": 32759.7} {"step": 8118, "train_loss": 3.6025571823120117, "lr": 0.0003507686531536353, "tps": 16238, "wall": 32767.5} {"step": 8119, "train_loss": 3.484976291656494, "lr": 0.0003507554875264966, "tps": 16236, "wall": 32775.4} {"step": 8120, "train_loss": 3.496710777282715, "lr": 0.00035074232041815265, "tps": 16234, "wall": 32783.1} {"step": 8121, "train_loss": 3.6451668739318848, "lr": 0.0003507291518287526, "tps": 16232, "wall": 32791.0} {"step": 8122, "train_loss": 3.6115851402282715, "lr": 0.0003507159817584457, "tps": 16230, "wall": 32798.7} {"step": 8123, "train_loss": 3.5636072158813477, "lr": 0.00035070281020738105, "tps": 16228, "wall": 32806.6} {"step": 8124, "train_loss": 3.620068073272705, "lr": 0.00035068963717570787, "tps": 16227, "wall": 32814.3} {"step": 8125, "train_loss": 3.590158224105835, "lr": 0.0003506764626635755, "tps": 16225, "wall": 32822.1} {"step": 8126, "train_loss": 3.592212200164795, "lr": 0.00035066328667113304, "tps": 16223, "wall": 32829.9} {"step": 8127, "train_loss": 3.6043221950531006, "lr": 0.00035065010919852976, "tps": 16221, "wall": 32837.7} {"step": 8128, "train_loss": 3.5678670406341553, "lr": 0.00035063693024591506, "tps": 16219, "wall": 32845.4} {"step": 8129, "train_loss": 3.7376437187194824, "lr": 0.00035062374981343806, "tps": 16217, "wall": 32853.2} {"step": 8130, "train_loss": 3.649233341217041, "lr": 0.0003506105679012482, "tps": 16216, "wall": 32860.9} {"step": 8131, "train_loss": 3.6606602668762207, "lr": 0.00035059738450949474, "tps": 16214, "wall": 32868.8} {"step": 8132, "train_loss": 3.526435613632202, "lr": 0.0003505841996383271, "tps": 16212, "wall": 32876.6} {"step": 8133, "train_loss": 3.6208832263946533, "lr": 0.0003505710132878945, "tps": 16210, "wall": 32884.3} {"step": 8134, "train_loss": 3.6151137351989746, "lr": 0.00035055782545834646, "tps": 16208, "wall": 32892.1} {"step": 8135, "train_loss": 3.5983729362487793, "lr": 0.00035054463614983224, "tps": 16206, "wall": 32899.8} {"step": 8136, "train_loss": 3.685225009918213, "lr": 0.00035053144536250144, "tps": 16204, "wall": 32907.6} {"step": 8137, "train_loss": 3.5632553100585938, "lr": 0.00035051825309650325, "tps": 16203, "wall": 32915.4} {"step": 8138, "train_loss": 3.6211910247802734, "lr": 0.0003505050593519873, "tps": 16201, "wall": 32923.0} {"step": 8139, "train_loss": 3.6371686458587646, "lr": 0.0003504918641291029, "tps": 16199, "wall": 32930.9} {"step": 8140, "train_loss": 3.5966360569000244, "lr": 0.0003504786674279997, "tps": 16197, "wall": 32938.7} {"step": 8141, "train_loss": 3.653125762939453, "lr": 0.000350465469248827, "tps": 16195, "wall": 32946.5} {"step": 8142, "train_loss": 3.6565632820129395, "lr": 0.0003504522695917345, "tps": 16193, "wall": 32954.3} {"step": 8143, "train_loss": 3.5878729820251465, "lr": 0.00035043906845687154, "tps": 16192, "wall": 32962.1} {"step": 8144, "train_loss": 3.6099307537078857, "lr": 0.0003504258658443878, "tps": 16190, "wall": 32969.9} {"step": 8145, "train_loss": 3.6401827335357666, "lr": 0.00035041266175443275, "tps": 16188, "wall": 32977.6} {"step": 8146, "train_loss": 3.5129616260528564, "lr": 0.00035039945618715613, "tps": 16186, "wall": 32985.5} {"step": 8147, "train_loss": 3.537614583969116, "lr": 0.0003503862491427074, "tps": 16184, "wall": 32993.2} {"step": 8148, "train_loss": 3.68481707572937, "lr": 0.00035037304062123604, "tps": 16182, "wall": 33001.0} {"step": 8149, "train_loss": 3.547431468963623, "lr": 0.000350359830622892, "tps": 16181, "wall": 33008.8} {"step": 8150, "train_loss": 3.6503405570983887, "lr": 0.0003503466191478246, "tps": 16179, "wall": 33016.6} {"step": 8151, "train_loss": 3.575359344482422, "lr": 0.0003503334061961837, "tps": 16177, "wall": 33024.4} {"step": 8152, "train_loss": 3.569479465484619, "lr": 0.00035032019176811896, "tps": 16175, "wall": 33032.1} {"step": 8153, "train_loss": 3.462465524673462, "lr": 0.00035030697586377996, "tps": 16173, "wall": 33039.9} {"step": 8154, "train_loss": 3.6017675399780273, "lr": 0.0003502937584833166, "tps": 16171, "wall": 33047.9} {"step": 8155, "train_loss": 3.6463027000427246, "lr": 0.0003502805396268784, "tps": 16170, "wall": 33055.6} {"step": 8156, "train_loss": 3.5662171840667725, "lr": 0.0003502673192946153, "tps": 16168, "wall": 33063.5} {"step": 8157, "train_loss": 3.5030369758605957, "lr": 0.0003502540974866768, "tps": 16166, "wall": 33071.2} {"step": 8158, "train_loss": 3.6334524154663086, "lr": 0.00035024087420321295, "tps": 16164, "wall": 33079.0} {"step": 8159, "train_loss": 3.675463914871216, "lr": 0.0003502276494443734, "tps": 16162, "wall": 33086.9} {"step": 8160, "train_loss": 3.639845132827759, "lr": 0.00035021442321030806, "tps": 16160, "wall": 33094.7} {"step": 8161, "train_loss": 3.5786380767822266, "lr": 0.0003502011955011666, "tps": 16159, "wall": 33102.3} {"step": 8162, "train_loss": 3.586276054382324, "lr": 0.00035018796631709894, "tps": 16157, "wall": 33110.3} {"step": 8163, "train_loss": 3.503045082092285, "lr": 0.00035017473565825504, "tps": 16155, "wall": 33118.1} {"step": 8164, "train_loss": 3.5938808917999268, "lr": 0.0003501615035247846, "tps": 16153, "wall": 33126.0} {"step": 8165, "train_loss": 3.6515469551086426, "lr": 0.00035014826991683774, "tps": 16151, "wall": 33133.7} {"step": 8166, "train_loss": 3.4975838661193848, "lr": 0.0003501350348345641, "tps": 16149, "wall": 33141.6} {"step": 8167, "train_loss": 3.5764758586883545, "lr": 0.0003501217982781138, "tps": 16148, "wall": 33149.4} {"step": 8168, "train_loss": 3.477829694747925, "lr": 0.00035010856024763676, "tps": 16146, "wall": 33157.4} {"step": 8169, "train_loss": 3.6003029346466064, "lr": 0.0003500953207432829, "tps": 16144, "wall": 33165.2} {"step": 8170, "train_loss": 3.550914764404297, "lr": 0.00035008207976520213, "tps": 16142, "wall": 33173.0} {"step": 8171, "train_loss": 3.5857348442077637, "lr": 0.0003500688373135446, "tps": 16140, "wall": 33180.8} {"step": 8172, "train_loss": 3.5091891288757324, "lr": 0.00035005559338846027, "tps": 16138, "wall": 33188.6} {"step": 8173, "train_loss": 3.6075215339660645, "lr": 0.00035004234799009904, "tps": 16137, "wall": 33196.4} {"step": 8174, "train_loss": 3.5650062561035156, "lr": 0.00035002910111861117, "tps": 16135, "wall": 33204.1} {"step": 8175, "train_loss": 3.5680148601531982, "lr": 0.00035001585277414656, "tps": 16133, "wall": 33211.9} {"step": 8176, "train_loss": 3.604229688644409, "lr": 0.00035000260295685526, "tps": 16131, "wall": 33219.7} {"step": 8177, "train_loss": 3.5535879135131836, "lr": 0.00034998935166688754, "tps": 16129, "wall": 33227.7} {"step": 8178, "train_loss": 3.5560600757598877, "lr": 0.00034997609890439335, "tps": 16127, "wall": 33235.5} {"step": 8179, "train_loss": 3.5734784603118896, "lr": 0.00034996284466952296, "tps": 16126, "wall": 33243.2} {"step": 8180, "train_loss": 3.5734505653381348, "lr": 0.00034994958896242636, "tps": 16124, "wall": 33251.0} {"step": 8181, "train_loss": 3.5559535026550293, "lr": 0.00034993633178325383, "tps": 16122, "wall": 33258.7} {"step": 8182, "train_loss": 3.643829345703125, "lr": 0.0003499230731321554, "tps": 16120, "wall": 33266.6} {"step": 8183, "train_loss": 3.511943817138672, "lr": 0.00034990981300928156, "tps": 16118, "wall": 33274.4} {"step": 8184, "train_loss": 3.5996482372283936, "lr": 0.00034989655141478226, "tps": 16117, "wall": 33282.2} {"step": 8185, "train_loss": 3.5529394149780273, "lr": 0.00034988328834880766, "tps": 16115, "wall": 33290.1} {"step": 8186, "train_loss": 3.598896026611328, "lr": 0.0003498700238115083, "tps": 16113, "wall": 33297.9} {"step": 8187, "train_loss": 3.61930513381958, "lr": 0.0003498567578030342, "tps": 16111, "wall": 33305.7} {"step": 8188, "train_loss": 3.624124050140381, "lr": 0.0003498434903235358, "tps": 16109, "wall": 33313.4} {"step": 8189, "train_loss": 3.5783441066741943, "lr": 0.0003498302213731632, "tps": 16108, "wall": 33321.2} {"step": 8190, "train_loss": 3.6126086711883545, "lr": 0.00034981695095206696, "tps": 16106, "wall": 33329.2} {"step": 8191, "train_loss": 3.511781930923462, "lr": 0.0003498036790603972, "tps": 16104, "wall": 33337.0} {"step": 8192, "train_loss": 3.5868988037109375, "lr": 0.0003497904056983043, "tps": 16102, "wall": 33344.9} {"step": 8193, "train_loss": 3.5724596977233887, "lr": 0.0003497771308659388, "tps": 16100, "wall": 33352.7} {"step": 8194, "train_loss": 3.6217613220214844, "lr": 0.0003497638545634509, "tps": 16098, "wall": 33360.5} {"step": 8195, "train_loss": 3.6569602489471436, "lr": 0.00034975057679099096, "tps": 16097, "wall": 33368.3} {"step": 8196, "train_loss": 3.588151693344116, "lr": 0.0003497372975487095, "tps": 16095, "wall": 33376.1} {"step": 8197, "train_loss": 3.6032299995422363, "lr": 0.00034972401683675697, "tps": 16093, "wall": 33383.9} {"step": 8198, "train_loss": 3.5798287391662598, "lr": 0.00034971073465528364, "tps": 16091, "wall": 33391.7} {"step": 8199, "train_loss": 3.6609995365142822, "lr": 0.00034969745100444017, "tps": 16089, "wall": 33399.5} {"step": 8200, "train_loss": 3.562927007675171, "lr": 0.00034968416588437694, "tps": 16088, "wall": 33407.4} {"step": 8201, "train_loss": 3.704680919647217, "lr": 0.0003496708792952445, "tps": 16086, "wall": 33415.3} {"step": 8202, "train_loss": 3.669508218765259, "lr": 0.0003496575912371933, "tps": 16084, "wall": 33422.9} {"step": 8203, "train_loss": 3.5538861751556396, "lr": 0.0003496443017103739, "tps": 16082, "wall": 33430.7} {"step": 8204, "train_loss": 3.602794647216797, "lr": 0.0003496310107149368, "tps": 16080, "wall": 33438.5} {"step": 8205, "train_loss": 3.5886316299438477, "lr": 0.0003496177182510326, "tps": 16079, "wall": 33446.4} {"step": 8206, "train_loss": 3.629434585571289, "lr": 0.0003496044243188119, "tps": 16077, "wall": 33454.1} {"step": 8207, "train_loss": 3.5880610942840576, "lr": 0.0003495911289184252, "tps": 16075, "wall": 33461.9} {"step": 8208, "train_loss": 3.5581226348876953, "lr": 0.0003495778320500233, "tps": 16073, "wall": 33469.8} {"step": 8209, "train_loss": 3.6426010131835938, "lr": 0.00034956453371375664, "tps": 16071, "wall": 33477.7} {"step": 8210, "train_loss": 3.629635810852051, "lr": 0.000349551233909776, "tps": 16070, "wall": 33485.5} {"step": 8211, "train_loss": 3.575601816177368, "lr": 0.0003495379326382319, "tps": 16068, "wall": 33493.2} {"step": 8212, "train_loss": 3.646289825439453, "lr": 0.0003495246298992751, "tps": 16066, "wall": 33500.9} {"step": 8213, "train_loss": 3.5581560134887695, "lr": 0.0003495113256930563, "tps": 16064, "wall": 33508.8} {"step": 8214, "train_loss": 3.5764591693878174, "lr": 0.0003494980200197262, "tps": 16063, "wall": 33516.6} {"step": 8215, "train_loss": 3.6043879985809326, "lr": 0.0003494847128794355, "tps": 16061, "wall": 33524.5} {"step": 8216, "train_loss": 3.5834267139434814, "lr": 0.000349471404272335, "tps": 16059, "wall": 33532.3} {"step": 8217, "train_loss": 3.6934947967529297, "lr": 0.0003494580941985754, "tps": 16057, "wall": 33540.1} {"step": 8218, "train_loss": 3.5885825157165527, "lr": 0.0003494447826583075, "tps": 16055, "wall": 33548.0} {"step": 8219, "train_loss": 3.59696102142334, "lr": 0.00034943146965168216, "tps": 16054, "wall": 33555.7} {"step": 8220, "train_loss": 3.5054140090942383, "lr": 0.00034941815517885007, "tps": 16052, "wall": 33563.6} {"step": 8221, "train_loss": 3.5667285919189453, "lr": 0.00034940483923996213, "tps": 16050, "wall": 33571.3} {"step": 8222, "train_loss": 3.6285839080810547, "lr": 0.0003493915218351692, "tps": 16048, "wall": 33579.1} {"step": 8223, "train_loss": 3.646397590637207, "lr": 0.00034937820296462207, "tps": 16046, "wall": 33587.0} {"step": 8224, "train_loss": 3.5145273208618164, "lr": 0.00034936488262847173, "tps": 16045, "wall": 33594.9} {"step": 8225, "train_loss": 3.5304527282714844, "lr": 0.0003493515608268689, "tps": 16043, "wall": 33602.6} {"step": 8226, "train_loss": 3.590933322906494, "lr": 0.0003493382375599646, "tps": 16041, "wall": 33610.5} {"step": 8227, "train_loss": 3.6406631469726562, "lr": 0.0003493249128279098, "tps": 16039, "wall": 33618.4} {"step": 8228, "train_loss": 3.608088970184326, "lr": 0.0003493115866308554, "tps": 16038, "wall": 33626.1} {"step": 8229, "train_loss": 3.578721284866333, "lr": 0.0003492982589689523, "tps": 16036, "wall": 33633.9} {"step": 8230, "train_loss": 3.4648919105529785, "lr": 0.0003492849298423516, "tps": 16034, "wall": 33641.6} {"step": 8231, "train_loss": 3.616678237915039, "lr": 0.0003492715992512041, "tps": 16032, "wall": 33649.5} {"step": 8232, "train_loss": 3.526916027069092, "lr": 0.0003492582671956611, "tps": 16030, "wall": 33657.3} {"step": 8233, "train_loss": 3.5745325088500977, "lr": 0.0003492449336758733, "tps": 16029, "wall": 33665.0} {"step": 8234, "train_loss": 3.562798023223877, "lr": 0.00034923159869199196, "tps": 16027, "wall": 33672.8} {"step": 8235, "train_loss": 3.5629539489746094, "lr": 0.00034921826224416805, "tps": 16025, "wall": 33680.6} {"step": 8236, "train_loss": 3.5315659046173096, "lr": 0.00034920492433255276, "tps": 16023, "wall": 33688.4} {"step": 8237, "train_loss": 3.606567144393921, "lr": 0.000349191584957297, "tps": 16022, "wall": 33696.1} {"step": 8238, "train_loss": 3.634117364883423, "lr": 0.000349178244118552, "tps": 16020, "wall": 33704.1} {"step": 8239, "train_loss": 3.5647196769714355, "lr": 0.0003491649018164689, "tps": 16018, "wall": 33711.8} {"step": 8240, "train_loss": 3.5878405570983887, "lr": 0.0003491515580511988, "tps": 16016, "wall": 33719.6} {"step": 8241, "train_loss": 3.656554698944092, "lr": 0.0003491382128228928, "tps": 16015, "wall": 33727.4} {"step": 8242, "train_loss": 3.5086936950683594, "lr": 0.00034912486613170225, "tps": 16013, "wall": 33735.2} {"step": 8243, "train_loss": 3.606149673461914, "lr": 0.00034911151797777817, "tps": 16011, "wall": 33743.0} {"step": 8244, "train_loss": 3.5775935649871826, "lr": 0.0003490981683612718, "tps": 16009, "wall": 33750.8} {"step": 8245, "train_loss": 3.6494407653808594, "lr": 0.0003490848172823344, "tps": 16008, "wall": 33758.6} {"step": 8246, "train_loss": 3.50083589553833, "lr": 0.0003490714647411172, "tps": 16006, "wall": 33766.6} {"step": 8247, "train_loss": 3.6264657974243164, "lr": 0.00034905811073777156, "tps": 16004, "wall": 33774.3} {"step": 8248, "train_loss": 3.5729024410247803, "lr": 0.0003490447552724486, "tps": 16002, "wall": 33782.1} {"step": 8249, "train_loss": 3.532681941986084, "lr": 0.0003490313983452996, "tps": 16000, "wall": 33790.0} {"step": 8250, "train_loss": 3.583287239074707, "lr": 0.00034901803995647605, "tps": 15999, "wall": 33797.8} {"step": 8251, "train_loss": 3.4949116706848145, "lr": 0.00034900468010612906, "tps": 15997, "wall": 33805.6} {"step": 8252, "train_loss": 3.628244161605835, "lr": 0.0003489913187944102, "tps": 15995, "wall": 33813.4} {"step": 8253, "train_loss": 3.594087839126587, "lr": 0.0003489779560214706, "tps": 15993, "wall": 33821.1} {"step": 8254, "train_loss": 3.617644786834717, "lr": 0.00034896459178746176, "tps": 15992, "wall": 33829.1} {"step": 8255, "train_loss": 3.5263023376464844, "lr": 0.000348951226092535, "tps": 15990, "wall": 33836.9} {"step": 8256, "train_loss": 3.6051149368286133, "lr": 0.00034893785893684186, "tps": 15988, "wall": 33844.7} {"step": 8257, "train_loss": 3.593555450439453, "lr": 0.0003489244903205337, "tps": 15986, "wall": 33852.5} {"step": 8258, "train_loss": 3.574789524078369, "lr": 0.0003489111202437618, "tps": 15985, "wall": 33860.3} {"step": 8259, "train_loss": 3.662198066711426, "lr": 0.0003488977487066779, "tps": 15983, "wall": 33868.1} {"step": 8260, "train_loss": 3.6531291007995605, "lr": 0.0003488843757094333, "tps": 15981, "wall": 33875.8} {"step": 8261, "train_loss": 3.5675461292266846, "lr": 0.00034887100125217946, "tps": 15979, "wall": 33883.7} {"step": 8262, "train_loss": 3.612211227416992, "lr": 0.000348857625335068, "tps": 15978, "wall": 33891.7} {"step": 8263, "train_loss": 3.5519468784332275, "lr": 0.00034884424795825035, "tps": 15976, "wall": 33899.4} {"step": 8264, "train_loss": 3.4670863151550293, "lr": 0.0003488308691218781, "tps": 15974, "wall": 33907.1} {"step": 8265, "train_loss": 3.4925918579101562, "lr": 0.0003488174888261028, "tps": 15972, "wall": 33915.0} {"step": 8266, "train_loss": 3.661851406097412, "lr": 0.00034880410707107605, "tps": 15971, "wall": 33922.8} {"step": 8267, "train_loss": 3.686044692993164, "lr": 0.00034879072385694934, "tps": 15969, "wall": 33930.7} {"step": 8268, "train_loss": 3.5016708374023438, "lr": 0.0003487773391838744, "tps": 15967, "wall": 33938.5} {"step": 8269, "train_loss": 3.562089443206787, "lr": 0.0003487639530520028, "tps": 15965, "wall": 33946.5} {"step": 8270, "train_loss": 3.4786903858184814, "lr": 0.0003487505654614861, "tps": 15964, "wall": 33954.2} {"step": 8271, "train_loss": 3.583904266357422, "lr": 0.0003487371764124761, "tps": 15962, "wall": 33962.0} {"step": 8272, "train_loss": 3.6109914779663086, "lr": 0.0003487237859051244, "tps": 15960, "wall": 33969.9} {"step": 8273, "train_loss": 3.5967366695404053, "lr": 0.00034871039393958263, "tps": 15958, "wall": 33977.8} {"step": 8274, "train_loss": 3.556522846221924, "lr": 0.0003486970005160027, "tps": 15957, "wall": 33985.5} {"step": 8275, "train_loss": 3.606574058532715, "lr": 0.000348683605634536, "tps": 15955, "wall": 33993.4} {"step": 8276, "train_loss": 3.5476789474487305, "lr": 0.0003486702092953345, "tps": 15953, "wall": 34001.1} {"step": 8277, "train_loss": 3.6252050399780273, "lr": 0.00034865681149855, "tps": 15951, "wall": 34009.0} {"step": 8278, "train_loss": 3.6455254554748535, "lr": 0.0003486434122443341, "tps": 15950, "wall": 34016.8} {"step": 8279, "train_loss": 3.5552127361297607, "lr": 0.0003486300115328387, "tps": 15948, "wall": 34024.7} {"step": 8280, "train_loss": 3.5917513370513916, "lr": 0.00034861660936421555, "tps": 15946, "wall": 34032.4} {"step": 8281, "train_loss": 3.5995190143585205, "lr": 0.0003486032057386165, "tps": 15944, "wall": 34040.2} {"step": 8282, "train_loss": 3.5988283157348633, "lr": 0.0003485898006561933, "tps": 15943, "wall": 34048.0} {"step": 8283, "train_loss": 3.6130831241607666, "lr": 0.00034857639411709797, "tps": 15941, "wall": 34055.8} {"step": 8284, "train_loss": 3.4739203453063965, "lr": 0.0003485629861214823, "tps": 15939, "wall": 34063.7} {"step": 8285, "train_loss": 3.5192856788635254, "lr": 0.0003485495766694982, "tps": 15937, "wall": 34071.5} {"step": 8286, "train_loss": 3.599179744720459, "lr": 0.00034853616576129747, "tps": 15936, "wall": 34079.4} {"step": 8287, "train_loss": 3.7065234184265137, "lr": 0.00034852275339703213, "tps": 15934, "wall": 34087.2} {"step": 8288, "train_loss": 3.557276725769043, "lr": 0.00034850933957685404, "tps": 15932, "wall": 34094.9} {"step": 8289, "train_loss": 3.5819525718688965, "lr": 0.00034849592430091526, "tps": 15931, "wall": 34102.7} {"step": 8290, "train_loss": 3.5514776706695557, "lr": 0.00034848250756936767, "tps": 15929, "wall": 34110.7} {"step": 8291, "train_loss": 3.641719341278076, "lr": 0.0003484690893823633, "tps": 15927, "wall": 34118.4} {"step": 8292, "train_loss": 3.628520965576172, "lr": 0.00034845566974005406, "tps": 15925, "wall": 34126.3} {"step": 8293, "train_loss": 3.5058255195617676, "lr": 0.00034844224864259216, "tps": 15924, "wall": 34134.0} {"step": 8294, "train_loss": 3.5740318298339844, "lr": 0.0003484288260901294, "tps": 15922, "wall": 34141.9} {"step": 8295, "train_loss": 3.643455982208252, "lr": 0.000348415402082818, "tps": 15920, "wall": 34149.7} {"step": 8296, "train_loss": 3.678920030593872, "lr": 0.0003484019766208101, "tps": 15918, "wall": 34157.5} {"step": 8297, "train_loss": 3.577718734741211, "lr": 0.0003483885497042575, "tps": 15917, "wall": 34165.4} {"step": 8298, "train_loss": 3.572697162628174, "lr": 0.00034837512133331254, "tps": 15915, "wall": 34173.1} {"step": 8299, "train_loss": 3.5909547805786133, "lr": 0.0003483616915081272, "tps": 15913, "wall": 34180.9} {"step": 8300, "train_loss": 3.5681967735290527, "lr": 0.0003483482602288537, "tps": 15912, "wall": 34188.8} {"step": 8301, "train_loss": 3.6401309967041016, "lr": 0.0003483348274956443, "tps": 15910, "wall": 34196.5} {"step": 8302, "train_loss": 3.656952142715454, "lr": 0.0003483213933086508, "tps": 15908, "wall": 34204.3} {"step": 8303, "train_loss": 3.6697921752929688, "lr": 0.00034830795766802573, "tps": 15907, "wall": 34212.0} {"step": 8304, "train_loss": 3.5438451766967773, "lr": 0.0003482945205739212, "tps": 15905, "wall": 34219.8} {"step": 8305, "train_loss": 3.5397210121154785, "lr": 0.0003482810820264893, "tps": 15903, "wall": 34227.6} {"step": 8306, "train_loss": 3.6717708110809326, "lr": 0.00034826764202588247, "tps": 15901, "wall": 34235.5} {"step": 8307, "train_loss": 3.5689034461975098, "lr": 0.0003482542005722528, "tps": 15900, "wall": 34243.5} {"step": 8308, "train_loss": 3.6206369400024414, "lr": 0.0003482407576657526, "tps": 15898, "wall": 34251.4} {"step": 8309, "train_loss": 3.6334176063537598, "lr": 0.0003482273133065342, "tps": 15896, "wall": 34259.1} {"step": 8310, "train_loss": 3.533109664916992, "lr": 0.00034821386749474986, "tps": 15894, "wall": 34267.0} {"step": 8311, "train_loss": 3.6264758110046387, "lr": 0.0003482004202305518, "tps": 15893, "wall": 34274.8} {"step": 8312, "train_loss": 3.587343692779541, "lr": 0.00034818697151409254, "tps": 15891, "wall": 34282.6} {"step": 8313, "train_loss": 3.6054861545562744, "lr": 0.00034817352134552433, "tps": 15889, "wall": 34290.4} {"step": 8314, "train_loss": 3.6374073028564453, "lr": 0.0003481600697249995, "tps": 15888, "wall": 34298.3} {"step": 8315, "train_loss": 3.606557607650757, "lr": 0.00034814661665267047, "tps": 15886, "wall": 34306.3} {"step": 8316, "train_loss": 3.538022756576538, "lr": 0.0003481331621286897, "tps": 15884, "wall": 34314.1} {"step": 8317, "train_loss": 3.668768882751465, "lr": 0.00034811970615320945, "tps": 15882, "wall": 34321.9} {"step": 8318, "train_loss": 3.6315369606018066, "lr": 0.00034810624872638225, "tps": 15881, "wall": 34329.7} {"step": 8319, "train_loss": 3.542175769805908, "lr": 0.0003480927898483606, "tps": 15879, "wall": 34337.4} {"step": 8320, "train_loss": 3.585186719894409, "lr": 0.00034807932951929683, "tps": 15877, "wall": 34345.2} {"step": 8321, "train_loss": 3.6392858028411865, "lr": 0.0003480658677393435, "tps": 15876, "wall": 34352.9} {"step": 8322, "train_loss": 3.628756523132324, "lr": 0.0003480524045086531, "tps": 15874, "wall": 34360.7} {"step": 8323, "train_loss": 3.654995918273926, "lr": 0.00034803893982737814, "tps": 15872, "wall": 34368.7} {"step": 8324, "train_loss": 3.6052870750427246, "lr": 0.00034802547369567114, "tps": 15870, "wall": 34376.5} {"step": 8325, "train_loss": 3.565246105194092, "lr": 0.0003480120061136846, "tps": 15869, "wall": 34384.3} {"step": 8326, "train_loss": 3.4941396713256836, "lr": 0.0003479985370815712, "tps": 15867, "wall": 34392.1} {"step": 8327, "train_loss": 3.6261205673217773, "lr": 0.0003479850665994834, "tps": 15865, "wall": 34399.9} {"step": 8328, "train_loss": 3.6143784523010254, "lr": 0.00034797159466757384, "tps": 15864, "wall": 34407.7} {"step": 8329, "train_loss": 3.577359199523926, "lr": 0.0003479581212859952, "tps": 15862, "wall": 34415.5} {"step": 8330, "train_loss": 3.489264488220215, "lr": 0.0003479446464549, "tps": 15860, "wall": 34423.3} {"step": 8331, "train_loss": 3.5643301010131836, "lr": 0.0003479311701744409, "tps": 15859, "wall": 34431.1} {"step": 8332, "train_loss": 3.6377627849578857, "lr": 0.00034791769244477057, "tps": 15857, "wall": 34438.9} {"step": 8333, "train_loss": 3.5761144161224365, "lr": 0.00034790421326604177, "tps": 15855, "wall": 34446.7} {"step": 8334, "train_loss": 3.643887758255005, "lr": 0.00034789073263840703, "tps": 15854, "wall": 34454.4} {"step": 8335, "train_loss": 3.707200765609741, "lr": 0.0003478772505620192, "tps": 15852, "wall": 34462.2} {"step": 8336, "train_loss": 3.647630214691162, "lr": 0.00034786376703703096, "tps": 15850, "wall": 34470.0} {"step": 8337, "train_loss": 3.511082172393799, "lr": 0.00034785028206359505, "tps": 15849, "wall": 34477.8} {"step": 8338, "train_loss": 3.574110507965088, "lr": 0.0003478367956418642, "tps": 15847, "wall": 34485.7} {"step": 8339, "train_loss": 3.6080970764160156, "lr": 0.0003478233077719913, "tps": 15845, "wall": 34493.5} {"step": 8340, "train_loss": 3.5522267818450928, "lr": 0.000347809818454129, "tps": 15843, "wall": 34501.4} {"step": 8341, "train_loss": 3.5108377933502197, "lr": 0.00034779632768843014, "tps": 15842, "wall": 34509.1} {"step": 8342, "train_loss": 3.560293197631836, "lr": 0.0003477828354750476, "tps": 15840, "wall": 34517.0} {"step": 8343, "train_loss": 3.544588088989258, "lr": 0.0003477693418141342, "tps": 15838, "wall": 34524.9} {"step": 8344, "train_loss": 3.500363826751709, "lr": 0.0003477558467058427, "tps": 15837, "wall": 34532.6} {"step": 8345, "train_loss": 3.5939760208129883, "lr": 0.0003477423501503261, "tps": 15835, "wall": 34540.4} {"step": 8346, "train_loss": 3.5756473541259766, "lr": 0.00034772885214773725, "tps": 15833, "wall": 34548.4} {"step": 8347, "train_loss": 3.527984380722046, "lr": 0.00034771535269822914, "tps": 15832, "wall": 34556.1} {"step": 8348, "train_loss": 3.447047710418701, "lr": 0.0003477018518019545, "tps": 15830, "wall": 34563.8} {"step": 8349, "train_loss": 3.4627628326416016, "lr": 0.0003476883494590664, "tps": 15828, "wall": 34571.7} {"step": 8350, "train_loss": 3.581244945526123, "lr": 0.00034767484566971776, "tps": 15827, "wall": 34579.5} {"step": 8351, "train_loss": 3.6078872680664062, "lr": 0.00034766134043406156, "tps": 15825, "wall": 34587.4} {"step": 8352, "train_loss": 3.575869083404541, "lr": 0.0003476478337522508, "tps": 15823, "wall": 34595.2} {"step": 8353, "train_loss": 3.501451015472412, "lr": 0.0003476343256244385, "tps": 15822, "wall": 34602.9} {"step": 8354, "train_loss": 3.629030227661133, "lr": 0.0003476208160507776, "tps": 15820, "wall": 34610.8} {"step": 8355, "train_loss": 3.6181516647338867, "lr": 0.00034760730503142123, "tps": 15818, "wall": 34618.6} {"step": 8356, "train_loss": 3.6273887157440186, "lr": 0.00034759379256652244, "tps": 15816, "wall": 34626.4} {"step": 8357, "train_loss": 3.493666172027588, "lr": 0.0003475802786562342, "tps": 15815, "wall": 34634.1} {"step": 8358, "train_loss": 3.543099880218506, "lr": 0.0003475667633007097, "tps": 15813, "wall": 34641.9} {"step": 8359, "train_loss": 3.5532655715942383, "lr": 0.00034755324650010197, "tps": 15811, "wall": 34649.7} {"step": 8360, "train_loss": 3.62322998046875, "lr": 0.00034753972825456414, "tps": 15810, "wall": 34657.5} {"step": 8361, "train_loss": 3.6733739376068115, "lr": 0.00034752620856424944, "tps": 15808, "wall": 34665.3} {"step": 8362, "train_loss": 3.640385627746582, "lr": 0.0003475126874293109, "tps": 15807, "wall": 34673.0} {"step": 8363, "train_loss": 3.5957436561584473, "lr": 0.00034749916484990177, "tps": 15805, "wall": 34680.8} {"step": 8364, "train_loss": 3.6599223613739014, "lr": 0.0003474856408261752, "tps": 15803, "wall": 34688.6} {"step": 8365, "train_loss": 3.5209527015686035, "lr": 0.0003474721153582844, "tps": 15802, "wall": 34696.4} {"step": 8366, "train_loss": 3.465437412261963, "lr": 0.00034745858844638253, "tps": 15800, "wall": 34704.1} {"step": 8367, "train_loss": 3.539323568344116, "lr": 0.0003474450600906229, "tps": 15798, "wall": 34712.0} {"step": 8368, "train_loss": 3.5525684356689453, "lr": 0.0003474315302911588, "tps": 15797, "wall": 34719.7} {"step": 8369, "train_loss": 3.599719285964966, "lr": 0.0003474179990481433, "tps": 15795, "wall": 34727.7} {"step": 8370, "train_loss": 3.5803537368774414, "lr": 0.00034740446636172994, "tps": 15793, "wall": 34735.4} {"step": 8371, "train_loss": 3.5833606719970703, "lr": 0.0003473909322320718, "tps": 15792, "wall": 34743.2} {"step": 8372, "train_loss": 3.569988489151001, "lr": 0.00034737739665932236, "tps": 15790, "wall": 34750.9} {"step": 8373, "train_loss": 3.6219303607940674, "lr": 0.00034736385964363487, "tps": 15788, "wall": 34758.7} {"step": 8374, "train_loss": 3.501743793487549, "lr": 0.0003473503211851627, "tps": 15787, "wall": 34766.4} {"step": 8375, "train_loss": 3.4661993980407715, "lr": 0.00034733678128405916, "tps": 15785, "wall": 34774.1} {"step": 8376, "train_loss": 3.5733063220977783, "lr": 0.00034732323994047766, "tps": 15783, "wall": 34781.9} {"step": 8377, "train_loss": 3.391929864883423, "lr": 0.0003473096971545716, "tps": 15782, "wall": 34789.8} {"step": 8378, "train_loss": 3.566739082336426, "lr": 0.00034729615292649447, "tps": 15780, "wall": 34797.6} {"step": 8379, "train_loss": 3.583346128463745, "lr": 0.0003472826072563996, "tps": 15778, "wall": 34805.3} {"step": 8380, "train_loss": 3.5038161277770996, "lr": 0.0003472690601444404, "tps": 15777, "wall": 34813.1} {"step": 8381, "train_loss": 3.6697399616241455, "lr": 0.00034725551159077054, "tps": 15775, "wall": 34821.0} {"step": 8382, "train_loss": 3.6693544387817383, "lr": 0.0003472419615955433, "tps": 15773, "wall": 34828.8} {"step": 8383, "train_loss": 3.5515780448913574, "lr": 0.00034722841015891225, "tps": 15772, "wall": 34836.6} {"step": 8384, "train_loss": 3.683872699737549, "lr": 0.0003472148572810308, "tps": 15770, "wall": 34844.5} {"step": 8385, "train_loss": 3.4752626419067383, "lr": 0.0003472013029620527, "tps": 15768, "wall": 34852.3} {"step": 8386, "train_loss": 3.526196241378784, "lr": 0.0003471877472021312, "tps": 15767, "wall": 34860.1} {"step": 8387, "train_loss": 3.5077919960021973, "lr": 0.0003471741900014201, "tps": 15765, "wall": 34867.8} {"step": 8388, "train_loss": 3.6542105674743652, "lr": 0.0003471606313600729, "tps": 15764, "wall": 34875.6} {"step": 8389, "train_loss": 3.5197434425354004, "lr": 0.0003471470712782432, "tps": 15762, "wall": 34883.5} {"step": 8390, "train_loss": 3.6759610176086426, "lr": 0.0003471335097560846, "tps": 15760, "wall": 34891.2} {"step": 8391, "train_loss": 3.5332119464874268, "lr": 0.0003471199467937507, "tps": 15759, "wall": 34898.9} {"step": 8392, "train_loss": 3.5976250171661377, "lr": 0.00034710638239139515, "tps": 15757, "wall": 34906.8} {"step": 8393, "train_loss": 3.4488136768341064, "lr": 0.0003470928165491716, "tps": 15755, "wall": 34914.6} {"step": 8394, "train_loss": 3.5471553802490234, "lr": 0.0003470792492672339, "tps": 15754, "wall": 34922.3} {"step": 8395, "train_loss": 3.653006076812744, "lr": 0.0003470656805457354, "tps": 15752, "wall": 34930.2} {"step": 8396, "train_loss": 3.52016544342041, "lr": 0.00034705211038483017, "tps": 15750, "wall": 34938.0} {"step": 8397, "train_loss": 3.5507254600524902, "lr": 0.00034703853878467164, "tps": 15749, "wall": 34945.8} {"step": 8398, "train_loss": 3.649576187133789, "lr": 0.0003470249657454137, "tps": 15747, "wall": 34953.6} {"step": 8399, "train_loss": 3.597043037414551, "lr": 0.00034701139126721013, "tps": 15746, "wall": 34961.3} {"step": 8400, "train_loss": 3.5589218139648438, "lr": 0.0003469978153502146, "tps": 15744, "wall": 34969.2} {"step": 8401, "train_loss": 3.5931508541107178, "lr": 0.0003469842379945809, "tps": 15742, "wall": 34977.1} {"step": 8402, "train_loss": 3.5507845878601074, "lr": 0.0003469706592004629, "tps": 15741, "wall": 34984.8} {"step": 8403, "train_loss": 3.5852761268615723, "lr": 0.0003469570789680145, "tps": 15739, "wall": 34992.7} {"step": 8404, "train_loss": 3.556865692138672, "lr": 0.0003469434972973893, "tps": 15737, "wall": 35000.5} {"step": 8405, "train_loss": 3.6199307441711426, "lr": 0.0003469299141887414, "tps": 15736, "wall": 35008.4} {"step": 8406, "train_loss": 3.4536967277526855, "lr": 0.0003469163296422245, "tps": 15734, "wall": 35016.1} {"step": 8407, "train_loss": 3.589364767074585, "lr": 0.0003469027436579926, "tps": 15732, "wall": 35024.0} {"step": 8408, "train_loss": 3.6541547775268555, "lr": 0.00034688915623619956, "tps": 15731, "wall": 35031.8} {"step": 8409, "train_loss": 3.521141529083252, "lr": 0.00034687556737699924, "tps": 15729, "wall": 35039.6} {"step": 8410, "train_loss": 3.555670738220215, "lr": 0.00034686197708054566, "tps": 15727, "wall": 35047.5} {"step": 8411, "train_loss": 3.6560006141662598, "lr": 0.0003468483853469928, "tps": 15726, "wall": 35055.3} {"step": 8412, "train_loss": 3.6762337684631348, "lr": 0.00034683479217649445, "tps": 15724, "wall": 35063.0} {"step": 8413, "train_loss": 3.6430578231811523, "lr": 0.00034682119756920484, "tps": 15723, "wall": 35070.8} {"step": 8414, "train_loss": 3.671570301055908, "lr": 0.00034680760152527775, "tps": 15721, "wall": 35078.6} {"step": 8415, "train_loss": 3.6717190742492676, "lr": 0.0003467940040448673, "tps": 15719, "wall": 35086.6} {"step": 8416, "train_loss": 3.620579957962036, "lr": 0.0003467804051281275, "tps": 15718, "wall": 35094.3} {"step": 8417, "train_loss": 3.7049264907836914, "lr": 0.0003467668047752125, "tps": 15716, "wall": 35102.0} {"step": 8418, "train_loss": 3.556035280227661, "lr": 0.0003467532029862762, "tps": 15714, "wall": 35109.9} {"step": 8419, "train_loss": 3.666034698486328, "lr": 0.0003467395997614728, "tps": 15713, "wall": 35117.8} {"step": 8420, "train_loss": 3.5824387073516846, "lr": 0.00034672599510095626, "tps": 15711, "wall": 35125.5} {"step": 8421, "train_loss": 3.518089532852173, "lr": 0.0003467123890048809, "tps": 15709, "wall": 35133.4} {"step": 8422, "train_loss": 3.7322325706481934, "lr": 0.0003466987814734007, "tps": 15708, "wall": 35141.2} {"step": 8423, "train_loss": 3.5428848266601562, "lr": 0.0003466851725066699, "tps": 15706, "wall": 35149.1} {"step": 8424, "train_loss": 3.5901243686676025, "lr": 0.00034667156210484255, "tps": 15705, "wall": 35156.9} {"step": 8425, "train_loss": 3.5824060440063477, "lr": 0.0003466579502680729, "tps": 15703, "wall": 35164.6} {"step": 8426, "train_loss": 3.6020748615264893, "lr": 0.0003466443369965152, "tps": 15701, "wall": 35172.5} {"step": 8427, "train_loss": 3.4889137744903564, "lr": 0.0003466307222903235, "tps": 15700, "wall": 35180.2} {"step": 8428, "train_loss": 3.631171941757202, "lr": 0.0003466171061496522, "tps": 15698, "wall": 35188.1} {"step": 8429, "train_loss": 3.5772924423217773, "lr": 0.00034660348857465547, "tps": 15696, "wall": 35195.9} {"step": 8430, "train_loss": 3.5035367012023926, "lr": 0.00034658986956548755, "tps": 15695, "wall": 35203.6} {"step": 8431, "train_loss": 3.610456943511963, "lr": 0.0003465762491223027, "tps": 15693, "wall": 35211.5} {"step": 8432, "train_loss": 3.552794933319092, "lr": 0.0003465626272452553, "tps": 15692, "wall": 35219.3} {"step": 8433, "train_loss": 3.5732851028442383, "lr": 0.00034654900393449957, "tps": 15690, "wall": 35227.1} {"step": 8434, "train_loss": 3.5902621746063232, "lr": 0.0003465353791901899, "tps": 15688, "wall": 35234.8} {"step": 8435, "train_loss": 3.5221638679504395, "lr": 0.00034652175301248063, "tps": 15687, "wall": 35242.5} {"step": 8436, "train_loss": 3.598769187927246, "lr": 0.00034650812540152617, "tps": 15685, "wall": 35250.5} {"step": 8437, "train_loss": 3.6131787300109863, "lr": 0.0003464944963574807, "tps": 15684, "wall": 35258.2} {"step": 8438, "train_loss": 3.6417770385742188, "lr": 0.00034648086588049873, "tps": 15682, "wall": 35266.2} {"step": 8439, "train_loss": 3.5920639038085938, "lr": 0.00034646723397073476, "tps": 15680, "wall": 35273.9} {"step": 8440, "train_loss": 3.404183864593506, "lr": 0.000346453600628343, "tps": 15679, "wall": 35281.7} {"step": 8441, "train_loss": 3.595050811767578, "lr": 0.0003464399658534781, "tps": 15677, "wall": 35289.5} {"step": 8442, "train_loss": 3.537081718444824, "lr": 0.0003464263296462944, "tps": 15675, "wall": 35297.3} {"step": 8443, "train_loss": 3.5966100692749023, "lr": 0.0003464126920069464, "tps": 15674, "wall": 35305.1} {"step": 8444, "train_loss": 3.6638383865356445, "lr": 0.0003463990529355887, "tps": 15672, "wall": 35312.8} {"step": 8445, "train_loss": 3.5695176124572754, "lr": 0.0003463854124323755, "tps": 15671, "wall": 35320.5} {"step": 8446, "train_loss": 3.622485637664795, "lr": 0.0003463717704974616, "tps": 15669, "wall": 35328.5} {"step": 8447, "train_loss": 3.630697727203369, "lr": 0.0003463581271310014, "tps": 15668, "wall": 35336.2} {"step": 8448, "train_loss": 3.5429158210754395, "lr": 0.00034634448233314955, "tps": 15666, "wall": 35344.0} {"step": 8449, "train_loss": 3.6045796871185303, "lr": 0.0003463308361040606, "tps": 15664, "wall": 35351.8} {"step": 8450, "train_loss": 3.538386821746826, "lr": 0.0003463171884438891, "tps": 15663, "wall": 35359.6} {"step": 8451, "train_loss": 3.5946733951568604, "lr": 0.0003463035393527896, "tps": 15661, "wall": 35367.4} {"step": 8452, "train_loss": 3.574058771133423, "lr": 0.00034628988883091675, "tps": 15660, "wall": 35375.1} {"step": 8453, "train_loss": 3.703216552734375, "lr": 0.00034627623687842526, "tps": 15658, "wall": 35382.9} {"step": 8454, "train_loss": 3.5139365196228027, "lr": 0.00034626258349546973, "tps": 15656, "wall": 35390.8} {"step": 8455, "train_loss": 3.5671885013580322, "lr": 0.0003462489286822048, "tps": 15655, "wall": 35398.6} {"step": 8456, "train_loss": 3.4852263927459717, "lr": 0.0003462352724387852, "tps": 15653, "wall": 35406.3} {"step": 8457, "train_loss": 3.506821393966675, "lr": 0.0003462216147653656, "tps": 15652, "wall": 35414.1} {"step": 8458, "train_loss": 3.5539355278015137, "lr": 0.0003462079556621007, "tps": 15650, "wall": 35421.7} {"step": 8459, "train_loss": 3.559539318084717, "lr": 0.00034619429512914527, "tps": 15648, "wall": 35429.6} {"step": 8460, "train_loss": 3.5820324420928955, "lr": 0.00034618063316665406, "tps": 15647, "wall": 35437.4} {"step": 8461, "train_loss": 3.5355136394500732, "lr": 0.0003461669697747817, "tps": 15645, "wall": 35445.2} {"step": 8462, "train_loss": 3.56234073638916, "lr": 0.0003461533049536832, "tps": 15644, "wall": 35452.9} {"step": 8463, "train_loss": 3.5735363960266113, "lr": 0.0003461396387035132, "tps": 15642, "wall": 35460.8} {"step": 8464, "train_loss": 3.5484495162963867, "lr": 0.0003461259710244266, "tps": 15640, "wall": 35468.6} {"step": 8465, "train_loss": 3.6094045639038086, "lr": 0.00034611230191657815, "tps": 15639, "wall": 35476.5} {"step": 8466, "train_loss": 3.545905113220215, "lr": 0.00034609863138012264, "tps": 15637, "wall": 35484.2} {"step": 8467, "train_loss": 3.585136890411377, "lr": 0.0003460849594152151, "tps": 15636, "wall": 35492.0} {"step": 8468, "train_loss": 3.6232988834381104, "lr": 0.00034607128602201026, "tps": 15634, "wall": 35499.8} {"step": 8469, "train_loss": 3.654829978942871, "lr": 0.00034605761120066304, "tps": 15632, "wall": 35507.7} {"step": 8470, "train_loss": 3.5646743774414062, "lr": 0.00034604393495132847, "tps": 15631, "wall": 35515.4} {"step": 8471, "train_loss": 3.458519458770752, "lr": 0.00034603025727416133, "tps": 15629, "wall": 35523.2} {"step": 8472, "train_loss": 3.690964698791504, "lr": 0.00034601657816931666, "tps": 15628, "wall": 35530.9} {"step": 8473, "train_loss": 3.667113780975342, "lr": 0.00034600289763694935, "tps": 15626, "wall": 35538.7} {"step": 8474, "train_loss": 3.5252392292022705, "lr": 0.0003459892156772144, "tps": 15625, "wall": 35546.6} {"step": 8475, "train_loss": 3.543456554412842, "lr": 0.0003459755322902668, "tps": 15623, "wall": 35554.3} {"step": 8476, "train_loss": 3.622405529022217, "lr": 0.0003459618474762616, "tps": 15621, "wall": 35562.0} {"step": 8477, "train_loss": 3.5294179916381836, "lr": 0.00034594816123535374, "tps": 15620, "wall": 35569.8} {"step": 8478, "train_loss": 3.501901626586914, "lr": 0.0003459344735676983, "tps": 15618, "wall": 35577.5} {"step": 8479, "train_loss": 3.4952268600463867, "lr": 0.0003459207844734503, "tps": 15617, "wall": 35585.4} {"step": 8480, "train_loss": 3.5081253051757812, "lr": 0.00034590709395276485, "tps": 15615, "wall": 35593.1} {"step": 8481, "train_loss": 3.51233172416687, "lr": 0.00034589340200579704, "tps": 15614, "wall": 35600.9} {"step": 8482, "train_loss": 3.617973804473877, "lr": 0.000345879708632702, "tps": 15612, "wall": 35608.7} {"step": 8483, "train_loss": 3.5568056106567383, "lr": 0.00034586601383363477, "tps": 15610, "wall": 35616.4} {"step": 8484, "train_loss": 3.626978874206543, "lr": 0.0003458523176087505, "tps": 15609, "wall": 35624.3} {"step": 8485, "train_loss": 3.5500500202178955, "lr": 0.0003458386199582044, "tps": 15607, "wall": 35632.1} {"step": 8486, "train_loss": 3.6226253509521484, "lr": 0.0003458249208821516, "tps": 15606, "wall": 35639.6} {"step": 8487, "train_loss": 3.6775503158569336, "lr": 0.00034581122038074736, "tps": 15604, "wall": 35647.4} {"step": 8488, "train_loss": 3.6387746334075928, "lr": 0.0003457975184541467, "tps": 15603, "wall": 35655.2} {"step": 8489, "train_loss": 3.6469979286193848, "lr": 0.00034578381510250503, "tps": 15601, "wall": 35663.0} {"step": 8490, "train_loss": 3.591435432434082, "lr": 0.0003457701103259774, "tps": 15600, "wall": 35670.7} {"step": 8491, "train_loss": 3.4375524520874023, "lr": 0.0003457564041247192, "tps": 15598, "wall": 35678.5} {"step": 8492, "train_loss": 3.5520546436309814, "lr": 0.0003457426964988857, "tps": 15596, "wall": 35686.4} {"step": 8493, "train_loss": 3.5113229751586914, "lr": 0.0003457289874486321, "tps": 15595, "wall": 35694.2} {"step": 8494, "train_loss": 3.6587510108947754, "lr": 0.0003457152769741137, "tps": 15593, "wall": 35701.9} {"step": 8495, "train_loss": 3.57014799118042, "lr": 0.0003457015650754858, "tps": 15592, "wall": 35709.7} {"step": 8496, "train_loss": 3.500927209854126, "lr": 0.0003456878517529039, "tps": 15590, "wall": 35717.5} {"step": 8497, "train_loss": 3.5041139125823975, "lr": 0.0003456741370065232, "tps": 15589, "wall": 35725.3} {"step": 8498, "train_loss": 3.6773698329925537, "lr": 0.00034566042083649897, "tps": 15587, "wall": 35733.1} {"step": 8499, "train_loss": 3.550312042236328, "lr": 0.00034564670324298676, "tps": 15586, "wall": 35740.8} {"step": 8500, "train_loss": 3.5881853103637695, "lr": 0.0003456329842261419, "tps": 15584, "wall": 35748.8} {"step": 8501, "train_loss": 3.645118236541748, "lr": 0.0003456192637861198, "tps": 15582, "wall": 35756.4} {"step": 8502, "train_loss": 3.586339235305786, "lr": 0.0003456055419230759, "tps": 15581, "wall": 35764.2} {"step": 8503, "train_loss": 3.657649040222168, "lr": 0.0003455918186371655, "tps": 15579, "wall": 35771.9} {"step": 8504, "train_loss": 3.5974483489990234, "lr": 0.00034557809392854434, "tps": 15578, "wall": 35779.8} {"step": 8505, "train_loss": 3.680081605911255, "lr": 0.0003455643677973677, "tps": 15576, "wall": 35787.5} {"step": 8506, "train_loss": 3.537667751312256, "lr": 0.00034555064024379106, "tps": 15575, "wall": 35795.2} {"step": 8507, "train_loss": 3.6030561923980713, "lr": 0.00034553691126797, "tps": 15573, "wall": 35802.9} {"step": 8508, "train_loss": 3.532783269882202, "lr": 0.00034552318087006, "tps": 15571, "wall": 35810.9} {"step": 8509, "train_loss": 3.5374555587768555, "lr": 0.00034550944905021664, "tps": 15570, "wall": 35818.7} {"step": 8510, "train_loss": 3.59633731842041, "lr": 0.0003454957158085955, "tps": 15568, "wall": 35826.4} {"step": 8511, "train_loss": 3.6655023097991943, "lr": 0.000345481981145352, "tps": 15567, "wall": 35834.2} {"step": 8512, "train_loss": 3.6256184577941895, "lr": 0.0003454682450606419, "tps": 15565, "wall": 35842.0} {"step": 8513, "train_loss": 3.548733711242676, "lr": 0.0003454545075546207, "tps": 15564, "wall": 35849.8} {"step": 8514, "train_loss": 3.5951268672943115, "lr": 0.00034544076862744405, "tps": 15562, "wall": 35857.6} {"step": 8515, "train_loss": 3.6578900814056396, "lr": 0.00034542702827926764, "tps": 15561, "wall": 35865.3} {"step": 8516, "train_loss": 3.593930244445801, "lr": 0.00034541328651024704, "tps": 15559, "wall": 35873.1} {"step": 8517, "train_loss": 3.5530595779418945, "lr": 0.0003453995433205379, "tps": 15558, "wall": 35880.8} {"step": 8518, "train_loss": 3.6571104526519775, "lr": 0.000345385798710296, "tps": 15556, "wall": 35888.6} {"step": 8519, "train_loss": 3.5718894004821777, "lr": 0.00034537205267967696, "tps": 15554, "wall": 35896.3} {"step": 8520, "train_loss": 3.4868826866149902, "lr": 0.00034535830522883655, "tps": 15553, "wall": 35904.1} {"step": 8521, "train_loss": 3.6343655586242676, "lr": 0.0003453445563579304, "tps": 15551, "wall": 35911.7} {"step": 8522, "train_loss": 3.596278429031372, "lr": 0.00034533080606711445, "tps": 15550, "wall": 35919.6} {"step": 8523, "train_loss": 3.6002960205078125, "lr": 0.00034531705435654426, "tps": 15548, "wall": 35927.4} {"step": 8524, "train_loss": 3.5903544425964355, "lr": 0.0003453033012263758, "tps": 15547, "wall": 35935.2} {"step": 8525, "train_loss": 3.5936431884765625, "lr": 0.00034528954667676465, "tps": 15545, "wall": 35942.9} {"step": 8526, "train_loss": 3.5868587493896484, "lr": 0.0003452757907078668, "tps": 15544, "wall": 35950.6} {"step": 8527, "train_loss": 3.5654308795928955, "lr": 0.00034526203331983803, "tps": 15542, "wall": 35958.4} {"step": 8528, "train_loss": 3.633678674697876, "lr": 0.0003452482745128341, "tps": 15541, "wall": 35966.3} {"step": 8529, "train_loss": 3.647129535675049, "lr": 0.000345234514287011, "tps": 15539, "wall": 35974.0} {"step": 8530, "train_loss": 3.555633783340454, "lr": 0.00034522075264252456, "tps": 15538, "wall": 35981.7} {"step": 8531, "train_loss": 3.5959084033966064, "lr": 0.0003452069895795306, "tps": 15536, "wall": 35989.5} {"step": 8532, "train_loss": 3.653472423553467, "lr": 0.00034519322509818514, "tps": 15535, "wall": 35997.3} {"step": 8533, "train_loss": 3.540724039077759, "lr": 0.000345179459198644, "tps": 15533, "wall": 36005.0} {"step": 8534, "train_loss": 3.5806922912597656, "lr": 0.00034516569188106327, "tps": 15531, "wall": 36012.7} {"step": 8535, "train_loss": 3.6254799365997314, "lr": 0.00034515192314559873, "tps": 15530, "wall": 36020.5} {"step": 8536, "train_loss": 3.5029122829437256, "lr": 0.00034513815299240644, "tps": 15528, "wall": 36028.4} {"step": 8537, "train_loss": 3.529514789581299, "lr": 0.0003451243814216424, "tps": 15527, "wall": 36036.2} {"step": 8538, "train_loss": 3.561184883117676, "lr": 0.0003451106084334626, "tps": 15525, "wall": 36044.0} {"step": 8539, "train_loss": 3.6136279106140137, "lr": 0.00034509683402802305, "tps": 15524, "wall": 36051.8} {"step": 8540, "train_loss": 3.6223106384277344, "lr": 0.00034508305820547976, "tps": 15522, "wall": 36059.7} {"step": 8541, "train_loss": 3.5785961151123047, "lr": 0.0003450692809659889, "tps": 15521, "wall": 36067.5} {"step": 8542, "train_loss": 3.5761032104492188, "lr": 0.0003450555023097064, "tps": 15519, "wall": 36075.2} {"step": 8543, "train_loss": 3.5158228874206543, "lr": 0.0003450417222367885, "tps": 15518, "wall": 36083.1} {"step": 8544, "train_loss": 3.606916904449463, "lr": 0.0003450279407473911, "tps": 15516, "wall": 36090.8} {"step": 8545, "train_loss": 3.569352626800537, "lr": 0.00034501415784167044, "tps": 15515, "wall": 36098.6} {"step": 8546, "train_loss": 3.5476107597351074, "lr": 0.00034500037351978263, "tps": 15513, "wall": 36106.6} {"step": 8547, "train_loss": 3.5702805519104004, "lr": 0.00034498658778188385, "tps": 15511, "wall": 36114.4} {"step": 8548, "train_loss": 3.5751872062683105, "lr": 0.00034497280062813023, "tps": 15510, "wall": 36122.1} {"step": 8549, "train_loss": 3.511303424835205, "lr": 0.000344959012058678, "tps": 15508, "wall": 36130.0} {"step": 8550, "train_loss": 3.599527597427368, "lr": 0.0003449452220736833, "tps": 15507, "wall": 36137.7} {"step": 8551, "train_loss": 3.5751054286956787, "lr": 0.00034493143067330234, "tps": 15505, "wall": 36145.6} {"step": 8552, "train_loss": 3.6563825607299805, "lr": 0.00034491763785769134, "tps": 15504, "wall": 36153.3} {"step": 8553, "train_loss": 3.485344886779785, "lr": 0.00034490384362700666, "tps": 15502, "wall": 36161.1} {"step": 8554, "train_loss": 3.537658214569092, "lr": 0.0003448900479814045, "tps": 15501, "wall": 36169.0} {"step": 8555, "train_loss": 3.5756943225860596, "lr": 0.00034487625092104103, "tps": 15499, "wall": 36176.8} {"step": 8556, "train_loss": 3.5338892936706543, "lr": 0.0003448624524460727, "tps": 15498, "wall": 36184.6} {"step": 8557, "train_loss": 3.6117618083953857, "lr": 0.0003448486525566557, "tps": 15496, "wall": 36192.4} {"step": 8558, "train_loss": 3.6456708908081055, "lr": 0.00034483485125294647, "tps": 15495, "wall": 36200.2} {"step": 8559, "train_loss": 3.5208704471588135, "lr": 0.00034482104853510127, "tps": 15493, "wall": 36208.0} {"step": 8560, "train_loss": 3.5694351196289062, "lr": 0.00034480724440327646, "tps": 15492, "wall": 36215.7} {"step": 8561, "train_loss": 3.533151388168335, "lr": 0.0003447934388576285, "tps": 15490, "wall": 36223.5} {"step": 8562, "train_loss": 3.503830671310425, "lr": 0.00034477963189831365, "tps": 15488, "wall": 36231.4} {"step": 8563, "train_loss": 3.607433319091797, "lr": 0.0003447658235254883, "tps": 15487, "wall": 36239.2} {"step": 8564, "train_loss": 3.576648235321045, "lr": 0.0003447520137393091, "tps": 15485, "wall": 36247.0} {"step": 8565, "train_loss": 3.6014184951782227, "lr": 0.0003447382025399323, "tps": 15484, "wall": 36254.8} {"step": 8566, "train_loss": 3.6964056491851807, "lr": 0.00034472438992751435, "tps": 15482, "wall": 36262.6} {"step": 8567, "train_loss": 3.586061954498291, "lr": 0.00034471057590221174, "tps": 15481, "wall": 36270.3} {"step": 8568, "train_loss": 3.5745909214019775, "lr": 0.00034469676046418107, "tps": 15479, "wall": 36278.1} {"step": 8569, "train_loss": 3.5399491786956787, "lr": 0.0003446829436135787, "tps": 15478, "wall": 36286.0} {"step": 8570, "train_loss": 3.5913009643554688, "lr": 0.0003446691253505612, "tps": 15476, "wall": 36293.8} {"step": 8571, "train_loss": 3.5866923332214355, "lr": 0.00034465530567528513, "tps": 15475, "wall": 36301.6} {"step": 8572, "train_loss": 3.4936718940734863, "lr": 0.000344641484587907, "tps": 15473, "wall": 36309.4} {"step": 8573, "train_loss": 3.668388843536377, "lr": 0.0003446276620885833, "tps": 15472, "wall": 36317.2} {"step": 8574, "train_loss": 3.543506622314453, "lr": 0.00034461383817747086, "tps": 15470, "wall": 36325.2} {"step": 8575, "train_loss": 3.519890308380127, "lr": 0.000344600012854726, "tps": 15469, "wall": 36332.8} {"step": 8576, "train_loss": 3.619129180908203, "lr": 0.00034458618612050553, "tps": 15467, "wall": 36340.6} {"step": 8577, "train_loss": 3.541419506072998, "lr": 0.000344572357974966, "tps": 15466, "wall": 36348.6} {"step": 8578, "train_loss": 3.5700178146362305, "lr": 0.00034455852841826397, "tps": 15464, "wall": 36356.4} {"step": 8579, "train_loss": 3.5613746643066406, "lr": 0.0003445446974505563, "tps": 15462, "wall": 36364.2} {"step": 8580, "train_loss": 3.672304630279541, "lr": 0.00034453086507199945, "tps": 15461, "wall": 36371.9} {"step": 8581, "train_loss": 3.6662025451660156, "lr": 0.00034451703128275034, "tps": 15459, "wall": 36379.8} {"step": 8582, "train_loss": 3.5251054763793945, "lr": 0.0003445031960829655, "tps": 15458, "wall": 36387.5} {"step": 8583, "train_loss": 3.5235519409179688, "lr": 0.00034448935947280175, "tps": 15456, "wall": 36395.3} {"step": 8584, "train_loss": 3.5799171924591064, "lr": 0.0003444755214524158, "tps": 15455, "wall": 36403.2} {"step": 8585, "train_loss": 3.5881049633026123, "lr": 0.00034446168202196436, "tps": 15453, "wall": 36411.0} {"step": 8586, "train_loss": 3.464200973510742, "lr": 0.00034444784118160425, "tps": 15452, "wall": 36418.8} {"step": 8587, "train_loss": 3.5432450771331787, "lr": 0.0003444339989314923, "tps": 15450, "wall": 36426.5} {"step": 8588, "train_loss": 3.4098734855651855, "lr": 0.00034442015527178524, "tps": 15449, "wall": 36434.3} {"step": 8589, "train_loss": 3.6718626022338867, "lr": 0.00034440631020264, "tps": 15447, "wall": 36442.1} {"step": 8590, "train_loss": 3.54758358001709, "lr": 0.00034439246372421333, "tps": 15446, "wall": 36450.0} {"step": 8591, "train_loss": 3.5752246379852295, "lr": 0.000344378615836662, "tps": 15444, "wall": 36457.7} {"step": 8592, "train_loss": 3.6834139823913574, "lr": 0.00034436476654014315, "tps": 15443, "wall": 36465.6} {"step": 8593, "train_loss": 3.5971784591674805, "lr": 0.00034435091583481336, "tps": 15441, "wall": 36473.3} {"step": 8594, "train_loss": 3.508296012878418, "lr": 0.0003443370637208298, "tps": 15440, "wall": 36481.1} {"step": 8595, "train_loss": 3.5609662532806396, "lr": 0.0003443232101983491, "tps": 15438, "wall": 36488.9} {"step": 8596, "train_loss": 3.617461681365967, "lr": 0.00034430935526752845, "tps": 15437, "wall": 36496.8} {"step": 8597, "train_loss": 3.5637850761413574, "lr": 0.0003442954989285247, "tps": 15435, "wall": 36504.5} {"step": 8598, "train_loss": 3.5231778621673584, "lr": 0.00034428164118149477, "tps": 15434, "wall": 36512.3} {"step": 8599, "train_loss": 3.475466012954712, "lr": 0.0003442677820265957, "tps": 15432, "wall": 36519.9} {"step": 8600, "train_loss": 3.5412039756774902, "lr": 0.0003442539214639844, "tps": 15431, "wall": 36527.9} {"step": 8601, "train_loss": 3.6239166259765625, "lr": 0.00034424005949381807, "tps": 15429, "wall": 36535.6} {"step": 8602, "train_loss": 3.5864248275756836, "lr": 0.00034422619611625355, "tps": 15428, "wall": 36543.3} {"step": 8603, "train_loss": 3.5769104957580566, "lr": 0.00034421233133144805, "tps": 15426, "wall": 36551.0} {"step": 8604, "train_loss": 3.5399582386016846, "lr": 0.0003441984651395584, "tps": 15425, "wall": 36558.8} {"step": 8605, "train_loss": 3.497910737991333, "lr": 0.00034418459754074197, "tps": 15423, "wall": 36566.6} {"step": 8606, "train_loss": 3.6368894577026367, "lr": 0.0003441707285351556, "tps": 15422, "wall": 36574.4} {"step": 8607, "train_loss": 3.5937044620513916, "lr": 0.00034415685812295657, "tps": 15421, "wall": 36582.1} {"step": 8608, "train_loss": 3.6743252277374268, "lr": 0.0003441429863043018, "tps": 15419, "wall": 36590.0} {"step": 8609, "train_loss": 3.4827213287353516, "lr": 0.00034412911307934877, "tps": 15417, "wall": 36597.8} {"step": 8610, "train_loss": 3.508443832397461, "lr": 0.0003441152384482543, "tps": 15416, "wall": 36605.5} {"step": 8611, "train_loss": 3.5405821800231934, "lr": 0.0003441013624111757, "tps": 15415, "wall": 36613.3} {"step": 8612, "train_loss": 3.6149630546569824, "lr": 0.00034408748496827016, "tps": 15413, "wall": 36621.0} {"step": 8613, "train_loss": 3.588590145111084, "lr": 0.0003440736061196949, "tps": 15412, "wall": 36628.9} {"step": 8614, "train_loss": 3.6610164642333984, "lr": 0.00034405972586560706, "tps": 15410, "wall": 36636.7} {"step": 8615, "train_loss": 3.480311632156372, "lr": 0.00034404584420616403, "tps": 15409, "wall": 36644.6} {"step": 8616, "train_loss": 3.7324628829956055, "lr": 0.00034403196114152294, "tps": 15407, "wall": 36652.2} {"step": 8617, "train_loss": 3.5481598377227783, "lr": 0.00034401807667184105, "tps": 15406, "wall": 36660.1} {"step": 8618, "train_loss": 3.583355188369751, "lr": 0.0003440041907972757, "tps": 15404, "wall": 36667.8} {"step": 8619, "train_loss": 3.585231304168701, "lr": 0.0003439903035179841, "tps": 15403, "wall": 36675.5} {"step": 8620, "train_loss": 3.5994906425476074, "lr": 0.00034397641483412377, "tps": 15401, "wall": 36683.3} {"step": 8621, "train_loss": 3.6526219844818115, "lr": 0.00034396252474585176, "tps": 15400, "wall": 36691.0} {"step": 8622, "train_loss": 3.557982921600342, "lr": 0.00034394863325332565, "tps": 15398, "wall": 36698.8} {"step": 8623, "train_loss": 3.5016298294067383, "lr": 0.00034393474035670265, "tps": 15397, "wall": 36706.7} {"step": 8624, "train_loss": 3.6027979850769043, "lr": 0.0003439208460561403, "tps": 15395, "wall": 36714.3} {"step": 8625, "train_loss": 3.6028342247009277, "lr": 0.00034390695035179584, "tps": 15394, "wall": 36722.1} {"step": 8626, "train_loss": 3.58925199508667, "lr": 0.0003438930532438268, "tps": 15392, "wall": 36729.9} {"step": 8627, "train_loss": 3.596036911010742, "lr": 0.0003438791547323905, "tps": 15391, "wall": 36737.7} {"step": 8628, "train_loss": 3.655939817428589, "lr": 0.00034386525481764436, "tps": 15389, "wall": 36745.6} {"step": 8629, "train_loss": 3.595153570175171, "lr": 0.000343851353499746, "tps": 15388, "wall": 36753.4} {"step": 8630, "train_loss": 3.6982109546661377, "lr": 0.0003438374507788528, "tps": 15386, "wall": 36761.1} {"step": 8631, "train_loss": 3.710865020751953, "lr": 0.0003438235466551223, "tps": 15385, "wall": 36769.0} {"step": 8632, "train_loss": 3.6752984523773193, "lr": 0.0003438096411287119, "tps": 15383, "wall": 36776.7} {"step": 8633, "train_loss": 3.58015775680542, "lr": 0.0003437957341997793, "tps": 15382, "wall": 36784.6} {"step": 8634, "train_loss": 3.4745824337005615, "lr": 0.0003437818258684818, "tps": 15380, "wall": 36792.4} {"step": 8635, "train_loss": 3.555361270904541, "lr": 0.0003437679161349771, "tps": 15379, "wall": 36800.2} {"step": 8636, "train_loss": 3.513190269470215, "lr": 0.00034375400499942274, "tps": 15378, "wall": 36808.0} {"step": 8637, "train_loss": 3.5682973861694336, "lr": 0.0003437400924619764, "tps": 15376, "wall": 36815.8} {"step": 8638, "train_loss": 3.6356701850891113, "lr": 0.00034372617852279554, "tps": 15375, "wall": 36823.5} {"step": 8639, "train_loss": 3.606825828552246, "lr": 0.00034371226318203783, "tps": 15373, "wall": 36831.4} {"step": 8640, "train_loss": 3.547290563583374, "lr": 0.00034369834643986093, "tps": 15372, "wall": 36839.2} {"step": 8641, "train_loss": 3.61281681060791, "lr": 0.0003436844282964225, "tps": 15370, "wall": 36847.1} {"step": 8642, "train_loss": 3.62739634513855, "lr": 0.00034367050875188006, "tps": 15369, "wall": 36854.8} {"step": 8643, "train_loss": 3.555426597595215, "lr": 0.00034365658780639147, "tps": 15367, "wall": 36862.5} {"step": 8644, "train_loss": 3.560879945755005, "lr": 0.00034364266546011444, "tps": 15366, "wall": 36870.4} {"step": 8645, "train_loss": 3.6481785774230957, "lr": 0.0003436287417132065, "tps": 15364, "wall": 36878.3} {"step": 8646, "train_loss": 3.552933692932129, "lr": 0.0003436148165658255, "tps": 15363, "wall": 36886.2} {"step": 8647, "train_loss": 3.677060842514038, "lr": 0.0003436008900181292, "tps": 15361, "wall": 36894.0} {"step": 8648, "train_loss": 3.54318904876709, "lr": 0.0003435869620702754, "tps": 15360, "wall": 36901.7} {"step": 8649, "train_loss": 3.5358166694641113, "lr": 0.00034357303272242174, "tps": 15358, "wall": 36909.5} {"step": 8650, "train_loss": 3.6456592082977295, "lr": 0.000343559101974726, "tps": 15357, "wall": 36917.3} {"step": 8651, "train_loss": 3.6574721336364746, "lr": 0.00034354516982734615, "tps": 15355, "wall": 36925.1} {"step": 8652, "train_loss": 3.6174635887145996, "lr": 0.00034353123628044, "tps": 15354, "wall": 36933.0} {"step": 8653, "train_loss": 3.6908490657806396, "lr": 0.0003435173013341652, "tps": 15352, "wall": 36940.7} {"step": 8654, "train_loss": 3.557542324066162, "lr": 0.0003435033649886798, "tps": 15351, "wall": 36948.7} {"step": 8655, "train_loss": 3.6175193786621094, "lr": 0.00034348942724414153, "tps": 15349, "wall": 36956.5} {"step": 8656, "train_loss": 3.611509323120117, "lr": 0.0003434754881007084, "tps": 15348, "wall": 36964.2} {"step": 8657, "train_loss": 3.606855869293213, "lr": 0.0003434615475585382, "tps": 15347, "wall": 36972.0} {"step": 8658, "train_loss": 3.6128439903259277, "lr": 0.00034344760561778897, "tps": 15345, "wall": 36979.9} {"step": 8659, "train_loss": 3.657942771911621, "lr": 0.0003434336622786186, "tps": 15344, "wall": 36987.6} {"step": 8660, "train_loss": 3.565964698791504, "lr": 0.000343419717541185, "tps": 15342, "wall": 36995.5} {"step": 8661, "train_loss": 3.590819835662842, "lr": 0.0003434057714056462, "tps": 15341, "wall": 37003.2} {"step": 8662, "train_loss": 3.6584296226501465, "lr": 0.00034339182387216013, "tps": 15339, "wall": 37011.1} {"step": 8663, "train_loss": 3.4912071228027344, "lr": 0.00034337787494088473, "tps": 15338, "wall": 37019.0} {"step": 8664, "train_loss": 3.5605039596557617, "lr": 0.00034336392461197825, "tps": 15336, "wall": 37026.9} {"step": 8665, "train_loss": 3.4966678619384766, "lr": 0.0003433499728855984, "tps": 15335, "wall": 37034.6} {"step": 8666, "train_loss": 3.613525867462158, "lr": 0.0003433360197619034, "tps": 15333, "wall": 37042.3} {"step": 8667, "train_loss": 3.589501142501831, "lr": 0.00034332206524105135, "tps": 15332, "wall": 37050.2} {"step": 8668, "train_loss": 3.6149649620056152, "lr": 0.00034330810932320025, "tps": 15330, "wall": 37058.0} {"step": 8669, "train_loss": 3.6042680740356445, "lr": 0.0003432941520085082, "tps": 15329, "wall": 37065.8} {"step": 8670, "train_loss": 3.637901782989502, "lr": 0.0003432801932971334, "tps": 15327, "wall": 37073.6} {"step": 8671, "train_loss": 3.6264517307281494, "lr": 0.0003432662331892338, "tps": 15326, "wall": 37081.3} {"step": 8672, "train_loss": 3.60684871673584, "lr": 0.00034325227168496776, "tps": 15325, "wall": 37089.1} {"step": 8673, "train_loss": 3.5599896907806396, "lr": 0.0003432383087844932, "tps": 15323, "wall": 37097.0} {"step": 8674, "train_loss": 3.5217337608337402, "lr": 0.00034322434448796847, "tps": 15322, "wall": 37104.8} {"step": 8675, "train_loss": 3.5218722820281982, "lr": 0.0003432103787955517, "tps": 15320, "wall": 37112.5} {"step": 8676, "train_loss": 3.5555317401885986, "lr": 0.0003431964117074011, "tps": 15319, "wall": 37120.2} {"step": 8677, "train_loss": 3.6523871421813965, "lr": 0.00034318244322367487, "tps": 15317, "wall": 37128.2} {"step": 8678, "train_loss": 3.488104820251465, "lr": 0.00034316847334453125, "tps": 15316, "wall": 37136.1} {"step": 8679, "train_loss": 3.489576816558838, "lr": 0.00034315450207012856, "tps": 15314, "wall": 37143.9} {"step": 8680, "train_loss": 3.522274971008301, "lr": 0.0003431405294006249, "tps": 15313, "wall": 37151.7} {"step": 8681, "train_loss": 3.4836387634277344, "lr": 0.00034312655533617876, "tps": 15311, "wall": 37159.5} {"step": 8682, "train_loss": 3.5487852096557617, "lr": 0.00034311257987694823, "tps": 15310, "wall": 37167.3} {"step": 8683, "train_loss": 3.6497111320495605, "lr": 0.0003430986030230918, "tps": 15309, "wall": 37175.1} {"step": 8684, "train_loss": 3.6694016456604004, "lr": 0.0003430846247747678, "tps": 15307, "wall": 37182.9} {"step": 8685, "train_loss": 3.606734037399292, "lr": 0.0003430706451321344, "tps": 15306, "wall": 37190.9} {"step": 8686, "train_loss": 3.5473062992095947, "lr": 0.00034305666409535017, "tps": 15304, "wall": 37198.5} {"step": 8687, "train_loss": 3.5933313369750977, "lr": 0.0003430426816645733, "tps": 15303, "wall": 37206.3} {"step": 8688, "train_loss": 3.5861074924468994, "lr": 0.0003430286978399624, "tps": 15301, "wall": 37214.1} {"step": 8689, "train_loss": 3.588904857635498, "lr": 0.00034301471262167564, "tps": 15300, "wall": 37221.9} {"step": 8690, "train_loss": 3.594302177429199, "lr": 0.00034300072600987157, "tps": 15298, "wall": 37229.7} {"step": 8691, "train_loss": 3.64461088180542, "lr": 0.00034298673800470865, "tps": 15297, "wall": 37237.5} {"step": 8692, "train_loss": 3.5327558517456055, "lr": 0.0003429727486063453, "tps": 15295, "wall": 37245.4} {"step": 8693, "train_loss": 3.457792282104492, "lr": 0.00034295875781494, "tps": 15294, "wall": 37253.3} {"step": 8694, "train_loss": 3.520610809326172, "lr": 0.0003429447656306513, "tps": 15293, "wall": 37261.0} {"step": 8695, "train_loss": 3.662167549133301, "lr": 0.00034293077205363757, "tps": 15291, "wall": 37268.8} {"step": 8696, "train_loss": 3.454054832458496, "lr": 0.00034291677708405744, "tps": 15290, "wall": 37276.6} {"step": 8697, "train_loss": 3.5289530754089355, "lr": 0.00034290278072206937, "tps": 15288, "wall": 37284.4} {"step": 8698, "train_loss": 3.644097328186035, "lr": 0.00034288878296783197, "tps": 15287, "wall": 37292.2} {"step": 8699, "train_loss": 3.598802089691162, "lr": 0.0003428747838215038, "tps": 15285, "wall": 37300.0} {"step": 8700, "train_loss": 3.6217916011810303, "lr": 0.00034286078328324345, "tps": 15284, "wall": 37308.0} {"step": 8701, "train_loss": 3.526015281677246, "lr": 0.00034284678135320946, "tps": 15282, "wall": 37315.8} {"step": 8702, "train_loss": 3.579000949859619, "lr": 0.0003428327780315605, "tps": 15281, "wall": 37323.5} {"step": 8703, "train_loss": 3.584433078765869, "lr": 0.00034281877331845517, "tps": 15280, "wall": 37331.3} {"step": 8704, "train_loss": 3.4820594787597656, "lr": 0.00034280476721405216, "tps": 15278, "wall": 37339.0} {"step": 8705, "train_loss": 3.4957776069641113, "lr": 0.00034279075971851004, "tps": 15277, "wall": 37347.0} {"step": 8706, "train_loss": 3.5217533111572266, "lr": 0.00034277675083198766, "tps": 15275, "wall": 37354.7} {"step": 8707, "train_loss": 3.5785913467407227, "lr": 0.0003427627405546435, "tps": 15274, "wall": 37362.5} {"step": 8708, "train_loss": 3.594289541244507, "lr": 0.00034274872888663646, "tps": 15272, "wall": 37370.4} {"step": 8709, "train_loss": 3.546414852142334, "lr": 0.0003427347158281251, "tps": 15271, "wall": 37378.2} {"step": 8710, "train_loss": 3.6580750942230225, "lr": 0.00034272070137926833, "tps": 15269, "wall": 37386.0} {"step": 8711, "train_loss": 3.4757375717163086, "lr": 0.00034270668554022476, "tps": 15268, "wall": 37393.8} {"step": 8712, "train_loss": 3.5443036556243896, "lr": 0.0003426926683111532, "tps": 15267, "wall": 37401.6} {"step": 8713, "train_loss": 3.604450225830078, "lr": 0.0003426786496922124, "tps": 15265, "wall": 37409.5} {"step": 8714, "train_loss": 3.5336334705352783, "lr": 0.0003426646296835614, "tps": 15264, "wall": 37417.4} {"step": 8715, "train_loss": 3.6265251636505127, "lr": 0.0003426506082853587, "tps": 15262, "wall": 37425.2} {"step": 8716, "train_loss": 3.624509811401367, "lr": 0.0003426365854977633, "tps": 15261, "wall": 37433.1} {"step": 8717, "train_loss": 3.5357565879821777, "lr": 0.00034262256132093407, "tps": 15259, "wall": 37440.7} {"step": 8718, "train_loss": 3.484175682067871, "lr": 0.0003426085357550298, "tps": 15258, "wall": 37448.5} {"step": 8719, "train_loss": 3.580641508102417, "lr": 0.00034259450880020937, "tps": 15257, "wall": 37456.3} {"step": 8720, "train_loss": 3.6014866828918457, "lr": 0.0003425804804566318, "tps": 15255, "wall": 37464.1} {"step": 8721, "train_loss": 3.5726921558380127, "lr": 0.00034256645072445585, "tps": 15254, "wall": 37471.9} {"step": 8722, "train_loss": 3.573078155517578, "lr": 0.0003425524196038405, "tps": 15252, "wall": 37479.7} {"step": 8723, "train_loss": 3.643016815185547, "lr": 0.00034253838709494473, "tps": 15251, "wall": 37487.6} {"step": 8724, "train_loss": 3.6270081996917725, "lr": 0.00034252435319792753, "tps": 15249, "wall": 37495.4} {"step": 8725, "train_loss": 3.507293939590454, "lr": 0.0003425103179129478, "tps": 15248, "wall": 37503.1} {"step": 8726, "train_loss": 3.4869937896728516, "lr": 0.0003424962812401645, "tps": 15247, "wall": 37511.0} {"step": 8727, "train_loss": 3.597147226333618, "lr": 0.0003424822431797368, "tps": 15245, "wall": 37518.7} {"step": 8728, "train_loss": 3.5743579864501953, "lr": 0.00034246820373182353, "tps": 15244, "wall": 37526.6} {"step": 8729, "train_loss": 3.553067684173584, "lr": 0.0003424541628965838, "tps": 15242, "wall": 37534.4} {"step": 8730, "train_loss": 3.617711305618286, "lr": 0.00034244012067417677, "tps": 15241, "wall": 37542.2} {"step": 8731, "train_loss": 3.571321964263916, "lr": 0.0003424260770647614, "tps": 15239, "wall": 37550.0} {"step": 8732, "train_loss": 3.699103355407715, "lr": 0.0003424120320684969, "tps": 15238, "wall": 37557.8} {"step": 8733, "train_loss": 3.566459894180298, "lr": 0.0003423979856855421, "tps": 15237, "wall": 37565.5} {"step": 8734, "train_loss": 3.564176321029663, "lr": 0.00034238393791605643, "tps": 15235, "wall": 37573.4} {"step": 8735, "train_loss": 3.6434082984924316, "lr": 0.0003423698887601988, "tps": 15234, "wall": 37581.1} {"step": 8736, "train_loss": 3.6321141719818115, "lr": 0.00034235583821812856, "tps": 15232, "wall": 37589.1} {"step": 8737, "train_loss": 3.672306537628174, "lr": 0.0003423417862900047, "tps": 15231, "wall": 37596.7} {"step": 8738, "train_loss": 3.5081162452697754, "lr": 0.0003423277329759864, "tps": 15230, "wall": 37604.6} {"step": 8739, "train_loss": 3.5839080810546875, "lr": 0.00034231367827623304, "tps": 15228, "wall": 37612.3} {"step": 8740, "train_loss": 3.5689430236816406, "lr": 0.0003422996221909037, "tps": 15227, "wall": 37620.2} {"step": 8741, "train_loss": 3.7084271907806396, "lr": 0.0003422855647201576, "tps": 15225, "wall": 37627.9} {"step": 8742, "train_loss": 3.624457836151123, "lr": 0.00034227150586415395, "tps": 15224, "wall": 37635.7} {"step": 8743, "train_loss": 3.6395950317382812, "lr": 0.00034225744562305213, "tps": 15222, "wall": 37643.5} {"step": 8744, "train_loss": 3.5687856674194336, "lr": 0.0003422433839970113, "tps": 15221, "wall": 37651.3} {"step": 8745, "train_loss": 3.50651216506958, "lr": 0.00034222932098619085, "tps": 15220, "wall": 37659.0} {"step": 8746, "train_loss": 3.5467779636383057, "lr": 0.00034221525659075005, "tps": 15218, "wall": 37666.9} {"step": 8747, "train_loss": 3.4178552627563477, "lr": 0.00034220119081084817, "tps": 15217, "wall": 37674.8} {"step": 8748, "train_loss": 3.5913286209106445, "lr": 0.00034218712364664466, "tps": 15215, "wall": 37682.6} {"step": 8749, "train_loss": 3.616375684738159, "lr": 0.00034217305509829873, "tps": 15214, "wall": 37690.3} {"step": 8750, "train_loss": 3.4994077682495117, "lr": 0.00034215898516596987, "tps": 15213, "wall": 37698.1} {"step": 8751, "train_loss": 3.6044187545776367, "lr": 0.0003421449138498174, "tps": 15211, "wall": 37705.9} {"step": 8752, "train_loss": 3.597813129425049, "lr": 0.00034213084115000073, "tps": 15210, "wall": 37713.6} {"step": 8753, "train_loss": 3.589297294616699, "lr": 0.0003421167670666793, "tps": 15208, "wall": 37721.3} {"step": 8754, "train_loss": 3.509014129638672, "lr": 0.00034210269160001245, "tps": 15207, "wall": 37729.2} {"step": 8755, "train_loss": 3.4808685779571533, "lr": 0.0003420886147501598, "tps": 15206, "wall": 37737.1} {"step": 8756, "train_loss": 3.558547019958496, "lr": 0.0003420745365172806, "tps": 15204, "wall": 37744.7} {"step": 8757, "train_loss": 3.5458083152770996, "lr": 0.00034206045690153455, "tps": 15203, "wall": 37752.6} {"step": 8758, "train_loss": 3.5976500511169434, "lr": 0.0003420463759030811, "tps": 15201, "wall": 37760.3} {"step": 8759, "train_loss": 3.5170767307281494, "lr": 0.0003420322935220796, "tps": 15200, "wall": 37768.1} {"step": 8760, "train_loss": 3.618428945541382, "lr": 0.0003420182097586897, "tps": 15199, "wall": 37775.9} {"step": 8761, "train_loss": 3.676466464996338, "lr": 0.0003420041246130709, "tps": 15197, "wall": 37783.7} {"step": 8762, "train_loss": 3.6105504035949707, "lr": 0.0003419900380853828, "tps": 15196, "wall": 37791.6} {"step": 8763, "train_loss": 3.5465173721313477, "lr": 0.000341975950175785, "tps": 15194, "wall": 37799.4} {"step": 8764, "train_loss": 3.5422041416168213, "lr": 0.000341961860884437, "tps": 15193, "wall": 37807.2} {"step": 8765, "train_loss": 3.6677165031433105, "lr": 0.00034194777021149836, "tps": 15192, "wall": 37815.0} {"step": 8766, "train_loss": 3.5100762844085693, "lr": 0.00034193367815712886, "tps": 15190, "wall": 37822.8} {"step": 8767, "train_loss": 3.583853244781494, "lr": 0.000341919584721488, "tps": 15189, "wall": 37830.7} {"step": 8768, "train_loss": 3.614386558532715, "lr": 0.0003419054899047356, "tps": 15187, "wall": 37838.5} {"step": 8769, "train_loss": 3.6340413093566895, "lr": 0.0003418913937070311, "tps": 15186, "wall": 37846.4} {"step": 8770, "train_loss": 3.6001851558685303, "lr": 0.0003418772961285344, "tps": 15185, "wall": 37854.2} {"step": 8771, "train_loss": 3.5089969635009766, "lr": 0.000341863197169405, "tps": 15183, "wall": 37861.9} {"step": 8772, "train_loss": 3.474159002304077, "lr": 0.0003418490968298028, "tps": 15182, "wall": 37869.7} {"step": 8773, "train_loss": 3.5273373126983643, "lr": 0.00034183499510988735, "tps": 15180, "wall": 37877.5} {"step": 8774, "train_loss": 3.607116937637329, "lr": 0.0003418208920098185, "tps": 15179, "wall": 37885.3} {"step": 8775, "train_loss": 3.5470447540283203, "lr": 0.00034180678752975603, "tps": 15178, "wall": 37893.0} {"step": 8776, "train_loss": 3.5504891872406006, "lr": 0.00034179268166985966, "tps": 15176, "wall": 37900.8} {"step": 8777, "train_loss": 3.505756378173828, "lr": 0.00034177857443028924, "tps": 15175, "wall": 37908.8} {"step": 8778, "train_loss": 3.562885284423828, "lr": 0.00034176446581120454, "tps": 15173, "wall": 37916.5} {"step": 8779, "train_loss": 3.6157755851745605, "lr": 0.0003417503558127653, "tps": 15172, "wall": 37924.3} {"step": 8780, "train_loss": 3.459892511367798, "lr": 0.0003417362444351315, "tps": 15171, "wall": 37932.2} {"step": 8781, "train_loss": 3.581577777862549, "lr": 0.0003417221316784629, "tps": 15169, "wall": 37939.9} {"step": 8782, "train_loss": 3.567028284072876, "lr": 0.0003417080175429195, "tps": 15168, "wall": 37947.8} {"step": 8783, "train_loss": 3.619033098220825, "lr": 0.00034169390202866103, "tps": 15166, "wall": 37955.7} {"step": 8784, "train_loss": 3.7912347316741943, "lr": 0.00034167978513584746, "tps": 15165, "wall": 37963.6} {"step": 8785, "train_loss": 3.6163840293884277, "lr": 0.0003416656668646387, "tps": 15164, "wall": 37971.4} {"step": 8786, "train_loss": 3.5709214210510254, "lr": 0.0003416515472151947, "tps": 15162, "wall": 37979.2} {"step": 8787, "train_loss": 3.5331878662109375, "lr": 0.0003416374261876754, "tps": 15161, "wall": 37987.0} {"step": 8788, "train_loss": 3.6878437995910645, "lr": 0.00034162330378224073, "tps": 15159, "wall": 37994.8} {"step": 8789, "train_loss": 3.530285120010376, "lr": 0.00034160917999905065, "tps": 15158, "wall": 38002.6} {"step": 8790, "train_loss": 3.4362127780914307, "lr": 0.00034159505483826526, "tps": 15157, "wall": 38010.5} {"step": 8791, "train_loss": 3.435823917388916, "lr": 0.00034158092830004455, "tps": 15155, "wall": 38018.3} {"step": 8792, "train_loss": 3.5200695991516113, "lr": 0.0003415668003845484, "tps": 15154, "wall": 38026.3} {"step": 8793, "train_loss": 3.525146007537842, "lr": 0.000341552671091937, "tps": 15152, "wall": 38034.0} {"step": 8794, "train_loss": 3.436394453048706, "lr": 0.00034153854042237044, "tps": 15151, "wall": 38041.7} {"step": 8795, "train_loss": 3.5437068939208984, "lr": 0.00034152440837600863, "tps": 15150, "wall": 38049.5} {"step": 8796, "train_loss": 3.716582775115967, "lr": 0.0003415102749530118, "tps": 15148, "wall": 38057.3} {"step": 8797, "train_loss": 3.5969510078430176, "lr": 0.00034149614015354, "tps": 15147, "wall": 38065.1} {"step": 8798, "train_loss": 3.519787311553955, "lr": 0.00034148200397775334, "tps": 15145, "wall": 38072.9} {"step": 8799, "train_loss": 3.5799026489257812, "lr": 0.00034146786642581193, "tps": 15144, "wall": 38080.6} {"step": 8800, "train_loss": 3.4849066734313965, "lr": 0.000341453727497876, "tps": 15143, "wall": 38088.5} {"step": 8801, "train_loss": 3.5589184761047363, "lr": 0.00034143958719410564, "tps": 15141, "wall": 38096.2} {"step": 8802, "train_loss": 3.666520595550537, "lr": 0.00034142544551466115, "tps": 15140, "wall": 38104.0} {"step": 8803, "train_loss": 3.484374761581421, "lr": 0.00034141130245970253, "tps": 15139, "wall": 38111.8} {"step": 8804, "train_loss": 3.5735924243927, "lr": 0.00034139715802939015, "tps": 15137, "wall": 38119.6} {"step": 8805, "train_loss": 3.5762977600097656, "lr": 0.00034138301222388424, "tps": 15136, "wall": 38127.5} {"step": 8806, "train_loss": 3.5226314067840576, "lr": 0.00034136886504334494, "tps": 15134, "wall": 38135.2} {"step": 8807, "train_loss": 3.547044277191162, "lr": 0.0003413547164879326, "tps": 15133, "wall": 38143.1} {"step": 8808, "train_loss": 3.561328887939453, "lr": 0.0003413405665578075, "tps": 15132, "wall": 38150.9} {"step": 8809, "train_loss": 3.578279495239258, "lr": 0.0003413264152531298, "tps": 15130, "wall": 38158.7} {"step": 8810, "train_loss": 3.532080888748169, "lr": 0.00034131226257405996, "tps": 15129, "wall": 38166.5} {"step": 8811, "train_loss": 3.530391216278076, "lr": 0.00034129810852075827, "tps": 15128, "wall": 38174.3} {"step": 8812, "train_loss": 3.640876293182373, "lr": 0.00034128395309338504, "tps": 15126, "wall": 38182.1} {"step": 8813, "train_loss": 3.622479200363159, "lr": 0.00034126979629210056, "tps": 15125, "wall": 38189.9} {"step": 8814, "train_loss": 3.5259480476379395, "lr": 0.00034125563811706537, "tps": 15123, "wall": 38197.6} {"step": 8815, "train_loss": 3.5985264778137207, "lr": 0.00034124147856843975, "tps": 15122, "wall": 38205.4} {"step": 8816, "train_loss": 3.6101741790771484, "lr": 0.00034122731764638407, "tps": 15121, "wall": 38213.1} {"step": 8817, "train_loss": 3.665153980255127, "lr": 0.0003412131553510587, "tps": 15119, "wall": 38220.9} {"step": 8818, "train_loss": 3.638576030731201, "lr": 0.00034119899168262417, "tps": 15118, "wall": 38228.6} {"step": 8819, "train_loss": 3.4601833820343018, "lr": 0.00034118482664124094, "tps": 15117, "wall": 38236.3} {"step": 8820, "train_loss": 3.3856654167175293, "lr": 0.0003411706602270695, "tps": 15115, "wall": 38244.1} {"step": 8821, "train_loss": 3.6164608001708984, "lr": 0.0003411564924402702, "tps": 15114, "wall": 38251.9} {"step": 8822, "train_loss": 3.5018951892852783, "lr": 0.0003411423232810036, "tps": 15113, "wall": 38259.6} {"step": 8823, "train_loss": 3.574882984161377, "lr": 0.00034112815274943024, "tps": 15111, "wall": 38267.4} {"step": 8824, "train_loss": 3.491832733154297, "lr": 0.00034111398084571057, "tps": 15110, "wall": 38275.1} {"step": 8825, "train_loss": 3.6556825637817383, "lr": 0.0003410998075700052, "tps": 15109, "wall": 38282.8} {"step": 8826, "train_loss": 3.468409776687622, "lr": 0.00034108563292247466, "tps": 15107, "wall": 38290.5} {"step": 8827, "train_loss": 3.5302999019622803, "lr": 0.0003410714569032795, "tps": 15106, "wall": 38298.3} {"step": 8828, "train_loss": 3.4824180603027344, "lr": 0.0003410572795125803, "tps": 15105, "wall": 38306.0} {"step": 8829, "train_loss": 3.561352252960205, "lr": 0.00034104310075053776, "tps": 15103, "wall": 38313.8} {"step": 8830, "train_loss": 3.5995006561279297, "lr": 0.00034102892061731237, "tps": 15102, "wall": 38321.5} {"step": 8831, "train_loss": 3.5397379398345947, "lr": 0.00034101473911306486, "tps": 15101, "wall": 38329.4} {"step": 8832, "train_loss": 3.566997766494751, "lr": 0.00034100055623795586, "tps": 15099, "wall": 38337.2} {"step": 8833, "train_loss": 3.4862489700317383, "lr": 0.00034098637199214595, "tps": 15098, "wall": 38344.9} {"step": 8834, "train_loss": 3.508223533630371, "lr": 0.0003409721863757959, "tps": 15097, "wall": 38352.7} {"step": 8835, "train_loss": 3.6027719974517822, "lr": 0.00034095799938906637, "tps": 15095, "wall": 38360.4} {"step": 8836, "train_loss": 3.469736099243164, "lr": 0.00034094381103211806, "tps": 15094, "wall": 38368.2} {"step": 8837, "train_loss": 3.632929801940918, "lr": 0.00034092962130511176, "tps": 15092, "wall": 38376.0} {"step": 8838, "train_loss": 3.5621845722198486, "lr": 0.00034091543020820815, "tps": 15091, "wall": 38383.6} {"step": 8839, "train_loss": 3.4139885902404785, "lr": 0.000340901237741568, "tps": 15090, "wall": 38391.6} {"step": 8840, "train_loss": 3.6107401847839355, "lr": 0.00034088704390535207, "tps": 15088, "wall": 38399.3} {"step": 8841, "train_loss": 3.5391182899475098, "lr": 0.0003408728486997212, "tps": 15087, "wall": 38407.0} {"step": 8842, "train_loss": 3.552243232727051, "lr": 0.00034085865212483615, "tps": 15086, "wall": 38414.7} {"step": 8843, "train_loss": 3.649555206298828, "lr": 0.0003408444541808577, "tps": 15084, "wall": 38422.6} {"step": 8844, "train_loss": 3.6198525428771973, "lr": 0.0003408302548679468, "tps": 15083, "wall": 38430.4} {"step": 8845, "train_loss": 3.4239046573638916, "lr": 0.0003408160541862643, "tps": 15082, "wall": 38438.0} {"step": 8846, "train_loss": 3.6089260578155518, "lr": 0.00034080185213597084, "tps": 15080, "wall": 38445.9} {"step": 8847, "train_loss": 3.51524019241333, "lr": 0.00034078764871722756, "tps": 15079, "wall": 38453.6} {"step": 8848, "train_loss": 3.549380302429199, "lr": 0.0003407734439301953, "tps": 15078, "wall": 38461.3} {"step": 8849, "train_loss": 3.547140121459961, "lr": 0.00034075923777503484, "tps": 15076, "wall": 38469.0} {"step": 8850, "train_loss": 3.5709805488586426, "lr": 0.00034074503025190725, "tps": 15075, "wall": 38476.7} {"step": 8851, "train_loss": 3.5106635093688965, "lr": 0.00034073082136097346, "tps": 15074, "wall": 38484.5} {"step": 8852, "train_loss": 3.4570438861846924, "lr": 0.0003407166111023943, "tps": 15072, "wall": 38492.3} {"step": 8853, "train_loss": 3.470245838165283, "lr": 0.0003407023994763309, "tps": 15071, "wall": 38500.0} {"step": 8854, "train_loss": 3.6080806255340576, "lr": 0.0003406881864829442, "tps": 15070, "wall": 38507.9} {"step": 8855, "train_loss": 3.5710792541503906, "lr": 0.0003406739721223951, "tps": 15068, "wall": 38515.7} {"step": 8856, "train_loss": 3.709105968475342, "lr": 0.0003406597563948448, "tps": 15067, "wall": 38523.4} {"step": 8857, "train_loss": 3.458608388900757, "lr": 0.00034064553930045427, "tps": 15066, "wall": 38531.1} {"step": 8858, "train_loss": 3.6032824516296387, "lr": 0.00034063132083938456, "tps": 15064, "wall": 38539.0} {"step": 8859, "train_loss": 3.615436315536499, "lr": 0.0003406171010117966, "tps": 15063, "wall": 38546.8} {"step": 8860, "train_loss": 3.4538984298706055, "lr": 0.00034060287981785173, "tps": 15062, "wall": 38554.5} {"step": 8861, "train_loss": 3.492816686630249, "lr": 0.00034058865725771083, "tps": 15060, "wall": 38562.2} {"step": 8862, "train_loss": 3.580631732940674, "lr": 0.00034057443333153516, "tps": 15059, "wall": 38570.2} {"step": 8863, "train_loss": 3.491044282913208, "lr": 0.0003405602080394857, "tps": 15058, "wall": 38577.8} {"step": 8864, "train_loss": 3.542877435684204, "lr": 0.00034054598138172376, "tps": 15056, "wall": 38585.6} {"step": 8865, "train_loss": 3.5267372131347656, "lr": 0.00034053175335841036, "tps": 15055, "wall": 38593.4} {"step": 8866, "train_loss": 3.613203763961792, "lr": 0.00034051752396970674, "tps": 15054, "wall": 38601.3} {"step": 8867, "train_loss": 3.5385117530822754, "lr": 0.0003405032932157742, "tps": 15052, "wall": 38609.1} {"step": 8868, "train_loss": 3.5998969078063965, "lr": 0.0003404890610967737, "tps": 15051, "wall": 38616.9} {"step": 8869, "train_loss": 3.534797191619873, "lr": 0.0003404748276128666, "tps": 15050, "wall": 38624.8} {"step": 8870, "train_loss": 3.6201086044311523, "lr": 0.00034046059276421424, "tps": 15048, "wall": 38632.6} {"step": 8871, "train_loss": 3.5965094566345215, "lr": 0.00034044635655097765, "tps": 15047, "wall": 38640.3} {"step": 8872, "train_loss": 3.561337471008301, "lr": 0.00034043211897331833, "tps": 15046, "wall": 38648.0} {"step": 8873, "train_loss": 3.5628864765167236, "lr": 0.0003404178800313974, "tps": 15044, "wall": 38655.7} {"step": 8874, "train_loss": 3.5174965858459473, "lr": 0.00034040363972537616, "tps": 15043, "wall": 38663.6} {"step": 8875, "train_loss": 3.6549532413482666, "lr": 0.000340389398055416, "tps": 15042, "wall": 38671.4} {"step": 8876, "train_loss": 3.57747745513916, "lr": 0.00034037515502167835, "tps": 15040, "wall": 38679.1} {"step": 8877, "train_loss": 3.593662738800049, "lr": 0.0003403609106243243, "tps": 15039, "wall": 38686.9} {"step": 8878, "train_loss": 3.490914821624756, "lr": 0.00034034666486351537, "tps": 15038, "wall": 38694.7} {"step": 8879, "train_loss": 3.5366828441619873, "lr": 0.0003403324177394129, "tps": 15036, "wall": 38702.4} {"step": 8880, "train_loss": 3.4355227947235107, "lr": 0.00034031816925217834, "tps": 15035, "wall": 38710.1} {"step": 8881, "train_loss": 3.559786319732666, "lr": 0.000340303919401973, "tps": 15034, "wall": 38717.7} {"step": 8882, "train_loss": 3.66093373298645, "lr": 0.0003402896681889584, "tps": 15032, "wall": 38725.6} {"step": 8883, "train_loss": 3.495774507522583, "lr": 0.0003402754156132959, "tps": 15031, "wall": 38733.4} {"step": 8884, "train_loss": 3.6081578731536865, "lr": 0.00034026116167514697, "tps": 15030, "wall": 38741.2} {"step": 8885, "train_loss": 3.555375099182129, "lr": 0.0003402469063746731, "tps": 15028, "wall": 38749.1} {"step": 8886, "train_loss": 3.5546367168426514, "lr": 0.0003402326497120358, "tps": 15027, "wall": 38756.8} {"step": 8887, "train_loss": 3.573751926422119, "lr": 0.00034021839168739653, "tps": 15026, "wall": 38764.5} {"step": 8888, "train_loss": 3.5406112670898438, "lr": 0.0003402041323009168, "tps": 15024, "wall": 38772.2} {"step": 8889, "train_loss": 3.5366008281707764, "lr": 0.00034018987155275815, "tps": 15023, "wall": 38780.0} {"step": 8890, "train_loss": 3.6481435298919678, "lr": 0.00034017560944308217, "tps": 15022, "wall": 38787.8} {"step": 8891, "train_loss": 3.519500494003296, "lr": 0.0003401613459720504, "tps": 15020, "wall": 38795.5} {"step": 8892, "train_loss": 3.5963613986968994, "lr": 0.00034014708113982425, "tps": 15019, "wall": 38803.2} {"step": 8893, "train_loss": 3.5835890769958496, "lr": 0.0003401328149465656, "tps": 15018, "wall": 38811.1} {"step": 8894, "train_loss": 3.4906654357910156, "lr": 0.00034011854739243594, "tps": 15017, "wall": 38818.8} {"step": 8895, "train_loss": 3.6215128898620605, "lr": 0.00034010427847759687, "tps": 15015, "wall": 38826.5} {"step": 8896, "train_loss": 3.60895037651062, "lr": 0.00034009000820220994, "tps": 15014, "wall": 38834.2} {"step": 8897, "train_loss": 3.5569300651550293, "lr": 0.00034007573656643703, "tps": 15013, "wall": 38841.9} {"step": 8898, "train_loss": 3.6968495845794678, "lr": 0.00034006146357043953, "tps": 15011, "wall": 38849.8} {"step": 8899, "train_loss": 3.513737440109253, "lr": 0.0003400471892143794, "tps": 15010, "wall": 38857.5} {"step": 8900, "train_loss": 3.5373334884643555, "lr": 0.00034003291349841817, "tps": 15009, "wall": 38865.3} {"step": 8901, "train_loss": 3.5529983043670654, "lr": 0.00034001863642271757, "tps": 15007, "wall": 38873.1} {"step": 8902, "train_loss": 3.6064648628234863, "lr": 0.0003400043579874395, "tps": 15006, "wall": 38880.8} {"step": 8903, "train_loss": 3.551603317260742, "lr": 0.00033999007819274544, "tps": 15005, "wall": 38888.5} {"step": 8904, "train_loss": 3.5501246452331543, "lr": 0.0003399757970387973, "tps": 15003, "wall": 38896.3} {"step": 8905, "train_loss": 3.610424041748047, "lr": 0.00033996151452575686, "tps": 15002, "wall": 38904.0} {"step": 8906, "train_loss": 3.6162047386169434, "lr": 0.00033994723065378584, "tps": 15001, "wall": 38911.7} {"step": 8907, "train_loss": 3.4592132568359375, "lr": 0.0003399329454230462, "tps": 15000, "wall": 38919.5} {"step": 8908, "train_loss": 3.5895848274230957, "lr": 0.0003399186588336996, "tps": 14998, "wall": 38927.3} {"step": 8909, "train_loss": 3.5130670070648193, "lr": 0.000339904370885908, "tps": 14997, "wall": 38935.1} {"step": 8910, "train_loss": 3.4935593605041504, "lr": 0.0003398900815798331, "tps": 14996, "wall": 38942.7} {"step": 8911, "train_loss": 3.6112101078033447, "lr": 0.000339875790915637, "tps": 14994, "wall": 38950.6} {"step": 8912, "train_loss": 3.6352128982543945, "lr": 0.0003398614988934813, "tps": 14993, "wall": 38958.4} {"step": 8913, "train_loss": 3.559084415435791, "lr": 0.0003398472055135282, "tps": 14992, "wall": 38966.2} {"step": 8914, "train_loss": 3.5499911308288574, "lr": 0.0003398329107759394, "tps": 14990, "wall": 38973.9} {"step": 8915, "train_loss": 3.5476272106170654, "lr": 0.0003398186146808769, "tps": 14989, "wall": 38981.6} {"step": 8916, "train_loss": 3.504768133163452, "lr": 0.00033980431722850266, "tps": 14988, "wall": 38989.5} {"step": 8917, "train_loss": 3.5422263145446777, "lr": 0.0003397900184189786, "tps": 14986, "wall": 38997.2} {"step": 8918, "train_loss": 3.5698189735412598, "lr": 0.00033977571825246684, "tps": 14985, "wall": 39005.0} {"step": 8919, "train_loss": 3.575136184692383, "lr": 0.00033976141672912923, "tps": 14984, "wall": 39012.6} {"step": 8920, "train_loss": 3.5509190559387207, "lr": 0.0003397471138491277, "tps": 14983, "wall": 39020.4} {"step": 8921, "train_loss": 3.5252580642700195, "lr": 0.00033973280961262453, "tps": 14981, "wall": 39028.1} {"step": 8922, "train_loss": 3.5805206298828125, "lr": 0.00033971850401978156, "tps": 14980, "wall": 39035.8} {"step": 8923, "train_loss": 3.669419288635254, "lr": 0.0003397041970707609, "tps": 14979, "wall": 39043.5} {"step": 8924, "train_loss": 3.6001055240631104, "lr": 0.0003396898887657246, "tps": 14977, "wall": 39051.4} {"step": 8925, "train_loss": 3.5294785499572754, "lr": 0.0003396755791048348, "tps": 14976, "wall": 39059.2} {"step": 8926, "train_loss": 3.6869399547576904, "lr": 0.0003396612680882535, "tps": 14975, "wall": 39066.9} {"step": 8927, "train_loss": 3.7028965950012207, "lr": 0.0003396469557161429, "tps": 14974, "wall": 39074.7} {"step": 8928, "train_loss": 3.6232075691223145, "lr": 0.00033963264198866517, "tps": 14972, "wall": 39082.3} {"step": 8929, "train_loss": 3.688147783279419, "lr": 0.00033961832690598235, "tps": 14971, "wall": 39090.2} {"step": 8930, "train_loss": 3.568192958831787, "lr": 0.00033960401046825666, "tps": 14970, "wall": 39097.9} {"step": 8931, "train_loss": 3.5182299613952637, "lr": 0.0003395896926756503, "tps": 14968, "wall": 39105.8} {"step": 8932, "train_loss": 3.6306447982788086, "lr": 0.0003395753735283254, "tps": 14967, "wall": 39113.5} {"step": 8933, "train_loss": 3.4732775688171387, "lr": 0.0003395610530264442, "tps": 14966, "wall": 39121.2} {"step": 8934, "train_loss": 3.6298844814300537, "lr": 0.00033954673117016893, "tps": 14965, "wall": 39128.9} {"step": 8935, "train_loss": 3.550398111343384, "lr": 0.0003395324079596618, "tps": 14963, "wall": 39136.7} {"step": 8936, "train_loss": 3.5412189960479736, "lr": 0.00033951808339508513, "tps": 14962, "wall": 39144.4} {"step": 8937, "train_loss": 3.521923065185547, "lr": 0.00033950375747660114, "tps": 14961, "wall": 39152.1} {"step": 8938, "train_loss": 3.492248058319092, "lr": 0.0003394894302043721, "tps": 14959, "wall": 39159.8} {"step": 8939, "train_loss": 3.5908665657043457, "lr": 0.0003394751015785603, "tps": 14958, "wall": 39167.7} {"step": 8940, "train_loss": 3.522467851638794, "lr": 0.00033946077159932814, "tps": 14957, "wall": 39175.4} {"step": 8941, "train_loss": 3.5568764209747314, "lr": 0.0003394464402668379, "tps": 14956, "wall": 39183.1} {"step": 8942, "train_loss": 3.4966018199920654, "lr": 0.0003394321075812518, "tps": 14954, "wall": 39190.9} {"step": 8943, "train_loss": 3.581115245819092, "lr": 0.0003394177735427325, "tps": 14953, "wall": 39198.7} {"step": 8944, "train_loss": 3.5766990184783936, "lr": 0.00033940343815144205, "tps": 14952, "wall": 39206.5} {"step": 8945, "train_loss": 3.5784335136413574, "lr": 0.00033938910140754317, "tps": 14950, "wall": 39214.2} {"step": 8946, "train_loss": 3.671536922454834, "lr": 0.000339374763311198, "tps": 14949, "wall": 39221.9} {"step": 8947, "train_loss": 3.627532482147217, "lr": 0.000339360423862569, "tps": 14948, "wall": 39229.8} {"step": 8948, "train_loss": 3.586019992828369, "lr": 0.00033934608306181873, "tps": 14946, "wall": 39237.5} {"step": 8949, "train_loss": 3.5192675590515137, "lr": 0.0003393317409091095, "tps": 14945, "wall": 39245.3} {"step": 8950, "train_loss": 3.5303268432617188, "lr": 0.00033931739740460397, "tps": 14944, "wall": 39253.1} {"step": 8951, "train_loss": 3.5915884971618652, "lr": 0.00033930305254846433, "tps": 14943, "wall": 39260.9} {"step": 8952, "train_loss": 3.3663477897644043, "lr": 0.0003392887063408534, "tps": 14941, "wall": 39268.7} {"step": 8953, "train_loss": 3.5610523223876953, "lr": 0.00033927435878193356, "tps": 14940, "wall": 39276.4} {"step": 8954, "train_loss": 3.61716365814209, "lr": 0.0003392600098718673, "tps": 14939, "wall": 39284.2} {"step": 8955, "train_loss": 3.544222116470337, "lr": 0.00033924565961081715, "tps": 14937, "wall": 39292.0} {"step": 8956, "train_loss": 3.533045768737793, "lr": 0.0003392313079989457, "tps": 14936, "wall": 39299.9} {"step": 8957, "train_loss": 3.43996524810791, "lr": 0.0003392169550364156, "tps": 14935, "wall": 39307.7} {"step": 8958, "train_loss": 3.5148792266845703, "lr": 0.0003392026007233894, "tps": 14933, "wall": 39315.5} {"step": 8959, "train_loss": 3.5736947059631348, "lr": 0.00033918824506002965, "tps": 14932, "wall": 39323.3} {"step": 8960, "train_loss": 3.6013927459716797, "lr": 0.00033917388804649903, "tps": 14931, "wall": 39331.1} {"step": 8961, "train_loss": 3.5212583541870117, "lr": 0.0003391595296829602, "tps": 14930, "wall": 39338.8} {"step": 8962, "train_loss": 3.6370315551757812, "lr": 0.00033914516996957564, "tps": 14928, "wall": 39346.7} {"step": 8963, "train_loss": 3.5894765853881836, "lr": 0.0003391308089065083, "tps": 14927, "wall": 39354.5} {"step": 8964, "train_loss": 3.5520544052124023, "lr": 0.00033911644649392065, "tps": 14926, "wall": 39362.2} {"step": 8965, "train_loss": 3.572272777557373, "lr": 0.00033910208273197544, "tps": 14924, "wall": 39370.0} {"step": 8966, "train_loss": 3.5484676361083984, "lr": 0.0003390877176208354, "tps": 14923, "wall": 39377.7} {"step": 8967, "train_loss": 3.5931410789489746, "lr": 0.0003390733511606633, "tps": 14922, "wall": 39385.5} {"step": 8968, "train_loss": 3.5620012283325195, "lr": 0.0003390589833516218, "tps": 14921, "wall": 39393.4} {"step": 8969, "train_loss": 3.579090118408203, "lr": 0.00033904461419387365, "tps": 14919, "wall": 39401.1} {"step": 8970, "train_loss": 3.5913562774658203, "lr": 0.00033903024368758176, "tps": 14918, "wall": 39409.0} {"step": 8971, "train_loss": 3.5425002574920654, "lr": 0.00033901587183290873, "tps": 14917, "wall": 39416.7} {"step": 8972, "train_loss": 3.617537498474121, "lr": 0.00033900149863001755, "tps": 14915, "wall": 39424.5} {"step": 8973, "train_loss": 3.61151123046875, "lr": 0.0003389871240790709, "tps": 14914, "wall": 39432.2} {"step": 8974, "train_loss": 3.529653549194336, "lr": 0.0003389727481802317, "tps": 14913, "wall": 39440.0} {"step": 8975, "train_loss": 3.5579774379730225, "lr": 0.00033895837093366274, "tps": 14912, "wall": 39447.8} {"step": 8976, "train_loss": 3.5099306106567383, "lr": 0.000338943992339527, "tps": 14910, "wall": 39455.5} {"step": 8977, "train_loss": 3.404590368270874, "lr": 0.00033892961239798716, "tps": 14909, "wall": 39463.3} {"step": 8978, "train_loss": 3.4786510467529297, "lr": 0.00033891523110920633, "tps": 14908, "wall": 39471.1} {"step": 8979, "train_loss": 3.572664499282837, "lr": 0.00033890084847334724, "tps": 14907, "wall": 39479.0} {"step": 8980, "train_loss": 3.485609531402588, "lr": 0.000338886464490573, "tps": 14905, "wall": 39486.8} {"step": 8981, "train_loss": 3.5724358558654785, "lr": 0.00033887207916104636, "tps": 14904, "wall": 39494.6} {"step": 8982, "train_loss": 3.5956525802612305, "lr": 0.0003388576924849305, "tps": 14903, "wall": 39502.4} {"step": 8983, "train_loss": 3.5564448833465576, "lr": 0.00033884330446238816, "tps": 14901, "wall": 39510.2} {"step": 8984, "train_loss": 3.648365020751953, "lr": 0.0003388289150935825, "tps": 14900, "wall": 39518.0} {"step": 8985, "train_loss": 3.5831661224365234, "lr": 0.00033881452437867644, "tps": 14899, "wall": 39525.9} {"step": 8986, "train_loss": 3.6451120376586914, "lr": 0.00033880013231783306, "tps": 14898, "wall": 39533.6} {"step": 8987, "train_loss": 3.5525593757629395, "lr": 0.00033878573891121534, "tps": 14896, "wall": 39541.4} {"step": 8988, "train_loss": 3.6468372344970703, "lr": 0.0003387713441589863, "tps": 14895, "wall": 39549.1} {"step": 8989, "train_loss": 3.5721242427825928, "lr": 0.00033875694806130904, "tps": 14894, "wall": 39556.9} {"step": 8990, "train_loss": 3.5325958728790283, "lr": 0.00033874255061834666, "tps": 14892, "wall": 39564.7} {"step": 8991, "train_loss": 3.5223946571350098, "lr": 0.00033872815183026234, "tps": 14891, "wall": 39572.5} {"step": 8992, "train_loss": 3.5993998050689697, "lr": 0.000338713751697219, "tps": 14890, "wall": 39580.2} {"step": 8993, "train_loss": 3.491588592529297, "lr": 0.00033869935021937984, "tps": 14889, "wall": 39588.0} {"step": 8994, "train_loss": 3.4032506942749023, "lr": 0.00033868494739690806, "tps": 14887, "wall": 39595.8} {"step": 8995, "train_loss": 3.503275156021118, "lr": 0.0003386705432299667, "tps": 14886, "wall": 39603.5} {"step": 8996, "train_loss": 3.6516335010528564, "lr": 0.00033865613771871914, "tps": 14885, "wall": 39611.3} {"step": 8997, "train_loss": 3.6491363048553467, "lr": 0.0003386417308633284, "tps": 14884, "wall": 39619.1} {"step": 8998, "train_loss": 3.500555992126465, "lr": 0.00033862732266395765, "tps": 14882, "wall": 39626.9} {"step": 8999, "train_loss": 3.568324089050293, "lr": 0.0003386129131207702, "tps": 14881, "wall": 39634.8} {"step": 9000, "train_loss": 3.58052396774292, "lr": 0.00033859850223392926, "tps": 14880, "wall": 39642.6, "val_loss_monitor": 3.5872377041296435} {"step": 9001, "train_loss": 3.630016565322876, "lr": 0.0003385840900035981, "tps": 14860, "wall": 39699.7} {"step": 9002, "train_loss": 3.5731916427612305, "lr": 0.0003385696764299399, "tps": 14859, "wall": 39707.7} {"step": 9003, "train_loss": 3.6295371055603027, "lr": 0.000338555261513118, "tps": 14857, "wall": 39715.6} {"step": 9004, "train_loss": 3.5060875415802, "lr": 0.0003385408452532957, "tps": 14856, "wall": 39723.7} {"step": 9005, "train_loss": 3.660015106201172, "lr": 0.0003385264276506363, "tps": 14855, "wall": 39731.8} {"step": 9006, "train_loss": 3.625647783279419, "lr": 0.00033851200870530315, "tps": 14853, "wall": 39739.9} {"step": 9007, "train_loss": 3.479015827178955, "lr": 0.00033849758841745945, "tps": 14852, "wall": 39748.0} {"step": 9008, "train_loss": 3.556262731552124, "lr": 0.00033848316678726867, "tps": 14850, "wall": 39755.9} {"step": 9009, "train_loss": 3.4784626960754395, "lr": 0.00033846874381489425, "tps": 14849, "wall": 39763.8} {"step": 9010, "train_loss": 3.589855670928955, "lr": 0.00033845431950049943, "tps": 14848, "wall": 39771.8} {"step": 9011, "train_loss": 3.586242437362671, "lr": 0.0003384398938442477, "tps": 14846, "wall": 39779.9} {"step": 9012, "train_loss": 3.646307945251465, "lr": 0.00033842546684630245, "tps": 14845, "wall": 39787.7} {"step": 9013, "train_loss": 3.585827350616455, "lr": 0.00033841103850682706, "tps": 14844, "wall": 39795.7} {"step": 9014, "train_loss": 3.540289878845215, "lr": 0.0003383966088259851, "tps": 14843, "wall": 39803.6} {"step": 9015, "train_loss": 3.4956984519958496, "lr": 0.00033838217780393984, "tps": 14841, "wall": 39811.6} {"step": 9016, "train_loss": 3.5194058418273926, "lr": 0.000338367745440855, "tps": 14840, "wall": 39819.5} {"step": 9017, "train_loss": 3.5080504417419434, "lr": 0.00033835331173689384, "tps": 14839, "wall": 39827.5} {"step": 9018, "train_loss": 3.479520320892334, "lr": 0.00033833887669222, "tps": 14837, "wall": 39835.4} {"step": 9019, "train_loss": 3.5705342292785645, "lr": 0.0003383244403069969, "tps": 14836, "wall": 39843.3} {"step": 9020, "train_loss": 3.5986599922180176, "lr": 0.00033831000258138815, "tps": 14835, "wall": 39851.2} {"step": 9021, "train_loss": 3.5582427978515625, "lr": 0.0003382955635155574, "tps": 14833, "wall": 39859.1} {"step": 9022, "train_loss": 3.602834939956665, "lr": 0.000338281123109668, "tps": 14832, "wall": 39867.0} {"step": 9023, "train_loss": 3.570089817047119, "lr": 0.0003382666813638837, "tps": 14831, "wall": 39874.9} {"step": 9024, "train_loss": 3.4890060424804688, "lr": 0.000338252238278368, "tps": 14829, "wall": 39882.9} {"step": 9025, "train_loss": 3.553558349609375, "lr": 0.0003382377938532845, "tps": 14828, "wall": 39890.8} {"step": 9026, "train_loss": 3.5607526302337646, "lr": 0.000338223348088797, "tps": 14827, "wall": 39898.7} {"step": 9027, "train_loss": 3.4473485946655273, "lr": 0.0003382089009850689, "tps": 14826, "wall": 39906.5} {"step": 9028, "train_loss": 3.6098828315734863, "lr": 0.0003381944525422641, "tps": 14824, "wall": 39914.5} {"step": 9029, "train_loss": 3.568965435028076, "lr": 0.000338180002760546, "tps": 14823, "wall": 39922.2} {"step": 9030, "train_loss": 3.560971975326538, "lr": 0.00033816555164007853, "tps": 14822, "wall": 39930.1} {"step": 9031, "train_loss": 3.5101053714752197, "lr": 0.0003381510991810253, "tps": 14821, "wall": 39938.0} {"step": 9032, "train_loss": 3.6439123153686523, "lr": 0.00033813664538355, "tps": 14819, "wall": 39945.9} {"step": 9033, "train_loss": 3.5985631942749023, "lr": 0.00033812219024781636, "tps": 14818, "wall": 39953.7} {"step": 9034, "train_loss": 3.5610008239746094, "lr": 0.00033810773377398817, "tps": 14817, "wall": 39961.5} {"step": 9035, "train_loss": 3.5605523586273193, "lr": 0.0003380932759622292, "tps": 14815, "wall": 39969.2} {"step": 9036, "train_loss": 3.44844126701355, "lr": 0.00033807881681270326, "tps": 14814, "wall": 39977.2} {"step": 9037, "train_loss": 3.5043137073516846, "lr": 0.000338064356325574, "tps": 14813, "wall": 39985.0} {"step": 9038, "train_loss": 3.516439437866211, "lr": 0.0003380498945010053, "tps": 14811, "wall": 39994.0} {"step": 9039, "train_loss": 3.541022300720215, "lr": 0.0003380354313391611, "tps": 14810, "wall": 40002.2} {"step": 9040, "train_loss": 3.5602173805236816, "lr": 0.0003380209668402052, "tps": 14809, "wall": 40010.1} {"step": 9041, "train_loss": 3.5940918922424316, "lr": 0.0003380065010043013, "tps": 14807, "wall": 40018.1} {"step": 9042, "train_loss": 3.5469584465026855, "lr": 0.0003379920338316134, "tps": 14806, "wall": 40025.8} {"step": 9043, "train_loss": 3.56768798828125, "lr": 0.00033797756532230535, "tps": 14805, "wall": 40033.6} {"step": 9044, "train_loss": 3.525686264038086, "lr": 0.00033796309547654105, "tps": 14804, "wall": 40041.3} {"step": 9045, "train_loss": 3.6356048583984375, "lr": 0.00033794862429448446, "tps": 14802, "wall": 40049.1} {"step": 9046, "train_loss": 3.458463668823242, "lr": 0.00033793415177629945, "tps": 14801, "wall": 40057.0} {"step": 9047, "train_loss": 3.530978202819824, "lr": 0.00033791967792215, "tps": 14800, "wall": 40064.9} {"step": 9048, "train_loss": 3.4385998249053955, "lr": 0.0003379052027322001, "tps": 14799, "wall": 40072.6} {"step": 9049, "train_loss": 3.543959140777588, "lr": 0.0003378907262066136, "tps": 14797, "wall": 40080.4} {"step": 9050, "train_loss": 3.7177743911743164, "lr": 0.0003378762483455546, "tps": 14796, "wall": 40088.2} {"step": 9051, "train_loss": 3.515374183654785, "lr": 0.0003378617691491871, "tps": 14795, "wall": 40096.1} {"step": 9052, "train_loss": 3.5854482650756836, "lr": 0.00033784728861767507, "tps": 14794, "wall": 40103.9} {"step": 9053, "train_loss": 3.575593948364258, "lr": 0.0003378328067511826, "tps": 14792, "wall": 40111.8} {"step": 9054, "train_loss": 3.489912509918213, "lr": 0.0003378183235498738, "tps": 14791, "wall": 40119.8} {"step": 9055, "train_loss": 3.630359649658203, "lr": 0.00033780383901391256, "tps": 14790, "wall": 40127.7} {"step": 9056, "train_loss": 3.5438222885131836, "lr": 0.0003377893531434631, "tps": 14788, "wall": 40135.5} {"step": 9057, "train_loss": 3.574479103088379, "lr": 0.0003377748659386894, "tps": 14787, "wall": 40143.4} {"step": 9058, "train_loss": 3.5586042404174805, "lr": 0.00033776037739975575, "tps": 14786, "wall": 40151.1} {"step": 9059, "train_loss": 3.778409481048584, "lr": 0.0003377458875268261, "tps": 14785, "wall": 40159.0} {"step": 9060, "train_loss": 3.5433902740478516, "lr": 0.0003377313963200647, "tps": 14783, "wall": 40166.8} {"step": 9061, "train_loss": 3.592379570007324, "lr": 0.00033771690377963566, "tps": 14782, "wall": 40174.7} {"step": 9062, "train_loss": 3.6220693588256836, "lr": 0.0003377024099057032, "tps": 14781, "wall": 40182.6} {"step": 9063, "train_loss": 3.489630937576294, "lr": 0.00033768791469843145, "tps": 14780, "wall": 40190.5} {"step": 9064, "train_loss": 3.5021800994873047, "lr": 0.0003376734181579846, "tps": 14778, "wall": 40198.3} {"step": 9065, "train_loss": 3.613398313522339, "lr": 0.000337658920284527, "tps": 14777, "wall": 40206.2} {"step": 9066, "train_loss": 3.6143553256988525, "lr": 0.00033764442107822265, "tps": 14776, "wall": 40213.9} {"step": 9067, "train_loss": 3.5785770416259766, "lr": 0.0003376299205392361, "tps": 14775, "wall": 40221.8} {"step": 9068, "train_loss": 3.6425700187683105, "lr": 0.0003376154186677313, "tps": 14773, "wall": 40229.8} {"step": 9069, "train_loss": 3.5163300037384033, "lr": 0.0003376009154638727, "tps": 14772, "wall": 40237.5} {"step": 9070, "train_loss": 3.546579599380493, "lr": 0.0003375864109278246, "tps": 14771, "wall": 40245.5} {"step": 9071, "train_loss": 3.4808690547943115, "lr": 0.00033757190505975126, "tps": 14770, "wall": 40253.3} {"step": 9072, "train_loss": 3.546156883239746, "lr": 0.0003375573978598171, "tps": 14768, "wall": 40261.3} {"step": 9073, "train_loss": 3.5454118251800537, "lr": 0.0003375428893281862, "tps": 14767, "wall": 40269.2} {"step": 9074, "train_loss": 3.5756521224975586, "lr": 0.00033752837946502323, "tps": 14766, "wall": 40277.0} {"step": 9075, "train_loss": 3.5083343982696533, "lr": 0.0003375138682704924, "tps": 14765, "wall": 40284.8} {"step": 9076, "train_loss": 3.613985061645508, "lr": 0.0003374993557447581, "tps": 14763, "wall": 40292.7} {"step": 9077, "train_loss": 3.5934393405914307, "lr": 0.00033748484188798476, "tps": 14762, "wall": 40300.5} {"step": 9078, "train_loss": 3.540337562561035, "lr": 0.00033747032670033674, "tps": 14761, "wall": 40308.5} {"step": 9079, "train_loss": 3.5873918533325195, "lr": 0.00033745581018197854, "tps": 14759, "wall": 40316.4} {"step": 9080, "train_loss": 3.5022802352905273, "lr": 0.00033744129233307453, "tps": 14758, "wall": 40324.2} {"step": 9081, "train_loss": 3.6163153648376465, "lr": 0.00033742677315378925, "tps": 14757, "wall": 40332.0} {"step": 9082, "train_loss": 3.6139373779296875, "lr": 0.00033741225264428704, "tps": 14756, "wall": 40339.8} {"step": 9083, "train_loss": 3.482114791870117, "lr": 0.00033739773080473256, "tps": 14754, "wall": 40347.6} {"step": 9084, "train_loss": 3.4113173484802246, "lr": 0.0003373832076352902, "tps": 14753, "wall": 40355.6} {"step": 9085, "train_loss": 3.642613410949707, "lr": 0.00033736868313612455, "tps": 14752, "wall": 40363.4} {"step": 9086, "train_loss": 3.5988569259643555, "lr": 0.0003373541573074001, "tps": 14751, "wall": 40371.3} {"step": 9087, "train_loss": 3.527621269226074, "lr": 0.00033733963014928136, "tps": 14749, "wall": 40379.1} {"step": 9088, "train_loss": 3.4938206672668457, "lr": 0.00033732510166193297, "tps": 14748, "wall": 40387.0} {"step": 9089, "train_loss": 3.5044491291046143, "lr": 0.0003373105718455195, "tps": 14747, "wall": 40394.8} {"step": 9090, "train_loss": 3.5361318588256836, "lr": 0.0003372960407002055, "tps": 14746, "wall": 40402.6} {"step": 9091, "train_loss": 3.5453245639801025, "lr": 0.0003372815082261557, "tps": 14745, "wall": 40410.4} {"step": 9092, "train_loss": 3.514288902282715, "lr": 0.0003372669744235345, "tps": 14743, "wall": 40418.4} {"step": 9093, "train_loss": 3.5163512229919434, "lr": 0.00033725243929250674, "tps": 14742, "wall": 40426.3} {"step": 9094, "train_loss": 3.5985827445983887, "lr": 0.000337237902833237, "tps": 14741, "wall": 40434.2} {"step": 9095, "train_loss": 3.5107834339141846, "lr": 0.00033722336504588994, "tps": 14740, "wall": 40442.0} {"step": 9096, "train_loss": 3.6373603343963623, "lr": 0.0003372088259306303, "tps": 14738, "wall": 40449.8} {"step": 9097, "train_loss": 3.488259792327881, "lr": 0.00033719428548762266, "tps": 14737, "wall": 40457.5} {"step": 9098, "train_loss": 3.5375988483428955, "lr": 0.00033717974371703187, "tps": 14736, "wall": 40465.4} {"step": 9099, "train_loss": 3.5811400413513184, "lr": 0.00033716520061902254, "tps": 14735, "wall": 40473.3} {"step": 9100, "train_loss": 3.5423378944396973, "lr": 0.0003371506561937595, "tps": 14733, "wall": 40481.1} {"step": 9101, "train_loss": 3.4870970249176025, "lr": 0.00033713611044140757, "tps": 14732, "wall": 40489.0} {"step": 9102, "train_loss": 3.5939929485321045, "lr": 0.00033712156336213137, "tps": 14731, "wall": 40496.8} {"step": 9103, "train_loss": 3.6170411109924316, "lr": 0.0003371070149560958, "tps": 14730, "wall": 40504.6} {"step": 9104, "train_loss": 3.4239697456359863, "lr": 0.0003370924652234656, "tps": 14728, "wall": 40512.3} {"step": 9105, "train_loss": 3.5403008460998535, "lr": 0.00033707791416440566, "tps": 14727, "wall": 40520.2} {"step": 9106, "train_loss": 3.535291910171509, "lr": 0.0003370633617790807, "tps": 14726, "wall": 40528.1} {"step": 9107, "train_loss": 3.5080695152282715, "lr": 0.0003370488080676557, "tps": 14725, "wall": 40536.1} {"step": 9108, "train_loss": 3.6305389404296875, "lr": 0.0003370342530302955, "tps": 14723, "wall": 40543.9} {"step": 9109, "train_loss": 3.616778612136841, "lr": 0.00033701969666716485, "tps": 14722, "wall": 40551.8} {"step": 9110, "train_loss": 3.630321741104126, "lr": 0.00033700513897842884, "tps": 14721, "wall": 40559.6} {"step": 9111, "train_loss": 3.6492373943328857, "lr": 0.00033699057996425225, "tps": 14720, "wall": 40567.3} {"step": 9112, "train_loss": 3.5165176391601562, "lr": 0.0003369760196248, "tps": 14719, "wall": 40575.3} {"step": 9113, "train_loss": 3.584472179412842, "lr": 0.00033696145796023716, "tps": 14717, "wall": 40583.2} {"step": 9114, "train_loss": 3.6018853187561035, "lr": 0.0003369468949707285, "tps": 14716, "wall": 40591.0} {"step": 9115, "train_loss": 3.649106502532959, "lr": 0.0003369323306564392, "tps": 14715, "wall": 40598.9} {"step": 9116, "train_loss": 3.462825059890747, "lr": 0.000336917765017534, "tps": 14714, "wall": 40606.7} {"step": 9117, "train_loss": 3.552766799926758, "lr": 0.00033690319805417814, "tps": 14712, "wall": 40614.6} {"step": 9118, "train_loss": 3.532231330871582, "lr": 0.00033688862976653653, "tps": 14711, "wall": 40622.5} {"step": 9119, "train_loss": 3.5304551124572754, "lr": 0.0003368740601547741, "tps": 14710, "wall": 40630.3} {"step": 9120, "train_loss": 3.506946563720703, "lr": 0.0003368594892190561, "tps": 14709, "wall": 40638.2} {"step": 9121, "train_loss": 3.4831106662750244, "lr": 0.00033684491695954745, "tps": 14707, "wall": 40646.0} {"step": 9122, "train_loss": 3.606290578842163, "lr": 0.0003368303433764132, "tps": 14706, "wall": 40653.8} {"step": 9123, "train_loss": 3.4790544509887695, "lr": 0.00033681576846981856, "tps": 14705, "wall": 40661.6} {"step": 9124, "train_loss": 3.6091911792755127, "lr": 0.0003368011922399286, "tps": 14704, "wall": 40669.5} {"step": 9125, "train_loss": 3.514352321624756, "lr": 0.0003367866146869083, "tps": 14703, "wall": 40677.3} {"step": 9126, "train_loss": 3.407431125640869, "lr": 0.000336772035810923, "tps": 14701, "wall": 40685.2} {"step": 9127, "train_loss": 3.5137405395507812, "lr": 0.0003367574556121378, "tps": 14700, "wall": 40693.0} {"step": 9128, "train_loss": 3.5066208839416504, "lr": 0.00033674287409071773, "tps": 14699, "wall": 40700.9} {"step": 9129, "train_loss": 3.6067535877227783, "lr": 0.00033672829124682815, "tps": 14698, "wall": 40708.8} {"step": 9130, "train_loss": 3.5692005157470703, "lr": 0.0003367137070806341, "tps": 14696, "wall": 40716.6} {"step": 9131, "train_loss": 3.5900487899780273, "lr": 0.0003366991215923009, "tps": 14695, "wall": 40724.3} {"step": 9132, "train_loss": 3.7884130477905273, "lr": 0.00033668453478199377, "tps": 14694, "wall": 40732.2} {"step": 9133, "train_loss": 3.5253281593322754, "lr": 0.00033666994664987784, "tps": 14693, "wall": 40740.1} {"step": 9134, "train_loss": 3.5979673862457275, "lr": 0.0003366553571961185, "tps": 14692, "wall": 40748.0} {"step": 9135, "train_loss": 3.4732248783111572, "lr": 0.00033664076642088095, "tps": 14690, "wall": 40755.8} {"step": 9136, "train_loss": 3.516785144805908, "lr": 0.00033662617432433044, "tps": 14689, "wall": 40763.7} {"step": 9137, "train_loss": 3.572160243988037, "lr": 0.00033661158090663243, "tps": 14688, "wall": 40771.4} {"step": 9138, "train_loss": 3.558849811553955, "lr": 0.00033659698616795203, "tps": 14687, "wall": 40779.2} {"step": 9139, "train_loss": 3.442762851715088, "lr": 0.00033658239010845475, "tps": 14686, "wall": 40787.0} {"step": 9140, "train_loss": 3.545450448989868, "lr": 0.00033656779272830576, "tps": 14684, "wall": 40794.9} {"step": 9141, "train_loss": 3.5345489978790283, "lr": 0.0003365531940276705, "tps": 14683, "wall": 40802.7} {"step": 9142, "train_loss": 3.5492782592773438, "lr": 0.00033653859400671436, "tps": 14682, "wall": 40810.4} {"step": 9143, "train_loss": 3.635436534881592, "lr": 0.0003365239926656028, "tps": 14681, "wall": 40818.2} {"step": 9144, "train_loss": 3.39925479888916, "lr": 0.00033650939000450105, "tps": 14680, "wall": 40826.0} {"step": 9145, "train_loss": 3.6942341327667236, "lr": 0.0003364947860235747, "tps": 14678, "wall": 40833.8} {"step": 9146, "train_loss": 3.4551548957824707, "lr": 0.0003364801807229891, "tps": 14677, "wall": 40841.5} {"step": 9147, "train_loss": 3.4898459911346436, "lr": 0.0003364655741029097, "tps": 14676, "wall": 40849.4} {"step": 9148, "train_loss": 3.581190586090088, "lr": 0.0003364509661635019, "tps": 14675, "wall": 40857.3} {"step": 9149, "train_loss": 3.554008722305298, "lr": 0.0003364363569049314, "tps": 14674, "wall": 40865.0} {"step": 9150, "train_loss": 3.5213356018066406, "lr": 0.00033642174632736346, "tps": 14672, "wall": 40872.8} {"step": 9151, "train_loss": 3.611649751663208, "lr": 0.00033640713443096364, "tps": 14671, "wall": 40880.6} {"step": 9152, "train_loss": 3.472729206085205, "lr": 0.0003363925212158976, "tps": 14670, "wall": 40888.4} {"step": 9153, "train_loss": 3.6358282566070557, "lr": 0.00033637790668233073, "tps": 14669, "wall": 40896.3} {"step": 9154, "train_loss": 3.6045727729797363, "lr": 0.0003363632908304287, "tps": 14668, "wall": 40904.1} {"step": 9155, "train_loss": 3.6154189109802246, "lr": 0.0003363486736603569, "tps": 14666, "wall": 40912.0} {"step": 9156, "train_loss": 3.4913175106048584, "lr": 0.0003363340551722811, "tps": 14665, "wall": 40919.9} {"step": 9157, "train_loss": 3.626075029373169, "lr": 0.00033631943536636684, "tps": 14664, "wall": 40927.6} {"step": 9158, "train_loss": 3.5988268852233887, "lr": 0.00033630481424277975, "tps": 14663, "wall": 40935.5} {"step": 9159, "train_loss": 3.6016616821289062, "lr": 0.0003362901918016854, "tps": 14662, "wall": 40943.2} {"step": 9160, "train_loss": 3.4976048469543457, "lr": 0.00033627556804324946, "tps": 14660, "wall": 40951.0} {"step": 9161, "train_loss": 3.494441032409668, "lr": 0.0003362609429676375, "tps": 14659, "wall": 40958.8} {"step": 9162, "train_loss": 3.4924566745758057, "lr": 0.0003362463165750154, "tps": 14658, "wall": 40966.7} {"step": 9163, "train_loss": 3.466852903366089, "lr": 0.00033623168886554874, "tps": 14657, "wall": 40974.5} {"step": 9164, "train_loss": 3.541376829147339, "lr": 0.0003362170598394032, "tps": 14656, "wall": 40982.3} {"step": 9165, "train_loss": 3.534275531768799, "lr": 0.0003362024294967445, "tps": 14654, "wall": 40990.1} {"step": 9166, "train_loss": 3.5622920989990234, "lr": 0.0003361877978377385, "tps": 14653, "wall": 40997.9} {"step": 9167, "train_loss": 3.4446194171905518, "lr": 0.00033617316486255064, "tps": 14652, "wall": 41005.8} {"step": 9168, "train_loss": 3.56484055519104, "lr": 0.00033615853057134703, "tps": 14651, "wall": 41013.5} {"step": 9169, "train_loss": 3.4324545860290527, "lr": 0.00033614389496429333, "tps": 14650, "wall": 41021.4} {"step": 9170, "train_loss": 3.4997682571411133, "lr": 0.00033612925804155514, "tps": 14648, "wall": 41029.2} {"step": 9171, "train_loss": 3.584294319152832, "lr": 0.00033611461980329857, "tps": 14647, "wall": 41037.1} {"step": 9172, "train_loss": 3.535191297531128, "lr": 0.0003360999802496893, "tps": 14646, "wall": 41044.8} {"step": 9173, "train_loss": 3.53873348236084, "lr": 0.0003360853393808931, "tps": 14645, "wall": 41052.7} {"step": 9174, "train_loss": 3.5609312057495117, "lr": 0.00033607069719707595, "tps": 14644, "wall": 41060.5} {"step": 9175, "train_loss": 3.616776466369629, "lr": 0.00033605605369840363, "tps": 14642, "wall": 41068.3} {"step": 9176, "train_loss": 3.5906641483306885, "lr": 0.0003360414088850421, "tps": 14641, "wall": 41076.1} {"step": 9177, "train_loss": 3.5977838039398193, "lr": 0.00033602676275715714, "tps": 14640, "wall": 41083.9} {"step": 9178, "train_loss": 3.4430041313171387, "lr": 0.0003360121153149148, "tps": 14639, "wall": 41091.8} {"step": 9179, "train_loss": 3.695669174194336, "lr": 0.00033599746655848097, "tps": 14638, "wall": 41099.6} {"step": 9180, "train_loss": 3.573892116546631, "lr": 0.0003359828164880215, "tps": 14636, "wall": 41107.3} {"step": 9181, "train_loss": 3.5430376529693604, "lr": 0.00033596816510370243, "tps": 14635, "wall": 41115.1} {"step": 9182, "train_loss": 3.6044106483459473, "lr": 0.0003359535124056897, "tps": 14634, "wall": 41122.9} {"step": 9183, "train_loss": 3.5388898849487305, "lr": 0.0003359388583941493, "tps": 14633, "wall": 41130.8} {"step": 9184, "train_loss": 3.5234439373016357, "lr": 0.0003359242030692472, "tps": 14632, "wall": 41138.6} {"step": 9185, "train_loss": 3.5441155433654785, "lr": 0.0003359095464311496, "tps": 14630, "wall": 41146.6} {"step": 9186, "train_loss": 3.5140674114227295, "lr": 0.0003358948884800223, "tps": 14629, "wall": 41154.4} {"step": 9187, "train_loss": 3.5884532928466797, "lr": 0.0003358802292160314, "tps": 14628, "wall": 41162.0} {"step": 9188, "train_loss": 3.4903342723846436, "lr": 0.00033586556863934305, "tps": 14627, "wall": 41169.9} {"step": 9189, "train_loss": 3.5116875171661377, "lr": 0.00033585090675012323, "tps": 14626, "wall": 41177.8} {"step": 9190, "train_loss": 3.551973819732666, "lr": 0.0003358362435485381, "tps": 14625, "wall": 41185.6} {"step": 9191, "train_loss": 3.512908458709717, "lr": 0.00033582157903475367, "tps": 14623, "wall": 41193.3} {"step": 9192, "train_loss": 3.5438265800476074, "lr": 0.0003358069132089362, "tps": 14622, "wall": 41201.2} {"step": 9193, "train_loss": 3.6075353622436523, "lr": 0.00033579224607125177, "tps": 14621, "wall": 41209.1} {"step": 9194, "train_loss": 3.517014265060425, "lr": 0.00033577757762186646, "tps": 14620, "wall": 41216.9} {"step": 9195, "train_loss": 3.4977827072143555, "lr": 0.0003357629078609465, "tps": 14619, "wall": 41224.6} {"step": 9196, "train_loss": 3.5603976249694824, "lr": 0.00033574823678865804, "tps": 14617, "wall": 41232.5} {"step": 9197, "train_loss": 3.5640153884887695, "lr": 0.00033573356440516736, "tps": 14616, "wall": 41240.3} {"step": 9198, "train_loss": 3.6830646991729736, "lr": 0.0003357188907106405, "tps": 14615, "wall": 41248.1} {"step": 9199, "train_loss": 3.648401975631714, "lr": 0.0003357042157052439, "tps": 14614, "wall": 41255.8} {"step": 9200, "train_loss": 3.619354724884033, "lr": 0.00033568953938914356, "tps": 14613, "wall": 41263.7} {"step": 9201, "train_loss": 3.5159354209899902, "lr": 0.00033567486176250597, "tps": 14612, "wall": 41271.5} {"step": 9202, "train_loss": 3.602356433868408, "lr": 0.00033566018282549725, "tps": 14610, "wall": 41279.4} {"step": 9203, "train_loss": 3.4469335079193115, "lr": 0.0003356455025782837, "tps": 14609, "wall": 41287.2} {"step": 9204, "train_loss": 3.52201509475708, "lr": 0.00033563082102103166, "tps": 14608, "wall": 41295.1} {"step": 9205, "train_loss": 3.6843421459198, "lr": 0.0003356161381539074, "tps": 14607, "wall": 41302.8} {"step": 9206, "train_loss": 3.498202085494995, "lr": 0.0003356014539770773, "tps": 14606, "wall": 41310.6} {"step": 9207, "train_loss": 3.6909193992614746, "lr": 0.00033558676849070767, "tps": 14605, "wall": 41318.4} {"step": 9208, "train_loss": 3.5376999378204346, "lr": 0.0003355720816949649, "tps": 14603, "wall": 41326.2} {"step": 9209, "train_loss": 3.5394225120544434, "lr": 0.0003355573935900153, "tps": 14602, "wall": 41334.0} {"step": 9210, "train_loss": 3.5521233081817627, "lr": 0.0003355427041760253, "tps": 14601, "wall": 41341.9} {"step": 9211, "train_loss": 3.5586020946502686, "lr": 0.00033552801345316125, "tps": 14600, "wall": 41349.6} {"step": 9212, "train_loss": 3.5600876808166504, "lr": 0.00033551332142158966, "tps": 14599, "wall": 41357.7} {"step": 9213, "train_loss": 3.5025877952575684, "lr": 0.0003354986280814769, "tps": 14597, "wall": 41365.4} {"step": 9214, "train_loss": 3.5352399349212646, "lr": 0.00033548393343298946, "tps": 14596, "wall": 41373.2} {"step": 9215, "train_loss": 3.5971596240997314, "lr": 0.00033546923747629375, "tps": 14595, "wall": 41380.9} {"step": 9216, "train_loss": 3.6176135540008545, "lr": 0.0003354545402115563, "tps": 14594, "wall": 41388.8} {"step": 9217, "train_loss": 3.5672080516815186, "lr": 0.0003354398416389436, "tps": 14593, "wall": 41396.7} {"step": 9218, "train_loss": 3.545207977294922, "lr": 0.0003354251417586221, "tps": 14592, "wall": 41404.5} {"step": 9219, "train_loss": 3.54617977142334, "lr": 0.0003354104405707583, "tps": 14590, "wall": 41412.3} {"step": 9220, "train_loss": 3.542015552520752, "lr": 0.00033539573807551883, "tps": 14589, "wall": 41420.1} {"step": 9221, "train_loss": 3.5691676139831543, "lr": 0.00033538103427307016, "tps": 14588, "wall": 41427.9} {"step": 9222, "train_loss": 3.537964105606079, "lr": 0.0003353663291635789, "tps": 14587, "wall": 41435.8} {"step": 9223, "train_loss": 3.6671314239501953, "lr": 0.0003353516227472117, "tps": 14586, "wall": 41443.6} {"step": 9224, "train_loss": 3.5640366077423096, "lr": 0.000335336915024135, "tps": 14585, "wall": 41451.5} {"step": 9225, "train_loss": 3.387153387069702, "lr": 0.0003353222059945155, "tps": 14583, "wall": 41459.4} {"step": 9226, "train_loss": 3.578531503677368, "lr": 0.0003353074956585199, "tps": 14582, "wall": 41467.1} {"step": 9227, "train_loss": 3.7210092544555664, "lr": 0.0003352927840163146, "tps": 14581, "wall": 41475.1} {"step": 9228, "train_loss": 3.4842584133148193, "lr": 0.00033527807106806647, "tps": 14580, "wall": 41483.0} {"step": 9229, "train_loss": 3.517831802368164, "lr": 0.00033526335681394214, "tps": 14579, "wall": 41490.9} {"step": 9230, "train_loss": 3.5025134086608887, "lr": 0.0003352486412541082, "tps": 14577, "wall": 41498.7} {"step": 9231, "train_loss": 3.4410738945007324, "lr": 0.0003352339243887315, "tps": 14576, "wall": 41506.6} {"step": 9232, "train_loss": 3.5855050086975098, "lr": 0.0003352192062179786, "tps": 14575, "wall": 41514.4} {"step": 9233, "train_loss": 3.5684585571289062, "lr": 0.00033520448674201635, "tps": 14574, "wall": 41522.3} {"step": 9234, "train_loss": 3.54278564453125, "lr": 0.0003351897659610114, "tps": 14573, "wall": 41529.9} {"step": 9235, "train_loss": 3.6062870025634766, "lr": 0.00033517504387513064, "tps": 14572, "wall": 41537.8} {"step": 9236, "train_loss": 3.533919334411621, "lr": 0.00033516032048454064, "tps": 14570, "wall": 41545.7} {"step": 9237, "train_loss": 3.5211985111236572, "lr": 0.00033514559578940833, "tps": 14569, "wall": 41553.5} {"step": 9238, "train_loss": 3.544936180114746, "lr": 0.0003351308697899005, "tps": 14568, "wall": 41561.3} {"step": 9239, "train_loss": 3.5629031658172607, "lr": 0.0003351161424861839, "tps": 14567, "wall": 41569.2} {"step": 9240, "train_loss": 3.5314626693725586, "lr": 0.0003351014138784255, "tps": 14566, "wall": 41577.1} {"step": 9241, "train_loss": 3.5291707515716553, "lr": 0.000335086683966792, "tps": 14565, "wall": 41584.8} {"step": 9242, "train_loss": 3.547861337661743, "lr": 0.0003350719527514503, "tps": 14563, "wall": 41592.5} {"step": 9243, "train_loss": 3.5305840969085693, "lr": 0.00033505722023256736, "tps": 14562, "wall": 41600.3} {"step": 9244, "train_loss": 3.608630418777466, "lr": 0.00033504248641031, "tps": 14561, "wall": 41608.2} {"step": 9245, "train_loss": 3.5585508346557617, "lr": 0.00033502775128484505, "tps": 14560, "wall": 41616.0} {"step": 9246, "train_loss": 3.532857656478882, "lr": 0.00033501301485633963, "tps": 14559, "wall": 41623.7} {"step": 9247, "train_loss": 3.570739269256592, "lr": 0.00033499827712496044, "tps": 14558, "wall": 41631.5} {"step": 9248, "train_loss": 3.6633288860321045, "lr": 0.00033498353809087455, "tps": 14556, "wall": 41639.5} {"step": 9249, "train_loss": 3.565530776977539, "lr": 0.000334968797754249, "tps": 14555, "wall": 41647.1} {"step": 9250, "train_loss": 3.591759204864502, "lr": 0.0003349540561152506, "tps": 14554, "wall": 41654.9} {"step": 9251, "train_loss": 3.480543613433838, "lr": 0.00033493931317404656, "tps": 14553, "wall": 41662.7} {"step": 9252, "train_loss": 3.5558509826660156, "lr": 0.0003349245689308036, "tps": 14552, "wall": 41670.6} {"step": 9253, "train_loss": 3.466648578643799, "lr": 0.00033490982338568905, "tps": 14551, "wall": 41678.4} {"step": 9254, "train_loss": 3.518988609313965, "lr": 0.0003348950765388698, "tps": 14550, "wall": 41686.3} {"step": 9255, "train_loss": 3.620316982269287, "lr": 0.0003348803283905128, "tps": 14548, "wall": 41694.1} {"step": 9256, "train_loss": 3.49027681350708, "lr": 0.00033486557894078523, "tps": 14547, "wall": 41702.0} {"step": 9257, "train_loss": 3.501295328140259, "lr": 0.00033485082818985424, "tps": 14546, "wall": 41709.7} {"step": 9258, "train_loss": 3.5761561393737793, "lr": 0.0003348360761378869, "tps": 14545, "wall": 41717.5} {"step": 9259, "train_loss": 3.498793363571167, "lr": 0.00033482132278505017, "tps": 14544, "wall": 41725.4} {"step": 9260, "train_loss": 3.6304874420166016, "lr": 0.0003348065681315113, "tps": 14543, "wall": 41733.2} {"step": 9261, "train_loss": 3.6276519298553467, "lr": 0.0003347918121774375, "tps": 14541, "wall": 41741.0} {"step": 9262, "train_loss": 3.522498607635498, "lr": 0.00033477705492299575, "tps": 14540, "wall": 41749.0} {"step": 9263, "train_loss": 3.553010940551758, "lr": 0.0003347622963683533, "tps": 14539, "wall": 41756.7} {"step": 9264, "train_loss": 3.45076060295105, "lr": 0.0003347475365136774, "tps": 14538, "wall": 41764.5} {"step": 9265, "train_loss": 3.5974082946777344, "lr": 0.00033473277535913515, "tps": 14537, "wall": 41772.3} {"step": 9266, "train_loss": 3.607646942138672, "lr": 0.00033471801290489386, "tps": 14536, "wall": 41780.1} {"step": 9267, "train_loss": 3.5833864212036133, "lr": 0.0003347032491511207, "tps": 14535, "wall": 41787.9} {"step": 9268, "train_loss": 3.5045270919799805, "lr": 0.0003346884840979829, "tps": 14533, "wall": 41795.8} {"step": 9269, "train_loss": 3.487241744995117, "lr": 0.0003346737177456478, "tps": 14532, "wall": 41803.6} {"step": 9270, "train_loss": 3.523803472518921, "lr": 0.00033465895009428265, "tps": 14531, "wall": 41811.5} {"step": 9271, "train_loss": 3.5500741004943848, "lr": 0.00033464418114405466, "tps": 14530, "wall": 41819.4} {"step": 9272, "train_loss": 3.5754363536834717, "lr": 0.00033462941089513115, "tps": 14529, "wall": 41827.2} {"step": 9273, "train_loss": 3.613973617553711, "lr": 0.0003346146393476795, "tps": 14528, "wall": 41835.0} {"step": 9274, "train_loss": 3.4916248321533203, "lr": 0.0003345998665018671, "tps": 14526, "wall": 41842.9} {"step": 9275, "train_loss": 3.5713088512420654, "lr": 0.0003345850923578611, "tps": 14525, "wall": 41850.8} {"step": 9276, "train_loss": 3.624058723449707, "lr": 0.000334570316915829, "tps": 14524, "wall": 41858.6} {"step": 9277, "train_loss": 3.4953696727752686, "lr": 0.0003345555401759382, "tps": 14523, "wall": 41866.5} {"step": 9278, "train_loss": 3.4609084129333496, "lr": 0.000334540762138356, "tps": 14522, "wall": 41874.3} {"step": 9279, "train_loss": 3.593836784362793, "lr": 0.0003345259828032498, "tps": 14521, "wall": 41882.2} {"step": 9280, "train_loss": 3.5039291381835938, "lr": 0.0003345112021707872, "tps": 14519, "wall": 41889.9} {"step": 9281, "train_loss": 3.4896154403686523, "lr": 0.0003344964202411354, "tps": 14518, "wall": 41897.8} {"step": 9282, "train_loss": 3.5181124210357666, "lr": 0.00033448163701446193, "tps": 14517, "wall": 41905.7} {"step": 9283, "train_loss": 3.5485963821411133, "lr": 0.00033446685249093435, "tps": 14516, "wall": 41913.5} {"step": 9284, "train_loss": 3.5844364166259766, "lr": 0.0003344520666707201, "tps": 14515, "wall": 41921.3} {"step": 9285, "train_loss": 3.550373077392578, "lr": 0.0003344372795539866, "tps": 14514, "wall": 41929.2} {"step": 9286, "train_loss": 3.633992910385132, "lr": 0.0003344224911409014, "tps": 14513, "wall": 41937.0} {"step": 9287, "train_loss": 3.5408053398132324, "lr": 0.0003344077014316321, "tps": 14511, "wall": 41944.9} {"step": 9288, "train_loss": 3.715191125869751, "lr": 0.0003343929104263461, "tps": 14510, "wall": 41952.6} {"step": 9289, "train_loss": 3.550765037536621, "lr": 0.0003343781181252111, "tps": 14509, "wall": 41960.5} {"step": 9290, "train_loss": 3.535548448562622, "lr": 0.00033436332452839446, "tps": 14508, "wall": 41968.3} {"step": 9291, "train_loss": 3.5874900817871094, "lr": 0.00033434852963606395, "tps": 14507, "wall": 41976.2} {"step": 9292, "train_loss": 3.5355687141418457, "lr": 0.0003343337334483872, "tps": 14506, "wall": 41983.9} {"step": 9293, "train_loss": 3.5219435691833496, "lr": 0.0003343189359655316, "tps": 14504, "wall": 41991.9} {"step": 9294, "train_loss": 3.535360097885132, "lr": 0.000334304137187665, "tps": 14503, "wall": 41999.7} {"step": 9295, "train_loss": 3.474416494369507, "lr": 0.0003342893371149549, "tps": 14502, "wall": 42007.5} {"step": 9296, "train_loss": 3.5383548736572266, "lr": 0.000334274535747569, "tps": 14501, "wall": 42015.3} {"step": 9297, "train_loss": 3.5344390869140625, "lr": 0.00033425973308567495, "tps": 14500, "wall": 42023.1} {"step": 9298, "train_loss": 3.513239860534668, "lr": 0.0003342449291294406, "tps": 14499, "wall": 42030.9} {"step": 9299, "train_loss": 3.585172414779663, "lr": 0.00033423012387903336, "tps": 14498, "wall": 42038.7} {"step": 9300, "train_loss": 3.536180019378662, "lr": 0.0003342153173346212, "tps": 14497, "wall": 42046.6} {"step": 9301, "train_loss": 3.513578176498413, "lr": 0.0003342005094963717, "tps": 14495, "wall": 42054.5} {"step": 9302, "train_loss": 3.567858934402466, "lr": 0.0003341857003644526, "tps": 14494, "wall": 42062.3} {"step": 9303, "train_loss": 3.5936765670776367, "lr": 0.00033417088993903187, "tps": 14493, "wall": 42070.2} {"step": 9304, "train_loss": 3.542085886001587, "lr": 0.000334156078220277, "tps": 14492, "wall": 42078.1} {"step": 9305, "train_loss": 3.605588912963867, "lr": 0.0003341412652083559, "tps": 14491, "wall": 42085.9} {"step": 9306, "train_loss": 3.710775852203369, "lr": 0.0003341264509034364, "tps": 14490, "wall": 42093.7} {"step": 9307, "train_loss": 3.4752769470214844, "lr": 0.00033411163530568626, "tps": 14488, "wall": 42101.6} {"step": 9308, "train_loss": 3.6614835262298584, "lr": 0.00033409681841527336, "tps": 14487, "wall": 42109.5} {"step": 9309, "train_loss": 3.551680088043213, "lr": 0.00033408200023236554, "tps": 14486, "wall": 42117.4} {"step": 9310, "train_loss": 3.6159088611602783, "lr": 0.00033406718075713063, "tps": 14485, "wall": 42125.2} {"step": 9311, "train_loss": 3.5720949172973633, "lr": 0.0003340523599897365, "tps": 14484, "wall": 42133.0} {"step": 9312, "train_loss": 3.5755422115325928, "lr": 0.00033403753793035117, "tps": 14483, "wall": 42141.0} {"step": 9313, "train_loss": 3.589076042175293, "lr": 0.00033402271457914234, "tps": 14482, "wall": 42148.8} {"step": 9314, "train_loss": 3.539914608001709, "lr": 0.0003340078899362781, "tps": 14480, "wall": 42156.6} {"step": 9315, "train_loss": 3.4727425575256348, "lr": 0.00033399306400192625, "tps": 14479, "wall": 42164.4} {"step": 9316, "train_loss": 3.5567121505737305, "lr": 0.0003339782367762548, "tps": 14478, "wall": 42172.3} {"step": 9317, "train_loss": 3.511363983154297, "lr": 0.0003339634082594318, "tps": 14477, "wall": 42180.3} {"step": 9318, "train_loss": 3.500143051147461, "lr": 0.00033394857845162507, "tps": 14476, "wall": 42188.2} {"step": 9319, "train_loss": 3.5340843200683594, "lr": 0.00033393374735300274, "tps": 14475, "wall": 42196.1} {"step": 9320, "train_loss": 3.4686977863311768, "lr": 0.0003339189149637327, "tps": 14474, "wall": 42203.9} {"step": 9321, "train_loss": 3.5730581283569336, "lr": 0.00033390408128398306, "tps": 14472, "wall": 42211.6} {"step": 9322, "train_loss": 3.4353394508361816, "lr": 0.00033388924631392176, "tps": 14471, "wall": 42219.5} {"step": 9323, "train_loss": 3.569667339324951, "lr": 0.000333874410053717, "tps": 14470, "wall": 42227.4} {"step": 9324, "train_loss": 3.6017978191375732, "lr": 0.0003338595725035367, "tps": 14469, "wall": 42235.3} {"step": 9325, "train_loss": 3.503384590148926, "lr": 0.00033384473366354905, "tps": 14468, "wall": 42243.1} {"step": 9326, "train_loss": 3.501065731048584, "lr": 0.00033382989353392215, "tps": 14467, "wall": 42251.0} {"step": 9327, "train_loss": 3.483038902282715, "lr": 0.00033381505211482396, "tps": 14466, "wall": 42258.7} {"step": 9328, "train_loss": 3.5829601287841797, "lr": 0.00033380020940642274, "tps": 14464, "wall": 42266.6} {"step": 9329, "train_loss": 3.4363656044006348, "lr": 0.0003337853654088866, "tps": 14463, "wall": 42274.4} {"step": 9330, "train_loss": 3.545832872390747, "lr": 0.00033377052012238364, "tps": 14462, "wall": 42282.2} {"step": 9331, "train_loss": 3.591928005218506, "lr": 0.00033375567354708213, "tps": 14461, "wall": 42290.0} {"step": 9332, "train_loss": 3.6636197566986084, "lr": 0.0003337408256831502, "tps": 14460, "wall": 42297.9} {"step": 9333, "train_loss": 3.6090810298919678, "lr": 0.000333725976530756, "tps": 14459, "wall": 42305.7} {"step": 9334, "train_loss": 3.576953411102295, "lr": 0.00033371112609006774, "tps": 14458, "wall": 42313.4} {"step": 9335, "train_loss": 3.5373640060424805, "lr": 0.0003336962743612538, "tps": 14457, "wall": 42321.2} {"step": 9336, "train_loss": 3.518123149871826, "lr": 0.00033368142134448226, "tps": 14455, "wall": 42329.2} {"step": 9337, "train_loss": 3.528982639312744, "lr": 0.0003336665670399214, "tps": 14454, "wall": 42336.9} {"step": 9338, "train_loss": 3.601940155029297, "lr": 0.00033365171144773956, "tps": 14453, "wall": 42344.7} {"step": 9339, "train_loss": 3.529792070388794, "lr": 0.000333636854568105, "tps": 14452, "wall": 42352.5} {"step": 9340, "train_loss": 3.522838830947876, "lr": 0.000333621996401186, "tps": 14451, "wall": 42360.4} {"step": 9341, "train_loss": 3.5160839557647705, "lr": 0.0003336071369471508, "tps": 14450, "wall": 42368.1} {"step": 9342, "train_loss": 3.5669026374816895, "lr": 0.00033359227620616787, "tps": 14449, "wall": 42376.1} {"step": 9343, "train_loss": 3.5098438262939453, "lr": 0.0003335774141784055, "tps": 14448, "wall": 42383.9} {"step": 9344, "train_loss": 3.544644832611084, "lr": 0.000333562550864032, "tps": 14447, "wall": 42391.7} {"step": 9345, "train_loss": 3.5001139640808105, "lr": 0.0003335476862632158, "tps": 14445, "wall": 42399.5} {"step": 9346, "train_loss": 3.6282386779785156, "lr": 0.0003335328203761253, "tps": 14444, "wall": 42407.5} {"step": 9347, "train_loss": 3.6016130447387695, "lr": 0.00033351795320292883, "tps": 14443, "wall": 42415.3} {"step": 9348, "train_loss": 3.4574272632598877, "lr": 0.00033350308474379485, "tps": 14442, "wall": 42423.2} {"step": 9349, "train_loss": 3.597490072250366, "lr": 0.0003334882149988918, "tps": 14441, "wall": 42431.0} {"step": 9350, "train_loss": 3.6151270866394043, "lr": 0.0003334733439683881, "tps": 14440, "wall": 42438.8} {"step": 9351, "train_loss": 3.5536763668060303, "lr": 0.0003334584716524522, "tps": 14439, "wall": 42446.7} {"step": 9352, "train_loss": 3.5760178565979004, "lr": 0.00033344359805125267, "tps": 14437, "wall": 42454.6} {"step": 9353, "train_loss": 3.614292621612549, "lr": 0.00033342872316495785, "tps": 14436, "wall": 42462.4} {"step": 9354, "train_loss": 3.53830623626709, "lr": 0.00033341384699373634, "tps": 14435, "wall": 42470.3} {"step": 9355, "train_loss": 3.5125174522399902, "lr": 0.0003333989695377566, "tps": 14434, "wall": 42478.2} {"step": 9356, "train_loss": 3.6427788734436035, "lr": 0.00033338409079718725, "tps": 14433, "wall": 42486.1} {"step": 9357, "train_loss": 3.487410068511963, "lr": 0.00033336921077219676, "tps": 14432, "wall": 42493.9} {"step": 9358, "train_loss": 3.497316598892212, "lr": 0.0003333543294629537, "tps": 14431, "wall": 42501.9} {"step": 9359, "train_loss": 3.537982940673828, "lr": 0.0003333394468696267, "tps": 14429, "wall": 42509.8} {"step": 9360, "train_loss": 3.4433350563049316, "lr": 0.0003333245629923843, "tps": 14428, "wall": 42517.7} {"step": 9361, "train_loss": 3.443394660949707, "lr": 0.00033330967783139513, "tps": 14427, "wall": 42525.8} {"step": 9362, "train_loss": 3.4178638458251953, "lr": 0.00033329479138682774, "tps": 14426, "wall": 42533.6} {"step": 9363, "train_loss": 3.570523977279663, "lr": 0.00033327990365885095, "tps": 14425, "wall": 42541.4} {"step": 9364, "train_loss": 3.591946840286255, "lr": 0.00033326501464763317, "tps": 14424, "wall": 42549.3} {"step": 9365, "train_loss": 3.542851209640503, "lr": 0.00033325012435334327, "tps": 14423, "wall": 42557.2} {"step": 9366, "train_loss": 3.484147310256958, "lr": 0.00033323523277614973, "tps": 14422, "wall": 42565.1} {"step": 9367, "train_loss": 3.530712127685547, "lr": 0.00033322033991622143, "tps": 14420, "wall": 42573.0} {"step": 9368, "train_loss": 3.6285359859466553, "lr": 0.000333205445773727, "tps": 14419, "wall": 42580.9} {"step": 9369, "train_loss": 3.552489995956421, "lr": 0.00033319055034883505, "tps": 14418, "wall": 42588.9} {"step": 9370, "train_loss": 3.5351076126098633, "lr": 0.00033317565364171444, "tps": 14417, "wall": 42596.9} {"step": 9371, "train_loss": 3.514187812805176, "lr": 0.000333160755652534, "tps": 14416, "wall": 42604.7} {"step": 9372, "train_loss": 3.6109485626220703, "lr": 0.0003331458563814624, "tps": 14415, "wall": 42612.6} {"step": 9373, "train_loss": 3.6170105934143066, "lr": 0.0003331309558286684, "tps": 14414, "wall": 42620.5} {"step": 9374, "train_loss": 3.5356714725494385, "lr": 0.0003331160539943207, "tps": 14412, "wall": 42628.4} {"step": 9375, "train_loss": 3.471771240234375, "lr": 0.0003331011508785883, "tps": 14411, "wall": 42636.3} {"step": 9376, "train_loss": 3.4689033031463623, "lr": 0.00033308624648163996, "tps": 14410, "wall": 42644.3} {"step": 9377, "train_loss": 3.5457749366760254, "lr": 0.0003330713408036445, "tps": 14409, "wall": 42652.2} {"step": 9378, "train_loss": 3.555276393890381, "lr": 0.00033305643384477074, "tps": 14408, "wall": 42660.1} {"step": 9379, "train_loss": 3.413745403289795, "lr": 0.0003330415256051876, "tps": 14407, "wall": 42667.9} {"step": 9380, "train_loss": 3.5914742946624756, "lr": 0.000333026616085064, "tps": 14406, "wall": 42675.9} {"step": 9381, "train_loss": 3.5304641723632812, "lr": 0.0003330117052845687, "tps": 14405, "wall": 42683.7} {"step": 9382, "train_loss": 3.5263302326202393, "lr": 0.00033299679320387065, "tps": 14403, "wall": 42691.7} {"step": 9383, "train_loss": 3.544239044189453, "lr": 0.0003329818798431389, "tps": 14402, "wall": 42699.6} {"step": 9384, "train_loss": 3.5549240112304688, "lr": 0.00033296696520254226, "tps": 14401, "wall": 42707.6} {"step": 9385, "train_loss": 3.488945245742798, "lr": 0.00033295204928224974, "tps": 14400, "wall": 42715.5} {"step": 9386, "train_loss": 3.552137851715088, "lr": 0.00033293713208243033, "tps": 14399, "wall": 42723.5} {"step": 9387, "train_loss": 3.6680731773376465, "lr": 0.000332922213603253, "tps": 14398, "wall": 42731.4} {"step": 9388, "train_loss": 3.4684736728668213, "lr": 0.00033290729384488664, "tps": 14396, "wall": 42739.3} {"step": 9389, "train_loss": 3.6202540397644043, "lr": 0.00033289237280750036, "tps": 14395, "wall": 42747.2} {"step": 9390, "train_loss": 3.6870524883270264, "lr": 0.0003328774504912632, "tps": 14394, "wall": 42755.1} {"step": 9391, "train_loss": 3.4313721656799316, "lr": 0.00033286252689634417, "tps": 14393, "wall": 42763.0} {"step": 9392, "train_loss": 3.496812343597412, "lr": 0.00033284760202291236, "tps": 14392, "wall": 42771.1} {"step": 9393, "train_loss": 3.61527156829834, "lr": 0.00033283267587113675, "tps": 14391, "wall": 42779.1} {"step": 9394, "train_loss": 3.4897091388702393, "lr": 0.0003328177484411866, "tps": 14390, "wall": 42786.9} {"step": 9395, "train_loss": 3.5164406299591064, "lr": 0.0003328028197332307, "tps": 14389, "wall": 42794.9} {"step": 9396, "train_loss": 3.53531551361084, "lr": 0.0003327878897474385, "tps": 14387, "wall": 42802.8} {"step": 9397, "train_loss": 3.6383938789367676, "lr": 0.00033277295848397893, "tps": 14386, "wall": 42810.8} {"step": 9398, "train_loss": 3.5245354175567627, "lr": 0.00033275802594302117, "tps": 14385, "wall": 42818.7} {"step": 9399, "train_loss": 3.6789331436157227, "lr": 0.00033274309212473447, "tps": 14384, "wall": 42826.7} {"step": 9400, "train_loss": 3.5388331413269043, "lr": 0.0003327281570292879, "tps": 14383, "wall": 42834.7} {"step": 9401, "train_loss": 3.511493444442749, "lr": 0.00033271322065685064, "tps": 14382, "wall": 42842.6} {"step": 9402, "train_loss": 3.5289597511291504, "lr": 0.0003326982830075919, "tps": 14381, "wall": 42850.6} {"step": 9403, "train_loss": 3.435488700866699, "lr": 0.0003326833440816809, "tps": 14379, "wall": 42858.5} {"step": 9404, "train_loss": 3.5493850708007812, "lr": 0.00033266840387928694, "tps": 14378, "wall": 42866.5} {"step": 9405, "train_loss": 3.5807409286499023, "lr": 0.00033265346240057917, "tps": 14377, "wall": 42874.5} {"step": 9406, "train_loss": 3.5119547843933105, "lr": 0.0003326385196457269, "tps": 14376, "wall": 42882.3} {"step": 9407, "train_loss": 3.6232123374938965, "lr": 0.0003326235756148994, "tps": 14375, "wall": 42890.4} {"step": 9408, "train_loss": 3.508852005004883, "lr": 0.00033260863030826595, "tps": 14374, "wall": 42898.3} {"step": 9409, "train_loss": 3.627716541290283, "lr": 0.0003325936837259958, "tps": 14373, "wall": 42906.3} {"step": 9410, "train_loss": 3.5605478286743164, "lr": 0.0003325787358682583, "tps": 14371, "wall": 42914.0} {"step": 9411, "train_loss": 3.506040573120117, "lr": 0.00033256378673522283, "tps": 14370, "wall": 42922.0} {"step": 9412, "train_loss": 3.5794568061828613, "lr": 0.00033254883632705866, "tps": 14369, "wall": 42930.0} {"step": 9413, "train_loss": 3.5283608436584473, "lr": 0.0003325338846439352, "tps": 14368, "wall": 42938.0} {"step": 9414, "train_loss": 3.5552947521209717, "lr": 0.0003325189316860218, "tps": 14367, "wall": 42946.0} {"step": 9415, "train_loss": 3.5471479892730713, "lr": 0.00033250397745348783, "tps": 14366, "wall": 42953.9} {"step": 9416, "train_loss": 3.5306363105773926, "lr": 0.0003324890219465028, "tps": 14365, "wall": 42961.9} {"step": 9417, "train_loss": 3.52323317527771, "lr": 0.00033247406516523603, "tps": 14364, "wall": 42969.7} {"step": 9418, "train_loss": 3.589029312133789, "lr": 0.00033245910710985686, "tps": 14362, "wall": 42977.7} {"step": 9419, "train_loss": 3.5632991790771484, "lr": 0.000332444147780535, "tps": 14361, "wall": 42985.6} {"step": 9420, "train_loss": 3.578827381134033, "lr": 0.0003324291871774396, "tps": 14360, "wall": 42993.6} {"step": 9421, "train_loss": 3.6212072372436523, "lr": 0.00033241422530074036, "tps": 14359, "wall": 43001.5} {"step": 9422, "train_loss": 3.5241873264312744, "lr": 0.00033239926215060666, "tps": 14358, "wall": 43009.6} {"step": 9423, "train_loss": 3.577874183654785, "lr": 0.0003323842977272081, "tps": 14357, "wall": 43017.5} {"step": 9424, "train_loss": 3.536628246307373, "lr": 0.0003323693320307141, "tps": 14356, "wall": 43025.5} {"step": 9425, "train_loss": 3.4561102390289307, "lr": 0.0003323543650612942, "tps": 14354, "wall": 43033.3} {"step": 9426, "train_loss": 3.525935411453247, "lr": 0.000332339396819118, "tps": 14353, "wall": 43041.2} {"step": 9427, "train_loss": 3.4361867904663086, "lr": 0.00033232442730435504, "tps": 14352, "wall": 43049.3} {"step": 9428, "train_loss": 3.5529868602752686, "lr": 0.0003323094565171749, "tps": 14351, "wall": 43057.4} {"step": 9429, "train_loss": 3.5466339588165283, "lr": 0.00033229448445774715, "tps": 14350, "wall": 43065.4} {"step": 9430, "train_loss": 3.475585460662842, "lr": 0.00033227951112624137, "tps": 14349, "wall": 43073.3} {"step": 9431, "train_loss": 3.6054868698120117, "lr": 0.0003322645365228273, "tps": 14348, "wall": 43081.3} {"step": 9432, "train_loss": 3.5921530723571777, "lr": 0.00033224956064767435, "tps": 14346, "wall": 43089.3} {"step": 9433, "train_loss": 3.55967378616333, "lr": 0.0003322345835009524, "tps": 14345, "wall": 43097.2} {"step": 9434, "train_loss": 3.558006525039673, "lr": 0.00033221960508283103, "tps": 14344, "wall": 43105.2} {"step": 9435, "train_loss": 3.4413259029388428, "lr": 0.0003322046253934799, "tps": 14343, "wall": 43113.1} {"step": 9436, "train_loss": 3.6190154552459717, "lr": 0.00033218964443306864, "tps": 14342, "wall": 43121.1} {"step": 9437, "train_loss": 3.4980740547180176, "lr": 0.0003321746622017671, "tps": 14341, "wall": 43129.2} {"step": 9438, "train_loss": 3.520289659500122, "lr": 0.00033215967869974484, "tps": 14340, "wall": 43137.3} {"step": 9439, "train_loss": 3.6761646270751953, "lr": 0.0003321446939271717, "tps": 14339, "wall": 43145.2} {"step": 9440, "train_loss": 3.471700668334961, "lr": 0.00033212970788421735, "tps": 14337, "wall": 43153.1} {"step": 9441, "train_loss": 3.4551291465759277, "lr": 0.00033211472057105166, "tps": 14336, "wall": 43161.1} {"step": 9442, "train_loss": 3.45290207862854, "lr": 0.00033209973198784434, "tps": 14335, "wall": 43169.2} {"step": 9443, "train_loss": 3.472656726837158, "lr": 0.0003320847421347653, "tps": 14334, "wall": 43177.1} {"step": 9444, "train_loss": 3.633418560028076, "lr": 0.0003320697510119841, "tps": 14333, "wall": 43185.1} {"step": 9445, "train_loss": 3.582064151763916, "lr": 0.00033205475861967075, "tps": 14332, "wall": 43193.0} {"step": 9446, "train_loss": 3.5842604637145996, "lr": 0.00033203976495799496, "tps": 14331, "wall": 43201.0} {"step": 9447, "train_loss": 3.5738730430603027, "lr": 0.0003320247700271267, "tps": 14329, "wall": 43209.0} {"step": 9448, "train_loss": 3.578427314758301, "lr": 0.0003320097738272359, "tps": 14328, "wall": 43216.9} {"step": 9449, "train_loss": 3.46140193939209, "lr": 0.00033199477635849215, "tps": 14327, "wall": 43224.8} {"step": 9450, "train_loss": 3.4912302494049072, "lr": 0.00033197977762106556, "tps": 14326, "wall": 43232.9} {"step": 9451, "train_loss": 3.6433238983154297, "lr": 0.000331964777615126, "tps": 14325, "wall": 43241.0} {"step": 9452, "train_loss": 3.554929733276367, "lr": 0.00033194977634084345, "tps": 14324, "wall": 43248.9} {"step": 9453, "train_loss": 3.5869758129119873, "lr": 0.0003319347737983877, "tps": 14323, "wall": 43256.9} {"step": 9454, "train_loss": 3.6202895641326904, "lr": 0.0003319197699879288, "tps": 14322, "wall": 43264.9} {"step": 9455, "train_loss": 3.523747444152832, "lr": 0.0003319047649096367, "tps": 14320, "wall": 43272.7} {"step": 9456, "train_loss": 3.5352261066436768, "lr": 0.0003318897585636813, "tps": 14319, "wall": 43280.8} {"step": 9457, "train_loss": 3.596919059753418, "lr": 0.0003318747509502328, "tps": 14318, "wall": 43288.8} {"step": 9458, "train_loss": 3.522777557373047, "lr": 0.00033185974206946094, "tps": 14317, "wall": 43296.8} {"step": 9459, "train_loss": 3.5135092735290527, "lr": 0.0003318447319215359, "tps": 14316, "wall": 43304.7} {"step": 9460, "train_loss": 3.461301803588867, "lr": 0.00033182972050662773, "tps": 14315, "wall": 43312.7} {"step": 9461, "train_loss": 3.6472644805908203, "lr": 0.0003318147078249064, "tps": 14314, "wall": 43320.7} {"step": 9462, "train_loss": 3.503833770751953, "lr": 0.0003317996938765421, "tps": 14313, "wall": 43328.6} {"step": 9463, "train_loss": 3.6189355850219727, "lr": 0.0003317846786617047, "tps": 14311, "wall": 43336.6} {"step": 9464, "train_loss": 3.5897016525268555, "lr": 0.00033176966218056444, "tps": 14310, "wall": 43344.7} {"step": 9465, "train_loss": 3.6303768157958984, "lr": 0.0003317546444332914, "tps": 14309, "wall": 43352.7} {"step": 9466, "train_loss": 3.5350821018218994, "lr": 0.0003317396254200557, "tps": 14308, "wall": 43360.7} {"step": 9467, "train_loss": 3.5164103507995605, "lr": 0.0003317246051410275, "tps": 14307, "wall": 43368.7} {"step": 9468, "train_loss": 3.5350112915039062, "lr": 0.0003317095835963769, "tps": 14306, "wall": 43376.8} {"step": 9469, "train_loss": 3.4988608360290527, "lr": 0.0003316945607862742, "tps": 14305, "wall": 43384.7} {"step": 9470, "train_loss": 3.546553373336792, "lr": 0.00033167953671088936, "tps": 14304, "wall": 43392.6} {"step": 9471, "train_loss": 3.5198733806610107, "lr": 0.0003316645113703927, "tps": 14302, "wall": 43400.6} {"step": 9472, "train_loss": 3.496338367462158, "lr": 0.00033164948476495446, "tps": 14301, "wall": 43408.7} {"step": 9473, "train_loss": 3.476729154586792, "lr": 0.0003316344568947448, "tps": 14300, "wall": 43416.7} {"step": 9474, "train_loss": 3.518444776535034, "lr": 0.00033161942775993393, "tps": 14299, "wall": 43424.5} {"step": 9475, "train_loss": 3.613011598587036, "lr": 0.00033160439736069214, "tps": 14298, "wall": 43432.6} {"step": 9476, "train_loss": 3.6449358463287354, "lr": 0.0003315893656971898, "tps": 14297, "wall": 43440.6} {"step": 9477, "train_loss": 3.5997655391693115, "lr": 0.00033157433276959704, "tps": 14296, "wall": 43448.7} {"step": 9478, "train_loss": 3.523374557495117, "lr": 0.0003315592985780841, "tps": 14295, "wall": 43456.6} {"step": 9479, "train_loss": 3.5645272731781006, "lr": 0.0003315442631228215, "tps": 14293, "wall": 43464.6} {"step": 9480, "train_loss": 3.4531946182250977, "lr": 0.00033152922640397944, "tps": 14292, "wall": 43472.6} {"step": 9481, "train_loss": 3.4400746822357178, "lr": 0.00033151418842172824, "tps": 14291, "wall": 43480.7} {"step": 9482, "train_loss": 3.395677328109741, "lr": 0.00033149914917623833, "tps": 14290, "wall": 43488.7} {"step": 9483, "train_loss": 3.4858484268188477, "lr": 0.00033148410866767994, "tps": 14289, "wall": 43496.8} {"step": 9484, "train_loss": 3.6041126251220703, "lr": 0.0003314690668962237, "tps": 14288, "wall": 43504.6} {"step": 9485, "train_loss": 3.580983877182007, "lr": 0.00033145402386203964, "tps": 14287, "wall": 43512.6} {"step": 9486, "train_loss": 3.5214710235595703, "lr": 0.0003314389795652985, "tps": 14286, "wall": 43520.6} {"step": 9487, "train_loss": 3.616359233856201, "lr": 0.0003314239340061705, "tps": 14284, "wall": 43528.6} {"step": 9488, "train_loss": 3.5482044219970703, "lr": 0.00033140888718482614, "tps": 14283, "wall": 43536.6} {"step": 9489, "train_loss": 3.4888503551483154, "lr": 0.00033139383910143593, "tps": 14282, "wall": 43544.5} {"step": 9490, "train_loss": 3.5024688243865967, "lr": 0.00033137878975617036, "tps": 14281, "wall": 43552.7} {"step": 9491, "train_loss": 3.5708391666412354, "lr": 0.0003313637391491997, "tps": 14280, "wall": 43560.6} {"step": 9492, "train_loss": 3.5691542625427246, "lr": 0.00033134868728069457, "tps": 14279, "wall": 43568.5} {"step": 9493, "train_loss": 3.561290740966797, "lr": 0.00033133363415082555, "tps": 14278, "wall": 43576.4} {"step": 9494, "train_loss": 3.5339555740356445, "lr": 0.0003313185797597631, "tps": 14277, "wall": 43584.5} {"step": 9495, "train_loss": 3.5667524337768555, "lr": 0.00033130352410767774, "tps": 14276, "wall": 43592.4} {"step": 9496, "train_loss": 3.4925568103790283, "lr": 0.0003312884671947401, "tps": 14274, "wall": 43600.4} {"step": 9497, "train_loss": 3.6163330078125, "lr": 0.00033127340902112056, "tps": 14273, "wall": 43608.5} {"step": 9498, "train_loss": 3.531742811203003, "lr": 0.0003312583495869899, "tps": 14272, "wall": 43616.5} {"step": 9499, "train_loss": 3.482541561126709, "lr": 0.00033124328889251863, "tps": 14271, "wall": 43624.4} {"step": 9500, "train_loss": 3.589171886444092, "lr": 0.0003312282269378774, "tps": 14270, "wall": 43632.4} {"step": 9501, "train_loss": 3.579622268676758, "lr": 0.0003312131637232367, "tps": 14269, "wall": 43640.3} {"step": 9502, "train_loss": 3.490260362625122, "lr": 0.00033119809924876735, "tps": 14268, "wall": 43648.3} {"step": 9503, "train_loss": 3.4206268787384033, "lr": 0.0003311830335146399, "tps": 14267, "wall": 43656.4} {"step": 9504, "train_loss": 3.5589394569396973, "lr": 0.00033116796652102494, "tps": 14266, "wall": 43664.3} {"step": 9505, "train_loss": 3.4039134979248047, "lr": 0.00033115289826809335, "tps": 14264, "wall": 43672.4} {"step": 9506, "train_loss": 3.5456531047821045, "lr": 0.0003311378287560157, "tps": 14263, "wall": 43680.4} {"step": 9507, "train_loss": 3.5650289058685303, "lr": 0.00033112275798496266, "tps": 14262, "wall": 43688.4} {"step": 9508, "train_loss": 3.5825986862182617, "lr": 0.00033110768595510514, "tps": 14261, "wall": 43696.4} {"step": 9509, "train_loss": 3.537015199661255, "lr": 0.0003310926126666136, "tps": 14260, "wall": 43704.4} {"step": 9510, "train_loss": 3.4530346393585205, "lr": 0.00033107753811965896, "tps": 14259, "wall": 43712.3} {"step": 9511, "train_loss": 3.5376439094543457, "lr": 0.000331062462314412, "tps": 14258, "wall": 43720.4} {"step": 9512, "train_loss": 3.4453439712524414, "lr": 0.0003310473852510434, "tps": 14257, "wall": 43728.4} {"step": 9513, "train_loss": 3.6520214080810547, "lr": 0.0003310323069297241, "tps": 14256, "wall": 43736.5} {"step": 9514, "train_loss": 3.527676820755005, "lr": 0.0003310172273506248, "tps": 14254, "wall": 43744.4} {"step": 9515, "train_loss": 3.4639739990234375, "lr": 0.0003310021465139163, "tps": 14253, "wall": 43752.4} {"step": 9516, "train_loss": 3.51531982421875, "lr": 0.00033098706441976947, "tps": 14252, "wall": 43760.4} {"step": 9517, "train_loss": 3.5169496536254883, "lr": 0.0003309719810683552, "tps": 14251, "wall": 43768.5} {"step": 9518, "train_loss": 3.493699073791504, "lr": 0.0003309568964598443, "tps": 14250, "wall": 43776.5} {"step": 9519, "train_loss": 3.5682003498077393, "lr": 0.00033094181059440775, "tps": 14249, "wall": 43784.5} {"step": 9520, "train_loss": 3.5667409896850586, "lr": 0.00033092672347221627, "tps": 14248, "wall": 43792.5} {"step": 9521, "train_loss": 3.631361246109009, "lr": 0.00033091163509344087, "tps": 14247, "wall": 43800.6} {"step": 9522, "train_loss": 3.5615458488464355, "lr": 0.0003308965454582525, "tps": 14246, "wall": 43808.4} {"step": 9523, "train_loss": 3.466573476791382, "lr": 0.0003308814545668221, "tps": 14245, "wall": 43816.4} {"step": 9524, "train_loss": 3.4219727516174316, "lr": 0.00033086636241932055, "tps": 14243, "wall": 43824.4} {"step": 9525, "train_loss": 3.4713125228881836, "lr": 0.0003308512690159188, "tps": 14242, "wall": 43832.4} {"step": 9526, "train_loss": 3.4617881774902344, "lr": 0.00033083617435678795, "tps": 14241, "wall": 43840.5} {"step": 9527, "train_loss": 3.5604705810546875, "lr": 0.000330821078442099, "tps": 14240, "wall": 43848.5} {"step": 9528, "train_loss": 3.5358974933624268, "lr": 0.0003308059812720227, "tps": 14239, "wall": 43856.7} {"step": 9529, "train_loss": 3.46016526222229, "lr": 0.0003307908828467303, "tps": 14238, "wall": 43864.6} {"step": 9530, "train_loss": 3.581517219543457, "lr": 0.00033077578316639285, "tps": 14237, "wall": 43872.5} {"step": 9531, "train_loss": 3.535823106765747, "lr": 0.0003307606822311813, "tps": 14236, "wall": 43880.6} {"step": 9532, "train_loss": 3.560554027557373, "lr": 0.0003307455800412667, "tps": 14235, "wall": 43888.6} {"step": 9533, "train_loss": 3.5839643478393555, "lr": 0.0003307304765968203, "tps": 14233, "wall": 43896.7} {"step": 9534, "train_loss": 3.6422195434570312, "lr": 0.00033071537189801296, "tps": 14232, "wall": 43904.7} {"step": 9535, "train_loss": 3.4912688732147217, "lr": 0.00033070026594501586, "tps": 14231, "wall": 43912.7} {"step": 9536, "train_loss": 3.5864837169647217, "lr": 0.0003306851587380003, "tps": 14230, "wall": 43920.6} {"step": 9537, "train_loss": 3.5514044761657715, "lr": 0.0003306700502771372, "tps": 14229, "wall": 43928.5} {"step": 9538, "train_loss": 3.6289944648742676, "lr": 0.0003306549405625978, "tps": 14228, "wall": 43936.5} {"step": 9539, "train_loss": 3.6096701622009277, "lr": 0.0003306398295945532, "tps": 14227, "wall": 43944.5} {"step": 9540, "train_loss": 3.525312900543213, "lr": 0.00033062471737317466, "tps": 14226, "wall": 43952.6} {"step": 9541, "train_loss": 3.535334825515747, "lr": 0.00033060960389863335, "tps": 14225, "wall": 43960.6} {"step": 9542, "train_loss": 3.580286979675293, "lr": 0.00033059448917110046, "tps": 14223, "wall": 43968.7} {"step": 9543, "train_loss": 3.497814655303955, "lr": 0.0003305793731907472, "tps": 14222, "wall": 43976.8} {"step": 9544, "train_loss": 3.3764805793762207, "lr": 0.0003305642559577448, "tps": 14221, "wall": 43984.8} {"step": 9545, "train_loss": 3.5006515979766846, "lr": 0.00033054913747226455, "tps": 14220, "wall": 43992.7} {"step": 9546, "train_loss": 3.5853281021118164, "lr": 0.0003305340177344777, "tps": 14219, "wall": 44000.7} {"step": 9547, "train_loss": 3.4946396350860596, "lr": 0.00033051889674455553, "tps": 14218, "wall": 44008.9} {"step": 9548, "train_loss": 3.5045223236083984, "lr": 0.0003305037745026693, "tps": 14217, "wall": 44016.9} {"step": 9549, "train_loss": 3.5571823120117188, "lr": 0.0003304886510089903, "tps": 14216, "wall": 44024.8} {"step": 9550, "train_loss": 3.584900379180908, "lr": 0.0003304735262636899, "tps": 14215, "wall": 44032.8} {"step": 9551, "train_loss": 3.4678730964660645, "lr": 0.00033045840026693944, "tps": 14214, "wall": 44040.8} {"step": 9552, "train_loss": 3.4933512210845947, "lr": 0.00033044327301891025, "tps": 14213, "wall": 44048.8} {"step": 9553, "train_loss": 3.5628035068511963, "lr": 0.0003304281445197737, "tps": 14211, "wall": 44056.7} {"step": 9554, "train_loss": 3.639329433441162, "lr": 0.0003304130147697011, "tps": 14210, "wall": 44064.6} {"step": 9555, "train_loss": 3.5506176948547363, "lr": 0.00033039788376886393, "tps": 14209, "wall": 44072.7} {"step": 9556, "train_loss": 3.5157439708709717, "lr": 0.00033038275151743357, "tps": 14208, "wall": 44080.7} {"step": 9557, "train_loss": 3.5645861625671387, "lr": 0.0003303676180155814, "tps": 14207, "wall": 44088.7} {"step": 9558, "train_loss": 3.626115083694458, "lr": 0.00033035248326347894, "tps": 14206, "wall": 44096.7} {"step": 9559, "train_loss": 3.523630380630493, "lr": 0.0003303373472612975, "tps": 14205, "wall": 44104.7} {"step": 9560, "train_loss": 3.5497188568115234, "lr": 0.00033032221000920867, "tps": 14204, "wall": 44112.6} {"step": 9561, "train_loss": 3.445383071899414, "lr": 0.0003303070715073839, "tps": 14203, "wall": 44120.6} {"step": 9562, "train_loss": 3.5856151580810547, "lr": 0.0003302919317559946, "tps": 14202, "wall": 44128.8} {"step": 9563, "train_loss": 3.6102070808410645, "lr": 0.00033027679075521235, "tps": 14200, "wall": 44136.8} {"step": 9564, "train_loss": 3.521355628967285, "lr": 0.00033026164850520867, "tps": 14199, "wall": 44144.8} {"step": 9565, "train_loss": 3.5084166526794434, "lr": 0.00033024650500615497, "tps": 14198, "wall": 44152.9} {"step": 9566, "train_loss": 3.583256244659424, "lr": 0.00033023136025822305, "tps": 14197, "wall": 44160.9} {"step": 9567, "train_loss": 3.6020259857177734, "lr": 0.00033021621426158426, "tps": 14196, "wall": 44168.9} {"step": 9568, "train_loss": 3.5073330402374268, "lr": 0.0003302010670164102, "tps": 14195, "wall": 44176.9} {"step": 9569, "train_loss": 3.6003103256225586, "lr": 0.00033018591852287255, "tps": 14194, "wall": 44184.8} {"step": 9570, "train_loss": 3.4428539276123047, "lr": 0.00033017076878114277, "tps": 14193, "wall": 44192.9} {"step": 9571, "train_loss": 3.4517149925231934, "lr": 0.0003301556177913926, "tps": 14192, "wall": 44200.9} {"step": 9572, "train_loss": 3.61832332611084, "lr": 0.0003301404655537937, "tps": 14191, "wall": 44209.0} {"step": 9573, "train_loss": 3.5627453327178955, "lr": 0.0003301253120685175, "tps": 14190, "wall": 44217.0} {"step": 9574, "train_loss": 3.580258369445801, "lr": 0.0003301101573357359, "tps": 14188, "wall": 44225.1} {"step": 9575, "train_loss": 3.4992620944976807, "lr": 0.0003300950013556205, "tps": 14187, "wall": 44232.9} {"step": 9576, "train_loss": 3.5158157348632812, "lr": 0.00033007984412834296, "tps": 14186, "wall": 44240.9} {"step": 9577, "train_loss": 3.5548505783081055, "lr": 0.0003300646856540749, "tps": 14185, "wall": 44249.0} {"step": 9578, "train_loss": 3.5010061264038086, "lr": 0.00033004952593298825, "tps": 14184, "wall": 44257.1} {"step": 9579, "train_loss": 3.5924506187438965, "lr": 0.00033003436496525457, "tps": 14183, "wall": 44265.2} {"step": 9580, "train_loss": 3.527362823486328, "lr": 0.00033001920275104563, "tps": 14182, "wall": 44273.2} {"step": 9581, "train_loss": 3.57639217376709, "lr": 0.00033000403929053324, "tps": 14181, "wall": 44281.2} {"step": 9582, "train_loss": 3.4810547828674316, "lr": 0.0003299888745838891, "tps": 14180, "wall": 44289.2} {"step": 9583, "train_loss": 3.602442502975464, "lr": 0.0003299737086312851, "tps": 14179, "wall": 44297.1} {"step": 9584, "train_loss": 3.713825225830078, "lr": 0.0003299585414328929, "tps": 14178, "wall": 44305.1} {"step": 9585, "train_loss": 3.4889793395996094, "lr": 0.0003299433729888845, "tps": 14177, "wall": 44313.2} {"step": 9586, "train_loss": 3.5517196655273438, "lr": 0.00032992820329943155, "tps": 14175, "wall": 44321.2} {"step": 9587, "train_loss": 3.595710277557373, "lr": 0.000329913032364706, "tps": 14174, "wall": 44329.3} {"step": 9588, "train_loss": 3.5480048656463623, "lr": 0.0003298978601848796, "tps": 14173, "wall": 44337.4} {"step": 9589, "train_loss": 3.5751123428344727, "lr": 0.00032988268676012434, "tps": 14172, "wall": 44345.3} {"step": 9590, "train_loss": 3.6338582038879395, "lr": 0.00032986751209061207, "tps": 14171, "wall": 44353.3} {"step": 9591, "train_loss": 3.548768997192383, "lr": 0.0003298523361765147, "tps": 14170, "wall": 44361.3} {"step": 9592, "train_loss": 3.521784782409668, "lr": 0.0003298371590180041, "tps": 14169, "wall": 44369.4} {"step": 9593, "train_loss": 3.5463104248046875, "lr": 0.0003298219806152522, "tps": 14168, "wall": 44377.5} {"step": 9594, "train_loss": 3.5986337661743164, "lr": 0.000329806800968431, "tps": 14167, "wall": 44385.7} {"step": 9595, "train_loss": 3.505601406097412, "lr": 0.0003297916200777124, "tps": 14166, "wall": 44393.6} {"step": 9596, "train_loss": 3.604579448699951, "lr": 0.00032977643794326834, "tps": 14165, "wall": 44401.6} {"step": 9597, "train_loss": 3.510479211807251, "lr": 0.00032976125456527097, "tps": 14163, "wall": 44409.6} {"step": 9598, "train_loss": 3.5374269485473633, "lr": 0.00032974606994389205, "tps": 14162, "wall": 44417.8} {"step": 9599, "train_loss": 3.5659618377685547, "lr": 0.0003297308840793037, "tps": 14161, "wall": 44425.8} {"step": 9600, "train_loss": 3.5288102626800537, "lr": 0.0003297156969716781, "tps": 14160, "wall": 44433.8} {"step": 9601, "train_loss": 3.5265772342681885, "lr": 0.00032970050862118704, "tps": 14159, "wall": 44441.8} {"step": 9602, "train_loss": 3.4914281368255615, "lr": 0.0003296853190280027, "tps": 14158, "wall": 44449.9} {"step": 9603, "train_loss": 3.5098047256469727, "lr": 0.00032967012819229717, "tps": 14157, "wall": 44457.9} {"step": 9604, "train_loss": 3.590505838394165, "lr": 0.0003296549361142424, "tps": 14156, "wall": 44466.0} {"step": 9605, "train_loss": 3.517030715942383, "lr": 0.0003296397427940107, "tps": 14155, "wall": 44473.8} {"step": 9606, "train_loss": 3.457019329071045, "lr": 0.000329624548231774, "tps": 14154, "wall": 44481.9} {"step": 9607, "train_loss": 3.487196445465088, "lr": 0.0003296093524277045, "tps": 14153, "wall": 44490.0} {"step": 9608, "train_loss": 3.444403648376465, "lr": 0.0003295941553819743, "tps": 14151, "wall": 44498.0} {"step": 9609, "train_loss": 3.6953794956207275, "lr": 0.0003295789570947557, "tps": 14150, "wall": 44506.1} {"step": 9610, "train_loss": 3.5499048233032227, "lr": 0.0003295637575662206, "tps": 14149, "wall": 44514.2} {"step": 9611, "train_loss": 3.6851606369018555, "lr": 0.00032954855679654136, "tps": 14148, "wall": 44522.2} {"step": 9612, "train_loss": 3.5224621295928955, "lr": 0.0003295333547858902, "tps": 14147, "wall": 44530.3} {"step": 9613, "train_loss": 3.5416464805603027, "lr": 0.00032951815153443924, "tps": 14146, "wall": 44538.3} {"step": 9614, "train_loss": 3.4273173809051514, "lr": 0.0003295029470423607, "tps": 14145, "wall": 44546.4} {"step": 9615, "train_loss": 3.505418300628662, "lr": 0.0003294877413098269, "tps": 14144, "wall": 44554.4} {"step": 9616, "train_loss": 3.618851661682129, "lr": 0.00032947253433701, "tps": 14143, "wall": 44562.3} {"step": 9617, "train_loss": 3.603646755218506, "lr": 0.00032945732612408234, "tps": 14142, "wall": 44570.5} {"step": 9618, "train_loss": 3.527066230773926, "lr": 0.0003294421166712162, "tps": 14141, "wall": 44578.6} {"step": 9619, "train_loss": 3.492643356323242, "lr": 0.0003294269059785838, "tps": 14140, "wall": 44586.6} {"step": 9620, "train_loss": 3.5036003589630127, "lr": 0.00032941169404635743, "tps": 14138, "wall": 44594.5} {"step": 9621, "train_loss": 3.627207040786743, "lr": 0.00032939648087470955, "tps": 14137, "wall": 44602.6} {"step": 9622, "train_loss": 3.5565531253814697, "lr": 0.0003293812664638124, "tps": 14136, "wall": 44610.6} {"step": 9623, "train_loss": 3.3714280128479004, "lr": 0.00032936605081383837, "tps": 14135, "wall": 44618.7} {"step": 9624, "train_loss": 3.5174849033355713, "lr": 0.0003293508339249597, "tps": 14134, "wall": 44626.7} {"step": 9625, "train_loss": 3.49187970161438, "lr": 0.000329335615797349, "tps": 14133, "wall": 44634.9} {"step": 9626, "train_loss": 3.4830667972564697, "lr": 0.0003293203964311784, "tps": 14132, "wall": 44642.8} {"step": 9627, "train_loss": 3.553467035293579, "lr": 0.0003293051758266206, "tps": 14131, "wall": 44650.9} {"step": 9628, "train_loss": 3.490020275115967, "lr": 0.00032928995398384767, "tps": 14130, "wall": 44658.9} {"step": 9629, "train_loss": 3.5425775051116943, "lr": 0.00032927473090303233, "tps": 14129, "wall": 44667.2} {"step": 9630, "train_loss": 3.560641288757324, "lr": 0.0003292595065843469, "tps": 14128, "wall": 44675.0} {"step": 9631, "train_loss": 3.6175427436828613, "lr": 0.0003292442810279639, "tps": 14127, "wall": 44683.1} {"step": 9632, "train_loss": 3.4521727561950684, "lr": 0.0003292290542340558, "tps": 14126, "wall": 44691.2} {"step": 9633, "train_loss": 3.4944043159484863, "lr": 0.00032921382620279495, "tps": 14124, "wall": 44699.3} {"step": 9634, "train_loss": 3.6674556732177734, "lr": 0.00032919859693435405, "tps": 14123, "wall": 44707.3} {"step": 9635, "train_loss": 3.4805898666381836, "lr": 0.00032918336642890554, "tps": 14122, "wall": 44715.3} {"step": 9636, "train_loss": 3.4516589641571045, "lr": 0.00032916813468662195, "tps": 14121, "wall": 44723.6} {"step": 9637, "train_loss": 3.5659732818603516, "lr": 0.0003291529017076758, "tps": 14120, "wall": 44731.7} {"step": 9638, "train_loss": 3.4969491958618164, "lr": 0.00032913766749223967, "tps": 14119, "wall": 44739.7} {"step": 9639, "train_loss": 3.5196361541748047, "lr": 0.00032912243204048623, "tps": 14118, "wall": 44747.7} {"step": 9640, "train_loss": 3.5940065383911133, "lr": 0.00032910719535258787, "tps": 14117, "wall": 44755.7} {"step": 9641, "train_loss": 3.522657632827759, "lr": 0.0003290919574287173, "tps": 14116, "wall": 44763.8} {"step": 9642, "train_loss": 3.57855224609375, "lr": 0.00032907671826904714, "tps": 14115, "wall": 44771.8} {"step": 9643, "train_loss": 3.5744519233703613, "lr": 0.0003290614778737501, "tps": 14114, "wall": 44779.8} {"step": 9644, "train_loss": 3.5777289867401123, "lr": 0.0003290462362429986, "tps": 14113, "wall": 44787.9} {"step": 9645, "train_loss": 3.5802862644195557, "lr": 0.00032903099337696555, "tps": 14111, "wall": 44796.0} {"step": 9646, "train_loss": 3.597458839416504, "lr": 0.0003290157492758235, "tps": 14110, "wall": 44804.0} {"step": 9647, "train_loss": 3.516836404800415, "lr": 0.00032900050393974505, "tps": 14109, "wall": 44812.1} {"step": 9648, "train_loss": 3.593518018722534, "lr": 0.0003289852573689031, "tps": 14108, "wall": 44820.2} {"step": 9649, "train_loss": 3.5807881355285645, "lr": 0.00032897000956347023, "tps": 14107, "wall": 44828.2} {"step": 9650, "train_loss": 3.551780939102173, "lr": 0.0003289547605236192, "tps": 14106, "wall": 44836.3} {"step": 9651, "train_loss": 3.6138010025024414, "lr": 0.00032893951024952274, "tps": 14105, "wall": 44844.3} {"step": 9652, "train_loss": 3.4839553833007812, "lr": 0.0003289242587413536, "tps": 14104, "wall": 44852.3} {"step": 9653, "train_loss": 3.5040059089660645, "lr": 0.00032890900599928457, "tps": 14103, "wall": 44860.5} {"step": 9654, "train_loss": 3.533863067626953, "lr": 0.0003288937520234884, "tps": 14102, "wall": 44868.5} {"step": 9655, "train_loss": 3.6482644081115723, "lr": 0.00032887849681413796, "tps": 14101, "wall": 44876.6} {"step": 9656, "train_loss": 3.48252272605896, "lr": 0.00032886324037140603, "tps": 14100, "wall": 44884.6} {"step": 9657, "train_loss": 3.543356418609619, "lr": 0.00032884798269546537, "tps": 14099, "wall": 44892.5} {"step": 9658, "train_loss": 3.601177930831909, "lr": 0.0003288327237864889, "tps": 14098, "wall": 44900.5} {"step": 9659, "train_loss": 3.598269462585449, "lr": 0.0003288174636446494, "tps": 14097, "wall": 44908.5} {"step": 9660, "train_loss": 3.534546136856079, "lr": 0.00032880220227011987, "tps": 14095, "wall": 44916.6} {"step": 9661, "train_loss": 3.5220210552215576, "lr": 0.00032878693966307307, "tps": 14094, "wall": 44924.6} {"step": 9662, "train_loss": 3.552800416946411, "lr": 0.00032877167582368196, "tps": 14093, "wall": 44932.5} {"step": 9663, "train_loss": 3.6345038414001465, "lr": 0.0003287564107521194, "tps": 14092, "wall": 44940.5} {"step": 9664, "train_loss": 3.480372428894043, "lr": 0.00032874114444855833, "tps": 14091, "wall": 44948.5} {"step": 9665, "train_loss": 3.559079170227051, "lr": 0.00032872587691317167, "tps": 14090, "wall": 44956.5} {"step": 9666, "train_loss": 3.536101818084717, "lr": 0.0003287106081461324, "tps": 14089, "wall": 44964.6} {"step": 9667, "train_loss": 3.5598621368408203, "lr": 0.00032869533814761353, "tps": 14088, "wall": 44972.5} {"step": 9668, "train_loss": 3.5283327102661133, "lr": 0.00032868006691778797, "tps": 14087, "wall": 44980.7} {"step": 9669, "train_loss": 3.553684711456299, "lr": 0.00032866479445682866, "tps": 14086, "wall": 44988.6} {"step": 9670, "train_loss": 3.5616068840026855, "lr": 0.00032864952076490877, "tps": 14085, "wall": 44996.7} {"step": 9671, "train_loss": 3.566649913787842, "lr": 0.0003286342458422012, "tps": 14084, "wall": 45004.6} {"step": 9672, "train_loss": 3.5795841217041016, "lr": 0.000328618969688879, "tps": 14083, "wall": 45012.5} {"step": 9673, "train_loss": 3.5346364974975586, "lr": 0.00032860369230511526, "tps": 14082, "wall": 45020.5} {"step": 9674, "train_loss": 3.5465307235717773, "lr": 0.00032858841369108296, "tps": 14081, "wall": 45028.8} {"step": 9675, "train_loss": 3.542339563369751, "lr": 0.0003285731338469553, "tps": 14080, "wall": 45036.9} {"step": 9676, "train_loss": 3.5392704010009766, "lr": 0.0003285578527729053, "tps": 14079, "wall": 45045.2} {"step": 9677, "train_loss": 3.5143227577209473, "lr": 0.00032854257046910606, "tps": 14077, "wall": 45053.2} {"step": 9678, "train_loss": 3.46923828125, "lr": 0.00032852728693573077, "tps": 14076, "wall": 45061.1} {"step": 9679, "train_loss": 3.6097140312194824, "lr": 0.0003285120021729524, "tps": 14075, "wall": 45069.1} {"step": 9680, "train_loss": 3.525944232940674, "lr": 0.00032849671618094425, "tps": 14074, "wall": 45077.3} {"step": 9681, "train_loss": 3.6246776580810547, "lr": 0.0003284814289598793, "tps": 14073, "wall": 45085.3} {"step": 9682, "train_loss": 3.4716434478759766, "lr": 0.0003284661405099311, "tps": 14072, "wall": 45093.3} {"step": 9683, "train_loss": 3.6687309741973877, "lr": 0.00032845085083127245, "tps": 14071, "wall": 45101.4} {"step": 9684, "train_loss": 3.603865146636963, "lr": 0.0003284355599240767, "tps": 14070, "wall": 45109.5} {"step": 9685, "train_loss": 3.497105360031128, "lr": 0.00032842026778851706, "tps": 14069, "wall": 45117.7} {"step": 9686, "train_loss": 3.5551772117614746, "lr": 0.00032840497442476675, "tps": 14068, "wall": 45125.5} {"step": 9687, "train_loss": 3.5725488662719727, "lr": 0.0003283896798329991, "tps": 14067, "wall": 45133.6} {"step": 9688, "train_loss": 3.6458580493927, "lr": 0.00032837438401338726, "tps": 14066, "wall": 45141.6} {"step": 9689, "train_loss": 3.434645414352417, "lr": 0.0003283590869661044, "tps": 14065, "wall": 45149.7} {"step": 9690, "train_loss": 3.4851832389831543, "lr": 0.00032834378869132415, "tps": 14064, "wall": 45157.7} {"step": 9691, "train_loss": 3.6030948162078857, "lr": 0.0003283284891892195, "tps": 14063, "wall": 45165.9} {"step": 9692, "train_loss": 3.54714298248291, "lr": 0.00032831318845996383, "tps": 14062, "wall": 45173.9} {"step": 9693, "train_loss": 3.444334030151367, "lr": 0.0003282978865037305, "tps": 14061, "wall": 45181.9} {"step": 9694, "train_loss": 3.5797924995422363, "lr": 0.00032828258332069296, "tps": 14060, "wall": 45189.9} {"step": 9695, "train_loss": 3.5421760082244873, "lr": 0.0003282672789110244, "tps": 14058, "wall": 45198.0} {"step": 9696, "train_loss": 3.533350944519043, "lr": 0.00032825197327489823, "tps": 14057, "wall": 45206.1} {"step": 9697, "train_loss": 3.4817991256713867, "lr": 0.0003282366664124879, "tps": 14056, "wall": 45214.2} {"step": 9698, "train_loss": 3.563490390777588, "lr": 0.0003282213583239667, "tps": 14055, "wall": 45222.2} {"step": 9699, "train_loss": 3.5896315574645996, "lr": 0.0003282060490095081, "tps": 14054, "wall": 45230.3} {"step": 9700, "train_loss": 3.6047592163085938, "lr": 0.0003281907384692855, "tps": 14053, "wall": 45238.4} {"step": 9701, "train_loss": 3.476799964904785, "lr": 0.00032817542670347246, "tps": 14052, "wall": 45246.3} {"step": 9702, "train_loss": 3.4933979511260986, "lr": 0.0003281601137122423, "tps": 14051, "wall": 45254.4} {"step": 9703, "train_loss": 3.49686336517334, "lr": 0.00032814479949576847, "tps": 14050, "wall": 45262.5} {"step": 9704, "train_loss": 3.4692018032073975, "lr": 0.0003281294840542245, "tps": 14049, "wall": 45270.6} {"step": 9705, "train_loss": 3.523681402206421, "lr": 0.00032811416738778393, "tps": 14048, "wall": 45278.8} {"step": 9706, "train_loss": 3.4063873291015625, "lr": 0.0003280988494966202, "tps": 14047, "wall": 45286.8} {"step": 9707, "train_loss": 3.478912353515625, "lr": 0.0003280835303809069, "tps": 14046, "wall": 45294.9} {"step": 9708, "train_loss": 3.515026807785034, "lr": 0.00032806821004081747, "tps": 14045, "wall": 45303.0} {"step": 9709, "train_loss": 3.5083370208740234, "lr": 0.00032805288847652554, "tps": 14044, "wall": 45311.0} {"step": 9710, "train_loss": 3.5119333267211914, "lr": 0.0003280375656882046, "tps": 14043, "wall": 45319.2} {"step": 9711, "train_loss": 3.48443341255188, "lr": 0.0003280222416760283, "tps": 14041, "wall": 45327.4} {"step": 9712, "train_loss": 3.5061817169189453, "lr": 0.00032800691644017016, "tps": 14040, "wall": 45335.3} {"step": 9713, "train_loss": 3.5230751037597656, "lr": 0.0003279915899808039, "tps": 14039, "wall": 45343.5} {"step": 9714, "train_loss": 3.503908634185791, "lr": 0.00032797626229810306, "tps": 14038, "wall": 45351.5} {"step": 9715, "train_loss": 3.577378511428833, "lr": 0.0003279609333922412, "tps": 14037, "wall": 45359.7} {"step": 9716, "train_loss": 3.515552520751953, "lr": 0.0003279456032633921, "tps": 14036, "wall": 45367.7} {"step": 9717, "train_loss": 3.556556224822998, "lr": 0.00032793027191172934, "tps": 14035, "wall": 45375.9} {"step": 9718, "train_loss": 3.583160638809204, "lr": 0.00032791493933742664, "tps": 14034, "wall": 45383.9} {"step": 9719, "train_loss": 3.5317916870117188, "lr": 0.0003278996055406577, "tps": 14033, "wall": 45392.1} {"step": 9720, "train_loss": 3.507429838180542, "lr": 0.00032788427052159614, "tps": 14032, "wall": 45400.0} {"step": 9721, "train_loss": 3.613701105117798, "lr": 0.0003278689342804158, "tps": 14031, "wall": 45408.2} {"step": 9722, "train_loss": 3.4818484783172607, "lr": 0.00032785359681729027, "tps": 14030, "wall": 45416.2} {"step": 9723, "train_loss": 3.630016326904297, "lr": 0.0003278382581323934, "tps": 14029, "wall": 45424.3} {"step": 9724, "train_loss": 3.4931392669677734, "lr": 0.0003278229182258989, "tps": 14028, "wall": 45432.3} {"step": 9725, "train_loss": 3.5027928352355957, "lr": 0.0003278075770979805, "tps": 14027, "wall": 45440.3} {"step": 9726, "train_loss": 3.4947502613067627, "lr": 0.0003277922347488121, "tps": 14026, "wall": 45448.4} {"step": 9727, "train_loss": 3.4898293018341064, "lr": 0.00032777689117856736, "tps": 14025, "wall": 45456.5} {"step": 9728, "train_loss": 3.4611949920654297, "lr": 0.00032776154638742026, "tps": 14024, "wall": 45464.5} {"step": 9729, "train_loss": 3.6138694286346436, "lr": 0.00032774620037554446, "tps": 14023, "wall": 45472.6} {"step": 9730, "train_loss": 3.6029186248779297, "lr": 0.0003277308531431139, "tps": 14022, "wall": 45480.7} {"step": 9731, "train_loss": 3.4934208393096924, "lr": 0.0003277155046903024, "tps": 14021, "wall": 45488.6} {"step": 9732, "train_loss": 3.526824712753296, "lr": 0.0003277001550172839, "tps": 14019, "wall": 45496.7} {"step": 9733, "train_loss": 3.571873188018799, "lr": 0.0003276848041242321, "tps": 14018, "wall": 45504.8} {"step": 9734, "train_loss": 3.5520806312561035, "lr": 0.0003276694520113211, "tps": 14017, "wall": 45512.9} {"step": 9735, "train_loss": 3.5862433910369873, "lr": 0.0003276540986787247, "tps": 14016, "wall": 45520.9} {"step": 9736, "train_loss": 3.5920557975769043, "lr": 0.0003276387441266168, "tps": 14015, "wall": 45529.1} {"step": 9737, "train_loss": 3.440134286880493, "lr": 0.0003276233883551714, "tps": 14014, "wall": 45537.2} {"step": 9738, "train_loss": 3.48299503326416, "lr": 0.0003276080313645625, "tps": 14013, "wall": 45545.3} {"step": 9739, "train_loss": 3.4738826751708984, "lr": 0.00032759267315496393, "tps": 14012, "wall": 45553.3} {"step": 9740, "train_loss": 3.519912004470825, "lr": 0.00032757731372654974, "tps": 14011, "wall": 45561.4} {"step": 9741, "train_loss": 3.622903347015381, "lr": 0.000327561953079494, "tps": 14010, "wall": 45569.6} {"step": 9742, "train_loss": 3.619489908218384, "lr": 0.00032754659121397053, "tps": 14009, "wall": 45577.6} {"step": 9743, "train_loss": 3.553401470184326, "lr": 0.00032753122813015354, "tps": 14008, "wall": 45585.8} {"step": 9744, "train_loss": 3.5539329051971436, "lr": 0.0003275158638282169, "tps": 14007, "wall": 45593.9} {"step": 9745, "train_loss": 3.4642295837402344, "lr": 0.0003275004983083348, "tps": 14006, "wall": 45602.1} {"step": 9746, "train_loss": 3.543820381164551, "lr": 0.00032748513157068124, "tps": 14005, "wall": 45610.1} {"step": 9747, "train_loss": 3.5257298946380615, "lr": 0.0003274697636154303, "tps": 14004, "wall": 45618.2} {"step": 9748, "train_loss": 3.496687889099121, "lr": 0.00032745439444275604, "tps": 14003, "wall": 45626.2} {"step": 9749, "train_loss": 3.4277377128601074, "lr": 0.0003274390240528326, "tps": 14002, "wall": 45634.3} {"step": 9750, "train_loss": 3.5650405883789062, "lr": 0.0003274236524458341, "tps": 14001, "wall": 45642.5} {"step": 9751, "train_loss": 3.5130209922790527, "lr": 0.0003274082796219346, "tps": 13999, "wall": 45650.7} {"step": 9752, "train_loss": 3.5282959938049316, "lr": 0.0003273929055813083, "tps": 13998, "wall": 45658.7} {"step": 9753, "train_loss": 3.6179447174072266, "lr": 0.0003273775303241294, "tps": 13997, "wall": 45666.7} {"step": 9754, "train_loss": 3.564291000366211, "lr": 0.00032736215385057197, "tps": 13996, "wall": 45674.7} {"step": 9755, "train_loss": 3.505103826522827, "lr": 0.0003273467761608103, "tps": 13995, "wall": 45682.8} {"step": 9756, "train_loss": 3.5808262825012207, "lr": 0.0003273313972550185, "tps": 13994, "wall": 45690.8} {"step": 9757, "train_loss": 3.486206531524658, "lr": 0.0003273160171333709, "tps": 13993, "wall": 45699.0} {"step": 9758, "train_loss": 3.5571439266204834, "lr": 0.00032730063579604167, "tps": 13992, "wall": 45707.1} {"step": 9759, "train_loss": 3.466827392578125, "lr": 0.00032728525324320497, "tps": 13991, "wall": 45715.2} {"step": 9760, "train_loss": 3.4676313400268555, "lr": 0.0003272698694750351, "tps": 13990, "wall": 45723.3} {"step": 9761, "train_loss": 3.542207717895508, "lr": 0.0003272544844917063, "tps": 13989, "wall": 45731.4} {"step": 9762, "train_loss": 3.4416115283966064, "lr": 0.000327239098293393, "tps": 13988, "wall": 45739.6} {"step": 9763, "train_loss": 3.5624732971191406, "lr": 0.00032722371088026933, "tps": 13987, "wall": 45747.6} {"step": 9764, "train_loss": 3.5165231227874756, "lr": 0.0003272083222525097, "tps": 13986, "wall": 45755.7} {"step": 9765, "train_loss": 3.4477248191833496, "lr": 0.00032719293241028843, "tps": 13985, "wall": 45763.6} {"step": 9766, "train_loss": 3.6252167224884033, "lr": 0.00032717754135377973, "tps": 13984, "wall": 45771.8} {"step": 9767, "train_loss": 3.478903293609619, "lr": 0.0003271621490831581, "tps": 13983, "wall": 45779.9} {"step": 9768, "train_loss": 3.5352225303649902, "lr": 0.00032714675559859785, "tps": 13982, "wall": 45788.0} {"step": 9769, "train_loss": 3.4705214500427246, "lr": 0.00032713136090027335, "tps": 13981, "wall": 45796.2} {"step": 9770, "train_loss": 3.484583854675293, "lr": 0.00032711596498835897, "tps": 13980, "wall": 45804.3} {"step": 9771, "train_loss": 3.578981399536133, "lr": 0.0003271005678630292, "tps": 13979, "wall": 45812.3} {"step": 9772, "train_loss": 3.5423569679260254, "lr": 0.00032708516952445834, "tps": 13978, "wall": 45820.3} {"step": 9773, "train_loss": 3.609954595565796, "lr": 0.00032706976997282094, "tps": 13977, "wall": 45828.4} {"step": 9774, "train_loss": 3.561999559402466, "lr": 0.0003270543692082914, "tps": 13976, "wall": 45836.5} {"step": 9775, "train_loss": 3.446071147918701, "lr": 0.0003270389672310441, "tps": 13975, "wall": 45844.5} {"step": 9776, "train_loss": 3.5052435398101807, "lr": 0.00032702356404125366, "tps": 13974, "wall": 45852.5} {"step": 9777, "train_loss": 3.521033525466919, "lr": 0.0003270081596390944, "tps": 13972, "wall": 45860.7} {"step": 9778, "train_loss": 3.447176456451416, "lr": 0.000326992754024741, "tps": 13971, "wall": 45868.7} {"step": 9779, "train_loss": 3.4452013969421387, "lr": 0.00032697734719836787, "tps": 13970, "wall": 45876.8} {"step": 9780, "train_loss": 3.4686570167541504, "lr": 0.00032696193916014957, "tps": 13969, "wall": 45884.7} {"step": 9781, "train_loss": 3.558460235595703, "lr": 0.0003269465299102607, "tps": 13968, "wall": 45892.8} {"step": 9782, "train_loss": 3.544264793395996, "lr": 0.0003269311194488756, "tps": 13967, "wall": 45900.8} {"step": 9783, "train_loss": 3.591998338699341, "lr": 0.00032691570777616916, "tps": 13966, "wall": 45908.9} {"step": 9784, "train_loss": 3.4984993934631348, "lr": 0.00032690029489231573, "tps": 13965, "wall": 45917.0} {"step": 9785, "train_loss": 3.5608766078948975, "lr": 0.00032688488079748995, "tps": 13964, "wall": 45925.2} {"step": 9786, "train_loss": 3.4627246856689453, "lr": 0.00032686946549186655, "tps": 13963, "wall": 45933.4} {"step": 9787, "train_loss": 3.44663143157959, "lr": 0.00032685404897561996, "tps": 13962, "wall": 45941.4} {"step": 9788, "train_loss": 3.5764260292053223, "lr": 0.0003268386312489249, "tps": 13961, "wall": 45949.6} {"step": 9789, "train_loss": 3.5232717990875244, "lr": 0.00032682321231195617, "tps": 13960, "wall": 45957.7} {"step": 9790, "train_loss": 3.543351650238037, "lr": 0.00032680779216488824, "tps": 13959, "wall": 45965.7} {"step": 9791, "train_loss": 3.6089253425598145, "lr": 0.00032679237080789585, "tps": 13958, "wall": 45973.6} {"step": 9792, "train_loss": 3.5112342834472656, "lr": 0.0003267769482411537, "tps": 13957, "wall": 45981.7} {"step": 9793, "train_loss": 3.408341884613037, "lr": 0.00032676152446483653, "tps": 13956, "wall": 45989.9} {"step": 9794, "train_loss": 3.5854263305664062, "lr": 0.00032674609947911905, "tps": 13955, "wall": 45997.9} {"step": 9795, "train_loss": 3.5986294746398926, "lr": 0.0003267306732841759, "tps": 13954, "wall": 46006.0} {"step": 9796, "train_loss": 3.6001455783843994, "lr": 0.000326715245880182, "tps": 13953, "wall": 46014.0} {"step": 9797, "train_loss": 3.4822540283203125, "lr": 0.00032669981726731205, "tps": 13952, "wall": 46022.1} {"step": 9798, "train_loss": 3.5456180572509766, "lr": 0.00032668438744574074, "tps": 13951, "wall": 46030.1} {"step": 9799, "train_loss": 3.56587815284729, "lr": 0.0003266689564156429, "tps": 13950, "wall": 46038.1} {"step": 9800, "train_loss": 3.5401434898376465, "lr": 0.00032665352417719334, "tps": 13949, "wall": 46046.3} {"step": 9801, "train_loss": 3.5421135425567627, "lr": 0.00032663809073056697, "tps": 13948, "wall": 46054.3} {"step": 9802, "train_loss": 3.6009130477905273, "lr": 0.00032662265607593847, "tps": 13947, "wall": 46062.3} {"step": 9803, "train_loss": 3.525197744369507, "lr": 0.0003266072202134828, "tps": 13946, "wall": 46070.4} {"step": 9804, "train_loss": 3.5542850494384766, "lr": 0.0003265917831433747, "tps": 13945, "wall": 46078.4} {"step": 9805, "train_loss": 3.4971261024475098, "lr": 0.00032657634486578916, "tps": 13944, "wall": 46086.3} {"step": 9806, "train_loss": 3.5539679527282715, "lr": 0.000326560905380901, "tps": 13943, "wall": 46094.4} {"step": 9807, "train_loss": 3.4718332290649414, "lr": 0.00032654546468888516, "tps": 13942, "wall": 46102.4} {"step": 9808, "train_loss": 3.5059409141540527, "lr": 0.0003265300227899165, "tps": 13941, "wall": 46110.5} {"step": 9809, "train_loss": 3.6126139163970947, "lr": 0.00032651457968417005, "tps": 13940, "wall": 46118.5} {"step": 9810, "train_loss": 3.5535707473754883, "lr": 0.0003264991353718206, "tps": 13939, "wall": 46126.6} {"step": 9811, "train_loss": 3.637542247772217, "lr": 0.00032648368985304326, "tps": 13938, "wall": 46134.6} {"step": 9812, "train_loss": 3.5932774543762207, "lr": 0.00032646824312801285, "tps": 13937, "wall": 46142.7} {"step": 9813, "train_loss": 3.572284698486328, "lr": 0.00032645279519690444, "tps": 13936, "wall": 46150.7} {"step": 9814, "train_loss": 3.531534433364868, "lr": 0.00032643734605989304, "tps": 13935, "wall": 46158.8} {"step": 9815, "train_loss": 3.485987663269043, "lr": 0.0003264218957171536, "tps": 13934, "wall": 46166.8} {"step": 9816, "train_loss": 3.4623899459838867, "lr": 0.0003264064441688612, "tps": 13933, "wall": 46174.9} {"step": 9817, "train_loss": 3.605982780456543, "lr": 0.00032639099141519074, "tps": 13932, "wall": 46182.9} {"step": 9818, "train_loss": 3.465458393096924, "lr": 0.0003263755374563175, "tps": 13931, "wall": 46191.0} {"step": 9819, "train_loss": 3.5808169841766357, "lr": 0.00032636008229241636, "tps": 13930, "wall": 46199.2} {"step": 9820, "train_loss": 3.540144681930542, "lr": 0.00032634462592366246, "tps": 13929, "wall": 46207.2} {"step": 9821, "train_loss": 3.6135001182556152, "lr": 0.00032632916835023093, "tps": 13928, "wall": 46215.2} {"step": 9822, "train_loss": 3.5105209350585938, "lr": 0.00032631370957229676, "tps": 13927, "wall": 46223.3} {"step": 9823, "train_loss": 3.525705337524414, "lr": 0.00032629824959003515, "tps": 13926, "wall": 46231.2} {"step": 9824, "train_loss": 3.555520534515381, "lr": 0.00032628278840362126, "tps": 13925, "wall": 46239.3} {"step": 9825, "train_loss": 3.542685031890869, "lr": 0.0003262673260132301, "tps": 13924, "wall": 46247.4} {"step": 9826, "train_loss": 3.6151201725006104, "lr": 0.00032625186241903696, "tps": 13923, "wall": 46255.5} {"step": 9827, "train_loss": 3.4990522861480713, "lr": 0.000326236397621217, "tps": 13922, "wall": 46263.5} {"step": 9828, "train_loss": 3.554201602935791, "lr": 0.00032622093161994536, "tps": 13921, "wall": 46271.5} {"step": 9829, "train_loss": 3.5288212299346924, "lr": 0.0003262054644153973, "tps": 13920, "wall": 46279.5} {"step": 9830, "train_loss": 3.5994608402252197, "lr": 0.000326189996007748, "tps": 13919, "wall": 46287.6} {"step": 9831, "train_loss": 3.4964747428894043, "lr": 0.00032617452639717263, "tps": 13918, "wall": 46295.7} {"step": 9832, "train_loss": 3.563819408416748, "lr": 0.0003261590555838465, "tps": 13917, "wall": 46303.8} {"step": 9833, "train_loss": 3.5715651512145996, "lr": 0.0003261435835679449, "tps": 13916, "wall": 46311.8} {"step": 9834, "train_loss": 3.4841127395629883, "lr": 0.0003261281103496429, "tps": 13915, "wall": 46319.8} {"step": 9835, "train_loss": 3.5192689895629883, "lr": 0.00032611263592911605, "tps": 13914, "wall": 46327.8} {"step": 9836, "train_loss": 3.6479251384735107, "lr": 0.0003260971603065395, "tps": 13913, "wall": 46335.8} {"step": 9837, "train_loss": 3.5659079551696777, "lr": 0.0003260816834820885, "tps": 13912, "wall": 46343.8} {"step": 9838, "train_loss": 3.545417547225952, "lr": 0.0003260662054559386, "tps": 13911, "wall": 46351.8} {"step": 9839, "train_loss": 3.5910472869873047, "lr": 0.00032605072622826485, "tps": 13910, "wall": 46359.7} {"step": 9840, "train_loss": 3.535658597946167, "lr": 0.00032603524579924285, "tps": 13909, "wall": 46367.8} {"step": 9841, "train_loss": 3.5192930698394775, "lr": 0.00032601976416904774, "tps": 13908, "wall": 46375.8} {"step": 9842, "train_loss": 3.480407238006592, "lr": 0.0003260042813378551, "tps": 13907, "wall": 46383.7} {"step": 9843, "train_loss": 3.4641916751861572, "lr": 0.0003259887973058401, "tps": 13906, "wall": 46391.7} {"step": 9844, "train_loss": 3.4217448234558105, "lr": 0.00032597331207317835, "tps": 13905, "wall": 46399.7} {"step": 9845, "train_loss": 3.4842581748962402, "lr": 0.0003259578256400452, "tps": 13904, "wall": 46407.8} {"step": 9846, "train_loss": 3.5895462036132812, "lr": 0.00032594233800661604, "tps": 13903, "wall": 46415.8} {"step": 9847, "train_loss": 3.4817402362823486, "lr": 0.0003259268491730664, "tps": 13902, "wall": 46423.9} {"step": 9848, "train_loss": 3.5232138633728027, "lr": 0.0003259113591395716, "tps": 13901, "wall": 46432.0} {"step": 9849, "train_loss": 3.6328470706939697, "lr": 0.00032589586790630724, "tps": 13900, "wall": 46440.0} {"step": 9850, "train_loss": 3.4916274547576904, "lr": 0.0003258803754734488, "tps": 13899, "wall": 46447.9} {"step": 9851, "train_loss": 3.446803569793701, "lr": 0.00032586488184117163, "tps": 13898, "wall": 46455.9} {"step": 9852, "train_loss": 3.4666104316711426, "lr": 0.00032584938700965145, "tps": 13897, "wall": 46463.8} {"step": 9853, "train_loss": 3.4419469833374023, "lr": 0.0003258338909790637, "tps": 13896, "wall": 46471.8} {"step": 9854, "train_loss": 3.4911975860595703, "lr": 0.0003258183937495838, "tps": 13895, "wall": 46479.8} {"step": 9855, "train_loss": 3.4785070419311523, "lr": 0.00032580289532138743, "tps": 13894, "wall": 46488.0} {"step": 9856, "train_loss": 3.6273856163024902, "lr": 0.00032578739569465024, "tps": 13893, "wall": 46496.0} {"step": 9857, "train_loss": 3.625188112258911, "lr": 0.00032577189486954764, "tps": 13892, "wall": 46503.9} {"step": 9858, "train_loss": 3.492941379547119, "lr": 0.00032575639284625527, "tps": 13891, "wall": 46512.0} {"step": 9859, "train_loss": 3.58099627494812, "lr": 0.0003257408896249488, "tps": 13890, "wall": 46520.1} {"step": 9860, "train_loss": 3.411090850830078, "lr": 0.0003257253852058038, "tps": 13889, "wall": 46528.2} {"step": 9861, "train_loss": 3.522188901901245, "lr": 0.00032570987958899597, "tps": 13888, "wall": 46536.3} {"step": 9862, "train_loss": 3.539799690246582, "lr": 0.0003256943727747008, "tps": 13887, "wall": 46544.3} {"step": 9863, "train_loss": 3.526581048965454, "lr": 0.00032567886476309407, "tps": 13886, "wall": 46552.3} {"step": 9864, "train_loss": 3.4525442123413086, "lr": 0.00032566335555435155, "tps": 13885, "wall": 46560.4} {"step": 9865, "train_loss": 3.6005682945251465, "lr": 0.0003256478451486487, "tps": 13884, "wall": 46568.4} {"step": 9866, "train_loss": 3.6160945892333984, "lr": 0.0003256323335461614, "tps": 13883, "wall": 46576.3} {"step": 9867, "train_loss": 3.5307624340057373, "lr": 0.00032561682074706534, "tps": 13882, "wall": 46584.4} {"step": 9868, "train_loss": 3.46805477142334, "lr": 0.0003256013067515362, "tps": 13881, "wall": 46592.4} {"step": 9869, "train_loss": 3.5054917335510254, "lr": 0.0003255857915597497, "tps": 13880, "wall": 46600.4} {"step": 9870, "train_loss": 3.43369197845459, "lr": 0.0003255702751718817, "tps": 13879, "wall": 46608.5} {"step": 9871, "train_loss": 3.5352187156677246, "lr": 0.00032555475758810784, "tps": 13878, "wall": 46616.6} {"step": 9872, "train_loss": 3.514645576477051, "lr": 0.0003255392388086041, "tps": 13877, "wall": 46624.5} {"step": 9873, "train_loss": 3.544440269470215, "lr": 0.000325523718833546, "tps": 13876, "wall": 46632.6} {"step": 9874, "train_loss": 3.474780559539795, "lr": 0.00032550819766310964, "tps": 13875, "wall": 46640.6} {"step": 9875, "train_loss": 3.556919574737549, "lr": 0.00032549267529747065, "tps": 13874, "wall": 46648.7} {"step": 9876, "train_loss": 3.5026891231536865, "lr": 0.0003254771517368049, "tps": 13873, "wall": 46656.7} {"step": 9877, "train_loss": 3.458406448364258, "lr": 0.00032546162698128826, "tps": 13872, "wall": 46664.7} {"step": 9878, "train_loss": 3.5654187202453613, "lr": 0.0003254461010310967, "tps": 13871, "wall": 46672.7} {"step": 9879, "train_loss": 3.5890188217163086, "lr": 0.0003254305738864059, "tps": 13870, "wall": 46680.9} {"step": 9880, "train_loss": 3.554377555847168, "lr": 0.0003254150455473919, "tps": 13869, "wall": 46688.7} {"step": 9881, "train_loss": 3.5381669998168945, "lr": 0.00032539951601423056, "tps": 13868, "wall": 46696.7} {"step": 9882, "train_loss": 3.475299835205078, "lr": 0.00032538398528709784, "tps": 13867, "wall": 46704.7} {"step": 9883, "train_loss": 3.5408082008361816, "lr": 0.0003253684533661695, "tps": 13866, "wall": 46712.7} {"step": 9884, "train_loss": 3.542370319366455, "lr": 0.00032535292025162176, "tps": 13865, "wall": 46720.8} {"step": 9885, "train_loss": 3.450472354888916, "lr": 0.00032533738594363044, "tps": 13864, "wall": 46728.9} {"step": 9886, "train_loss": 3.556365489959717, "lr": 0.00032532185044237147, "tps": 13863, "wall": 46737.0} {"step": 9887, "train_loss": 3.525998592376709, "lr": 0.0003253063137480208, "tps": 13862, "wall": 46745.0} {"step": 9888, "train_loss": 3.5278234481811523, "lr": 0.0003252907758607546, "tps": 13861, "wall": 46752.8} {"step": 9889, "train_loss": 3.415666341781616, "lr": 0.00032527523678074885, "tps": 13860, "wall": 46760.9} {"step": 9890, "train_loss": 3.4533028602600098, "lr": 0.0003252596965081794, "tps": 13859, "wall": 46768.9} {"step": 9891, "train_loss": 3.623537540435791, "lr": 0.0003252441550432225, "tps": 13858, "wall": 46777.0} {"step": 9892, "train_loss": 3.608107566833496, "lr": 0.0003252286123860541, "tps": 13858, "wall": 46785.0} {"step": 9893, "train_loss": 3.514707565307617, "lr": 0.00032521306853685027, "tps": 13857, "wall": 46793.1} {"step": 9894, "train_loss": 3.465747833251953, "lr": 0.0003251975234957871, "tps": 13856, "wall": 46801.1} {"step": 9895, "train_loss": 3.578467607498169, "lr": 0.0003251819772630407, "tps": 13855, "wall": 46809.1} {"step": 9896, "train_loss": 3.489504337310791, "lr": 0.0003251664298387872, "tps": 13854, "wall": 46817.1} {"step": 9897, "train_loss": 3.5202646255493164, "lr": 0.00032515088122320266, "tps": 13853, "wall": 46825.0} {"step": 9898, "train_loss": 3.651470184326172, "lr": 0.0003251353314164633, "tps": 13852, "wall": 46833.1} {"step": 9899, "train_loss": 3.6253504753112793, "lr": 0.00032511978041874516, "tps": 13851, "wall": 46841.2} {"step": 9900, "train_loss": 3.4756016731262207, "lr": 0.0003251042282302245, "tps": 13850, "wall": 46849.3} {"step": 9901, "train_loss": 3.557826280593872, "lr": 0.0003250886748510774, "tps": 13849, "wall": 46857.5} {"step": 9902, "train_loss": 3.5470924377441406, "lr": 0.00032507312028148014, "tps": 13848, "wall": 46865.4} {"step": 9903, "train_loss": 3.5242576599121094, "lr": 0.0003250575645216089, "tps": 13847, "wall": 46873.4} {"step": 9904, "train_loss": 3.4707939624786377, "lr": 0.0003250420075716398, "tps": 13846, "wall": 46881.5} {"step": 9905, "train_loss": 3.497252941131592, "lr": 0.00032502644943174926, "tps": 13845, "wall": 46889.5} {"step": 9906, "train_loss": 3.517179012298584, "lr": 0.00032501089010211336, "tps": 13844, "wall": 46897.6} {"step": 9907, "train_loss": 3.504141330718994, "lr": 0.0003249953295829085, "tps": 13843, "wall": 46905.7} {"step": 9908, "train_loss": 3.504239082336426, "lr": 0.00032497976787431083, "tps": 13842, "wall": 46913.8} {"step": 9909, "train_loss": 3.4851021766662598, "lr": 0.0003249642049764966, "tps": 13841, "wall": 46921.7} {"step": 9910, "train_loss": 3.518045663833618, "lr": 0.0003249486408896423, "tps": 13840, "wall": 46929.7} {"step": 9911, "train_loss": 3.52020525932312, "lr": 0.000324933075613924, "tps": 13839, "wall": 46937.8} {"step": 9912, "train_loss": 3.4452528953552246, "lr": 0.0003249175091495182, "tps": 13838, "wall": 46946.0} {"step": 9913, "train_loss": 3.615118980407715, "lr": 0.00032490194149660117, "tps": 13837, "wall": 46954.0} {"step": 9914, "train_loss": 3.492375612258911, "lr": 0.0003248863726553492, "tps": 13836, "wall": 46962.0} {"step": 9915, "train_loss": 3.518700122833252, "lr": 0.00032487080262593885, "tps": 13835, "wall": 46970.2} {"step": 9916, "train_loss": 3.4695510864257812, "lr": 0.0003248552314085463, "tps": 13834, "wall": 46978.3} {"step": 9917, "train_loss": 3.546628713607788, "lr": 0.0003248396590033481, "tps": 13833, "wall": 46986.2} {"step": 9918, "train_loss": 3.464517593383789, "lr": 0.00032482408541052043, "tps": 13832, "wall": 46994.1} {"step": 9919, "train_loss": 3.483569622039795, "lr": 0.00032480851063023997, "tps": 13831, "wall": 47002.1} {"step": 9920, "train_loss": 3.4804091453552246, "lr": 0.000324792934662683, "tps": 13830, "wall": 47010.1} {"step": 9921, "train_loss": 3.5608901977539062, "lr": 0.00032477735750802595, "tps": 13829, "wall": 47018.3} {"step": 9922, "train_loss": 3.5684502124786377, "lr": 0.00032476177916644536, "tps": 13828, "wall": 47026.4} {"step": 9923, "train_loss": 3.583794116973877, "lr": 0.00032474619963811767, "tps": 13827, "wall": 47034.4} {"step": 9924, "train_loss": 3.638920783996582, "lr": 0.0003247306189232194, "tps": 13826, "wall": 47042.4} {"step": 9925, "train_loss": 3.5099143981933594, "lr": 0.00032471503702192697, "tps": 13825, "wall": 47050.5} {"step": 9926, "train_loss": 3.514591932296753, "lr": 0.0003246994539344169, "tps": 13824, "wall": 47058.5} {"step": 9927, "train_loss": 3.508607864379883, "lr": 0.0003246838696608658, "tps": 13823, "wall": 47066.4} {"step": 9928, "train_loss": 3.4692678451538086, "lr": 0.0003246682842014502, "tps": 13822, "wall": 47074.5} {"step": 9929, "train_loss": 3.520991802215576, "lr": 0.0003246526975563465, "tps": 13821, "wall": 47082.4} {"step": 9930, "train_loss": 3.4974629878997803, "lr": 0.0003246371097257315, "tps": 13821, "wall": 47090.4} {"step": 9931, "train_loss": 3.530857563018799, "lr": 0.00032462152070978164, "tps": 13820, "wall": 47098.4} {"step": 9932, "train_loss": 3.602651357650757, "lr": 0.0003246059305086735, "tps": 13819, "wall": 47106.5} {"step": 9933, "train_loss": 3.4811065196990967, "lr": 0.0003245903391225837, "tps": 13818, "wall": 47114.4} {"step": 9934, "train_loss": 3.534961223602295, "lr": 0.00032457474655168896, "tps": 13817, "wall": 47122.4} {"step": 9935, "train_loss": 3.460636615753174, "lr": 0.00032455915279616573, "tps": 13816, "wall": 47130.5} {"step": 9936, "train_loss": 3.3790459632873535, "lr": 0.0003245435578561908, "tps": 13815, "wall": 47138.4} {"step": 9937, "train_loss": 3.5222976207733154, "lr": 0.0003245279617319408, "tps": 13814, "wall": 47146.5} {"step": 9938, "train_loss": 3.512831926345825, "lr": 0.0003245123644235924, "tps": 13813, "wall": 47154.5} {"step": 9939, "train_loss": 3.4496703147888184, "lr": 0.0003244967659313223, "tps": 13812, "wall": 47162.5} {"step": 9940, "train_loss": 3.5580615997314453, "lr": 0.0003244811662553071, "tps": 13811, "wall": 47170.6} {"step": 9941, "train_loss": 3.6172964572906494, "lr": 0.00032446556539572364, "tps": 13810, "wall": 47178.6} {"step": 9942, "train_loss": 3.5705978870391846, "lr": 0.00032444996335274863, "tps": 13809, "wall": 47186.7} {"step": 9943, "train_loss": 3.5251193046569824, "lr": 0.00032443436012655885, "tps": 13808, "wall": 47194.7} {"step": 9944, "train_loss": 3.590062141418457, "lr": 0.0003244187557173309, "tps": 13807, "wall": 47202.8} {"step": 9945, "train_loss": 3.53737735748291, "lr": 0.00032440315012524163, "tps": 13806, "wall": 47211.0} {"step": 9946, "train_loss": 3.5925955772399902, "lr": 0.00032438754335046785, "tps": 13805, "wall": 47219.2} {"step": 9947, "train_loss": 3.630357027053833, "lr": 0.0003243719353931863, "tps": 13804, "wall": 47227.3} {"step": 9948, "train_loss": 3.595008373260498, "lr": 0.00032435632625357384, "tps": 13803, "wall": 47235.3} {"step": 9949, "train_loss": 3.5100131034851074, "lr": 0.00032434071593180733, "tps": 13802, "wall": 47243.4} {"step": 9950, "train_loss": 3.4464292526245117, "lr": 0.00032432510442806346, "tps": 13801, "wall": 47251.4} {"step": 9951, "train_loss": 3.594083786010742, "lr": 0.00032430949174251916, "tps": 13800, "wall": 47259.5} {"step": 9952, "train_loss": 3.6685433387756348, "lr": 0.00032429387787535137, "tps": 13799, "wall": 47267.6} {"step": 9953, "train_loss": 3.4082508087158203, "lr": 0.00032427826282673683, "tps": 13798, "wall": 47275.6} {"step": 9954, "train_loss": 3.6064865589141846, "lr": 0.0003242626465968525, "tps": 13797, "wall": 47283.6} {"step": 9955, "train_loss": 3.4971961975097656, "lr": 0.0003242470291858753, "tps": 13796, "wall": 47291.6} {"step": 9956, "train_loss": 3.4423816204071045, "lr": 0.00032423141059398207, "tps": 13795, "wall": 47299.6} {"step": 9957, "train_loss": 3.503931999206543, "lr": 0.0003242157908213498, "tps": 13794, "wall": 47307.8} {"step": 9958, "train_loss": 3.4019014835357666, "lr": 0.0003242001698681554, "tps": 13793, "wall": 47315.9} {"step": 9959, "train_loss": 3.45674991607666, "lr": 0.00032418454773457594, "tps": 13793, "wall": 47323.9} {"step": 9960, "train_loss": 3.595991373062134, "lr": 0.00032416892442078813, "tps": 13792, "wall": 47332.0} {"step": 9961, "train_loss": 3.5669236183166504, "lr": 0.0003241532999269692, "tps": 13791, "wall": 47340.0} {"step": 9962, "train_loss": 3.4795780181884766, "lr": 0.000324137674253296, "tps": 13790, "wall": 47347.9} {"step": 9963, "train_loss": 3.558067798614502, "lr": 0.0003241220473999456, "tps": 13789, "wall": 47355.9} {"step": 9964, "train_loss": 3.5181031227111816, "lr": 0.0003241064193670951, "tps": 13788, "wall": 47364.0} {"step": 9965, "train_loss": 3.454322338104248, "lr": 0.0003240907901549214, "tps": 13787, "wall": 47372.0} {"step": 9966, "train_loss": 3.606048583984375, "lr": 0.00032407515976360155, "tps": 13786, "wall": 47380.1} {"step": 9967, "train_loss": 3.4829728603363037, "lr": 0.00032405952819331273, "tps": 13785, "wall": 47388.2} {"step": 9968, "train_loss": 3.4436452388763428, "lr": 0.0003240438954442319, "tps": 13784, "wall": 47396.3} {"step": 9969, "train_loss": 3.4755067825317383, "lr": 0.00032402826151653615, "tps": 13783, "wall": 47404.2} {"step": 9970, "train_loss": 3.5852253437042236, "lr": 0.00032401262641040276, "tps": 13782, "wall": 47412.1} {"step": 9971, "train_loss": 3.449098587036133, "lr": 0.00032399699012600864, "tps": 13781, "wall": 47420.1} {"step": 9972, "train_loss": 3.46944260597229, "lr": 0.00032398135266353096, "tps": 13780, "wall": 47428.2} {"step": 9973, "train_loss": 3.5151991844177246, "lr": 0.00032396571402314693, "tps": 13779, "wall": 47436.2} {"step": 9974, "train_loss": 3.5647265911102295, "lr": 0.0003239500742050336, "tps": 13778, "wall": 47444.2} {"step": 9975, "train_loss": 3.4985029697418213, "lr": 0.00032393443320936823, "tps": 13777, "wall": 47452.4} {"step": 9976, "train_loss": 3.507359266281128, "lr": 0.00032391879103632805, "tps": 13776, "wall": 47460.5} {"step": 9977, "train_loss": 3.481346845626831, "lr": 0.00032390314768609014, "tps": 13775, "wall": 47468.5} {"step": 9978, "train_loss": 3.565207004547119, "lr": 0.00032388750315883174, "tps": 13774, "wall": 47476.4} {"step": 9979, "train_loss": 3.6240313053131104, "lr": 0.0003238718574547301, "tps": 13773, "wall": 47484.5} {"step": 9980, "train_loss": 3.602936267852783, "lr": 0.0003238562105739624, "tps": 13773, "wall": 47492.4} {"step": 9981, "train_loss": 3.4611432552337646, "lr": 0.000323840562516706, "tps": 13772, "wall": 47500.4} {"step": 9982, "train_loss": 3.40902042388916, "lr": 0.00032382491328313803, "tps": 13771, "wall": 47508.5} {"step": 9983, "train_loss": 3.561668872833252, "lr": 0.0003238092628734359, "tps": 13770, "wall": 47516.5} {"step": 9984, "train_loss": 3.6527292728424072, "lr": 0.0003237936112877767, "tps": 13769, "wall": 47524.5} {"step": 9985, "train_loss": 3.569344997406006, "lr": 0.0003237779585263379, "tps": 13768, "wall": 47532.4} {"step": 9986, "train_loss": 3.7267112731933594, "lr": 0.0003237623045892969, "tps": 13767, "wall": 47540.5} {"step": 9987, "train_loss": 3.536113739013672, "lr": 0.0003237466494768308, "tps": 13766, "wall": 47548.5} {"step": 9988, "train_loss": 3.5553479194641113, "lr": 0.000323730993189117, "tps": 13765, "wall": 47556.6} {"step": 9989, "train_loss": 3.5140271186828613, "lr": 0.0003237153357263329, "tps": 13764, "wall": 47564.6} {"step": 9990, "train_loss": 3.496838331222534, "lr": 0.0003236996770886559, "tps": 13763, "wall": 47572.7} {"step": 9991, "train_loss": 3.5162644386291504, "lr": 0.0003236840172762634, "tps": 13762, "wall": 47580.8} {"step": 9992, "train_loss": 3.548126697540283, "lr": 0.0003236683562893327, "tps": 13761, "wall": 47588.8} {"step": 9993, "train_loss": 3.4111952781677246, "lr": 0.00032365269412804124, "tps": 13760, "wall": 47596.8} {"step": 9994, "train_loss": 3.470940351486206, "lr": 0.00032363703079256646, "tps": 13759, "wall": 47604.8} {"step": 9995, "train_loss": 3.430020809173584, "lr": 0.0003236213662830858, "tps": 13758, "wall": 47612.8} {"step": 9996, "train_loss": 3.51944637298584, "lr": 0.0003236057005997767, "tps": 13757, "wall": 47620.9} {"step": 9997, "train_loss": 3.465005397796631, "lr": 0.00032359003374281655, "tps": 13756, "wall": 47628.9} {"step": 9998, "train_loss": 3.5615131855010986, "lr": 0.000323574365712383, "tps": 13755, "wall": 47637.0} {"step": 9999, "train_loss": 3.541797399520874, "lr": 0.0003235586965086534, "tps": 13755, "wall": 47644.9} {"step": 10000, "train_loss": 3.5409507751464844, "lr": 0.00032354302613180525, "tps": 13754, "wall": 47653.0, "val_loss_monitor": 3.554552662702031, "val_loss_full": 3.570345794212032} {"step": 10001, "train_loss": 3.425427198410034, "lr": 0.0003235273545820161, "tps": 13702, "wall": 47837.9} {"step": 10002, "train_loss": 3.554288625717163, "lr": 0.0003235116818594635, "tps": 13701, "wall": 47846.5} {"step": 10003, "train_loss": 3.487333297729492, "lr": 0.0003234960079643249, "tps": 13700, "wall": 47855.0} {"step": 10004, "train_loss": 3.529857635498047, "lr": 0.000323480332896778, "tps": 13699, "wall": 47863.5} {"step": 10005, "train_loss": 3.525691509246826, "lr": 0.0003234646566570003, "tps": 13698, "wall": 47872.1} {"step": 10006, "train_loss": 3.581634998321533, "lr": 0.00032344897924516927, "tps": 13696, "wall": 47880.6} {"step": 10007, "train_loss": 3.5179758071899414, "lr": 0.0003234333006614627, "tps": 13695, "wall": 47888.8} {"step": 10008, "train_loss": 3.557222604751587, "lr": 0.0003234176209060581, "tps": 13694, "wall": 47897.2} {"step": 10009, "train_loss": 3.557561159133911, "lr": 0.00032340193997913307, "tps": 13693, "wall": 47905.5} {"step": 10010, "train_loss": 3.5413248538970947, "lr": 0.0003233862578808653, "tps": 13692, "wall": 47913.8} {"step": 10011, "train_loss": 3.546574354171753, "lr": 0.00032337057461143234, "tps": 13691, "wall": 47922.1} {"step": 10012, "train_loss": 3.6136534214019775, "lr": 0.00032335489017101197, "tps": 13690, "wall": 47930.5} {"step": 10013, "train_loss": 3.5004663467407227, "lr": 0.0003233392045597819, "tps": 13689, "wall": 47938.9} {"step": 10014, "train_loss": 3.446712017059326, "lr": 0.0003233235177779196, "tps": 13688, "wall": 47947.1} {"step": 10015, "train_loss": 3.5590744018554688, "lr": 0.0003233078298256029, "tps": 13687, "wall": 47955.3} {"step": 10016, "train_loss": 3.548734664916992, "lr": 0.00032329214070300955, "tps": 13686, "wall": 47963.5} {"step": 10017, "train_loss": 3.4787044525146484, "lr": 0.0003232764504103173, "tps": 13685, "wall": 47971.9} {"step": 10018, "train_loss": 3.530404567718506, "lr": 0.00032326075894770375, "tps": 13684, "wall": 47980.0} {"step": 10019, "train_loss": 3.560845136642456, "lr": 0.00032324506631534677, "tps": 13683, "wall": 47988.3} {"step": 10020, "train_loss": 3.4272572994232178, "lr": 0.00032322937251342404, "tps": 13683, "wall": 47996.5} {"step": 10021, "train_loss": 3.4451520442962646, "lr": 0.0003232136775421135, "tps": 13682, "wall": 48004.7} {"step": 10022, "train_loss": 3.581099033355713, "lr": 0.00032319798140159275, "tps": 13681, "wall": 48012.7} {"step": 10023, "train_loss": 3.5416300296783447, "lr": 0.0003231822840920397, "tps": 13680, "wall": 48020.9} {"step": 10024, "train_loss": 3.6346137523651123, "lr": 0.00032316658561363213, "tps": 13679, "wall": 48029.1} {"step": 10025, "train_loss": 3.49149227142334, "lr": 0.000323150885966548, "tps": 13678, "wall": 48037.1} {"step": 10026, "train_loss": 3.556938886642456, "lr": 0.00032313518515096493, "tps": 13677, "wall": 48045.2} {"step": 10027, "train_loss": 3.5945892333984375, "lr": 0.00032311948316706096, "tps": 13676, "wall": 48053.4} {"step": 10028, "train_loss": 3.4768929481506348, "lr": 0.00032310378001501394, "tps": 13675, "wall": 48061.6} {"step": 10029, "train_loss": 3.5364527702331543, "lr": 0.0003230880756950017, "tps": 13674, "wall": 48069.6} {"step": 10030, "train_loss": 3.505160093307495, "lr": 0.0003230723702072021, "tps": 13673, "wall": 48077.6} {"step": 10031, "train_loss": 3.5415308475494385, "lr": 0.0003230566635517932, "tps": 13672, "wall": 48085.5} {"step": 10032, "train_loss": 3.4827303886413574, "lr": 0.00032304095572895276, "tps": 13671, "wall": 48093.6} {"step": 10033, "train_loss": 3.4587819576263428, "lr": 0.00032302524673885884, "tps": 13670, "wall": 48101.7} {"step": 10034, "train_loss": 3.5029869079589844, "lr": 0.00032300953658168937, "tps": 13669, "wall": 48109.8} {"step": 10035, "train_loss": 3.5169458389282227, "lr": 0.0003229938252576223, "tps": 13668, "wall": 48117.8} {"step": 10036, "train_loss": 3.608877658843994, "lr": 0.00032297811276683555, "tps": 13668, "wall": 48125.8} {"step": 10037, "train_loss": 3.5006866455078125, "lr": 0.00032296239910950726, "tps": 13667, "wall": 48133.9} {"step": 10038, "train_loss": 3.5514233112335205, "lr": 0.00032294668428581525, "tps": 13666, "wall": 48141.9} {"step": 10039, "train_loss": 3.496654987335205, "lr": 0.00032293096829593765, "tps": 13665, "wall": 48150.1} {"step": 10040, "train_loss": 3.5225887298583984, "lr": 0.0003229152511400525, "tps": 13664, "wall": 48158.1} {"step": 10041, "train_loss": 3.511561632156372, "lr": 0.0003228995328183378, "tps": 13663, "wall": 48166.3} {"step": 10042, "train_loss": 3.426521062850952, "lr": 0.0003228838133309717, "tps": 13662, "wall": 48174.3} {"step": 10043, "train_loss": 3.547537326812744, "lr": 0.00032286809267813207, "tps": 13661, "wall": 48182.3} {"step": 10044, "train_loss": 3.6210827827453613, "lr": 0.0003228523708599972, "tps": 13660, "wall": 48190.2} {"step": 10045, "train_loss": 3.63088321685791, "lr": 0.0003228366478767451, "tps": 13659, "wall": 48198.3} {"step": 10046, "train_loss": 3.513101577758789, "lr": 0.00032282092372855386, "tps": 13658, "wall": 48206.4} {"step": 10047, "train_loss": 3.549281597137451, "lr": 0.00032280519841560167, "tps": 13657, "wall": 48214.5} {"step": 10048, "train_loss": 3.5217552185058594, "lr": 0.00032278947193806656, "tps": 13656, "wall": 48222.5} {"step": 10049, "train_loss": 3.5017940998077393, "lr": 0.00032277374429612684, "tps": 13655, "wall": 48230.6} {"step": 10050, "train_loss": 3.5543875694274902, "lr": 0.0003227580154899606, "tps": 13655, "wall": 48238.6} {"step": 10051, "train_loss": 3.578526496887207, "lr": 0.0003227422855197459, "tps": 13654, "wall": 48246.7} {"step": 10052, "train_loss": 3.575037717819214, "lr": 0.00032272655438566103, "tps": 13653, "wall": 48254.8} {"step": 10053, "train_loss": 3.5478334426879883, "lr": 0.00032271082208788434, "tps": 13652, "wall": 48263.1} {"step": 10054, "train_loss": 3.513258934020996, "lr": 0.0003226950886265938, "tps": 13651, "wall": 48271.4} {"step": 10055, "train_loss": 3.4134178161621094, "lr": 0.0003226793540019677, "tps": 13650, "wall": 48279.7} {"step": 10056, "train_loss": 3.5746350288391113, "lr": 0.0003226636182141844, "tps": 13649, "wall": 48288.0} {"step": 10057, "train_loss": 3.4568862915039062, "lr": 0.00032264788126342206, "tps": 13648, "wall": 48296.0} {"step": 10058, "train_loss": 3.479423999786377, "lr": 0.0003226321431498589, "tps": 13647, "wall": 48304.2} {"step": 10059, "train_loss": 3.4497644901275635, "lr": 0.00032261640387367334, "tps": 13646, "wall": 48312.2} {"step": 10060, "train_loss": 3.486478567123413, "lr": 0.00032260066343504364, "tps": 13645, "wall": 48320.2} {"step": 10061, "train_loss": 3.435168981552124, "lr": 0.000322584921834148, "tps": 13644, "wall": 48328.3} {"step": 10062, "train_loss": 3.505988121032715, "lr": 0.00032256917907116483, "tps": 13643, "wall": 48336.5} {"step": 10063, "train_loss": 3.4877848625183105, "lr": 0.0003225534351462725, "tps": 13642, "wall": 48344.6} {"step": 10064, "train_loss": 3.6127676963806152, "lr": 0.00032253769005964925, "tps": 13641, "wall": 48352.8} {"step": 10065, "train_loss": 3.609712839126587, "lr": 0.0003225219438114735, "tps": 13640, "wall": 48361.0} {"step": 10066, "train_loss": 3.436253070831299, "lr": 0.00032250619640192366, "tps": 13639, "wall": 48369.0} {"step": 10067, "train_loss": 3.3985300064086914, "lr": 0.0003224904478311781, "tps": 13639, "wall": 48377.1} {"step": 10068, "train_loss": 3.5824174880981445, "lr": 0.0003224746980994152, "tps": 13638, "wall": 48385.3} {"step": 10069, "train_loss": 3.6061758995056152, "lr": 0.00032245894720681333, "tps": 13637, "wall": 48393.5} {"step": 10070, "train_loss": 3.4618868827819824, "lr": 0.000322443195153551, "tps": 13636, "wall": 48401.8} {"step": 10071, "train_loss": 3.479933977127075, "lr": 0.00032242744193980655, "tps": 13635, "wall": 48410.1} {"step": 10072, "train_loss": 3.474738597869873, "lr": 0.00032241168756575855, "tps": 13634, "wall": 48418.2} {"step": 10073, "train_loss": 3.4810791015625, "lr": 0.0003223959320315854, "tps": 13633, "wall": 48426.3} {"step": 10074, "train_loss": 3.558107852935791, "lr": 0.00032238017533746556, "tps": 13632, "wall": 48434.4} {"step": 10075, "train_loss": 3.4665606021881104, "lr": 0.0003223644174835776, "tps": 13631, "wall": 48442.5} {"step": 10076, "train_loss": 3.4532737731933594, "lr": 0.0003223486584701, "tps": 13630, "wall": 48450.6} {"step": 10077, "train_loss": 3.5737719535827637, "lr": 0.0003223328982972112, "tps": 13629, "wall": 48458.8} {"step": 10078, "train_loss": 3.5316057205200195, "lr": 0.00032231713696508985, "tps": 13628, "wall": 48466.9} {"step": 10079, "train_loss": 3.572345733642578, "lr": 0.0003223013744739144, "tps": 13627, "wall": 48475.1} {"step": 10080, "train_loss": 3.5275216102600098, "lr": 0.00032228561082386345, "tps": 13626, "wall": 48483.2} {"step": 10081, "train_loss": 3.5324957370758057, "lr": 0.0003222698460151155, "tps": 13625, "wall": 48491.2} {"step": 10082, "train_loss": 3.557943820953369, "lr": 0.0003222540800478493, "tps": 13624, "wall": 48499.3} {"step": 10083, "train_loss": 3.6368584632873535, "lr": 0.0003222383129222434, "tps": 13623, "wall": 48507.5} {"step": 10084, "train_loss": 3.587038516998291, "lr": 0.0003222225446384762, "tps": 13623, "wall": 48515.7} {"step": 10085, "train_loss": 3.395742893218994, "lr": 0.0003222067751967266, "tps": 13622, "wall": 48523.7} {"step": 10086, "train_loss": 3.4865612983703613, "lr": 0.0003221910045971731, "tps": 13621, "wall": 48531.9} {"step": 10087, "train_loss": 3.464433193206787, "lr": 0.00032217523283999437, "tps": 13620, "wall": 48540.1} {"step": 10088, "train_loss": 3.5079588890075684, "lr": 0.00032215945992536903, "tps": 13619, "wall": 48548.1} {"step": 10089, "train_loss": 3.600759506225586, "lr": 0.00032214368585347584, "tps": 13618, "wall": 48556.2} {"step": 10090, "train_loss": 3.506509780883789, "lr": 0.0003221279106244934, "tps": 13617, "wall": 48564.3} {"step": 10091, "train_loss": 3.542600631713867, "lr": 0.00032211213423860054, "tps": 13616, "wall": 48572.5} {"step": 10092, "train_loss": 3.6013474464416504, "lr": 0.0003220963566959759, "tps": 13615, "wall": 48580.6} {"step": 10093, "train_loss": 3.5556907653808594, "lr": 0.0003220805779967982, "tps": 13614, "wall": 48588.7} {"step": 10094, "train_loss": 3.550182342529297, "lr": 0.0003220647981412461, "tps": 13613, "wall": 48596.8} {"step": 10095, "train_loss": 3.498734474182129, "lr": 0.00032204901712949854, "tps": 13612, "wall": 48604.9} {"step": 10096, "train_loss": 3.588031768798828, "lr": 0.0003220332349617342, "tps": 13611, "wall": 48612.9} {"step": 10097, "train_loss": 3.618283748626709, "lr": 0.0003220174516381318, "tps": 13611, "wall": 48621.0} {"step": 10098, "train_loss": 3.532579183578491, "lr": 0.0003220016671588702, "tps": 13610, "wall": 48629.3} {"step": 10099, "train_loss": 3.541954755783081, "lr": 0.0003219858815241282, "tps": 13609, "wall": 48637.4} {"step": 10100, "train_loss": 3.4365029335021973, "lr": 0.00032197009473408465, "tps": 13608, "wall": 48645.5} {"step": 10101, "train_loss": 3.516531229019165, "lr": 0.0003219543067889183, "tps": 13607, "wall": 48653.7} {"step": 10102, "train_loss": 3.5370006561279297, "lr": 0.0003219385176888081, "tps": 13606, "wall": 48661.8} {"step": 10103, "train_loss": 3.5677897930145264, "lr": 0.0003219227274339328, "tps": 13605, "wall": 48669.9} {"step": 10104, "train_loss": 3.4996683597564697, "lr": 0.00032190693602447137, "tps": 13604, "wall": 48678.1} {"step": 10105, "train_loss": 3.623051643371582, "lr": 0.00032189114346060265, "tps": 13603, "wall": 48686.3} {"step": 10106, "train_loss": 3.4877448081970215, "lr": 0.0003218753497425055, "tps": 13602, "wall": 48694.5} {"step": 10107, "train_loss": 3.624116897583008, "lr": 0.00032185955487035894, "tps": 13601, "wall": 48702.7} {"step": 10108, "train_loss": 3.5674209594726562, "lr": 0.0003218437588443418, "tps": 13600, "wall": 48710.8} {"step": 10109, "train_loss": 3.4236600399017334, "lr": 0.000321827961664633, "tps": 13599, "wall": 48719.1} {"step": 10110, "train_loss": 3.483461380004883, "lr": 0.0003218121633314116, "tps": 13598, "wall": 48727.2} {"step": 10111, "train_loss": 3.537013530731201, "lr": 0.00032179636384485654, "tps": 13597, "wall": 48735.3} {"step": 10112, "train_loss": 3.616204261779785, "lr": 0.0003217805632051467, "tps": 13597, "wall": 48743.4} {"step": 10113, "train_loss": 3.4132330417633057, "lr": 0.0003217647614124612, "tps": 13596, "wall": 48751.4} {"step": 10114, "train_loss": 3.509882926940918, "lr": 0.0003217489584669789, "tps": 13595, "wall": 48759.6} {"step": 10115, "train_loss": 3.5231897830963135, "lr": 0.00032173315436887894, "tps": 13594, "wall": 48767.8} {"step": 10116, "train_loss": 3.5422916412353516, "lr": 0.00032171734911834026, "tps": 13593, "wall": 48776.0} {"step": 10117, "train_loss": 3.563297748565674, "lr": 0.000321701542715542, "tps": 13592, "wall": 48784.0} {"step": 10118, "train_loss": 3.4453651905059814, "lr": 0.00032168573516066313, "tps": 13591, "wall": 48792.2} {"step": 10119, "train_loss": 3.483283519744873, "lr": 0.00032166992645388275, "tps": 13590, "wall": 48800.3} {"step": 10120, "train_loss": 3.4548234939575195, "lr": 0.00032165411659538, "tps": 13589, "wall": 48808.6} {"step": 10121, "train_loss": 3.6660196781158447, "lr": 0.00032163830558533385, "tps": 13588, "wall": 48816.8} {"step": 10122, "train_loss": 3.6017796993255615, "lr": 0.00032162249342392355, "tps": 13587, "wall": 48824.9} {"step": 10123, "train_loss": 3.4605116844177246, "lr": 0.0003216066801113281, "tps": 13586, "wall": 48833.3} {"step": 10124, "train_loss": 3.5194175243377686, "lr": 0.0003215908656477267, "tps": 13585, "wall": 48841.2} {"step": 10125, "train_loss": 3.528413772583008, "lr": 0.0003215750500332984, "tps": 13584, "wall": 48849.4} {"step": 10126, "train_loss": 3.5533719062805176, "lr": 0.0003215592332682225, "tps": 13584, "wall": 48857.3} {"step": 10127, "train_loss": 3.4419493675231934, "lr": 0.00032154341535267807, "tps": 13583, "wall": 48865.5} {"step": 10128, "train_loss": 3.381757974624634, "lr": 0.0003215275962868444, "tps": 13582, "wall": 48873.6} {"step": 10129, "train_loss": 3.5505032539367676, "lr": 0.00032151177607090065, "tps": 13581, "wall": 48881.7} {"step": 10130, "train_loss": 3.622943878173828, "lr": 0.00032149595470502596, "tps": 13580, "wall": 48890.0} {"step": 10131, "train_loss": 3.5568113327026367, "lr": 0.0003214801321893996, "tps": 13579, "wall": 48898.3} {"step": 10132, "train_loss": 3.634129047393799, "lr": 0.0003214643085242008, "tps": 13578, "wall": 48906.3} {"step": 10133, "train_loss": 3.5018763542175293, "lr": 0.0003214484837096088, "tps": 13577, "wall": 48914.5} {"step": 10134, "train_loss": 3.4516265392303467, "lr": 0.00032143265774580294, "tps": 13576, "wall": 48922.6} {"step": 10135, "train_loss": 3.5217528343200684, "lr": 0.0003214168306329624, "tps": 13575, "wall": 48930.7} {"step": 10136, "train_loss": 3.4807674884796143, "lr": 0.00032140100237126656, "tps": 13574, "wall": 48938.9} {"step": 10137, "train_loss": 3.4250986576080322, "lr": 0.00032138517296089467, "tps": 13573, "wall": 48947.2} {"step": 10138, "train_loss": 3.4932126998901367, "lr": 0.0003213693424020261, "tps": 13572, "wall": 48955.4} {"step": 10139, "train_loss": 3.5707314014434814, "lr": 0.00032135351069484007, "tps": 13572, "wall": 48963.4} {"step": 10140, "train_loss": 3.493913173675537, "lr": 0.000321337677839516, "tps": 13571, "wall": 48971.6} {"step": 10141, "train_loss": 3.446666955947876, "lr": 0.0003213218438362332, "tps": 13570, "wall": 48979.8} {"step": 10142, "train_loss": 3.5036542415618896, "lr": 0.00032130600868517117, "tps": 13569, "wall": 48987.9} {"step": 10143, "train_loss": 3.4962003231048584, "lr": 0.0003212901723865091, "tps": 13568, "wall": 48996.1} {"step": 10144, "train_loss": 3.478997230529785, "lr": 0.00032127433494042655, "tps": 13567, "wall": 49004.3} {"step": 10145, "train_loss": 3.528130054473877, "lr": 0.0003212584963471028, "tps": 13566, "wall": 49012.4} {"step": 10146, "train_loss": 3.562979221343994, "lr": 0.00032124265660671736, "tps": 13565, "wall": 49020.5} {"step": 10147, "train_loss": 3.4519994258880615, "lr": 0.0003212268157194496, "tps": 13564, "wall": 49028.6} {"step": 10148, "train_loss": 3.607663154602051, "lr": 0.00032121097368547903, "tps": 13563, "wall": 49036.8} {"step": 10149, "train_loss": 3.444735050201416, "lr": 0.00032119513050498505, "tps": 13562, "wall": 49044.9} {"step": 10150, "train_loss": 3.4893147945404053, "lr": 0.00032117928617814715, "tps": 13561, "wall": 49053.1} {"step": 10151, "train_loss": 3.3832173347473145, "lr": 0.0003211634407051448, "tps": 13560, "wall": 49061.4} {"step": 10152, "train_loss": 3.584779977798462, "lr": 0.0003211475940861576, "tps": 13560, "wall": 49069.6} {"step": 10153, "train_loss": 3.4854140281677246, "lr": 0.0003211317463213649, "tps": 13559, "wall": 49077.8} {"step": 10154, "train_loss": 3.4505486488342285, "lr": 0.00032111589741094635, "tps": 13558, "wall": 49085.9} {"step": 10155, "train_loss": 3.5556631088256836, "lr": 0.00032110004735508144, "tps": 13557, "wall": 49094.0} {"step": 10156, "train_loss": 3.534038543701172, "lr": 0.0003210841961539497, "tps": 13556, "wall": 49102.0} {"step": 10157, "train_loss": 3.5300822257995605, "lr": 0.00032106834380773075, "tps": 13555, "wall": 49110.2} {"step": 10158, "train_loss": 3.5942583084106445, "lr": 0.0003210524903166041, "tps": 13554, "wall": 49118.4} {"step": 10159, "train_loss": 3.443293571472168, "lr": 0.0003210366356807494, "tps": 13553, "wall": 49126.7} {"step": 10160, "train_loss": 3.588372230529785, "lr": 0.0003210207799003463, "tps": 13552, "wall": 49134.8} {"step": 10161, "train_loss": 3.5282928943634033, "lr": 0.00032100492297557423, "tps": 13551, "wall": 49142.9} {"step": 10162, "train_loss": 3.5362799167633057, "lr": 0.00032098906490661295, "tps": 13550, "wall": 49151.0} {"step": 10163, "train_loss": 3.4641776084899902, "lr": 0.0003209732056936421, "tps": 13550, "wall": 49159.1} {"step": 10164, "train_loss": 3.444542169570923, "lr": 0.00032095734533684123, "tps": 13549, "wall": 49167.4} {"step": 10165, "train_loss": 3.509774684906006, "lr": 0.00032094148383639016, "tps": 13548, "wall": 49175.4} {"step": 10166, "train_loss": 3.514228105545044, "lr": 0.0003209256211924685, "tps": 13547, "wall": 49183.6} {"step": 10167, "train_loss": 3.480898380279541, "lr": 0.000320909757405256, "tps": 13546, "wall": 49191.8} {"step": 10168, "train_loss": 3.587665557861328, "lr": 0.0003208938924749322, "tps": 13545, "wall": 49200.0} {"step": 10169, "train_loss": 3.5188145637512207, "lr": 0.000320878026401677, "tps": 13544, "wall": 49208.1} {"step": 10170, "train_loss": 3.4329848289489746, "lr": 0.00032086215918567, "tps": 13543, "wall": 49216.2} {"step": 10171, "train_loss": 3.5834736824035645, "lr": 0.00032084629082709104, "tps": 13542, "wall": 49224.4} {"step": 10172, "train_loss": 3.4578499794006348, "lr": 0.0003208304213261199, "tps": 13541, "wall": 49232.5} {"step": 10173, "train_loss": 3.5161099433898926, "lr": 0.00032081455068293626, "tps": 13540, "wall": 49240.7} {"step": 10174, "train_loss": 3.500387191772461, "lr": 0.0003207986788977199, "tps": 13539, "wall": 49249.0} {"step": 10175, "train_loss": 3.4936437606811523, "lr": 0.0003207828059706506, "tps": 13539, "wall": 49257.2} {"step": 10176, "train_loss": 3.5638582706451416, "lr": 0.00032076693190190834, "tps": 13538, "wall": 49265.4} {"step": 10177, "train_loss": 3.554842710494995, "lr": 0.00032075105669167277, "tps": 13537, "wall": 49273.5} {"step": 10178, "train_loss": 3.505676746368408, "lr": 0.00032073518034012375, "tps": 13536, "wall": 49281.6} {"step": 10179, "train_loss": 3.5179717540740967, "lr": 0.00032071930284744115, "tps": 13535, "wall": 49289.8} {"step": 10180, "train_loss": 3.598644495010376, "lr": 0.0003207034242138049, "tps": 13534, "wall": 49297.9} {"step": 10181, "train_loss": 3.5455970764160156, "lr": 0.00032068754443939483, "tps": 13533, "wall": 49306.2} {"step": 10182, "train_loss": 3.489943504333496, "lr": 0.0003206716635243908, "tps": 13532, "wall": 49314.3} {"step": 10183, "train_loss": 3.5546278953552246, "lr": 0.00032065578146897263, "tps": 13531, "wall": 49322.6} {"step": 10184, "train_loss": 3.410808563232422, "lr": 0.00032063989827332037, "tps": 13530, "wall": 49330.7} {"step": 10185, "train_loss": 3.509737491607666, "lr": 0.00032062401393761396, "tps": 13529, "wall": 49339.0} {"step": 10186, "train_loss": 3.5424435138702393, "lr": 0.0003206081284620332, "tps": 13528, "wall": 49347.2} {"step": 10187, "train_loss": 3.5019924640655518, "lr": 0.0003205922418467582, "tps": 13528, "wall": 49355.4} {"step": 10188, "train_loss": 3.575779914855957, "lr": 0.00032057635409196873, "tps": 13527, "wall": 49363.5} {"step": 10189, "train_loss": 3.6191444396972656, "lr": 0.00032056046519784493, "tps": 13526, "wall": 49371.8} {"step": 10190, "train_loss": 3.587418794631958, "lr": 0.0003205445751645667, "tps": 13525, "wall": 49380.0} {"step": 10191, "train_loss": 3.502729892730713, "lr": 0.00032052868399231417, "tps": 13524, "wall": 49388.2} {"step": 10192, "train_loss": 3.582364559173584, "lr": 0.0003205127916812672, "tps": 13523, "wall": 49396.4} {"step": 10193, "train_loss": 3.498547077178955, "lr": 0.00032049689823160593, "tps": 13522, "wall": 49404.5} {"step": 10194, "train_loss": 3.4559693336486816, "lr": 0.0003204810036435103, "tps": 13521, "wall": 49412.7} {"step": 10195, "train_loss": 3.523804187774658, "lr": 0.00032046510791716053, "tps": 13520, "wall": 49420.8} {"step": 10196, "train_loss": 3.541844367980957, "lr": 0.00032044921105273653, "tps": 13519, "wall": 49429.1} {"step": 10197, "train_loss": 3.5276033878326416, "lr": 0.0003204333130504184, "tps": 13518, "wall": 49437.3} {"step": 10198, "train_loss": 3.5479512214660645, "lr": 0.0003204174139103863, "tps": 13517, "wall": 49445.4} {"step": 10199, "train_loss": 3.5500731468200684, "lr": 0.00032040151363282025, "tps": 13517, "wall": 49453.6} {"step": 10200, "train_loss": 3.631894111633301, "lr": 0.0003203856122179005, "tps": 13516, "wall": 49461.8} {"step": 10201, "train_loss": 3.5674848556518555, "lr": 0.00032036970966580706, "tps": 13515, "wall": 49470.2} {"step": 10202, "train_loss": 3.4992289543151855, "lr": 0.00032035380597672015, "tps": 13514, "wall": 49478.3} {"step": 10203, "train_loss": 3.441804885864258, "lr": 0.00032033790115081984, "tps": 13513, "wall": 49486.6} {"step": 10204, "train_loss": 3.599865436553955, "lr": 0.0003203219951882864, "tps": 13512, "wall": 49494.7} {"step": 10205, "train_loss": 3.559725284576416, "lr": 0.0003203060880893, "tps": 13511, "wall": 49502.9} {"step": 10206, "train_loss": 3.527217388153076, "lr": 0.00032029017985404077, "tps": 13510, "wall": 49511.0} {"step": 10207, "train_loss": 3.4987168312072754, "lr": 0.000320274270482689, "tps": 13509, "wall": 49519.2} {"step": 10208, "train_loss": 3.418377637863159, "lr": 0.0003202583599754248, "tps": 13508, "wall": 49527.4} {"step": 10209, "train_loss": 3.573151111602783, "lr": 0.0003202424483324285, "tps": 13507, "wall": 49535.8} {"step": 10210, "train_loss": 3.5851335525512695, "lr": 0.00032022653555388033, "tps": 13506, "wall": 49544.0} {"step": 10211, "train_loss": 3.5383620262145996, "lr": 0.00032021062163996056, "tps": 13506, "wall": 49552.3} {"step": 10212, "train_loss": 3.5301401615142822, "lr": 0.0003201947065908494, "tps": 13505, "wall": 49560.6} {"step": 10213, "train_loss": 3.5408740043640137, "lr": 0.0003201787904067272, "tps": 13504, "wall": 49568.6} {"step": 10214, "train_loss": 3.52514910697937, "lr": 0.00032016287308777425, "tps": 13503, "wall": 49576.8} {"step": 10215, "train_loss": 3.4717509746551514, "lr": 0.00032014695463417086, "tps": 13502, "wall": 49585.1} {"step": 10216, "train_loss": 3.6200623512268066, "lr": 0.00032013103504609735, "tps": 13501, "wall": 49593.4} {"step": 10217, "train_loss": 3.566685676574707, "lr": 0.00032011511432373407, "tps": 13500, "wall": 49601.6} {"step": 10218, "train_loss": 3.4730889797210693, "lr": 0.0003200991924672613, "tps": 13499, "wall": 49609.9} {"step": 10219, "train_loss": 3.5710513591766357, "lr": 0.0003200832694768595, "tps": 13498, "wall": 49618.1} {"step": 10220, "train_loss": 3.529414653778076, "lr": 0.000320067345352709, "tps": 13497, "wall": 49626.3} {"step": 10221, "train_loss": 3.5273728370666504, "lr": 0.0003200514200949902, "tps": 13496, "wall": 49634.4} {"step": 10222, "train_loss": 3.5748610496520996, "lr": 0.0003200354937038836, "tps": 13495, "wall": 49642.7} {"step": 10223, "train_loss": 3.4749205112457275, "lr": 0.0003200195661795694, "tps": 13495, "wall": 49650.8} {"step": 10224, "train_loss": 3.546154022216797, "lr": 0.00032000363752222817, "tps": 13494, "wall": 49659.2} {"step": 10225, "train_loss": 3.52736234664917, "lr": 0.0003199877077320403, "tps": 13493, "wall": 49667.5} {"step": 10226, "train_loss": 3.4739928245544434, "lr": 0.00031997177680918626, "tps": 13492, "wall": 49675.8} {"step": 10227, "train_loss": 3.487319231033325, "lr": 0.00031995584475384665, "tps": 13491, "wall": 49684.0} {"step": 10228, "train_loss": 3.5486185550689697, "lr": 0.0003199399115662017, "tps": 13490, "wall": 49692.0} {"step": 10229, "train_loss": 3.4629478454589844, "lr": 0.00031992397724643206, "tps": 13489, "wall": 49700.2} {"step": 10230, "train_loss": 3.593353748321533, "lr": 0.00031990804179471817, "tps": 13488, "wall": 49708.5} {"step": 10231, "train_loss": 3.499316453933716, "lr": 0.0003198921052112406, "tps": 13487, "wall": 49716.8} {"step": 10232, "train_loss": 3.475487470626831, "lr": 0.0003198761674961798, "tps": 13486, "wall": 49724.9} {"step": 10233, "train_loss": 3.5403592586517334, "lr": 0.0003198602286497165, "tps": 13485, "wall": 49733.2} {"step": 10234, "train_loss": 3.4284276962280273, "lr": 0.00031984428867203106, "tps": 13484, "wall": 49741.5} {"step": 10235, "train_loss": 3.554417610168457, "lr": 0.0003198283475633042, "tps": 13484, "wall": 49749.7} {"step": 10236, "train_loss": 3.6124424934387207, "lr": 0.00031981240532371626, "tps": 13483, "wall": 49757.9} {"step": 10237, "train_loss": 3.418440341949463, "lr": 0.0003197964619534481, "tps": 13482, "wall": 49766.1} {"step": 10238, "train_loss": 3.4744153022766113, "lr": 0.0003197805174526802, "tps": 13481, "wall": 49774.3} {"step": 10239, "train_loss": 3.448270797729492, "lr": 0.00031976457182159317, "tps": 13480, "wall": 49782.5} {"step": 10240, "train_loss": 3.5349016189575195, "lr": 0.00031974862506036774, "tps": 13479, "wall": 49790.8} {"step": 10241, "train_loss": 3.5771708488464355, "lr": 0.00031973267716918437, "tps": 13478, "wall": 49799.0} {"step": 10242, "train_loss": 3.5371742248535156, "lr": 0.00031971672814822395, "tps": 13477, "wall": 49807.1} {"step": 10243, "train_loss": 3.5447804927825928, "lr": 0.00031970077799766696, "tps": 13476, "wall": 49815.3} {"step": 10244, "train_loss": 3.4191153049468994, "lr": 0.00031968482671769423, "tps": 13475, "wall": 49823.5} {"step": 10245, "train_loss": 3.6236042976379395, "lr": 0.00031966887430848634, "tps": 13474, "wall": 49831.7} {"step": 10246, "train_loss": 3.613093137741089, "lr": 0.0003196529207702241, "tps": 13474, "wall": 49840.0} {"step": 10247, "train_loss": 3.568028688430786, "lr": 0.0003196369661030881, "tps": 13473, "wall": 49848.2} {"step": 10248, "train_loss": 3.55495023727417, "lr": 0.00031962101030725925, "tps": 13472, "wall": 49856.6} {"step": 10249, "train_loss": 3.488582134246826, "lr": 0.0003196050533829181, "tps": 13471, "wall": 49864.7} {"step": 10250, "train_loss": 3.451397657394409, "lr": 0.0003195890953302456, "tps": 13470, "wall": 49872.8} {"step": 10251, "train_loss": 3.456287384033203, "lr": 0.00031957313614942244, "tps": 13469, "wall": 49881.0} {"step": 10252, "train_loss": 3.5899362564086914, "lr": 0.00031955717584062943, "tps": 13468, "wall": 49889.2} {"step": 10253, "train_loss": 3.51511812210083, "lr": 0.00031954121440404726, "tps": 13467, "wall": 49897.5} {"step": 10254, "train_loss": 3.586803436279297, "lr": 0.0003195252518398569, "tps": 13466, "wall": 49905.8} {"step": 10255, "train_loss": 3.5750553607940674, "lr": 0.00031950928814823904, "tps": 13465, "wall": 49914.1} {"step": 10256, "train_loss": 3.4853901863098145, "lr": 0.0003194933233293746, "tps": 13465, "wall": 49922.2} {"step": 10257, "train_loss": 3.678133487701416, "lr": 0.0003194773573834445, "tps": 13464, "wall": 49930.3} {"step": 10258, "train_loss": 3.3846046924591064, "lr": 0.0003194613903106294, "tps": 13463, "wall": 49938.6} {"step": 10259, "train_loss": 3.5061192512512207, "lr": 0.00031944542211111035, "tps": 13462, "wall": 49947.0} {"step": 10260, "train_loss": 3.5627901554107666, "lr": 0.00031942945278506815, "tps": 13461, "wall": 49955.2} {"step": 10261, "train_loss": 3.5108144283294678, "lr": 0.0003194134823326838, "tps": 13460, "wall": 49963.4} {"step": 10262, "train_loss": 3.612334966659546, "lr": 0.00031939751075413806, "tps": 13459, "wall": 49971.7} {"step": 10263, "train_loss": 3.60744047164917, "lr": 0.0003193815380496119, "tps": 13458, "wall": 49979.9} {"step": 10264, "train_loss": 3.504244327545166, "lr": 0.0003193655642192864, "tps": 13457, "wall": 49988.1} {"step": 10265, "train_loss": 3.46433687210083, "lr": 0.00031934958926334235, "tps": 13456, "wall": 49996.3} {"step": 10266, "train_loss": 3.496065616607666, "lr": 0.0003193336131819608, "tps": 13455, "wall": 50004.6} {"step": 10267, "train_loss": 3.443227767944336, "lr": 0.00031931763597532276, "tps": 13455, "wall": 50012.8} {"step": 10268, "train_loss": 3.488049268722534, "lr": 0.0003193016576436091, "tps": 13454, "wall": 50020.9} {"step": 10269, "train_loss": 3.530928611755371, "lr": 0.0003192856781870009, "tps": 13453, "wall": 50029.1} {"step": 10270, "train_loss": 3.539940118789673, "lr": 0.00031926969760567923, "tps": 13452, "wall": 50037.4} {"step": 10271, "train_loss": 3.5488333702087402, "lr": 0.000319253715899825, "tps": 13451, "wall": 50045.5} {"step": 10272, "train_loss": 3.527364730834961, "lr": 0.00031923773306961927, "tps": 13450, "wall": 50053.7} {"step": 10273, "train_loss": 3.5472757816314697, "lr": 0.0003192217491152432, "tps": 13449, "wall": 50062.0} {"step": 10274, "train_loss": 3.546095848083496, "lr": 0.00031920576403687774, "tps": 13448, "wall": 50070.2} {"step": 10275, "train_loss": 3.532961368560791, "lr": 0.00031918977783470403, "tps": 13447, "wall": 50078.4} {"step": 10276, "train_loss": 3.549501419067383, "lr": 0.00031917379050890314, "tps": 13446, "wall": 50086.7} {"step": 10277, "train_loss": 3.577601432800293, "lr": 0.0003191578020596562, "tps": 13446, "wall": 50095.1} {"step": 10278, "train_loss": 3.498853921890259, "lr": 0.0003191418124871443, "tps": 13445, "wall": 50103.2} {"step": 10279, "train_loss": 3.4243149757385254, "lr": 0.0003191258217915487, "tps": 13444, "wall": 50111.4} {"step": 10280, "train_loss": 3.5513219833374023, "lr": 0.00031910982997305023, "tps": 13443, "wall": 50119.6} {"step": 10281, "train_loss": 3.5442428588867188, "lr": 0.00031909383703183035, "tps": 13442, "wall": 50127.9} {"step": 10282, "train_loss": 3.560987949371338, "lr": 0.00031907784296807015, "tps": 13441, "wall": 50136.2} {"step": 10283, "train_loss": 3.4339547157287598, "lr": 0.0003190618477819507, "tps": 13440, "wall": 50144.4} {"step": 10284, "train_loss": 3.500485897064209, "lr": 0.0003190458514736534, "tps": 13439, "wall": 50152.7} {"step": 10285, "train_loss": 3.508852481842041, "lr": 0.0003190298540433593, "tps": 13438, "wall": 50160.8} {"step": 10286, "train_loss": 3.5505056381225586, "lr": 0.00031901385549124955, "tps": 13437, "wall": 50169.0} {"step": 10287, "train_loss": 3.513481616973877, "lr": 0.0003189978558175056, "tps": 13437, "wall": 50177.3} {"step": 10288, "train_loss": 3.538327693939209, "lr": 0.00031898185502230846, "tps": 13436, "wall": 50185.6} {"step": 10289, "train_loss": 3.5063815116882324, "lr": 0.00031896585310583965, "tps": 13435, "wall": 50193.7} {"step": 10290, "train_loss": 3.489508628845215, "lr": 0.0003189498500682802, "tps": 13434, "wall": 50201.9} {"step": 10291, "train_loss": 3.454850196838379, "lr": 0.0003189338459098116, "tps": 13433, "wall": 50210.1} {"step": 10292, "train_loss": 3.5485646724700928, "lr": 0.0003189178406306149, "tps": 13432, "wall": 50218.4} {"step": 10293, "train_loss": 3.612964391708374, "lr": 0.0003189018342308717, "tps": 13431, "wall": 50226.5} {"step": 10294, "train_loss": 3.651406764984131, "lr": 0.0003188858267107631, "tps": 13430, "wall": 50234.7} {"step": 10295, "train_loss": 3.4354562759399414, "lr": 0.00031886981807047047, "tps": 13429, "wall": 50243.0} {"step": 10296, "train_loss": 3.518230438232422, "lr": 0.0003188538083101753, "tps": 13429, "wall": 50251.1} {"step": 10297, "train_loss": 3.5723419189453125, "lr": 0.00031883779743005876, "tps": 13428, "wall": 50259.5} {"step": 10298, "train_loss": 3.4928531646728516, "lr": 0.00031882178543030234, "tps": 13427, "wall": 50267.7} {"step": 10299, "train_loss": 3.4061763286590576, "lr": 0.00031880577231108734, "tps": 13426, "wall": 50275.9} {"step": 10300, "train_loss": 3.5460402965545654, "lr": 0.00031878975807259524, "tps": 13425, "wall": 50284.1} {"step": 10301, "train_loss": 3.5141549110412598, "lr": 0.00031877374271500745, "tps": 13424, "wall": 50292.4} {"step": 10302, "train_loss": 3.4792113304138184, "lr": 0.0003187577262385053, "tps": 13423, "wall": 50300.5} {"step": 10303, "train_loss": 3.496072292327881, "lr": 0.0003187417086432703, "tps": 13422, "wall": 50308.8} {"step": 10304, "train_loss": 3.4371590614318848, "lr": 0.0003187256899294839, "tps": 13421, "wall": 50316.9} {"step": 10305, "train_loss": 3.4629435539245605, "lr": 0.0003187096700973275, "tps": 13421, "wall": 50325.2} {"step": 10306, "train_loss": 3.455507516860962, "lr": 0.00031869364914698263, "tps": 13420, "wall": 50333.5} {"step": 10307, "train_loss": 3.53786039352417, "lr": 0.00031867762707863084, "tps": 13419, "wall": 50341.7} {"step": 10308, "train_loss": 3.6177194118499756, "lr": 0.0003186616038924534, "tps": 13418, "wall": 50349.9} {"step": 10309, "train_loss": 3.507246255874634, "lr": 0.00031864557958863213, "tps": 13417, "wall": 50358.1} {"step": 10310, "train_loss": 3.4776811599731445, "lr": 0.0003186295541673483, "tps": 13416, "wall": 50366.3} {"step": 10311, "train_loss": 3.395084857940674, "lr": 0.0003186135276287836, "tps": 13415, "wall": 50374.4} {"step": 10312, "train_loss": 3.608011245727539, "lr": 0.00031859749997311944, "tps": 13414, "wall": 50382.6} {"step": 10313, "train_loss": 3.476714849472046, "lr": 0.0003185814712005376, "tps": 13413, "wall": 50391.0} {"step": 10314, "train_loss": 3.556382179260254, "lr": 0.00031856544131121943, "tps": 13412, "wall": 50399.2} {"step": 10315, "train_loss": 3.4043021202087402, "lr": 0.0003185494103053466, "tps": 13412, "wall": 50407.3} {"step": 10316, "train_loss": 3.508375883102417, "lr": 0.00031853337818310074, "tps": 13411, "wall": 50415.5} {"step": 10317, "train_loss": 3.454430103302002, "lr": 0.0003185173449446635, "tps": 13410, "wall": 50423.7} {"step": 10318, "train_loss": 3.6161608695983887, "lr": 0.0003185013105902163, "tps": 13409, "wall": 50432.1} {"step": 10319, "train_loss": 3.467282772064209, "lr": 0.0003184852751199411, "tps": 13408, "wall": 50440.3} {"step": 10320, "train_loss": 3.5151796340942383, "lr": 0.0003184692385340193, "tps": 13407, "wall": 50448.7} {"step": 10321, "train_loss": 3.5413436889648438, "lr": 0.0003184532008326326, "tps": 13406, "wall": 50456.9} {"step": 10322, "train_loss": 3.519500732421875, "lr": 0.0003184371620159628, "tps": 13405, "wall": 50465.1} {"step": 10323, "train_loss": 3.579146385192871, "lr": 0.00031842112208419144, "tps": 13405, "wall": 50473.2} {"step": 10324, "train_loss": 3.5027825832366943, "lr": 0.0003184050810375003, "tps": 13404, "wall": 50481.3} {"step": 10325, "train_loss": 3.4576196670532227, "lr": 0.00031838903887607107, "tps": 13403, "wall": 50489.6} {"step": 10326, "train_loss": 3.478013515472412, "lr": 0.0003183729956000854, "tps": 13402, "wall": 50497.9} {"step": 10327, "train_loss": 3.4344820976257324, "lr": 0.00031835695120972524, "tps": 13401, "wall": 50506.3} {"step": 10328, "train_loss": 3.5562069416046143, "lr": 0.0003183409057051722, "tps": 13400, "wall": 50514.6} {"step": 10329, "train_loss": 3.5088624954223633, "lr": 0.00031832485908660804, "tps": 13399, "wall": 50522.7} {"step": 10330, "train_loss": 3.473226547241211, "lr": 0.00031830881135421456, "tps": 13398, "wall": 50530.9} {"step": 10331, "train_loss": 3.629733085632324, "lr": 0.00031829276250817354, "tps": 13397, "wall": 50539.2} {"step": 10332, "train_loss": 3.543086528778076, "lr": 0.00031827671254866687, "tps": 13396, "wall": 50547.4} {"step": 10333, "train_loss": 3.4750661849975586, "lr": 0.00031826066147587614, "tps": 13396, "wall": 50555.7} {"step": 10334, "train_loss": 3.58270263671875, "lr": 0.0003182446092899834, "tps": 13395, "wall": 50563.9} {"step": 10335, "train_loss": 3.430851697921753, "lr": 0.00031822855599117036, "tps": 13394, "wall": 50572.1} {"step": 10336, "train_loss": 3.5392768383026123, "lr": 0.000318212501579619, "tps": 13393, "wall": 50580.4} {"step": 10337, "train_loss": 3.482908248901367, "lr": 0.000318196446055511, "tps": 13392, "wall": 50588.5} {"step": 10338, "train_loss": 3.451260566711426, "lr": 0.00031818038941902843, "tps": 13391, "wall": 50596.9} {"step": 10339, "train_loss": 3.694000720977783, "lr": 0.00031816433167035314, "tps": 13390, "wall": 50605.0} {"step": 10340, "train_loss": 3.6168723106384277, "lr": 0.0003181482728096669, "tps": 13389, "wall": 50613.4} {"step": 10341, "train_loss": 3.5236029624938965, "lr": 0.0003181322128371517, "tps": 13389, "wall": 50621.6} {"step": 10342, "train_loss": 3.500065803527832, "lr": 0.00031811615175298953, "tps": 13388, "wall": 50630.0} {"step": 10343, "train_loss": 3.427140951156616, "lr": 0.0003181000895573623, "tps": 13387, "wall": 50638.2} {"step": 10344, "train_loss": 3.596066951751709, "lr": 0.00031808402625045195, "tps": 13386, "wall": 50646.5} {"step": 10345, "train_loss": 3.4650630950927734, "lr": 0.0003180679618324404, "tps": 13385, "wall": 50654.7} {"step": 10346, "train_loss": 3.49532413482666, "lr": 0.00031805189630350973, "tps": 13384, "wall": 50662.9} {"step": 10347, "train_loss": 3.5640764236450195, "lr": 0.0003180358296638419, "tps": 13383, "wall": 50671.2} {"step": 10348, "train_loss": 3.4346413612365723, "lr": 0.0003180197619136188, "tps": 13382, "wall": 50679.5} {"step": 10349, "train_loss": 3.472647190093994, "lr": 0.0003180036930530226, "tps": 13381, "wall": 50687.9} {"step": 10350, "train_loss": 3.470735549926758, "lr": 0.0003179876230822352, "tps": 13380, "wall": 50696.1} {"step": 10351, "train_loss": 3.4371423721313477, "lr": 0.00031797155200143876, "tps": 13380, "wall": 50704.3} {"step": 10352, "train_loss": 3.558539867401123, "lr": 0.00031795547981081524, "tps": 13379, "wall": 50712.4} {"step": 10353, "train_loss": 3.4936962127685547, "lr": 0.0003179394065105468, "tps": 13378, "wall": 50720.7} {"step": 10354, "train_loss": 3.537327289581299, "lr": 0.0003179233321008154, "tps": 13377, "wall": 50729.0} {"step": 10355, "train_loss": 3.5437793731689453, "lr": 0.0003179072565818032, "tps": 13376, "wall": 50737.1} {"step": 10356, "train_loss": 3.5441746711730957, "lr": 0.00031789117995369235, "tps": 13375, "wall": 50745.3} {"step": 10357, "train_loss": 3.551731824874878, "lr": 0.0003178751022166649, "tps": 13374, "wall": 50753.6} {"step": 10358, "train_loss": 3.512427806854248, "lr": 0.000317859023370903, "tps": 13373, "wall": 50761.9} {"step": 10359, "train_loss": 3.421010971069336, "lr": 0.00031784294341658876, "tps": 13373, "wall": 50770.1} {"step": 10360, "train_loss": 3.475721836090088, "lr": 0.00031782686235390443, "tps": 13372, "wall": 50778.3} {"step": 10361, "train_loss": 3.556823253631592, "lr": 0.00031781078018303197, "tps": 13371, "wall": 50786.5} {"step": 10362, "train_loss": 3.597414016723633, "lr": 0.00031779469690415384, "tps": 13370, "wall": 50794.7} {"step": 10363, "train_loss": 3.5145955085754395, "lr": 0.000317778612517452, "tps": 13369, "wall": 50802.9} {"step": 10364, "train_loss": 3.531710147857666, "lr": 0.0003177625270231089, "tps": 13368, "wall": 50811.4} {"step": 10365, "train_loss": 3.5036940574645996, "lr": 0.0003177464404213064, "tps": 13367, "wall": 50819.6} {"step": 10366, "train_loss": 3.545095205307007, "lr": 0.00031773035271222706, "tps": 13366, "wall": 50827.8} {"step": 10367, "train_loss": 3.472445249557495, "lr": 0.00031771426389605293, "tps": 13366, "wall": 50836.1} {"step": 10368, "train_loss": 3.4415130615234375, "lr": 0.00031769817397296645, "tps": 13365, "wall": 50844.4} {"step": 10369, "train_loss": 3.5118885040283203, "lr": 0.00031768208294314965, "tps": 13364, "wall": 50852.6} {"step": 10370, "train_loss": 3.4828667640686035, "lr": 0.000317665990806785, "tps": 13363, "wall": 50860.9} {"step": 10371, "train_loss": 3.4844982624053955, "lr": 0.0003176498975640547, "tps": 13362, "wall": 50869.2} {"step": 10372, "train_loss": 3.494235038757324, "lr": 0.00031763380321514105, "tps": 13361, "wall": 50877.4} {"step": 10373, "train_loss": 3.426988124847412, "lr": 0.0003176177077602264, "tps": 13360, "wall": 50885.6} {"step": 10374, "train_loss": 3.556342124938965, "lr": 0.0003176016111994931, "tps": 13359, "wall": 50893.9} {"step": 10375, "train_loss": 3.482740879058838, "lr": 0.00031758551353312347, "tps": 13359, "wall": 50902.0} {"step": 10376, "train_loss": 3.417773723602295, "lr": 0.0003175694147612998, "tps": 13358, "wall": 50910.2} {"step": 10377, "train_loss": 3.5044589042663574, "lr": 0.00031755331488420464, "tps": 13357, "wall": 50918.5} {"step": 10378, "train_loss": 3.556507110595703, "lr": 0.0003175372139020202, "tps": 13356, "wall": 50926.8} {"step": 10379, "train_loss": 3.426182746887207, "lr": 0.00031752111181492887, "tps": 13355, "wall": 50935.1} {"step": 10380, "train_loss": 3.494535446166992, "lr": 0.0003175050086231131, "tps": 13354, "wall": 50943.4} {"step": 10381, "train_loss": 3.556520462036133, "lr": 0.0003174889043267555, "tps": 13353, "wall": 50951.6} {"step": 10382, "train_loss": 3.5639896392822266, "lr": 0.0003174727989260382, "tps": 13352, "wall": 50959.9} {"step": 10383, "train_loss": 3.531994581222534, "lr": 0.0003174566924211437, "tps": 13352, "wall": 50968.1} {"step": 10384, "train_loss": 3.485100269317627, "lr": 0.00031744058481225455, "tps": 13351, "wall": 50976.4} {"step": 10385, "train_loss": 3.453153133392334, "lr": 0.0003174244760995532, "tps": 13350, "wall": 50984.5} {"step": 10386, "train_loss": 3.487797975540161, "lr": 0.0003174083662832221, "tps": 13349, "wall": 50993.0} {"step": 10387, "train_loss": 3.5308971405029297, "lr": 0.00031739225536344377, "tps": 13348, "wall": 51001.2} {"step": 10388, "train_loss": 3.4903604984283447, "lr": 0.0003173761433404007, "tps": 13347, "wall": 51009.5} {"step": 10389, "train_loss": 3.4464778900146484, "lr": 0.00031736003021427546, "tps": 13346, "wall": 51017.7} {"step": 10390, "train_loss": 3.4717392921447754, "lr": 0.0003173439159852504, "tps": 13345, "wall": 51026.1} {"step": 10391, "train_loss": 3.4758379459381104, "lr": 0.0003173278006535083, "tps": 13344, "wall": 51034.4} {"step": 10392, "train_loss": 3.5566558837890625, "lr": 0.0003173116842192316, "tps": 13344, "wall": 51042.6} {"step": 10393, "train_loss": 3.492875099182129, "lr": 0.00031729556668260285, "tps": 13343, "wall": 51050.9} {"step": 10394, "train_loss": 3.4802846908569336, "lr": 0.0003172794480438047, "tps": 13342, "wall": 51059.1} {"step": 10395, "train_loss": 3.485598087310791, "lr": 0.00031726332830301967, "tps": 13341, "wall": 51067.4} {"step": 10396, "train_loss": 3.489410877227783, "lr": 0.0003172472074604304, "tps": 13340, "wall": 51075.5} {"step": 10397, "train_loss": 3.5045881271362305, "lr": 0.00031723108551621944, "tps": 13339, "wall": 51083.9} {"step": 10398, "train_loss": 3.564924478530884, "lr": 0.00031721496247056957, "tps": 13338, "wall": 51092.2} {"step": 10399, "train_loss": 3.5265731811523438, "lr": 0.0003171988383236633, "tps": 13337, "wall": 51100.4} {"step": 10400, "train_loss": 3.4897613525390625, "lr": 0.00031718271307568335, "tps": 13337, "wall": 51108.7} {"step": 10401, "train_loss": 3.5457143783569336, "lr": 0.0003171665867268124, "tps": 13336, "wall": 51117.1} {"step": 10402, "train_loss": 3.6022119522094727, "lr": 0.00031715045927723304, "tps": 13335, "wall": 51125.4} {"step": 10403, "train_loss": 3.4559378623962402, "lr": 0.00031713433072712803, "tps": 13334, "wall": 51133.5} {"step": 10404, "train_loss": 3.5867624282836914, "lr": 0.00031711820107668007, "tps": 13333, "wall": 51141.8} {"step": 10405, "train_loss": 3.5053138732910156, "lr": 0.00031710207032607194, "tps": 13332, "wall": 51150.1} {"step": 10406, "train_loss": 3.495849370956421, "lr": 0.0003170859384754863, "tps": 13331, "wall": 51158.3} {"step": 10407, "train_loss": 3.4401040077209473, "lr": 0.0003170698055251058, "tps": 13330, "wall": 51166.6} {"step": 10408, "train_loss": 3.5589005947113037, "lr": 0.0003170536714751133, "tps": 13330, "wall": 51174.9} {"step": 10409, "train_loss": 3.507164478302002, "lr": 0.00031703753632569164, "tps": 13329, "wall": 51183.1} {"step": 10410, "train_loss": 3.529043197631836, "lr": 0.0003170214000770235, "tps": 13328, "wall": 51191.3} {"step": 10411, "train_loss": 3.5272464752197266, "lr": 0.0003170052627292916, "tps": 13327, "wall": 51199.7} {"step": 10412, "train_loss": 3.412250518798828, "lr": 0.00031698912428267887, "tps": 13326, "wall": 51208.0} {"step": 10413, "train_loss": 3.4918670654296875, "lr": 0.0003169729847373682, "tps": 13325, "wall": 51216.2} {"step": 10414, "train_loss": 3.5231924057006836, "lr": 0.0003169568440935422, "tps": 13324, "wall": 51224.4} {"step": 10415, "train_loss": 3.5059814453125, "lr": 0.00031694070235138385, "tps": 13323, "wall": 51232.7} {"step": 10416, "train_loss": 3.5047287940979004, "lr": 0.00031692455951107604, "tps": 13323, "wall": 51241.0} {"step": 10417, "train_loss": 3.45215106010437, "lr": 0.0003169084155728015, "tps": 13322, "wall": 51249.3} {"step": 10418, "train_loss": 3.5540480613708496, "lr": 0.0003168922705367432, "tps": 13321, "wall": 51257.5} {"step": 10419, "train_loss": 3.695434331893921, "lr": 0.0003168761244030841, "tps": 13320, "wall": 51265.8} {"step": 10420, "train_loss": 3.4584460258483887, "lr": 0.00031685997717200695, "tps": 13319, "wall": 51273.9} {"step": 10421, "train_loss": 3.524322509765625, "lr": 0.0003168438288436947, "tps": 13318, "wall": 51282.2} {"step": 10422, "train_loss": 3.499516248703003, "lr": 0.0003168276794183304, "tps": 13317, "wall": 51290.5} {"step": 10423, "train_loss": 3.439483404159546, "lr": 0.0003168115288960969, "tps": 13316, "wall": 51298.9} {"step": 10424, "train_loss": 3.5620994567871094, "lr": 0.0003167953772771771, "tps": 13316, "wall": 51307.2} {"step": 10425, "train_loss": 3.5961737632751465, "lr": 0.00031677922456175406, "tps": 13315, "wall": 51315.4} {"step": 10426, "train_loss": 3.4557323455810547, "lr": 0.0003167630707500107, "tps": 13314, "wall": 51323.6} {"step": 10427, "train_loss": 3.4596152305603027, "lr": 0.00031674691584213007, "tps": 13313, "wall": 51331.9} {"step": 10428, "train_loss": 3.484553575515747, "lr": 0.00031673075983829513, "tps": 13312, "wall": 51340.1} {"step": 10429, "train_loss": 3.5031161308288574, "lr": 0.00031671460273868893, "tps": 13311, "wall": 51348.4} {"step": 10430, "train_loss": 3.490165948867798, "lr": 0.0003166984445434945, "tps": 13310, "wall": 51356.9} {"step": 10431, "train_loss": 3.4757766723632812, "lr": 0.0003166822852528948, "tps": 13310, "wall": 51365.0} {"step": 10432, "train_loss": 3.4775443077087402, "lr": 0.000316666124867073, "tps": 13309, "wall": 51373.4} {"step": 10433, "train_loss": 3.4589264392852783, "lr": 0.0003166499633862121, "tps": 13308, "wall": 51381.7} {"step": 10434, "train_loss": 3.542668104171753, "lr": 0.00031663380081049515, "tps": 13307, "wall": 51389.9} {"step": 10435, "train_loss": 3.515024423599243, "lr": 0.00031661763714010526, "tps": 13306, "wall": 51398.2} {"step": 10436, "train_loss": 3.478386402130127, "lr": 0.00031660147237522565, "tps": 13305, "wall": 51406.5} {"step": 10437, "train_loss": 3.468170642852783, "lr": 0.00031658530651603925, "tps": 13304, "wall": 51414.8} {"step": 10438, "train_loss": 3.452737808227539, "lr": 0.00031656913956272926, "tps": 13303, "wall": 51423.1} {"step": 10439, "train_loss": 3.529590368270874, "lr": 0.00031655297151547885, "tps": 13303, "wall": 51431.4} {"step": 10440, "train_loss": 3.518021821975708, "lr": 0.0003165368023744712, "tps": 13302, "wall": 51439.6} {"step": 10441, "train_loss": 3.4292149543762207, "lr": 0.0003165206321398894, "tps": 13301, "wall": 51447.9} {"step": 10442, "train_loss": 3.4077768325805664, "lr": 0.0003165044608119166, "tps": 13300, "wall": 51456.2} {"step": 10443, "train_loss": 3.380237340927124, "lr": 0.0003164882883907362, "tps": 13299, "wall": 51464.5} {"step": 10444, "train_loss": 3.4880313873291016, "lr": 0.00031647211487653113, "tps": 13298, "wall": 51472.9} {"step": 10445, "train_loss": 3.4462897777557373, "lr": 0.0003164559402694847, "tps": 13297, "wall": 51481.2} {"step": 10446, "train_loss": 3.458404064178467, "lr": 0.0003164397645697803, "tps": 13296, "wall": 51489.5} {"step": 10447, "train_loss": 3.434096336364746, "lr": 0.00031642358777760087, "tps": 13296, "wall": 51497.7} {"step": 10448, "train_loss": 3.491574287414551, "lr": 0.0003164074098931299, "tps": 13295, "wall": 51506.0} {"step": 10449, "train_loss": 3.4131269454956055, "lr": 0.00031639123091655054, "tps": 13294, "wall": 51514.2} {"step": 10450, "train_loss": 3.509442090988159, "lr": 0.00031637505084804613, "tps": 13293, "wall": 51522.5} {"step": 10451, "train_loss": 3.4912025928497314, "lr": 0.00031635886968779995, "tps": 13292, "wall": 51530.7} {"step": 10452, "train_loss": 3.4966304302215576, "lr": 0.00031634268743599523, "tps": 13291, "wall": 51539.1} {"step": 10453, "train_loss": 3.496762990951538, "lr": 0.0003163265040928154, "tps": 13290, "wall": 51547.3} {"step": 10454, "train_loss": 3.5202958583831787, "lr": 0.00031631031965844363, "tps": 13290, "wall": 51555.7} {"step": 10455, "train_loss": 3.408078193664551, "lr": 0.00031629413413306344, "tps": 13289, "wall": 51563.9} {"step": 10456, "train_loss": 3.5196890830993652, "lr": 0.00031627794751685806, "tps": 13288, "wall": 51572.1} {"step": 10457, "train_loss": 3.550612449645996, "lr": 0.0003162617598100109, "tps": 13287, "wall": 51580.4} {"step": 10458, "train_loss": 3.5725393295288086, "lr": 0.00031624557101270526, "tps": 13286, "wall": 51588.8} {"step": 10459, "train_loss": 3.4898016452789307, "lr": 0.0003162293811251246, "tps": 13285, "wall": 51597.0} {"step": 10460, "train_loss": 3.406953811645508, "lr": 0.00031621319014745234, "tps": 13284, "wall": 51605.2} {"step": 10461, "train_loss": 3.448955535888672, "lr": 0.0003161969980798718, "tps": 13284, "wall": 51613.4} {"step": 10462, "train_loss": 3.497197151184082, "lr": 0.0003161808049225665, "tps": 13283, "wall": 51621.7} {"step": 10463, "train_loss": 3.620532512664795, "lr": 0.00031616461067571986, "tps": 13282, "wall": 51630.0} {"step": 10464, "train_loss": 3.5018537044525146, "lr": 0.00031614841533951526, "tps": 13281, "wall": 51638.2} {"step": 10465, "train_loss": 3.4769577980041504, "lr": 0.0003161322189141362, "tps": 13280, "wall": 51646.7} {"step": 10466, "train_loss": 3.5276877880096436, "lr": 0.0003161160213997662, "tps": 13279, "wall": 51654.9} {"step": 10467, "train_loss": 3.575479507446289, "lr": 0.00031609982279658875, "tps": 13278, "wall": 51663.2} {"step": 10468, "train_loss": 3.4307472705841064, "lr": 0.00031608362310478727, "tps": 13278, "wall": 51671.4} {"step": 10469, "train_loss": 3.514089584350586, "lr": 0.00031606742232454524, "tps": 13277, "wall": 51679.6} {"step": 10470, "train_loss": 3.4608185291290283, "lr": 0.0003160512204560464, "tps": 13276, "wall": 51688.0} {"step": 10471, "train_loss": 3.4324421882629395, "lr": 0.000316035017499474, "tps": 13275, "wall": 51696.0} {"step": 10472, "train_loss": 3.5362815856933594, "lr": 0.0003160188134550118, "tps": 13274, "wall": 51704.4} {"step": 10473, "train_loss": 3.4615981578826904, "lr": 0.0003160026083228433, "tps": 13273, "wall": 51712.6} {"step": 10474, "train_loss": 3.5360727310180664, "lr": 0.000315986402103152, "tps": 13272, "wall": 51720.9} {"step": 10475, "train_loss": 3.5515077114105225, "lr": 0.0003159701947961216, "tps": 13272, "wall": 51729.1} {"step": 10476, "train_loss": 3.3878989219665527, "lr": 0.0003159539864019356, "tps": 13271, "wall": 51737.5} {"step": 10477, "train_loss": 3.4913418292999268, "lr": 0.0003159377769207776, "tps": 13270, "wall": 51745.7} {"step": 10478, "train_loss": 3.4777889251708984, "lr": 0.00031592156635283137, "tps": 13269, "wall": 51753.9} {"step": 10479, "train_loss": 3.57558012008667, "lr": 0.0003159053546982804, "tps": 13268, "wall": 51762.4} {"step": 10480, "train_loss": 3.611492395401001, "lr": 0.00031588914195730845, "tps": 13267, "wall": 51770.7} {"step": 10481, "train_loss": 3.4076006412506104, "lr": 0.000315872928130099, "tps": 13266, "wall": 51779.1} {"step": 10482, "train_loss": 3.486588954925537, "lr": 0.0003158567132168359, "tps": 13266, "wall": 51787.4} {"step": 10483, "train_loss": 3.545973300933838, "lr": 0.00031584049721770273, "tps": 13264, "wall": 51797.4} {"step": 10484, "train_loss": 3.4998960494995117, "lr": 0.00031582428013288334, "tps": 13263, "wall": 51806.0} {"step": 10485, "train_loss": 3.4783482551574707, "lr": 0.00031580806196256116, "tps": 13262, "wall": 51814.4} {"step": 10486, "train_loss": 3.4905624389648438, "lr": 0.00031579184270692014, "tps": 13262, "wall": 51822.6} {"step": 10487, "train_loss": 3.498478651046753, "lr": 0.00031577562236614404, "tps": 13261, "wall": 51830.8} {"step": 10488, "train_loss": 3.5264909267425537, "lr": 0.0003157594009404164, "tps": 13260, "wall": 51838.9} {"step": 10489, "train_loss": 3.5030593872070312, "lr": 0.00031574317842992107, "tps": 13259, "wall": 51847.3} {"step": 10490, "train_loss": 3.586703062057495, "lr": 0.0003157269548348419, "tps": 13258, "wall": 51855.4} {"step": 10491, "train_loss": 3.518813133239746, "lr": 0.0003157107301553626, "tps": 13257, "wall": 51863.7} {"step": 10492, "train_loss": 3.501986265182495, "lr": 0.0003156945043916669, "tps": 13257, "wall": 51872.0} {"step": 10493, "train_loss": 3.532987117767334, "lr": 0.0003156782775439388, "tps": 13256, "wall": 51880.3} {"step": 10494, "train_loss": 3.4223852157592773, "lr": 0.00031566204961236183, "tps": 13255, "wall": 51888.8} {"step": 10495, "train_loss": 3.516467571258545, "lr": 0.0003156458205971201, "tps": 13254, "wall": 51897.1} {"step": 10496, "train_loss": 3.5509941577911377, "lr": 0.00031562959049839735, "tps": 13253, "wall": 51905.2} {"step": 10497, "train_loss": 3.5352020263671875, "lr": 0.00031561335931637734, "tps": 13252, "wall": 51913.4} {"step": 10498, "train_loss": 3.512786388397217, "lr": 0.00031559712705124407, "tps": 13251, "wall": 51921.5} {"step": 10499, "train_loss": 3.438863754272461, "lr": 0.0003155808937031814, "tps": 13251, "wall": 51929.6} {"step": 10500, "train_loss": 3.5775039196014404, "lr": 0.0003155646592723732, "tps": 13250, "wall": 51937.7} {"step": 10501, "train_loss": 3.3970704078674316, "lr": 0.00031554842375900333, "tps": 13249, "wall": 51945.8} {"step": 10502, "train_loss": 3.5679407119750977, "lr": 0.00031553218716325575, "tps": 13248, "wall": 51954.0} {"step": 10503, "train_loss": 3.612276554107666, "lr": 0.00031551594948531436, "tps": 13247, "wall": 51962.0} {"step": 10504, "train_loss": 3.4366579055786133, "lr": 0.0003154997107253632, "tps": 13247, "wall": 51970.1} {"step": 10505, "train_loss": 3.5450758934020996, "lr": 0.0003154834708835861, "tps": 13246, "wall": 51978.2} {"step": 10506, "train_loss": 3.5487589836120605, "lr": 0.0003154672299601671, "tps": 13245, "wall": 51986.3} {"step": 10507, "train_loss": 3.5034849643707275, "lr": 0.0003154509879552901, "tps": 13244, "wall": 51994.3} {"step": 10508, "train_loss": 3.5533971786499023, "lr": 0.0003154347448691392, "tps": 13243, "wall": 52002.4} {"step": 10509, "train_loss": 3.545243263244629, "lr": 0.0003154185007018984, "tps": 13243, "wall": 52010.6} {"step": 10510, "train_loss": 3.551044464111328, "lr": 0.0003154022554537515, "tps": 13242, "wall": 52018.7} {"step": 10511, "train_loss": 3.5104713439941406, "lr": 0.00031538600912488283, "tps": 13241, "wall": 52026.8} {"step": 10512, "train_loss": 3.5533270835876465, "lr": 0.00031536976171547625, "tps": 13240, "wall": 52034.9} {"step": 10513, "train_loss": 3.573791027069092, "lr": 0.0003153535132257158, "tps": 13239, "wall": 52043.0} {"step": 10514, "train_loss": 3.481539011001587, "lr": 0.00031533726365578563, "tps": 13239, "wall": 52051.0} {"step": 10515, "train_loss": 3.503070592880249, "lr": 0.00031532101300586984, "tps": 13238, "wall": 52059.1} {"step": 10516, "train_loss": 3.469925880432129, "lr": 0.0003153047612761524, "tps": 13237, "wall": 52067.3} {"step": 10517, "train_loss": 3.4698920249938965, "lr": 0.0003152885084668174, "tps": 13236, "wall": 52075.5} {"step": 10518, "train_loss": 3.471529006958008, "lr": 0.00031527225457804914, "tps": 13235, "wall": 52083.6} {"step": 10519, "train_loss": 3.574553966522217, "lr": 0.00031525599961003165, "tps": 13235, "wall": 52091.9} {"step": 10520, "train_loss": 3.5278544425964355, "lr": 0.00031523974356294893, "tps": 13234, "wall": 52100.1} {"step": 10521, "train_loss": 3.6022145748138428, "lr": 0.00031522348643698526, "tps": 13233, "wall": 52108.1} {"step": 10522, "train_loss": 3.4853477478027344, "lr": 0.0003152072282323248, "tps": 13232, "wall": 52116.3} {"step": 10523, "train_loss": 3.594017505645752, "lr": 0.0003151909689491518, "tps": 13231, "wall": 52124.4} {"step": 10524, "train_loss": 3.4229118824005127, "lr": 0.0003151747085876502, "tps": 13231, "wall": 52132.5} {"step": 10525, "train_loss": 3.400967597961426, "lr": 0.00031515844714800445, "tps": 13230, "wall": 52140.6} {"step": 10526, "train_loss": 3.497121810913086, "lr": 0.0003151421846303986, "tps": 13229, "wall": 52148.7} {"step": 10527, "train_loss": 3.4782917499542236, "lr": 0.000315125921035017, "tps": 13228, "wall": 52156.8} {"step": 10528, "train_loss": 3.4709506034851074, "lr": 0.0003151096563620438, "tps": 13227, "wall": 52164.7} {"step": 10529, "train_loss": 3.5138254165649414, "lr": 0.00031509339061166325, "tps": 13227, "wall": 52172.8} {"step": 10530, "train_loss": 3.569033145904541, "lr": 0.0003150771237840596, "tps": 13226, "wall": 52180.8} {"step": 10531, "train_loss": 3.3906469345092773, "lr": 0.00031506085587941723, "tps": 13225, "wall": 52189.1} {"step": 10532, "train_loss": 3.430534601211548, "lr": 0.0003150445868979203, "tps": 13224, "wall": 52197.1} {"step": 10533, "train_loss": 3.5274269580841064, "lr": 0.00031502831683975313, "tps": 13223, "wall": 52205.2} {"step": 10534, "train_loss": 3.5692355632781982, "lr": 0.0003150120457051, "tps": 13223, "wall": 52213.3} {"step": 10535, "train_loss": 3.5090041160583496, "lr": 0.0003149957734941454, "tps": 13222, "wall": 52221.4} {"step": 10536, "train_loss": 3.467965602874756, "lr": 0.00031497950020707347, "tps": 13221, "wall": 52229.6} {"step": 10537, "train_loss": 3.4596097469329834, "lr": 0.00031496322584406857, "tps": 13220, "wall": 52237.7} {"step": 10538, "train_loss": 3.51161789894104, "lr": 0.0003149469504053152, "tps": 13219, "wall": 52246.3} {"step": 10539, "train_loss": 3.5551841259002686, "lr": 0.00031493067389099763, "tps": 13218, "wall": 52254.3} {"step": 10540, "train_loss": 3.6094002723693848, "lr": 0.0003149143963013002, "tps": 13218, "wall": 52262.4} {"step": 10541, "train_loss": 3.5571558475494385, "lr": 0.0003148981176364074, "tps": 13217, "wall": 52270.7} {"step": 10542, "train_loss": 3.556973934173584, "lr": 0.0003148818378965035, "tps": 13216, "wall": 52278.8} {"step": 10543, "train_loss": 3.608187198638916, "lr": 0.00031486555708177313, "tps": 13215, "wall": 52286.8} {"step": 10544, "train_loss": 3.610057830810547, "lr": 0.00031484927519240057, "tps": 13215, "wall": 52294.9} {"step": 10545, "train_loss": 3.464723587036133, "lr": 0.0003148329922285703, "tps": 13214, "wall": 52303.0} {"step": 10546, "train_loss": 3.543491840362549, "lr": 0.0003148167081904667, "tps": 13213, "wall": 52311.2} {"step": 10547, "train_loss": 3.50834321975708, "lr": 0.0003148004230782743, "tps": 13212, "wall": 52319.1} {"step": 10548, "train_loss": 3.547520637512207, "lr": 0.00031478413689217763, "tps": 13211, "wall": 52327.2} {"step": 10549, "train_loss": 3.4659786224365234, "lr": 0.0003147678496323611, "tps": 13211, "wall": 52335.2} {"step": 10550, "train_loss": 3.5824320316314697, "lr": 0.0003147515612990092, "tps": 13210, "wall": 52343.3} {"step": 10551, "train_loss": 3.498843193054199, "lr": 0.00031473527189230664, "tps": 13209, "wall": 52351.3} {"step": 10552, "train_loss": 3.533214807510376, "lr": 0.00031471898141243766, "tps": 13208, "wall": 52359.5} {"step": 10553, "train_loss": 3.5554039478302, "lr": 0.0003147026898595869, "tps": 13207, "wall": 52367.6} {"step": 10554, "train_loss": 3.465158700942993, "lr": 0.00031468639723393905, "tps": 13207, "wall": 52375.8} {"step": 10555, "train_loss": 3.5023462772369385, "lr": 0.0003146701035356786, "tps": 13206, "wall": 52383.9} {"step": 10556, "train_loss": 3.5278215408325195, "lr": 0.00031465380876499, "tps": 13205, "wall": 52392.1} {"step": 10557, "train_loss": 3.5649170875549316, "lr": 0.0003146375129220579, "tps": 13204, "wall": 52400.2} {"step": 10558, "train_loss": 3.4404451847076416, "lr": 0.00031462121600706706, "tps": 13203, "wall": 52408.4} {"step": 10559, "train_loss": 3.4642298221588135, "lr": 0.0003146049180202019, "tps": 13203, "wall": 52416.5} {"step": 10560, "train_loss": 3.444683074951172, "lr": 0.00031458861896164705, "tps": 13202, "wall": 52424.6} {"step": 10561, "train_loss": 3.5369226932525635, "lr": 0.00031457231883158727, "tps": 13201, "wall": 52432.8} {"step": 10562, "train_loss": 3.474973201751709, "lr": 0.0003145560176302072, "tps": 13200, "wall": 52440.9} {"step": 10563, "train_loss": 3.5803260803222656, "lr": 0.00031453971535769134, "tps": 13199, "wall": 52449.1} {"step": 10564, "train_loss": 3.461897850036621, "lr": 0.00031452341201422453, "tps": 13199, "wall": 52457.2} {"step": 10565, "train_loss": 3.494988441467285, "lr": 0.0003145071075999914, "tps": 13198, "wall": 52465.2} {"step": 10566, "train_loss": 3.506401538848877, "lr": 0.00031449080211517664, "tps": 13197, "wall": 52473.2} {"step": 10567, "train_loss": 3.516112804412842, "lr": 0.00031447449555996494, "tps": 13196, "wall": 52481.3} {"step": 10568, "train_loss": 3.540487766265869, "lr": 0.0003144581879345411, "tps": 13196, "wall": 52489.4} {"step": 10569, "train_loss": 3.543790340423584, "lr": 0.0003144418792390897, "tps": 13195, "wall": 52497.4} {"step": 10570, "train_loss": 3.383760452270508, "lr": 0.00031442556947379566, "tps": 13194, "wall": 52505.5} {"step": 10571, "train_loss": 3.4943785667419434, "lr": 0.0003144092586388436, "tps": 13193, "wall": 52513.5} {"step": 10572, "train_loss": 3.485474109649658, "lr": 0.00031439294673441844, "tps": 13192, "wall": 52521.5} {"step": 10573, "train_loss": 3.492941379547119, "lr": 0.00031437663376070483, "tps": 13192, "wall": 52529.6} {"step": 10574, "train_loss": 3.636730670928955, "lr": 0.0003143603197178876, "tps": 13191, "wall": 52537.7} {"step": 10575, "train_loss": 3.5324416160583496, "lr": 0.00031434400460615154, "tps": 13190, "wall": 52545.7} {"step": 10576, "train_loss": 3.550673723220825, "lr": 0.0003143276884256815, "tps": 13189, "wall": 52553.9} {"step": 10577, "train_loss": 3.5314762592315674, "lr": 0.00031431137117666233, "tps": 13189, "wall": 52561.9} {"step": 10578, "train_loss": 3.391406536102295, "lr": 0.00031429505285927883, "tps": 13188, "wall": 52569.9} {"step": 10579, "train_loss": 3.5081064701080322, "lr": 0.00031427873347371593, "tps": 13187, "wall": 52577.9} {"step": 10580, "train_loss": 3.5617215633392334, "lr": 0.0003142624130201583, "tps": 13186, "wall": 52586.0} {"step": 10581, "train_loss": 3.55564284324646, "lr": 0.00031424609149879103, "tps": 13185, "wall": 52594.1} {"step": 10582, "train_loss": 3.5064566135406494, "lr": 0.0003142297689097989, "tps": 13185, "wall": 52602.2} {"step": 10583, "train_loss": 3.491793394088745, "lr": 0.0003142134452533669, "tps": 13184, "wall": 52610.3} {"step": 10584, "train_loss": 3.6098077297210693, "lr": 0.00031419712052967993, "tps": 13183, "wall": 52618.5} {"step": 10585, "train_loss": 3.4349801540374756, "lr": 0.0003141807947389228, "tps": 13182, "wall": 52626.6} {"step": 10586, "train_loss": 3.5491297245025635, "lr": 0.0003141644678812806, "tps": 13181, "wall": 52634.7} {"step": 10587, "train_loss": 3.463894844055176, "lr": 0.00031414813995693817, "tps": 13181, "wall": 52642.8} {"step": 10588, "train_loss": 3.4366912841796875, "lr": 0.0003141318109660805, "tps": 13180, "wall": 52650.9} {"step": 10589, "train_loss": 3.498695135116577, "lr": 0.00031411548090889263, "tps": 13179, "wall": 52659.0} {"step": 10590, "train_loss": 3.5280027389526367, "lr": 0.0003140991497855595, "tps": 13178, "wall": 52667.2} {"step": 10591, "train_loss": 3.612408399581909, "lr": 0.0003140828175962661, "tps": 13178, "wall": 52675.4} {"step": 10592, "train_loss": 3.585020065307617, "lr": 0.0003140664843411974, "tps": 13177, "wall": 52683.4} {"step": 10593, "train_loss": 3.5174007415771484, "lr": 0.00031405015002053854, "tps": 13176, "wall": 52691.4} {"step": 10594, "train_loss": 3.435351848602295, "lr": 0.0003140338146344745, "tps": 13175, "wall": 52699.5} {"step": 10595, "train_loss": 3.5157437324523926, "lr": 0.0003140174781831903, "tps": 13174, "wall": 52707.5} {"step": 10596, "train_loss": 3.527817487716675, "lr": 0.000314001140666871, "tps": 13174, "wall": 52715.6} {"step": 10597, "train_loss": 3.4849812984466553, "lr": 0.00031398480208570174, "tps": 13173, "wall": 52723.8} {"step": 10598, "train_loss": 3.475641965866089, "lr": 0.0003139684624398675, "tps": 13172, "wall": 52732.0} {"step": 10599, "train_loss": 3.4205760955810547, "lr": 0.00031395212172955346, "tps": 13171, "wall": 52740.1} {"step": 10600, "train_loss": 3.650681734085083, "lr": 0.0003139357799549447, "tps": 13171, "wall": 52748.2} {"step": 10601, "train_loss": 3.326871156692505, "lr": 0.00031391943711622637, "tps": 13170, "wall": 52756.2} {"step": 10602, "train_loss": 3.548982620239258, "lr": 0.00031390309321358353, "tps": 13169, "wall": 52764.2} {"step": 10603, "train_loss": 3.4605135917663574, "lr": 0.0003138867482472014, "tps": 13168, "wall": 52772.4} {"step": 10604, "train_loss": 3.511017322540283, "lr": 0.00031387040221726514, "tps": 13167, "wall": 52780.5} {"step": 10605, "train_loss": 3.569408893585205, "lr": 0.0003138540551239598, "tps": 13167, "wall": 52788.8} {"step": 10606, "train_loss": 3.5418853759765625, "lr": 0.0003138377069674707, "tps": 13166, "wall": 52796.8} {"step": 10607, "train_loss": 3.446614980697632, "lr": 0.0003138213577479829, "tps": 13165, "wall": 52805.0} {"step": 10608, "train_loss": 3.5503787994384766, "lr": 0.00031380500746568184, "tps": 13164, "wall": 52813.2} {"step": 10609, "train_loss": 3.521385431289673, "lr": 0.00031378865612075247, "tps": 13163, "wall": 52821.3} {"step": 10610, "train_loss": 3.50831937789917, "lr": 0.00031377230371338016, "tps": 13163, "wall": 52829.9} {"step": 10611, "train_loss": 3.4149231910705566, "lr": 0.00031375595024375004, "tps": 13161, "wall": 52839.5} {"step": 10612, "train_loss": 3.5127882957458496, "lr": 0.00031373959571204756, "tps": 13161, "wall": 52847.8} {"step": 10613, "train_loss": 3.44633150100708, "lr": 0.00031372324011845785, "tps": 13160, "wall": 52855.9} {"step": 10614, "train_loss": 3.587749719619751, "lr": 0.0003137068834631662, "tps": 13159, "wall": 52864.1} {"step": 10615, "train_loss": 3.4000868797302246, "lr": 0.00031369052574635784, "tps": 13158, "wall": 52872.5} {"step": 10616, "train_loss": 3.5389907360076904, "lr": 0.00031367416696821823, "tps": 13157, "wall": 52880.8} {"step": 10617, "train_loss": 3.5732579231262207, "lr": 0.00031365780712893255, "tps": 13156, "wall": 52889.2} {"step": 10618, "train_loss": 3.458998680114746, "lr": 0.00031364144622868614, "tps": 13156, "wall": 52897.4} {"step": 10619, "train_loss": 3.514387607574463, "lr": 0.00031362508426766435, "tps": 13155, "wall": 52905.7} {"step": 10620, "train_loss": 3.4152252674102783, "lr": 0.0003136087212460526, "tps": 13154, "wall": 52914.0} {"step": 10621, "train_loss": 3.5138726234436035, "lr": 0.00031359235716403616, "tps": 13153, "wall": 52922.3} {"step": 10622, "train_loss": 3.3867244720458984, "lr": 0.0003135759920218004, "tps": 13152, "wall": 52930.6} {"step": 10623, "train_loss": 3.618004560470581, "lr": 0.0003135596258195308, "tps": 13152, "wall": 52938.9} {"step": 10624, "train_loss": 3.5039241313934326, "lr": 0.0003135432585574126, "tps": 13151, "wall": 52947.2} {"step": 10625, "train_loss": 3.575540542602539, "lr": 0.0003135268902356314, "tps": 13150, "wall": 52955.4} {"step": 10626, "train_loss": 3.5223512649536133, "lr": 0.0003135105208543725, "tps": 13149, "wall": 52963.5} {"step": 10627, "train_loss": 3.4078710079193115, "lr": 0.0003134941504138214, "tps": 13148, "wall": 52971.8} {"step": 10628, "train_loss": 3.487895965576172, "lr": 0.00031347777891416347, "tps": 13148, "wall": 52979.9} {"step": 10629, "train_loss": 3.4384407997131348, "lr": 0.00031346140635558423, "tps": 13147, "wall": 52987.9} {"step": 10630, "train_loss": 3.445646286010742, "lr": 0.0003134450327382691, "tps": 13146, "wall": 52996.1} {"step": 10631, "train_loss": 3.55256724357605, "lr": 0.00031342865806240354, "tps": 13145, "wall": 53004.1} {"step": 10632, "train_loss": 3.569951057434082, "lr": 0.00031341228232817316, "tps": 13144, "wall": 53012.2} {"step": 10633, "train_loss": 3.5130817890167236, "lr": 0.00031339590553576335, "tps": 13144, "wall": 53020.3} {"step": 10634, "train_loss": 3.510833501815796, "lr": 0.0003133795276853597, "tps": 13143, "wall": 53028.5} {"step": 10635, "train_loss": 3.516122341156006, "lr": 0.0003133631487771476, "tps": 13142, "wall": 53036.5} {"step": 10636, "train_loss": 3.4948487281799316, "lr": 0.0003133467688113128, "tps": 13141, "wall": 53044.6} {"step": 10637, "train_loss": 3.54752516746521, "lr": 0.00031333038778804084, "tps": 13141, "wall": 53052.8} {"step": 10638, "train_loss": 3.517084836959839, "lr": 0.00031331400570751706, "tps": 13140, "wall": 53060.8} {"step": 10639, "train_loss": 3.370152473449707, "lr": 0.0003132976225699272, "tps": 13139, "wall": 53068.9} {"step": 10640, "train_loss": 3.504031181335449, "lr": 0.0003132812383754568, "tps": 13138, "wall": 53077.0} {"step": 10641, "train_loss": 3.4125943183898926, "lr": 0.00031326485312429154, "tps": 13138, "wall": 53085.1} {"step": 10642, "train_loss": 3.503849983215332, "lr": 0.000313248466816617, "tps": 13137, "wall": 53093.3} {"step": 10643, "train_loss": 3.496725082397461, "lr": 0.0003132320794526187, "tps": 13136, "wall": 53101.4} {"step": 10644, "train_loss": 3.534715175628662, "lr": 0.0003132156910324824, "tps": 13135, "wall": 53109.6} {"step": 10645, "train_loss": 3.437864065170288, "lr": 0.00031319930155639374, "tps": 13134, "wall": 53117.7} {"step": 10646, "train_loss": 3.4096171855926514, "lr": 0.0003131829110245383, "tps": 13134, "wall": 53125.8} {"step": 10647, "train_loss": 3.559886932373047, "lr": 0.00031316651943710187, "tps": 13133, "wall": 53133.8} {"step": 10648, "train_loss": 3.4784674644470215, "lr": 0.00031315012679426996, "tps": 13132, "wall": 53142.1} {"step": 10649, "train_loss": 3.5063557624816895, "lr": 0.00031313373309622847, "tps": 13131, "wall": 53150.2} {"step": 10650, "train_loss": 3.450915813446045, "lr": 0.00031311733834316297, "tps": 13130, "wall": 53158.6} {"step": 10651, "train_loss": 3.463808536529541, "lr": 0.0003131009425352593, "tps": 13130, "wall": 53166.7} {"step": 10652, "train_loss": 3.500072479248047, "lr": 0.000313084545672703, "tps": 13129, "wall": 53174.8} {"step": 10653, "train_loss": 3.5099735260009766, "lr": 0.00031306814775568, "tps": 13128, "wall": 53182.7} {"step": 10654, "train_loss": 3.4070255756378174, "lr": 0.00031305174878437593, "tps": 13127, "wall": 53190.8} {"step": 10655, "train_loss": 3.465521812438965, "lr": 0.0003130353487589767, "tps": 13127, "wall": 53199.1} {"step": 10656, "train_loss": 3.444242477416992, "lr": 0.00031301894767966795, "tps": 13126, "wall": 53207.3} {"step": 10657, "train_loss": 3.580841541290283, "lr": 0.0003130025455466356, "tps": 13125, "wall": 53215.4} {"step": 10658, "train_loss": 3.514052391052246, "lr": 0.0003129861423600653, "tps": 13124, "wall": 53223.5} {"step": 10659, "train_loss": 3.508863687515259, "lr": 0.000312969738120143, "tps": 13124, "wall": 53231.5} {"step": 10660, "train_loss": 3.4349238872528076, "lr": 0.0003129533328270544, "tps": 13123, "wall": 53239.6} {"step": 10661, "train_loss": 3.540989398956299, "lr": 0.0003129369264809855, "tps": 13122, "wall": 53247.7} {"step": 10662, "train_loss": 3.4715466499328613, "lr": 0.00031292051908212207, "tps": 13121, "wall": 53255.7} {"step": 10663, "train_loss": 3.5095102787017822, "lr": 0.00031290411063064985, "tps": 13121, "wall": 53263.7} {"step": 10664, "train_loss": 3.561492919921875, "lr": 0.00031288770112675494, "tps": 13120, "wall": 53271.9} {"step": 10665, "train_loss": 3.496690273284912, "lr": 0.0003128712905706231, "tps": 13119, "wall": 53279.8} {"step": 10666, "train_loss": 3.4879584312438965, "lr": 0.00031285487896244026, "tps": 13118, "wall": 53287.8} {"step": 10667, "train_loss": 3.4922993183135986, "lr": 0.00031283846630239233, "tps": 13118, "wall": 53295.7} {"step": 10668, "train_loss": 3.4566197395324707, "lr": 0.00031282205259066526, "tps": 13117, "wall": 53303.7} {"step": 10669, "train_loss": 3.5363576412200928, "lr": 0.000312805637827445, "tps": 13116, "wall": 53311.7} {"step": 10670, "train_loss": 3.462369441986084, "lr": 0.00031278922201291733, "tps": 13115, "wall": 53319.8} {"step": 10671, "train_loss": 3.4177486896514893, "lr": 0.00031277280514726836, "tps": 13115, "wall": 53327.9} {"step": 10672, "train_loss": 3.624000072479248, "lr": 0.0003127563872306841, "tps": 13114, "wall": 53335.9} {"step": 10673, "train_loss": 3.5638251304626465, "lr": 0.0003127399682633504, "tps": 13113, "wall": 53343.9} {"step": 10674, "train_loss": 3.3982324600219727, "lr": 0.0003127235482454534, "tps": 13112, "wall": 53352.0} {"step": 10675, "train_loss": 3.403395175933838, "lr": 0.00031270712717717907, "tps": 13112, "wall": 53360.0} {"step": 10676, "train_loss": 3.429802417755127, "lr": 0.0003126907050587132, "tps": 13111, "wall": 53368.0} {"step": 10677, "train_loss": 3.445633888244629, "lr": 0.00031267428189024214, "tps": 13110, "wall": 53376.0} {"step": 10678, "train_loss": 3.414153575897217, "lr": 0.0003126578576719518, "tps": 13109, "wall": 53384.2} {"step": 10679, "train_loss": 3.3118059635162354, "lr": 0.00031264143240402817, "tps": 13109, "wall": 53392.3} {"step": 10680, "train_loss": 3.438661575317383, "lr": 0.00031262500608665746, "tps": 13108, "wall": 53400.3} {"step": 10681, "train_loss": 3.4827535152435303, "lr": 0.0003126085787200256, "tps": 13107, "wall": 53408.4} {"step": 10682, "train_loss": 3.4673964977264404, "lr": 0.0003125921503043188, "tps": 13106, "wall": 53416.4} {"step": 10683, "train_loss": 3.5815703868865967, "lr": 0.00031257572083972303, "tps": 13106, "wall": 53424.5} {"step": 10684, "train_loss": 3.4850172996520996, "lr": 0.0003125592903264246, "tps": 13105, "wall": 53432.6} {"step": 10685, "train_loss": 3.419405937194824, "lr": 0.00031254285876460946, "tps": 13104, "wall": 53440.6} {"step": 10686, "train_loss": 3.4584970474243164, "lr": 0.0003125264261544638, "tps": 13103, "wall": 53448.8} {"step": 10687, "train_loss": 3.417970657348633, "lr": 0.00031250999249617383, "tps": 13103, "wall": 53456.8} {"step": 10688, "train_loss": 3.5640618801116943, "lr": 0.00031249355778992564, "tps": 13102, "wall": 53464.8} {"step": 10689, "train_loss": 3.5956270694732666, "lr": 0.0003124771220359054, "tps": 13101, "wall": 53472.9} {"step": 10690, "train_loss": 3.4743094444274902, "lr": 0.00031246068523429934, "tps": 13100, "wall": 53480.9} {"step": 10691, "train_loss": 3.6605381965637207, "lr": 0.0003124442473852936, "tps": 13100, "wall": 53488.9} {"step": 10692, "train_loss": 3.5773043632507324, "lr": 0.0003124278084890745, "tps": 13099, "wall": 53496.9} {"step": 10693, "train_loss": 3.4335975646972656, "lr": 0.00031241136854582815, "tps": 13098, "wall": 53505.0} {"step": 10694, "train_loss": 3.5752434730529785, "lr": 0.0003123949275557408, "tps": 13097, "wall": 53513.1} {"step": 10695, "train_loss": 3.4664087295532227, "lr": 0.0003123784855189987, "tps": 13097, "wall": 53521.1} {"step": 10696, "train_loss": 3.5256991386413574, "lr": 0.0003123620424357881, "tps": 13096, "wall": 53529.2} {"step": 10697, "train_loss": 3.551503896713257, "lr": 0.00031234559830629535, "tps": 13095, "wall": 53537.2} {"step": 10698, "train_loss": 3.464158296585083, "lr": 0.0003123291531307067, "tps": 13094, "wall": 53545.3} {"step": 10699, "train_loss": 3.4282565116882324, "lr": 0.0003123127069092083, "tps": 13094, "wall": 53553.3} {"step": 10700, "train_loss": 3.505359411239624, "lr": 0.0003122962596419866, "tps": 13093, "wall": 53561.3} {"step": 10701, "train_loss": 3.4999711513519287, "lr": 0.00031227981132922786, "tps": 13092, "wall": 53569.4} {"step": 10702, "train_loss": 3.5281314849853516, "lr": 0.00031226336197111846, "tps": 13091, "wall": 53577.5} {"step": 10703, "train_loss": 3.5267105102539062, "lr": 0.0003122469115678447, "tps": 13091, "wall": 53585.5} {"step": 10704, "train_loss": 3.573758125305176, "lr": 0.0003122304601195929, "tps": 13090, "wall": 53593.6} {"step": 10705, "train_loss": 3.447108745574951, "lr": 0.0003122140076265495, "tps": 13089, "wall": 53601.7} {"step": 10706, "train_loss": 3.5687613487243652, "lr": 0.00031219755408890085, "tps": 13088, "wall": 53609.7} {"step": 10707, "train_loss": 3.5209803581237793, "lr": 0.0003121810995068333, "tps": 13088, "wall": 53617.8} {"step": 10708, "train_loss": 3.466610908508301, "lr": 0.00031216464388053323, "tps": 13087, "wall": 53625.9} {"step": 10709, "train_loss": 3.406717300415039, "lr": 0.0003121481872101871, "tps": 13086, "wall": 53634.1} {"step": 10710, "train_loss": 3.4720964431762695, "lr": 0.00031213172949598136, "tps": 13085, "wall": 53642.2} {"step": 10711, "train_loss": 3.359569549560547, "lr": 0.00031211527073810236, "tps": 13085, "wall": 53650.3} {"step": 10712, "train_loss": 3.441948890686035, "lr": 0.00031209881093673667, "tps": 13084, "wall": 53658.3} {"step": 10713, "train_loss": 3.550614833831787, "lr": 0.0003120823500920706, "tps": 13083, "wall": 53666.3} {"step": 10714, "train_loss": 3.55368709564209, "lr": 0.0003120658882042907, "tps": 13082, "wall": 53674.3} {"step": 10715, "train_loss": 3.490241527557373, "lr": 0.00031204942527358345, "tps": 13082, "wall": 53682.4} {"step": 10716, "train_loss": 3.4673938751220703, "lr": 0.0003120329613001353, "tps": 13081, "wall": 53690.6} {"step": 10717, "train_loss": 3.512209892272949, "lr": 0.00031201649628413274, "tps": 13080, "wall": 53698.7} {"step": 10718, "train_loss": 3.3643269538879395, "lr": 0.0003120000302257624, "tps": 13079, "wall": 53706.9} {"step": 10719, "train_loss": 3.4983832836151123, "lr": 0.0003119835631252108, "tps": 13079, "wall": 53715.1} {"step": 10720, "train_loss": 3.4224085807800293, "lr": 0.00031196709498266433, "tps": 13078, "wall": 53723.1} {"step": 10721, "train_loss": 3.417976140975952, "lr": 0.0003119506257983097, "tps": 13077, "wall": 53731.2} {"step": 10722, "train_loss": 3.4580347537994385, "lr": 0.0003119341555723333, "tps": 13076, "wall": 53739.3} {"step": 10723, "train_loss": 3.5495285987854004, "lr": 0.00031191768430492185, "tps": 13076, "wall": 53747.5} {"step": 10724, "train_loss": 3.5489439964294434, "lr": 0.00031190121199626197, "tps": 13075, "wall": 53755.7} {"step": 10725, "train_loss": 3.4750657081604004, "lr": 0.00031188473864654016, "tps": 13074, "wall": 53763.8} {"step": 10726, "train_loss": 3.3776895999908447, "lr": 0.00031186826425594306, "tps": 13073, "wall": 53771.8} {"step": 10727, "train_loss": 3.4992012977600098, "lr": 0.0003118517888246572, "tps": 13073, "wall": 53780.0} {"step": 10728, "train_loss": 3.4041121006011963, "lr": 0.0003118353123528694, "tps": 13072, "wall": 53788.3} {"step": 10729, "train_loss": 3.596625328063965, "lr": 0.0003118188348407662, "tps": 13071, "wall": 53796.5} {"step": 10730, "train_loss": 3.498392343521118, "lr": 0.00031180235628853423, "tps": 13070, "wall": 53804.6} {"step": 10731, "train_loss": 3.607562780380249, "lr": 0.0003117858766963603, "tps": 13069, "wall": 53812.8} {"step": 10732, "train_loss": 3.5651650428771973, "lr": 0.00031176939606443097, "tps": 13069, "wall": 53820.8} {"step": 10733, "train_loss": 3.521432638168335, "lr": 0.0003117529143929329, "tps": 13068, "wall": 53828.9} {"step": 10734, "train_loss": 3.4090635776519775, "lr": 0.00031173643168205285, "tps": 13067, "wall": 53837.0} {"step": 10735, "train_loss": 3.471663236618042, "lr": 0.00031171994793197756, "tps": 13067, "wall": 53845.0} {"step": 10736, "train_loss": 3.4384593963623047, "lr": 0.0003117034631428937, "tps": 13066, "wall": 53853.5} {"step": 10737, "train_loss": 3.4680047035217285, "lr": 0.0003116869773149881, "tps": 13065, "wall": 53861.6} {"step": 10738, "train_loss": 3.4740443229675293, "lr": 0.00031167049044844743, "tps": 13064, "wall": 53869.9} {"step": 10739, "train_loss": 3.483412742614746, "lr": 0.0003116540025434585, "tps": 13063, "wall": 53878.0} {"step": 10740, "train_loss": 3.516664505004883, "lr": 0.0003116375136002081, "tps": 13063, "wall": 53886.0} {"step": 10741, "train_loss": 3.492826461791992, "lr": 0.000311621023618883, "tps": 13062, "wall": 53894.1} {"step": 10742, "train_loss": 3.449615240097046, "lr": 0.0003116045325996699, "tps": 13061, "wall": 53902.1} {"step": 10743, "train_loss": 3.4298176765441895, "lr": 0.0003115880405427558, "tps": 13060, "wall": 53910.2} {"step": 10744, "train_loss": 3.4941186904907227, "lr": 0.0003115715474483274, "tps": 13060, "wall": 53918.2} {"step": 10745, "train_loss": 3.50502347946167, "lr": 0.00031155505331657146, "tps": 13059, "wall": 53926.5} {"step": 10746, "train_loss": 3.413086414337158, "lr": 0.0003115385581476751, "tps": 13058, "wall": 53934.6} {"step": 10747, "train_loss": 3.40964412689209, "lr": 0.00031152206194182483, "tps": 13057, "wall": 53943.1} {"step": 10748, "train_loss": 3.680368661880493, "lr": 0.00031150556469920776, "tps": 13057, "wall": 53951.2} {"step": 10749, "train_loss": 3.472097158432007, "lr": 0.00031148906642001063, "tps": 13056, "wall": 53959.2} {"step": 10750, "train_loss": 3.574831962585449, "lr": 0.00031147256710442053, "tps": 13055, "wall": 53967.2} {"step": 10751, "train_loss": 3.4848716259002686, "lr": 0.0003114560667526242, "tps": 13054, "wall": 53975.3} {"step": 10752, "train_loss": 3.421964645385742, "lr": 0.0003114395653648085, "tps": 13054, "wall": 53983.3} {"step": 10753, "train_loss": 3.4337406158447266, "lr": 0.00031142306294116055, "tps": 13053, "wall": 53991.5} {"step": 10754, "train_loss": 3.4553425312042236, "lr": 0.0003114065594818672, "tps": 13052, "wall": 53999.5} {"step": 10755, "train_loss": 3.5114405155181885, "lr": 0.0003113900549871154, "tps": 13051, "wall": 54007.6} {"step": 10756, "train_loss": 3.447399377822876, "lr": 0.0003113735494570921, "tps": 13051, "wall": 54015.8} {"step": 10757, "train_loss": 3.6108787059783936, "lr": 0.00031135704289198424, "tps": 13050, "wall": 54023.9} {"step": 10758, "train_loss": 3.446655750274658, "lr": 0.00031134053529197894, "tps": 13049, "wall": 54032.1} {"step": 10759, "train_loss": 3.483835458755493, "lr": 0.00031132402665726307, "tps": 13048, "wall": 54040.1} {"step": 10760, "train_loss": 3.4804210662841797, "lr": 0.0003113075169880237, "tps": 13048, "wall": 54048.3} {"step": 10761, "train_loss": 3.4457755088806152, "lr": 0.00031129100628444784, "tps": 13047, "wall": 54056.4} {"step": 10762, "train_loss": 3.533468723297119, "lr": 0.0003112744945467225, "tps": 13046, "wall": 54064.4} {"step": 10763, "train_loss": 3.5116310119628906, "lr": 0.00031125798177503476, "tps": 13045, "wall": 54072.5} {"step": 10764, "train_loss": 3.504317045211792, "lr": 0.00031124146796957165, "tps": 13045, "wall": 54080.6} {"step": 10765, "train_loss": 3.4971442222595215, "lr": 0.00031122495313052023, "tps": 13044, "wall": 54088.6} {"step": 10766, "train_loss": 3.41679048538208, "lr": 0.0003112084372580677, "tps": 13043, "wall": 54096.7} {"step": 10767, "train_loss": 3.471717119216919, "lr": 0.000311191920352401, "tps": 13043, "wall": 54104.7} {"step": 10768, "train_loss": 3.5288937091827393, "lr": 0.0003111754024137073, "tps": 13042, "wall": 54112.9} {"step": 10769, "train_loss": 3.549187660217285, "lr": 0.00031115888344217366, "tps": 13041, "wall": 54121.1} {"step": 10770, "train_loss": 3.5490849018096924, "lr": 0.00031114236343798737, "tps": 13040, "wall": 54129.1} {"step": 10771, "train_loss": 3.483760356903076, "lr": 0.00031112584240133536, "tps": 13040, "wall": 54137.2} {"step": 10772, "train_loss": 3.4979288578033447, "lr": 0.00031110932033240487, "tps": 13039, "wall": 54145.3} {"step": 10773, "train_loss": 3.3925976753234863, "lr": 0.00031109279723138313, "tps": 13038, "wall": 54153.3} {"step": 10774, "train_loss": 3.4611356258392334, "lr": 0.00031107627309845723, "tps": 13037, "wall": 54161.4} {"step": 10775, "train_loss": 3.413175582885742, "lr": 0.00031105974793381436, "tps": 13037, "wall": 54169.5} {"step": 10776, "train_loss": 3.573223114013672, "lr": 0.00031104322173764175, "tps": 13036, "wall": 54177.6} {"step": 10777, "train_loss": 3.5267984867095947, "lr": 0.00031102669451012665, "tps": 13035, "wall": 54185.7} {"step": 10778, "train_loss": 3.4512155055999756, "lr": 0.0003110101662514562, "tps": 13034, "wall": 54193.8} {"step": 10779, "train_loss": 3.5894625186920166, "lr": 0.0003109936369618176, "tps": 13034, "wall": 54201.9} {"step": 10780, "train_loss": 3.4760451316833496, "lr": 0.00031097710664139823, "tps": 13033, "wall": 54210.1} {"step": 10781, "train_loss": 3.4496967792510986, "lr": 0.0003109605752903853, "tps": 13032, "wall": 54218.3} {"step": 10782, "train_loss": 3.46195125579834, "lr": 0.00031094404290896594, "tps": 13031, "wall": 54226.5} {"step": 10783, "train_loss": 3.6078522205352783, "lr": 0.0003109275094973277, "tps": 13031, "wall": 54234.6} {"step": 10784, "train_loss": 3.4900102615356445, "lr": 0.00031091097505565754, "tps": 13030, "wall": 54242.7} {"step": 10785, "train_loss": 3.5070557594299316, "lr": 0.00031089443958414305, "tps": 13029, "wall": 54250.8} {"step": 10786, "train_loss": 3.4939372539520264, "lr": 0.0003108779030829714, "tps": 13028, "wall": 54258.9} {"step": 10787, "train_loss": 3.504446029663086, "lr": 0.00031086136555232995, "tps": 13028, "wall": 54267.0} {"step": 10788, "train_loss": 3.386019706726074, "lr": 0.00031084482699240604, "tps": 13027, "wall": 54275.2} {"step": 10789, "train_loss": 3.5402016639709473, "lr": 0.00031082828740338703, "tps": 13026, "wall": 54283.3} {"step": 10790, "train_loss": 3.5605504512786865, "lr": 0.0003108117467854602, "tps": 13025, "wall": 54291.6} {"step": 10791, "train_loss": 3.446536064147949, "lr": 0.00031079520513881305, "tps": 13025, "wall": 54299.8} {"step": 10792, "train_loss": 3.559115409851074, "lr": 0.0003107786624636329, "tps": 13024, "wall": 54307.9} {"step": 10793, "train_loss": 3.53560733795166, "lr": 0.0003107621187601072, "tps": 13023, "wall": 54316.0} {"step": 10794, "train_loss": 3.53684663772583, "lr": 0.0003107455740284232, "tps": 13022, "wall": 54324.1} {"step": 10795, "train_loss": 3.636028289794922, "lr": 0.00031072902826876844, "tps": 13022, "wall": 54332.4} {"step": 10796, "train_loss": 3.525041103363037, "lr": 0.0003107124814813304, "tps": 13021, "wall": 54340.6} {"step": 10797, "train_loss": 3.4805119037628174, "lr": 0.00031069593366629645, "tps": 13020, "wall": 54348.9} {"step": 10798, "train_loss": 3.55172061920166, "lr": 0.000310679384823854, "tps": 13019, "wall": 54357.0} {"step": 10799, "train_loss": 3.512402296066284, "lr": 0.00031066283495419065, "tps": 13019, "wall": 54365.1} {"step": 10800, "train_loss": 3.6519370079040527, "lr": 0.00031064628405749376, "tps": 13018, "wall": 54373.2} {"step": 10801, "train_loss": 3.405259609222412, "lr": 0.0003106297321339509, "tps": 13017, "wall": 54381.3} {"step": 10802, "train_loss": 3.561990737915039, "lr": 0.0003106131791837495, "tps": 13016, "wall": 54389.5} {"step": 10803, "train_loss": 3.443010091781616, "lr": 0.0003105966252070771, "tps": 13016, "wall": 54397.8} {"step": 10804, "train_loss": 3.5051279067993164, "lr": 0.00031058007020412124, "tps": 13015, "wall": 54405.8} {"step": 10805, "train_loss": 3.514570474624634, "lr": 0.0003105635141750694, "tps": 13014, "wall": 54414.0} {"step": 10806, "train_loss": 3.4522833824157715, "lr": 0.00031054695712010917, "tps": 13013, "wall": 54422.3} {"step": 10807, "train_loss": 3.5497050285339355, "lr": 0.0003105303990394282, "tps": 13013, "wall": 54430.4} {"step": 10808, "train_loss": 3.482048273086548, "lr": 0.00031051383993321386, "tps": 13012, "wall": 54438.6} {"step": 10809, "train_loss": 3.5328876972198486, "lr": 0.0003104972798016539, "tps": 13011, "wall": 54446.6} {"step": 10810, "train_loss": 3.577528715133667, "lr": 0.00031048071864493595, "tps": 13010, "wall": 54454.7} {"step": 10811, "train_loss": 3.353610038757324, "lr": 0.0003104641564632474, "tps": 13010, "wall": 54462.8} {"step": 10812, "train_loss": 3.4422435760498047, "lr": 0.000310447593256776, "tps": 13009, "wall": 54471.1} {"step": 10813, "train_loss": 3.490546703338623, "lr": 0.0003104310290257094, "tps": 13008, "wall": 54479.3} {"step": 10814, "train_loss": 3.5839061737060547, "lr": 0.0003104144637702353, "tps": 13007, "wall": 54487.5} {"step": 10815, "train_loss": 3.392883777618408, "lr": 0.00031039789749054116, "tps": 13007, "wall": 54495.6} {"step": 10816, "train_loss": 3.5028014183044434, "lr": 0.0003103813301868147, "tps": 13006, "wall": 54503.8} {"step": 10817, "train_loss": 3.6000607013702393, "lr": 0.0003103647618592438, "tps": 13005, "wall": 54512.0} {"step": 10818, "train_loss": 3.5302512645721436, "lr": 0.0003103481925080158, "tps": 13004, "wall": 54520.2} {"step": 10819, "train_loss": 3.5109057426452637, "lr": 0.0003103316221333187, "tps": 13004, "wall": 54528.5} {"step": 10820, "train_loss": 3.437030792236328, "lr": 0.0003103150507353401, "tps": 13003, "wall": 54536.6} {"step": 10821, "train_loss": 3.6049740314483643, "lr": 0.00031029847831426767, "tps": 13002, "wall": 54544.8} {"step": 10822, "train_loss": 3.5102052688598633, "lr": 0.00031028190487028925, "tps": 13001, "wall": 54552.9} {"step": 10823, "train_loss": 3.5593953132629395, "lr": 0.00031026533040359245, "tps": 13001, "wall": 54561.0} {"step": 10824, "train_loss": 3.4356529712677, "lr": 0.0003102487549143652, "tps": 13000, "wall": 54569.2} {"step": 10825, "train_loss": 3.456416606903076, "lr": 0.00031023217840279516, "tps": 12999, "wall": 54577.4} {"step": 10826, "train_loss": 3.5639519691467285, "lr": 0.0003102156008690701, "tps": 12998, "wall": 54585.7} {"step": 10827, "train_loss": 3.5679707527160645, "lr": 0.00031019902231337775, "tps": 12998, "wall": 54593.8} {"step": 10828, "train_loss": 3.6174590587615967, "lr": 0.0003101824427359061, "tps": 12997, "wall": 54602.0} {"step": 10829, "train_loss": 3.473381519317627, "lr": 0.0003101658621368428, "tps": 12996, "wall": 54610.1} {"step": 10830, "train_loss": 3.5037174224853516, "lr": 0.00031014928051637577, "tps": 12996, "wall": 54618.3} {"step": 10831, "train_loss": 3.47458553314209, "lr": 0.00031013269787469284, "tps": 12995, "wall": 54626.4} {"step": 10832, "train_loss": 3.4524853229522705, "lr": 0.00031011611421198176, "tps": 12994, "wall": 54634.7} {"step": 10833, "train_loss": 3.5744712352752686, "lr": 0.0003100995295284305, "tps": 12993, "wall": 54642.9} {"step": 10834, "train_loss": 3.4883761405944824, "lr": 0.0003100829438242269, "tps": 12992, "wall": 54651.3} {"step": 10835, "train_loss": 3.5158090591430664, "lr": 0.00031006635709955886, "tps": 12992, "wall": 54659.3} {"step": 10836, "train_loss": 3.592331886291504, "lr": 0.0003100497693546142, "tps": 12991, "wall": 54667.5} {"step": 10837, "train_loss": 3.422290325164795, "lr": 0.00031003318058958086, "tps": 12990, "wall": 54675.8} {"step": 10838, "train_loss": 3.5044188499450684, "lr": 0.0003100165908046469, "tps": 12990, "wall": 54683.8} {"step": 10839, "train_loss": 3.4767961502075195, "lr": 0.00031, "tps": 12989, "wall": 54692.0} {"step": 10840, "train_loss": 3.5515692234039307, "lr": 0.0003099834081758283, "tps": 12988, "wall": 54700.2} {"step": 10841, "train_loss": 3.4678845405578613, "lr": 0.0003099668153323197, "tps": 12987, "wall": 54708.4} {"step": 10842, "train_loss": 3.4432568550109863, "lr": 0.00030995022146966213, "tps": 12987, "wall": 54716.6} {"step": 10843, "train_loss": 3.495560646057129, "lr": 0.0003099336265880435, "tps": 12986, "wall": 54724.8} {"step": 10844, "train_loss": 3.509814739227295, "lr": 0.000309917030687652, "tps": 12985, "wall": 54733.0} {"step": 10845, "train_loss": 3.59616756439209, "lr": 0.0003099004337686755, "tps": 12984, "wall": 54741.1} {"step": 10846, "train_loss": 3.4684081077575684, "lr": 0.00030988383583130196, "tps": 12984, "wall": 54749.4} {"step": 10847, "train_loss": 3.5155253410339355, "lr": 0.00030986723687571947, "tps": 12983, "wall": 54757.6} {"step": 10848, "train_loss": 3.4705893993377686, "lr": 0.0003098506369021162, "tps": 12982, "wall": 54765.7} {"step": 10849, "train_loss": 3.4301958084106445, "lr": 0.00030983403591067985, "tps": 12981, "wall": 54774.0} {"step": 10850, "train_loss": 3.372957706451416, "lr": 0.0003098174339015988, "tps": 12981, "wall": 54782.1} {"step": 10851, "train_loss": 3.438088893890381, "lr": 0.00030980083087506097, "tps": 12980, "wall": 54790.3} {"step": 10852, "train_loss": 3.475461006164551, "lr": 0.0003097842268312545, "tps": 12979, "wall": 54798.4} {"step": 10853, "train_loss": 3.4371755123138428, "lr": 0.00030976762177036736, "tps": 12978, "wall": 54806.7} {"step": 10854, "train_loss": 3.5080933570861816, "lr": 0.00030975101569258784, "tps": 12978, "wall": 54814.7} {"step": 10855, "train_loss": 3.544560670852661, "lr": 0.00030973440859810396, "tps": 12977, "wall": 54822.9} {"step": 10856, "train_loss": 3.5148186683654785, "lr": 0.0003097178004871038, "tps": 12976, "wall": 54831.2} {"step": 10857, "train_loss": 3.537738084793091, "lr": 0.00030970119135977553, "tps": 12975, "wall": 54839.3} {"step": 10858, "train_loss": 3.5721683502197266, "lr": 0.00030968458121630735, "tps": 12975, "wall": 54847.5} {"step": 10859, "train_loss": 3.6295251846313477, "lr": 0.00030966797005688737, "tps": 12974, "wall": 54855.8} {"step": 10860, "train_loss": 3.5512428283691406, "lr": 0.00030965135788170374, "tps": 12973, "wall": 54864.0} {"step": 10861, "train_loss": 3.487741231918335, "lr": 0.0003096347446909447, "tps": 12972, "wall": 54872.1} {"step": 10862, "train_loss": 3.587461471557617, "lr": 0.0003096181304847985, "tps": 12972, "wall": 54880.4} {"step": 10863, "train_loss": 3.520232915878296, "lr": 0.0003096015152634531, "tps": 12971, "wall": 54888.7} {"step": 10864, "train_loss": 3.5368919372558594, "lr": 0.000309584899027097, "tps": 12970, "wall": 54896.9} {"step": 10865, "train_loss": 3.516641139984131, "lr": 0.0003095682817759184, "tps": 12969, "wall": 54905.1} {"step": 10866, "train_loss": 3.568087100982666, "lr": 0.00030955166351010534, "tps": 12969, "wall": 54913.2} {"step": 10867, "train_loss": 3.5811502933502197, "lr": 0.0003095350442298462, "tps": 12968, "wall": 54921.4} {"step": 10868, "train_loss": 3.548644542694092, "lr": 0.0003095184239353293, "tps": 12967, "wall": 54929.6} {"step": 10869, "train_loss": 3.5656588077545166, "lr": 0.00030950180262674274, "tps": 12966, "wall": 54937.8} {"step": 10870, "train_loss": 3.3538012504577637, "lr": 0.000309485180304275, "tps": 12966, "wall": 54946.0} {"step": 10871, "train_loss": 3.5389151573181152, "lr": 0.00030946855696811423, "tps": 12965, "wall": 54954.2} {"step": 10872, "train_loss": 3.564666986465454, "lr": 0.0003094519326184489, "tps": 12964, "wall": 54962.5} {"step": 10873, "train_loss": 3.4462122917175293, "lr": 0.0003094353072554672, "tps": 12963, "wall": 54970.7} {"step": 10874, "train_loss": 3.5079185962677, "lr": 0.0003094186808793575, "tps": 12963, "wall": 54978.8} {"step": 10875, "train_loss": 3.594658851623535, "lr": 0.0003094020534903082, "tps": 12962, "wall": 54987.0} {"step": 10876, "train_loss": 3.3850936889648438, "lr": 0.0003093854250885075, "tps": 12961, "wall": 54995.3} {"step": 10877, "train_loss": 3.537815809249878, "lr": 0.0003093687956741439, "tps": 12961, "wall": 55003.4} {"step": 10878, "train_loss": 3.5497992038726807, "lr": 0.0003093521652474057, "tps": 12960, "wall": 55011.6} {"step": 10879, "train_loss": 3.4926657676696777, "lr": 0.00030933553380848146, "tps": 12959, "wall": 55019.9} {"step": 10880, "train_loss": 3.5333433151245117, "lr": 0.0003093189013575594, "tps": 12958, "wall": 55028.0} {"step": 10881, "train_loss": 3.5281143188476562, "lr": 0.0003093022678948279, "tps": 12958, "wall": 55036.2} {"step": 10882, "train_loss": 3.5431368350982666, "lr": 0.00030928563342047565, "tps": 12957, "wall": 55044.3} {"step": 10883, "train_loss": 3.455159902572632, "lr": 0.0003092689979346908, "tps": 12956, "wall": 55052.5} {"step": 10884, "train_loss": 3.461258888244629, "lr": 0.00030925236143766196, "tps": 12955, "wall": 55060.6} {"step": 10885, "train_loss": 3.442511796951294, "lr": 0.0003092357239295775, "tps": 12955, "wall": 55068.9} {"step": 10886, "train_loss": 3.5129828453063965, "lr": 0.00030921908541062595, "tps": 12954, "wall": 55077.0} {"step": 10887, "train_loss": 3.524104118347168, "lr": 0.0003092024458809958, "tps": 12953, "wall": 55085.0} {"step": 10888, "train_loss": 3.4489145278930664, "lr": 0.0003091858053408755, "tps": 12952, "wall": 55093.2} {"step": 10889, "train_loss": 3.495222568511963, "lr": 0.00030916916379045357, "tps": 12952, "wall": 55101.4} {"step": 10890, "train_loss": 3.4966797828674316, "lr": 0.00030915252122991853, "tps": 12951, "wall": 55109.6} {"step": 10891, "train_loss": 3.497070789337158, "lr": 0.0003091358776594589, "tps": 12950, "wall": 55117.8} {"step": 10892, "train_loss": 3.507852554321289, "lr": 0.00030911923307926325, "tps": 12950, "wall": 55125.9} {"step": 10893, "train_loss": 3.4195849895477295, "lr": 0.00030910258748952004, "tps": 12949, "wall": 55134.2} {"step": 10894, "train_loss": 3.5289556980133057, "lr": 0.00030908594089041795, "tps": 12948, "wall": 55142.4} {"step": 10895, "train_loss": 3.4546420574188232, "lr": 0.0003090692932821455, "tps": 12947, "wall": 55150.5} {"step": 10896, "train_loss": 3.5811002254486084, "lr": 0.0003090526446648913, "tps": 12947, "wall": 55158.8} {"step": 10897, "train_loss": 3.644320011138916, "lr": 0.0003090359950388439, "tps": 12946, "wall": 55166.9} {"step": 10898, "train_loss": 3.468522310256958, "lr": 0.0003090193444041919, "tps": 12945, "wall": 55175.1} {"step": 10899, "train_loss": 3.455320119857788, "lr": 0.000309002692761124, "tps": 12944, "wall": 55183.3} {"step": 10900, "train_loss": 3.4591612815856934, "lr": 0.00030898604010982873, "tps": 12944, "wall": 55191.5} {"step": 10901, "train_loss": 3.5390663146972656, "lr": 0.00030896938645049484, "tps": 12943, "wall": 55199.8} {"step": 10902, "train_loss": 3.4687740802764893, "lr": 0.0003089527317833109, "tps": 12942, "wall": 55207.8} {"step": 10903, "train_loss": 3.5546703338623047, "lr": 0.0003089360761084656, "tps": 12942, "wall": 55215.9} {"step": 10904, "train_loss": 3.5322458744049072, "lr": 0.0003089194194261476, "tps": 12941, "wall": 55224.0} {"step": 10905, "train_loss": 3.465205192565918, "lr": 0.0003089027617365456, "tps": 12940, "wall": 55232.2} {"step": 10906, "train_loss": 3.528968334197998, "lr": 0.0003088861030398484, "tps": 12939, "wall": 55240.3} {"step": 10907, "train_loss": 3.4864277839660645, "lr": 0.00030886944333624453, "tps": 12939, "wall": 55248.6} {"step": 10908, "train_loss": 3.4726412296295166, "lr": 0.0003088527826259228, "tps": 12938, "wall": 55256.8} {"step": 10909, "train_loss": 3.485138416290283, "lr": 0.00030883612090907203, "tps": 12937, "wall": 55265.0} {"step": 10910, "train_loss": 3.418700695037842, "lr": 0.0003088194581858808, "tps": 12936, "wall": 55273.3} {"step": 10911, "train_loss": 3.461264133453369, "lr": 0.00030880279445653794, "tps": 12936, "wall": 55281.5} {"step": 10912, "train_loss": 3.5557022094726562, "lr": 0.0003087861297212322, "tps": 12935, "wall": 55289.7} {"step": 10913, "train_loss": 3.5258848667144775, "lr": 0.00030876946398015245, "tps": 12934, "wall": 55297.9} {"step": 10914, "train_loss": 3.484492063522339, "lr": 0.00030875279723348737, "tps": 12933, "wall": 55306.3} {"step": 10915, "train_loss": 3.472776412963867, "lr": 0.0003087361294814258, "tps": 12933, "wall": 55314.5} {"step": 10916, "train_loss": 3.4771604537963867, "lr": 0.0003087194607241565, "tps": 12932, "wall": 55322.8} {"step": 10917, "train_loss": 3.4756782054901123, "lr": 0.00030870279096186843, "tps": 12931, "wall": 55331.1} {"step": 10918, "train_loss": 3.388275623321533, "lr": 0.0003086861201947504, "tps": 12930, "wall": 55339.3} {"step": 10919, "train_loss": 3.462675094604492, "lr": 0.00030866944842299104, "tps": 12930, "wall": 55347.6} {"step": 10920, "train_loss": 3.6118597984313965, "lr": 0.0003086527756467795, "tps": 12929, "wall": 55355.8} {"step": 10921, "train_loss": 3.5289413928985596, "lr": 0.0003086361018663045, "tps": 12928, "wall": 55364.0} {"step": 10922, "train_loss": 3.5559611320495605, "lr": 0.00030861942708175483, "tps": 12927, "wall": 55372.4} {"step": 10923, "train_loss": 3.5283331871032715, "lr": 0.0003086027512933196, "tps": 12927, "wall": 55380.5} {"step": 10924, "train_loss": 3.508045196533203, "lr": 0.0003085860745011876, "tps": 12926, "wall": 55388.7} {"step": 10925, "train_loss": 3.4635367393493652, "lr": 0.00030856939670554777, "tps": 12925, "wall": 55396.9} {"step": 10926, "train_loss": 3.460644006729126, "lr": 0.00030855271790658896, "tps": 12925, "wall": 55405.0} {"step": 10927, "train_loss": 3.61106276512146, "lr": 0.00030853603810450023, "tps": 12924, "wall": 55413.2} {"step": 10928, "train_loss": 3.4736812114715576, "lr": 0.00030851935729947044, "tps": 12923, "wall": 55421.3} {"step": 10929, "train_loss": 3.4728329181671143, "lr": 0.0003085026754916886, "tps": 12922, "wall": 55429.5} {"step": 10930, "train_loss": 3.615659713745117, "lr": 0.0003084859926813437, "tps": 12922, "wall": 55437.7} {"step": 10931, "train_loss": 3.4959635734558105, "lr": 0.0003084693088686246, "tps": 12921, "wall": 55445.9} {"step": 10932, "train_loss": 3.5560288429260254, "lr": 0.00030845262405372045, "tps": 12920, "wall": 55454.1} {"step": 10933, "train_loss": 3.508355140686035, "lr": 0.0003084359382368202, "tps": 12919, "wall": 55462.2} {"step": 10934, "train_loss": 3.5526678562164307, "lr": 0.0003084192514181128, "tps": 12919, "wall": 55470.4} {"step": 10935, "train_loss": 3.4685263633728027, "lr": 0.0003084025635977873, "tps": 12918, "wall": 55478.4} {"step": 10936, "train_loss": 3.5196280479431152, "lr": 0.00030838587477603286, "tps": 12917, "wall": 55486.8} {"step": 10937, "train_loss": 3.441643238067627, "lr": 0.00030836918495303847, "tps": 12917, "wall": 55494.8} {"step": 10938, "train_loss": 3.5240607261657715, "lr": 0.0003083524941289931, "tps": 12916, "wall": 55503.0} {"step": 10939, "train_loss": 3.5097856521606445, "lr": 0.000308335802304086, "tps": 12915, "wall": 55511.1} {"step": 10940, "train_loss": 3.59895658493042, "lr": 0.00030831910947850605, "tps": 12914, "wall": 55519.2} {"step": 10941, "train_loss": 3.4302611351013184, "lr": 0.00030830241565244247, "tps": 12914, "wall": 55527.3} {"step": 10942, "train_loss": 3.5094974040985107, "lr": 0.00030828572082608436, "tps": 12913, "wall": 55535.5} {"step": 10943, "train_loss": 3.4805121421813965, "lr": 0.0003082690249996208, "tps": 12912, "wall": 55543.6} {"step": 10944, "train_loss": 3.492178201675415, "lr": 0.000308252328173241, "tps": 12912, "wall": 55551.8} {"step": 10945, "train_loss": 3.4200992584228516, "lr": 0.00030823563034713405, "tps": 12911, "wall": 55559.9} {"step": 10946, "train_loss": 3.4019997119903564, "lr": 0.0003082189315214891, "tps": 12910, "wall": 55568.0} {"step": 10947, "train_loss": 3.5393905639648438, "lr": 0.0003082022316964953, "tps": 12909, "wall": 55576.2} {"step": 10948, "train_loss": 3.452922821044922, "lr": 0.00030818553087234185, "tps": 12909, "wall": 55584.4} {"step": 10949, "train_loss": 3.5161209106445312, "lr": 0.0003081688290492179, "tps": 12908, "wall": 55592.6} {"step": 10950, "train_loss": 3.387075185775757, "lr": 0.00030815212622731274, "tps": 12907, "wall": 55600.8} {"step": 10951, "train_loss": 3.528677463531494, "lr": 0.0003081354224068155, "tps": 12907, "wall": 55609.2} {"step": 10952, "train_loss": 3.4361395835876465, "lr": 0.00030811871758791543, "tps": 12906, "wall": 55617.4} {"step": 10953, "train_loss": 3.448795795440674, "lr": 0.0003081020117708018, "tps": 12905, "wall": 55625.6} {"step": 10954, "train_loss": 3.471677780151367, "lr": 0.0003080853049556638, "tps": 12904, "wall": 55633.9} {"step": 10955, "train_loss": 3.550233840942383, "lr": 0.00030806859714269065, "tps": 12904, "wall": 55642.1} {"step": 10956, "train_loss": 3.5239968299865723, "lr": 0.0003080518883320717, "tps": 12903, "wall": 55650.3} {"step": 10957, "train_loss": 3.4192404747009277, "lr": 0.0003080351785239962, "tps": 12902, "wall": 55658.4} {"step": 10958, "train_loss": 3.561793327331543, "lr": 0.0003080184677186534, "tps": 12901, "wall": 55666.8} {"step": 10959, "train_loss": 3.4624946117401123, "lr": 0.0003080017559162327, "tps": 12901, "wall": 55674.9} {"step": 10960, "train_loss": 3.550884485244751, "lr": 0.0003079850431169233, "tps": 12900, "wall": 55683.1} {"step": 10961, "train_loss": 3.5935559272766113, "lr": 0.00030796832932091455, "tps": 12899, "wall": 55691.3} {"step": 10962, "train_loss": 3.480341911315918, "lr": 0.0003079516145283959, "tps": 12899, "wall": 55699.5} {"step": 10963, "train_loss": 3.432305335998535, "lr": 0.0003079348987395565, "tps": 12898, "wall": 55707.7} {"step": 10964, "train_loss": 3.5241217613220215, "lr": 0.00030791818195458585, "tps": 12897, "wall": 55715.9} {"step": 10965, "train_loss": 3.5035512447357178, "lr": 0.00030790146417367326, "tps": 12896, "wall": 55724.1} {"step": 10966, "train_loss": 3.5968315601348877, "lr": 0.0003078847453970082, "tps": 12896, "wall": 55732.4} {"step": 10967, "train_loss": 3.409081220626831, "lr": 0.00030786802562477995, "tps": 12895, "wall": 55740.5} {"step": 10968, "train_loss": 3.5025393962860107, "lr": 0.0003078513048571779, "tps": 12894, "wall": 55748.8} {"step": 10969, "train_loss": 3.570777416229248, "lr": 0.0003078345830943915, "tps": 12894, "wall": 55756.9} {"step": 10970, "train_loss": 3.5479836463928223, "lr": 0.00030781786033661033, "tps": 12893, "wall": 55765.0} {"step": 10971, "train_loss": 3.4744603633880615, "lr": 0.0003078011365840236, "tps": 12892, "wall": 55773.3} {"step": 10972, "train_loss": 3.452925443649292, "lr": 0.00030778441183682085, "tps": 12891, "wall": 55781.4} {"step": 10973, "train_loss": 3.4760375022888184, "lr": 0.00030776768609519153, "tps": 12891, "wall": 55789.7} {"step": 10974, "train_loss": 3.5720436573028564, "lr": 0.00030775095935932513, "tps": 12890, "wall": 55797.9} {"step": 10975, "train_loss": 3.4528985023498535, "lr": 0.00030773423162941106, "tps": 12889, "wall": 55806.0} {"step": 10976, "train_loss": 3.548248767852783, "lr": 0.00030771750290563895, "tps": 12888, "wall": 55814.3} {"step": 10977, "train_loss": 3.4475669860839844, "lr": 0.00030770077318819814, "tps": 12888, "wall": 55822.4} {"step": 10978, "train_loss": 3.5262351036071777, "lr": 0.0003076840424772783, "tps": 12887, "wall": 55830.8} {"step": 10979, "train_loss": 3.491107702255249, "lr": 0.00030766731077306887, "tps": 12886, "wall": 55839.0} {"step": 10980, "train_loss": 3.670544147491455, "lr": 0.0003076505780757594, "tps": 12886, "wall": 55847.3} {"step": 10981, "train_loss": 3.548281192779541, "lr": 0.0003076338443855394, "tps": 12885, "wall": 55855.6} {"step": 10982, "train_loss": 3.5499765872955322, "lr": 0.00030761710970259845, "tps": 12884, "wall": 55863.9} {"step": 10983, "train_loss": 3.5156378746032715, "lr": 0.00030760037402712616, "tps": 12883, "wall": 55872.2} {"step": 10984, "train_loss": 3.5240495204925537, "lr": 0.0003075836373593122, "tps": 12883, "wall": 55880.5} {"step": 10985, "train_loss": 3.506420850753784, "lr": 0.00030756689969934595, "tps": 12882, "wall": 55888.8} {"step": 10986, "train_loss": 3.3764171600341797, "lr": 0.0003075501610474171, "tps": 12881, "wall": 55897.1} {"step": 10987, "train_loss": 3.492948532104492, "lr": 0.00030753342140371544, "tps": 12880, "wall": 55905.3} {"step": 10988, "train_loss": 3.587563991546631, "lr": 0.0003075166807684303, "tps": 12880, "wall": 55913.7} {"step": 10989, "train_loss": 3.5267727375030518, "lr": 0.0003074999391417515, "tps": 12879, "wall": 55922.0} {"step": 10990, "train_loss": 3.46297025680542, "lr": 0.0003074831965238687, "tps": 12878, "wall": 55930.3} {"step": 10991, "train_loss": 3.488314390182495, "lr": 0.0003074664529149714, "tps": 12877, "wall": 55938.5} {"step": 10992, "train_loss": 3.4905953407287598, "lr": 0.0003074497083152495, "tps": 12877, "wall": 55946.8} {"step": 10993, "train_loss": 3.5788767337799072, "lr": 0.0003074329627248926, "tps": 12876, "wall": 55954.9} {"step": 10994, "train_loss": 3.565948486328125, "lr": 0.0003074162161440903, "tps": 12875, "wall": 55963.2} {"step": 10995, "train_loss": 3.565837860107422, "lr": 0.0003073994685730324, "tps": 12875, "wall": 55971.4} {"step": 10996, "train_loss": 3.550630807876587, "lr": 0.0003073827200119086, "tps": 12874, "wall": 55979.6} {"step": 10997, "train_loss": 3.4938390254974365, "lr": 0.00030736597046090856, "tps": 12873, "wall": 55987.8} {"step": 10998, "train_loss": 3.6056413650512695, "lr": 0.0003073492199202221, "tps": 12872, "wall": 55996.1} {"step": 10999, "train_loss": 3.487731456756592, "lr": 0.000307332468390039, "tps": 12872, "wall": 56004.4} {"step": 11000, "train_loss": 3.5377159118652344, "lr": 0.00030731571587054894, "tps": 12871, "wall": 56012.6, "val_loss_monitor": 3.5291973107180796} {"step": 11001, "train_loss": 3.504690647125244, "lr": 0.0003072989623619418, "tps": 12859, "wall": 56071.6} {"step": 11002, "train_loss": 3.551374912261963, "lr": 0.0003072822078644072, "tps": 12858, "wall": 56079.9} {"step": 11003, "train_loss": 3.4437339305877686, "lr": 0.00030726545237813504, "tps": 12857, "wall": 56088.4} {"step": 11004, "train_loss": 3.515165328979492, "lr": 0.0003072486959033151, "tps": 12856, "wall": 56096.7} {"step": 11005, "train_loss": 3.525773048400879, "lr": 0.00030723193844013727, "tps": 12856, "wall": 56105.0} {"step": 11006, "train_loss": 3.4495656490325928, "lr": 0.0003072151799887913, "tps": 12855, "wall": 56113.3} {"step": 11007, "train_loss": 3.4766554832458496, "lr": 0.000307198420549467, "tps": 12854, "wall": 56121.5} {"step": 11008, "train_loss": 3.5352120399475098, "lr": 0.00030718166012235436, "tps": 12853, "wall": 56129.9} {"step": 11009, "train_loss": 3.523313045501709, "lr": 0.00030716489870764304, "tps": 12853, "wall": 56138.2} {"step": 11010, "train_loss": 3.579554557800293, "lr": 0.0003071481363055231, "tps": 12852, "wall": 56146.9} {"step": 11011, "train_loss": 3.5027034282684326, "lr": 0.00030713137291618446, "tps": 12851, "wall": 56155.0} {"step": 11012, "train_loss": 3.4343793392181396, "lr": 0.0003071146085398168, "tps": 12850, "wall": 56163.3} {"step": 11013, "train_loss": 3.4729504585266113, "lr": 0.0003070978431766101, "tps": 12850, "wall": 56171.7} {"step": 11014, "train_loss": 3.5237741470336914, "lr": 0.00030708107682675444, "tps": 12849, "wall": 56179.9} {"step": 11015, "train_loss": 3.486833095550537, "lr": 0.0003070643094904396, "tps": 12848, "wall": 56188.2} {"step": 11016, "train_loss": 3.4427881240844727, "lr": 0.0003070475411678555, "tps": 12847, "wall": 56196.4} {"step": 11017, "train_loss": 3.4710936546325684, "lr": 0.00030703077185919214, "tps": 12847, "wall": 56204.7} {"step": 11018, "train_loss": 3.5056424140930176, "lr": 0.00030701400156463957, "tps": 12846, "wall": 56213.2} {"step": 11019, "train_loss": 3.4378745555877686, "lr": 0.0003069972302843876, "tps": 12845, "wall": 56221.4} {"step": 11020, "train_loss": 3.44746994972229, "lr": 0.0003069804580186263, "tps": 12845, "wall": 56229.7} {"step": 11021, "train_loss": 3.5627388954162598, "lr": 0.0003069636847675457, "tps": 12844, "wall": 56238.0} {"step": 11022, "train_loss": 3.5370469093322754, "lr": 0.0003069469105313358, "tps": 12843, "wall": 56246.2} {"step": 11023, "train_loss": 3.521371364593506, "lr": 0.0003069301353101866, "tps": 12842, "wall": 56254.6} {"step": 11024, "train_loss": 3.475358486175537, "lr": 0.00030691335910428805, "tps": 12842, "wall": 56262.8} {"step": 11025, "train_loss": 3.622143030166626, "lr": 0.0003068965819138303, "tps": 12841, "wall": 56271.0} {"step": 11026, "train_loss": 3.45951509475708, "lr": 0.0003068798037390034, "tps": 12840, "wall": 56279.2} {"step": 11027, "train_loss": 3.49124813079834, "lr": 0.0003068630245799973, "tps": 12839, "wall": 56287.5} {"step": 11028, "train_loss": 3.4991610050201416, "lr": 0.00030684624443700226, "tps": 12839, "wall": 56295.7} {"step": 11029, "train_loss": 3.4790806770324707, "lr": 0.00030682946331020823, "tps": 12838, "wall": 56303.9} {"step": 11030, "train_loss": 3.5855660438537598, "lr": 0.0003068126811998053, "tps": 12837, "wall": 56312.1} {"step": 11031, "train_loss": 3.4296364784240723, "lr": 0.00030679589810598363, "tps": 12837, "wall": 56320.3} {"step": 11032, "train_loss": 3.592909812927246, "lr": 0.0003067791140289334, "tps": 12836, "wall": 56328.8} {"step": 11033, "train_loss": 3.3830630779266357, "lr": 0.0003067623289688446, "tps": 12835, "wall": 56337.0} {"step": 11034, "train_loss": 3.597156047821045, "lr": 0.00030674554292590744, "tps": 12834, "wall": 56345.2} {"step": 11035, "train_loss": 3.5074024200439453, "lr": 0.00030672875590031216, "tps": 12834, "wall": 56353.4} {"step": 11036, "train_loss": 3.493136405944824, "lr": 0.00030671196789224876, "tps": 12833, "wall": 56361.6} {"step": 11037, "train_loss": 3.4915249347686768, "lr": 0.0003066951789019075, "tps": 12832, "wall": 56369.9} {"step": 11038, "train_loss": 3.488443613052368, "lr": 0.00030667838892947853, "tps": 12832, "wall": 56378.2} {"step": 11039, "train_loss": 3.489638328552246, "lr": 0.00030666159797515226, "tps": 12831, "wall": 56386.7} {"step": 11040, "train_loss": 3.3803861141204834, "lr": 0.00030664480603911855, "tps": 12830, "wall": 56394.8} {"step": 11041, "train_loss": 3.481808662414551, "lr": 0.00030662801312156783, "tps": 12829, "wall": 56403.0} {"step": 11042, "train_loss": 3.4481656551361084, "lr": 0.0003066112192226903, "tps": 12829, "wall": 56411.3} {"step": 11043, "train_loss": 3.412947177886963, "lr": 0.0003065944243426762, "tps": 12828, "wall": 56419.5} {"step": 11044, "train_loss": 3.4244282245635986, "lr": 0.00030657762848171577, "tps": 12827, "wall": 56427.6} {"step": 11045, "train_loss": 3.599123001098633, "lr": 0.00030656083163999926, "tps": 12827, "wall": 56435.8} {"step": 11046, "train_loss": 3.600581169128418, "lr": 0.000306544033817717, "tps": 12826, "wall": 56444.2} {"step": 11047, "train_loss": 3.4738593101501465, "lr": 0.0003065272350150592, "tps": 12825, "wall": 56452.5} {"step": 11048, "train_loss": 3.5089244842529297, "lr": 0.0003065104352322162, "tps": 12824, "wall": 56460.8} {"step": 11049, "train_loss": 3.4250266551971436, "lr": 0.00030649363446937837, "tps": 12824, "wall": 56469.0} {"step": 11050, "train_loss": 3.477961778640747, "lr": 0.0003064768327267359, "tps": 12823, "wall": 56477.3} {"step": 11051, "train_loss": 3.4954833984375, "lr": 0.00030646003000447925, "tps": 12822, "wall": 56485.5} {"step": 11052, "train_loss": 3.5244059562683105, "lr": 0.0003064432263027987, "tps": 12822, "wall": 56494.0} {"step": 11053, "train_loss": 3.392928123474121, "lr": 0.0003064264216218846, "tps": 12821, "wall": 56502.4} {"step": 11054, "train_loss": 3.5877320766448975, "lr": 0.0003064096159619273, "tps": 12820, "wall": 56510.8} {"step": 11055, "train_loss": 3.483440637588501, "lr": 0.0003063928093231172, "tps": 12819, "wall": 56519.0} {"step": 11056, "train_loss": 3.448451519012451, "lr": 0.0003063760017056447, "tps": 12819, "wall": 56527.2} {"step": 11057, "train_loss": 3.516448736190796, "lr": 0.00030635919310970013, "tps": 12818, "wall": 56535.5} {"step": 11058, "train_loss": 3.387467861175537, "lr": 0.00030634238353547397, "tps": 12817, "wall": 56543.7} {"step": 11059, "train_loss": 3.3319692611694336, "lr": 0.00030632557298315667, "tps": 12817, "wall": 56552.0} {"step": 11060, "train_loss": 3.4937939643859863, "lr": 0.00030630876145293855, "tps": 12816, "wall": 56560.3} {"step": 11061, "train_loss": 3.451314926147461, "lr": 0.0003062919489450101, "tps": 12815, "wall": 56568.6} {"step": 11062, "train_loss": 3.503594398498535, "lr": 0.00030627513545956187, "tps": 12814, "wall": 56576.8} {"step": 11063, "train_loss": 3.4859559535980225, "lr": 0.0003062583209967842, "tps": 12814, "wall": 56585.0} {"step": 11064, "train_loss": 3.515254020690918, "lr": 0.00030624150555686754, "tps": 12813, "wall": 56593.2} {"step": 11065, "train_loss": 3.3954825401306152, "lr": 0.00030622468914000246, "tps": 12812, "wall": 56601.4} {"step": 11066, "train_loss": 3.5190858840942383, "lr": 0.00030620787174637953, "tps": 12812, "wall": 56609.6} {"step": 11067, "train_loss": 3.405853748321533, "lr": 0.00030619105337618903, "tps": 12811, "wall": 56617.8} {"step": 11068, "train_loss": 3.534569263458252, "lr": 0.0003061742340296217, "tps": 12810, "wall": 56626.1} {"step": 11069, "train_loss": 3.4698243141174316, "lr": 0.000306157413706868, "tps": 12809, "wall": 56634.4} {"step": 11070, "train_loss": 3.415071487426758, "lr": 0.0003061405924081184, "tps": 12809, "wall": 56642.7} {"step": 11071, "train_loss": 3.379441022872925, "lr": 0.0003061237701335635, "tps": 12808, "wall": 56650.9} {"step": 11072, "train_loss": 3.630204916000366, "lr": 0.0003061069468833939, "tps": 12807, "wall": 56659.1} {"step": 11073, "train_loss": 3.5131888389587402, "lr": 0.0003060901226578002, "tps": 12807, "wall": 56667.3} {"step": 11074, "train_loss": 3.592083692550659, "lr": 0.00030607329745697287, "tps": 12806, "wall": 56675.6} {"step": 11075, "train_loss": 3.503000497817993, "lr": 0.0003060564712811026, "tps": 12805, "wall": 56683.9} {"step": 11076, "train_loss": 3.4998974800109863, "lr": 0.00030603964413038, "tps": 12804, "wall": 56692.3} {"step": 11077, "train_loss": 3.467258930206299, "lr": 0.00030602281600499554, "tps": 12804, "wall": 56700.5} {"step": 11078, "train_loss": 3.4773526191711426, "lr": 0.00030600598690514006, "tps": 12803, "wall": 56708.7} {"step": 11079, "train_loss": 3.430004119873047, "lr": 0.0003059891568310041, "tps": 12802, "wall": 56717.0} {"step": 11080, "train_loss": 3.585875988006592, "lr": 0.0003059723257827783, "tps": 12802, "wall": 56725.2} {"step": 11081, "train_loss": 3.6545140743255615, "lr": 0.00030595549376065336, "tps": 12801, "wall": 56733.5} {"step": 11082, "train_loss": 3.478153705596924, "lr": 0.00030593866076481993, "tps": 12800, "wall": 56741.8} {"step": 11083, "train_loss": 3.5741639137268066, "lr": 0.0003059218267954687, "tps": 12799, "wall": 56750.2} {"step": 11084, "train_loss": 3.436959743499756, "lr": 0.00030590499185279035, "tps": 12799, "wall": 56758.6} {"step": 11085, "train_loss": 3.511289596557617, "lr": 0.0003058881559369756, "tps": 12798, "wall": 56766.9} {"step": 11086, "train_loss": 3.5545082092285156, "lr": 0.0003058713190482152, "tps": 12797, "wall": 56775.1} {"step": 11087, "train_loss": 3.5291213989257812, "lr": 0.0003058544811866998, "tps": 12797, "wall": 56783.3} {"step": 11088, "train_loss": 3.590778112411499, "lr": 0.0003058376423526203, "tps": 12796, "wall": 56791.6} {"step": 11089, "train_loss": 3.442497968673706, "lr": 0.00030582080254616727, "tps": 12795, "wall": 56799.9} {"step": 11090, "train_loss": 3.466726064682007, "lr": 0.00030580396176753155, "tps": 12794, "wall": 56808.2} {"step": 11091, "train_loss": 3.4821038246154785, "lr": 0.00030578712001690393, "tps": 12794, "wall": 56816.5} {"step": 11092, "train_loss": 3.5505483150482178, "lr": 0.0003057702772944751, "tps": 12793, "wall": 56824.7} {"step": 11093, "train_loss": 3.4349563121795654, "lr": 0.00030575343360043607, "tps": 12792, "wall": 56833.0} {"step": 11094, "train_loss": 3.5088143348693848, "lr": 0.00030573658893497737, "tps": 12792, "wall": 56841.3} {"step": 11095, "train_loss": 3.4811649322509766, "lr": 0.00030571974329829, "tps": 12791, "wall": 56849.6} {"step": 11096, "train_loss": 3.5228962898254395, "lr": 0.0003057028966905647, "tps": 12790, "wall": 56857.9} {"step": 11097, "train_loss": 3.3611743450164795, "lr": 0.0003056860491119924, "tps": 12789, "wall": 56866.3} {"step": 11098, "train_loss": 3.5292444229125977, "lr": 0.00030566920056276394, "tps": 12789, "wall": 56874.6} {"step": 11099, "train_loss": 3.399750232696533, "lr": 0.0003056523510430701, "tps": 12788, "wall": 56882.9} {"step": 11100, "train_loss": 3.479059934616089, "lr": 0.0003056355005531018, "tps": 12787, "wall": 56891.3} {"step": 11101, "train_loss": 3.492741107940674, "lr": 0.0003056186490930499, "tps": 12787, "wall": 56899.6} {"step": 11102, "train_loss": 3.4721298217773438, "lr": 0.0003056017966631053, "tps": 12786, "wall": 56907.9} {"step": 11103, "train_loss": 3.461733102798462, "lr": 0.00030558494326345895, "tps": 12785, "wall": 56916.2} {"step": 11104, "train_loss": 3.490598201751709, "lr": 0.0003055680888943017, "tps": 12784, "wall": 56924.5} {"step": 11105, "train_loss": 3.6389708518981934, "lr": 0.0003055512335558245, "tps": 12784, "wall": 56932.9} {"step": 11106, "train_loss": 3.5289676189422607, "lr": 0.0003055343772482183, "tps": 12783, "wall": 56941.2} {"step": 11107, "train_loss": 3.492713212966919, "lr": 0.00030551751997167406, "tps": 12782, "wall": 56949.4} {"step": 11108, "train_loss": 3.529445171356201, "lr": 0.0003055006617263828, "tps": 12782, "wall": 56957.7} {"step": 11109, "train_loss": 3.49442195892334, "lr": 0.0003054838025125353, "tps": 12781, "wall": 56966.0} {"step": 11110, "train_loss": 3.459409475326538, "lr": 0.0003054669423303228, "tps": 12780, "wall": 56974.3} {"step": 11111, "train_loss": 3.540311336517334, "lr": 0.000305450081179936, "tps": 12779, "wall": 56982.6} {"step": 11112, "train_loss": 3.471724033355713, "lr": 0.00030543321906156617, "tps": 12779, "wall": 56991.0} {"step": 11113, "train_loss": 3.4902853965759277, "lr": 0.00030541635597540413, "tps": 12778, "wall": 56999.3} {"step": 11114, "train_loss": 3.531076669692993, "lr": 0.00030539949192164104, "tps": 12777, "wall": 57007.5} {"step": 11115, "train_loss": 3.6004109382629395, "lr": 0.0003053826269004679, "tps": 12777, "wall": 57015.8} {"step": 11116, "train_loss": 3.4850070476531982, "lr": 0.0003053657609120757, "tps": 12776, "wall": 57024.1} {"step": 11117, "train_loss": 3.4996960163116455, "lr": 0.00030534889395665555, "tps": 12775, "wall": 57032.2} {"step": 11118, "train_loss": 3.491441011428833, "lr": 0.00030533202603439855, "tps": 12775, "wall": 57040.5} {"step": 11119, "train_loss": 3.4784786701202393, "lr": 0.0003053151571454957, "tps": 12774, "wall": 57048.9} {"step": 11120, "train_loss": 3.528128147125244, "lr": 0.00030529828729013815, "tps": 12773, "wall": 57057.2} {"step": 11121, "train_loss": 3.600090265274048, "lr": 0.000305281416468517, "tps": 12772, "wall": 57065.4} {"step": 11122, "train_loss": 3.5079758167266846, "lr": 0.0003052645446808233, "tps": 12772, "wall": 57073.6} {"step": 11123, "train_loss": 3.5150156021118164, "lr": 0.0003052476719272483, "tps": 12771, "wall": 57081.9} {"step": 11124, "train_loss": 3.4386205673217773, "lr": 0.000305230798207983, "tps": 12770, "wall": 57090.1} {"step": 11125, "train_loss": 3.5422916412353516, "lr": 0.0003052139235232186, "tps": 12770, "wall": 57098.4} {"step": 11126, "train_loss": 3.3550515174865723, "lr": 0.0003051970478731463, "tps": 12769, "wall": 57106.9} {"step": 11127, "train_loss": 3.4849610328674316, "lr": 0.00030518017125795725, "tps": 12768, "wall": 57115.2} {"step": 11128, "train_loss": 3.4561572074890137, "lr": 0.00030516329367784263, "tps": 12767, "wall": 57123.4} {"step": 11129, "train_loss": 3.5060348510742188, "lr": 0.00030514641513299353, "tps": 12767, "wall": 57131.8} {"step": 11130, "train_loss": 3.545487880706787, "lr": 0.0003051295356236013, "tps": 12766, "wall": 57140.0} {"step": 11131, "train_loss": 3.532752513885498, "lr": 0.00030511265514985707, "tps": 12765, "wall": 57148.3} {"step": 11132, "train_loss": 3.507892608642578, "lr": 0.00030509577371195206, "tps": 12765, "wall": 57156.6} {"step": 11133, "train_loss": 3.4772748947143555, "lr": 0.00030507889131007747, "tps": 12764, "wall": 57164.9} {"step": 11134, "train_loss": 3.499410629272461, "lr": 0.00030506200794442473, "tps": 12763, "wall": 57173.3} {"step": 11135, "train_loss": 3.536367893218994, "lr": 0.00030504512361518486, "tps": 12763, "wall": 57181.6} {"step": 11136, "train_loss": 3.5161428451538086, "lr": 0.00030502823832254924, "tps": 12762, "wall": 57189.9} {"step": 11137, "train_loss": 3.4639954566955566, "lr": 0.00030501135206670917, "tps": 12761, "wall": 57198.2} {"step": 11138, "train_loss": 3.5812268257141113, "lr": 0.0003049944648478559, "tps": 12760, "wall": 57206.6} {"step": 11139, "train_loss": 3.424630641937256, "lr": 0.0003049775766661807, "tps": 12760, "wall": 57215.0} {"step": 11140, "train_loss": 3.4847888946533203, "lr": 0.0003049606875218749, "tps": 12759, "wall": 57223.2} {"step": 11141, "train_loss": 3.528756618499756, "lr": 0.0003049437974151299, "tps": 12758, "wall": 57231.7} {"step": 11142, "train_loss": 3.5576171875, "lr": 0.000304926906346137, "tps": 12758, "wall": 57240.0} {"step": 11143, "train_loss": 3.5430283546447754, "lr": 0.0003049100143150874, "tps": 12757, "wall": 57248.3} {"step": 11144, "train_loss": 3.5656328201293945, "lr": 0.0003048931213221726, "tps": 12756, "wall": 57256.6} {"step": 11145, "train_loss": 3.3888301849365234, "lr": 0.000304876227367584, "tps": 12755, "wall": 57264.9} {"step": 11146, "train_loss": 3.456571578979492, "lr": 0.00030485933245151276, "tps": 12755, "wall": 57273.3} {"step": 11147, "train_loss": 3.4958271980285645, "lr": 0.0003048424365741505, "tps": 12754, "wall": 57281.6} {"step": 11148, "train_loss": 3.562718629837036, "lr": 0.0003048255397356886, "tps": 12753, "wall": 57290.0} {"step": 11149, "train_loss": 3.549555778503418, "lr": 0.0003048086419363183, "tps": 12753, "wall": 57298.3} {"step": 11150, "train_loss": 3.478243827819824, "lr": 0.0003047917431762311, "tps": 12752, "wall": 57306.6} {"step": 11151, "train_loss": 3.518223762512207, "lr": 0.0003047748434556185, "tps": 12751, "wall": 57314.8} {"step": 11152, "train_loss": 3.4973413944244385, "lr": 0.00030475794277467187, "tps": 12750, "wall": 57323.2} {"step": 11153, "train_loss": 3.5270509719848633, "lr": 0.0003047410411335827, "tps": 12750, "wall": 57331.6} {"step": 11154, "train_loss": 3.4994258880615234, "lr": 0.0003047241385325424, "tps": 12749, "wall": 57339.7} {"step": 11155, "train_loss": 3.4995529651641846, "lr": 0.0003047072349717425, "tps": 12748, "wall": 57348.2} {"step": 11156, "train_loss": 3.4312403202056885, "lr": 0.0003046903304513745, "tps": 12748, "wall": 57356.4} {"step": 11157, "train_loss": 3.366912603378296, "lr": 0.00030467342497162976, "tps": 12747, "wall": 57364.7} {"step": 11158, "train_loss": 3.55531907081604, "lr": 0.0003046565185326999, "tps": 12746, "wall": 57373.2} {"step": 11159, "train_loss": 3.4382612705230713, "lr": 0.00030463961113477646, "tps": 12745, "wall": 57381.5} {"step": 11160, "train_loss": 3.5084471702575684, "lr": 0.0003046227027780509, "tps": 12745, "wall": 57389.9} {"step": 11161, "train_loss": 3.487807273864746, "lr": 0.0003046057934627148, "tps": 12744, "wall": 57398.3} {"step": 11162, "train_loss": 3.4785053730010986, "lr": 0.0003045888831889597, "tps": 12743, "wall": 57406.8} {"step": 11163, "train_loss": 3.5472090244293213, "lr": 0.00030457197195697715, "tps": 12743, "wall": 57415.2} {"step": 11164, "train_loss": 3.5192759037017822, "lr": 0.0003045550597669587, "tps": 12742, "wall": 57423.5} {"step": 11165, "train_loss": 3.466245174407959, "lr": 0.000304538146619096, "tps": 12741, "wall": 57431.9} {"step": 11166, "train_loss": 3.441476821899414, "lr": 0.0003045212325135806, "tps": 12740, "wall": 57440.2} {"step": 11167, "train_loss": 3.41451358795166, "lr": 0.00030450431745060404, "tps": 12740, "wall": 57448.6} {"step": 11168, "train_loss": 3.40200138092041, "lr": 0.0003044874014303581, "tps": 12739, "wall": 57456.8} {"step": 11169, "train_loss": 3.4765515327453613, "lr": 0.00030447048445303427, "tps": 12738, "wall": 57465.2} {"step": 11170, "train_loss": 3.3753838539123535, "lr": 0.0003044535665188242, "tps": 12738, "wall": 57473.6} {"step": 11171, "train_loss": 3.5001637935638428, "lr": 0.00030443664762791955, "tps": 12737, "wall": 57481.9} {"step": 11172, "train_loss": 3.409285545349121, "lr": 0.000304419727780512, "tps": 12736, "wall": 57490.1} {"step": 11173, "train_loss": 3.467895984649658, "lr": 0.00030440280697679317, "tps": 12735, "wall": 57498.4} {"step": 11174, "train_loss": 3.5110340118408203, "lr": 0.00030438588521695487, "tps": 12735, "wall": 57506.6} {"step": 11175, "train_loss": 3.5283522605895996, "lr": 0.0003043689625011886, "tps": 12734, "wall": 57514.9} {"step": 11176, "train_loss": 3.4747490882873535, "lr": 0.0003043520388296862, "tps": 12733, "wall": 57523.2} {"step": 11177, "train_loss": 3.4384422302246094, "lr": 0.00030433511420263935, "tps": 12733, "wall": 57531.6} {"step": 11178, "train_loss": 3.472881317138672, "lr": 0.0003043181886202398, "tps": 12732, "wall": 57539.9} {"step": 11179, "train_loss": 3.4586243629455566, "lr": 0.00030430126208267917, "tps": 12731, "wall": 57548.3} {"step": 11180, "train_loss": 3.5073680877685547, "lr": 0.00030428433459014936, "tps": 12731, "wall": 57556.7} {"step": 11181, "train_loss": 3.3901290893554688, "lr": 0.00030426740614284195, "tps": 12730, "wall": 57565.0} {"step": 11182, "train_loss": 3.425386428833008, "lr": 0.00030425047674094885, "tps": 12729, "wall": 57573.3} {"step": 11183, "train_loss": 3.5062971115112305, "lr": 0.0003042335463846618, "tps": 12729, "wall": 57581.4} {"step": 11184, "train_loss": 3.5620100498199463, "lr": 0.0003042166150741726, "tps": 12728, "wall": 57589.9} {"step": 11185, "train_loss": 3.51470947265625, "lr": 0.000304199682809673, "tps": 12727, "wall": 57598.1} {"step": 11186, "train_loss": 3.4502971172332764, "lr": 0.00030418274959135487, "tps": 12726, "wall": 57606.6} {"step": 11187, "train_loss": 3.5205812454223633, "lr": 0.00030416581541940996, "tps": 12726, "wall": 57615.1} {"step": 11188, "train_loss": 3.537111282348633, "lr": 0.0003041488802940302, "tps": 12725, "wall": 57623.3} {"step": 11189, "train_loss": 3.3755970001220703, "lr": 0.00030413194421540727, "tps": 12724, "wall": 57631.8} {"step": 11190, "train_loss": 3.517747640609741, "lr": 0.00030411500718373314, "tps": 12724, "wall": 57640.0} {"step": 11191, "train_loss": 3.5821495056152344, "lr": 0.00030409806919919974, "tps": 12723, "wall": 57648.3} {"step": 11192, "train_loss": 3.5367414951324463, "lr": 0.0003040811302619988, "tps": 12722, "wall": 57656.7} {"step": 11193, "train_loss": 3.5014595985412598, "lr": 0.0003040641903723223, "tps": 12721, "wall": 57666.1} {"step": 11194, "train_loss": 3.533738136291504, "lr": 0.0003040472495303621, "tps": 12720, "wall": 57674.6} {"step": 11195, "train_loss": 3.5019326210021973, "lr": 0.0003040303077363101, "tps": 12720, "wall": 57683.0} {"step": 11196, "train_loss": 3.4411492347717285, "lr": 0.0003040133649903582, "tps": 12719, "wall": 57691.3} {"step": 11197, "train_loss": 3.4687719345092773, "lr": 0.00030399642129269843, "tps": 12718, "wall": 57699.7} {"step": 11198, "train_loss": 3.555968999862671, "lr": 0.0003039794766435225, "tps": 12718, "wall": 57708.3} {"step": 11199, "train_loss": 3.5323314666748047, "lr": 0.0003039625310430227, "tps": 12717, "wall": 57716.7} {"step": 11200, "train_loss": 3.521542549133301, "lr": 0.00030394558449139074, "tps": 12716, "wall": 57724.9} {"step": 11201, "train_loss": 3.5226571559906006, "lr": 0.00030392863698881865, "tps": 12715, "wall": 57733.3} {"step": 11202, "train_loss": 3.4865193367004395, "lr": 0.00030391168853549844, "tps": 12715, "wall": 57741.6} {"step": 11203, "train_loss": 3.5407767295837402, "lr": 0.00030389473913162204, "tps": 12714, "wall": 57750.0} {"step": 11204, "train_loss": 3.5169413089752197, "lr": 0.0003038777887773815, "tps": 12713, "wall": 57758.3} {"step": 11205, "train_loss": 3.547725200653076, "lr": 0.0003038608374729689, "tps": 12713, "wall": 57767.0} {"step": 11206, "train_loss": 3.4625773429870605, "lr": 0.00030384388521857616, "tps": 12712, "wall": 57775.3} {"step": 11207, "train_loss": 3.5289502143859863, "lr": 0.0003038269320143953, "tps": 12711, "wall": 57783.9} {"step": 11208, "train_loss": 3.4402413368225098, "lr": 0.0003038099778606184, "tps": 12710, "wall": 57792.7} {"step": 11209, "train_loss": 3.558957576751709, "lr": 0.00030379302275743765, "tps": 12710, "wall": 57801.3} {"step": 11210, "train_loss": 3.5522611141204834, "lr": 0.000303776066705045, "tps": 12709, "wall": 57809.7} {"step": 11211, "train_loss": 3.4520230293273926, "lr": 0.0003037591097036324, "tps": 12708, "wall": 57818.0} {"step": 11212, "train_loss": 3.469585418701172, "lr": 0.00030374215175339215, "tps": 12707, "wall": 57826.5} {"step": 11213, "train_loss": 3.6060407161712646, "lr": 0.00030372519285451634, "tps": 12707, "wall": 57834.9} {"step": 11214, "train_loss": 3.493288040161133, "lr": 0.00030370823300719695, "tps": 12706, "wall": 57843.2} {"step": 11215, "train_loss": 3.468244791030884, "lr": 0.0003036912722116262, "tps": 12705, "wall": 57851.7} {"step": 11216, "train_loss": 3.510176181793213, "lr": 0.0003036743104679962, "tps": 12705, "wall": 57860.0} {"step": 11217, "train_loss": 3.483344078063965, "lr": 0.000303657347776499, "tps": 12704, "wall": 57868.4} {"step": 11218, "train_loss": 3.5014443397521973, "lr": 0.0003036403841373269, "tps": 12703, "wall": 57876.6} {"step": 11219, "train_loss": 3.4602270126342773, "lr": 0.000303623419550672, "tps": 12703, "wall": 57885.0} {"step": 11220, "train_loss": 3.5405659675598145, "lr": 0.00030360645401672644, "tps": 12702, "wall": 57893.5} {"step": 11221, "train_loss": 3.4881505966186523, "lr": 0.0003035894875356825, "tps": 12701, "wall": 57901.8} {"step": 11222, "train_loss": 3.5495223999023438, "lr": 0.00030357252010773233, "tps": 12700, "wall": 57910.1} {"step": 11223, "train_loss": 3.5053391456604004, "lr": 0.0003035555517330681, "tps": 12700, "wall": 57918.4} {"step": 11224, "train_loss": 3.4509472846984863, "lr": 0.0003035385824118821, "tps": 12699, "wall": 57926.7} {"step": 11225, "train_loss": 3.4330101013183594, "lr": 0.00030352161214436646, "tps": 12698, "wall": 57935.0} {"step": 11226, "train_loss": 3.4946038722991943, "lr": 0.00030350464093071346, "tps": 12698, "wall": 57943.5} {"step": 11227, "train_loss": 3.53757381439209, "lr": 0.00030348766877111543, "tps": 12697, "wall": 57951.9} {"step": 11228, "train_loss": 3.4524803161621094, "lr": 0.0003034706956657645, "tps": 12696, "wall": 57960.3} {"step": 11229, "train_loss": 3.5635101795196533, "lr": 0.00030345372161485313, "tps": 12696, "wall": 57968.6} {"step": 11230, "train_loss": 3.5573229789733887, "lr": 0.00030343674661857336, "tps": 12695, "wall": 57976.7} {"step": 11231, "train_loss": 3.5177836418151855, "lr": 0.0003034197706771177, "tps": 12694, "wall": 57985.1} {"step": 11232, "train_loss": 3.5258264541625977, "lr": 0.0003034027937906784, "tps": 12693, "wall": 57993.6} {"step": 11233, "train_loss": 3.557325839996338, "lr": 0.0003033858159594476, "tps": 12693, "wall": 58001.9} {"step": 11234, "train_loss": 3.4736275672912598, "lr": 0.0003033688371836179, "tps": 12692, "wall": 58010.5} {"step": 11235, "train_loss": 3.431976318359375, "lr": 0.0003033518574633814, "tps": 12691, "wall": 58018.9} {"step": 11236, "train_loss": 3.4073548316955566, "lr": 0.00030333487679893065, "tps": 12691, "wall": 58027.5} {"step": 11237, "train_loss": 3.447896957397461, "lr": 0.0003033178951904578, "tps": 12690, "wall": 58037.1} {"step": 11238, "train_loss": 3.6017024517059326, "lr": 0.00030330091263815537, "tps": 12689, "wall": 58045.5} {"step": 11239, "train_loss": 3.392763614654541, "lr": 0.00030328392914221575, "tps": 12688, "wall": 58053.9} {"step": 11240, "train_loss": 3.441361427307129, "lr": 0.0003032669447028312, "tps": 12687, "wall": 58062.2} {"step": 11241, "train_loss": 3.4421286582946777, "lr": 0.00030324995932019426, "tps": 12687, "wall": 58070.8} {"step": 11242, "train_loss": 3.4520015716552734, "lr": 0.00030323297299449727, "tps": 12686, "wall": 58079.1} {"step": 11243, "train_loss": 3.414140224456787, "lr": 0.0003032159857259326, "tps": 12685, "wall": 58087.6} {"step": 11244, "train_loss": 3.575943946838379, "lr": 0.0003031989975146928, "tps": 12685, "wall": 58095.9} {"step": 11245, "train_loss": 3.5683441162109375, "lr": 0.00030318200836097016, "tps": 12684, "wall": 58104.3} {"step": 11246, "train_loss": 3.5085701942443848, "lr": 0.00030316501826495735, "tps": 12683, "wall": 58112.7} {"step": 11247, "train_loss": 3.510507583618164, "lr": 0.0003031480272268467, "tps": 12682, "wall": 58121.1} {"step": 11248, "train_loss": 3.459773063659668, "lr": 0.0003031310352468306, "tps": 12682, "wall": 58129.7} {"step": 11249, "train_loss": 3.43918514251709, "lr": 0.0003031140423251017, "tps": 12681, "wall": 58138.1} {"step": 11250, "train_loss": 3.4936163425445557, "lr": 0.0003030970484618525, "tps": 12680, "wall": 58146.5} {"step": 11251, "train_loss": 3.518500566482544, "lr": 0.0003030800536572753, "tps": 12680, "wall": 58154.9} {"step": 11252, "train_loss": 3.4854013919830322, "lr": 0.0003030630579115628, "tps": 12679, "wall": 58163.2} {"step": 11253, "train_loss": 3.5274698734283447, "lr": 0.0003030460612249076, "tps": 12678, "wall": 58171.5} {"step": 11254, "train_loss": 3.481670379638672, "lr": 0.000303029063597502, "tps": 12678, "wall": 58179.9} {"step": 11255, "train_loss": 3.4852263927459717, "lr": 0.00030301206502953874, "tps": 12677, "wall": 58188.4} {"step": 11256, "train_loss": 3.5551562309265137, "lr": 0.0003029950655212102, "tps": 12676, "wall": 58196.8} {"step": 11257, "train_loss": 3.5420804023742676, "lr": 0.00030297806507270924, "tps": 12675, "wall": 58205.1} {"step": 11258, "train_loss": 3.4816529750823975, "lr": 0.00030296106368422817, "tps": 12675, "wall": 58213.5} {"step": 11259, "train_loss": 3.495312452316284, "lr": 0.0003029440613559597, "tps": 12674, "wall": 58221.9} {"step": 11260, "train_loss": 3.4212849140167236, "lr": 0.00030292705808809643, "tps": 12673, "wall": 58230.3} {"step": 11261, "train_loss": 3.468095541000366, "lr": 0.00030291005388083093, "tps": 12673, "wall": 58238.7} {"step": 11262, "train_loss": 3.407541275024414, "lr": 0.00030289304873435584, "tps": 12672, "wall": 58247.2} {"step": 11263, "train_loss": 3.5209579467773438, "lr": 0.00030287604264886387, "tps": 12671, "wall": 58255.4} {"step": 11264, "train_loss": 3.347346305847168, "lr": 0.0003028590356245476, "tps": 12671, "wall": 58263.8} {"step": 11265, "train_loss": 3.484569549560547, "lr": 0.0003028420276615996, "tps": 12670, "wall": 58272.1} {"step": 11266, "train_loss": 3.528031587600708, "lr": 0.00030282501876021273, "tps": 12669, "wall": 58280.6} {"step": 11267, "train_loss": 3.433406352996826, "lr": 0.00030280800892057956, "tps": 12668, "wall": 58288.9} {"step": 11268, "train_loss": 3.48636531829834, "lr": 0.0003027909981428927, "tps": 12668, "wall": 58297.3} {"step": 11269, "train_loss": 3.4911935329437256, "lr": 0.00030277398642734497, "tps": 12667, "wall": 58305.7} {"step": 11270, "train_loss": 3.474863290786743, "lr": 0.00030275697377412915, "tps": 12666, "wall": 58314.2} {"step": 11271, "train_loss": 3.5439016819000244, "lr": 0.0003027399601834377, "tps": 12666, "wall": 58322.5} {"step": 11272, "train_loss": 3.493081569671631, "lr": 0.00030272294565546356, "tps": 12665, "wall": 58330.9} {"step": 11273, "train_loss": 3.438699245452881, "lr": 0.00030270593019039943, "tps": 12664, "wall": 58339.4} {"step": 11274, "train_loss": 3.5035533905029297, "lr": 0.0003026889137884381, "tps": 12664, "wall": 58347.8} {"step": 11275, "train_loss": 3.4607648849487305, "lr": 0.00030267189644977223, "tps": 12663, "wall": 58356.1} {"step": 11276, "train_loss": 3.4844584465026855, "lr": 0.00030265487817459464, "tps": 12662, "wall": 58364.4} {"step": 11277, "train_loss": 3.4420413970947266, "lr": 0.00030263785896309816, "tps": 12661, "wall": 58373.1} {"step": 11278, "train_loss": 3.3985602855682373, "lr": 0.0003026208388154755, "tps": 12661, "wall": 58381.5} {"step": 11279, "train_loss": 3.506596088409424, "lr": 0.0003026038177319194, "tps": 12660, "wall": 58389.8} {"step": 11280, "train_loss": 3.5164871215820312, "lr": 0.000302586795712623, "tps": 12659, "wall": 58398.2} {"step": 11281, "train_loss": 3.488039493560791, "lr": 0.0003025697727577788, "tps": 12659, "wall": 58406.6} {"step": 11282, "train_loss": 3.5695323944091797, "lr": 0.00030255274886757975, "tps": 12658, "wall": 58415.0} {"step": 11283, "train_loss": 3.3585619926452637, "lr": 0.0003025357240422187, "tps": 12657, "wall": 58423.4} {"step": 11284, "train_loss": 3.4844324588775635, "lr": 0.0003025186982818885, "tps": 12657, "wall": 58432.0} {"step": 11285, "train_loss": 3.444122791290283, "lr": 0.000302501671586782, "tps": 12656, "wall": 58440.4} {"step": 11286, "train_loss": 3.490353584289551, "lr": 0.00030248464395709213, "tps": 12655, "wall": 58448.8} {"step": 11287, "train_loss": 3.5188145637512207, "lr": 0.0003024676153930118, "tps": 12654, "wall": 58457.3} {"step": 11288, "train_loss": 3.461243152618408, "lr": 0.0003024505858947338, "tps": 12654, "wall": 58465.6} {"step": 11289, "train_loss": 3.3555805683135986, "lr": 0.00030243355546245106, "tps": 12653, "wall": 58474.1} {"step": 11290, "train_loss": 3.4082143306732178, "lr": 0.00030241652409635666, "tps": 12652, "wall": 58482.6} {"step": 11291, "train_loss": 3.3973515033721924, "lr": 0.00030239949179664336, "tps": 12652, "wall": 58491.1} {"step": 11292, "train_loss": 3.4950380325317383, "lr": 0.00030238245856350414, "tps": 12651, "wall": 58499.4} {"step": 11293, "train_loss": 3.5126559734344482, "lr": 0.00030236542439713194, "tps": 12650, "wall": 58507.8} {"step": 11294, "train_loss": 3.4351308345794678, "lr": 0.00030234838929771985, "tps": 12649, "wall": 58516.2} {"step": 11295, "train_loss": 3.482739210128784, "lr": 0.0003023313532654607, "tps": 12649, "wall": 58524.6} {"step": 11296, "train_loss": 3.444272041320801, "lr": 0.0003023143163005475, "tps": 12648, "wall": 58533.1} {"step": 11297, "train_loss": 3.4748053550720215, "lr": 0.00030229727840317333, "tps": 12647, "wall": 58541.5} {"step": 11298, "train_loss": 3.532555341720581, "lr": 0.00030228023957353103, "tps": 12647, "wall": 58550.0} {"step": 11299, "train_loss": 3.5307929515838623, "lr": 0.00030226319981181384, "tps": 12646, "wall": 58558.4} {"step": 11300, "train_loss": 3.455350399017334, "lr": 0.00030224615911821464, "tps": 12645, "wall": 58566.8} {"step": 11301, "train_loss": 3.5198726654052734, "lr": 0.0003022291174929265, "tps": 12645, "wall": 58575.1} {"step": 11302, "train_loss": 3.3926641941070557, "lr": 0.0003022120749361424, "tps": 12644, "wall": 58583.5} {"step": 11303, "train_loss": 3.418834686279297, "lr": 0.00030219503144805553, "tps": 12643, "wall": 58591.9} {"step": 11304, "train_loss": 3.458432674407959, "lr": 0.00030217798702885897, "tps": 12643, "wall": 58600.4} {"step": 11305, "train_loss": 3.469493865966797, "lr": 0.00030216094167874566, "tps": 12642, "wall": 58608.9} {"step": 11306, "train_loss": 3.368929862976074, "lr": 0.0003021438953979087, "tps": 12641, "wall": 58617.4} {"step": 11307, "train_loss": 3.4239492416381836, "lr": 0.00030212684818654135, "tps": 12640, "wall": 58625.8} {"step": 11308, "train_loss": 3.5426218509674072, "lr": 0.0003021098000448366, "tps": 12640, "wall": 58634.2} {"step": 11309, "train_loss": 3.503600597381592, "lr": 0.0003020927509729875, "tps": 12639, "wall": 58642.6} {"step": 11310, "train_loss": 3.464830160140991, "lr": 0.00030207570097118736, "tps": 12638, "wall": 58651.0} {"step": 11311, "train_loss": 3.3538818359375, "lr": 0.00030205865003962923, "tps": 12638, "wall": 58659.4} {"step": 11312, "train_loss": 3.5267839431762695, "lr": 0.00030204159817850626, "tps": 12637, "wall": 58667.9} {"step": 11313, "train_loss": 3.355067729949951, "lr": 0.0003020245453880116, "tps": 12636, "wall": 58676.5} {"step": 11314, "train_loss": 3.3843629360198975, "lr": 0.00030200749166833855, "tps": 12635, "wall": 58684.8} {"step": 11315, "train_loss": 3.4132814407348633, "lr": 0.0003019904370196801, "tps": 12635, "wall": 58693.2} {"step": 11316, "train_loss": 3.5848963260650635, "lr": 0.00030197338144222956, "tps": 12634, "wall": 58701.6} {"step": 11317, "train_loss": 3.430349588394165, "lr": 0.00030195632493618016, "tps": 12633, "wall": 58710.1} {"step": 11318, "train_loss": 3.5098624229431152, "lr": 0.00030193926750172507, "tps": 12633, "wall": 58718.6} {"step": 11319, "train_loss": 3.4160709381103516, "lr": 0.00030192220913905746, "tps": 12632, "wall": 58727.2} {"step": 11320, "train_loss": 3.465723991394043, "lr": 0.0003019051498483707, "tps": 12631, "wall": 58735.7} {"step": 11321, "train_loss": 3.4899539947509766, "lr": 0.000301888089629858, "tps": 12630, "wall": 58744.3} {"step": 11322, "train_loss": 3.4898595809936523, "lr": 0.00030187102848371246, "tps": 12630, "wall": 58752.8} {"step": 11323, "train_loss": 3.548917770385742, "lr": 0.0003018539664101276, "tps": 12629, "wall": 58761.1} {"step": 11324, "train_loss": 3.5024302005767822, "lr": 0.0003018369034092965, "tps": 12628, "wall": 58769.6} {"step": 11325, "train_loss": 3.5024733543395996, "lr": 0.0003018198394814126, "tps": 12628, "wall": 58778.0} {"step": 11326, "train_loss": 3.5559542179107666, "lr": 0.00030180277462666906, "tps": 12627, "wall": 58786.5} {"step": 11327, "train_loss": 3.458176612854004, "lr": 0.00030178570884525934, "tps": 12626, "wall": 58795.0} {"step": 11328, "train_loss": 3.5219876766204834, "lr": 0.00030176864213737664, "tps": 12626, "wall": 58803.4} {"step": 11329, "train_loss": 3.413116216659546, "lr": 0.0003017515745032144, "tps": 12625, "wall": 58811.9} {"step": 11330, "train_loss": 3.4244260787963867, "lr": 0.00030173450594296586, "tps": 12624, "wall": 58820.4} {"step": 11331, "train_loss": 3.5066378116607666, "lr": 0.0003017174364568244, "tps": 12623, "wall": 58828.8} {"step": 11332, "train_loss": 3.4149184226989746, "lr": 0.00030170036604498346, "tps": 12623, "wall": 58837.1} {"step": 11333, "train_loss": 3.5144741535186768, "lr": 0.0003016832947076363, "tps": 12622, "wall": 58845.6} {"step": 11334, "train_loss": 3.6157326698303223, "lr": 0.0003016662224449763, "tps": 12621, "wall": 58854.3} {"step": 11335, "train_loss": 3.5412955284118652, "lr": 0.000301649149257197, "tps": 12621, "wall": 58862.8} {"step": 11336, "train_loss": 3.5423083305358887, "lr": 0.0003016320751444917, "tps": 12620, "wall": 58871.4} {"step": 11337, "train_loss": 3.476144790649414, "lr": 0.00030161500010705383, "tps": 12619, "wall": 58879.7} {"step": 11338, "train_loss": 3.5574607849121094, "lr": 0.00030159792414507684, "tps": 12619, "wall": 58888.1} {"step": 11339, "train_loss": 3.471309185028076, "lr": 0.0003015808472587541, "tps": 12618, "wall": 58896.5} {"step": 11340, "train_loss": 3.5829358100891113, "lr": 0.00030156376944827915, "tps": 12617, "wall": 58905.0} {"step": 11341, "train_loss": 3.5056614875793457, "lr": 0.00030154669071384536, "tps": 12616, "wall": 58913.6} {"step": 11342, "train_loss": 3.5192441940307617, "lr": 0.00030152961105564633, "tps": 12616, "wall": 58922.0} {"step": 11343, "train_loss": 3.5419013500213623, "lr": 0.0003015125304738754, "tps": 12615, "wall": 58930.5} {"step": 11344, "train_loss": 3.3946821689605713, "lr": 0.00030149544896872617, "tps": 12614, "wall": 58939.0} {"step": 11345, "train_loss": 3.4588706493377686, "lr": 0.000301478366540392, "tps": 12614, "wall": 58947.4} {"step": 11346, "train_loss": 3.510672092437744, "lr": 0.00030146128318906654, "tps": 12613, "wall": 58955.8} {"step": 11347, "train_loss": 3.622391700744629, "lr": 0.00030144419891494327, "tps": 12612, "wall": 58964.2} {"step": 11348, "train_loss": 3.5863492488861084, "lr": 0.0003014271137182156, "tps": 12612, "wall": 58972.8} {"step": 11349, "train_loss": 3.4971799850463867, "lr": 0.0003014100275990773, "tps": 12611, "wall": 58981.3} {"step": 11350, "train_loss": 3.4709486961364746, "lr": 0.00030139294055772176, "tps": 12610, "wall": 58989.7} {"step": 11351, "train_loss": 3.4040660858154297, "lr": 0.00030137585259434267, "tps": 12609, "wall": 58998.2} {"step": 11352, "train_loss": 3.5405521392822266, "lr": 0.0003013587637091334, "tps": 12609, "wall": 59006.7} {"step": 11353, "train_loss": 3.529179573059082, "lr": 0.0003013416739022877, "tps": 12608, "wall": 59015.1} {"step": 11354, "train_loss": 3.4131674766540527, "lr": 0.0003013245831739991, "tps": 12607, "wall": 59023.5} {"step": 11355, "train_loss": 3.4922256469726562, "lr": 0.0003013074915244613, "tps": 12607, "wall": 59032.1} {"step": 11356, "train_loss": 3.55609393119812, "lr": 0.00030129039895386773, "tps": 12606, "wall": 59040.6} {"step": 11357, "train_loss": 3.524233818054199, "lr": 0.00030127330546241216, "tps": 12605, "wall": 59048.9} {"step": 11358, "train_loss": 3.518939256668091, "lr": 0.0003012562110502882, "tps": 12605, "wall": 59057.4} {"step": 11359, "train_loss": 3.4354207515716553, "lr": 0.0003012391157176895, "tps": 12604, "wall": 59065.9} {"step": 11360, "train_loss": 3.4698538780212402, "lr": 0.00030122201946480967, "tps": 12603, "wall": 59074.4} {"step": 11361, "train_loss": 3.3553576469421387, "lr": 0.00030120492229184246, "tps": 12602, "wall": 59082.9} {"step": 11362, "train_loss": 3.53228759765625, "lr": 0.00030118782419898143, "tps": 12602, "wall": 59091.4} {"step": 11363, "train_loss": 3.5694267749786377, "lr": 0.00030117072518642037, "tps": 12601, "wall": 59099.8} {"step": 11364, "train_loss": 3.4500415325164795, "lr": 0.0003011536252543529, "tps": 12600, "wall": 59108.3} {"step": 11365, "train_loss": 3.4715654850006104, "lr": 0.00030113652440297284, "tps": 12600, "wall": 59116.8} {"step": 11366, "train_loss": 3.4585835933685303, "lr": 0.00030111942263247386, "tps": 12599, "wall": 59125.2} {"step": 11367, "train_loss": 3.6763598918914795, "lr": 0.00030110231994304957, "tps": 12598, "wall": 59133.6} {"step": 11368, "train_loss": 3.602174997329712, "lr": 0.0003010852163348939, "tps": 12598, "wall": 59142.1} {"step": 11369, "train_loss": 3.5188698768615723, "lr": 0.0003010681118082005, "tps": 12597, "wall": 59150.7} {"step": 11370, "train_loss": 3.4684834480285645, "lr": 0.0003010510063631631, "tps": 12596, "wall": 59159.1} {"step": 11371, "train_loss": 3.5106332302093506, "lr": 0.0003010338999999755, "tps": 12596, "wall": 59167.5} {"step": 11372, "train_loss": 3.4932525157928467, "lr": 0.0003010167927188316, "tps": 12595, "wall": 59176.1} {"step": 11373, "train_loss": 3.4435861110687256, "lr": 0.00030099968451992505, "tps": 12594, "wall": 59184.5} {"step": 11374, "train_loss": 3.426973581314087, "lr": 0.0003009825754034496, "tps": 12593, "wall": 59192.9} {"step": 11375, "train_loss": 3.440007448196411, "lr": 0.00030096546536959924, "tps": 12593, "wall": 59201.3} {"step": 11376, "train_loss": 3.5153727531433105, "lr": 0.00030094835441856773, "tps": 12592, "wall": 59209.8} {"step": 11377, "train_loss": 3.5182852745056152, "lr": 0.00030093124255054876, "tps": 12591, "wall": 59218.2} {"step": 11378, "train_loss": 3.4834718704223633, "lr": 0.0003009141297657364, "tps": 12591, "wall": 59226.7} {"step": 11379, "train_loss": 3.478367805480957, "lr": 0.0003008970160643244, "tps": 12590, "wall": 59235.1} {"step": 11380, "train_loss": 3.503178119659424, "lr": 0.00030087990144650657, "tps": 12589, "wall": 59243.5} {"step": 11381, "train_loss": 3.4975430965423584, "lr": 0.0003008627859124769, "tps": 12589, "wall": 59251.9} {"step": 11382, "train_loss": 3.459721803665161, "lr": 0.00030084566946242923, "tps": 12588, "wall": 59260.4} {"step": 11383, "train_loss": 3.4485111236572266, "lr": 0.0003008285520965574, "tps": 12587, "wall": 59269.1} {"step": 11384, "train_loss": 3.511518955230713, "lr": 0.00030081143381505533, "tps": 12587, "wall": 59277.5} {"step": 11385, "train_loss": 3.4698328971862793, "lr": 0.000300794314618117, "tps": 12586, "wall": 59285.9} {"step": 11386, "train_loss": 3.427553653717041, "lr": 0.0003007771945059363, "tps": 12585, "wall": 59294.4} {"step": 11387, "train_loss": 3.47080135345459, "lr": 0.0003007600734787072, "tps": 12584, "wall": 59302.9} {"step": 11388, "train_loss": 3.4288175106048584, "lr": 0.0003007429515366236, "tps": 12584, "wall": 59311.3} {"step": 11389, "train_loss": 3.5485498905181885, "lr": 0.0003007258286798795, "tps": 12583, "wall": 59319.7} {"step": 11390, "train_loss": 3.4446256160736084, "lr": 0.00030070870490866877, "tps": 12582, "wall": 59328.3} {"step": 11391, "train_loss": 3.4538445472717285, "lr": 0.00030069158022318554, "tps": 12582, "wall": 59336.8} {"step": 11392, "train_loss": 3.480651617050171, "lr": 0.0003006744546236237, "tps": 12581, "wall": 59345.2} {"step": 11393, "train_loss": 3.518306255340576, "lr": 0.00030065732811017723, "tps": 12580, "wall": 59353.7} {"step": 11394, "train_loss": 3.5224368572235107, "lr": 0.0003006402006830402, "tps": 12580, "wall": 59362.0} {"step": 11395, "train_loss": 3.508096694946289, "lr": 0.00030062307234240667, "tps": 12579, "wall": 59370.5} {"step": 11396, "train_loss": 3.491117000579834, "lr": 0.0003006059430884706, "tps": 12578, "wall": 59379.0} {"step": 11397, "train_loss": 3.42474627494812, "lr": 0.000300588812921426, "tps": 12578, "wall": 59387.6} {"step": 11398, "train_loss": 3.4518585205078125, "lr": 0.000300571681841467, "tps": 12577, "wall": 59396.0} {"step": 11399, "train_loss": 3.557588577270508, "lr": 0.0003005545498487876, "tps": 12576, "wall": 59404.5} {"step": 11400, "train_loss": 3.4811530113220215, "lr": 0.00030053741694358195, "tps": 12575, "wall": 59413.0} {"step": 11401, "train_loss": 3.471522331237793, "lr": 0.000300520283126044, "tps": 12575, "wall": 59421.5} {"step": 11402, "train_loss": 3.4477720260620117, "lr": 0.00030050314839636804, "tps": 12574, "wall": 59430.1} {"step": 11403, "train_loss": 3.471254348754883, "lr": 0.00030048601275474803, "tps": 12573, "wall": 59438.4} {"step": 11404, "train_loss": 3.4170918464660645, "lr": 0.000300468876201378, "tps": 12573, "wall": 59447.1} {"step": 11405, "train_loss": 3.491276264190674, "lr": 0.0003004517387364523, "tps": 12572, "wall": 59455.7} {"step": 11406, "train_loss": 3.5397109985351562, "lr": 0.000300434600360165, "tps": 12571, "wall": 59464.0} {"step": 11407, "train_loss": 3.5059399604797363, "lr": 0.0003004174610727101, "tps": 12571, "wall": 59472.4} {"step": 11408, "train_loss": 3.5214362144470215, "lr": 0.0003004003208742818, "tps": 12570, "wall": 59480.8} {"step": 11409, "train_loss": 3.4312541484832764, "lr": 0.00030038317976507445, "tps": 12569, "wall": 59489.3} {"step": 11410, "train_loss": 3.499542236328125, "lr": 0.00030036603774528204, "tps": 12569, "wall": 59497.7} {"step": 11411, "train_loss": 3.469717502593994, "lr": 0.00030034889481509873, "tps": 12568, "wall": 59506.1} {"step": 11412, "train_loss": 3.452754020690918, "lr": 0.00030033175097471886, "tps": 12567, "wall": 59514.7} {"step": 11413, "train_loss": 3.5015041828155518, "lr": 0.00030031460622433656, "tps": 12566, "wall": 59523.2} {"step": 11414, "train_loss": 3.520677328109741, "lr": 0.0003002974605641461, "tps": 12566, "wall": 59531.6} {"step": 11415, "train_loss": 3.451300859451294, "lr": 0.00030028031399434164, "tps": 12565, "wall": 59540.1} {"step": 11416, "train_loss": 3.3938393592834473, "lr": 0.00030026316651511744, "tps": 12564, "wall": 59548.5} {"step": 11417, "train_loss": 3.444408416748047, "lr": 0.00030024601812666775, "tps": 12564, "wall": 59556.9} {"step": 11418, "train_loss": 3.467414140701294, "lr": 0.00030022886882918675, "tps": 12563, "wall": 59565.3} {"step": 11419, "train_loss": 3.4502151012420654, "lr": 0.0003002117186228689, "tps": 12562, "wall": 59573.9} {"step": 11420, "train_loss": 3.4871363639831543, "lr": 0.00030019456750790834, "tps": 12562, "wall": 59582.4} {"step": 11421, "train_loss": 3.563222885131836, "lr": 0.00030017741548449934, "tps": 12561, "wall": 59590.8} {"step": 11422, "train_loss": 3.3475160598754883, "lr": 0.00030016026255283624, "tps": 12560, "wall": 59599.2} {"step": 11423, "train_loss": 3.3417506217956543, "lr": 0.00030014310871311333, "tps": 12560, "wall": 59607.8} {"step": 11424, "train_loss": 3.475414276123047, "lr": 0.00030012595396552495, "tps": 12559, "wall": 59616.2} {"step": 11425, "train_loss": 3.5388104915618896, "lr": 0.00030010879831026543, "tps": 12558, "wall": 59624.6} {"step": 11426, "train_loss": 3.587820053100586, "lr": 0.00030009164174752914, "tps": 12558, "wall": 59633.3} {"step": 11427, "train_loss": 3.585658550262451, "lr": 0.0003000744842775104, "tps": 12557, "wall": 59641.7} {"step": 11428, "train_loss": 3.5190234184265137, "lr": 0.00030005732590040356, "tps": 12556, "wall": 59650.1} {"step": 11429, "train_loss": 3.5548017024993896, "lr": 0.000300040166616403, "tps": 12556, "wall": 59658.5} {"step": 11430, "train_loss": 3.5084238052368164, "lr": 0.00030002300642570313, "tps": 12555, "wall": 59666.9} {"step": 11431, "train_loss": 3.463456153869629, "lr": 0.0003000058453284983, "tps": 12554, "wall": 59675.3} {"step": 11432, "train_loss": 3.52850079536438, "lr": 0.00029998868332498286, "tps": 12554, "wall": 59683.8} {"step": 11433, "train_loss": 3.5041513442993164, "lr": 0.00029997152041535133, "tps": 12553, "wall": 59692.5} {"step": 11434, "train_loss": 3.5755581855773926, "lr": 0.00029995435659979815, "tps": 12552, "wall": 59700.9} {"step": 11435, "train_loss": 3.4360923767089844, "lr": 0.0002999371918785176, "tps": 12551, "wall": 59709.3} {"step": 11436, "train_loss": 3.543689250946045, "lr": 0.0002999200262517043, "tps": 12551, "wall": 59717.8} {"step": 11437, "train_loss": 3.6360158920288086, "lr": 0.0002999028597195526, "tps": 12550, "wall": 59726.3} {"step": 11438, "train_loss": 3.436025619506836, "lr": 0.0002998856922822569, "tps": 12549, "wall": 59734.7} {"step": 11439, "train_loss": 3.5887835025787354, "lr": 0.0002998685239400119, "tps": 12549, "wall": 59743.1} {"step": 11440, "train_loss": 3.58103084564209, "lr": 0.00029985135469301185, "tps": 12548, "wall": 59751.8} {"step": 11441, "train_loss": 3.3913650512695312, "lr": 0.0002998341845414513, "tps": 12547, "wall": 59760.3} {"step": 11442, "train_loss": 3.4930953979492188, "lr": 0.00029981701348552484, "tps": 12547, "wall": 59768.7} {"step": 11443, "train_loss": 3.4995036125183105, "lr": 0.00029979984152542693, "tps": 12546, "wall": 59777.1} {"step": 11444, "train_loss": 3.503756046295166, "lr": 0.0002997826686613521, "tps": 12545, "wall": 59785.6} {"step": 11445, "train_loss": 3.5405490398406982, "lr": 0.00029976549489349485, "tps": 12545, "wall": 59794.1} {"step": 11446, "train_loss": 3.6133997440338135, "lr": 0.0002997483202220498, "tps": 12544, "wall": 59802.6} {"step": 11447, "train_loss": 3.5628910064697266, "lr": 0.00029973114464721144, "tps": 12543, "wall": 59811.1} {"step": 11448, "train_loss": 3.505793333053589, "lr": 0.00029971396816917434, "tps": 12543, "wall": 59819.7} {"step": 11449, "train_loss": 3.501770496368408, "lr": 0.0002996967907881331, "tps": 12542, "wall": 59828.1} {"step": 11450, "train_loss": 3.516589641571045, "lr": 0.0002996796125042824, "tps": 12541, "wall": 59836.6} {"step": 11451, "train_loss": 3.51348876953125, "lr": 0.00029966243331781665, "tps": 12541, "wall": 59845.0} {"step": 11452, "train_loss": 3.4820713996887207, "lr": 0.0002996452532289306, "tps": 12540, "wall": 59853.5} {"step": 11453, "train_loss": 3.3797783851623535, "lr": 0.0002996280722378187, "tps": 12539, "wall": 59862.0} {"step": 11454, "train_loss": 3.3802642822265625, "lr": 0.0002996108903446758, "tps": 12538, "wall": 59870.6} {"step": 11455, "train_loss": 3.3936305046081543, "lr": 0.0002995937075496964, "tps": 12538, "wall": 59879.1} {"step": 11456, "train_loss": 3.4511585235595703, "lr": 0.00029957652385307514, "tps": 12537, "wall": 59887.6} {"step": 11457, "train_loss": 3.3369317054748535, "lr": 0.00029955933925500676, "tps": 12536, "wall": 59895.9} {"step": 11458, "train_loss": 3.371293067932129, "lr": 0.00029954215375568584, "tps": 12536, "wall": 59904.3} {"step": 11459, "train_loss": 3.414128065109253, "lr": 0.00029952496735530715, "tps": 12535, "wall": 59912.7} {"step": 11460, "train_loss": 3.444735288619995, "lr": 0.0002995077800540653, "tps": 12534, "wall": 59921.2} {"step": 11461, "train_loss": 3.5708770751953125, "lr": 0.00029949059185215503, "tps": 12534, "wall": 59929.8} {"step": 11462, "train_loss": 3.5331876277923584, "lr": 0.000299473402749771, "tps": 12533, "wall": 59938.2} {"step": 11463, "train_loss": 3.549391269683838, "lr": 0.000299456212747108, "tps": 12532, "wall": 59946.6} {"step": 11464, "train_loss": 3.512355089187622, "lr": 0.0002994390218443607, "tps": 12532, "wall": 59955.0} {"step": 11465, "train_loss": 3.5129809379577637, "lr": 0.00029942183004172385, "tps": 12531, "wall": 59963.5} {"step": 11466, "train_loss": 3.405313014984131, "lr": 0.0002994046373393922, "tps": 12530, "wall": 59971.9} {"step": 11467, "train_loss": 3.5050840377807617, "lr": 0.0002993874437375606, "tps": 12530, "wall": 59980.2} {"step": 11468, "train_loss": 3.4623162746429443, "lr": 0.0002993702492364237, "tps": 12529, "wall": 59988.8} {"step": 11469, "train_loss": 3.443490982055664, "lr": 0.00029935305383617627, "tps": 12528, "wall": 59997.2} {"step": 11470, "train_loss": 3.5728063583374023, "lr": 0.0002993358575370132, "tps": 12528, "wall": 60005.8} {"step": 11471, "train_loss": 3.4709479808807373, "lr": 0.00029931866033912927, "tps": 12527, "wall": 60014.3} {"step": 11472, "train_loss": 3.5793070793151855, "lr": 0.0002993014622427193, "tps": 12526, "wall": 60022.8} {"step": 11473, "train_loss": 3.4319546222686768, "lr": 0.00029928426324797797, "tps": 12526, "wall": 60031.2} {"step": 11474, "train_loss": 3.446117877960205, "lr": 0.0002992670633551003, "tps": 12525, "wall": 60039.7} {"step": 11475, "train_loss": 3.453700542449951, "lr": 0.000299249862564281, "tps": 12524, "wall": 60048.4} {"step": 11476, "train_loss": 3.585270881652832, "lr": 0.0002992326608757149, "tps": 12524, "wall": 60056.7} {"step": 11477, "train_loss": 3.585047483444214, "lr": 0.0002992154582895971, "tps": 12523, "wall": 60065.2} {"step": 11478, "train_loss": 3.461505889892578, "lr": 0.0002991982548061222, "tps": 12522, "wall": 60073.6} {"step": 11479, "train_loss": 3.386380434036255, "lr": 0.00029918105042548517, "tps": 12522, "wall": 60082.1} {"step": 11480, "train_loss": 3.4914469718933105, "lr": 0.00029916384514788095, "tps": 12521, "wall": 60090.6} {"step": 11481, "train_loss": 3.492976665496826, "lr": 0.00029914663897350445, "tps": 12520, "wall": 60099.0} {"step": 11482, "train_loss": 3.4834604263305664, "lr": 0.0002991294319025505, "tps": 12520, "wall": 60107.7} {"step": 11483, "train_loss": 3.3804614543914795, "lr": 0.00029911222393521405, "tps": 12519, "wall": 60116.2} {"step": 11484, "train_loss": 3.4149692058563232, "lr": 0.0002990950150716901, "tps": 12518, "wall": 60124.7} {"step": 11485, "train_loss": 3.4187428951263428, "lr": 0.00029907780531217347, "tps": 12517, "wall": 60133.2} {"step": 11486, "train_loss": 3.397002696990967, "lr": 0.00029906059465685915, "tps": 12517, "wall": 60141.7} {"step": 11487, "train_loss": 3.5348801612854004, "lr": 0.00029904338310594224, "tps": 12516, "wall": 60150.2} {"step": 11488, "train_loss": 3.4974868297576904, "lr": 0.0002990261706596176, "tps": 12515, "wall": 60158.7} {"step": 11489, "train_loss": 3.405122756958008, "lr": 0.00029900895731808014, "tps": 12515, "wall": 60167.3} {"step": 11490, "train_loss": 3.529067277908325, "lr": 0.00029899174308152505, "tps": 12514, "wall": 60175.8} {"step": 11491, "train_loss": 3.5199666023254395, "lr": 0.00029897452795014717, "tps": 12513, "wall": 60184.2} {"step": 11492, "train_loss": 3.513949394226074, "lr": 0.0002989573119241415, "tps": 12513, "wall": 60192.6} {"step": 11493, "train_loss": 3.527219772338867, "lr": 0.00029894009500370324, "tps": 12512, "wall": 60201.1} {"step": 11494, "train_loss": 3.5119071006774902, "lr": 0.0002989228771890273, "tps": 12511, "wall": 60209.6} {"step": 11495, "train_loss": 3.4470343589782715, "lr": 0.0002989056584803086, "tps": 12511, "wall": 60218.0} {"step": 11496, "train_loss": 3.497023344039917, "lr": 0.00029888843887774245, "tps": 12510, "wall": 60226.4} {"step": 11497, "train_loss": 3.4204611778259277, "lr": 0.0002988712183815237, "tps": 12509, "wall": 60234.9} {"step": 11498, "train_loss": 3.460965156555176, "lr": 0.0002988539969918477, "tps": 12509, "wall": 60243.4} {"step": 11499, "train_loss": 3.4253599643707275, "lr": 0.00029883677470890924, "tps": 12508, "wall": 60251.9} {"step": 11500, "train_loss": 3.4943628311157227, "lr": 0.0002988195515329036, "tps": 12507, "wall": 60260.3} {"step": 11501, "train_loss": 3.5361034870147705, "lr": 0.0002988023274640257, "tps": 12507, "wall": 60268.8} {"step": 11502, "train_loss": 3.4347825050354004, "lr": 0.00029878510250247085, "tps": 12506, "wall": 60277.2} {"step": 11503, "train_loss": 3.5366055965423584, "lr": 0.0002987678766484341, "tps": 12505, "wall": 60285.7} {"step": 11504, "train_loss": 3.4868271350860596, "lr": 0.0002987506499021105, "tps": 12505, "wall": 60294.3} {"step": 11505, "train_loss": 3.5060582160949707, "lr": 0.0002987334222636954, "tps": 12504, "wall": 60302.9} {"step": 11506, "train_loss": 3.361543655395508, "lr": 0.00029871619373338375, "tps": 12503, "wall": 60311.2} {"step": 11507, "train_loss": 3.438405990600586, "lr": 0.0002986989643113708, "tps": 12503, "wall": 60319.6} {"step": 11508, "train_loss": 3.4785852432250977, "lr": 0.0002986817339978517, "tps": 12502, "wall": 60328.0} {"step": 11509, "train_loss": 3.510611057281494, "lr": 0.0002986645027930218, "tps": 12501, "wall": 60336.5} {"step": 11510, "train_loss": 3.4714229106903076, "lr": 0.00029864727069707606, "tps": 12501, "wall": 60344.9} {"step": 11511, "train_loss": 3.4360334873199463, "lr": 0.0002986300377102097, "tps": 12500, "wall": 60353.5} {"step": 11512, "train_loss": 3.420215129852295, "lr": 0.00029861280383261816, "tps": 12499, "wall": 60361.9} {"step": 11513, "train_loss": 3.4584951400756836, "lr": 0.00029859556906449645, "tps": 12499, "wall": 60370.3} {"step": 11514, "train_loss": 3.4172310829162598, "lr": 0.0002985783334060399, "tps": 12498, "wall": 60378.8} {"step": 11515, "train_loss": 3.5443291664123535, "lr": 0.0002985610968574438, "tps": 12497, "wall": 60387.3} {"step": 11516, "train_loss": 3.577624797821045, "lr": 0.00029854385941890325, "tps": 12497, "wall": 60395.8} {"step": 11517, "train_loss": 3.454165458679199, "lr": 0.00029852662109061364, "tps": 12496, "wall": 60404.2} {"step": 11518, "train_loss": 3.4991722106933594, "lr": 0.00029850938187277025, "tps": 12495, "wall": 60412.8} {"step": 11519, "train_loss": 3.531731128692627, "lr": 0.0002984921417655683, "tps": 12495, "wall": 60421.2} {"step": 11520, "train_loss": 3.298943519592285, "lr": 0.0002984749007692031, "tps": 12494, "wall": 60429.7} {"step": 11521, "train_loss": 3.467174530029297, "lr": 0.00029845765888387, "tps": 12493, "wall": 60438.0} {"step": 11522, "train_loss": 3.528285503387451, "lr": 0.00029844041610976434, "tps": 12493, "wall": 60446.5} {"step": 11523, "train_loss": 3.4054315090179443, "lr": 0.0002984231724470814, "tps": 12492, "wall": 60455.1} {"step": 11524, "train_loss": 3.3734235763549805, "lr": 0.0002984059278960165, "tps": 12491, "wall": 60463.6} {"step": 11525, "train_loss": 3.5081729888916016, "lr": 0.000298388682456765, "tps": 12491, "wall": 60472.2} {"step": 11526, "train_loss": 3.5154271125793457, "lr": 0.00029837143612952217, "tps": 12490, "wall": 60480.6} {"step": 11527, "train_loss": 3.499479293823242, "lr": 0.0002983541889144836, "tps": 12489, "wall": 60489.1} {"step": 11528, "train_loss": 3.4477908611297607, "lr": 0.00029833694081184446, "tps": 12489, "wall": 60497.6} {"step": 11529, "train_loss": 3.5144643783569336, "lr": 0.00029831969182180033, "tps": 12488, "wall": 60506.0} {"step": 11530, "train_loss": 3.4649813175201416, "lr": 0.00029830244194454635, "tps": 12487, "wall": 60514.5} {"step": 11531, "train_loss": 3.500314712524414, "lr": 0.0002982851911802782, "tps": 12487, "wall": 60523.1} {"step": 11532, "train_loss": 3.5280652046203613, "lr": 0.0002982679395291911, "tps": 12486, "wall": 60531.7} {"step": 11533, "train_loss": 3.4585704803466797, "lr": 0.00029825068699148053, "tps": 12485, "wall": 60540.2} {"step": 11534, "train_loss": 3.5446248054504395, "lr": 0.000298233433567342, "tps": 12485, "wall": 60548.8} {"step": 11535, "train_loss": 3.3665263652801514, "lr": 0.00029821617925697083, "tps": 12484, "wall": 60557.2} {"step": 11536, "train_loss": 3.4233932495117188, "lr": 0.0002981989240605626, "tps": 12483, "wall": 60565.7} {"step": 11537, "train_loss": 3.499478816986084, "lr": 0.00029818166797831276, "tps": 12483, "wall": 60574.1} {"step": 11538, "train_loss": 3.4221115112304688, "lr": 0.00029816441101041663, "tps": 12482, "wall": 60582.6} {"step": 11539, "train_loss": 3.4162168502807617, "lr": 0.00029814715315707, "tps": 12481, "wall": 60591.3} {"step": 11540, "train_loss": 3.420900583267212, "lr": 0.0002981298944184681, "tps": 12481, "wall": 60599.8} {"step": 11541, "train_loss": 3.416163206100464, "lr": 0.00029811263479480646, "tps": 12480, "wall": 60608.4} {"step": 11542, "train_loss": 3.4373385906219482, "lr": 0.0002980953742862808, "tps": 12479, "wall": 60616.8} {"step": 11543, "train_loss": 3.5301904678344727, "lr": 0.00029807811289308644, "tps": 12479, "wall": 60625.2} {"step": 11544, "train_loss": 3.4209322929382324, "lr": 0.00029806085061541903, "tps": 12478, "wall": 60634.0} {"step": 11545, "train_loss": 3.4200210571289062, "lr": 0.000298043587453474, "tps": 12477, "wall": 60642.5} {"step": 11546, "train_loss": 3.5444226264953613, "lr": 0.0002980263234074471, "tps": 12477, "wall": 60651.1} {"step": 11547, "train_loss": 3.4876112937927246, "lr": 0.00029800905847753375, "tps": 12476, "wall": 60659.6} {"step": 11548, "train_loss": 3.418665885925293, "lr": 0.0002979917926639295, "tps": 12475, "wall": 60668.1} {"step": 11549, "train_loss": 3.4627020359039307, "lr": 0.0002979745259668301, "tps": 12475, "wall": 60676.6} {"step": 11550, "train_loss": 3.4000837802886963, "lr": 0.000297957258386431, "tps": 12474, "wall": 60685.0} {"step": 11551, "train_loss": 3.5630600452423096, "lr": 0.00029793998992292786, "tps": 12473, "wall": 60693.4} {"step": 11552, "train_loss": 3.4486494064331055, "lr": 0.0002979227205765163, "tps": 12473, "wall": 60701.9} {"step": 11553, "train_loss": 3.530414342880249, "lr": 0.0002979054503473919, "tps": 12472, "wall": 60710.5} {"step": 11554, "train_loss": 3.476588487625122, "lr": 0.00029788817923575043, "tps": 12471, "wall": 60719.0} {"step": 11555, "train_loss": 3.377230644226074, "lr": 0.00029787090724178744, "tps": 12471, "wall": 60727.6} {"step": 11556, "train_loss": 3.403453826904297, "lr": 0.0002978536343656986, "tps": 12470, "wall": 60736.1} {"step": 11557, "train_loss": 3.400531768798828, "lr": 0.0002978363606076795, "tps": 12469, "wall": 60744.6} {"step": 11558, "train_loss": 3.434656858444214, "lr": 0.000297819085967926, "tps": 12469, "wall": 60752.9} {"step": 11559, "train_loss": 3.4272170066833496, "lr": 0.00029780181044663357, "tps": 12468, "wall": 60761.4} {"step": 11560, "train_loss": 3.4771275520324707, "lr": 0.0002977845340439981, "tps": 12467, "wall": 60769.9} {"step": 11561, "train_loss": 3.3763303756713867, "lr": 0.00029776725676021525, "tps": 12467, "wall": 60778.3} {"step": 11562, "train_loss": 3.4796085357666016, "lr": 0.0002977499785954806, "tps": 12466, "wall": 60786.7} {"step": 11563, "train_loss": 3.4398062229156494, "lr": 0.0002977326995499901, "tps": 12465, "wall": 60795.1} {"step": 11564, "train_loss": 3.4241340160369873, "lr": 0.0002977154196239393, "tps": 12465, "wall": 60803.7} {"step": 11565, "train_loss": 3.494056224822998, "lr": 0.00029769813881752404, "tps": 12464, "wall": 60812.3} {"step": 11566, "train_loss": 3.453399181365967, "lr": 0.0002976808571309401, "tps": 12463, "wall": 60820.7} {"step": 11567, "train_loss": 3.284923553466797, "lr": 0.00029766357456438314, "tps": 12463, "wall": 60829.3} {"step": 11568, "train_loss": 3.4833006858825684, "lr": 0.00029764629111804904, "tps": 12462, "wall": 60837.8} {"step": 11569, "train_loss": 3.5027236938476562, "lr": 0.0002976290067921335, "tps": 12461, "wall": 60846.2} {"step": 11570, "train_loss": 3.476595878601074, "lr": 0.00029761172158683253, "tps": 12461, "wall": 60854.6} {"step": 11571, "train_loss": 3.5050177574157715, "lr": 0.00029759443550234164, "tps": 12460, "wall": 60863.0} {"step": 11572, "train_loss": 3.3813562393188477, "lr": 0.00029757714853885677, "tps": 12459, "wall": 60871.4} {"step": 11573, "train_loss": 3.369825839996338, "lr": 0.00029755986069657383, "tps": 12459, "wall": 60879.9} {"step": 11574, "train_loss": 3.4403574466705322, "lr": 0.0002975425719756886, "tps": 12458, "wall": 60888.5} {"step": 11575, "train_loss": 3.3882718086242676, "lr": 0.0002975252823763969, "tps": 12457, "wall": 60896.9} {"step": 11576, "train_loss": 3.4726438522338867, "lr": 0.0002975079918988946, "tps": 12457, "wall": 60905.3} {"step": 11577, "train_loss": 3.4871973991394043, "lr": 0.00029749070054337757, "tps": 12456, "wall": 60913.7} {"step": 11578, "train_loss": 3.508293628692627, "lr": 0.00029747340831004173, "tps": 12455, "wall": 60922.1} {"step": 11579, "train_loss": 3.436174154281616, "lr": 0.00029745611519908295, "tps": 12455, "wall": 60930.8} {"step": 11580, "train_loss": 3.494997978210449, "lr": 0.000297438821210697, "tps": 12454, "wall": 60939.3} {"step": 11581, "train_loss": 3.511610507965088, "lr": 0.00029742152634507996, "tps": 12453, "wall": 60947.8} {"step": 11582, "train_loss": 3.5226337909698486, "lr": 0.0002974042306024276, "tps": 12453, "wall": 60956.3} {"step": 11583, "train_loss": 3.4623584747314453, "lr": 0.00029738693398293604, "tps": 12452, "wall": 60964.7} {"step": 11584, "train_loss": 3.4270131587982178, "lr": 0.0002973696364868011, "tps": 12451, "wall": 60973.2} {"step": 11585, "train_loss": 3.3644378185272217, "lr": 0.0002973523381142187, "tps": 12451, "wall": 60981.6} {"step": 11586, "train_loss": 3.465885877609253, "lr": 0.00029733503886538484, "tps": 12450, "wall": 60990.0} {"step": 11587, "train_loss": 3.362630605697632, "lr": 0.0002973177387404955, "tps": 12450, "wall": 60998.5} {"step": 11588, "train_loss": 3.5141217708587646, "lr": 0.00029730043773974654, "tps": 12449, "wall": 61007.0} {"step": 11589, "train_loss": 3.393918991088867, "lr": 0.0002972831358633341, "tps": 12448, "wall": 61015.5} {"step": 11590, "train_loss": 3.461014747619629, "lr": 0.0002972658331114541, "tps": 12448, "wall": 61023.9} {"step": 11591, "train_loss": 3.5339536666870117, "lr": 0.0002972485294843026, "tps": 12447, "wall": 61032.3} {"step": 11592, "train_loss": 3.4094955921173096, "lr": 0.0002972312249820755, "tps": 12446, "wall": 61040.8} {"step": 11593, "train_loss": 3.429165840148926, "lr": 0.000297213919604969, "tps": 12446, "wall": 61049.2} {"step": 11594, "train_loss": 3.6176459789276123, "lr": 0.000297196613353179, "tps": 12445, "wall": 61057.7} {"step": 11595, "train_loss": 3.4087629318237305, "lr": 0.0002971793062269016, "tps": 12444, "wall": 61066.1} {"step": 11596, "train_loss": 3.4609575271606445, "lr": 0.0002971619982263328, "tps": 12444, "wall": 61074.7} {"step": 11597, "train_loss": 3.4561362266540527, "lr": 0.0002971446893516688, "tps": 12443, "wall": 61083.2} {"step": 11598, "train_loss": 3.5158135890960693, "lr": 0.0002971273796031055, "tps": 12442, "wall": 61091.9} {"step": 11599, "train_loss": 3.429123878479004, "lr": 0.00029711006898083906, "tps": 12442, "wall": 61100.3} {"step": 11600, "train_loss": 3.5276613235473633, "lr": 0.00029709275748506566, "tps": 12441, "wall": 61108.7} {"step": 11601, "train_loss": 3.5097861289978027, "lr": 0.0002970754451159813, "tps": 12440, "wall": 61117.2} {"step": 11602, "train_loss": 3.418382406234741, "lr": 0.0002970581318737821, "tps": 12440, "wall": 61125.7} {"step": 11603, "train_loss": 3.368305206298828, "lr": 0.0002970408177586642, "tps": 12439, "wall": 61134.2} {"step": 11604, "train_loss": 3.5224647521972656, "lr": 0.0002970235027708239, "tps": 12438, "wall": 61142.6} {"step": 11605, "train_loss": 3.431069850921631, "lr": 0.00029700618691045705, "tps": 12438, "wall": 61151.1} {"step": 11606, "train_loss": 3.389340877532959, "lr": 0.00029698887017775996, "tps": 12437, "wall": 61159.6} {"step": 11607, "train_loss": 3.469996452331543, "lr": 0.0002969715525729288, "tps": 12436, "wall": 61168.0} {"step": 11608, "train_loss": 3.4914586544036865, "lr": 0.00029695423409615976, "tps": 12436, "wall": 61176.4} {"step": 11609, "train_loss": 3.5677003860473633, "lr": 0.0002969369147476489, "tps": 12435, "wall": 61184.8} {"step": 11610, "train_loss": 3.4217441082000732, "lr": 0.0002969195945275926, "tps": 12435, "wall": 61193.2} {"step": 11611, "train_loss": 3.5654850006103516, "lr": 0.0002969022734361869, "tps": 12434, "wall": 61201.6} {"step": 11612, "train_loss": 3.5507731437683105, "lr": 0.00029688495147362816, "tps": 12433, "wall": 61209.9} {"step": 11613, "train_loss": 3.456063747406006, "lr": 0.0002968676286401125, "tps": 12433, "wall": 61218.5} {"step": 11614, "train_loss": 3.4753365516662598, "lr": 0.0002968503049358362, "tps": 12432, "wall": 61226.8} {"step": 11615, "train_loss": 3.553525686264038, "lr": 0.0002968329803609955, "tps": 12431, "wall": 61235.3} {"step": 11616, "train_loss": 3.4503707885742188, "lr": 0.0002968156549157866, "tps": 12431, "wall": 61243.8} {"step": 11617, "train_loss": 3.418701648712158, "lr": 0.0002967983286004058, "tps": 12430, "wall": 61252.3} {"step": 11618, "train_loss": 3.4656028747558594, "lr": 0.0002967810014150494, "tps": 12429, "wall": 61260.8} {"step": 11619, "train_loss": 3.4918699264526367, "lr": 0.0002967636733599137, "tps": 12429, "wall": 61269.1} {"step": 11620, "train_loss": 3.4521656036376953, "lr": 0.00029674634443519485, "tps": 12428, "wall": 61277.5} {"step": 11621, "train_loss": 3.4476115703582764, "lr": 0.0002967290146410894, "tps": 12427, "wall": 61286.2} {"step": 11622, "train_loss": 3.452582359313965, "lr": 0.00029671168397779336, "tps": 12427, "wall": 61294.6} {"step": 11623, "train_loss": 3.3730854988098145, "lr": 0.00029669435244550335, "tps": 12426, "wall": 61303.0} {"step": 11624, "train_loss": 3.5143306255340576, "lr": 0.00029667702004441553, "tps": 12425, "wall": 61311.5} {"step": 11625, "train_loss": 3.416869640350342, "lr": 0.0002966596867747263, "tps": 12425, "wall": 61320.0} {"step": 11626, "train_loss": 3.529694080352783, "lr": 0.00029664235263663193, "tps": 12424, "wall": 61328.4} {"step": 11627, "train_loss": 3.4058234691619873, "lr": 0.00029662501763032885, "tps": 12424, "wall": 61336.7} {"step": 11628, "train_loss": 3.5576658248901367, "lr": 0.00029660768175601346, "tps": 12423, "wall": 61345.1} {"step": 11629, "train_loss": 3.521054744720459, "lr": 0.00029659034501388205, "tps": 12422, "wall": 61353.5} {"step": 11630, "train_loss": 3.465029239654541, "lr": 0.00029657300740413114, "tps": 12422, "wall": 61362.0} {"step": 11631, "train_loss": 3.5042433738708496, "lr": 0.000296555668926957, "tps": 12421, "wall": 61370.4} {"step": 11632, "train_loss": 3.4318714141845703, "lr": 0.0002965383295825562, "tps": 12420, "wall": 61378.9} {"step": 11633, "train_loss": 3.3492729663848877, "lr": 0.00029652098937112494, "tps": 12420, "wall": 61387.3} {"step": 11634, "train_loss": 3.4986572265625, "lr": 0.0002965036482928598, "tps": 12419, "wall": 61395.6} {"step": 11635, "train_loss": 3.4287548065185547, "lr": 0.00029648630634795725, "tps": 12419, "wall": 61403.9} {"step": 11636, "train_loss": 3.528261423110962, "lr": 0.0002964689635366136, "tps": 12418, "wall": 61412.4} {"step": 11637, "train_loss": 3.480253219604492, "lr": 0.00029645161985902553, "tps": 12417, "wall": 61420.6} {"step": 11638, "train_loss": 3.3922231197357178, "lr": 0.00029643427531538924, "tps": 12417, "wall": 61429.1} {"step": 11639, "train_loss": 3.42095685005188, "lr": 0.0002964169299059014, "tps": 12416, "wall": 61437.5} {"step": 11640, "train_loss": 3.4392497539520264, "lr": 0.00029639958363075845, "tps": 12415, "wall": 61445.8} {"step": 11641, "train_loss": 3.4946177005767822, "lr": 0.0002963822364901569, "tps": 12415, "wall": 61454.1} {"step": 11642, "train_loss": 3.4550302028656006, "lr": 0.0002963648884842932, "tps": 12414, "wall": 61462.4} {"step": 11643, "train_loss": 3.4450464248657227, "lr": 0.0002963475396133639, "tps": 12414, "wall": 61470.9} {"step": 11644, "train_loss": 3.4059958457946777, "lr": 0.0002963301898775656, "tps": 12413, "wall": 61479.2} {"step": 11645, "train_loss": 3.505737781524658, "lr": 0.0002963128392770947, "tps": 12412, "wall": 61487.6} {"step": 11646, "train_loss": 3.472674608230591, "lr": 0.00029629548781214785, "tps": 12412, "wall": 61496.0} {"step": 11647, "train_loss": 3.565040349960327, "lr": 0.0002962781354829217, "tps": 12411, "wall": 61504.4} {"step": 11648, "train_loss": 3.427380084991455, "lr": 0.0002962607822896126, "tps": 12410, "wall": 61512.7} {"step": 11649, "train_loss": 3.502195119857788, "lr": 0.0002962434282324172, "tps": 12410, "wall": 61521.2} {"step": 11650, "train_loss": 3.433712959289551, "lr": 0.0002962260733115322, "tps": 12409, "wall": 61529.6} {"step": 11651, "train_loss": 3.520102024078369, "lr": 0.0002962087175271541, "tps": 12409, "wall": 61537.9} {"step": 11652, "train_loss": 3.474181652069092, "lr": 0.00029619136087947947, "tps": 12408, "wall": 61546.3} {"step": 11653, "train_loss": 3.3994970321655273, "lr": 0.00029617400336870507, "tps": 12407, "wall": 61554.7} {"step": 11654, "train_loss": 3.5273237228393555, "lr": 0.0002961566449950274, "tps": 12407, "wall": 61562.9} {"step": 11655, "train_loss": 3.4674394130706787, "lr": 0.00029613928575864315, "tps": 12406, "wall": 61571.3} {"step": 11656, "train_loss": 3.509470224380493, "lr": 0.0002961219256597489, "tps": 12405, "wall": 61579.5} {"step": 11657, "train_loss": 3.4889092445373535, "lr": 0.00029610456469854134, "tps": 12405, "wall": 61587.8} {"step": 11658, "train_loss": 3.348855972290039, "lr": 0.0002960872028752173, "tps": 12404, "wall": 61596.2} {"step": 11659, "train_loss": 3.3907699584960938, "lr": 0.0002960698401899732, "tps": 12404, "wall": 61604.5} {"step": 11660, "train_loss": 3.475996494293213, "lr": 0.00029605247664300576, "tps": 12403, "wall": 61613.0} {"step": 11661, "train_loss": 3.3963561058044434, "lr": 0.0002960351122345119, "tps": 12402, "wall": 61621.2} {"step": 11662, "train_loss": 3.4120216369628906, "lr": 0.0002960177469646881, "tps": 12402, "wall": 61629.5} {"step": 11663, "train_loss": 3.444423198699951, "lr": 0.0002960003808337311, "tps": 12401, "wall": 61637.9} {"step": 11664, "train_loss": 3.4165587425231934, "lr": 0.0002959830138418378, "tps": 12401, "wall": 61646.1} {"step": 11665, "train_loss": 3.595999002456665, "lr": 0.0002959656459892047, "tps": 12400, "wall": 61654.4} {"step": 11666, "train_loss": 3.547147750854492, "lr": 0.0002959482772760287, "tps": 12399, "wall": 61662.7} {"step": 11667, "train_loss": 3.4698596000671387, "lr": 0.00029593090770250655, "tps": 12399, "wall": 61671.1} {"step": 11668, "train_loss": 3.471907138824463, "lr": 0.0002959135372688349, "tps": 12398, "wall": 61679.4} {"step": 11669, "train_loss": 3.4223644733428955, "lr": 0.00029589616597521065, "tps": 12398, "wall": 61687.7} {"step": 11670, "train_loss": 3.427793025970459, "lr": 0.0002958787938218305, "tps": 12397, "wall": 61696.0} {"step": 11671, "train_loss": 3.4413094520568848, "lr": 0.0002958614208088912, "tps": 12396, "wall": 61704.3} {"step": 11672, "train_loss": 3.5480761528015137, "lr": 0.00029584404693658973, "tps": 12396, "wall": 61712.6} {"step": 11673, "train_loss": 3.5068676471710205, "lr": 0.00029582667220512274, "tps": 12395, "wall": 61720.8} {"step": 11674, "train_loss": 3.5006823539733887, "lr": 0.0002958092966146871, "tps": 12395, "wall": 61729.1} {"step": 11675, "train_loss": 3.376556873321533, "lr": 0.0002957919201654797, "tps": 12394, "wall": 61737.3} {"step": 11676, "train_loss": 3.414113998413086, "lr": 0.0002957745428576972, "tps": 12393, "wall": 61745.6} {"step": 11677, "train_loss": 3.527693271636963, "lr": 0.00029575716469153673, "tps": 12393, "wall": 61753.9} {"step": 11678, "train_loss": 3.4102425575256348, "lr": 0.0002957397856671949, "tps": 12392, "wall": 61762.1} {"step": 11679, "train_loss": 3.5802345275878906, "lr": 0.00029572240578486876, "tps": 12392, "wall": 61770.4} {"step": 11680, "train_loss": 3.4869840145111084, "lr": 0.00029570502504475506, "tps": 12391, "wall": 61778.6} {"step": 11681, "train_loss": 3.5772175788879395, "lr": 0.00029568764344705073, "tps": 12390, "wall": 61787.1} {"step": 11682, "train_loss": 3.472707509994507, "lr": 0.0002956702609919527, "tps": 12390, "wall": 61795.4} {"step": 11683, "train_loss": 3.427217483520508, "lr": 0.00029565287767965783, "tps": 12389, "wall": 61803.7} {"step": 11684, "train_loss": 3.4910519123077393, "lr": 0.00029563549351036315, "tps": 12388, "wall": 61812.0} {"step": 11685, "train_loss": 3.464909076690674, "lr": 0.00029561810848426545, "tps": 12388, "wall": 61820.3} {"step": 11686, "train_loss": 3.5007739067077637, "lr": 0.00029560072260156173, "tps": 12387, "wall": 61828.6} {"step": 11687, "train_loss": 3.427624225616455, "lr": 0.0002955833358624489, "tps": 12387, "wall": 61836.8} {"step": 11688, "train_loss": 3.4636008739471436, "lr": 0.00029556594826712397, "tps": 12386, "wall": 61845.1} {"step": 11689, "train_loss": 3.392063617706299, "lr": 0.0002955485598157839, "tps": 12385, "wall": 61853.6} {"step": 11690, "train_loss": 3.577876091003418, "lr": 0.0002955311705086257, "tps": 12385, "wall": 61861.7} {"step": 11691, "train_loss": 3.5085983276367188, "lr": 0.0002955137803458463, "tps": 12384, "wall": 61869.9} {"step": 11692, "train_loss": 3.3298392295837402, "lr": 0.0002954963893276427, "tps": 12384, "wall": 61878.2} {"step": 11693, "train_loss": 3.4881134033203125, "lr": 0.00029547899745421184, "tps": 12383, "wall": 61886.4} {"step": 11694, "train_loss": 3.3935959339141846, "lr": 0.00029546160472575093, "tps": 12383, "wall": 61894.8} {"step": 11695, "train_loss": 3.5498080253601074, "lr": 0.00029544421114245683, "tps": 12382, "wall": 61902.9} {"step": 11696, "train_loss": 3.330202102661133, "lr": 0.0002954268167045266, "tps": 12381, "wall": 61911.4} {"step": 11697, "train_loss": 3.3719537258148193, "lr": 0.00029540942141215734, "tps": 12381, "wall": 61919.6} {"step": 11698, "train_loss": 3.4269914627075195, "lr": 0.000295392025265546, "tps": 12380, "wall": 61927.9} {"step": 11699, "train_loss": 3.562436819076538, "lr": 0.00029537462826488987, "tps": 12380, "wall": 61936.1} {"step": 11700, "train_loss": 3.4343690872192383, "lr": 0.00029535723041038576, "tps": 12379, "wall": 61944.4} {"step": 11701, "train_loss": 3.450314521789551, "lr": 0.0002953398317022309, "tps": 12378, "wall": 61952.6} {"step": 11702, "train_loss": 3.420393466949463, "lr": 0.0002953224321406224, "tps": 12378, "wall": 61960.9} {"step": 11703, "train_loss": 3.452237367630005, "lr": 0.00029530503172575727, "tps": 12377, "wall": 61969.2} {"step": 11704, "train_loss": 3.374678373336792, "lr": 0.0002952876304578326, "tps": 12377, "wall": 61977.5} {"step": 11705, "train_loss": 3.533207416534424, "lr": 0.0002952702283370456, "tps": 12376, "wall": 61985.8} {"step": 11706, "train_loss": 3.537367820739746, "lr": 0.0002952528253635935, "tps": 12375, "wall": 61994.0} {"step": 11707, "train_loss": 3.572061061859131, "lr": 0.00029523542153767323, "tps": 12375, "wall": 62002.4} {"step": 11708, "train_loss": 3.4291515350341797, "lr": 0.00029521801685948205, "tps": 12374, "wall": 62010.6} {"step": 11709, "train_loss": 3.5104362964630127, "lr": 0.00029520061132921714, "tps": 12374, "wall": 62018.9} {"step": 11710, "train_loss": 3.49676775932312, "lr": 0.0002951832049470755, "tps": 12373, "wall": 62027.4} {"step": 11711, "train_loss": 3.5071253776550293, "lr": 0.0002951657977132546, "tps": 12372, "wall": 62035.6} {"step": 11712, "train_loss": 3.4635262489318848, "lr": 0.00029514838962795144, "tps": 12372, "wall": 62043.7} {"step": 11713, "train_loss": 3.524667263031006, "lr": 0.00029513098069136324, "tps": 12371, "wall": 62052.0} {"step": 11714, "train_loss": 3.480490207672119, "lr": 0.00029511357090368723, "tps": 12371, "wall": 62060.2} {"step": 11715, "train_loss": 3.5504932403564453, "lr": 0.0002950961602651206, "tps": 12370, "wall": 62068.4} {"step": 11716, "train_loss": 3.454836368560791, "lr": 0.00029507874877586065, "tps": 12369, "wall": 62076.6} {"step": 11717, "train_loss": 3.4181101322174072, "lr": 0.0002950613364361045, "tps": 12369, "wall": 62084.8} {"step": 11718, "train_loss": 3.5038442611694336, "lr": 0.0002950439232460496, "tps": 12368, "wall": 62093.2} {"step": 11719, "train_loss": 3.4565529823303223, "lr": 0.000295026509205893, "tps": 12368, "wall": 62101.4} {"step": 11720, "train_loss": 3.547429084777832, "lr": 0.000295009094315832, "tps": 12367, "wall": 62109.6} {"step": 11721, "train_loss": 3.526028633117676, "lr": 0.0002949916785760639, "tps": 12367, "wall": 62117.8} {"step": 11722, "train_loss": 3.496135711669922, "lr": 0.0002949742619867861, "tps": 12366, "wall": 62126.1} {"step": 11723, "train_loss": 3.4325318336486816, "lr": 0.0002949568445481958, "tps": 12365, "wall": 62134.5} {"step": 11724, "train_loss": 3.4968981742858887, "lr": 0.00029493942626049026, "tps": 12365, "wall": 62142.8} {"step": 11725, "train_loss": 3.5262088775634766, "lr": 0.0002949220071238669, "tps": 12364, "wall": 62151.2} {"step": 11726, "train_loss": 3.5871164798736572, "lr": 0.00029490458713852293, "tps": 12364, "wall": 62159.5} {"step": 11727, "train_loss": 3.5340611934661865, "lr": 0.0002948871663046558, "tps": 12363, "wall": 62167.8} {"step": 11728, "train_loss": 3.5600385665893555, "lr": 0.0002948697446224627, "tps": 12362, "wall": 62176.1} {"step": 11729, "train_loss": 3.331538677215576, "lr": 0.0002948523220921413, "tps": 12362, "wall": 62184.4} {"step": 11730, "train_loss": 3.4033284187316895, "lr": 0.0002948348987138885, "tps": 12361, "wall": 62192.7} {"step": 11731, "train_loss": 3.544341802597046, "lr": 0.00029481747448790205, "tps": 12361, "wall": 62201.0} {"step": 11732, "train_loss": 3.520059108734131, "lr": 0.0002948000494143791, "tps": 12360, "wall": 62209.4} {"step": 11733, "train_loss": 3.4448630809783936, "lr": 0.0002947826234935173, "tps": 12359, "wall": 62217.8} {"step": 11734, "train_loss": 3.426858425140381, "lr": 0.0002947651967255138, "tps": 12359, "wall": 62225.9} {"step": 11735, "train_loss": 3.536862373352051, "lr": 0.00029474776911056613, "tps": 12358, "wall": 62234.2} {"step": 11736, "train_loss": 3.4864633083343506, "lr": 0.0002947303406488717, "tps": 12358, "wall": 62242.5} {"step": 11737, "train_loss": 3.4727072715759277, "lr": 0.0002947129113406279, "tps": 12357, "wall": 62250.7} {"step": 11738, "train_loss": 3.4615628719329834, "lr": 0.00029469548118603214, "tps": 12356, "wall": 62259.1} {"step": 11739, "train_loss": 3.482813596725464, "lr": 0.000294678050185282, "tps": 12356, "wall": 62267.5} {"step": 11740, "train_loss": 3.5448074340820312, "lr": 0.0002946606183385749, "tps": 12355, "wall": 62275.7} {"step": 11741, "train_loss": 3.413900852203369, "lr": 0.0002946431856461082, "tps": 12355, "wall": 62284.0} {"step": 11742, "train_loss": 3.381911516189575, "lr": 0.0002946257521080795, "tps": 12354, "wall": 62292.3} {"step": 11743, "train_loss": 3.4571571350097656, "lr": 0.00029460831772468626, "tps": 12353, "wall": 62300.5} {"step": 11744, "train_loss": 3.388751983642578, "lr": 0.00029459088249612594, "tps": 12353, "wall": 62308.8} {"step": 11745, "train_loss": 3.365060329437256, "lr": 0.000294573446422596, "tps": 12352, "wall": 62317.0} {"step": 11746, "train_loss": 3.5102269649505615, "lr": 0.0002945560095042941, "tps": 12352, "wall": 62325.4} {"step": 11747, "train_loss": 3.471845865249634, "lr": 0.0002945385717414177, "tps": 12351, "wall": 62333.9} {"step": 11748, "train_loss": 3.5118284225463867, "lr": 0.0002945211331341643, "tps": 12350, "wall": 62342.1} {"step": 11749, "train_loss": 3.5051109790802, "lr": 0.0002945036936827314, "tps": 12350, "wall": 62350.4} {"step": 11750, "train_loss": 3.497486114501953, "lr": 0.00029448625338731677, "tps": 12349, "wall": 62358.7} {"step": 11751, "train_loss": 3.5833539962768555, "lr": 0.00029446881224811776, "tps": 12349, "wall": 62366.8} {"step": 11752, "train_loss": 3.4423232078552246, "lr": 0.000294451370265332, "tps": 12348, "wall": 62374.9} {"step": 11753, "train_loss": 3.4639892578125, "lr": 0.00029443392743915713, "tps": 12348, "wall": 62383.2} {"step": 11754, "train_loss": 3.4373669624328613, "lr": 0.0002944164837697907, "tps": 12347, "wall": 62391.6} {"step": 11755, "train_loss": 3.4998652935028076, "lr": 0.00029439903925743035, "tps": 12346, "wall": 62399.9} {"step": 11756, "train_loss": 3.481107234954834, "lr": 0.0002943815939022736, "tps": 12346, "wall": 62408.0} {"step": 11757, "train_loss": 3.476335287094116, "lr": 0.00029436414770451813, "tps": 12345, "wall": 62416.3} {"step": 11758, "train_loss": 3.544787645339966, "lr": 0.0002943467006643616, "tps": 12345, "wall": 62424.6} {"step": 11759, "train_loss": 3.4458305835723877, "lr": 0.0002943292527820015, "tps": 12344, "wall": 62432.7} {"step": 11760, "train_loss": 3.4710898399353027, "lr": 0.00029431180405763575, "tps": 12343, "wall": 62441.0} {"step": 11761, "train_loss": 3.4280714988708496, "lr": 0.00029429435449146186, "tps": 12343, "wall": 62449.3} {"step": 11762, "train_loss": 3.3887476921081543, "lr": 0.00029427690408367744, "tps": 12342, "wall": 62457.6} {"step": 11763, "train_loss": 3.502366781234741, "lr": 0.00029425945283448026, "tps": 12342, "wall": 62465.8} {"step": 11764, "train_loss": 3.568044424057007, "lr": 0.000294242000744068, "tps": 12341, "wall": 62474.0} {"step": 11765, "train_loss": 3.4489173889160156, "lr": 0.00029422454781263834, "tps": 12341, "wall": 62482.3} {"step": 11766, "train_loss": 3.4546141624450684, "lr": 0.00029420709404038886, "tps": 12340, "wall": 62490.4} {"step": 11767, "train_loss": 3.4801974296569824, "lr": 0.0002941896394275176, "tps": 12339, "wall": 62498.7} {"step": 11768, "train_loss": 3.4661104679107666, "lr": 0.00029417218397422197, "tps": 12339, "wall": 62507.0} {"step": 11769, "train_loss": 3.5042309761047363, "lr": 0.00029415472768069985, "tps": 12338, "wall": 62515.3} {"step": 11770, "train_loss": 3.4334347248077393, "lr": 0.0002941372705471489, "tps": 12338, "wall": 62523.6} {"step": 11771, "train_loss": 3.4129586219787598, "lr": 0.0002941198125737671, "tps": 12337, "wall": 62531.9} {"step": 11772, "train_loss": 3.4492087364196777, "lr": 0.0002941023537607519, "tps": 12336, "wall": 62540.1} {"step": 11773, "train_loss": 3.4174442291259766, "lr": 0.0002940848941083013, "tps": 12336, "wall": 62548.5} {"step": 11774, "train_loss": 3.3833565711975098, "lr": 0.00029406743361661306, "tps": 12335, "wall": 62556.7} {"step": 11775, "train_loss": 3.4458625316619873, "lr": 0.00029404997228588484, "tps": 12335, "wall": 62565.0} {"step": 11776, "train_loss": 3.4029669761657715, "lr": 0.00029403251011631454, "tps": 12334, "wall": 62573.3} {"step": 11777, "train_loss": 3.4609241485595703, "lr": 0.0002940150471081, "tps": 12334, "wall": 62581.6} {"step": 11778, "train_loss": 3.376757860183716, "lr": 0.000293997583261439, "tps": 12333, "wall": 62589.8} {"step": 11779, "train_loss": 3.508697986602783, "lr": 0.0002939801185765293, "tps": 12332, "wall": 62598.0} {"step": 11780, "train_loss": 3.523466110229492, "lr": 0.00029396265305356884, "tps": 12332, "wall": 62606.2} {"step": 11781, "train_loss": 3.504143714904785, "lr": 0.0002939451866927555, "tps": 12331, "wall": 62614.5} {"step": 11782, "train_loss": 3.50329852104187, "lr": 0.000293927719494287, "tps": 12331, "wall": 62622.7} {"step": 11783, "train_loss": 3.53521990776062, "lr": 0.0002939102514583614, "tps": 12330, "wall": 62631.0} {"step": 11784, "train_loss": 3.459528923034668, "lr": 0.00029389278258517643, "tps": 12330, "wall": 62639.2} {"step": 11785, "train_loss": 3.5345232486724854, "lr": 0.00029387531287492993, "tps": 12329, "wall": 62647.6} {"step": 11786, "train_loss": 3.4693186283111572, "lr": 0.00029385784232782, "tps": 12328, "wall": 62655.8} {"step": 11787, "train_loss": 3.4822933673858643, "lr": 0.00029384037094404443, "tps": 12328, "wall": 62664.0} {"step": 11788, "train_loss": 3.479961395263672, "lr": 0.0002938228987238011, "tps": 12327, "wall": 62672.3} {"step": 11789, "train_loss": 3.519198417663574, "lr": 0.000293805425667288, "tps": 12327, "wall": 62680.4} {"step": 11790, "train_loss": 3.5162665843963623, "lr": 0.00029378795177470305, "tps": 12326, "wall": 62688.7} {"step": 11791, "train_loss": 3.4257571697235107, "lr": 0.0002937704770462442, "tps": 12325, "wall": 62696.9} {"step": 11792, "train_loss": 3.360377073287964, "lr": 0.00029375300148210936, "tps": 12325, "wall": 62705.1} {"step": 11793, "train_loss": 3.60591983795166, "lr": 0.00029373552508249657, "tps": 12324, "wall": 62713.4} {"step": 11794, "train_loss": 3.5183229446411133, "lr": 0.00029371804784760375, "tps": 12324, "wall": 62721.7} {"step": 11795, "train_loss": 3.4944188594818115, "lr": 0.00029370056977762887, "tps": 12323, "wall": 62729.8} {"step": 11796, "train_loss": 3.4506897926330566, "lr": 0.00029368309087276996, "tps": 12323, "wall": 62738.1} {"step": 11797, "train_loss": 3.468949556350708, "lr": 0.00029366561113322505, "tps": 12322, "wall": 62746.3} {"step": 11798, "train_loss": 3.467528820037842, "lr": 0.00029364813055919207, "tps": 12321, "wall": 62754.7} {"step": 11799, "train_loss": 3.3643884658813477, "lr": 0.00029363064915086904, "tps": 12321, "wall": 62762.8} {"step": 11800, "train_loss": 3.4988255500793457, "lr": 0.00029361316690845415, "tps": 12320, "wall": 62771.0} {"step": 11801, "train_loss": 3.424268960952759, "lr": 0.0002935956838321452, "tps": 12320, "wall": 62779.3} {"step": 11802, "train_loss": 3.383246898651123, "lr": 0.0002935781999221405, "tps": 12319, "wall": 62787.4} {"step": 11803, "train_loss": 3.499870777130127, "lr": 0.00029356071517863783, "tps": 12319, "wall": 62795.6} {"step": 11804, "train_loss": 3.407386302947998, "lr": 0.0002935432296018355, "tps": 12318, "wall": 62803.9} {"step": 11805, "train_loss": 3.4134867191314697, "lr": 0.00029352574319193144, "tps": 12317, "wall": 62812.2} {"step": 11806, "train_loss": 3.517163038253784, "lr": 0.0002935082559491238, "tps": 12317, "wall": 62820.5} {"step": 11807, "train_loss": 3.528791904449463, "lr": 0.00029349076787361055, "tps": 12316, "wall": 62828.7} {"step": 11808, "train_loss": 3.434988498687744, "lr": 0.0002934732789655901, "tps": 12316, "wall": 62837.1} {"step": 11809, "train_loss": 3.420347213745117, "lr": 0.00029345578922526026, "tps": 12315, "wall": 62845.3} {"step": 11810, "train_loss": 3.3224527835845947, "lr": 0.00029343829865281925, "tps": 12315, "wall": 62853.6} {"step": 11811, "train_loss": 3.3848118782043457, "lr": 0.0002934208072484653, "tps": 12314, "wall": 62861.8} {"step": 11812, "train_loss": 3.456838607788086, "lr": 0.0002934033150123964, "tps": 12313, "wall": 62870.2} {"step": 11813, "train_loss": 3.5117626190185547, "lr": 0.0002933858219448108, "tps": 12313, "wall": 62878.5} {"step": 11814, "train_loss": 3.555168867111206, "lr": 0.00029336832804590664, "tps": 12312, "wall": 62886.7} {"step": 11815, "train_loss": 3.4808499813079834, "lr": 0.00029335083331588207, "tps": 12312, "wall": 62894.9} {"step": 11816, "train_loss": 3.3515021800994873, "lr": 0.0002933333377549353, "tps": 12311, "wall": 62903.0} {"step": 11817, "train_loss": 3.5074379444122314, "lr": 0.0002933158413632646, "tps": 12311, "wall": 62911.2} {"step": 11818, "train_loss": 3.353393077850342, "lr": 0.00029329834414106796, "tps": 12310, "wall": 62919.5} {"step": 11819, "train_loss": 3.459733486175537, "lr": 0.0002932808460885438, "tps": 12309, "wall": 62928.0} {"step": 11820, "train_loss": 3.4029808044433594, "lr": 0.00029326334720589017, "tps": 12309, "wall": 62936.2} {"step": 11821, "train_loss": 3.5735929012298584, "lr": 0.00029324584749330543, "tps": 12308, "wall": 62944.5} {"step": 11822, "train_loss": 3.457645893096924, "lr": 0.0002932283469509877, "tps": 12308, "wall": 62952.8} {"step": 11823, "train_loss": 3.549232244491577, "lr": 0.00029321084557913543, "tps": 12307, "wall": 62961.1} {"step": 11824, "train_loss": 3.4091036319732666, "lr": 0.0002931933433779466, "tps": 12307, "wall": 62969.3} {"step": 11825, "train_loss": 3.568321704864502, "lr": 0.0002931758403476197, "tps": 12306, "wall": 62977.5} {"step": 11826, "train_loss": 3.5201382637023926, "lr": 0.00029315833648835293, "tps": 12305, "wall": 62985.7} {"step": 11827, "train_loss": 3.3770506381988525, "lr": 0.00029314083180034453, "tps": 12305, "wall": 62994.2} {"step": 11828, "train_loss": 3.4822323322296143, "lr": 0.00029312332628379285, "tps": 12304, "wall": 63002.5} {"step": 11829, "train_loss": 3.51900315284729, "lr": 0.0002931058199388961, "tps": 12304, "wall": 63010.7} {"step": 11830, "train_loss": 3.5047109127044678, "lr": 0.00029308831276585276, "tps": 12303, "wall": 63019.0} {"step": 11831, "train_loss": 3.4041495323181152, "lr": 0.00029307080476486107, "tps": 12302, "wall": 63027.3} {"step": 11832, "train_loss": 3.4428248405456543, "lr": 0.0002930532959361193, "tps": 12302, "wall": 63035.7} {"step": 11833, "train_loss": 3.4598474502563477, "lr": 0.00029303578627982584, "tps": 12301, "wall": 63044.0} {"step": 11834, "train_loss": 3.4303388595581055, "lr": 0.00029301827579617906, "tps": 12301, "wall": 63052.3} {"step": 11835, "train_loss": 3.584503173828125, "lr": 0.00029300076448537726, "tps": 12300, "wall": 63060.6} {"step": 11836, "train_loss": 3.396237373352051, "lr": 0.00029298325234761895, "tps": 12300, "wall": 63068.9} {"step": 11837, "train_loss": 3.5362653732299805, "lr": 0.00029296573938310234, "tps": 12299, "wall": 63077.2} {"step": 11838, "train_loss": 3.564222812652588, "lr": 0.0002929482255920258, "tps": 12298, "wall": 63085.4} {"step": 11839, "train_loss": 3.5319628715515137, "lr": 0.00029293071097458796, "tps": 12298, "wall": 63093.6} {"step": 11840, "train_loss": 3.4526147842407227, "lr": 0.000292913195530987, "tps": 12297, "wall": 63101.9} {"step": 11841, "train_loss": 3.505476474761963, "lr": 0.00029289567926142146, "tps": 12297, "wall": 63110.3} {"step": 11842, "train_loss": 3.4630250930786133, "lr": 0.00029287816216608974, "tps": 12296, "wall": 63118.5} {"step": 11843, "train_loss": 3.526449203491211, "lr": 0.00029286064424519017, "tps": 12296, "wall": 63126.8} {"step": 11844, "train_loss": 3.4839980602264404, "lr": 0.0002928431254989213, "tps": 12295, "wall": 63135.0} {"step": 11845, "train_loss": 3.5092527866363525, "lr": 0.00029282560592748167, "tps": 12294, "wall": 63143.3} {"step": 11846, "train_loss": 3.4510293006896973, "lr": 0.00029280808553106956, "tps": 12294, "wall": 63151.5} {"step": 11847, "train_loss": 3.406989574432373, "lr": 0.0002927905643098835, "tps": 12293, "wall": 63159.7} {"step": 11848, "train_loss": 3.442645788192749, "lr": 0.00029277304226412197, "tps": 12293, "wall": 63168.0} {"step": 11849, "train_loss": 3.435727119445801, "lr": 0.00029275551939398356, "tps": 12292, "wall": 63176.3} {"step": 11850, "train_loss": 3.4549155235290527, "lr": 0.00029273799569966665, "tps": 12292, "wall": 63184.6} {"step": 11851, "train_loss": 3.4698214530944824, "lr": 0.00029272047118136975, "tps": 12291, "wall": 63192.8} {"step": 11852, "train_loss": 3.4403891563415527, "lr": 0.0002927029458392915, "tps": 12290, "wall": 63201.1} {"step": 11853, "train_loss": 3.425081968307495, "lr": 0.0002926854196736303, "tps": 12290, "wall": 63209.4} {"step": 11854, "train_loss": 3.3943557739257812, "lr": 0.0002926678926845847, "tps": 12289, "wall": 63217.6} {"step": 11855, "train_loss": 3.483506679534912, "lr": 0.0002926503648723533, "tps": 12289, "wall": 63225.9} {"step": 11856, "train_loss": 3.452036142349243, "lr": 0.0002926328362371347, "tps": 12288, "wall": 63234.4} {"step": 11857, "train_loss": 3.490858316421509, "lr": 0.00029261530677912736, "tps": 12288, "wall": 63242.6} {"step": 11858, "train_loss": 3.3913042545318604, "lr": 0.0002925977764985299, "tps": 12287, "wall": 63250.9} {"step": 11859, "train_loss": 3.370061159133911, "lr": 0.0002925802453955409, "tps": 12286, "wall": 63259.1} {"step": 11860, "train_loss": 3.517423152923584, "lr": 0.0002925627134703589, "tps": 12286, "wall": 63267.4} {"step": 11861, "train_loss": 3.498405933380127, "lr": 0.00029254518072318263, "tps": 12285, "wall": 63275.6} {"step": 11862, "train_loss": 3.5947771072387695, "lr": 0.0002925276471542106, "tps": 12285, "wall": 63283.7} {"step": 11863, "train_loss": 3.497925043106079, "lr": 0.00029251011276364147, "tps": 12284, "wall": 63292.0} {"step": 11864, "train_loss": 3.5219075679779053, "lr": 0.0002924925775516738, "tps": 12284, "wall": 63300.3} {"step": 11865, "train_loss": 3.475106954574585, "lr": 0.00029247504151850635, "tps": 12283, "wall": 63308.4} {"step": 11866, "train_loss": 3.4357688426971436, "lr": 0.0002924575046643377, "tps": 12282, "wall": 63316.6} {"step": 11867, "train_loss": 3.428299903869629, "lr": 0.00029243996698936653, "tps": 12282, "wall": 63325.0} {"step": 11868, "train_loss": 3.4956250190734863, "lr": 0.0002924224284937914, "tps": 12281, "wall": 63333.2} {"step": 11869, "train_loss": 3.5658318996429443, "lr": 0.00029240488917781126, "tps": 12281, "wall": 63341.5} {"step": 11870, "train_loss": 3.478429079055786, "lr": 0.0002923873490416245, "tps": 12280, "wall": 63349.9} {"step": 11871, "train_loss": 3.426658868789673, "lr": 0.00029236980808542996, "tps": 12280, "wall": 63358.2} {"step": 11872, "train_loss": 3.41848087310791, "lr": 0.00029235226630942634, "tps": 12279, "wall": 63366.4} {"step": 11873, "train_loss": 3.5796093940734863, "lr": 0.0002923347237138123, "tps": 12278, "wall": 63374.6} {"step": 11874, "train_loss": 3.304396390914917, "lr": 0.0002923171802987866, "tps": 12278, "wall": 63382.8} {"step": 11875, "train_loss": 3.4312853813171387, "lr": 0.0002922996360645479, "tps": 12277, "wall": 63391.1} {"step": 11876, "train_loss": 3.505200147628784, "lr": 0.00029228209101129517, "tps": 12277, "wall": 63399.2} {"step": 11877, "train_loss": 3.5279605388641357, "lr": 0.0002922645451392268, "tps": 12276, "wall": 63407.6} {"step": 11878, "train_loss": 3.488609790802002, "lr": 0.00029224699844854196, "tps": 12276, "wall": 63415.9} {"step": 11879, "train_loss": 3.3966283798217773, "lr": 0.00029222945093943913, "tps": 12275, "wall": 63424.0} {"step": 11880, "train_loss": 3.474086284637451, "lr": 0.00029221190261211717, "tps": 12275, "wall": 63432.2} {"step": 11881, "train_loss": 3.545250654220581, "lr": 0.0002921943534667748, "tps": 12274, "wall": 63440.5} {"step": 11882, "train_loss": 3.4645745754241943, "lr": 0.0002921768035036109, "tps": 12273, "wall": 63448.7} {"step": 11883, "train_loss": 3.4762260913848877, "lr": 0.00029215925272282444, "tps": 12273, "wall": 63456.9} {"step": 11884, "train_loss": 3.5480730533599854, "lr": 0.00029214170112461387, "tps": 12272, "wall": 63465.2} {"step": 11885, "train_loss": 3.4758787155151367, "lr": 0.00029212414870917827, "tps": 12272, "wall": 63473.5} {"step": 11886, "train_loss": 3.48638916015625, "lr": 0.0002921065954767165, "tps": 12271, "wall": 63481.9} {"step": 11887, "train_loss": 3.438645839691162, "lr": 0.0002920890414274272, "tps": 12271, "wall": 63490.1} {"step": 11888, "train_loss": 3.4827699661254883, "lr": 0.0002920714865615093, "tps": 12270, "wall": 63498.3} {"step": 11889, "train_loss": 3.5457663536071777, "lr": 0.00029205393087916186, "tps": 12269, "wall": 63506.5} {"step": 11890, "train_loss": 3.598405361175537, "lr": 0.00029203637438058347, "tps": 12269, "wall": 63514.8} {"step": 11891, "train_loss": 3.4700567722320557, "lr": 0.00029201881706597316, "tps": 12268, "wall": 63523.0} {"step": 11892, "train_loss": 3.4512131214141846, "lr": 0.0002920012589355298, "tps": 12268, "wall": 63531.3} {"step": 11893, "train_loss": 3.5017142295837402, "lr": 0.00029198369998945236, "tps": 12267, "wall": 63539.6} {"step": 11894, "train_loss": 3.532111167907715, "lr": 0.0002919661402279395, "tps": 12267, "wall": 63547.8} {"step": 11895, "train_loss": 3.4556808471679688, "lr": 0.0002919485796511904, "tps": 12266, "wall": 63556.0} {"step": 11896, "train_loss": 3.4493374824523926, "lr": 0.00029193101825940397, "tps": 12266, "wall": 63564.2} {"step": 11897, "train_loss": 3.3892953395843506, "lr": 0.000291913456052779, "tps": 12265, "wall": 63572.5} {"step": 11898, "train_loss": 3.43411922454834, "lr": 0.00029189589303151454, "tps": 12264, "wall": 63580.7} {"step": 11899, "train_loss": 3.495487689971924, "lr": 0.00029187832919580953, "tps": 12264, "wall": 63589.1} {"step": 11900, "train_loss": 3.4862828254699707, "lr": 0.0002918607645458629, "tps": 12263, "wall": 63597.3} {"step": 11901, "train_loss": 3.476957082748413, "lr": 0.00029184319908187356, "tps": 12263, "wall": 63605.5} {"step": 11902, "train_loss": 3.385103940963745, "lr": 0.0002918256328040406, "tps": 12262, "wall": 63613.8} {"step": 11903, "train_loss": 3.5386977195739746, "lr": 0.00029180806571256306, "tps": 12262, "wall": 63621.9} {"step": 11904, "train_loss": 3.540678024291992, "lr": 0.00029179049780763983, "tps": 12261, "wall": 63630.1} {"step": 11905, "train_loss": 3.433932065963745, "lr": 0.00029177292908946995, "tps": 12261, "wall": 63638.3} {"step": 11906, "train_loss": 3.440345287322998, "lr": 0.00029175535955825246, "tps": 12260, "wall": 63646.6} {"step": 11907, "train_loss": 3.508953094482422, "lr": 0.0002917377892141864, "tps": 12259, "wall": 63655.1} {"step": 11908, "train_loss": 3.434216022491455, "lr": 0.0002917202180574707, "tps": 12259, "wall": 63663.4} {"step": 11909, "train_loss": 3.505289077758789, "lr": 0.0002917026460883046, "tps": 12258, "wall": 63671.6} {"step": 11910, "train_loss": 3.4601902961730957, "lr": 0.000291685073306887, "tps": 12258, "wall": 63679.9} {"step": 11911, "train_loss": 3.5221939086914062, "lr": 0.000291667499713417, "tps": 12257, "wall": 63688.0} {"step": 11912, "train_loss": 3.4773120880126953, "lr": 0.00029164992530809365, "tps": 12257, "wall": 63696.3} {"step": 11913, "train_loss": 3.487793207168579, "lr": 0.00029163235009111615, "tps": 12256, "wall": 63704.6} {"step": 11914, "train_loss": 3.4042649269104004, "lr": 0.0002916147740626834, "tps": 12255, "wall": 63712.9} {"step": 11915, "train_loss": 3.532402276992798, "lr": 0.0002915971972229947, "tps": 12255, "wall": 63721.2} {"step": 11916, "train_loss": 3.4577269554138184, "lr": 0.0002915796195722491, "tps": 12254, "wall": 63729.4} {"step": 11917, "train_loss": 3.513141632080078, "lr": 0.0002915620411106457, "tps": 12254, "wall": 63737.7} {"step": 11918, "train_loss": 3.5244178771972656, "lr": 0.0002915444618383835, "tps": 12253, "wall": 63745.9} {"step": 11919, "train_loss": 3.4851465225219727, "lr": 0.0002915268817556619, "tps": 12253, "wall": 63754.1} {"step": 11920, "train_loss": 3.450770854949951, "lr": 0.0002915093008626799, "tps": 12252, "wall": 63762.4} {"step": 11921, "train_loss": 3.4375758171081543, "lr": 0.0002914917191596366, "tps": 12252, "wall": 63770.7} {"step": 11922, "train_loss": 3.543034076690674, "lr": 0.00029147413664673126, "tps": 12251, "wall": 63778.9} {"step": 11923, "train_loss": 3.5462775230407715, "lr": 0.00029145655332416307, "tps": 12250, "wall": 63787.1} {"step": 11924, "train_loss": 3.460000514984131, "lr": 0.0002914389691921312, "tps": 12250, "wall": 63795.3} {"step": 11925, "train_loss": 3.40606427192688, "lr": 0.0002914213842508347, "tps": 12249, "wall": 63803.5} {"step": 11926, "train_loss": 3.454251289367676, "lr": 0.00029140379850047297, "tps": 12249, "wall": 63811.8} {"step": 11927, "train_loss": 3.5474209785461426, "lr": 0.0002913862119412452, "tps": 12248, "wall": 63820.0} {"step": 11928, "train_loss": 3.5167455673217773, "lr": 0.0002913686245733505, "tps": 12248, "wall": 63828.4} {"step": 11929, "train_loss": 3.4611990451812744, "lr": 0.00029135103639698815, "tps": 12247, "wall": 63836.6} {"step": 11930, "train_loss": 3.5057625770568848, "lr": 0.00029133344741235744, "tps": 12247, "wall": 63844.8} {"step": 11931, "train_loss": 3.4975295066833496, "lr": 0.0002913158576196576, "tps": 12246, "wall": 63853.1} {"step": 11932, "train_loss": 3.3535549640655518, "lr": 0.0002912982670190878, "tps": 12245, "wall": 63861.4} {"step": 11933, "train_loss": 3.4494481086730957, "lr": 0.00029128067561084737, "tps": 12245, "wall": 63869.6} {"step": 11934, "train_loss": 3.4688234329223633, "lr": 0.0002912630833951357, "tps": 12244, "wall": 63877.7} {"step": 11935, "train_loss": 3.3525948524475098, "lr": 0.00029124549037215183, "tps": 12244, "wall": 63886.0} {"step": 11936, "train_loss": 3.3884048461914062, "lr": 0.0002912278965420952, "tps": 12243, "wall": 63894.5} {"step": 11937, "train_loss": 3.367662191390991, "lr": 0.0002912103019051652, "tps": 12243, "wall": 63902.7} {"step": 11938, "train_loss": 3.5079715251922607, "lr": 0.000291192706461561, "tps": 12242, "wall": 63910.9} {"step": 11939, "train_loss": 3.493879795074463, "lr": 0.00029117511021148194, "tps": 12242, "wall": 63919.2} {"step": 11940, "train_loss": 3.5683627128601074, "lr": 0.0002911575131551274, "tps": 12241, "wall": 63927.3} {"step": 11941, "train_loss": 3.460850715637207, "lr": 0.00029113991529269677, "tps": 12240, "wall": 63935.7} {"step": 11942, "train_loss": 3.4429988861083984, "lr": 0.00029112231662438925, "tps": 12240, "wall": 63944.1} {"step": 11943, "train_loss": 3.3959922790527344, "lr": 0.00029110471715040426, "tps": 12239, "wall": 63952.3} {"step": 11944, "train_loss": 3.4815454483032227, "lr": 0.00029108711687094124, "tps": 12239, "wall": 63960.6} {"step": 11945, "train_loss": 3.456264019012451, "lr": 0.00029106951578619953, "tps": 12238, "wall": 63968.9} {"step": 11946, "train_loss": 3.35899019241333, "lr": 0.00029105191389637846, "tps": 12238, "wall": 63977.2} {"step": 11947, "train_loss": 3.4426283836364746, "lr": 0.00029103431120167746, "tps": 12237, "wall": 63985.5} {"step": 11948, "train_loss": 3.569150447845459, "lr": 0.000291016707702296, "tps": 12236, "wall": 63993.7} {"step": 11949, "train_loss": 3.5839123725891113, "lr": 0.0002909991033984333, "tps": 12236, "wall": 64002.0} {"step": 11950, "train_loss": 3.427259922027588, "lr": 0.0002909814982902891, "tps": 12235, "wall": 64010.3} {"step": 11951, "train_loss": 3.5083603858947754, "lr": 0.00029096389237806254, "tps": 12235, "wall": 64018.5} {"step": 11952, "train_loss": 3.4710142612457275, "lr": 0.0002909462856619532, "tps": 12234, "wall": 64026.8} {"step": 11953, "train_loss": 3.493441343307495, "lr": 0.0002909286781421604, "tps": 12234, "wall": 64035.0} {"step": 11954, "train_loss": 3.5188300609588623, "lr": 0.00029091106981888384, "tps": 12233, "wall": 64043.3} {"step": 11955, "train_loss": 3.503051280975342, "lr": 0.0002908934606923228, "tps": 12233, "wall": 64051.5} {"step": 11956, "train_loss": 3.4990806579589844, "lr": 0.00029087585076267673, "tps": 12232, "wall": 64059.8} {"step": 11957, "train_loss": 3.4662699699401855, "lr": 0.0002908582400301452, "tps": 12231, "wall": 64068.3} {"step": 11958, "train_loss": 3.538505792617798, "lr": 0.0002908406284949278, "tps": 12231, "wall": 64076.6} {"step": 11959, "train_loss": 3.4483165740966797, "lr": 0.0002908230161572239, "tps": 12230, "wall": 64084.8} {"step": 11960, "train_loss": 3.461118698120117, "lr": 0.00029080540301723297, "tps": 12230, "wall": 64093.0} {"step": 11961, "train_loss": 3.5012104511260986, "lr": 0.00029078778907515464, "tps": 12229, "wall": 64101.3} {"step": 11962, "train_loss": 3.5186052322387695, "lr": 0.0002907701743311884, "tps": 12229, "wall": 64109.5} {"step": 11963, "train_loss": 3.4461135864257812, "lr": 0.0002907525587855338, "tps": 12228, "wall": 64117.9} {"step": 11964, "train_loss": 3.501067876815796, "lr": 0.0002907349424383904, "tps": 12228, "wall": 64126.2} {"step": 11965, "train_loss": 3.3883113861083984, "lr": 0.00029071732528995775, "tps": 12227, "wall": 64134.6} {"step": 11966, "train_loss": 3.5549564361572266, "lr": 0.0002906997073404354, "tps": 12226, "wall": 64142.9} {"step": 11967, "train_loss": 3.4640958309173584, "lr": 0.0002906820885900229, "tps": 12226, "wall": 64151.2} {"step": 11968, "train_loss": 3.5971763134002686, "lr": 0.00029066446903891995, "tps": 12225, "wall": 64159.5} {"step": 11969, "train_loss": 3.4910032749176025, "lr": 0.000290646848687326, "tps": 12225, "wall": 64167.9} {"step": 11970, "train_loss": 3.3639135360717773, "lr": 0.0002906292275354408, "tps": 12224, "wall": 64176.2} {"step": 11971, "train_loss": 3.45182466506958, "lr": 0.0002906116055834639, "tps": 12224, "wall": 64184.5} {"step": 11972, "train_loss": 3.4262092113494873, "lr": 0.0002905939828315948, "tps": 12223, "wall": 64192.9} {"step": 11973, "train_loss": 3.4459874629974365, "lr": 0.00029057635928003326, "tps": 12222, "wall": 64201.2} {"step": 11974, "train_loss": 3.4293062686920166, "lr": 0.000290558734928979, "tps": 12222, "wall": 64209.5} {"step": 11975, "train_loss": 3.507236957550049, "lr": 0.0002905411097786315, "tps": 12221, "wall": 64217.7} {"step": 11976, "train_loss": 3.445174217224121, "lr": 0.0002905234838291905, "tps": 12221, "wall": 64225.9} {"step": 11977, "train_loss": 3.3655033111572266, "lr": 0.00029050585708085576, "tps": 12220, "wall": 64234.1} {"step": 11978, "train_loss": 3.526409864425659, "lr": 0.0002904882295338268, "tps": 12220, "wall": 64242.3} {"step": 11979, "train_loss": 3.5147547721862793, "lr": 0.00029047060118830327, "tps": 12219, "wall": 64250.7} {"step": 11980, "train_loss": 3.481231212615967, "lr": 0.000290452972044485, "tps": 12219, "wall": 64259.0} {"step": 11981, "train_loss": 3.543735980987549, "lr": 0.0002904353421025717, "tps": 12218, "wall": 64267.2} {"step": 11982, "train_loss": 3.462118148803711, "lr": 0.00029041771136276303, "tps": 12217, "wall": 64275.5} {"step": 11983, "train_loss": 3.504473924636841, "lr": 0.00029040007982525866, "tps": 12217, "wall": 64283.7} {"step": 11984, "train_loss": 3.4896240234375, "lr": 0.0002903824474902584, "tps": 12216, "wall": 64291.9} {"step": 11985, "train_loss": 3.424863576889038, "lr": 0.000290364814357962, "tps": 12216, "wall": 64300.1} {"step": 11986, "train_loss": 3.406557321548462, "lr": 0.00029034718042856916, "tps": 12215, "wall": 64308.5} {"step": 11987, "train_loss": 3.561863660812378, "lr": 0.0002903295457022797, "tps": 12215, "wall": 64316.9} {"step": 11988, "train_loss": 3.452742576599121, "lr": 0.0002903119101792933, "tps": 12214, "wall": 64325.1} {"step": 11989, "train_loss": 3.4967291355133057, "lr": 0.00029029427385980974, "tps": 12214, "wall": 64333.3} {"step": 11990, "train_loss": 3.479430675506592, "lr": 0.0002902766367440288, "tps": 12213, "wall": 64341.5} {"step": 11991, "train_loss": 3.393413782119751, "lr": 0.00029025899883215045, "tps": 12213, "wall": 64349.7} {"step": 11992, "train_loss": 3.438831329345703, "lr": 0.00029024136012437433, "tps": 12212, "wall": 64358.0} {"step": 11993, "train_loss": 3.554969549179077, "lr": 0.0002902237206209002, "tps": 12211, "wall": 64366.2} {"step": 11994, "train_loss": 3.563310384750366, "lr": 0.00029020608032192803, "tps": 12211, "wall": 64374.5} {"step": 11995, "train_loss": 3.4885153770446777, "lr": 0.0002901884392276576, "tps": 12210, "wall": 64382.7} {"step": 11996, "train_loss": 3.429192543029785, "lr": 0.0002901707973382887, "tps": 12210, "wall": 64391.0} {"step": 11997, "train_loss": 3.465409517288208, "lr": 0.00029015315465402117, "tps": 12209, "wall": 64399.2} {"step": 11998, "train_loss": 3.5813064575195312, "lr": 0.00029013551117505493, "tps": 12209, "wall": 64407.3} {"step": 11999, "train_loss": 3.3947927951812744, "lr": 0.00029011786690158985, "tps": 12208, "wall": 64415.5} {"step": 12000, "train_loss": 3.5072059631347656, "lr": 0.0002901002218338258, "tps": 12208, "wall": 64423.7, "val_loss_monitor": 3.5030978004178346} {"step": 12001, "train_loss": 3.451291561126709, "lr": 0.00029008257597196266, "tps": 12197, "wall": 64483.3} {"step": 12002, "train_loss": 3.4073057174682617, "lr": 0.00029006492931620025, "tps": 12197, "wall": 64491.7} {"step": 12003, "train_loss": 3.4170408248901367, "lr": 0.0002900472818667386, "tps": 12196, "wall": 64500.0} {"step": 12004, "train_loss": 3.4995062351226807, "lr": 0.00029002963362377744, "tps": 12196, "wall": 64508.4} {"step": 12005, "train_loss": 3.4810147285461426, "lr": 0.00029001198458751694, "tps": 12195, "wall": 64516.7} {"step": 12006, "train_loss": 3.4443774223327637, "lr": 0.0002899943347581568, "tps": 12195, "wall": 64525.0} {"step": 12007, "train_loss": 3.482781410217285, "lr": 0.0002899766841358971, "tps": 12194, "wall": 64533.3} {"step": 12008, "train_loss": 3.567464828491211, "lr": 0.0002899590327209377, "tps": 12194, "wall": 64541.6} {"step": 12009, "train_loss": 3.2820589542388916, "lr": 0.0002899413805134786, "tps": 12193, "wall": 64550.0} {"step": 12010, "train_loss": 3.4960110187530518, "lr": 0.00028992372751371977, "tps": 12192, "wall": 64558.3} {"step": 12011, "train_loss": 3.487839937210083, "lr": 0.00028990607372186107, "tps": 12192, "wall": 64566.6} {"step": 12012, "train_loss": 3.547637462615967, "lr": 0.00028988841913810267, "tps": 12191, "wall": 64574.9} {"step": 12013, "train_loss": 3.502746105194092, "lr": 0.0002898707637626445, "tps": 12191, "wall": 64583.2} {"step": 12014, "train_loss": 3.4677538871765137, "lr": 0.0002898531075956865, "tps": 12190, "wall": 64591.6} {"step": 12015, "train_loss": 3.5103347301483154, "lr": 0.00028983545063742875, "tps": 12190, "wall": 64599.8} {"step": 12016, "train_loss": 3.501690626144409, "lr": 0.0002898177928880713, "tps": 12189, "wall": 64608.2} {"step": 12017, "train_loss": 3.5771422386169434, "lr": 0.00028980013434781396, "tps": 12189, "wall": 64616.5} {"step": 12018, "train_loss": 3.4752144813537598, "lr": 0.000289782475016857, "tps": 12188, "wall": 64624.8} {"step": 12019, "train_loss": 3.503866195678711, "lr": 0.0002897648148954004, "tps": 12187, "wall": 64633.0} {"step": 12020, "train_loss": 3.435183048248291, "lr": 0.00028974715398364417, "tps": 12187, "wall": 64641.3} {"step": 12021, "train_loss": 3.4743778705596924, "lr": 0.00028972949228178843, "tps": 12186, "wall": 64649.5} {"step": 12022, "train_loss": 3.371535301208496, "lr": 0.00028971182979003324, "tps": 12186, "wall": 64657.8} {"step": 12023, "train_loss": 3.493509292602539, "lr": 0.00028969416650857863, "tps": 12185, "wall": 64666.0} {"step": 12024, "train_loss": 3.440821409225464, "lr": 0.00028967650243762476, "tps": 12185, "wall": 64674.4} {"step": 12025, "train_loss": 3.471587657928467, "lr": 0.0002896588375773717, "tps": 12184, "wall": 64682.6} {"step": 12026, "train_loss": 3.3789501190185547, "lr": 0.00028964117192801955, "tps": 12184, "wall": 64690.8} {"step": 12027, "train_loss": 3.4866089820861816, "lr": 0.00028962350548976845, "tps": 12183, "wall": 64699.1} {"step": 12028, "train_loss": 3.479243755340576, "lr": 0.0002896058382628185, "tps": 12183, "wall": 64707.3} {"step": 12029, "train_loss": 3.4971818923950195, "lr": 0.0002895881702473699, "tps": 12182, "wall": 64715.5} {"step": 12030, "train_loss": 3.443910837173462, "lr": 0.00028957050144362263, "tps": 12182, "wall": 64723.5} {"step": 12031, "train_loss": 3.521318197250366, "lr": 0.00028955283185177707, "tps": 12181, "wall": 64731.9} {"step": 12032, "train_loss": 3.4366097450256348, "lr": 0.00028953516147203317, "tps": 12180, "wall": 64740.0} {"step": 12033, "train_loss": 3.5002684593200684, "lr": 0.0002895174903045913, "tps": 12180, "wall": 64748.2} {"step": 12034, "train_loss": 3.4984025955200195, "lr": 0.00028949981834965147, "tps": 12179, "wall": 64756.3} {"step": 12035, "train_loss": 3.5282044410705566, "lr": 0.00028948214560741396, "tps": 12179, "wall": 64764.5} {"step": 12036, "train_loss": 3.3979241847991943, "lr": 0.00028946447207807896, "tps": 12178, "wall": 64772.6} {"step": 12037, "train_loss": 3.514805316925049, "lr": 0.00028944679776184666, "tps": 12178, "wall": 64780.8} {"step": 12038, "train_loss": 3.404745578765869, "lr": 0.0002894291226589172, "tps": 12177, "wall": 64789.1} {"step": 12039, "train_loss": 3.4905171394348145, "lr": 0.000289411446769491, "tps": 12177, "wall": 64797.2} {"step": 12040, "train_loss": 3.4294323921203613, "lr": 0.0002893937700937681, "tps": 12176, "wall": 64805.4} {"step": 12041, "train_loss": 3.432058334350586, "lr": 0.0002893760926319488, "tps": 12176, "wall": 64813.5} {"step": 12042, "train_loss": 3.467444896697998, "lr": 0.00028935841438423345, "tps": 12175, "wall": 64821.8} {"step": 12043, "train_loss": 3.4025936126708984, "lr": 0.0002893407353508222, "tps": 12175, "wall": 64830.0} {"step": 12044, "train_loss": 3.5248875617980957, "lr": 0.0002893230555319153, "tps": 12174, "wall": 64838.2} {"step": 12045, "train_loss": 3.4773926734924316, "lr": 0.0002893053749277131, "tps": 12174, "wall": 64846.3} {"step": 12046, "train_loss": 3.4458744525909424, "lr": 0.00028928769353841593, "tps": 12173, "wall": 64854.7} {"step": 12047, "train_loss": 3.4820055961608887, "lr": 0.00028927001136422396, "tps": 12173, "wall": 64862.8} {"step": 12048, "train_loss": 3.568039894104004, "lr": 0.0002892523284053375, "tps": 12172, "wall": 64871.0} {"step": 12049, "train_loss": 3.4900598526000977, "lr": 0.00028923464466195704, "tps": 12171, "wall": 64879.2} {"step": 12050, "train_loss": 3.450648069381714, "lr": 0.0002892169601342827, "tps": 12171, "wall": 64887.4} {"step": 12051, "train_loss": 3.512908458709717, "lr": 0.00028919927482251486, "tps": 12170, "wall": 64895.5} {"step": 12052, "train_loss": 3.4194231033325195, "lr": 0.000289181588726854, "tps": 12170, "wall": 64903.6} {"step": 12053, "train_loss": 3.394430637359619, "lr": 0.0002891639018475003, "tps": 12169, "wall": 64911.9} {"step": 12054, "train_loss": 3.4586591720581055, "lr": 0.00028914621418465417, "tps": 12169, "wall": 64920.1} {"step": 12055, "train_loss": 3.546328544616699, "lr": 0.00028912852573851597, "tps": 12168, "wall": 64928.3} {"step": 12056, "train_loss": 3.5994954109191895, "lr": 0.0002891108365092862, "tps": 12168, "wall": 64936.4} {"step": 12057, "train_loss": 3.5247349739074707, "lr": 0.000289093146497165, "tps": 12167, "wall": 64944.6} {"step": 12058, "train_loss": 3.4942684173583984, "lr": 0.0002890754557023529, "tps": 12167, "wall": 64952.7} {"step": 12059, "train_loss": 3.4842116832733154, "lr": 0.00028905776412505046, "tps": 12166, "wall": 64960.9} {"step": 12060, "train_loss": 3.4528000354766846, "lr": 0.0002890400717654578, "tps": 12166, "wall": 64969.1} {"step": 12061, "train_loss": 3.420194625854492, "lr": 0.00028902237862377545, "tps": 12165, "wall": 64977.3} {"step": 12062, "train_loss": 3.504713535308838, "lr": 0.00028900468470020386, "tps": 12165, "wall": 64985.5} {"step": 12063, "train_loss": 3.3660473823547363, "lr": 0.0002889869899949436, "tps": 12164, "wall": 64993.6} {"step": 12064, "train_loss": 3.4817733764648438, "lr": 0.0002889692945081949, "tps": 12164, "wall": 65001.8} {"step": 12065, "train_loss": 3.4846365451812744, "lr": 0.0002889515982401582, "tps": 12163, "wall": 65009.8} {"step": 12066, "train_loss": 3.453378677368164, "lr": 0.00028893390119103424, "tps": 12163, "wall": 65018.0} {"step": 12067, "train_loss": 3.572841167449951, "lr": 0.00028891620336102324, "tps": 12162, "wall": 65026.1} {"step": 12068, "train_loss": 3.5772972106933594, "lr": 0.0002888985047503257, "tps": 12162, "wall": 65034.3} {"step": 12069, "train_loss": 3.4387171268463135, "lr": 0.0002888808053591422, "tps": 12161, "wall": 65042.5} {"step": 12070, "train_loss": 3.395064115524292, "lr": 0.0002888631051876733, "tps": 12161, "wall": 65050.7} {"step": 12071, "train_loss": 3.5427558422088623, "lr": 0.0002888454042361194, "tps": 12160, "wall": 65058.7} {"step": 12072, "train_loss": 3.3999335765838623, "lr": 0.0002888277025046809, "tps": 12160, "wall": 65066.8} {"step": 12073, "train_loss": 3.457226037979126, "lr": 0.00028880999999355867, "tps": 12159, "wall": 65074.9} {"step": 12074, "train_loss": 3.4967613220214844, "lr": 0.00028879229670295285, "tps": 12159, "wall": 65083.1} {"step": 12075, "train_loss": 3.444209575653076, "lr": 0.00028877459263306426, "tps": 12158, "wall": 65091.4} {"step": 12076, "train_loss": 3.431905508041382, "lr": 0.0002887568877840934, "tps": 12157, "wall": 65099.6} {"step": 12077, "train_loss": 3.485360622406006, "lr": 0.00028873918215624076, "tps": 12157, "wall": 65107.7} {"step": 12078, "train_loss": 3.6176557540893555, "lr": 0.0002887214757497069, "tps": 12156, "wall": 65115.8} {"step": 12079, "train_loss": 3.475210666656494, "lr": 0.0002887037685646925, "tps": 12156, "wall": 65124.0} {"step": 12080, "train_loss": 3.4393773078918457, "lr": 0.0002886860606013981, "tps": 12155, "wall": 65132.1} {"step": 12081, "train_loss": 3.4818832874298096, "lr": 0.0002886683518600242, "tps": 12155, "wall": 65140.3} {"step": 12082, "train_loss": 3.5179553031921387, "lr": 0.00028865064234077155, "tps": 12154, "wall": 65148.5} {"step": 12083, "train_loss": 3.4794838428497314, "lr": 0.00028863293204384074, "tps": 12154, "wall": 65156.6} {"step": 12084, "train_loss": 3.5068650245666504, "lr": 0.00028861522096943235, "tps": 12153, "wall": 65164.8} {"step": 12085, "train_loss": 3.441952705383301, "lr": 0.000288597509117747, "tps": 12153, "wall": 65172.9} {"step": 12086, "train_loss": 3.429536819458008, "lr": 0.00028857979648898535, "tps": 12152, "wall": 65181.0} {"step": 12087, "train_loss": 3.4624199867248535, "lr": 0.0002885620830833481, "tps": 12152, "wall": 65189.1} {"step": 12088, "train_loss": 3.5488171577453613, "lr": 0.00028854436890103587, "tps": 12151, "wall": 65197.2} {"step": 12089, "train_loss": 3.5263876914978027, "lr": 0.00028852665394224925, "tps": 12151, "wall": 65205.3} {"step": 12090, "train_loss": 3.589345932006836, "lr": 0.00028850893820718906, "tps": 12150, "wall": 65213.6} {"step": 12091, "train_loss": 3.40995454788208, "lr": 0.00028849122169605587, "tps": 12150, "wall": 65221.6} {"step": 12092, "train_loss": 3.539534568786621, "lr": 0.0002884735044090504, "tps": 12149, "wall": 65229.8} {"step": 12093, "train_loss": 3.4667892456054688, "lr": 0.0002884557863463734, "tps": 12149, "wall": 65237.9} {"step": 12094, "train_loss": 3.4654834270477295, "lr": 0.0002884380675082256, "tps": 12148, "wall": 65246.0} {"step": 12095, "train_loss": 3.4234917163848877, "lr": 0.0002884203478948076, "tps": 12148, "wall": 65254.1} {"step": 12096, "train_loss": 3.4519400596618652, "lr": 0.00028840262750632023, "tps": 12147, "wall": 65262.3} {"step": 12097, "train_loss": 3.4750449657440186, "lr": 0.0002883849063429642, "tps": 12147, "wall": 65270.5} {"step": 12098, "train_loss": 3.495011806488037, "lr": 0.0002883671844049402, "tps": 12146, "wall": 65278.6} {"step": 12099, "train_loss": 3.4520580768585205, "lr": 0.000288349461692449, "tps": 12146, "wall": 65286.8} {"step": 12100, "train_loss": 3.440441131591797, "lr": 0.00028833173820569147, "tps": 12145, "wall": 65294.9} {"step": 12101, "train_loss": 3.479160785675049, "lr": 0.00028831401394486834, "tps": 12145, "wall": 65303.0} {"step": 12102, "train_loss": 3.4380993843078613, "lr": 0.0002882962889101803, "tps": 12144, "wall": 65311.3} {"step": 12103, "train_loss": 3.5365991592407227, "lr": 0.0002882785631018282, "tps": 12144, "wall": 65319.4} {"step": 12104, "train_loss": 3.423516035079956, "lr": 0.00028826083652001285, "tps": 12143, "wall": 65327.7} {"step": 12105, "train_loss": 3.4991683959960938, "lr": 0.0002882431091649351, "tps": 12143, "wall": 65335.7} {"step": 12106, "train_loss": 3.4833946228027344, "lr": 0.00028822538103679573, "tps": 12142, "wall": 65343.8} {"step": 12107, "train_loss": 3.4237661361694336, "lr": 0.0002882076521357955, "tps": 12142, "wall": 65352.0} {"step": 12108, "train_loss": 3.444612979888916, "lr": 0.0002881899224621353, "tps": 12141, "wall": 65360.0} {"step": 12109, "train_loss": 3.5407896041870117, "lr": 0.000288172192016016, "tps": 12141, "wall": 65368.1} {"step": 12110, "train_loss": 3.5271060466766357, "lr": 0.0002881544607976384, "tps": 12140, "wall": 65376.3} {"step": 12111, "train_loss": 3.409334421157837, "lr": 0.00028813672880720337, "tps": 12140, "wall": 65384.4} {"step": 12112, "train_loss": 3.472308397293091, "lr": 0.00028811899604491183, "tps": 12139, "wall": 65392.7} {"step": 12113, "train_loss": 3.4080848693847656, "lr": 0.0002881012625109646, "tps": 12139, "wall": 65400.8} {"step": 12114, "train_loss": 3.5308566093444824, "lr": 0.0002880835282055625, "tps": 12138, "wall": 65408.9} {"step": 12115, "train_loss": 3.486194133758545, "lr": 0.0002880657931289067, "tps": 12138, "wall": 65417.0} {"step": 12116, "train_loss": 3.490696907043457, "lr": 0.00028804805728119775, "tps": 12137, "wall": 65425.1} {"step": 12117, "train_loss": 3.51305890083313, "lr": 0.0002880303206626368, "tps": 12137, "wall": 65433.2} {"step": 12118, "train_loss": 3.470262050628662, "lr": 0.00028801258327342466, "tps": 12136, "wall": 65441.3} {"step": 12119, "train_loss": 3.4885482788085938, "lr": 0.0002879948451137623, "tps": 12136, "wall": 65449.6} {"step": 12120, "train_loss": 3.436260223388672, "lr": 0.00028797710618385064, "tps": 12135, "wall": 65457.6} {"step": 12121, "train_loss": 3.4662909507751465, "lr": 0.0002879593664838907, "tps": 12135, "wall": 65465.7} {"step": 12122, "train_loss": 3.4371705055236816, "lr": 0.00028794162601408334, "tps": 12134, "wall": 65474.0} {"step": 12123, "train_loss": 3.451040744781494, "lr": 0.0002879238847746295, "tps": 12133, "wall": 65482.2} {"step": 12124, "train_loss": 3.4367928504943848, "lr": 0.0002879061427657304, "tps": 12133, "wall": 65490.4} {"step": 12001, "train_loss": 3.40289306640625, "lr": 0.00029008257597196266, "tps": 169344322, "wall": 4.6} {"step": 12002, "train_loss": 3.421067714691162, "lr": 0.00029006492931620025, "tps": 91542858, "wall": 8.6} {"step": 12003, "train_loss": 3.4190003871917725, "lr": 0.0002900472818667386, "tps": 62185603, "wall": 12.7} {"step": 12004, "train_loss": 3.5077273845672607, "lr": 0.00029002963362377744, "tps": 46705930, "wall": 16.8} {"step": 12005, "train_loss": 3.3827550411224365, "lr": 0.00029001198458751694, "tps": 37209861, "wall": 21.1} {"step": 12006, "train_loss": 3.4193997383117676, "lr": 0.0002899943347581568, "tps": 30858128, "wall": 25.5} {"step": 12007, "train_loss": 3.4064722061157227, "lr": 0.0002899766841358971, "tps": 26258550, "wall": 30.0} {"step": 12008, "train_loss": 3.506822109222412, "lr": 0.0002899590327209377, "tps": 22878918, "wall": 34.4} {"step": 12009, "train_loss": 3.4736905097961426, "lr": 0.0002899413805134786, "tps": 20235592, "wall": 38.9} {"step": 12010, "train_loss": 3.501345634460449, "lr": 0.00028992372751371977, "tps": 18105865, "wall": 43.5} {"step": 12011, "train_loss": 3.3855996131896973, "lr": 0.00028990607372186107, "tps": 16343168, "wall": 48.2} {"step": 12012, "train_loss": 3.472259998321533, "lr": 0.00028988841913810267, "tps": 14847782, "wall": 53.0} {"step": 12013, "train_loss": 3.347350597381592, "lr": 0.0002898707637626445, "tps": 13546429, "wall": 58.1} {"step": 12014, "train_loss": 3.4081149101257324, "lr": 0.0002898531075956865, "tps": 12436010, "wall": 63.3} {"step": 12015, "train_loss": 3.551806688308716, "lr": 0.00028983545063742875, "tps": 11482878, "wall": 68.6} {"step": 12016, "train_loss": 3.4635374546051025, "lr": 0.0002898177928880713, "tps": 10663627, "wall": 73.9} {"step": 12017, "train_loss": 3.3998475074768066, "lr": 0.00028980013434781396, "tps": 9952289, "wall": 79.1} {"step": 12018, "train_loss": 3.5015854835510254, "lr": 0.000289782475016857, "tps": 9311967, "wall": 84.6} {"step": 12019, "train_loss": 3.4751641750335693, "lr": 0.0002897648148954004, "tps": 8734235, "wall": 90.2} {"step": 12020, "train_loss": 3.4356539249420166, "lr": 0.00028974715398364417, "tps": 8240003, "wall": 95.6} {"step": 12021, "train_loss": 3.5311946868896484, "lr": 0.00028972949228178843, "tps": 7797449, "wall": 101.0} {"step": 12022, "train_loss": 3.5217339992523193, "lr": 0.00028971182979003324, "tps": 7397937, "wall": 106.5} {"step": 12023, "train_loss": 3.427642345428467, "lr": 0.00028969416650857863, "tps": 7044281, "wall": 111.9} {"step": 12024, "train_loss": 3.3986141681671143, "lr": 0.00028967650243762476, "tps": 6721208, "wall": 117.3} {"step": 12025, "train_loss": 3.4190926551818848, "lr": 0.0002896588375773717, "tps": 6429774, "wall": 122.6} {"step": 12026, "train_loss": 3.3270740509033203, "lr": 0.00028964117192801955, "tps": 6162661, "wall": 127.9} {"step": 12027, "train_loss": 3.4175753593444824, "lr": 0.00028962350548976845, "tps": 5913741, "wall": 133.3} {"step": 12028, "train_loss": 3.542224645614624, "lr": 0.0002896058382628185, "tps": 5681373, "wall": 138.8} {"step": 12029, "train_loss": 3.426377058029175, "lr": 0.0002895881702473699, "tps": 5466389, "wall": 144.2} {"step": 12030, "train_loss": 3.460127353668213, "lr": 0.00028957050144362263, "tps": 5263075, "wall": 149.8} {"step": 12031, "train_loss": 3.4142379760742188, "lr": 0.00028955283185177707, "tps": 5080177, "wall": 155.2} {"step": 12032, "train_loss": 3.465660572052002, "lr": 0.00028953516147203317, "tps": 4905637, "wall": 160.8} {"step": 12033, "train_loss": 3.469045639038086, "lr": 0.0002895174903045913, "tps": 4742654, "wall": 166.3} {"step": 12034, "train_loss": 3.3356502056121826, "lr": 0.00028949981834965147, "tps": 4585672, "wall": 172.0} {"step": 12035, "train_loss": 3.4854683876037598, "lr": 0.00028948214560741396, "tps": 4439713, "wall": 177.7} {"step": 12036, "train_loss": 3.450216293334961, "lr": 0.00028946447207807896, "tps": 4296732, "wall": 183.6} {"step": 12037, "train_loss": 3.4796903133392334, "lr": 0.00028944679776184666, "tps": 4162499, "wall": 189.5} {"step": 12038, "train_loss": 3.4324212074279785, "lr": 0.0002894291226589172, "tps": 4036237, "wall": 195.5} {"step": 12039, "train_loss": 3.3686556816101074, "lr": 0.000289411446769491, "tps": 3915126, "wall": 201.5} {"step": 12040, "train_loss": 3.4087090492248535, "lr": 0.0002893937700937681, "tps": 3790382, "wall": 208.2} {"step": 12041, "train_loss": 3.393785238265991, "lr": 0.0002893760926319488, "tps": 3676249, "wall": 214.7} {"step": 12042, "train_loss": 3.493032693862915, "lr": 0.00028935841438423345, "tps": 3567193, "wall": 221.3} {"step": 12043, "train_loss": 3.3262248039245605, "lr": 0.0002893407353508222, "tps": 3454688, "wall": 228.5} {"step": 12044, "train_loss": 3.5214502811431885, "lr": 0.0002893230555319153, "tps": 3354061, "wall": 235.4} {"step": 12045, "train_loss": 3.3705921173095703, "lr": 0.0002893053749277131, "tps": 3254098, "wall": 242.6} {"step": 12046, "train_loss": 3.514937162399292, "lr": 0.00028928769353841593, "tps": 3163212, "wall": 249.6} {"step": 12047, "train_loss": 3.3082993030548096, "lr": 0.00028927001136422396, "tps": 3076266, "wall": 256.7} {"step": 12048, "train_loss": 3.4814505577087402, "lr": 0.0002892523284053375, "tps": 2989342, "wall": 264.2} {"step": 12049, "train_loss": 3.5179591178894043, "lr": 0.00028923464466195704, "tps": 2908328, "wall": 271.5} {"step": 12050, "train_loss": 3.4506683349609375, "lr": 0.0002892169601342827, "tps": 2826619, "wall": 279.4} {"step": 12051, "train_loss": 3.3592870235443115, "lr": 0.00028919927482251486, "tps": 2750435, "wall": 287.2} {"step": 12052, "train_loss": 3.470945358276367, "lr": 0.000289181588726854, "tps": 2677346, "wall": 295.0} {"step": 12053, "train_loss": 3.502816677093506, "lr": 0.0002891639018475003, "tps": 2606342, "wall": 303.1} {"step": 12054, "train_loss": 3.445448875427246, "lr": 0.00028914621418465417, "tps": 2537530, "wall": 311.3} {"step": 12055, "train_loss": 3.409529685974121, "lr": 0.00028912852573851597, "tps": 2472860, "wall": 319.5} {"step": 12056, "train_loss": 3.391357421875, "lr": 0.0002891108365092862, "tps": 2409298, "wall": 328.0} {"step": 12057, "train_loss": 3.476294994354248, "lr": 0.000289093146497165, "tps": 2351477, "wall": 336.1} {"step": 12058, "train_loss": 3.466921091079712, "lr": 0.0002890754557023529, "tps": 2295272, "wall": 344.3} {"step": 12059, "train_loss": 3.4479000568389893, "lr": 0.00028905776412505046, "tps": 2237767, "wall": 353.2} {"step": 12060, "train_loss": 3.5734751224517822, "lr": 0.0002890400717654578, "tps": 2187677, "wall": 361.3} {"step": 12061, "train_loss": 3.5004587173461914, "lr": 0.00028902237862377545, "tps": 2140147, "wall": 369.4} {"step": 12062, "train_loss": 3.4495413303375244, "lr": 0.00028900468470020386, "tps": 2094421, "wall": 377.5} {"step": 12063, "train_loss": 3.521289348602295, "lr": 0.0002889869899949436, "tps": 2049878, "wall": 385.7} {"step": 12064, "train_loss": 3.4311046600341797, "lr": 0.0002889692945081949, "tps": 2006886, "wall": 394.0} {"step": 12065, "train_loss": 3.429978370666504, "lr": 0.0002889515982401582, "tps": 1967109, "wall": 402.0} {"step": 12066, "train_loss": 3.515047550201416, "lr": 0.00028893390119103424, "tps": 1928678, "wall": 410.0} {"step": 12067, "train_loss": 3.5530195236206055, "lr": 0.00028891620336102324, "tps": 1891747, "wall": 418.1} {"step": 12068, "train_loss": 3.415929079055786, "lr": 0.0002888985047503257, "tps": 1856484, "wall": 426.0} {"step": 12069, "train_loss": 3.3555445671081543, "lr": 0.0002888808053591422, "tps": 1822774, "wall": 434.0} {"step": 12070, "train_loss": 3.5453433990478516, "lr": 0.0002888631051876733, "tps": 1790459, "wall": 441.8} {"step": 12071, "train_loss": 3.458287477493286, "lr": 0.0002888454042361194, "tps": 1758726, "wall": 449.8} {"step": 12072, "train_loss": 3.4397976398468018, "lr": 0.0002888277025046809, "tps": 1728853, "wall": 457.7} {"step": 12073, "train_loss": 3.4629411697387695, "lr": 0.00028880999999355867, "tps": 1699967, "wall": 465.5} {"step": 12074, "train_loss": 3.3934428691864014, "lr": 0.00028879229670295285, "tps": 1672184, "wall": 473.2} {"step": 12075, "train_loss": 3.454300880432129, "lr": 0.00028877459263306426, "tps": 1645309, "wall": 481.0} {"step": 12076, "train_loss": 3.5037789344787598, "lr": 0.0002887568877840934, "tps": 1619542, "wall": 488.7} {"step": 12077, "train_loss": 3.468440294265747, "lr": 0.00028873918215624076, "tps": 1594709, "wall": 496.4} {"step": 12078, "train_loss": 3.503129720687866, "lr": 0.0002887214757497069, "tps": 1570681, "wall": 504.0} {"step": 12079, "train_loss": 3.557251214981079, "lr": 0.0002887037685646925, "tps": 1547450, "wall": 511.6} {"step": 12080, "train_loss": 3.391916036605835, "lr": 0.0002886860606013981, "tps": 1525032, "wall": 519.2} {"step": 12081, "train_loss": 3.4697203636169434, "lr": 0.0002886683518600242, "tps": 1503531, "wall": 526.6} {"step": 12082, "train_loss": 3.4431748390197754, "lr": 0.00028865064234077155, "tps": 1482400, "wall": 534.2} {"step": 12083, "train_loss": 3.428305149078369, "lr": 0.00028863293204384074, "tps": 1461712, "wall": 541.8} {"step": 12084, "train_loss": 3.445439338684082, "lr": 0.00028861522096943235, "tps": 1442346, "wall": 549.1} {"step": 12085, "train_loss": 3.510392427444458, "lr": 0.000288597509117747, "tps": 1423722, "wall": 556.3} {"step": 12086, "train_loss": 3.4641201496124268, "lr": 0.00028857979648898535, "tps": 1405460, "wall": 563.6} {"step": 12087, "train_loss": 3.4402709007263184, "lr": 0.0002885620830833481, "tps": 1387718, "wall": 570.9} {"step": 12088, "train_loss": 3.4552154541015625, "lr": 0.00028854436890103587, "tps": 1370757, "wall": 578.0} {"step": 12089, "train_loss": 3.4382786750793457, "lr": 0.00028852665394224925, "tps": 1353326, "wall": 585.5} {"step": 12090, "train_loss": 3.4295525550842285, "lr": 0.00028850893820718906, "tps": 1336809, "wall": 592.8} {"step": 12091, "train_loss": 3.3679850101470947, "lr": 0.00028849122169605587, "tps": 1320945, "wall": 599.9} {"step": 12092, "train_loss": 3.4886727333068848, "lr": 0.0002884735044090504, "tps": 1305741, "wall": 607.0} {"step": 12093, "train_loss": 3.475480079650879, "lr": 0.0002884557863463734, "tps": 1289877, "wall": 614.5} {"step": 12094, "train_loss": 3.498157501220703, "lr": 0.0002884380675082256, "tps": 1275458, "wall": 621.5} {"step": 12095, "train_loss": 3.396723747253418, "lr": 0.0002884203478948076, "tps": 1261455, "wall": 628.4} {"step": 12096, "train_loss": 3.4377574920654297, "lr": 0.00028840262750632023, "tps": 1248092, "wall": 635.2} {"step": 12097, "train_loss": 3.4363179206848145, "lr": 0.0002883849063429642, "tps": 1234135, "wall": 642.4} {"step": 12098, "train_loss": 3.5065391063690186, "lr": 0.0002883671844049402, "tps": 1221536, "wall": 649.1} {"step": 12099, "train_loss": 3.5153636932373047, "lr": 0.000288349461692449, "tps": 1209026, "wall": 655.9} {"step": 12100, "train_loss": 3.4506139755249023, "lr": 0.00028833173820569147, "tps": 1196906, "wall": 662.6} {"step": 12101, "train_loss": 3.309767246246338, "lr": 0.00028831401394486834, "tps": 1185377, "wall": 669.1} {"step": 12102, "train_loss": 3.3840713500976562, "lr": 0.0002882962889101803, "tps": 1173930, "wall": 675.7} {"step": 12103, "train_loss": 3.374690055847168, "lr": 0.0002882785631018282, "tps": 1163040, "wall": 682.0} {"step": 12104, "train_loss": 3.358645439147949, "lr": 0.00028826083652001285, "tps": 1152006, "wall": 688.6} {"step": 12105, "train_loss": 3.412846565246582, "lr": 0.0002882431091649351, "tps": 1141388, "wall": 695.1} {"step": 12106, "train_loss": 3.491863250732422, "lr": 0.00028822538103679573, "tps": 1131026, "wall": 701.5} {"step": 12107, "train_loss": 3.3882076740264893, "lr": 0.0002882076521357955, "tps": 1121118, "wall": 707.8} {"step": 12108, "train_loss": 3.5195670127868652, "lr": 0.0002881899224621353, "tps": 1111319, "wall": 714.1} {"step": 12109, "train_loss": 3.410409927368164, "lr": 0.000288172192016016, "tps": 1101619, "wall": 720.4} {"step": 12110, "train_loss": 3.437086343765259, "lr": 0.0002881544607976384, "tps": 1092185, "wall": 726.7} {"step": 12111, "train_loss": 3.4070584774017334, "lr": 0.00028813672880720337, "tps": 1083104, "wall": 732.9} {"step": 12112, "train_loss": 3.4207561016082764, "lr": 0.00028811899604491183, "tps": 1074027, "wall": 739.1} {"step": 12113, "train_loss": 3.438539505004883, "lr": 0.0002881012625109646, "tps": 1065169, "wall": 745.3} {"step": 12114, "train_loss": 3.4087727069854736, "lr": 0.0002880835282055625, "tps": 1056407, "wall": 751.6} {"step": 12115, "train_loss": 3.449810266494751, "lr": 0.0002880657931289067, "tps": 1047967, "wall": 757.7} {"step": 12116, "train_loss": 3.4325857162475586, "lr": 0.00028804805728119775, "tps": 1039632, "wall": 763.8} {"step": 12117, "train_loss": 3.441101551055908, "lr": 0.0002880303206626368, "tps": 1031326, "wall": 770.0} {"step": 12118, "train_loss": 3.397573947906494, "lr": 0.00028801258327342466, "tps": 1023327, "wall": 776.1} {"step": 12119, "train_loss": 3.5142879486083984, "lr": 0.0002879948451137623, "tps": 1015480, "wall": 782.2} {"step": 12120, "train_loss": 3.5140938758850098, "lr": 0.00028797710618385064, "tps": 1007835, "wall": 788.2} {"step": 12121, "train_loss": 3.437405824661255, "lr": 0.0002879593664838907, "tps": 1000234, "wall": 794.2} {"step": 12122, "train_loss": 3.4798693656921387, "lr": 0.00028794162601408334, "tps": 992806, "wall": 800.2} {"step": 12123, "train_loss": 3.4559977054595947, "lr": 0.0002879238847746295, "tps": 985467, "wall": 806.3} {"step": 12124, "train_loss": 3.434230089187622, "lr": 0.0002879061427657304, "tps": 978210, "wall": 812.3} {"step": 12125, "train_loss": 3.445974826812744, "lr": 0.00028788839998758665, "tps": 971142, "wall": 818.3} {"step": 12126, "train_loss": 3.3835394382476807, "lr": 0.00028787065644039956, "tps": 964126, "wall": 824.3} {"step": 12127, "train_loss": 3.492119312286377, "lr": 0.00028785291212436997, "tps": 957341, "wall": 830.2} {"step": 12128, "train_loss": 3.4559249877929688, "lr": 0.0002878351670396989, "tps": 950585, "wall": 836.2} {"step": 12129, "train_loss": 3.424563407897949, "lr": 0.0002878174211865874, "tps": 943976, "wall": 842.1} {"step": 12130, "train_loss": 3.4511055946350098, "lr": 0.00028779967456523645, "tps": 937410, "wall": 848.1} {"step": 12131, "train_loss": 3.427152156829834, "lr": 0.0002877819271758472, "tps": 930948, "wall": 854.1} {"step": 12132, "train_loss": 3.53922963142395, "lr": 0.00028776417901862054, "tps": 924436, "wall": 860.1} {"step": 12133, "train_loss": 3.3287806510925293, "lr": 0.0002877464300937576, "tps": 918056, "wall": 866.2} {"step": 12134, "train_loss": 3.3372745513916016, "lr": 0.00028772868040145947, "tps": 911776, "wall": 872.2} {"step": 12135, "train_loss": 3.3072471618652344, "lr": 0.00028771092994192717, "tps": 905753, "wall": 878.1} {"step": 12136, "train_loss": 3.5976247787475586, "lr": 0.0002876931787153618, "tps": 899807, "wall": 884.0} {"step": 12137, "train_loss": 3.4656906127929688, "lr": 0.00028767542672196434, "tps": 893919, "wall": 889.9} {"step": 12138, "train_loss": 3.3643150329589844, "lr": 0.00028765767396193615, "tps": 888098, "wall": 895.8} {"step": 12139, "train_loss": 3.5493979454040527, "lr": 0.00028763992043547807, "tps": 882419, "wall": 901.6} {"step": 12140, "train_loss": 3.3372979164123535, "lr": 0.00028762216614279133, "tps": 876764, "wall": 907.5} {"step": 12141, "train_loss": 3.437725067138672, "lr": 0.00028760441108407705, "tps": 871181, "wall": 913.4} {"step": 12142, "train_loss": 3.4163129329681396, "lr": 0.0002875866552595363, "tps": 865703, "wall": 919.3} {"step": 12143, "train_loss": 3.538466691970825, "lr": 0.0002875688986693703, "tps": 859876, "wall": 925.6} {"step": 12144, "train_loss": 3.5664217472076416, "lr": 0.00028755114131378016, "tps": 854157, "wall": 931.8} {"step": 12145, "train_loss": 3.4483871459960938, "lr": 0.000287533383192967, "tps": 848612, "wall": 938.0} {"step": 12146, "train_loss": 3.348522663116455, "lr": 0.00028751562430713205, "tps": 843205, "wall": 944.1} {"step": 12147, "train_loss": 3.4134750366210938, "lr": 0.0002874978646564765, "tps": 837825, "wall": 950.2} {"step": 12148, "train_loss": 3.446634531021118, "lr": 0.0002874801042412014, "tps": 831801, "wall": 957.2} {"step": 12149, "train_loss": 3.4555063247680664, "lr": 0.00028746234306150807, "tps": 826168, "wall": 963.8} {"step": 12150, "train_loss": 3.321443557739258, "lr": 0.0002874445811175977, "tps": 821133, "wall": 969.8} {"step": 12151, "train_loss": 3.4116477966308594, "lr": 0.0002874268184096715, "tps": 816068, "wall": 975.9} {"step": 12152, "train_loss": 3.4504201412200928, "lr": 0.00028740905493793053, "tps": 811053, "wall": 982.0} {"step": 12153, "train_loss": 3.4941842555999756, "lr": 0.0002873912907025762, "tps": 806078, "wall": 988.1} {"step": 12154, "train_loss": 3.440894603729248, "lr": 0.00028737352570380964, "tps": 801509, "wall": 993.9} {"step": 12155, "train_loss": 3.3622686862945557, "lr": 0.00028735575994183227, "tps": 797020, "wall": 999.5} {"step": 12156, "train_loss": 3.4218082427978516, "lr": 0.0002873379934168451, "tps": 792607, "wall": 1005.2} {"step": 12157, "train_loss": 3.4048426151275635, "lr": 0.0002873202261290495, "tps": 788216, "wall": 1010.9} {"step": 12158, "train_loss": 3.509035110473633, "lr": 0.00028730245807864676, "tps": 783915, "wall": 1016.5} {"step": 12159, "train_loss": 3.408926486968994, "lr": 0.0002872846892658381, "tps": 779619, "wall": 1022.2} {"step": 12160, "train_loss": 3.4466309547424316, "lr": 0.00028726691969082485, "tps": 775405, "wall": 1027.8} {"step": 12161, "train_loss": 3.580831527709961, "lr": 0.0002872491493538083, "tps": 771246, "wall": 1033.5} {"step": 12162, "train_loss": 3.336846351623535, "lr": 0.00028723137825498976, "tps": 767175, "wall": 1039.0} {"step": 12163, "train_loss": 3.4554495811462402, "lr": 0.0002872136063945705, "tps": 763119, "wall": 1044.6} {"step": 12164, "train_loss": 3.3621835708618164, "lr": 0.0002871958337727519, "tps": 759066, "wall": 1050.3} {"step": 12165, "train_loss": 3.4020423889160156, "lr": 0.0002871780603897353, "tps": 755141, "wall": 1055.8} {"step": 12166, "train_loss": 3.573355197906494, "lr": 0.00028716028624572196, "tps": 751251, "wall": 1061.4} {"step": 12167, "train_loss": 3.3272042274475098, "lr": 0.00028714251134091324, "tps": 747385, "wall": 1067.0} {"step": 12168, "train_loss": 3.3304529190063477, "lr": 0.00028712473567551057, "tps": 743550, "wall": 1072.6} {"step": 12169, "train_loss": 3.3621387481689453, "lr": 0.0002871069592497152, "tps": 739762, "wall": 1078.1} {"step": 12170, "train_loss": 3.469353199005127, "lr": 0.0002870891820637286, "tps": 736002, "wall": 1083.7} {"step": 12171, "train_loss": 3.473288059234619, "lr": 0.0002870714041177521, "tps": 732297, "wall": 1089.3} {"step": 12172, "train_loss": 3.5104222297668457, "lr": 0.0002870536254119871, "tps": 728565, "wall": 1095.0} {"step": 12173, "train_loss": 3.3194031715393066, "lr": 0.0002870358459466351, "tps": 724880, "wall": 1100.6} {"step": 12174, "train_loss": 3.4153735637664795, "lr": 0.00028701806572189727, "tps": 721227, "wall": 1106.3} {"step": 12175, "train_loss": 3.5454940795898438, "lr": 0.00028700028473797526, "tps": 717588, "wall": 1112.0} {"step": 12176, "train_loss": 3.4137303829193115, "lr": 0.00028698250299507037, "tps": 714045, "wall": 1117.6} {"step": 12177, "train_loss": 3.437636137008667, "lr": 0.0002869647204933841, "tps": 710581, "wall": 1123.2} {"step": 12178, "train_loss": 3.431105375289917, "lr": 0.0002869469372331178, "tps": 707113, "wall": 1128.8} {"step": 12179, "train_loss": 3.4107046127319336, "lr": 0.00028692915321447296, "tps": 703669, "wall": 1134.4} {"step": 12180, "train_loss": 3.3348987102508545, "lr": 0.0002869113684376511, "tps": 700316, "wall": 1139.9} {"step": 12181, "train_loss": 3.504734992980957, "lr": 0.0002868935829028536, "tps": 697025, "wall": 1145.4} {"step": 12182, "train_loss": 3.3803606033325195, "lr": 0.000286875796610282, "tps": 693770, "wall": 1150.8} {"step": 12183, "train_loss": 3.4921066761016846, "lr": 0.00028685800956013775, "tps": 690550, "wall": 1156.3} {"step": 12184, "train_loss": 3.447777271270752, "lr": 0.00028684022175262235, "tps": 687309, "wall": 1161.9} {"step": 12185, "train_loss": 3.473037004470825, "lr": 0.0002868224331879373, "tps": 684137, "wall": 1167.3} {"step": 12186, "train_loss": 3.5326991081237793, "lr": 0.0002868046438662841, "tps": 680960, "wall": 1172.9} {"step": 12187, "train_loss": 3.469989538192749, "lr": 0.00028678685378786433, "tps": 677848, "wall": 1178.4} {"step": 12188, "train_loss": 3.4900646209716797, "lr": 0.00028676906295287943, "tps": 674791, "wall": 1183.8} {"step": 12189, "train_loss": 3.4715025424957275, "lr": 0.000286751271361531, "tps": 671748, "wall": 1189.3} {"step": 12190, "train_loss": 3.320659875869751, "lr": 0.00028673347901402046, "tps": 668752, "wall": 1194.7} {"step": 12191, "train_loss": 3.5695905685424805, "lr": 0.00028671568591054954, "tps": 665777, "wall": 1200.1} {"step": 12192, "train_loss": 3.3502249717712402, "lr": 0.00028669789205131973, "tps": 662824, "wall": 1205.6} {"step": 12193, "train_loss": 3.3176064491271973, "lr": 0.00028668009743653257, "tps": 659908, "wall": 1211.0} {"step": 12194, "train_loss": 3.416459798812866, "lr": 0.00028666230206638967, "tps": 656980, "wall": 1216.5} {"step": 12195, "train_loss": 3.42598032951355, "lr": 0.0002866445059410926, "tps": 654102, "wall": 1221.9} {"step": 12196, "train_loss": 3.474483013153076, "lr": 0.0002866267090608429, "tps": 651230, "wall": 1227.4} {"step": 12197, "train_loss": 3.3429253101348877, "lr": 0.00028660891142584234, "tps": 648343, "wall": 1233.0} {"step": 12198, "train_loss": 3.4293200969696045, "lr": 0.0002865911130362924, "tps": 645548, "wall": 1238.4} {"step": 12199, "train_loss": 3.5044960975646973, "lr": 0.0002865733138923947, "tps": 642771, "wall": 1243.9} {"step": 12200, "train_loss": 3.500293254852295, "lr": 0.0002865555139943509, "tps": 640015, "wall": 1249.4} {"step": 12201, "train_loss": 3.499183177947998, "lr": 0.0002865377133423627, "tps": 637290, "wall": 1254.8} {"step": 12202, "train_loss": 3.454733371734619, "lr": 0.00028651991193663157, "tps": 634585, "wall": 1260.2} {"step": 12203, "train_loss": 3.44989013671875, "lr": 0.00028650210977735935, "tps": 631897, "wall": 1265.7} {"step": 12204, "train_loss": 3.353250741958618, "lr": 0.0002864843068647476, "tps": 629242, "wall": 1271.2} {"step": 12205, "train_loss": 3.3843178749084473, "lr": 0.000286466503198998, "tps": 626609, "wall": 1276.6} {"step": 12206, "train_loss": 3.465480327606201, "lr": 0.0002864486987803124, "tps": 623986, "wall": 1282.1} {"step": 12207, "train_loss": 3.4013195037841797, "lr": 0.0002864308936088922, "tps": 621329, "wall": 1287.7} {"step": 12208, "train_loss": 3.3573102951049805, "lr": 0.0002864130876849393, "tps": 618746, "wall": 1293.1} {"step": 12209, "train_loss": 3.458956718444824, "lr": 0.00028639528100865536, "tps": 616189, "wall": 1298.6} {"step": 12210, "train_loss": 3.3434677124023438, "lr": 0.000286377473580242, "tps": 613653, "wall": 1304.1} {"step": 12211, "train_loss": 3.3964788913726807, "lr": 0.0002863596653999011, "tps": 611134, "wall": 1309.6} {"step": 12212, "train_loss": 3.380404472351074, "lr": 0.00028634185646783433, "tps": 608635, "wall": 1315.1} {"step": 12213, "train_loss": 3.4365310668945312, "lr": 0.0002863240467842434, "tps": 606177, "wall": 1320.5} {"step": 12214, "train_loss": 3.4182815551757812, "lr": 0.0002863062363493301, "tps": 603741, "wall": 1325.9} {"step": 12215, "train_loss": 3.4865498542785645, "lr": 0.00028628842516329616, "tps": 601322, "wall": 1331.4} {"step": 12216, "train_loss": 3.4634077548980713, "lr": 0.0002862706132263434, "tps": 598902, "wall": 1336.9} {"step": 12217, "train_loss": 3.399332284927368, "lr": 0.0002862528005386734, "tps": 596507, "wall": 1342.3} {"step": 12218, "train_loss": 3.40710186958313, "lr": 0.0002862349871004882, "tps": 594112, "wall": 1347.9} {"step": 12219, "train_loss": 3.385737895965576, "lr": 0.00028621717291198943, "tps": 591774, "wall": 1353.3} {"step": 12220, "train_loss": 3.501518964767456, "lr": 0.000286199357973379, "tps": 589448, "wall": 1358.8} {"step": 12221, "train_loss": 3.4327738285064697, "lr": 0.0002861815422848587, "tps": 587130, "wall": 1364.2} {"step": 12222, "train_loss": 3.5178327560424805, "lr": 0.00028616372584663023, "tps": 584840, "wall": 1369.7} {"step": 12223, "train_loss": 3.4578213691711426, "lr": 0.00028614590865889554, "tps": 582563, "wall": 1375.2} {"step": 12224, "train_loss": 3.4894046783447266, "lr": 0.0002861280907218564, "tps": 580306, "wall": 1380.6} {"step": 12225, "train_loss": 3.5263257026672363, "lr": 0.00028611027203571466, "tps": 578064, "wall": 1386.1} {"step": 12226, "train_loss": 3.411447763442993, "lr": 0.0002860924526006722, "tps": 575829, "wall": 1391.6} {"step": 12227, "train_loss": 3.3341808319091797, "lr": 0.0002860746324169308, "tps": 573629, "wall": 1397.0} {"step": 12228, "train_loss": 3.4666123390197754, "lr": 0.00028605681148469246, "tps": 571438, "wall": 1402.5} {"step": 12229, "train_loss": 3.5060038566589355, "lr": 0.00028603898980415895, "tps": 569230, "wall": 1408.0} {"step": 12230, "train_loss": 3.372812509536743, "lr": 0.00028602116737553223, "tps": 567077, "wall": 1413.5} {"step": 12231, "train_loss": 3.4185357093811035, "lr": 0.00028600334419901413, "tps": 564932, "wall": 1419.0} {"step": 12232, "train_loss": 3.360780954360962, "lr": 0.0002859855202748065, "tps": 562802, "wall": 1424.5} {"step": 12233, "train_loss": 3.428384304046631, "lr": 0.0002859676956031115, "tps": 560713, "wall": 1429.9} {"step": 12234, "train_loss": 3.524355173110962, "lr": 0.0002859498701841308, "tps": 558623, "wall": 1435.4} {"step": 12235, "train_loss": 3.3897275924682617, "lr": 0.0002859320440180663, "tps": 556552, "wall": 1440.8} {"step": 12236, "train_loss": 3.4038047790527344, "lr": 0.00028591421710512014, "tps": 554490, "wall": 1446.3} {"step": 12237, "train_loss": 3.468186616897583, "lr": 0.00028589638944549414, "tps": 552463, "wall": 1451.7} {"step": 12238, "train_loss": 3.4868030548095703, "lr": 0.00028587856103939023, "tps": 550415, "wall": 1457.3} {"step": 12239, "train_loss": 3.3900985717773438, "lr": 0.0002858607318870105, "tps": 548405, "wall": 1462.7} {"step": 12240, "train_loss": 3.459831476211548, "lr": 0.00028584290198855683, "tps": 546376, "wall": 1468.3} {"step": 12241, "train_loss": 3.397031307220459, "lr": 0.00028582507134423116, "tps": 544402, "wall": 1473.7} {"step": 12242, "train_loss": 3.4442527294158936, "lr": 0.0002858072399542355, "tps": 542429, "wall": 1479.2} {"step": 12243, "train_loss": 3.458944797515869, "lr": 0.00028578940781877197, "tps": 540482, "wall": 1484.6} {"step": 12244, "train_loss": 3.414418935775757, "lr": 0.00028577157493804236, "tps": 538530, "wall": 1490.1} {"step": 12245, "train_loss": 3.4855635166168213, "lr": 0.00028575374131224876, "tps": 536600, "wall": 1495.6} {"step": 12246, "train_loss": 3.4374215602874756, "lr": 0.0002857359069415933, "tps": 534691, "wall": 1501.1} {"step": 12247, "train_loss": 3.463728427886963, "lr": 0.00028571807182627796, "tps": 532805, "wall": 1506.5} {"step": 12248, "train_loss": 3.3771159648895264, "lr": 0.00028570023596650475, "tps": 530927, "wall": 1512.0} {"step": 12249, "train_loss": 3.4742541313171387, "lr": 0.00028568239936247565, "tps": 529068, "wall": 1517.4} {"step": 12250, "train_loss": 3.474985361099243, "lr": 0.0002856645620143928, "tps": 527214, "wall": 1522.9} {"step": 12251, "train_loss": 3.3733577728271484, "lr": 0.0002856467239224582, "tps": 525349, "wall": 1528.4} {"step": 12252, "train_loss": 3.337721109390259, "lr": 0.00028562888508687403, "tps": 523526, "wall": 1533.9} {"step": 12253, "train_loss": 3.423600196838379, "lr": 0.00028561104550784225, "tps": 521718, "wall": 1539.3} {"step": 12254, "train_loss": 3.4951863288879395, "lr": 0.00028559320518556505, "tps": 519922, "wall": 1544.7} {"step": 12255, "train_loss": 3.49100399017334, "lr": 0.00028557536412024436, "tps": 518145, "wall": 1550.2} {"step": 12256, "train_loss": 3.5145955085754395, "lr": 0.0002855575223120825, "tps": 516369, "wall": 1555.6} {"step": 12257, "train_loss": 3.3687081336975098, "lr": 0.00028553967976128146, "tps": 514604, "wall": 1561.1} {"step": 12258, "train_loss": 3.4499711990356445, "lr": 0.0002855218364680434, "tps": 512839, "wall": 1566.6} {"step": 12259, "train_loss": 3.50293231010437, "lr": 0.0002855039924325704, "tps": 511099, "wall": 1572.0} {"step": 12260, "train_loss": 3.2996625900268555, "lr": 0.0002854861476550646, "tps": 509365, "wall": 1577.5} {"step": 12261, "train_loss": 3.3833200931549072, "lr": 0.00028546830213572826, "tps": 507648, "wall": 1583.0} {"step": 12262, "train_loss": 3.481703758239746, "lr": 0.0002854504558747634, "tps": 505907, "wall": 1588.6} {"step": 12263, "train_loss": 3.5382792949676514, "lr": 0.00028543260887237224, "tps": 504229, "wall": 1594.0} {"step": 12264, "train_loss": 3.47031831741333, "lr": 0.0002854147611287569, "tps": 502548, "wall": 1599.4} {"step": 12265, "train_loss": 3.2782371044158936, "lr": 0.0002853969126441197, "tps": 500885, "wall": 1604.9} {"step": 12266, "train_loss": 3.377080202102661, "lr": 0.0002853790634186627, "tps": 499240, "wall": 1610.3} {"step": 12267, "train_loss": 3.4174466133117676, "lr": 0.00028536121345258816, "tps": 497611, "wall": 1615.7} {"step": 12268, "train_loss": 3.4892780780792236, "lr": 0.0002853433627460982, "tps": 495977, "wall": 1621.2} {"step": 12269, "train_loss": 3.409679889678955, "lr": 0.0002853255112993951, "tps": 494369, "wall": 1626.6} {"step": 12270, "train_loss": 3.4568142890930176, "lr": 0.00028530765911268104, "tps": 492761, "wall": 1632.0} {"step": 12271, "train_loss": 3.4221038818359375, "lr": 0.00028528980618615834, "tps": 491166, "wall": 1637.4} {"step": 12272, "train_loss": 3.453937530517578, "lr": 0.00028527195252002924, "tps": 489585, "wall": 1642.9} {"step": 12273, "train_loss": 3.3836255073547363, "lr": 0.00028525409811449583, "tps": 488000, "wall": 1648.3} {"step": 12274, "train_loss": 3.5322160720825195, "lr": 0.0002852362429697605, "tps": 486434, "wall": 1653.8} {"step": 12275, "train_loss": 3.410677433013916, "lr": 0.0002852183870860255, "tps": 484882, "wall": 1659.2} {"step": 12276, "train_loss": 3.412303924560547, "lr": 0.00028520053046349306, "tps": 483341, "wall": 1664.6} {"step": 12277, "train_loss": 3.4543888568878174, "lr": 0.00028518267310236544, "tps": 481809, "wall": 1670.1} {"step": 12278, "train_loss": 3.442234992980957, "lr": 0.0002851648150028451, "tps": 480287, "wall": 1675.5} {"step": 12279, "train_loss": 3.477848529815674, "lr": 0.0002851469561651341, "tps": 478781, "wall": 1680.9} {"step": 12280, "train_loss": 3.5055837631225586, "lr": 0.00028512909658943487, "tps": 477283, "wall": 1686.3} {"step": 12281, "train_loss": 3.4002537727355957, "lr": 0.0002851112362759497, "tps": 475799, "wall": 1691.7} {"step": 12282, "train_loss": 3.425506114959717, "lr": 0.000285093375224881, "tps": 474321, "wall": 1697.1} {"step": 12283, "train_loss": 3.3620455265045166, "lr": 0.00028507551343643093, "tps": 472845, "wall": 1702.6} {"step": 12284, "train_loss": 3.4575657844543457, "lr": 0.000285057650910802, "tps": 471361, "wall": 1708.1} {"step": 12285, "train_loss": 3.4394009113311768, "lr": 0.00028503978764819645, "tps": 469915, "wall": 1713.4} {"step": 12286, "train_loss": 3.468374490737915, "lr": 0.00028502192364881666, "tps": 468464, "wall": 1718.9} {"step": 12287, "train_loss": 3.4388427734375, "lr": 0.000285004058912865, "tps": 467026, "wall": 1724.3} {"step": 12288, "train_loss": 3.42155385017395, "lr": 0.0002849861934405439, "tps": 465603, "wall": 1729.7} {"step": 12289, "train_loss": 3.3753905296325684, "lr": 0.00028496832723205555, "tps": 464184, "wall": 1735.2} {"step": 12290, "train_loss": 3.445572853088379, "lr": 0.0002849504602876026, "tps": 462765, "wall": 1740.6} {"step": 12291, "train_loss": 3.531686305999756, "lr": 0.0002849325926073873, "tps": 461366, "wall": 1746.0} {"step": 12292, "train_loss": 3.3998026847839355, "lr": 0.00028491472419161205, "tps": 459950, "wall": 1751.6} {"step": 12293, "train_loss": 3.4472928047180176, "lr": 0.0002848968550404793, "tps": 458576, "wall": 1757.0} {"step": 12294, "train_loss": 3.448909282684326, "lr": 0.00028487898515419153, "tps": 457204, "wall": 1762.4} {"step": 12295, "train_loss": 3.4094109535217285, "lr": 0.000284861114532951, "tps": 455801, "wall": 1767.9} {"step": 12296, "train_loss": 3.4396111965179443, "lr": 0.0002848432431769603, "tps": 454438, "wall": 1773.4} {"step": 12297, "train_loss": 3.459805488586426, "lr": 0.00028482537108642184, "tps": 453085, "wall": 1778.8} {"step": 12298, "train_loss": 3.5108726024627686, "lr": 0.0002848074982615381, "tps": 451738, "wall": 1784.3} {"step": 12299, "train_loss": 3.5279979705810547, "lr": 0.00028478962470251143, "tps": 450408, "wall": 1789.7} {"step": 12300, "train_loss": 3.3415918350219727, "lr": 0.0002847717504095444, "tps": 449080, "wall": 1795.1} {"step": 12301, "train_loss": 3.4982237815856934, "lr": 0.0002847538753828396, "tps": 447765, "wall": 1800.5} {"step": 12302, "train_loss": 3.4202523231506348, "lr": 0.00028473599962259926, "tps": 446453, "wall": 1806.0} {"step": 12303, "train_loss": 3.4061005115509033, "lr": 0.00028471812312902607, "tps": 445147, "wall": 1811.4} {"step": 12304, "train_loss": 3.380869150161743, "lr": 0.0002847002459023224, "tps": 443856, "wall": 1816.9} {"step": 12305, "train_loss": 3.396056890487671, "lr": 0.000284682367942691, "tps": 442565, "wall": 1822.3} {"step": 12306, "train_loss": 3.392422914505005, "lr": 0.00028466448925033416, "tps": 441278, "wall": 1827.8} {"step": 12307, "train_loss": 3.3848917484283447, "lr": 0.0002846466098254544, "tps": 440001, "wall": 1833.2} {"step": 12308, "train_loss": 3.4161388874053955, "lr": 0.00028462872966825446, "tps": 438740, "wall": 1838.6} {"step": 12309, "train_loss": 3.381166934967041, "lr": 0.00028461084877893676, "tps": 437492, "wall": 1844.0} {"step": 12310, "train_loss": 3.3163342475891113, "lr": 0.0002845929671577039, "tps": 436248, "wall": 1849.4} {"step": 12311, "train_loss": 3.438647985458374, "lr": 0.00028457508480475834, "tps": 435010, "wall": 1854.8} {"step": 12312, "train_loss": 3.4491968154907227, "lr": 0.00028455720172030274, "tps": 433776, "wall": 1860.3} {"step": 12313, "train_loss": 3.5050652027130127, "lr": 0.00028453931790453966, "tps": 432553, "wall": 1865.7} {"step": 12314, "train_loss": 3.5058279037475586, "lr": 0.00028452143335767167, "tps": 431339, "wall": 1871.1} {"step": 12315, "train_loss": 3.448775291442871, "lr": 0.00028450354807990153, "tps": 430131, "wall": 1876.5} {"step": 12316, "train_loss": 3.3689115047454834, "lr": 0.00028448566207143154, "tps": 428928, "wall": 1881.9} {"step": 12317, "train_loss": 3.431004762649536, "lr": 0.0002844677753324645, "tps": 427715, "wall": 1887.4} {"step": 12318, "train_loss": 3.355933427810669, "lr": 0.00028444988786320314, "tps": 426514, "wall": 1892.9} {"step": 12319, "train_loss": 3.4280850887298584, "lr": 0.0002844319996638499, "tps": 425339, "wall": 1898.3} {"step": 12320, "train_loss": 3.352694511413574, "lr": 0.00028441411073460744, "tps": 424160, "wall": 1903.7} {"step": 12321, "train_loss": 3.504103183746338, "lr": 0.0002843962210756785, "tps": 422996, "wall": 1909.1} {"step": 12322, "train_loss": 3.431084156036377, "lr": 0.0002843783306872657, "tps": 421839, "wall": 1914.5} {"step": 12323, "train_loss": 3.391554117202759, "lr": 0.0002843604395695716, "tps": 420672, "wall": 1919.9} {"step": 12324, "train_loss": 3.3376917839050293, "lr": 0.000284342547722799, "tps": 419517, "wall": 1925.4} {"step": 12325, "train_loss": 3.4011032581329346, "lr": 0.0002843246551471506, "tps": 418378, "wall": 1930.8} {"step": 12326, "train_loss": 3.4712843894958496, "lr": 0.0002843067618428289, "tps": 417233, "wall": 1936.2} {"step": 12327, "train_loss": 3.540187358856201, "lr": 0.00028428886781003683, "tps": 416102, "wall": 1941.7} {"step": 12328, "train_loss": 3.3941071033477783, "lr": 0.000284270973048977, "tps": 414972, "wall": 1947.1} {"step": 12329, "train_loss": 3.362124443054199, "lr": 0.0002842530775598521, "tps": 413828, "wall": 1952.6} {"step": 12330, "train_loss": 3.4041528701782227, "lr": 0.00028423518134286475, "tps": 412707, "wall": 1958.1} {"step": 12331, "train_loss": 3.506923198699951, "lr": 0.0002842172843982179, "tps": 411597, "wall": 1963.5} {"step": 12332, "train_loss": 3.364197015762329, "lr": 0.00028419938672611414, "tps": 410494, "wall": 1969.0} {"step": 12333, "train_loss": 3.3930649757385254, "lr": 0.00028418148832675625, "tps": 409402, "wall": 1974.4} {"step": 12334, "train_loss": 3.351560592651367, "lr": 0.00028416358920034697, "tps": 408321, "wall": 1979.8} {"step": 12335, "train_loss": 3.5278286933898926, "lr": 0.00028414568934708915, "tps": 407235, "wall": 1985.2} {"step": 12336, "train_loss": 3.422752618789673, "lr": 0.0002841277887671855, "tps": 406154, "wall": 1990.7} {"step": 12337, "train_loss": 3.473660707473755, "lr": 0.0002841098874608387, "tps": 405077, "wall": 1996.1} {"step": 12338, "train_loss": 3.4812450408935547, "lr": 0.00028409198542825163, "tps": 404008, "wall": 2001.6} {"step": 12339, "train_loss": 3.377864122390747, "lr": 0.00028407408266962716, "tps": 402956, "wall": 2006.9} {"step": 12340, "train_loss": 3.392691135406494, "lr": 0.00028405617918516793, "tps": 401886, "wall": 2012.5} {"step": 12341, "train_loss": 3.406704902648926, "lr": 0.0002840382749750769, "tps": 400836, "wall": 2017.9} {"step": 12342, "train_loss": 3.6771445274353027, "lr": 0.00028402037003955684, "tps": 399792, "wall": 2023.3} {"step": 12343, "train_loss": 3.4322049617767334, "lr": 0.0002840024643788105, "tps": 398758, "wall": 2028.7} {"step": 12344, "train_loss": 3.4219532012939453, "lr": 0.0002839845579930408, "tps": 397722, "wall": 2034.2} {"step": 12345, "train_loss": 3.399510145187378, "lr": 0.0002839666508824506, "tps": 396697, "wall": 2039.6} {"step": 12346, "train_loss": 3.4179224967956543, "lr": 0.0002839487430472427, "tps": 395675, "wall": 2045.0} {"step": 12347, "train_loss": 3.4561057090759277, "lr": 0.00028393083448762, "tps": 394666, "wall": 2050.4} {"step": 12348, "train_loss": 3.382100820541382, "lr": 0.0002839129252037853, "tps": 393664, "wall": 2055.8} {"step": 12349, "train_loss": 3.4077446460723877, "lr": 0.0002838950151959416, "tps": 392660, "wall": 2061.2} {"step": 12350, "train_loss": 3.358180046081543, "lr": 0.00028387710446429163, "tps": 391660, "wall": 2066.7} {"step": 12351, "train_loss": 3.499915361404419, "lr": 0.00028385919300903835, "tps": 390652, "wall": 2072.2} {"step": 12352, "train_loss": 3.393805503845215, "lr": 0.0002838412808303847, "tps": 389669, "wall": 2077.6} {"step": 12353, "train_loss": 3.4929587841033936, "lr": 0.00028382336792853366, "tps": 388681, "wall": 2083.0} {"step": 12354, "train_loss": 3.470618724822998, "lr": 0.00028380545430368797, "tps": 387703, "wall": 2088.4} {"step": 12355, "train_loss": 3.505099058151245, "lr": 0.00028378753995605065, "tps": 386728, "wall": 2093.9} {"step": 12356, "train_loss": 3.3498659133911133, "lr": 0.00028376962488582463, "tps": 385754, "wall": 2099.3} {"step": 12357, "train_loss": 3.4166312217712402, "lr": 0.00028375170909321286, "tps": 384798, "wall": 2104.7} {"step": 12358, "train_loss": 3.428823947906494, "lr": 0.0002837337925784183, "tps": 383848, "wall": 2110.1} {"step": 12359, "train_loss": 3.40307354927063, "lr": 0.00028371587534164387, "tps": 382900, "wall": 2115.5} {"step": 12360, "train_loss": 3.4166347980499268, "lr": 0.0002836979573830925, "tps": 381954, "wall": 2120.9} {"step": 12361, "train_loss": 3.4057371616363525, "lr": 0.0002836800387029673, "tps": 381006, "wall": 2126.4} {"step": 12362, "train_loss": 3.486762046813965, "lr": 0.00028366211930147116, "tps": 380060, "wall": 2131.8} {"step": 12363, "train_loss": 3.352194309234619, "lr": 0.00028364419917880707, "tps": 379126, "wall": 2137.2} {"step": 12364, "train_loss": 3.3919010162353516, "lr": 0.0002836262783351781, "tps": 378200, "wall": 2142.7} {"step": 12365, "train_loss": 3.4539294242858887, "lr": 0.0002836083567707871, "tps": 377274, "wall": 2148.1} {"step": 12366, "train_loss": 3.3735971450805664, "lr": 0.0002835904344858373, "tps": 376357, "wall": 2153.5} {"step": 12367, "train_loss": 3.544454336166382, "lr": 0.00028357251148053154, "tps": 375446, "wall": 2158.9} {"step": 12368, "train_loss": 3.262437343597412, "lr": 0.00028355458775507295, "tps": 374541, "wall": 2164.3} {"step": 12369, "train_loss": 3.376555919647217, "lr": 0.0002835366633096646, "tps": 373638, "wall": 2169.7} {"step": 12370, "train_loss": 3.286130905151367, "lr": 0.00028351873814450946, "tps": 372736, "wall": 2175.1} {"step": 12371, "train_loss": 3.387481927871704, "lr": 0.0002835008122598106, "tps": 371832, "wall": 2180.6} {"step": 12372, "train_loss": 3.2940080165863037, "lr": 0.0002834828856557711, "tps": 370809, "wall": 2186.8} {"step": 12373, "train_loss": 3.4263994693756104, "lr": 0.0002834649583325941, "tps": 369877, "wall": 2192.5} {"step": 12374, "train_loss": 3.323949098587036, "lr": 0.00028344703029048256, "tps": 368985, "wall": 2197.9} {"step": 12375, "train_loss": 3.32637095451355, "lr": 0.0002834291015296396, "tps": 368111, "wall": 2203.3} {"step": 12376, "train_loss": 3.477609634399414, "lr": 0.0002834111720502684, "tps": 367237, "wall": 2208.8} {"step": 12377, "train_loss": 3.468738555908203, "lr": 0.00028339324185257204, "tps": 366369, "wall": 2214.2} {"step": 12378, "train_loss": 3.4914538860321045, "lr": 0.00028337531093675355, "tps": 365508, "wall": 2219.6} {"step": 12379, "train_loss": 3.451010227203369, "lr": 0.0002833573793030161, "tps": 364645, "wall": 2225.0} {"step": 12380, "train_loss": 3.5367259979248047, "lr": 0.0002833394469515629, "tps": 363784, "wall": 2230.4} {"step": 12381, "train_loss": 3.3327012062072754, "lr": 0.00028332151388259696, "tps": 362928, "wall": 2235.9} {"step": 12382, "train_loss": 3.4369893074035645, "lr": 0.00028330358009632145, "tps": 362084, "wall": 2241.3} {"step": 12383, "train_loss": 3.448607921600342, "lr": 0.00028328564559293966, "tps": 361241, "wall": 2246.7} {"step": 12384, "train_loss": 3.4348630905151367, "lr": 0.0002832677103726546, "tps": 360388, "wall": 2252.2} {"step": 12385, "train_loss": 3.3397912979125977, "lr": 0.0002832497744356695, "tps": 359549, "wall": 2257.6} {"step": 12386, "train_loss": 3.4266197681427, "lr": 0.00028323183778218754, "tps": 358717, "wall": 2263.0} {"step": 12387, "train_loss": 3.4166080951690674, "lr": 0.00028321390041241194, "tps": 357886, "wall": 2268.5} {"step": 12388, "train_loss": 3.4276552200317383, "lr": 0.00028319596232654574, "tps": 357063, "wall": 2273.9} {"step": 12389, "train_loss": 3.359251022338867, "lr": 0.0002831780235247924, "tps": 356243, "wall": 2279.3} {"step": 12390, "train_loss": 3.498504400253296, "lr": 0.00028316008400735486, "tps": 355426, "wall": 2284.7} {"step": 12391, "train_loss": 3.4981093406677246, "lr": 0.00028314214377443654, "tps": 354619, "wall": 2290.1} {"step": 12392, "train_loss": 3.466092109680176, "lr": 0.00028312420282624055, "tps": 353805, "wall": 2295.6} {"step": 12393, "train_loss": 3.3620967864990234, "lr": 0.0002831062611629703, "tps": 353006, "wall": 2301.0} {"step": 12394, "train_loss": 3.4146666526794434, "lr": 0.0002830883187848288, "tps": 352212, "wall": 2306.3} {"step": 12395, "train_loss": 3.493577480316162, "lr": 0.00028307037569201944, "tps": 351400, "wall": 2311.8} {"step": 12396, "train_loss": 3.401937961578369, "lr": 0.0002830524318847454, "tps": 350605, "wall": 2317.3} {"step": 12397, "train_loss": 3.4592666625976562, "lr": 0.00028303448736321005, "tps": 349813, "wall": 2322.7} {"step": 12398, "train_loss": 3.439655303955078, "lr": 0.00028301654212761664, "tps": 349029, "wall": 2328.1} {"step": 12399, "train_loss": 3.4513843059539795, "lr": 0.0002829985961781684, "tps": 348245, "wall": 2333.5} {"step": 12400, "train_loss": 3.3425328731536865, "lr": 0.0002829806495150687, "tps": 347468, "wall": 2339.0} {"step": 12401, "train_loss": 3.4261362552642822, "lr": 0.00028296270213852077, "tps": 346692, "wall": 2344.4} {"step": 12402, "train_loss": 3.4290080070495605, "lr": 0.0002829447540487279, "tps": 345923, "wall": 2349.8} {"step": 12403, "train_loss": 3.4655003547668457, "lr": 0.0002829268052458935, "tps": 345162, "wall": 2355.1} {"step": 12404, "train_loss": 3.522651195526123, "lr": 0.0002829088557302208, "tps": 344398, "wall": 2360.6} {"step": 12405, "train_loss": 3.4070444107055664, "lr": 0.00028289090550191325, "tps": 343641, "wall": 2366.0} {"step": 12406, "train_loss": 3.4812116622924805, "lr": 0.00028287295456117407, "tps": 342874, "wall": 2371.4} {"step": 12407, "train_loss": 3.3748316764831543, "lr": 0.00028285500290820665, "tps": 342123, "wall": 2376.8} {"step": 12408, "train_loss": 3.4722089767456055, "lr": 0.0002828370505432144, "tps": 341375, "wall": 2382.2} {"step": 12409, "train_loss": 3.49064564704895, "lr": 0.0002828190974664006, "tps": 340635, "wall": 2387.6} {"step": 12410, "train_loss": 3.4170608520507812, "lr": 0.00028280114367796867, "tps": 339898, "wall": 2393.0} {"step": 12411, "train_loss": 3.4143903255462646, "lr": 0.00028278318917812205, "tps": 339155, "wall": 2398.4} {"step": 12412, "train_loss": 3.3259310722351074, "lr": 0.00028276523396706396, "tps": 338422, "wall": 2403.8} {"step": 12413, "train_loss": 3.379411220550537, "lr": 0.000282747278044998, "tps": 337693, "wall": 2409.2} {"step": 12414, "train_loss": 3.4103493690490723, "lr": 0.00028272932141212745, "tps": 336966, "wall": 2414.6} {"step": 12415, "train_loss": 3.5336079597473145, "lr": 0.0002827113640686557, "tps": 336245, "wall": 2419.9} {"step": 12416, "train_loss": 3.4619030952453613, "lr": 0.00028269340601478623, "tps": 335526, "wall": 2425.3} {"step": 12417, "train_loss": 3.3541321754455566, "lr": 0.0002826754472507226, "tps": 334802, "wall": 2430.8} {"step": 12418, "train_loss": 3.3434534072875977, "lr": 0.0002826574877766679, "tps": 334085, "wall": 2436.2} {"step": 12419, "train_loss": 3.4745638370513916, "lr": 0.000282639527592826, "tps": 333374, "wall": 2441.6} {"step": 12420, "train_loss": 3.3536345958709717, "lr": 0.0002826215666994, "tps": 332665, "wall": 2447.0} {"step": 12421, "train_loss": 3.424276828765869, "lr": 0.0002826036050965936, "tps": 331960, "wall": 2452.4} {"step": 12422, "train_loss": 3.440688133239746, "lr": 0.00028258564278461006, "tps": 331249, "wall": 2457.8} {"step": 12423, "train_loss": 3.4091274738311768, "lr": 0.00028256767976365314, "tps": 330552, "wall": 2463.2} {"step": 12424, "train_loss": 3.4874675273895264, "lr": 0.000282549716033926, "tps": 329855, "wall": 2468.6} {"step": 12425, "train_loss": 3.3061256408691406, "lr": 0.00028253175159563234, "tps": 329159, "wall": 2474.0} {"step": 12426, "train_loss": 3.4306769371032715, "lr": 0.00028251378644897563, "tps": 328468, "wall": 2479.4} {"step": 12427, "train_loss": 3.523995876312256, "lr": 0.00028249582059415937, "tps": 327786, "wall": 2484.8} {"step": 12428, "train_loss": 3.4874520301818848, "lr": 0.0002824778540313871, "tps": 327091, "wall": 2490.3} {"step": 12429, "train_loss": 3.4681453704833984, "lr": 0.00028245988676086226, "tps": 326410, "wall": 2495.7} {"step": 12430, "train_loss": 3.4710586071014404, "lr": 0.0002824419187827885, "tps": 325731, "wall": 2501.1} {"step": 12431, "train_loss": 3.4193692207336426, "lr": 0.0002824239500973693, "tps": 325060, "wall": 2506.4} {"step": 12432, "train_loss": 3.3952879905700684, "lr": 0.00028240598070480816, "tps": 324382, "wall": 2511.9} {"step": 12433, "train_loss": 3.4617364406585693, "lr": 0.0002823880106053087, "tps": 323715, "wall": 2517.3} {"step": 12434, "train_loss": 3.516091823577881, "lr": 0.00028237003979907457, "tps": 323048, "wall": 2522.7} {"step": 12435, "train_loss": 3.50875186920166, "lr": 0.00028235206828630915, "tps": 322381, "wall": 2528.1} {"step": 12436, "train_loss": 3.4346041679382324, "lr": 0.00028233409606721616, "tps": 321718, "wall": 2533.5} {"step": 12437, "train_loss": 3.4741625785827637, "lr": 0.00028231612314199916, "tps": 321060, "wall": 2538.9} {"step": 12438, "train_loss": 3.4585466384887695, "lr": 0.00028229814951086175, "tps": 320405, "wall": 2544.3} {"step": 12439, "train_loss": 3.38991379737854, "lr": 0.00028228017517400756, "tps": 319742, "wall": 2549.8} {"step": 12440, "train_loss": 3.359833240509033, "lr": 0.00028226220013164013, "tps": 319092, "wall": 2555.2} {"step": 12441, "train_loss": 3.453766345977783, "lr": 0.00028224422438396314, "tps": 318444, "wall": 2560.6} {"step": 12442, "train_loss": 3.3225183486938477, "lr": 0.0002822262479311802, "tps": 317802, "wall": 2565.9} {"step": 12443, "train_loss": 3.4322474002838135, "lr": 0.000282208270773495, "tps": 317158, "wall": 2571.4} {"step": 12444, "train_loss": 3.4559874534606934, "lr": 0.00028219029291111114, "tps": 316520, "wall": 2576.8} {"step": 12445, "train_loss": 3.380164861679077, "lr": 0.0002821723143442322, "tps": 315883, "wall": 2582.2} {"step": 12446, "train_loss": 3.4572577476501465, "lr": 0.00028215433507306197, "tps": 315251, "wall": 2587.5} {"step": 12447, "train_loss": 3.415703773498535, "lr": 0.0002821363550978041, "tps": 314620, "wall": 2592.9} {"step": 12448, "train_loss": 3.492976427078247, "lr": 0.00028211837441866224, "tps": 313994, "wall": 2598.3} {"step": 12449, "train_loss": 3.4604382514953613, "lr": 0.00028210039303584, "tps": 313367, "wall": 2603.7} {"step": 12450, "train_loss": 3.3932619094848633, "lr": 0.0002820824109495412, "tps": 312735, "wall": 2609.2} {"step": 12451, "train_loss": 3.5307769775390625, "lr": 0.00028206442815996956, "tps": 312119, "wall": 2614.6} {"step": 12452, "train_loss": 3.480916976928711, "lr": 0.0002820464446673286, "tps": 311503, "wall": 2619.9} {"step": 12453, "train_loss": 3.4389572143554688, "lr": 0.00028202846047182216, "tps": 310890, "wall": 2625.3} {"step": 12454, "train_loss": 3.440885066986084, "lr": 0.000282010475573654, "tps": 310278, "wall": 2630.7} {"step": 12455, "train_loss": 3.5646910667419434, "lr": 0.0002819924899730278, "tps": 309669, "wall": 2636.1} {"step": 12456, "train_loss": 3.447880983352661, "lr": 0.00028197450367014736, "tps": 309060, "wall": 2641.5} {"step": 12457, "train_loss": 3.4549670219421387, "lr": 0.0002819565166652164, "tps": 308455, "wall": 2646.9} {"step": 12458, "train_loss": 3.36787486076355, "lr": 0.0002819385289584387, "tps": 307843, "wall": 2652.4} {"step": 12459, "train_loss": 3.3624634742736816, "lr": 0.0002819205405500179, "tps": 307244, "wall": 2657.8} {"step": 12460, "train_loss": 3.3717339038848877, "lr": 0.00028190255144015786, "tps": 306649, "wall": 2663.1} {"step": 12461, "train_loss": 3.38424015045166, "lr": 0.00028188456162906247, "tps": 306035, "wall": 2668.7} {"step": 12462, "train_loss": 3.3596928119659424, "lr": 0.00028186657111693535, "tps": 305446, "wall": 2674.0} {"step": 12463, "train_loss": 3.388843536376953, "lr": 0.0002818485799039804, "tps": 304859, "wall": 2679.4} {"step": 12464, "train_loss": 3.326599597930908, "lr": 0.00028183058799040127, "tps": 304273, "wall": 2684.8} {"step": 12465, "train_loss": 3.445981502532959, "lr": 0.00028181259537640203, "tps": 303689, "wall": 2690.2} {"step": 12466, "train_loss": 3.441967248916626, "lr": 0.0002817946020621863, "tps": 303103, "wall": 2695.6} {"step": 12467, "train_loss": 3.4084861278533936, "lr": 0.000281776608047958, "tps": 302523, "wall": 2701.0} {"step": 12468, "train_loss": 3.468538284301758, "lr": 0.000281758613333921, "tps": 301939, "wall": 2706.4} {"step": 12469, "train_loss": 3.4444632530212402, "lr": 0.00028174061792027896, "tps": 301362, "wall": 2711.8} {"step": 12470, "train_loss": 3.4400928020477295, "lr": 0.00028172262180723595, "tps": 300783, "wall": 2717.2} {"step": 12471, "train_loss": 3.3654675483703613, "lr": 0.0002817046249949958, "tps": 300211, "wall": 2722.6} {"step": 12472, "train_loss": 3.4863991737365723, "lr": 0.0002816866274837622, "tps": 299632, "wall": 2728.1} {"step": 12473, "train_loss": 3.4107184410095215, "lr": 0.00028166862927373913, "tps": 299068, "wall": 2733.5} {"step": 12474, "train_loss": 3.413268566131592, "lr": 0.0002816506303651306, "tps": 298506, "wall": 2738.8} {"step": 12475, "train_loss": 3.3881123065948486, "lr": 0.0002816326307581403, "tps": 297943, "wall": 2744.2} {"step": 12476, "train_loss": 3.4716899394989014, "lr": 0.0002816146304529723, "tps": 297383, "wall": 2749.6} {"step": 12477, "train_loss": 3.4659814834594727, "lr": 0.00028159662944983037, "tps": 296826, "wall": 2755.0} {"step": 12478, "train_loss": 3.3841006755828857, "lr": 0.00028157862774891854, "tps": 296266, "wall": 2760.4} {"step": 12479, "train_loss": 3.4712026119232178, "lr": 0.0002815606253504407, "tps": 295711, "wall": 2765.8} {"step": 12480, "train_loss": 3.411067485809326, "lr": 0.0002815426222546007, "tps": 295159, "wall": 2771.2} {"step": 12481, "train_loss": 3.3965096473693848, "lr": 0.0002815246184616025, "tps": 294610, "wall": 2776.6} {"step": 12482, "train_loss": 3.3480539321899414, "lr": 0.0002815066139716502, "tps": 294064, "wall": 2782.0} {"step": 12483, "train_loss": 3.5526418685913086, "lr": 0.0002814886087849476, "tps": 293518, "wall": 2787.4} {"step": 12484, "train_loss": 3.4170289039611816, "lr": 0.00028147060290169875, "tps": 292971, "wall": 2792.8} {"step": 12485, "train_loss": 3.322906732559204, "lr": 0.00028145259632210754, "tps": 292428, "wall": 2798.2} {"step": 12486, "train_loss": 3.4252121448516846, "lr": 0.00028143458904637803, "tps": 291890, "wall": 2803.6} {"step": 12487, "train_loss": 3.47049617767334, "lr": 0.00028141658107471416, "tps": 291353, "wall": 2809.0} {"step": 12488, "train_loss": 3.4660840034484863, "lr": 0.0002813985724073199, "tps": 290816, "wall": 2814.4} {"step": 12489, "train_loss": 3.521993637084961, "lr": 0.00028138056304439937, "tps": 290282, "wall": 2819.8} {"step": 12490, "train_loss": 3.409930467605591, "lr": 0.00028136255298615644, "tps": 289752, "wall": 2825.2} {"step": 12491, "train_loss": 3.464099407196045, "lr": 0.0002813445422327952, "tps": 289228, "wall": 2830.6} {"step": 12492, "train_loss": 3.4325504302978516, "lr": 0.00028132653078451967, "tps": 288703, "wall": 2835.9} {"step": 12493, "train_loss": 3.409979820251465, "lr": 0.00028130851864153393, "tps": 288177, "wall": 2841.3} {"step": 12494, "train_loss": 3.479079484939575, "lr": 0.0002812905058040419, "tps": 287649, "wall": 2846.8} {"step": 12495, "train_loss": 3.4001290798187256, "lr": 0.0002812724922722478, "tps": 287122, "wall": 2852.2} {"step": 12496, "train_loss": 3.435988664627075, "lr": 0.00028125447804635547, "tps": 286601, "wall": 2857.6} {"step": 12497, "train_loss": 3.445317029953003, "lr": 0.00028123646312656913, "tps": 286080, "wall": 2863.1} {"step": 12498, "train_loss": 3.36997389793396, "lr": 0.0002812184475130929, "tps": 285564, "wall": 2868.5} {"step": 12499, "train_loss": 3.4387145042419434, "lr": 0.00028120043120613076, "tps": 285049, "wall": 2873.9} {"step": 12500, "train_loss": 3.419417381286621, "lr": 0.00028118241420588676, "tps": 284540, "wall": 2879.3} {"step": 12501, "train_loss": 3.508492946624756, "lr": 0.00028116439651256506, "tps": 284011, "wall": 2884.9} {"step": 12502, "train_loss": 3.402683734893799, "lr": 0.0002811463781263699, "tps": 283503, "wall": 2890.3} {"step": 12503, "train_loss": 3.3278868198394775, "lr": 0.0002811283590475051, "tps": 282999, "wall": 2895.6} {"step": 12504, "train_loss": 3.4069926738739014, "lr": 0.0002811103392761751, "tps": 282494, "wall": 2901.0} {"step": 12505, "train_loss": 3.4833459854125977, "lr": 0.0002810923188125837, "tps": 281989, "wall": 2906.5} {"step": 12506, "train_loss": 3.366926908493042, "lr": 0.0002810742976569353, "tps": 281484, "wall": 2911.9} {"step": 12507, "train_loss": 3.3291783332824707, "lr": 0.00028105627580943395, "tps": 280988, "wall": 2917.3} {"step": 12508, "train_loss": 3.236647367477417, "lr": 0.0002810382532702838, "tps": 280494, "wall": 2922.7} {"step": 12509, "train_loss": 3.467095136642456, "lr": 0.000281020230039689, "tps": 279999, "wall": 2928.1} {"step": 12510, "train_loss": 3.438403606414795, "lr": 0.0002810022061178538, "tps": 279508, "wall": 2933.4} {"step": 12511, "train_loss": 3.345351219177246, "lr": 0.0002809841815049822, "tps": 279019, "wall": 2938.8} {"step": 12512, "train_loss": 3.3789398670196533, "lr": 0.00028096615620127853, "tps": 278535, "wall": 2944.2} {"step": 12513, "train_loss": 3.5737032890319824, "lr": 0.000280948130206947, "tps": 278046, "wall": 2949.6} {"step": 12514, "train_loss": 3.4261081218719482, "lr": 0.0002809301035221917, "tps": 277561, "wall": 2955.0} {"step": 12515, "train_loss": 3.4161131381988525, "lr": 0.0002809120761472169, "tps": 277080, "wall": 2960.3} {"step": 12516, "train_loss": 3.5305888652801514, "lr": 0.00028089404808222685, "tps": 276601, "wall": 2965.7} {"step": 12517, "train_loss": 3.4125423431396484, "lr": 0.00028087601932742567, "tps": 276111, "wall": 2971.2} {"step": 12518, "train_loss": 3.452470541000366, "lr": 0.00028085798988301765, "tps": 275631, "wall": 2976.6} {"step": 12519, "train_loss": 3.4117319583892822, "lr": 0.0002808399597492071, "tps": 275157, "wall": 2982.0} {"step": 12520, "train_loss": 3.372623920440674, "lr": 0.0002808219289261981, "tps": 274685, "wall": 2987.3} {"step": 12521, "train_loss": 3.427248239517212, "lr": 0.0002808038974141951, "tps": 274210, "wall": 2992.7} {"step": 12522, "train_loss": 3.3791236877441406, "lr": 0.00028078586521340215, "tps": 273742, "wall": 2998.1} {"step": 12523, "train_loss": 3.47261118888855, "lr": 0.0002807678323240237, "tps": 273274, "wall": 3003.5} {"step": 12524, "train_loss": 3.4314138889312744, "lr": 0.0002807497987462639, "tps": 272807, "wall": 3008.9} {"step": 12525, "train_loss": 3.3851709365844727, "lr": 0.0002807317644803272, "tps": 272342, "wall": 3014.2} {"step": 12526, "train_loss": 3.326610565185547, "lr": 0.00028071372952641766, "tps": 271879, "wall": 3019.6} {"step": 12527, "train_loss": 3.443316698074341, "lr": 0.0002806956938847398, "tps": 271415, "wall": 3025.0} {"step": 12528, "train_loss": 3.308565139770508, "lr": 0.0002806776575554978, "tps": 270949, "wall": 3030.5} {"step": 12529, "train_loss": 3.314640522003174, "lr": 0.000280659620538896, "tps": 270491, "wall": 3035.8} {"step": 12530, "train_loss": 3.4598240852355957, "lr": 0.00028064158283513875, "tps": 270036, "wall": 3041.2} {"step": 12531, "train_loss": 3.402033567428589, "lr": 0.0002806235444444304, "tps": 269583, "wall": 3046.5} {"step": 12532, "train_loss": 3.4057021141052246, "lr": 0.0002806055053669752, "tps": 269129, "wall": 3051.9} {"step": 12533, "train_loss": 3.4901885986328125, "lr": 0.00028058746560297756, "tps": 268679, "wall": 3057.3} {"step": 12534, "train_loss": 3.3826303482055664, "lr": 0.00028056942515264187, "tps": 268227, "wall": 3062.7} {"step": 12535, "train_loss": 3.455686092376709, "lr": 0.0002805513840161724, "tps": 267779, "wall": 3068.0} {"step": 12536, "train_loss": 3.4105286598205566, "lr": 0.0002805333421937737, "tps": 267332, "wall": 3073.4} {"step": 12537, "train_loss": 3.5021533966064453, "lr": 0.00028051529968564995, "tps": 266883, "wall": 3078.8} {"step": 12538, "train_loss": 3.3462939262390137, "lr": 0.0002804972564920056, "tps": 266438, "wall": 3084.2} {"step": 12539, "train_loss": 3.460798740386963, "lr": 0.000280479212613045, "tps": 265988, "wall": 3089.7} {"step": 12540, "train_loss": 3.5079421997070312, "lr": 0.0002804611680489727, "tps": 265548, "wall": 3095.1} {"step": 12541, "train_loss": 3.330495595932007, "lr": 0.000280443122799993, "tps": 265108, "wall": 3100.4} {"step": 12542, "train_loss": 3.3747150897979736, "lr": 0.0002804250768663103, "tps": 264671, "wall": 3105.8} {"step": 12543, "train_loss": 3.490821123123169, "lr": 0.00028040703024812913, "tps": 264231, "wall": 3111.2} {"step": 12544, "train_loss": 3.3924765586853027, "lr": 0.00028038898294565376, "tps": 263795, "wall": 3116.6} {"step": 12545, "train_loss": 3.449094772338867, "lr": 0.0002803709349590888, "tps": 263362, "wall": 3122.0} {"step": 12546, "train_loss": 3.498021125793457, "lr": 0.0002803528862886386, "tps": 262932, "wall": 3127.3} {"step": 12547, "train_loss": 3.4403445720672607, "lr": 0.0002803348369345076, "tps": 262502, "wall": 3132.7} {"step": 12548, "train_loss": 3.408284902572632, "lr": 0.0002803167868969003, "tps": 262074, "wall": 3138.1} {"step": 12549, "train_loss": 3.3442001342773438, "lr": 0.00028029873617602124, "tps": 261647, "wall": 3143.5} {"step": 12550, "train_loss": 3.3919625282287598, "lr": 0.0002802806847720748, "tps": 261213, "wall": 3148.9} {"step": 12551, "train_loss": 3.3770081996917725, "lr": 0.00028026263268526554, "tps": 260791, "wall": 3154.3} {"step": 12552, "train_loss": 3.46154522895813, "lr": 0.00028024457991579786, "tps": 260367, "wall": 3159.7} {"step": 12553, "train_loss": 3.421818494796753, "lr": 0.00028022652646387636, "tps": 259945, "wall": 3165.0} {"step": 12554, "train_loss": 3.370420455932617, "lr": 0.00028020847232970546, "tps": 259525, "wall": 3170.4} {"step": 12555, "train_loss": 3.4098005294799805, "lr": 0.0002801904175134898, "tps": 259107, "wall": 3175.8} {"step": 12556, "train_loss": 3.4523558616638184, "lr": 0.00028017236201543377, "tps": 258688, "wall": 3181.2} {"step": 12557, "train_loss": 3.317565441131592, "lr": 0.000280154305835742, "tps": 258271, "wall": 3186.6} {"step": 12558, "train_loss": 3.2805676460266113, "lr": 0.000280136248974619, "tps": 257858, "wall": 3191.9} {"step": 12559, "train_loss": 3.438359260559082, "lr": 0.0002801181914322693, "tps": 257444, "wall": 3197.3} {"step": 12560, "train_loss": 3.323516845703125, "lr": 0.0002801001332088975, "tps": 257033, "wall": 3202.7} {"step": 12561, "train_loss": 3.4418113231658936, "lr": 0.00028008207430470813, "tps": 256615, "wall": 3208.2} {"step": 12562, "train_loss": 3.382662773132324, "lr": 0.00028006401471990575, "tps": 256207, "wall": 3213.5} {"step": 12563, "train_loss": 3.361154317855835, "lr": 0.000280045954454695, "tps": 255799, "wall": 3218.9} {"step": 12564, "train_loss": 3.4706063270568848, "lr": 0.00028002789350928037, "tps": 255391, "wall": 3224.3} {"step": 12565, "train_loss": 3.381120443344116, "lr": 0.00028000983188386654, "tps": 254987, "wall": 3229.7} {"step": 12566, "train_loss": 3.31821608543396, "lr": 0.0002799917695786581, "tps": 254585, "wall": 3235.0} {"step": 12567, "train_loss": 3.289501428604126, "lr": 0.0002799737065938597, "tps": 254181, "wall": 3240.4} {"step": 12568, "train_loss": 3.529276132583618, "lr": 0.00027995564292967583, "tps": 253781, "wall": 3245.8} {"step": 12569, "train_loss": 3.330594301223755, "lr": 0.0002799375785863112, "tps": 253383, "wall": 3251.2} {"step": 12570, "train_loss": 3.5051751136779785, "lr": 0.0002799195135639705, "tps": 252984, "wall": 3256.5} {"step": 12571, "train_loss": 3.295667886734009, "lr": 0.0002799014478628583, "tps": 252587, "wall": 3261.9} {"step": 12572, "train_loss": 3.3281726837158203, "lr": 0.00027988338148317917, "tps": 252193, "wall": 3267.3} {"step": 12573, "train_loss": 3.2941319942474365, "lr": 0.0002798653144251379, "tps": 251792, "wall": 3272.7} {"step": 12574, "train_loss": 3.4991984367370605, "lr": 0.00027984724668893914, "tps": 251400, "wall": 3278.1} {"step": 12575, "train_loss": 3.4186580181121826, "lr": 0.0002798291782747875, "tps": 251007, "wall": 3283.5} {"step": 12576, "train_loss": 3.3779945373535156, "lr": 0.0002798111091828877, "tps": 250617, "wall": 3288.9} {"step": 12577, "train_loss": 3.4751853942871094, "lr": 0.00027979303941344443, "tps": 250229, "wall": 3294.2} {"step": 12578, "train_loss": 3.316786289215088, "lr": 0.00027977496896666233, "tps": 249841, "wall": 3299.6} {"step": 12579, "train_loss": 3.4193968772888184, "lr": 0.0002797568978427462, "tps": 249456, "wall": 3305.0} {"step": 12580, "train_loss": 3.446852207183838, "lr": 0.0002797388260419007, "tps": 249069, "wall": 3310.4} {"step": 12581, "train_loss": 3.4324259757995605, "lr": 0.0002797207535643305, "tps": 248685, "wall": 3315.7} {"step": 12582, "train_loss": 3.5270981788635254, "lr": 0.0002797026804102404, "tps": 248302, "wall": 3321.1} {"step": 12583, "train_loss": 3.3993477821350098, "lr": 0.0002796846065798351, "tps": 247922, "wall": 3326.5} {"step": 12584, "train_loss": 3.509148359298706, "lr": 0.0002796665320733194, "tps": 247538, "wall": 3331.9} {"step": 12585, "train_loss": 3.3762896060943604, "lr": 0.0002796484568908979, "tps": 247158, "wall": 3337.3} {"step": 12586, "train_loss": 3.3745126724243164, "lr": 0.00027963038103277554, "tps": 246780, "wall": 3342.6} {"step": 12587, "train_loss": 3.4499435424804688, "lr": 0.000279612304499157, "tps": 246404, "wall": 3348.0} {"step": 12588, "train_loss": 3.3125712871551514, "lr": 0.000279594227290247, "tps": 246029, "wall": 3353.4} {"step": 12589, "train_loss": 3.381554365158081, "lr": 0.00027957614940625036, "tps": 245654, "wall": 3358.8} {"step": 12590, "train_loss": 3.4072909355163574, "lr": 0.0002795580708473719, "tps": 245280, "wall": 3364.2} {"step": 12591, "train_loss": 3.297942638397217, "lr": 0.0002795399916138164, "tps": 244910, "wall": 3369.5} {"step": 12592, "train_loss": 3.4176430702209473, "lr": 0.00027952191170578863, "tps": 244540, "wall": 3374.9} {"step": 12593, "train_loss": 3.342393398284912, "lr": 0.00027950383112349344, "tps": 244171, "wall": 3380.2} {"step": 12594, "train_loss": 3.509702444076538, "lr": 0.0002794857498671356, "tps": 243805, "wall": 3385.6} {"step": 12595, "train_loss": 3.444023847579956, "lr": 0.00027946766793692006, "tps": 243431, "wall": 3391.1} {"step": 12596, "train_loss": 3.3603463172912598, "lr": 0.0002794495853330515, "tps": 243065, "wall": 3396.4} {"step": 12597, "train_loss": 3.3209595680236816, "lr": 0.0002794315020557348, "tps": 242700, "wall": 3401.8} {"step": 12598, "train_loss": 3.4499051570892334, "lr": 0.00027941341810517483, "tps": 242335, "wall": 3407.2} {"step": 12599, "train_loss": 3.518400192260742, "lr": 0.0002793953334815765, "tps": 241975, "wall": 3412.6} {"step": 12600, "train_loss": 3.318727970123291, "lr": 0.00027937724818514456, "tps": 241616, "wall": 3417.9} {"step": 12601, "train_loss": 3.5286331176757812, "lr": 0.000279359162216084, "tps": 241254, "wall": 3423.3} {"step": 12602, "train_loss": 3.4399468898773193, "lr": 0.00027934107557459965, "tps": 240894, "wall": 3428.7} {"step": 12603, "train_loss": 3.482506275177002, "lr": 0.0002793229882608963, "tps": 240537, "wall": 3434.0} {"step": 12604, "train_loss": 3.3354134559631348, "lr": 0.00027930490027517897, "tps": 240181, "wall": 3439.4} {"step": 12605, "train_loss": 3.388951063156128, "lr": 0.00027928681161765254, "tps": 239825, "wall": 3444.8} {"step": 12606, "train_loss": 3.4188292026519775, "lr": 0.00027926872228852185, "tps": 239465, "wall": 3450.2} {"step": 12607, "train_loss": 3.3931944370269775, "lr": 0.0002792506322879919, "tps": 239113, "wall": 3455.6} {"step": 12608, "train_loss": 3.3623807430267334, "lr": 0.0002792325416162676, "tps": 238761, "wall": 3461.0} {"step": 12609, "train_loss": 3.5029587745666504, "lr": 0.0002792144502735538, "tps": 238410, "wall": 3466.3} {"step": 12610, "train_loss": 3.2450122833251953, "lr": 0.0002791963582600555, "tps": 238059, "wall": 3471.7} {"step": 12611, "train_loss": 3.371645450592041, "lr": 0.00027917826557597776, "tps": 237713, "wall": 3477.0} {"step": 12612, "train_loss": 3.392946243286133, "lr": 0.0002791601722215254, "tps": 237364, "wall": 3482.4} {"step": 12613, "train_loss": 3.4199345111846924, "lr": 0.00027914207819690334, "tps": 237018, "wall": 3487.8} {"step": 12614, "train_loss": 3.4505858421325684, "lr": 0.00027912398350231663, "tps": 236671, "wall": 3493.2} {"step": 12615, "train_loss": 3.360111713409424, "lr": 0.0002791058881379703, "tps": 236324, "wall": 3498.6} {"step": 12616, "train_loss": 3.4977142810821533, "lr": 0.00027908779210406926, "tps": 235981, "wall": 3504.0} {"step": 12617, "train_loss": 3.4314088821411133, "lr": 0.0002790696954008184, "tps": 235632, "wall": 3509.4} {"step": 12618, "train_loss": 3.4055168628692627, "lr": 0.000279051598028423, "tps": 235291, "wall": 3514.8} {"step": 12619, "train_loss": 3.4064078330993652, "lr": 0.0002790334999870878, "tps": 234950, "wall": 3520.2} {"step": 12620, "train_loss": 3.437037944793701, "lr": 0.00027901540127701793, "tps": 234612, "wall": 3525.5} {"step": 12621, "train_loss": 3.482720375061035, "lr": 0.00027899730189841844, "tps": 234273, "wall": 3530.9} {"step": 12622, "train_loss": 3.419511318206787, "lr": 0.00027897920185149423, "tps": 233937, "wall": 3536.2} {"step": 12623, "train_loss": 3.369199275970459, "lr": 0.00027896110113645055, "tps": 233600, "wall": 3541.6} {"step": 12624, "train_loss": 3.3728160858154297, "lr": 0.00027894299975349225, "tps": 233265, "wall": 3547.0} {"step": 12625, "train_loss": 3.404513359069824, "lr": 0.00027892489770282446, "tps": 232927, "wall": 3552.4} {"step": 12626, "train_loss": 3.4339070320129395, "lr": 0.0002789067949846523, "tps": 232593, "wall": 3557.8} {"step": 12627, "train_loss": 3.3282172679901123, "lr": 0.0002788886915991808, "tps": 232263, "wall": 3563.1} {"step": 12628, "train_loss": 3.4931087493896484, "lr": 0.00027887058754661495, "tps": 231926, "wall": 3568.6} {"step": 12629, "train_loss": 3.4121251106262207, "lr": 0.0002788524828271599, "tps": 231596, "wall": 3574.0} {"step": 12630, "train_loss": 3.4308266639709473, "lr": 0.0002788343774410207, "tps": 231267, "wall": 3579.3} {"step": 12631, "train_loss": 3.4757378101348877, "lr": 0.0002788162713884026, "tps": 230939, "wall": 3584.7} {"step": 12632, "train_loss": 3.40041446685791, "lr": 0.00027879816466951047, "tps": 230612, "wall": 3590.1} {"step": 12633, "train_loss": 3.3847498893737793, "lr": 0.0002787800572845496, "tps": 230287, "wall": 3595.4} {"step": 12634, "train_loss": 3.3893508911132812, "lr": 0.0002787619492337251, "tps": 229961, "wall": 3600.8} {"step": 12635, "train_loss": 3.4000797271728516, "lr": 0.00027874384051724204, "tps": 229638, "wall": 3606.2} {"step": 12636, "train_loss": 3.4950156211853027, "lr": 0.0002787257311353056, "tps": 229315, "wall": 3611.5} {"step": 12637, "train_loss": 3.3992886543273926, "lr": 0.0002787076210881208, "tps": 228993, "wall": 3616.9} {"step": 12638, "train_loss": 3.437528133392334, "lr": 0.000278689510375893, "tps": 228671, "wall": 3622.3} {"step": 12639, "train_loss": 3.364187240600586, "lr": 0.0002786713989988272, "tps": 228351, "wall": 3627.6} {"step": 12640, "train_loss": 3.5581676959991455, "lr": 0.00027865328695712865, "tps": 228030, "wall": 3633.0} {"step": 12641, "train_loss": 3.338884115219116, "lr": 0.0002786351742510025, "tps": 227714, "wall": 3638.4} {"step": 12642, "train_loss": 3.282400608062744, "lr": 0.0002786170608806539, "tps": 227395, "wall": 3643.7} {"step": 12643, "train_loss": 3.42922043800354, "lr": 0.000278598946846288, "tps": 227081, "wall": 3649.1} {"step": 12644, "train_loss": 3.457606792449951, "lr": 0.00027858083214811014, "tps": 226765, "wall": 3654.4} {"step": 12645, "train_loss": 3.3974266052246094, "lr": 0.0002785627167863255, "tps": 226449, "wall": 3659.8} {"step": 12646, "train_loss": 3.405996322631836, "lr": 0.0002785446007611391, "tps": 226135, "wall": 3665.2} {"step": 12647, "train_loss": 3.356428861618042, "lr": 0.0002785264840727564, "tps": 225822, "wall": 3670.6} {"step": 12648, "train_loss": 3.4955780506134033, "lr": 0.0002785083667213825, "tps": 225511, "wall": 3675.9} {"step": 12649, "train_loss": 3.43766450881958, "lr": 0.0002784902487072226, "tps": 225201, "wall": 3681.3} {"step": 12650, "train_loss": 3.334077835083008, "lr": 0.00027847213003048203, "tps": 224893, "wall": 3686.6} {"step": 12651, "train_loss": 3.4531235694885254, "lr": 0.000278454010691366, "tps": 224580, "wall": 3692.1} {"step": 12652, "train_loss": 3.42195463180542, "lr": 0.00027843589069007985, "tps": 224272, "wall": 3697.4} {"step": 12653, "train_loss": 3.451247453689575, "lr": 0.0002784177700268287, "tps": 223967, "wall": 3702.7} {"step": 12654, "train_loss": 3.4964864253997803, "lr": 0.0002783996487018179, "tps": 223661, "wall": 3708.1} {"step": 12655, "train_loss": 3.465087413787842, "lr": 0.0002783815267152527, "tps": 223355, "wall": 3713.5} {"step": 12656, "train_loss": 3.4651126861572266, "lr": 0.0002783634040673384, "tps": 223051, "wall": 3718.8} {"step": 12657, "train_loss": 3.46036696434021, "lr": 0.00027834528075828033, "tps": 222747, "wall": 3724.2} {"step": 12658, "train_loss": 3.3574047088623047, "lr": 0.0002783271567882838, "tps": 222446, "wall": 3729.5} {"step": 12659, "train_loss": 3.419607162475586, "lr": 0.00027830903215755404, "tps": 222143, "wall": 3734.9} {"step": 12660, "train_loss": 3.3308491706848145, "lr": 0.0002782909068662964, "tps": 221842, "wall": 3740.3} {"step": 12661, "train_loss": 3.37318754196167, "lr": 0.0002782727809147162, "tps": 221545, "wall": 3745.6} {"step": 12662, "train_loss": 3.4106063842773438, "lr": 0.00027825465430301885, "tps": 221239, "wall": 3751.1} {"step": 12663, "train_loss": 3.3672289848327637, "lr": 0.00027823652703140957, "tps": 220940, "wall": 3756.4} {"step": 12664, "train_loss": 3.4156856536865234, "lr": 0.0002782183991000938, "tps": 220641, "wall": 3761.8} {"step": 12665, "train_loss": 3.38999605178833, "lr": 0.0002782002705092768, "tps": 220344, "wall": 3767.2} {"step": 12666, "train_loss": 3.381385564804077, "lr": 0.000278182141259164, "tps": 220048, "wall": 3772.6} {"step": 12667, "train_loss": 3.4564931392669678, "lr": 0.0002781640113499608, "tps": 219754, "wall": 3777.9} {"step": 12668, "train_loss": 3.5147433280944824, "lr": 0.00027814588078187245, "tps": 219461, "wall": 3783.2} {"step": 12669, "train_loss": 3.3887460231781006, "lr": 0.00027812774955510454, "tps": 219168, "wall": 3788.6} {"step": 12670, "train_loss": 3.360076904296875, "lr": 0.00027810961766986227, "tps": 218875, "wall": 3794.0} {"step": 12671, "train_loss": 3.4229321479797363, "lr": 0.0002780914851263511, "tps": 218584, "wall": 3799.3} {"step": 12672, "train_loss": 3.3828039169311523, "lr": 0.00027807335192477653, "tps": 218294, "wall": 3804.7} {"step": 12673, "train_loss": 3.370889186859131, "lr": 0.00027805521806534376, "tps": 217996, "wall": 3810.2} {"step": 12674, "train_loss": 3.4382190704345703, "lr": 0.0002780370835482584, "tps": 217706, "wall": 3815.5} {"step": 12675, "train_loss": 3.399704933166504, "lr": 0.0002780189483737258, "tps": 217419, "wall": 3820.9} {"step": 12676, "train_loss": 3.406327724456787, "lr": 0.0002780008125419514, "tps": 217131, "wall": 3826.2} {"step": 12677, "train_loss": 3.3603756427764893, "lr": 0.0002779826760531407, "tps": 216845, "wall": 3831.6} {"step": 12678, "train_loss": 3.3787755966186523, "lr": 0.0002779645389074991, "tps": 216560, "wall": 3836.9} {"step": 12679, "train_loss": 3.480916738510132, "lr": 0.00027794640110523203, "tps": 216276, "wall": 3842.3} {"step": 12680, "train_loss": 3.401587724685669, "lr": 0.00027792826264654507, "tps": 215992, "wall": 3847.6} {"step": 12681, "train_loss": 3.5226871967315674, "lr": 0.00027791012353164355, "tps": 215710, "wall": 3853.0} {"step": 12682, "train_loss": 3.4599742889404297, "lr": 0.000277891983760733, "tps": 215428, "wall": 3858.3} {"step": 12683, "train_loss": 3.3430399894714355, "lr": 0.00027787384333401903, "tps": 215145, "wall": 3863.7} {"step": 12684, "train_loss": 3.300161838531494, "lr": 0.00027785570225170696, "tps": 214858, "wall": 3869.2} {"step": 12685, "train_loss": 3.4214653968811035, "lr": 0.00027783756051400236, "tps": 214579, "wall": 3874.5} {"step": 12686, "train_loss": 3.448507785797119, "lr": 0.00027781941812111076, "tps": 214298, "wall": 3879.9} {"step": 12687, "train_loss": 3.492008924484253, "lr": 0.0002778012750732376, "tps": 214020, "wall": 3885.2} {"step": 12688, "train_loss": 3.4341728687286377, "lr": 0.00027778313137058854, "tps": 213742, "wall": 3890.6} {"step": 12689, "train_loss": 3.344172477722168, "lr": 0.00027776498701336905, "tps": 213466, "wall": 3895.9} {"step": 12690, "train_loss": 3.442051410675049, "lr": 0.00027774684200178464, "tps": 213190, "wall": 3901.3} {"step": 12691, "train_loss": 3.3255932331085205, "lr": 0.00027772869633604084, "tps": 212915, "wall": 3906.6} {"step": 12692, "train_loss": 3.4616479873657227, "lr": 0.00027771055001634326, "tps": 212642, "wall": 3912.0} {"step": 12693, "train_loss": 3.388645648956299, "lr": 0.00027769240304289757, "tps": 212367, "wall": 3917.3} {"step": 12694, "train_loss": 3.412713050842285, "lr": 0.00027767425541590907, "tps": 212094, "wall": 3922.7} {"step": 12695, "train_loss": 3.4001553058624268, "lr": 0.00027765610713558354, "tps": 211817, "wall": 3928.1} {"step": 12696, "train_loss": 3.4797959327697754, "lr": 0.0002776379582021265, "tps": 211546, "wall": 3933.5} {"step": 12697, "train_loss": 3.368001937866211, "lr": 0.0002776198086157436, "tps": 211275, "wall": 3938.8} {"step": 12698, "train_loss": 3.3330750465393066, "lr": 0.0002776016583766403, "tps": 211005, "wall": 3944.2} {"step": 12699, "train_loss": 3.449700355529785, "lr": 0.00027758350748502235, "tps": 210736, "wall": 3949.5} {"step": 12700, "train_loss": 3.4309051036834717, "lr": 0.0002775653559410953, "tps": 210468, "wall": 3954.9} {"step": 12701, "train_loss": 3.446939468383789, "lr": 0.00027754720374506477, "tps": 210197, "wall": 3960.3} {"step": 12702, "train_loss": 3.4283485412597656, "lr": 0.00027752905089713643, "tps": 209932, "wall": 3965.6} {"step": 12703, "train_loss": 3.474174976348877, "lr": 0.0002775108973975159, "tps": 209665, "wall": 3970.9} {"step": 12704, "train_loss": 3.385622978210449, "lr": 0.0002774927432464088, "tps": 209398, "wall": 3976.3} {"step": 12705, "train_loss": 3.4064924716949463, "lr": 0.00027747458844402077, "tps": 209133, "wall": 3981.7} {"step": 12706, "train_loss": 3.50486159324646, "lr": 0.0002774564329905575, "tps": 208869, "wall": 3987.0} {"step": 12707, "train_loss": 3.362281322479248, "lr": 0.00027743827688622464, "tps": 208603, "wall": 3992.4} {"step": 12708, "train_loss": 3.4712581634521484, "lr": 0.0002774201201312279, "tps": 208339, "wall": 3997.8} {"step": 12709, "train_loss": 3.299995183944702, "lr": 0.00027740196272577294, "tps": 208077, "wall": 4003.1} {"step": 12710, "train_loss": 3.462395429611206, "lr": 0.00027738380467006547, "tps": 207816, "wall": 4008.5} {"step": 12711, "train_loss": 3.4314064979553223, "lr": 0.0002773656459643111, "tps": 207556, "wall": 4013.8} {"step": 12712, "train_loss": 3.4549107551574707, "lr": 0.00027734748660871556, "tps": 207294, "wall": 4019.2} {"step": 12713, "train_loss": 3.354001522064209, "lr": 0.00027732932660348464, "tps": 207034, "wall": 4024.6} {"step": 12714, "train_loss": 3.418013095855713, "lr": 0.00027731116594882405, "tps": 206773, "wall": 4030.0} {"step": 12715, "train_loss": 3.516962766647339, "lr": 0.00027729300464493934, "tps": 206514, "wall": 4035.3} {"step": 12716, "train_loss": 3.4750962257385254, "lr": 0.0002772748426920365, "tps": 206256, "wall": 4040.7} {"step": 12717, "train_loss": 3.3657567501068115, "lr": 0.0002772566800903211, "tps": 205999, "wall": 4046.1} {"step": 12718, "train_loss": 3.451019287109375, "lr": 0.00027723851683999893, "tps": 205738, "wall": 4051.5} {"step": 12719, "train_loss": 3.3216633796691895, "lr": 0.0002772203529412757, "tps": 205481, "wall": 4056.9} {"step": 12720, "train_loss": 3.416994094848633, "lr": 0.0002772021883943573, "tps": 205224, "wall": 4062.3} {"step": 12721, "train_loss": 3.4529995918273926, "lr": 0.00027718402319944934, "tps": 204970, "wall": 4067.6} {"step": 12722, "train_loss": 3.4430503845214844, "lr": 0.00027716585735675764, "tps": 204717, "wall": 4073.0} {"step": 12723, "train_loss": 3.3868558406829834, "lr": 0.00027714769086648814, "tps": 204465, "wall": 4078.3} {"step": 12724, "train_loss": 3.4222848415374756, "lr": 0.00027712952372884646, "tps": 204214, "wall": 4083.7} {"step": 12725, "train_loss": 3.401190757751465, "lr": 0.00027711135594403843, "tps": 203961, "wall": 4089.1} {"step": 12726, "train_loss": 3.465437412261963, "lr": 0.00027709318751226983, "tps": 203711, "wall": 4094.4} {"step": 12727, "train_loss": 3.442233085632324, "lr": 0.0002770750184337466, "tps": 203461, "wall": 4099.8} {"step": 12728, "train_loss": 3.3858530521392822, "lr": 0.0002770568487086744, "tps": 203211, "wall": 4105.1} {"step": 12729, "train_loss": 3.441575527191162, "lr": 0.00027703867833725915, "tps": 202957, "wall": 4110.6} {"step": 12730, "train_loss": 3.4127488136291504, "lr": 0.0002770205073197067, "tps": 202710, "wall": 4115.9} {"step": 12731, "train_loss": 3.333519458770752, "lr": 0.00027700233565622286, "tps": 202463, "wall": 4121.3} {"step": 12732, "train_loss": 3.420689105987549, "lr": 0.00027698416334701335, "tps": 202213, "wall": 4126.7} {"step": 12733, "train_loss": 3.368675708770752, "lr": 0.0002769659903922843, "tps": 201967, "wall": 4132.0} {"step": 12734, "train_loss": 3.424938440322876, "lr": 0.00027694781679224136, "tps": 201722, "wall": 4137.4} {"step": 12735, "train_loss": 3.4130921363830566, "lr": 0.0002769296425470905, "tps": 201477, "wall": 4142.7} {"step": 12736, "train_loss": 3.476970911026001, "lr": 0.00027691146765703757, "tps": 201233, "wall": 4148.1} {"step": 12737, "train_loss": 3.4146032333374023, "lr": 0.0002768932921222885, "tps": 200989, "wall": 4153.4} {"step": 12738, "train_loss": 3.3809375762939453, "lr": 0.00027687511594304905, "tps": 200745, "wall": 4158.8} {"step": 12739, "train_loss": 3.4281253814697266, "lr": 0.0002768569391195253, "tps": 200502, "wall": 4164.2} {"step": 12740, "train_loss": 3.4659955501556396, "lr": 0.000276838761651923, "tps": 200256, "wall": 4169.6} {"step": 12741, "train_loss": 3.282482862472534, "lr": 0.0002768205835404481, "tps": 200015, "wall": 4175.0} {"step": 12742, "train_loss": 3.40382981300354, "lr": 0.0002768024047853066, "tps": 199776, "wall": 4180.3} {"step": 12743, "train_loss": 3.4488513469696045, "lr": 0.00027678422538670444, "tps": 199536, "wall": 4185.6} {"step": 12744, "train_loss": 3.3903653621673584, "lr": 0.0002767660453448474, "tps": 199297, "wall": 4191.0} {"step": 12745, "train_loss": 3.4939279556274414, "lr": 0.00027674786465994167, "tps": 199058, "wall": 4196.4} {"step": 12746, "train_loss": 3.3069896697998047, "lr": 0.0002767296833321929, "tps": 198819, "wall": 4201.7} {"step": 12747, "train_loss": 3.417611598968506, "lr": 0.0002767115013618073, "tps": 198582, "wall": 4207.1} {"step": 12748, "train_loss": 3.543386220932007, "lr": 0.0002766933187489907, "tps": 198345, "wall": 4212.4} {"step": 12749, "train_loss": 3.402719497680664, "lr": 0.00027667513549394917, "tps": 198108, "wall": 4217.8} {"step": 12750, "train_loss": 3.387707471847534, "lr": 0.0002766569515968886, "tps": 197871, "wall": 4223.2} {"step": 12751, "train_loss": 3.448995590209961, "lr": 0.00027663876705801504, "tps": 197633, "wall": 4228.6} {"step": 12752, "train_loss": 3.3464956283569336, "lr": 0.00027662058187753443, "tps": 197400, "wall": 4233.9} {"step": 12753, "train_loss": 3.3432846069335938, "lr": 0.00027660239605565277, "tps": 197166, "wall": 4239.3} {"step": 12754, "train_loss": 3.3702540397644043, "lr": 0.0002765842095925762, "tps": 196933, "wall": 4244.6} {"step": 12755, "train_loss": 3.300922155380249, "lr": 0.00027656602248851063, "tps": 196701, "wall": 4250.0} {"step": 12756, "train_loss": 3.5268497467041016, "lr": 0.00027654783474366203, "tps": 196468, "wall": 4255.4} {"step": 12757, "train_loss": 3.3880615234375, "lr": 0.0002765296463582366, "tps": 196236, "wall": 4260.7} {"step": 12758, "train_loss": 3.3761754035949707, "lr": 0.0002765114573324402, "tps": 196007, "wall": 4266.0} {"step": 12759, "train_loss": 3.44576358795166, "lr": 0.000276493267666479, "tps": 195777, "wall": 4271.4} {"step": 12760, "train_loss": 3.3875131607055664, "lr": 0.00027647507736055897, "tps": 195546, "wall": 4276.8} {"step": 12761, "train_loss": 3.433091878890991, "lr": 0.00027645688641488616, "tps": 195316, "wall": 4282.1} {"step": 12762, "train_loss": 3.459024667739868, "lr": 0.00027643869482966673, "tps": 195086, "wall": 4287.5} {"step": 12763, "train_loss": 3.454944610595703, "lr": 0.0002764205026051067, "tps": 194854, "wall": 4293.0} {"step": 12764, "train_loss": 3.2897744178771973, "lr": 0.00027640230974141223, "tps": 194627, "wall": 4298.3} {"step": 12765, "train_loss": 3.3694682121276855, "lr": 0.0002763841162387894, "tps": 194400, "wall": 4303.6} {"step": 12766, "train_loss": 3.4350218772888184, "lr": 0.00027636592209744407, "tps": 194172, "wall": 4309.0} {"step": 12767, "train_loss": 3.368457794189453, "lr": 0.0002763477273175826, "tps": 193945, "wall": 4314.4} {"step": 12768, "train_loss": 3.397019624710083, "lr": 0.0002763295318994111, "tps": 193720, "wall": 4319.8} {"step": 12769, "train_loss": 3.453112840652466, "lr": 0.00027631133584313553, "tps": 193494, "wall": 4325.2} {"step": 12770, "train_loss": 3.371239185333252, "lr": 0.0002762931391489621, "tps": 193271, "wall": 4330.5} {"step": 12771, "train_loss": 3.4076104164123535, "lr": 0.000276274941817097, "tps": 193049, "wall": 4335.8} {"step": 12772, "train_loss": 3.444448471069336, "lr": 0.00027625674384774626, "tps": 192825, "wall": 4341.2} {"step": 12773, "train_loss": 3.403132438659668, "lr": 0.00027623854524111614, "tps": 192602, "wall": 4346.6} {"step": 12774, "train_loss": 3.3211886882781982, "lr": 0.00027622034599741267, "tps": 192376, "wall": 4352.0} {"step": 12775, "train_loss": 3.4564900398254395, "lr": 0.0002762021461168421, "tps": 192153, "wall": 4357.4} {"step": 12776, "train_loss": 3.5295586585998535, "lr": 0.0002761839455996106, "tps": 191932, "wall": 4362.7} {"step": 12777, "train_loss": 3.455955982208252, "lr": 0.00027616574444592427, "tps": 191712, "wall": 4368.1} {"step": 12778, "train_loss": 3.4976792335510254, "lr": 0.00027614754265598945, "tps": 191492, "wall": 4373.5} {"step": 12779, "train_loss": 3.3506360054016113, "lr": 0.00027612934023001214, "tps": 191272, "wall": 4378.8} {"step": 12780, "train_loss": 3.3116912841796875, "lr": 0.0002761111371681987, "tps": 191053, "wall": 4384.2} {"step": 12781, "train_loss": 3.3599958419799805, "lr": 0.0002760929334707552, "tps": 190832, "wall": 4389.6} {"step": 12782, "train_loss": 3.4342703819274902, "lr": 0.00027607472913788794, "tps": 190615, "wall": 4395.0} {"step": 12783, "train_loss": 3.318190574645996, "lr": 0.0002760565241698031, "tps": 190399, "wall": 4400.3} {"step": 12784, "train_loss": 3.459879159927368, "lr": 0.0002760383185667069, "tps": 190180, "wall": 4405.7} {"step": 12785, "train_loss": 3.3541147708892822, "lr": 0.00027602011232880563, "tps": 189960, "wall": 4411.1} {"step": 12786, "train_loss": 3.591139316558838, "lr": 0.00027600190545630553, "tps": 189742, "wall": 4416.5} {"step": 12787, "train_loss": 3.3850150108337402, "lr": 0.00027598369794941277, "tps": 189527, "wall": 4421.9} {"step": 12788, "train_loss": 3.4797215461730957, "lr": 0.0002759654898083337, "tps": 189311, "wall": 4427.3} {"step": 12789, "train_loss": 3.432412624359131, "lr": 0.0002759472810332744, "tps": 189097, "wall": 4432.7} {"step": 12790, "train_loss": 3.4329915046691895, "lr": 0.0002759290716244414, "tps": 188882, "wall": 4438.1} {"step": 12791, "train_loss": 3.468787670135498, "lr": 0.0002759108615820408, "tps": 188669, "wall": 4443.4} {"step": 12792, "train_loss": 3.4429221153259277, "lr": 0.000275892650906279, "tps": 188450, "wall": 4448.9} {"step": 12793, "train_loss": 3.3955812454223633, "lr": 0.0002758744395973621, "tps": 188240, "wall": 4454.2} {"step": 12794, "train_loss": 3.447852611541748, "lr": 0.00027585622765549666, "tps": 188029, "wall": 4459.6} {"step": 12795, "train_loss": 3.4553017616271973, "lr": 0.0002758380150808888, "tps": 187817, "wall": 4465.0} {"step": 12796, "train_loss": 3.348010540008545, "lr": 0.0002758198018737449, "tps": 187604, "wall": 4470.4} {"step": 12797, "train_loss": 3.524207830429077, "lr": 0.00027580158803427123, "tps": 187394, "wall": 4475.7} {"step": 12798, "train_loss": 3.3667757511138916, "lr": 0.00027578337356267416, "tps": 187185, "wall": 4481.1} {"step": 12799, "train_loss": 3.465876340866089, "lr": 0.00027576515845916005, "tps": 186975, "wall": 4486.5} {"step": 12800, "train_loss": 3.3049511909484863, "lr": 0.00027574694272393516, "tps": 186766, "wall": 4491.8} {"step": 12801, "train_loss": 3.463021755218506, "lr": 0.00027572872635720587, "tps": 186558, "wall": 4497.2} {"step": 12802, "train_loss": 3.398991584777832, "lr": 0.00027571050935917867, "tps": 186349, "wall": 4502.6} {"step": 12803, "train_loss": 3.47843861579895, "lr": 0.00027569229173005967, "tps": 186143, "wall": 4507.9} {"step": 12804, "train_loss": 3.4604296684265137, "lr": 0.00027567407347005546, "tps": 185936, "wall": 4513.3} {"step": 12805, "train_loss": 3.389294147491455, "lr": 0.0002756558545793723, "tps": 185729, "wall": 4518.7} {"step": 12806, "train_loss": 3.4488980770111084, "lr": 0.00027563763505821664, "tps": 185522, "wall": 4524.1} {"step": 12807, "train_loss": 3.3566699028015137, "lr": 0.0002756194149067948, "tps": 185311, "wall": 4529.6} {"step": 12808, "train_loss": 3.3809127807617188, "lr": 0.00027560119412531326, "tps": 185106, "wall": 4535.0} {"step": 12809, "train_loss": 3.401493549346924, "lr": 0.00027558297271397834, "tps": 184902, "wall": 4540.3} {"step": 12810, "train_loss": 3.4576876163482666, "lr": 0.0002755647506729965, "tps": 184698, "wall": 4545.7} {"step": 12811, "train_loss": 3.375595808029175, "lr": 0.00027554652800257417, "tps": 184495, "wall": 4551.0} {"step": 12812, "train_loss": 3.3434088230133057, "lr": 0.00027552830470291777, "tps": 184292, "wall": 4556.4} {"step": 12813, "train_loss": 3.3052709102630615, "lr": 0.0002755100807742338, "tps": 184088, "wall": 4561.8} {"step": 12814, "train_loss": 3.3704452514648438, "lr": 0.00027549185621672854, "tps": 183887, "wall": 4567.2} {"step": 12815, "train_loss": 3.4440207481384277, "lr": 0.00027547363103060855, "tps": 183685, "wall": 4572.5} {"step": 12816, "train_loss": 3.3886749744415283, "lr": 0.00027545540521608033, "tps": 183484, "wall": 4577.9} {"step": 12817, "train_loss": 3.4270405769348145, "lr": 0.00027543717877335014, "tps": 183282, "wall": 4583.3} {"step": 12818, "train_loss": 3.419149160385132, "lr": 0.00027541895170262473, "tps": 183079, "wall": 4588.7} {"step": 12819, "train_loss": 3.4588425159454346, "lr": 0.0002754007240041104, "tps": 182881, "wall": 4594.1} {"step": 12820, "train_loss": 3.409454822540283, "lr": 0.0002753824956780136, "tps": 182682, "wall": 4599.4} {"step": 12821, "train_loss": 3.452183485031128, "lr": 0.00027536426672454095, "tps": 182484, "wall": 4604.8} {"step": 12822, "train_loss": 3.494269371032715, "lr": 0.00027534603714389884, "tps": 182285, "wall": 4610.2} {"step": 12823, "train_loss": 3.442828416824341, "lr": 0.0002753278069362939, "tps": 182088, "wall": 4615.5} {"step": 12824, "train_loss": 3.569129228591919, "lr": 0.00027530957610193255, "tps": 181890, "wall": 4620.9} {"step": 12825, "train_loss": 3.442448377609253, "lr": 0.0002752913446410214, "tps": 181695, "wall": 4626.2} {"step": 12826, "train_loss": 3.35072660446167, "lr": 0.00027527311255376674, "tps": 181498, "wall": 4631.6} {"step": 12827, "train_loss": 3.3349123001098633, "lr": 0.00027525487984037537, "tps": 181302, "wall": 4637.0} {"step": 12828, "train_loss": 3.439891815185547, "lr": 0.0002752366465010537, "tps": 181106, "wall": 4642.4} {"step": 12829, "train_loss": 3.5248429775238037, "lr": 0.00027521841253600837, "tps": 180908, "wall": 4647.8} {"step": 12830, "train_loss": 3.460179328918457, "lr": 0.00027520017794544583, "tps": 180713, "wall": 4653.2} {"step": 12831, "train_loss": 3.4486770629882812, "lr": 0.0002751819427295727, "tps": 180519, "wall": 4658.5} {"step": 12832, "train_loss": 3.357903003692627, "lr": 0.00027516370688859555, "tps": 180323, "wall": 4664.0} {"step": 12833, "train_loss": 3.4152307510375977, "lr": 0.0002751454704227209, "tps": 180131, "wall": 4669.3} {"step": 12834, "train_loss": 3.491868019104004, "lr": 0.0002751272333321554, "tps": 179939, "wall": 4674.7} {"step": 12835, "train_loss": 3.4111173152923584, "lr": 0.00027510899561710567, "tps": 179747, "wall": 4680.0} {"step": 12836, "train_loss": 3.4141063690185547, "lr": 0.00027509075727777816, "tps": 179555, "wall": 4685.4} {"step": 12837, "train_loss": 3.3818321228027344, "lr": 0.00027507251831437965, "tps": 179363, "wall": 4690.8} {"step": 12838, "train_loss": 3.406907558441162, "lr": 0.0002750542787271166, "tps": 179173, "wall": 4696.1} {"step": 12839, "train_loss": 3.569169521331787, "lr": 0.00027503603851619575, "tps": 178982, "wall": 4701.5} {"step": 12840, "train_loss": 3.4326469898223877, "lr": 0.0002750177976818237, "tps": 178792, "wall": 4706.9} {"step": 12841, "train_loss": 3.463651657104492, "lr": 0.000274999556224207, "tps": 178599, "wall": 4712.3} {"step": 12842, "train_loss": 3.3249149322509766, "lr": 0.0002749813141435524, "tps": 178410, "wall": 4717.6} {"step": 12843, "train_loss": 3.3229973316192627, "lr": 0.0002749630714400665, "tps": 178222, "wall": 4723.0} {"step": 12844, "train_loss": 3.405198812484741, "lr": 0.00027494482811395594, "tps": 178033, "wall": 4728.4} {"step": 12845, "train_loss": 3.3442397117614746, "lr": 0.0002749265841654274, "tps": 177844, "wall": 4733.8} {"step": 12846, "train_loss": 3.357853889465332, "lr": 0.0002749083395946876, "tps": 177657, "wall": 4739.1} {"step": 12847, "train_loss": 3.4400200843811035, "lr": 0.00027489009440194304, "tps": 177469, "wall": 4744.5} {"step": 12848, "train_loss": 3.441763162612915, "lr": 0.00027487184858740053, "tps": 177282, "wall": 4749.9} {"step": 12849, "train_loss": 3.4174866676330566, "lr": 0.0002748536021512668, "tps": 177095, "wall": 4755.3} {"step": 12850, "train_loss": 3.4227399826049805, "lr": 0.0002748353550937486, "tps": 176910, "wall": 4760.6} {"step": 12851, "train_loss": 3.342705488204956, "lr": 0.0002748171074150524, "tps": 176725, "wall": 4766.0} {"step": 12852, "train_loss": 3.426823139190674, "lr": 0.00027479885911538504, "tps": 176538, "wall": 4771.4} {"step": 12853, "train_loss": 3.4798803329467773, "lr": 0.0002747806101949533, "tps": 176354, "wall": 4776.7} {"step": 12854, "train_loss": 3.5197291374206543, "lr": 0.0002747623606539638, "tps": 176170, "wall": 4782.1} {"step": 12855, "train_loss": 3.4056038856506348, "lr": 0.0002747441104926233, "tps": 175987, "wall": 4787.5} {"step": 12856, "train_loss": 3.405841588973999, "lr": 0.0002747258597111386, "tps": 175804, "wall": 4792.8} {"step": 12857, "train_loss": 3.5145018100738525, "lr": 0.00027470760830971636, "tps": 175621, "wall": 4798.2} {"step": 12858, "train_loss": 3.447352886199951, "lr": 0.0002746893562885634, "tps": 175439, "wall": 4803.5} {"step": 12859, "train_loss": 3.4945626258850098, "lr": 0.00027467110364788643, "tps": 175257, "wall": 4808.9} {"step": 12860, "train_loss": 3.4699959754943848, "lr": 0.0002746528503878923, "tps": 175075, "wall": 4814.3} {"step": 12861, "train_loss": 3.3931665420532227, "lr": 0.0002746345965087877, "tps": 174895, "wall": 4819.6} {"step": 12862, "train_loss": 3.3635289669036865, "lr": 0.00027461634201077944, "tps": 174714, "wall": 4825.0} {"step": 12863, "train_loss": 3.417914390563965, "lr": 0.00027459808689407427, "tps": 174531, "wall": 4830.4} {"step": 12864, "train_loss": 3.4703049659729004, "lr": 0.00027457983115887903, "tps": 174350, "wall": 4835.8} {"step": 12865, "train_loss": 3.397109031677246, "lr": 0.0002745615748054005, "tps": 174171, "wall": 4841.1} {"step": 12866, "train_loss": 3.513578176498413, "lr": 0.0002745433178338455, "tps": 173992, "wall": 4846.5} {"step": 12867, "train_loss": 3.3606526851654053, "lr": 0.00027452506024442085, "tps": 173813, "wall": 4851.8} {"step": 12868, "train_loss": 3.4406142234802246, "lr": 0.00027450680203733335, "tps": 173634, "wall": 4857.2} {"step": 12869, "train_loss": 3.412464141845703, "lr": 0.00027448854321278983, "tps": 173456, "wall": 4862.6} {"step": 12870, "train_loss": 3.391927719116211, "lr": 0.0002744702837709972, "tps": 173279, "wall": 4867.9} {"step": 12871, "train_loss": 3.4049580097198486, "lr": 0.00027445202371216223, "tps": 173102, "wall": 4873.3} {"step": 12872, "train_loss": 3.401984214782715, "lr": 0.00027443376303649177, "tps": 172924, "wall": 4878.7} {"step": 12873, "train_loss": 3.3699440956115723, "lr": 0.00027441550174419276, "tps": 172747, "wall": 4884.1} {"step": 12874, "train_loss": 3.4820947647094727, "lr": 0.00027439723983547197, "tps": 172567, "wall": 4889.5} {"step": 12875, "train_loss": 3.398624897003174, "lr": 0.00027437897731053624, "tps": 172393, "wall": 4894.9} {"step": 12876, "train_loss": 3.456355571746826, "lr": 0.00027436071416959263, "tps": 172217, "wall": 4900.2} {"step": 12877, "train_loss": 3.3777008056640625, "lr": 0.0002743424504128478, "tps": 172042, "wall": 4905.6} {"step": 12878, "train_loss": 3.4357190132141113, "lr": 0.0002743241860405088, "tps": 171867, "wall": 4911.0} {"step": 12879, "train_loss": 3.313642740249634, "lr": 0.0002743059210527825, "tps": 171694, "wall": 4916.3} {"step": 12880, "train_loss": 3.364030599594116, "lr": 0.0002742876554498758, "tps": 171518, "wall": 4921.7} {"step": 12881, "train_loss": 3.4250950813293457, "lr": 0.0002742693892319956, "tps": 171344, "wall": 4927.1} {"step": 12882, "train_loss": 3.303340435028076, "lr": 0.0002742511223993488, "tps": 171172, "wall": 4932.5} {"step": 12883, "train_loss": 3.4766054153442383, "lr": 0.0002742328549521423, "tps": 170999, "wall": 4937.8} {"step": 12884, "train_loss": 3.4381234645843506, "lr": 0.0002742145868905831, "tps": 170826, "wall": 4943.2} {"step": 12885, "train_loss": 3.441666603088379, "lr": 0.0002741963182148782, "tps": 170651, "wall": 4948.7} {"step": 12886, "train_loss": 3.390310049057007, "lr": 0.0002741780489252344, "tps": 170479, "wall": 4954.1} {"step": 12887, "train_loss": 3.4376912117004395, "lr": 0.0002741597790218588, "tps": 170307, "wall": 4959.4} {"step": 12888, "train_loss": 3.342057704925537, "lr": 0.00027414150850495824, "tps": 170135, "wall": 4964.8} {"step": 12889, "train_loss": 3.336240291595459, "lr": 0.0002741232373747398, "tps": 169964, "wall": 4970.2} {"step": 12890, "train_loss": 3.40395450592041, "lr": 0.00027410496563141034, "tps": 169794, "wall": 4975.6} {"step": 12891, "train_loss": 3.5983214378356934, "lr": 0.0002740866932751769, "tps": 169624, "wall": 4981.0} {"step": 12892, "train_loss": 3.347625494003296, "lr": 0.0002740684203062465, "tps": 169453, "wall": 4986.4} {"step": 12893, "train_loss": 3.3624520301818848, "lr": 0.0002740501467248261, "tps": 169284, "wall": 4991.7} {"step": 12894, "train_loss": 3.439887046813965, "lr": 0.00027403187253112276, "tps": 169115, "wall": 4997.1} {"step": 12895, "train_loss": 3.345972776412964, "lr": 0.0002740135977253434, "tps": 168947, "wall": 5002.5} {"step": 12896, "train_loss": 3.5242767333984375, "lr": 0.00027399532230769504, "tps": 168777, "wall": 5007.9} {"step": 12897, "train_loss": 3.547156810760498, "lr": 0.0002739770462783848, "tps": 168607, "wall": 5013.3} {"step": 12898, "train_loss": 3.4005720615386963, "lr": 0.0002739587696376197, "tps": 168441, "wall": 5018.7} {"step": 12899, "train_loss": 3.420226573944092, "lr": 0.0002739404923856066, "tps": 168274, "wall": 5024.0} {"step": 12900, "train_loss": 3.426619052886963, "lr": 0.00027392221452255284, "tps": 168108, "wall": 5029.4} {"step": 12901, "train_loss": 3.4271116256713867, "lr": 0.0002739039360486652, "tps": 167942, "wall": 5034.7} {"step": 12902, "train_loss": 3.4796018600463867, "lr": 0.0002738856569641509, "tps": 167776, "wall": 5040.1} {"step": 12903, "train_loss": 3.449402332305908, "lr": 0.00027386737726921696, "tps": 167611, "wall": 5045.5} {"step": 12904, "train_loss": 3.47108793258667, "lr": 0.0002738490969640705, "tps": 167446, "wall": 5050.8} {"step": 12905, "train_loss": 3.446989059448242, "lr": 0.0002738308160489185, "tps": 167282, "wall": 5056.2} {"step": 12906, "train_loss": 3.393073558807373, "lr": 0.0002738125345239682, "tps": 167118, "wall": 5061.5} {"step": 12907, "train_loss": 3.3582448959350586, "lr": 0.00027379425238942647, "tps": 166954, "wall": 5066.9} {"step": 12908, "train_loss": 3.3973679542541504, "lr": 0.0002737759696455006, "tps": 166788, "wall": 5072.3} {"step": 12909, "train_loss": 3.4105477333068848, "lr": 0.0002737576862923976, "tps": 166625, "wall": 5077.7} {"step": 12910, "train_loss": 3.3837997913360596, "lr": 0.00027373940233032466, "tps": 166463, "wall": 5083.0} {"step": 12911, "train_loss": 3.3728110790252686, "lr": 0.00027372111775948884, "tps": 166299, "wall": 5088.4} {"step": 12912, "train_loss": 3.3795011043548584, "lr": 0.00027370283258009733, "tps": 166137, "wall": 5093.8} {"step": 12913, "train_loss": 3.444178342819214, "lr": 0.00027368454679235716, "tps": 165975, "wall": 5099.1} {"step": 12914, "train_loss": 3.4549684524536133, "lr": 0.0002736662603964756, "tps": 165814, "wall": 5104.5} {"step": 12915, "train_loss": 3.3983874320983887, "lr": 0.00027364797339265973, "tps": 165653, "wall": 5109.8} {"step": 12916, "train_loss": 3.4045941829681396, "lr": 0.00027362968578111674, "tps": 165493, "wall": 5115.2} {"step": 12917, "train_loss": 3.4064486026763916, "lr": 0.00027361139756205375, "tps": 165331, "wall": 5120.6} {"step": 12918, "train_loss": 3.4619064331054688, "lr": 0.0002735931087356779, "tps": 165171, "wall": 5125.9} {"step": 12919, "train_loss": 3.335158348083496, "lr": 0.00027357481930219646, "tps": 165008, "wall": 5131.4} {"step": 12920, "train_loss": 3.3792481422424316, "lr": 0.00027355652926181655, "tps": 164849, "wall": 5136.7} {"step": 12921, "train_loss": 3.3906679153442383, "lr": 0.0002735382386147454, "tps": 164691, "wall": 5142.1} {"step": 12922, "train_loss": 3.360922336578369, "lr": 0.00027351994736119015, "tps": 164532, "wall": 5147.5} {"step": 12923, "train_loss": 3.3709921836853027, "lr": 0.00027350165550135805, "tps": 164373, "wall": 5152.8} {"step": 12924, "train_loss": 3.44948148727417, "lr": 0.0002734833630354564, "tps": 164214, "wall": 5158.2} {"step": 12925, "train_loss": 3.4802026748657227, "lr": 0.0002734650699636922, "tps": 164057, "wall": 5163.6} {"step": 12926, "train_loss": 3.4085121154785156, "lr": 0.00027344677628627284, "tps": 163899, "wall": 5168.9} {"step": 12927, "train_loss": 3.4863455295562744, "lr": 0.0002734284820034055, "tps": 163742, "wall": 5174.3} {"step": 12928, "train_loss": 3.310913324356079, "lr": 0.0002734101871152974, "tps": 163585, "wall": 5179.6} {"step": 12929, "train_loss": 3.4122390747070312, "lr": 0.00027339189162215577, "tps": 163429, "wall": 5185.0} {"step": 12930, "train_loss": 3.4192581176757812, "lr": 0.000273373595524188, "tps": 163270, "wall": 5190.4} {"step": 12931, "train_loss": 3.393982410430908, "lr": 0.0002733552988216012, "tps": 163115, "wall": 5195.8} {"step": 12932, "train_loss": 3.4079811573028564, "lr": 0.0002733370015146027, "tps": 162960, "wall": 5201.1} {"step": 12933, "train_loss": 3.438464641571045, "lr": 0.00027331870360339976, "tps": 162804, "wall": 5206.5} {"step": 12934, "train_loss": 3.3885104656219482, "lr": 0.0002733004050881997, "tps": 162650, "wall": 5211.8} {"step": 12935, "train_loss": 3.3261795043945312, "lr": 0.0002732821059692098, "tps": 162495, "wall": 5217.2} {"step": 12936, "train_loss": 3.4782662391662598, "lr": 0.00027326380624663726, "tps": 162340, "wall": 5222.6} {"step": 12937, "train_loss": 3.482069492340088, "lr": 0.0002732455059206894, "tps": 162187, "wall": 5227.9} {"step": 12938, "train_loss": 3.327406406402588, "lr": 0.0002732272049915736, "tps": 162034, "wall": 5233.3} {"step": 12939, "train_loss": 3.5822677612304688, "lr": 0.0002732089034594972, "tps": 161881, "wall": 5238.6} {"step": 12940, "train_loss": 3.44453501701355, "lr": 0.00027319060132466734, "tps": 161728, "wall": 5244.0} {"step": 12941, "train_loss": 3.3729124069213867, "lr": 0.0002731722985872916, "tps": 161573, "wall": 5249.4} {"step": 12942, "train_loss": 3.384424924850464, "lr": 0.00027315399524757716, "tps": 161421, "wall": 5254.8} {"step": 12943, "train_loss": 3.376028299331665, "lr": 0.00027313569130573133, "tps": 161269, "wall": 5260.1} {"step": 12944, "train_loss": 3.450263738632202, "lr": 0.00027311738676196156, "tps": 161117, "wall": 5265.5} {"step": 12945, "train_loss": 3.4763009548187256, "lr": 0.00027309908161647514, "tps": 160965, "wall": 5270.9} {"step": 12946, "train_loss": 3.4588918685913086, "lr": 0.00027308077586947943, "tps": 160813, "wall": 5276.3} {"step": 12947, "train_loss": 3.370274543762207, "lr": 0.00027306246952118183, "tps": 160662, "wall": 5281.6} {"step": 12948, "train_loss": 3.542006492614746, "lr": 0.00027304416257178975, "tps": 160511, "wall": 5287.0} {"step": 12949, "train_loss": 3.4431569576263428, "lr": 0.0002730258550215105, "tps": 160361, "wall": 5292.4} {"step": 12950, "train_loss": 3.4095618724823, "lr": 0.0002730075468705514, "tps": 160211, "wall": 5297.7} {"step": 12951, "train_loss": 3.4492440223693848, "lr": 0.0002729892381191201, "tps": 160061, "wall": 5303.1} {"step": 12952, "train_loss": 3.3746650218963623, "lr": 0.00027297092876742374, "tps": 159909, "wall": 5308.6} {"step": 12953, "train_loss": 3.421689748764038, "lr": 0.00027295261881566985, "tps": 159759, "wall": 5313.9} {"step": 12954, "train_loss": 3.436537027359009, "lr": 0.0002729343082640658, "tps": 159611, "wall": 5319.3} {"step": 12955, "train_loss": 3.3372802734375, "lr": 0.00027291599711281916, "tps": 159464, "wall": 5324.6} {"step": 12956, "train_loss": 3.3207907676696777, "lr": 0.00027289768536213713, "tps": 159316, "wall": 5330.0} {"step": 12957, "train_loss": 3.337221622467041, "lr": 0.00027287937301222735, "tps": 159169, "wall": 5335.3} {"step": 12958, "train_loss": 3.477914571762085, "lr": 0.00027286106006329706, "tps": 159022, "wall": 5340.6} {"step": 12959, "train_loss": 3.3174920082092285, "lr": 0.0002728427465155539, "tps": 158875, "wall": 5346.0} {"step": 12960, "train_loss": 3.3641295433044434, "lr": 0.00027282443236920523, "tps": 158727, "wall": 5351.4} {"step": 12961, "train_loss": 3.2865285873413086, "lr": 0.0002728061176244585, "tps": 158581, "wall": 5356.7} {"step": 12962, "train_loss": 3.3267781734466553, "lr": 0.0002727878022815213, "tps": 158434, "wall": 5362.1} {"step": 12963, "train_loss": 3.3903117179870605, "lr": 0.00027276948634060095, "tps": 158288, "wall": 5367.5} {"step": 12964, "train_loss": 3.3417763710021973, "lr": 0.000272751169801905, "tps": 158141, "wall": 5372.9} {"step": 12965, "train_loss": 3.409984588623047, "lr": 0.00027273285266564103, "tps": 157994, "wall": 5378.3} {"step": 12966, "train_loss": 3.453054904937744, "lr": 0.00027271453493201634, "tps": 157850, "wall": 5383.6} {"step": 12967, "train_loss": 3.410654067993164, "lr": 0.0002726962166012386, "tps": 157705, "wall": 5389.0} {"step": 12968, "train_loss": 3.3959310054779053, "lr": 0.0002726778976735153, "tps": 157559, "wall": 5394.4} {"step": 12969, "train_loss": 3.4260950088500977, "lr": 0.0002726595781490538, "tps": 157415, "wall": 5399.7} {"step": 12970, "train_loss": 3.3584699630737305, "lr": 0.00027264125802806187, "tps": 157271, "wall": 5405.1} {"step": 12971, "train_loss": 3.4523308277130127, "lr": 0.00027262293731074685, "tps": 157126, "wall": 5410.5} {"step": 12972, "train_loss": 3.3233489990234375, "lr": 0.00027260461599731644, "tps": 156982, "wall": 5415.9} {"step": 12973, "train_loss": 3.451671600341797, "lr": 0.00027258629408797805, "tps": 156838, "wall": 5421.3} {"step": 12974, "train_loss": 3.392521858215332, "lr": 0.00027256797158293925, "tps": 156695, "wall": 5426.6} {"step": 12975, "train_loss": 3.3993420600891113, "lr": 0.0002725496484824076, "tps": 156551, "wall": 5432.1} {"step": 12976, "train_loss": 3.378655433654785, "lr": 0.0002725313247865908, "tps": 156408, "wall": 5437.4} {"step": 12977, "train_loss": 3.456946849822998, "lr": 0.0002725130004956962, "tps": 156266, "wall": 5442.8} {"step": 12978, "train_loss": 3.3533148765563965, "lr": 0.0002724946756099315, "tps": 156124, "wall": 5448.2} {"step": 12979, "train_loss": 3.4233334064483643, "lr": 0.00027247635012950434, "tps": 155983, "wall": 5453.5} {"step": 12980, "train_loss": 3.3796558380126953, "lr": 0.0002724580240546222, "tps": 155841, "wall": 5458.9} {"step": 12981, "train_loss": 3.426051139831543, "lr": 0.0002724396973854927, "tps": 155701, "wall": 5464.2} {"step": 12982, "train_loss": 3.326402187347412, "lr": 0.00027242137012232354, "tps": 155560, "wall": 5469.6} {"step": 12983, "train_loss": 3.4073500633239746, "lr": 0.0002724030422653222, "tps": 155420, "wall": 5474.9} {"step": 12984, "train_loss": 3.43393611907959, "lr": 0.00027238471381469645, "tps": 155281, "wall": 5480.3} {"step": 12985, "train_loss": 3.4343795776367188, "lr": 0.0002723663847706538, "tps": 155142, "wall": 5485.6} {"step": 12986, "train_loss": 3.30730938911438, "lr": 0.00027234805513340186, "tps": 155001, "wall": 5491.0} {"step": 12987, "train_loss": 3.2710838317871094, "lr": 0.0002723297249031483, "tps": 154862, "wall": 5496.4} {"step": 12988, "train_loss": 3.391446590423584, "lr": 0.0002723113940801008, "tps": 154723, "wall": 5501.7} {"step": 12989, "train_loss": 3.468465566635132, "lr": 0.00027229306266446704, "tps": 154584, "wall": 5507.1} {"step": 12990, "train_loss": 3.3821277618408203, "lr": 0.00027227473065645464, "tps": 154446, "wall": 5512.5} {"step": 12991, "train_loss": 3.415318489074707, "lr": 0.00027225639805627123, "tps": 154308, "wall": 5517.8} {"step": 12992, "train_loss": 3.4526684284210205, "lr": 0.00027223806486412455, "tps": 154169, "wall": 5523.2} {"step": 12993, "train_loss": 3.4147844314575195, "lr": 0.0002722197310802222, "tps": 154033, "wall": 5528.5} {"step": 12994, "train_loss": 3.410226583480835, "lr": 0.0002722013967047719, "tps": 153896, "wall": 5533.9} {"step": 12995, "train_loss": 3.398221254348755, "lr": 0.00027218306173798143, "tps": 153759, "wall": 5539.2} {"step": 12996, "train_loss": 3.349440097808838, "lr": 0.0002721647261800584, "tps": 153624, "wall": 5544.5} {"step": 12997, "train_loss": 3.4047555923461914, "lr": 0.0002721463900312105, "tps": 153485, "wall": 5549.9} {"step": 12998, "train_loss": 3.3211169242858887, "lr": 0.0002721280532916454, "tps": 153350, "wall": 5555.3} {"step": 12999, "train_loss": 3.3391916751861572, "lr": 0.00027210971596157104, "tps": 153214, "wall": 5560.6} {"step": 13000, "train_loss": 3.396313190460205, "lr": 0.00027209137804119494, "tps": 153078, "wall": 5566.0, "val_loss_monitor": 3.486698235801689} {"step": 13001, "train_loss": 3.361274242401123, "lr": 0.00027207303953072484, "tps": 151984, "wall": 5606.5} {"step": 13002, "train_loss": 3.462357997894287, "lr": 0.00027205470043036863, "tps": 151848, "wall": 5611.9} {"step": 13003, "train_loss": 3.3961524963378906, "lr": 0.00027203636074033384, "tps": 151714, "wall": 5617.3} {"step": 13004, "train_loss": 3.399207353591919, "lr": 0.0002720180204608284, "tps": 151580, "wall": 5622.7} {"step": 13005, "train_loss": 3.2340762615203857, "lr": 0.00027199967959206, "tps": 151447, "wall": 5628.1} {"step": 13006, "train_loss": 3.3801660537719727, "lr": 0.00027198133813423645, "tps": 151313, "wall": 5633.5} {"step": 13007, "train_loss": 3.448089838027954, "lr": 0.00027196299608756545, "tps": 151180, "wall": 5638.9} {"step": 13008, "train_loss": 3.544320821762085, "lr": 0.0002719446534522548, "tps": 151047, "wall": 5644.3} {"step": 13009, "train_loss": 3.366349220275879, "lr": 0.0002719263102285124, "tps": 150913, "wall": 5649.7} {"step": 13010, "train_loss": 3.415621042251587, "lr": 0.00027190796641654585, "tps": 150781, "wall": 5655.1} {"step": 13011, "train_loss": 3.503640651702881, "lr": 0.0002718896220165631, "tps": 150648, "wall": 5660.6} {"step": 13012, "train_loss": 3.4134793281555176, "lr": 0.0002718712770287719, "tps": 150517, "wall": 5665.9} {"step": 13013, "train_loss": 3.351541042327881, "lr": 0.00027185293145338003, "tps": 150383, "wall": 5671.4} {"step": 13014, "train_loss": 3.4244191646575928, "lr": 0.0002718345852905954, "tps": 150252, "wall": 5676.8} {"step": 13015, "train_loss": 3.4687490463256836, "lr": 0.0002718162385406257, "tps": 150120, "wall": 5682.2} {"step": 13016, "train_loss": 3.432758331298828, "lr": 0.00027179789120367894, "tps": 149990, "wall": 5687.6} {"step": 13017, "train_loss": 3.448078155517578, "lr": 0.00027177954327996283, "tps": 149859, "wall": 5693.0} {"step": 13018, "train_loss": 3.377662181854248, "lr": 0.00027176119476968527, "tps": 149730, "wall": 5698.3} {"step": 13019, "train_loss": 3.39667010307312, "lr": 0.00027174284567305405, "tps": 149599, "wall": 5703.8} {"step": 13020, "train_loss": 3.4360122680664062, "lr": 0.00027172449599027716, "tps": 149469, "wall": 5709.2} {"step": 13021, "train_loss": 3.4667887687683105, "lr": 0.0002717061457215623, "tps": 149338, "wall": 5714.6} {"step": 13022, "train_loss": 3.496812343597412, "lr": 0.00027168779486711744, "tps": 149209, "wall": 5720.0} {"step": 13023, "train_loss": 3.341336250305176, "lr": 0.0002716694434271505, "tps": 149080, "wall": 5725.4} {"step": 13024, "train_loss": 3.501269817352295, "lr": 0.00027165109140186923, "tps": 148949, "wall": 5730.8} {"step": 13025, "train_loss": 3.2696797847747803, "lr": 0.00027163273879148166, "tps": 148821, "wall": 5736.2} {"step": 13026, "train_loss": 3.427736282348633, "lr": 0.00027161438559619564, "tps": 148693, "wall": 5741.6} {"step": 13027, "train_loss": 3.406874656677246, "lr": 0.000271596031816219, "tps": 148565, "wall": 5747.0} {"step": 13028, "train_loss": 3.3884670734405518, "lr": 0.00027157767745175973, "tps": 148437, "wall": 5752.4} {"step": 13029, "train_loss": 3.444697380065918, "lr": 0.00027155932250302574, "tps": 148309, "wall": 5757.8} {"step": 13030, "train_loss": 3.517446756362915, "lr": 0.00027154096697022505, "tps": 148181, "wall": 5763.2} {"step": 13031, "train_loss": 3.399000644683838, "lr": 0.0002715226108535654, "tps": 148055, "wall": 5768.6} {"step": 13032, "train_loss": 3.409811496734619, "lr": 0.0002715042541532548, "tps": 147928, "wall": 5774.0} {"step": 13033, "train_loss": 3.476980447769165, "lr": 0.0002714858968695013, "tps": 147801, "wall": 5779.3} {"step": 13034, "train_loss": 3.3603248596191406, "lr": 0.00027146753900251277, "tps": 147675, "wall": 5784.7} {"step": 13035, "train_loss": 3.4501428604125977, "lr": 0.0002714491805524971, "tps": 147547, "wall": 5790.2} {"step": 13036, "train_loss": 3.449375629425049, "lr": 0.00027143082151966243, "tps": 147423, "wall": 5795.5} {"step": 13037, "train_loss": 3.4415764808654785, "lr": 0.0002714124619042166, "tps": 147298, "wall": 5800.9} {"step": 13038, "train_loss": 3.447925567626953, "lr": 0.00027139410170636755, "tps": 147173, "wall": 5806.2} {"step": 13039, "train_loss": 3.3909738063812256, "lr": 0.0002713757409263234, "tps": 147048, "wall": 5811.6} {"step": 13040, "train_loss": 3.357907772064209, "lr": 0.0002713573795642921, "tps": 146924, "wall": 5817.0} {"step": 13041, "train_loss": 3.3770298957824707, "lr": 0.0002713390176204816, "tps": 146799, "wall": 5822.4} {"step": 13042, "train_loss": 3.3065378665924072, "lr": 0.00027132065509509994, "tps": 146674, "wall": 5827.8} {"step": 13043, "train_loss": 3.4294610023498535, "lr": 0.0002713022919883551, "tps": 146551, "wall": 5833.1} {"step": 13044, "train_loss": 3.347689390182495, "lr": 0.00027128392830045515, "tps": 146427, "wall": 5838.5} {"step": 13045, "train_loss": 3.370332717895508, "lr": 0.000271265564031608, "tps": 146304, "wall": 5843.9} {"step": 13046, "train_loss": 3.273231029510498, "lr": 0.00027124719918202186, "tps": 146178, "wall": 5849.3} {"step": 13047, "train_loss": 3.4468793869018555, "lr": 0.0002712288337519047, "tps": 146056, "wall": 5854.7} {"step": 13048, "train_loss": 3.377349853515625, "lr": 0.00027121046774146446, "tps": 145934, "wall": 5860.0} {"step": 13049, "train_loss": 3.413769006729126, "lr": 0.0002711921011509093, "tps": 145812, "wall": 5865.4} {"step": 13050, "train_loss": 3.401747941970825, "lr": 0.0002711737339804472, "tps": 145690, "wall": 5870.7} {"step": 13051, "train_loss": 3.428091526031494, "lr": 0.0002711553662302863, "tps": 145569, "wall": 5876.1} {"step": 13052, "train_loss": 3.3917160034179688, "lr": 0.0002711369979006347, "tps": 145448, "wall": 5881.4} {"step": 13053, "train_loss": 3.4569592475891113, "lr": 0.0002711186289917004, "tps": 145327, "wall": 5886.8} {"step": 13054, "train_loss": 3.4856534004211426, "lr": 0.0002711002595036915, "tps": 145206, "wall": 5892.1} {"step": 13055, "train_loss": 3.356147527694702, "lr": 0.0002710818894368161, "tps": 145085, "wall": 5897.5} {"step": 13056, "train_loss": 3.4473865032196045, "lr": 0.0002710635187912823, "tps": 144964, "wall": 5902.9} {"step": 13057, "train_loss": 3.4088199138641357, "lr": 0.00027104514756729815, "tps": 144841, "wall": 5908.3} {"step": 13058, "train_loss": 3.4518191814422607, "lr": 0.0002710267757650718, "tps": 144720, "wall": 5913.7} {"step": 13059, "train_loss": 3.426602840423584, "lr": 0.0002710084033848114, "tps": 144600, "wall": 5919.1} {"step": 13060, "train_loss": 3.3806746006011963, "lr": 0.0002709900304267251, "tps": 144478, "wall": 5924.5} {"step": 13061, "train_loss": 3.305803060531616, "lr": 0.0002709716568910209, "tps": 144359, "wall": 5929.8} {"step": 13062, "train_loss": 3.417895793914795, "lr": 0.00027095328277790704, "tps": 144239, "wall": 5935.2} {"step": 13063, "train_loss": 3.2852563858032227, "lr": 0.00027093490808759163, "tps": 144119, "wall": 5940.6} {"step": 13064, "train_loss": 3.369659185409546, "lr": 0.00027091653282028286, "tps": 144001, "wall": 5946.0} {"step": 13065, "train_loss": 3.404806613922119, "lr": 0.0002708981569761888, "tps": 143882, "wall": 5951.4} {"step": 13066, "train_loss": 3.376389741897583, "lr": 0.0002708797805555177, "tps": 143762, "wall": 5956.7} {"step": 13067, "train_loss": 3.356109857559204, "lr": 0.0002708614035584777, "tps": 143644, "wall": 5962.1} {"step": 13068, "train_loss": 3.485090494155884, "lr": 0.00027084302598527697, "tps": 143525, "wall": 5967.5} {"step": 13069, "train_loss": 3.4018216133117676, "lr": 0.00027082464783612363, "tps": 143403, "wall": 5973.0} {"step": 13070, "train_loss": 3.3467092514038086, "lr": 0.00027080626911122604, "tps": 143285, "wall": 5978.4} {"step": 13071, "train_loss": 3.383479356765747, "lr": 0.0002707878898107922, "tps": 143168, "wall": 5983.8} {"step": 13072, "train_loss": 3.3667612075805664, "lr": 0.00027076950993503037, "tps": 143049, "wall": 5989.2} {"step": 13073, "train_loss": 3.3630313873291016, "lr": 0.00027075112948414884, "tps": 142931, "wall": 5994.6} {"step": 13074, "train_loss": 3.387460231781006, "lr": 0.00027073274845835577, "tps": 142813, "wall": 6000.0} {"step": 13075, "train_loss": 3.3913683891296387, "lr": 0.0002707143668578594, "tps": 142695, "wall": 6005.4} {"step": 13076, "train_loss": 3.3821990489959717, "lr": 0.0002706959846828679, "tps": 142578, "wall": 6010.8} {"step": 13077, "train_loss": 3.443188428878784, "lr": 0.0002706776019335896, "tps": 142461, "wall": 6016.2} {"step": 13078, "train_loss": 3.4073007106781006, "lr": 0.0002706592186102326, "tps": 142344, "wall": 6021.6} {"step": 13079, "train_loss": 3.4092326164245605, "lr": 0.0002706408347130052, "tps": 142228, "wall": 6027.0} {"step": 13080, "train_loss": 3.3168702125549316, "lr": 0.0002706224502421158, "tps": 142110, "wall": 6032.5} {"step": 13081, "train_loss": 3.3291749954223633, "lr": 0.0002706040651977725, "tps": 141995, "wall": 6037.8} {"step": 13082, "train_loss": 3.2659168243408203, "lr": 0.0002705856795801836, "tps": 141879, "wall": 6043.2} {"step": 13083, "train_loss": 3.4240922927856445, "lr": 0.0002705672933895574, "tps": 141763, "wall": 6048.6} {"step": 13084, "train_loss": 3.4244823455810547, "lr": 0.00027054890662610217, "tps": 141647, "wall": 6054.0} {"step": 13085, "train_loss": 3.3682703971862793, "lr": 0.0002705305192900262, "tps": 141532, "wall": 6059.4} {"step": 13086, "train_loss": 3.426870346069336, "lr": 0.0002705121313815377, "tps": 141416, "wall": 6064.8} {"step": 13087, "train_loss": 3.471045732498169, "lr": 0.00027049374290084513, "tps": 141301, "wall": 6070.2} {"step": 13088, "train_loss": 3.338344097137451, "lr": 0.00027047535384815667, "tps": 141187, "wall": 6075.6} {"step": 13089, "train_loss": 3.4087605476379395, "lr": 0.0002704569642236807, "tps": 141073, "wall": 6081.0} {"step": 13090, "train_loss": 3.537856340408325, "lr": 0.0002704385740276254, "tps": 140960, "wall": 6086.3} {"step": 13091, "train_loss": 3.3669445514678955, "lr": 0.00027042018326019934, "tps": 140844, "wall": 6091.8} {"step": 13092, "train_loss": 3.4674081802368164, "lr": 0.0002704017919216107, "tps": 140730, "wall": 6097.2} {"step": 13093, "train_loss": 3.376713991165161, "lr": 0.0002703834000120678, "tps": 140616, "wall": 6102.6} {"step": 13094, "train_loss": 3.4388108253479004, "lr": 0.000270365007531779, "tps": 140502, "wall": 6108.0} {"step": 13095, "train_loss": 3.4217000007629395, "lr": 0.0002703466144809527, "tps": 140389, "wall": 6113.4} {"step": 13096, "train_loss": 3.3754849433898926, "lr": 0.0002703282208597972, "tps": 140276, "wall": 6118.8} {"step": 13097, "train_loss": 3.390476703643799, "lr": 0.00027030982666852095, "tps": 140163, "wall": 6124.2} {"step": 13098, "train_loss": 3.4886269569396973, "lr": 0.0002702914319073322, "tps": 140051, "wall": 6129.6} {"step": 13099, "train_loss": 3.389556884765625, "lr": 0.0002702730365764394, "tps": 139938, "wall": 6135.0} {"step": 13100, "train_loss": 3.4372363090515137, "lr": 0.00027025464067605094, "tps": 139826, "wall": 6140.4} {"step": 13101, "train_loss": 3.378351926803589, "lr": 0.0002702362442063752, "tps": 139714, "wall": 6145.8} {"step": 13102, "train_loss": 3.2106292247772217, "lr": 0.0002702178471676205, "tps": 139600, "wall": 6151.2} {"step": 13103, "train_loss": 3.356656074523926, "lr": 0.0002701994495599954, "tps": 139488, "wall": 6156.7} {"step": 13104, "train_loss": 3.385998010635376, "lr": 0.0002701810513837082, "tps": 139376, "wall": 6162.1} {"step": 13105, "train_loss": 3.4102139472961426, "lr": 0.00027016265263896734, "tps": 139265, "wall": 6167.5} {"step": 13106, "train_loss": 3.342478036880493, "lr": 0.0002701442533259812, "tps": 139153, "wall": 6172.9} {"step": 13107, "train_loss": 3.358341693878174, "lr": 0.0002701258534449582, "tps": 139043, "wall": 6178.2} {"step": 13108, "train_loss": 3.285487174987793, "lr": 0.0002701074529961069, "tps": 138932, "wall": 6183.6} {"step": 13109, "train_loss": 3.310028553009033, "lr": 0.00027008905197963565, "tps": 138822, "wall": 6189.0} {"step": 13110, "train_loss": 3.357999086380005, "lr": 0.0002700706503957529, "tps": 138712, "wall": 6194.4} {"step": 13111, "train_loss": 3.398104190826416, "lr": 0.00027005224824466713, "tps": 138602, "wall": 6199.8} {"step": 13112, "train_loss": 3.339268684387207, "lr": 0.0002700338455265868, "tps": 138491, "wall": 6205.2} {"step": 13113, "train_loss": 3.3401236534118652, "lr": 0.0002700154422417203, "tps": 138379, "wall": 6210.7} {"step": 13114, "train_loss": 3.3524110317230225, "lr": 0.00026999703839027616, "tps": 138270, "wall": 6216.1} {"step": 13115, "train_loss": 3.4506444931030273, "lr": 0.00026997863397246294, "tps": 138161, "wall": 6221.5} {"step": 13116, "train_loss": 3.4857099056243896, "lr": 0.000269960228988489, "tps": 138052, "wall": 6226.9} {"step": 13117, "train_loss": 3.4463939666748047, "lr": 0.0002699418234385629, "tps": 137943, "wall": 6232.3} {"step": 13118, "train_loss": 3.3722593784332275, "lr": 0.00026992341732289313, "tps": 137835, "wall": 6237.6} {"step": 13119, "train_loss": 3.327627420425415, "lr": 0.0002699050106416882, "tps": 137726, "wall": 6243.0} {"step": 13120, "train_loss": 3.357423782348633, "lr": 0.00026988660339515654, "tps": 137616, "wall": 6248.5} {"step": 13121, "train_loss": 3.468318462371826, "lr": 0.0002698681955835068, "tps": 137508, "wall": 6253.9} {"step": 13122, "train_loss": 3.4308929443359375, "lr": 0.0002698497872069474, "tps": 137401, "wall": 6259.3} {"step": 13123, "train_loss": 3.4953432083129883, "lr": 0.00026983137826568695, "tps": 137293, "wall": 6264.6} {"step": 13124, "train_loss": 3.438253164291382, "lr": 0.0002698129687599339, "tps": 137183, "wall": 6270.1} {"step": 13125, "train_loss": 3.5127995014190674, "lr": 0.0002697945586898969, "tps": 137076, "wall": 6275.5} {"step": 13126, "train_loss": 3.4768972396850586, "lr": 0.00026977614805578443, "tps": 136969, "wall": 6280.9} {"step": 13127, "train_loss": 3.4381980895996094, "lr": 0.00026975773685780505, "tps": 136862, "wall": 6286.3} {"step": 13128, "train_loss": 3.422635555267334, "lr": 0.0002697393250961674, "tps": 136755, "wall": 6291.7} {"step": 13129, "train_loss": 3.329641342163086, "lr": 0.00026972091277107995, "tps": 136649, "wall": 6297.0} {"step": 13130, "train_loss": 3.380401611328125, "lr": 0.0002697024998827512, "tps": 136543, "wall": 6302.4} {"step": 13131, "train_loss": 3.3422348499298096, "lr": 0.00026968408643138995, "tps": 136437, "wall": 6307.8} {"step": 13132, "train_loss": 3.580911159515381, "lr": 0.0002696656724172047, "tps": 136331, "wall": 6313.2} {"step": 13133, "train_loss": 3.4111781120300293, "lr": 0.000269647257840404, "tps": 136225, "wall": 6318.6} {"step": 13134, "train_loss": 3.4163734912872314, "lr": 0.0002696288427011964, "tps": 136120, "wall": 6323.9} {"step": 13135, "train_loss": 3.5277724266052246, "lr": 0.0002696104269997907, "tps": 136011, "wall": 6329.5} {"step": 13136, "train_loss": 3.3975253105163574, "lr": 0.00026959201073639536, "tps": 135905, "wall": 6334.9} {"step": 13137, "train_loss": 3.425267219543457, "lr": 0.000269573593911219, "tps": 135799, "wall": 6340.3} {"step": 13138, "train_loss": 3.4231252670288086, "lr": 0.0002695551765244704, "tps": 135693, "wall": 6345.7} {"step": 13139, "train_loss": 3.308821678161621, "lr": 0.00026953675857635794, "tps": 135588, "wall": 6351.1} {"step": 13140, "train_loss": 3.394900321960449, "lr": 0.00026951834006709043, "tps": 135483, "wall": 6356.5} {"step": 13141, "train_loss": 3.369324207305908, "lr": 0.00026949992099687656, "tps": 135378, "wall": 6362.0} {"step": 13142, "train_loss": 3.4169929027557373, "lr": 0.0002694815013659248, "tps": 135274, "wall": 6367.4} {"step": 13143, "train_loss": 3.319943904876709, "lr": 0.00026946308117444396, "tps": 135169, "wall": 6372.8} {"step": 13144, "train_loss": 3.416144371032715, "lr": 0.0002694446604226427, "tps": 135066, "wall": 6378.1} {"step": 13145, "train_loss": 3.4821345806121826, "lr": 0.00026942623911072966, "tps": 134961, "wall": 6383.6} {"step": 13146, "train_loss": 3.3878049850463867, "lr": 0.0002694078172389134, "tps": 134855, "wall": 6389.1} {"step": 13147, "train_loss": 3.4064135551452637, "lr": 0.0002693893948074028, "tps": 134753, "wall": 6394.4} {"step": 13148, "train_loss": 3.3935275077819824, "lr": 0.00026937097181640643, "tps": 134650, "wall": 6399.8} {"step": 13149, "train_loss": 3.487213611602783, "lr": 0.00026935254826613306, "tps": 134546, "wall": 6405.2} {"step": 13150, "train_loss": 3.3395047187805176, "lr": 0.0002693341241567914, "tps": 134444, "wall": 6410.6} {"step": 13151, "train_loss": 3.3814096450805664, "lr": 0.00026931569948859, "tps": 134341, "wall": 6415.9} {"step": 13152, "train_loss": 3.3868911266326904, "lr": 0.00026929727426173777, "tps": 134239, "wall": 6421.3} {"step": 13153, "train_loss": 3.425001859664917, "lr": 0.0002692788484764433, "tps": 134136, "wall": 6426.7} {"step": 13154, "train_loss": 3.4213106632232666, "lr": 0.0002692604221329154, "tps": 134033, "wall": 6432.1} {"step": 13155, "train_loss": 3.4227328300476074, "lr": 0.00026924199523136274, "tps": 133932, "wall": 6437.5} {"step": 13156, "train_loss": 3.4179258346557617, "lr": 0.00026922356777199415, "tps": 133830, "wall": 6442.9} {"step": 13157, "train_loss": 3.4609804153442383, "lr": 0.0002692051397550182, "tps": 133727, "wall": 6448.4} {"step": 13158, "train_loss": 3.3972206115722656, "lr": 0.00026918671118064387, "tps": 133626, "wall": 6453.7} {"step": 13159, "train_loss": 3.306865692138672, "lr": 0.0002691682820490798, "tps": 133524, "wall": 6459.1} {"step": 13160, "train_loss": 3.4436516761779785, "lr": 0.0002691498523605348, "tps": 133424, "wall": 6464.5} {"step": 13161, "train_loss": 3.361778736114502, "lr": 0.00026913142211521754, "tps": 133323, "wall": 6469.9} {"step": 13162, "train_loss": 3.4877686500549316, "lr": 0.000269112991313337, "tps": 133222, "wall": 6475.2} {"step": 13163, "train_loss": 3.3837890625, "lr": 0.00026909455995510165, "tps": 133122, "wall": 6480.6} {"step": 13164, "train_loss": 3.4111180305480957, "lr": 0.0002690761280407206, "tps": 133021, "wall": 6486.0} {"step": 13165, "train_loss": 3.396193504333496, "lr": 0.0002690576955704025, "tps": 132920, "wall": 6491.4} {"step": 13166, "train_loss": 3.3154520988464355, "lr": 0.0002690392625443561, "tps": 132820, "wall": 6496.8} {"step": 13167, "train_loss": 3.3751425743103027, "lr": 0.0002690208289627903, "tps": 132720, "wall": 6502.2} {"step": 13168, "train_loss": 3.308511734008789, "lr": 0.000269002394825914, "tps": 132620, "wall": 6507.6} {"step": 13169, "train_loss": 3.3990156650543213, "lr": 0.0002689839601339358, "tps": 132519, "wall": 6513.1} {"step": 13170, "train_loss": 3.2872262001037598, "lr": 0.00026896552488706477, "tps": 132420, "wall": 6518.5} {"step": 13171, "train_loss": 3.4196176528930664, "lr": 0.00026894708908550954, "tps": 132321, "wall": 6523.8} {"step": 13172, "train_loss": 3.3427326679229736, "lr": 0.000268928652729479, "tps": 132222, "wall": 6529.2} {"step": 13173, "train_loss": 3.4487133026123047, "lr": 0.0002689102158191821, "tps": 132122, "wall": 6534.6} {"step": 13174, "train_loss": 3.453754425048828, "lr": 0.00026889177835482764, "tps": 132024, "wall": 6540.0} {"step": 13175, "train_loss": 3.361238956451416, "lr": 0.0002688733403366245, "tps": 131924, "wall": 6545.4} {"step": 13176, "train_loss": 3.3877110481262207, "lr": 0.0002688549017647814, "tps": 131826, "wall": 6550.8} {"step": 13177, "train_loss": 3.362602710723877, "lr": 0.0002688364626395074, "tps": 131728, "wall": 6556.2} {"step": 13178, "train_loss": 3.3763697147369385, "lr": 0.0002688180229610113, "tps": 131630, "wall": 6561.6} {"step": 13179, "train_loss": 3.358769416809082, "lr": 0.00026879958272950203, "tps": 131532, "wall": 6566.9} {"step": 13180, "train_loss": 3.3040802478790283, "lr": 0.0002687811419451884, "tps": 131433, "wall": 6572.4} {"step": 13181, "train_loss": 3.416651964187622, "lr": 0.00026876270060827937, "tps": 131336, "wall": 6577.7} {"step": 13182, "train_loss": 3.340134620666504, "lr": 0.00026874425871898386, "tps": 131238, "wall": 6583.1} {"step": 13183, "train_loss": 3.3938841819763184, "lr": 0.0002687258162775107, "tps": 131141, "wall": 6588.5} {"step": 13184, "train_loss": 3.300354480743408, "lr": 0.00026870737328406883, "tps": 131044, "wall": 6593.9} {"step": 13185, "train_loss": 3.327549457550049, "lr": 0.0002686889297388672, "tps": 130947, "wall": 6599.3} {"step": 13186, "train_loss": 3.4609997272491455, "lr": 0.00026867048564211483, "tps": 130850, "wall": 6604.6} {"step": 13187, "train_loss": 3.379725456237793, "lr": 0.00026865204099402054, "tps": 130755, "wall": 6610.0} {"step": 13188, "train_loss": 3.2774744033813477, "lr": 0.00026863359579479333, "tps": 130658, "wall": 6615.4} {"step": 13189, "train_loss": 3.5297021865844727, "lr": 0.000268615150044642, "tps": 130562, "wall": 6620.7} {"step": 13190, "train_loss": 3.4716341495513916, "lr": 0.0002685967037437758, "tps": 130466, "wall": 6626.1} {"step": 13191, "train_loss": 3.3598906993865967, "lr": 0.00026857825689240335, "tps": 130369, "wall": 6631.5} {"step": 13192, "train_loss": 3.3274734020233154, "lr": 0.0002685598094907338, "tps": 130273, "wall": 6636.9} {"step": 13193, "train_loss": 3.3642590045928955, "lr": 0.0002685413615389762, "tps": 130178, "wall": 6642.3} {"step": 13194, "train_loss": 3.410231113433838, "lr": 0.0002685229130373393, "tps": 130083, "wall": 6647.6} {"step": 13195, "train_loss": 3.3929810523986816, "lr": 0.00026850446398603224, "tps": 129987, "wall": 6653.0} {"step": 13196, "train_loss": 3.4224963188171387, "lr": 0.000268486014385264, "tps": 129892, "wall": 6658.4} {"step": 13197, "train_loss": 3.450077533721924, "lr": 0.00026846756423524364, "tps": 129797, "wall": 6663.8} {"step": 13198, "train_loss": 3.345973253250122, "lr": 0.00026844911353618005, "tps": 129703, "wall": 6669.1} {"step": 13199, "train_loss": 3.510563373565674, "lr": 0.0002684306622882822, "tps": 129609, "wall": 6674.5} {"step": 13200, "train_loss": 3.4503703117370605, "lr": 0.0002684122104917593, "tps": 129515, "wall": 6679.8} {"step": 13201, "train_loss": 3.512453556060791, "lr": 0.00026839375814682024, "tps": 129420, "wall": 6685.2} {"step": 13202, "train_loss": 3.3643596172332764, "lr": 0.00026837530525367396, "tps": 129324, "wall": 6690.7} {"step": 13203, "train_loss": 3.4303011894226074, "lr": 0.0002683568518125298, "tps": 129231, "wall": 6696.0} {"step": 13204, "train_loss": 3.4346232414245605, "lr": 0.00026833839782359646, "tps": 129138, "wall": 6701.4} {"step": 13205, "train_loss": 3.4437477588653564, "lr": 0.0002683199432870832, "tps": 129044, "wall": 6706.7} {"step": 13206, "train_loss": 3.4262962341308594, "lr": 0.00026830148820319893, "tps": 128951, "wall": 6712.1} {"step": 13207, "train_loss": 3.383054733276367, "lr": 0.00026828303257215284, "tps": 128858, "wall": 6717.5} {"step": 13208, "train_loss": 3.443800687789917, "lr": 0.00026826457639415397, "tps": 128766, "wall": 6722.8} {"step": 13209, "train_loss": 3.3730554580688477, "lr": 0.0002682461196694113, "tps": 128673, "wall": 6728.1} {"step": 13210, "train_loss": 3.3370234966278076, "lr": 0.00026822766239813407, "tps": 128580, "wall": 6733.5} {"step": 13211, "train_loss": 3.4019951820373535, "lr": 0.0002682092045805312, "tps": 128487, "wall": 6738.9} {"step": 13212, "train_loss": 3.3824121952056885, "lr": 0.0002681907462168119, "tps": 128395, "wall": 6744.2} {"step": 13213, "train_loss": 3.4177141189575195, "lr": 0.00026817228730718516, "tps": 128300, "wall": 6749.7} {"step": 13214, "train_loss": 3.4443728923797607, "lr": 0.0002681538278518602, "tps": 128209, "wall": 6755.0} {"step": 13215, "train_loss": 3.3878321647644043, "lr": 0.00026813536785104603, "tps": 128118, "wall": 6760.3} {"step": 13216, "train_loss": 3.3869521617889404, "lr": 0.00026811690730495176, "tps": 128026, "wall": 6765.7} {"step": 13217, "train_loss": 3.432447910308838, "lr": 0.00026809844621378666, "tps": 127935, "wall": 6771.0} {"step": 13218, "train_loss": 3.4566917419433594, "lr": 0.00026807998457775977, "tps": 127844, "wall": 6776.4} {"step": 13219, "train_loss": 3.342564821243286, "lr": 0.0002680615223970802, "tps": 127753, "wall": 6781.7} {"step": 13220, "train_loss": 3.3620965480804443, "lr": 0.000268043059671957, "tps": 127662, "wall": 6787.1} {"step": 13221, "train_loss": 3.4044716358184814, "lr": 0.0002680245964025995, "tps": 127571, "wall": 6792.4} {"step": 13222, "train_loss": 3.3827452659606934, "lr": 0.0002680061325892168, "tps": 127481, "wall": 6797.7} {"step": 13223, "train_loss": 3.4487335681915283, "lr": 0.00026798766823201797, "tps": 127391, "wall": 6803.0} {"step": 13224, "train_loss": 3.4222750663757324, "lr": 0.00026796920333121234, "tps": 127300, "wall": 6808.4} {"step": 13225, "train_loss": 3.428158760070801, "lr": 0.00026795073788700885, "tps": 127210, "wall": 6813.7} {"step": 13226, "train_loss": 3.429506301879883, "lr": 0.00026793227189961683, "tps": 127120, "wall": 6819.1} {"step": 13227, "train_loss": 3.3933475017547607, "lr": 0.0002679138053692455, "tps": 127031, "wall": 6824.4} {"step": 13228, "train_loss": 3.626131296157837, "lr": 0.000267895338296104, "tps": 126942, "wall": 6829.7} {"step": 13229, "train_loss": 3.355990409851074, "lr": 0.00026787687068040143, "tps": 126852, "wall": 6835.0} {"step": 13230, "train_loss": 3.4057655334472656, "lr": 0.00026785840252234716, "tps": 126762, "wall": 6840.4} {"step": 13231, "train_loss": 3.349480390548706, "lr": 0.0002678399338221503, "tps": 126673, "wall": 6845.7} {"step": 13232, "train_loss": 3.3785014152526855, "lr": 0.0002678214645800201, "tps": 126584, "wall": 6851.0} {"step": 13233, "train_loss": 3.2804436683654785, "lr": 0.00026780299479616567, "tps": 126496, "wall": 6856.4} {"step": 13234, "train_loss": 3.379181146621704, "lr": 0.0002677845244707964, "tps": 126408, "wall": 6861.6} {"step": 13235, "train_loss": 3.383781909942627, "lr": 0.0002677660536041215, "tps": 126319, "wall": 6867.0} {"step": 13236, "train_loss": 3.4143974781036377, "lr": 0.0002677475821963501, "tps": 126229, "wall": 6872.4} {"step": 13237, "train_loss": 3.432187080383301, "lr": 0.00026772911024769153, "tps": 126141, "wall": 6877.7} {"step": 13238, "train_loss": 3.463470458984375, "lr": 0.00026771063775835497, "tps": 126053, "wall": 6883.1} {"step": 13239, "train_loss": 3.325751304626465, "lr": 0.00026769216472854974, "tps": 125965, "wall": 6888.4} {"step": 13240, "train_loss": 3.390054225921631, "lr": 0.0002676736911584851, "tps": 125877, "wall": 6893.7} {"step": 13241, "train_loss": 3.389195442199707, "lr": 0.0002676552170483703, "tps": 125790, "wall": 6899.0} {"step": 13242, "train_loss": 3.4178898334503174, "lr": 0.00026763674239841463, "tps": 125702, "wall": 6904.3} {"step": 13243, "train_loss": 3.409916877746582, "lr": 0.00026761826720882734, "tps": 125615, "wall": 6909.7} {"step": 13244, "train_loss": 3.429542064666748, "lr": 0.0002675997914798178, "tps": 125528, "wall": 6914.9} {"step": 13245, "train_loss": 3.396512031555176, "lr": 0.00026758131521159524, "tps": 125442, "wall": 6920.2} {"step": 13246, "train_loss": 3.5284245014190674, "lr": 0.00026756283840436893, "tps": 125355, "wall": 6925.5} {"step": 13247, "train_loss": 3.538771152496338, "lr": 0.0002675443610583482, "tps": 125267, "wall": 6930.9} {"step": 13248, "train_loss": 3.5013232231140137, "lr": 0.00026752588317374243, "tps": 125180, "wall": 6936.3} {"step": 13249, "train_loss": 3.45729398727417, "lr": 0.0002675074047507608, "tps": 125093, "wall": 6941.6} {"step": 13250, "train_loss": 3.369274854660034, "lr": 0.0002674889257896128, "tps": 125007, "wall": 6946.9} {"step": 13251, "train_loss": 3.463879108428955, "lr": 0.0002674704462905077, "tps": 124922, "wall": 6952.2} {"step": 13252, "train_loss": 3.445521831512451, "lr": 0.00026745196625365476, "tps": 124836, "wall": 6957.5} {"step": 13253, "train_loss": 3.4240024089813232, "lr": 0.0002674334856792634, "tps": 124750, "wall": 6962.8} {"step": 13254, "train_loss": 3.3662354946136475, "lr": 0.0002674150045675429, "tps": 124664, "wall": 6968.1} {"step": 13255, "train_loss": 3.3878092765808105, "lr": 0.00026739652291870274, "tps": 124579, "wall": 6973.4} {"step": 13256, "train_loss": 3.355898380279541, "lr": 0.00026737804073295214, "tps": 124493, "wall": 6978.7} {"step": 13257, "train_loss": 3.3887829780578613, "lr": 0.0002673595580105006, "tps": 124408, "wall": 6984.0} {"step": 13258, "train_loss": 3.326691150665283, "lr": 0.00026734107475155736, "tps": 124321, "wall": 6989.5} {"step": 13259, "train_loss": 3.470402240753174, "lr": 0.00026732259095633184, "tps": 124237, "wall": 6994.7} {"step": 13260, "train_loss": 3.3906795978546143, "lr": 0.0002673041066250335, "tps": 124151, "wall": 7000.1} {"step": 13261, "train_loss": 3.412402629852295, "lr": 0.0002672856217578717, "tps": 124066, "wall": 7005.4} {"step": 13262, "train_loss": 3.4462101459503174, "lr": 0.0002672671363550558, "tps": 123981, "wall": 7010.8} {"step": 13263, "train_loss": 3.343301296234131, "lr": 0.0002672486504167952, "tps": 123896, "wall": 7016.1} {"step": 13264, "train_loss": 3.369328260421753, "lr": 0.00026723016394329945, "tps": 123811, "wall": 7021.4} {"step": 13265, "train_loss": 3.2828283309936523, "lr": 0.0002672116769347777, "tps": 123727, "wall": 7026.8} {"step": 13266, "train_loss": 3.3945178985595703, "lr": 0.0002671931893914396, "tps": 123643, "wall": 7032.1} {"step": 13267, "train_loss": 3.378443479537964, "lr": 0.00026717470131349443, "tps": 123559, "wall": 7037.3} {"step": 13268, "train_loss": 3.2624475955963135, "lr": 0.0002671562127011517, "tps": 123475, "wall": 7042.7} {"step": 13269, "train_loss": 3.3125832080841064, "lr": 0.0002671377235546209, "tps": 123391, "wall": 7048.0} {"step": 13270, "train_loss": 3.4810988903045654, "lr": 0.00026711923387411134, "tps": 123306, "wall": 7053.4} {"step": 13271, "train_loss": 3.3333778381347656, "lr": 0.0002671007436598326, "tps": 123222, "wall": 7058.7} {"step": 13272, "train_loss": 3.3888278007507324, "lr": 0.0002670822529119941, "tps": 123139, "wall": 7064.0} {"step": 13273, "train_loss": 3.430786609649658, "lr": 0.00026706376163080535, "tps": 123055, "wall": 7069.4} {"step": 13274, "train_loss": 3.437098264694214, "lr": 0.00026704526981647563, "tps": 122972, "wall": 7074.7} {"step": 13275, "train_loss": 3.412966728210449, "lr": 0.0002670267774692146, "tps": 122889, "wall": 7080.0} {"step": 13276, "train_loss": 3.4384799003601074, "lr": 0.0002670082845892317, "tps": 122806, "wall": 7085.3} {"step": 13277, "train_loss": 3.4114389419555664, "lr": 0.0002669897911767364, "tps": 122723, "wall": 7090.6} {"step": 13278, "train_loss": 3.4679014682769775, "lr": 0.00026697129723193824, "tps": 122641, "wall": 7095.9} {"step": 13279, "train_loss": 3.3557400703430176, "lr": 0.00026695280275504667, "tps": 122559, "wall": 7101.2} {"step": 13280, "train_loss": 3.4820446968078613, "lr": 0.00026693430774627115, "tps": 122476, "wall": 7106.5} {"step": 13281, "train_loss": 3.3167359828948975, "lr": 0.0002669158122058213, "tps": 122392, "wall": 7111.9} {"step": 13282, "train_loss": 3.3485774993896484, "lr": 0.0002668973161339066, "tps": 122310, "wall": 7117.3} {"step": 13283, "train_loss": 3.359855890274048, "lr": 0.0002668788195307366, "tps": 122227, "wall": 7122.6} {"step": 13284, "train_loss": 3.4158902168273926, "lr": 0.0002668603223965207, "tps": 122146, "wall": 7127.9} {"step": 13285, "train_loss": 3.3362345695495605, "lr": 0.00026684182473146864, "tps": 122065, "wall": 7133.2} {"step": 13286, "train_loss": 3.412627696990967, "lr": 0.00026682332653578974, "tps": 121983, "wall": 7138.5} {"step": 13287, "train_loss": 3.3767993450164795, "lr": 0.00026680482780969367, "tps": 121902, "wall": 7143.8} {"step": 13288, "train_loss": 3.3547139167785645, "lr": 0.0002667863285533901, "tps": 121819, "wall": 7149.2} {"step": 13289, "train_loss": 3.423696994781494, "lr": 0.00026676782876708843, "tps": 121738, "wall": 7154.5} {"step": 13290, "train_loss": 3.4395313262939453, "lr": 0.00026674932845099816, "tps": 121657, "wall": 7159.7} {"step": 13291, "train_loss": 3.3815102577209473, "lr": 0.00026673082760532906, "tps": 121577, "wall": 7165.0} {"step": 13292, "train_loss": 3.354290008544922, "lr": 0.0002667123262302906, "tps": 121494, "wall": 7170.4} {"step": 13293, "train_loss": 3.419682025909424, "lr": 0.00026669382432609233, "tps": 121413, "wall": 7175.7} {"step": 13294, "train_loss": 3.397641658782959, "lr": 0.00026667532189294396, "tps": 121333, "wall": 7181.0} {"step": 13295, "train_loss": 3.3627891540527344, "lr": 0.000266656818931055, "tps": 121253, "wall": 7186.3} {"step": 13296, "train_loss": 3.390814781188965, "lr": 0.00026663831544063507, "tps": 121172, "wall": 7191.6} {"step": 13297, "train_loss": 3.4075441360473633, "lr": 0.0002666198114218938, "tps": 121092, "wall": 7196.9} {"step": 13298, "train_loss": 3.3638155460357666, "lr": 0.0002666013068750408, "tps": 121013, "wall": 7202.2} {"step": 13299, "train_loss": 3.3341915607452393, "lr": 0.00026658280180028563, "tps": 120932, "wall": 7207.6} {"step": 13300, "train_loss": 3.387557029724121, "lr": 0.00026656429619783796, "tps": 120852, "wall": 7212.9} {"step": 13301, "train_loss": 3.454359531402588, "lr": 0.0002665457900679074, "tps": 120772, "wall": 7218.2} {"step": 13302, "train_loss": 3.265033721923828, "lr": 0.00026652728341070367, "tps": 120692, "wall": 7223.5} {"step": 13303, "train_loss": 3.4068901538848877, "lr": 0.00026650877622643636, "tps": 120612, "wall": 7228.9} {"step": 13304, "train_loss": 3.4841816425323486, "lr": 0.00026649026851531505, "tps": 120532, "wall": 7234.2} {"step": 13305, "train_loss": 3.3754076957702637, "lr": 0.0002664717602775495, "tps": 120453, "wall": 7239.5} {"step": 13306, "train_loss": 3.3477189540863037, "lr": 0.00026645325151334936, "tps": 120374, "wall": 7244.8} {"step": 13307, "train_loss": 3.4508094787597656, "lr": 0.00026643474222292425, "tps": 120295, "wall": 7250.1} {"step": 13308, "train_loss": 3.418750047683716, "lr": 0.0002664162324064838, "tps": 120216, "wall": 7255.4} {"step": 13309, "train_loss": 3.3713479042053223, "lr": 0.00026639772206423786, "tps": 120137, "wall": 7260.7} {"step": 13310, "train_loss": 3.3940682411193848, "lr": 0.00026637921119639606, "tps": 120058, "wall": 7266.0} {"step": 13311, "train_loss": 3.3059940338134766, "lr": 0.00026636069980316793, "tps": 119981, "wall": 7271.3} {"step": 13312, "train_loss": 3.4309821128845215, "lr": 0.00026634218788476334, "tps": 119902, "wall": 7276.6} {"step": 13313, "train_loss": 3.354948043823242, "lr": 0.0002663236754413919, "tps": 119824, "wall": 7281.9} {"step": 13314, "train_loss": 3.413801670074463, "lr": 0.00026630516247326335, "tps": 119746, "wall": 7287.2} {"step": 13315, "train_loss": 3.4706521034240723, "lr": 0.00026628664898058755, "tps": 119667, "wall": 7292.5} {"step": 13316, "train_loss": 3.3516221046447754, "lr": 0.0002662681349635739, "tps": 119589, "wall": 7297.8} {"step": 13317, "train_loss": 3.475473403930664, "lr": 0.00026624962042243243, "tps": 119511, "wall": 7303.1} {"step": 13318, "train_loss": 3.4541921615600586, "lr": 0.0002662311053573727, "tps": 119434, "wall": 7308.4} {"step": 13319, "train_loss": 3.3317081928253174, "lr": 0.00026621258976860455, "tps": 119356, "wall": 7313.7} {"step": 13320, "train_loss": 3.5175509452819824, "lr": 0.0002661940736563377, "tps": 119279, "wall": 7319.0} {"step": 13321, "train_loss": 3.402590274810791, "lr": 0.00026617555702078177, "tps": 119202, "wall": 7324.3} {"step": 13322, "train_loss": 3.454270839691162, "lr": 0.0002661570398621468, "tps": 119124, "wall": 7329.6} {"step": 13323, "train_loss": 3.4641330242156982, "lr": 0.0002661385221806422, "tps": 119047, "wall": 7334.9} {"step": 13324, "train_loss": 3.3524746894836426, "lr": 0.00026612000397647806, "tps": 118970, "wall": 7340.2} {"step": 13325, "train_loss": 3.425441265106201, "lr": 0.000266101485249864, "tps": 118893, "wall": 7345.5} {"step": 13326, "train_loss": 3.460916519165039, "lr": 0.00026608296600100977, "tps": 118815, "wall": 7350.9} {"step": 13327, "train_loss": 3.363020420074463, "lr": 0.00026606444623012527, "tps": 118739, "wall": 7356.1} {"step": 13328, "train_loss": 3.373016357421875, "lr": 0.0002660459259374202, "tps": 118662, "wall": 7361.4} {"step": 13329, "train_loss": 3.558903694152832, "lr": 0.0002660274051231044, "tps": 118586, "wall": 7366.7} {"step": 13330, "train_loss": 3.3639321327209473, "lr": 0.00026600888378738765, "tps": 118509, "wall": 7372.1} {"step": 13331, "train_loss": 3.4891910552978516, "lr": 0.00026599036193047975, "tps": 118433, "wall": 7377.3} {"step": 13332, "train_loss": 3.457918882369995, "lr": 0.0002659718395525906, "tps": 118357, "wall": 7382.6} {"step": 13333, "train_loss": 3.386995553970337, "lr": 0.00026595331665392994, "tps": 118281, "wall": 7388.0} {"step": 13334, "train_loss": 3.3319931030273438, "lr": 0.0002659347932347076, "tps": 118205, "wall": 7393.2} {"step": 13335, "train_loss": 3.3253936767578125, "lr": 0.00026591626929513344, "tps": 118129, "wall": 7398.5} {"step": 13336, "train_loss": 3.3598527908325195, "lr": 0.0002658977448354174, "tps": 118054, "wall": 7403.8} {"step": 13337, "train_loss": 3.421731948852539, "lr": 0.00026587921985576907, "tps": 117977, "wall": 7409.2} {"step": 13338, "train_loss": 3.3475701808929443, "lr": 0.00026586069435639853, "tps": 117902, "wall": 7414.5} {"step": 13339, "train_loss": 3.4367289543151855, "lr": 0.0002658421683375156, "tps": 117826, "wall": 7419.8} {"step": 13340, "train_loss": 3.257296085357666, "lr": 0.00026582364179933004, "tps": 117751, "wall": 7425.1} {"step": 13341, "train_loss": 3.4011647701263428, "lr": 0.00026580511474205183, "tps": 117676, "wall": 7430.4} {"step": 13342, "train_loss": 3.4965124130249023, "lr": 0.00026578658716589073, "tps": 117601, "wall": 7435.7} {"step": 13343, "train_loss": 3.520639657974243, "lr": 0.0002657680590710568, "tps": 117526, "wall": 7441.0} {"step": 13344, "train_loss": 3.3217697143554688, "lr": 0.0002657495304577597, "tps": 117451, "wall": 7446.3} {"step": 13345, "train_loss": 3.3559353351593018, "lr": 0.0002657310013262095, "tps": 117377, "wall": 7451.6} {"step": 13346, "train_loss": 3.3965320587158203, "lr": 0.00026571247167661615, "tps": 117302, "wall": 7456.9} {"step": 13347, "train_loss": 3.469987154006958, "lr": 0.0002656939415091893, "tps": 117228, "wall": 7462.2} {"step": 13348, "train_loss": 3.3389017581939697, "lr": 0.000265675410824139, "tps": 117154, "wall": 7467.4} {"step": 13349, "train_loss": 3.465029716491699, "lr": 0.0002656568796216753, "tps": 117078, "wall": 7472.8} {"step": 13350, "train_loss": 3.3342888355255127, "lr": 0.00026563834790200794, "tps": 117004, "wall": 7478.1} {"step": 13351, "train_loss": 3.4699974060058594, "lr": 0.0002656198156653468, "tps": 116930, "wall": 7483.4} {"step": 13352, "train_loss": 3.4593186378479004, "lr": 0.0002656012829119021, "tps": 116856, "wall": 7488.7} {"step": 13353, "train_loss": 3.292772054672241, "lr": 0.0002655827496418835, "tps": 116782, "wall": 7494.0} {"step": 13354, "train_loss": 3.505110740661621, "lr": 0.0002655642158555011, "tps": 116708, "wall": 7499.3} {"step": 13355, "train_loss": 3.403071403503418, "lr": 0.00026554568155296473, "tps": 116635, "wall": 7504.6} {"step": 13356, "train_loss": 3.34391450881958, "lr": 0.00026552714673448453, "tps": 116561, "wall": 7509.9} {"step": 13357, "train_loss": 3.360124111175537, "lr": 0.0002655086114002702, "tps": 116488, "wall": 7515.2} {"step": 13358, "train_loss": 3.341731309890747, "lr": 0.000265490075550532, "tps": 116415, "wall": 7520.5} {"step": 13359, "train_loss": 3.394467353820801, "lr": 0.0002654715391854796, "tps": 116341, "wall": 7525.8} {"step": 13360, "train_loss": 3.4742631912231445, "lr": 0.0002654530023053233, "tps": 116267, "wall": 7531.1} {"step": 13361, "train_loss": 3.4133033752441406, "lr": 0.00026543446491027287, "tps": 116194, "wall": 7536.4} {"step": 13362, "train_loss": 3.3803441524505615, "lr": 0.00026541592700053836, "tps": 116121, "wall": 7541.7} {"step": 13363, "train_loss": 3.4105987548828125, "lr": 0.00026539738857632976, "tps": 116049, "wall": 7547.0} {"step": 13364, "train_loss": 3.346127986907959, "lr": 0.0002653788496378571, "tps": 115976, "wall": 7552.3} {"step": 13365, "train_loss": 3.382296085357666, "lr": 0.00026536031018533035, "tps": 115903, "wall": 7557.6} {"step": 13366, "train_loss": 3.4097981452941895, "lr": 0.00026534177021895957, "tps": 115831, "wall": 7562.9} {"step": 13367, "train_loss": 3.395718574523926, "lr": 0.0002653232297389548, "tps": 115758, "wall": 7568.2} {"step": 13368, "train_loss": 3.454033613204956, "lr": 0.000265304688745526, "tps": 115687, "wall": 7573.4} {"step": 13369, "train_loss": 3.433797597885132, "lr": 0.00026528614723888324, "tps": 115614, "wall": 7578.8} {"step": 13370, "train_loss": 3.3182215690612793, "lr": 0.00026526760521923656, "tps": 115542, "wall": 7584.1} {"step": 13371, "train_loss": 3.3451833724975586, "lr": 0.000265249062686796, "tps": 115468, "wall": 7589.5} {"step": 13372, "train_loss": 3.348287582397461, "lr": 0.00026523051964177154, "tps": 115397, "wall": 7594.7} {"step": 13373, "train_loss": 3.407102584838867, "lr": 0.0002652119760843734, "tps": 115326, "wall": 7600.0} {"step": 13374, "train_loss": 3.4326417446136475, "lr": 0.0002651934320148115, "tps": 115254, "wall": 7605.3} {"step": 13375, "train_loss": 3.4351630210876465, "lr": 0.0002651748874332959, "tps": 115183, "wall": 7610.6} {"step": 13376, "train_loss": 3.3502986431121826, "lr": 0.00026515634234003686, "tps": 115111, "wall": 7615.9} {"step": 13377, "train_loss": 3.3980014324188232, "lr": 0.0002651377967352443, "tps": 115040, "wall": 7621.1} {"step": 13378, "train_loss": 3.4140210151672363, "lr": 0.00026511925061912834, "tps": 114969, "wall": 7626.4} {"step": 13379, "train_loss": 3.363574743270874, "lr": 0.000265100703991899, "tps": 114898, "wall": 7631.7} {"step": 13380, "train_loss": 3.429497241973877, "lr": 0.0002650821568537665, "tps": 114827, "wall": 7637.0} {"step": 13381, "train_loss": 3.443521022796631, "lr": 0.00026506360920494084, "tps": 114756, "wall": 7642.3} {"step": 13382, "train_loss": 3.3444273471832275, "lr": 0.00026504506104563225, "tps": 114685, "wall": 7647.6} {"step": 13383, "train_loss": 3.399506092071533, "lr": 0.0002650265123760507, "tps": 114613, "wall": 7653.0} {"step": 13384, "train_loss": 3.334341049194336, "lr": 0.00026500796319640647, "tps": 114542, "wall": 7658.3} {"step": 13385, "train_loss": 3.4162027835845947, "lr": 0.00026498941350690947, "tps": 114472, "wall": 7663.5} {"step": 13386, "train_loss": 3.448706865310669, "lr": 0.00026497086330777006, "tps": 114402, "wall": 7668.8} {"step": 13387, "train_loss": 3.5040228366851807, "lr": 0.00026495231259919826, "tps": 114331, "wall": 7674.1} {"step": 13388, "train_loss": 3.359856367111206, "lr": 0.0002649337613814042, "tps": 114261, "wall": 7679.4} {"step": 13389, "train_loss": 3.50772762298584, "lr": 0.00026491520965459805, "tps": 114191, "wall": 7684.7} {"step": 13390, "train_loss": 3.4046411514282227, "lr": 0.00026489665741899005, "tps": 114121, "wall": 7690.0} {"step": 13391, "train_loss": 3.392930507659912, "lr": 0.00026487810467479023, "tps": 114051, "wall": 7695.3} {"step": 13392, "train_loss": 3.3969359397888184, "lr": 0.00026485955142220883, "tps": 113981, "wall": 7700.6} {"step": 13393, "train_loss": 3.349876880645752, "lr": 0.00026484099766145596, "tps": 113911, "wall": 7705.9} {"step": 13394, "train_loss": 3.39276385307312, "lr": 0.00026482244339274196, "tps": 113840, "wall": 7711.2} {"step": 13395, "train_loss": 3.413083791732788, "lr": 0.00026480388861627673, "tps": 113771, "wall": 7716.6} {"step": 13396, "train_loss": 3.449075698852539, "lr": 0.0002647853333322707, "tps": 113701, "wall": 7721.9} {"step": 13397, "train_loss": 3.4088668823242188, "lr": 0.00026476677754093403, "tps": 113631, "wall": 7727.2} {"step": 13398, "train_loss": 3.366586446762085, "lr": 0.00026474822124247685, "tps": 113562, "wall": 7732.5} {"step": 13399, "train_loss": 3.365731954574585, "lr": 0.00026472966443710945, "tps": 113493, "wall": 7737.7} {"step": 13400, "train_loss": 3.4087157249450684, "lr": 0.00026471110712504196, "tps": 113424, "wall": 7743.0} {"step": 13401, "train_loss": 3.426443576812744, "lr": 0.00026469254930648454, "tps": 113355, "wall": 7748.3} {"step": 13402, "train_loss": 3.371699810028076, "lr": 0.00026467399098164764, "tps": 113286, "wall": 7753.6} {"step": 13403, "train_loss": 3.428051710128784, "lr": 0.0002646554321507412, "tps": 113217, "wall": 7758.9} {"step": 13404, "train_loss": 3.3449862003326416, "lr": 0.0002646368728139758, "tps": 113148, "wall": 7764.2} {"step": 13405, "train_loss": 3.3670506477355957, "lr": 0.00026461831297156137, "tps": 113078, "wall": 7769.6} {"step": 13406, "train_loss": 3.3298544883728027, "lr": 0.0002645997526237082, "tps": 113010, "wall": 7774.9} {"step": 13407, "train_loss": 3.3132872581481934, "lr": 0.00026458119177062684, "tps": 112942, "wall": 7780.1} {"step": 13408, "train_loss": 3.4909892082214355, "lr": 0.00026456263041252717, "tps": 112874, "wall": 7785.4} {"step": 13409, "train_loss": 3.3991570472717285, "lr": 0.00026454406854961967, "tps": 112805, "wall": 7790.7} {"step": 13410, "train_loss": 3.3824872970581055, "lr": 0.0002645255061821145, "tps": 112737, "wall": 7796.0} {"step": 13411, "train_loss": 3.4936587810516357, "lr": 0.00026450694331022205, "tps": 112669, "wall": 7801.3} {"step": 13412, "train_loss": 3.4521026611328125, "lr": 0.00026448837993415245, "tps": 112601, "wall": 7806.6} {"step": 13413, "train_loss": 3.3017239570617676, "lr": 0.00026446981605411613, "tps": 112533, "wall": 7811.9} {"step": 13414, "train_loss": 3.4497995376586914, "lr": 0.00026445125167032333, "tps": 112465, "wall": 7817.2} {"step": 13415, "train_loss": 3.3573155403137207, "lr": 0.00026443268678298437, "tps": 112398, "wall": 7822.4} {"step": 13416, "train_loss": 3.395474433898926, "lr": 0.0002644141213923095, "tps": 112331, "wall": 7827.7} {"step": 13417, "train_loss": 3.3725104331970215, "lr": 0.0002643955554985091, "tps": 112262, "wall": 7833.1} {"step": 13418, "train_loss": 3.4858851432800293, "lr": 0.0002643769891017934, "tps": 112195, "wall": 7838.4} {"step": 13419, "train_loss": 3.3209118843078613, "lr": 0.00026435842220237275, "tps": 112127, "wall": 7843.7} {"step": 13420, "train_loss": 3.341654062271118, "lr": 0.0002643398548004575, "tps": 112060, "wall": 7849.0} {"step": 13421, "train_loss": 3.386521339416504, "lr": 0.00026432128689625803, "tps": 111992, "wall": 7854.3} {"step": 13422, "train_loss": 3.374621868133545, "lr": 0.0002643027184899846, "tps": 111925, "wall": 7859.6} {"step": 13423, "train_loss": 3.3376927375793457, "lr": 0.00026428414958184755, "tps": 111858, "wall": 7864.9} {"step": 13424, "train_loss": 3.338606595993042, "lr": 0.00026426558017205733, "tps": 111792, "wall": 7870.2} {"step": 13425, "train_loss": 3.382345676422119, "lr": 0.00026424701026082415, "tps": 111724, "wall": 7875.5} {"step": 13426, "train_loss": 3.3737564086914062, "lr": 0.00026422843984835845, "tps": 111658, "wall": 7880.8} {"step": 13427, "train_loss": 3.317237377166748, "lr": 0.0002642098689348706, "tps": 111591, "wall": 7886.0} {"step": 13428, "train_loss": 3.4457108974456787, "lr": 0.00026419129752057094, "tps": 111524, "wall": 7891.4} {"step": 13429, "train_loss": 3.3694005012512207, "lr": 0.0002641727256056699, "tps": 111457, "wall": 7896.7} {"step": 13430, "train_loss": 3.4569616317749023, "lr": 0.00026415415319037787, "tps": 111391, "wall": 7902.0} {"step": 13431, "train_loss": 3.3887624740600586, "lr": 0.00026413558027490514, "tps": 111325, "wall": 7907.3} {"step": 13432, "train_loss": 3.4512252807617188, "lr": 0.00026411700685946224, "tps": 111259, "wall": 7912.6} {"step": 13433, "train_loss": 3.379138469696045, "lr": 0.00026409843294425943, "tps": 111192, "wall": 7917.9} {"step": 13434, "train_loss": 3.411867618560791, "lr": 0.0002640798585295072, "tps": 111127, "wall": 7923.1} {"step": 13435, "train_loss": 3.398298740386963, "lr": 0.000264061283615416, "tps": 111061, "wall": 7928.4} {"step": 13436, "train_loss": 3.386934757232666, "lr": 0.0002640427082021961, "tps": 110995, "wall": 7933.7} {"step": 13437, "train_loss": 3.3608927726745605, "lr": 0.00026402413229005805, "tps": 110930, "wall": 7939.0} {"step": 13438, "train_loss": 3.371349811553955, "lr": 0.00026400555587921233, "tps": 110864, "wall": 7944.3} {"step": 13439, "train_loss": 3.3054192066192627, "lr": 0.0002639869789698692, "tps": 110797, "wall": 7949.6} {"step": 13440, "train_loss": 3.3415563106536865, "lr": 0.0002639684015622393, "tps": 110732, "wall": 7954.9} {"step": 13441, "train_loss": 3.1892101764678955, "lr": 0.0002639498236565328, "tps": 110667, "wall": 7960.2} {"step": 13442, "train_loss": 3.3818657398223877, "lr": 0.0002639312452529605, "tps": 110602, "wall": 7965.5} {"step": 13443, "train_loss": 3.385364055633545, "lr": 0.00026391266635173257, "tps": 110536, "wall": 7970.8} {"step": 13444, "train_loss": 3.265190362930298, "lr": 0.0002638940869530596, "tps": 110470, "wall": 7976.1} {"step": 13445, "train_loss": 3.402125358581543, "lr": 0.0002638755070571521, "tps": 110405, "wall": 7981.4} {"step": 13446, "train_loss": 3.3888087272644043, "lr": 0.0002638569266642204, "tps": 110340, "wall": 7986.7} {"step": 13447, "train_loss": 3.4235100746154785, "lr": 0.00026383834577447504, "tps": 110276, "wall": 7992.0} {"step": 13448, "train_loss": 3.3994503021240234, "lr": 0.0002638197643881266, "tps": 110211, "wall": 7997.3} {"step": 13449, "train_loss": 3.22634220123291, "lr": 0.00026380118250538546, "tps": 110146, "wall": 8002.6} {"step": 13450, "train_loss": 3.325821876525879, "lr": 0.00026378260012646215, "tps": 110081, "wall": 8007.9} {"step": 13451, "train_loss": 3.399848699569702, "lr": 0.0002637640172515672, "tps": 110016, "wall": 8013.2} {"step": 13452, "train_loss": 3.340703248977661, "lr": 0.0002637454338809111, "tps": 109952, "wall": 8018.5} {"step": 13453, "train_loss": 3.375077247619629, "lr": 0.00026372685001470434, "tps": 109888, "wall": 8023.8} {"step": 13454, "train_loss": 3.2021985054016113, "lr": 0.00026370826565315743, "tps": 109823, "wall": 8029.1} {"step": 13455, "train_loss": 3.4414024353027344, "lr": 0.000263689680796481, "tps": 109759, "wall": 8034.4} {"step": 13456, "train_loss": 3.28752064704895, "lr": 0.00026367109544488544, "tps": 109696, "wall": 8039.7} {"step": 13457, "train_loss": 3.348076820373535, "lr": 0.0002636525095985814, "tps": 109632, "wall": 8044.9} {"step": 13458, "train_loss": 3.4757096767425537, "lr": 0.00026363392325777924, "tps": 109567, "wall": 8050.3} {"step": 13459, "train_loss": 3.4554882049560547, "lr": 0.0002636153364226898, "tps": 109504, "wall": 8055.5} {"step": 13460, "train_loss": 3.455343723297119, "lr": 0.00026359674909352343, "tps": 109440, "wall": 8060.8} {"step": 13461, "train_loss": 3.362541913986206, "lr": 0.00026357816127049066, "tps": 109376, "wall": 8066.1} {"step": 13462, "train_loss": 3.4791312217712402, "lr": 0.0002635595729538022, "tps": 109312, "wall": 8071.5} {"step": 13463, "train_loss": 3.339794397354126, "lr": 0.00026354098414366846, "tps": 109249, "wall": 8076.7} {"step": 13464, "train_loss": 3.3343141078948975, "lr": 0.00026352239484030013, "tps": 109186, "wall": 8082.0} {"step": 13465, "train_loss": 3.413278818130493, "lr": 0.00026350380504390784, "tps": 109122, "wall": 8087.3} {"step": 13466, "train_loss": 3.4294419288635254, "lr": 0.00026348521475470197, "tps": 109059, "wall": 8092.6} {"step": 13467, "train_loss": 3.3865723609924316, "lr": 0.0002634666239728933, "tps": 108996, "wall": 8097.9} {"step": 13468, "train_loss": 3.4883742332458496, "lr": 0.0002634480326986923, "tps": 108932, "wall": 8103.2} {"step": 13469, "train_loss": 3.4121875762939453, "lr": 0.00026342944093230974, "tps": 108869, "wall": 8108.5} {"step": 13470, "train_loss": 3.3369030952453613, "lr": 0.0002634108486739561, "tps": 108806, "wall": 8113.8} {"step": 13471, "train_loss": 3.3491148948669434, "lr": 0.0002633922559238419, "tps": 108744, "wall": 8119.1} {"step": 13472, "train_loss": 3.3748769760131836, "lr": 0.00026337366268217797, "tps": 108681, "wall": 8124.3} {"step": 13473, "train_loss": 3.2949421405792236, "lr": 0.0002633550689491748, "tps": 108617, "wall": 8129.7} {"step": 13474, "train_loss": 3.452833652496338, "lr": 0.0002633364747250431, "tps": 108555, "wall": 8135.0} {"step": 13475, "train_loss": 3.4811129570007324, "lr": 0.00026331788000999353, "tps": 108492, "wall": 8140.3} {"step": 13476, "train_loss": 3.3508148193359375, "lr": 0.00026329928480423655, "tps": 108430, "wall": 8145.6} {"step": 13477, "train_loss": 3.3349666595458984, "lr": 0.000263280689107983, "tps": 108368, "wall": 8150.9} {"step": 13478, "train_loss": 3.472033977508545, "lr": 0.00026326209292144344, "tps": 108305, "wall": 8156.2} {"step": 13479, "train_loss": 3.438810348510742, "lr": 0.0002632434962448286, "tps": 108244, "wall": 8161.4} {"step": 13480, "train_loss": 3.3338003158569336, "lr": 0.00026322489907834904, "tps": 108182, "wall": 8166.7} {"step": 13481, "train_loss": 3.3510732650756836, "lr": 0.0002632063014222155, "tps": 108120, "wall": 8172.0} {"step": 13482, "train_loss": 3.336552619934082, "lr": 0.00026318770327663865, "tps": 108058, "wall": 8177.3} {"step": 13483, "train_loss": 3.302886486053467, "lr": 0.00026316910464182916, "tps": 107996, "wall": 8182.6} {"step": 13484, "train_loss": 3.3057188987731934, "lr": 0.0002631505055179977, "tps": 107934, "wall": 8187.8} {"step": 13485, "train_loss": 3.366236686706543, "lr": 0.00026313190590535496, "tps": 107872, "wall": 8193.2} {"step": 13486, "train_loss": 3.354205846786499, "lr": 0.00026311330580411173, "tps": 107811, "wall": 8198.4} {"step": 13487, "train_loss": 3.28354811668396, "lr": 0.00026309470521447857, "tps": 107750, "wall": 8203.7} {"step": 13488, "train_loss": 3.2921934127807617, "lr": 0.0002630761041366663, "tps": 107689, "wall": 8208.9} {"step": 13489, "train_loss": 3.3941762447357178, "lr": 0.0002630575025708856, "tps": 107627, "wall": 8214.2} {"step": 13490, "train_loss": 3.4150242805480957, "lr": 0.0002630389005173471, "tps": 107566, "wall": 8219.5} {"step": 13491, "train_loss": 3.4213919639587402, "lr": 0.00026302029797626165, "tps": 107505, "wall": 8224.8} {"step": 13492, "train_loss": 3.2725985050201416, "lr": 0.00026300169494784, "tps": 107444, "wall": 8230.1} {"step": 13493, "train_loss": 3.419149160385132, "lr": 0.0002629830914322928, "tps": 107383, "wall": 8235.3} {"step": 13494, "train_loss": 3.2752766609191895, "lr": 0.0002629644874298307, "tps": 107322, "wall": 8240.6} {"step": 13495, "train_loss": 3.423919916152954, "lr": 0.00026294588294066464, "tps": 107262, "wall": 8245.9} {"step": 13496, "train_loss": 3.302478313446045, "lr": 0.00026292727796500533, "tps": 107200, "wall": 8251.3} {"step": 13497, "train_loss": 3.3465354442596436, "lr": 0.00026290867250306345, "tps": 107139, "wall": 8256.6} {"step": 13498, "train_loss": 3.3979477882385254, "lr": 0.00026289006655504983, "tps": 107078, "wall": 8261.9} {"step": 13499, "train_loss": 3.404844284057617, "lr": 0.0002628714601211752, "tps": 107018, "wall": 8267.1} {"step": 13500, "train_loss": 3.2181742191314697, "lr": 0.0002628528532016504, "tps": 106958, "wall": 8272.4} {"step": 13501, "train_loss": 3.369692802429199, "lr": 0.0002628342457966861, "tps": 106895, "wall": 8277.8} {"step": 13502, "train_loss": 3.339995861053467, "lr": 0.00026281563790649316, "tps": 106835, "wall": 8283.2} {"step": 13503, "train_loss": 3.4385976791381836, "lr": 0.0002627970295312824, "tps": 106774, "wall": 8288.5} {"step": 13504, "train_loss": 3.371431350708008, "lr": 0.0002627784206712645, "tps": 106714, "wall": 8293.7} {"step": 13505, "train_loss": 3.279874086380005, "lr": 0.0002627598113266504, "tps": 106654, "wall": 8299.0} {"step": 13506, "train_loss": 3.267800807952881, "lr": 0.00026274120149765085, "tps": 106595, "wall": 8304.3} {"step": 13507, "train_loss": 3.3653926849365234, "lr": 0.0002627225911844766, "tps": 106533, "wall": 8309.7} {"step": 13508, "train_loss": 3.3789446353912354, "lr": 0.0002627039803873385, "tps": 106474, "wall": 8314.9} {"step": 13509, "train_loss": 3.4370365142822266, "lr": 0.00026268536910644747, "tps": 106414, "wall": 8320.2} {"step": 13510, "train_loss": 3.348275661468506, "lr": 0.00026266675734201424, "tps": 106355, "wall": 8325.5} {"step": 13511, "train_loss": 3.3819289207458496, "lr": 0.0002626481450942497, "tps": 106295, "wall": 8330.7} {"step": 13512, "train_loss": 3.4300570487976074, "lr": 0.0002626295323633646, "tps": 106236, "wall": 8336.0} {"step": 13513, "train_loss": 3.496594190597534, "lr": 0.00026261091914956997, "tps": 106176, "wall": 8341.3} {"step": 13514, "train_loss": 3.398560047149658, "lr": 0.0002625923054530765, "tps": 106117, "wall": 8346.6} {"step": 13515, "train_loss": 3.444056749343872, "lr": 0.00026257369127409504, "tps": 106058, "wall": 8351.9} {"step": 13516, "train_loss": 3.370553970336914, "lr": 0.00026255507661283655, "tps": 105998, "wall": 8357.2} {"step": 13517, "train_loss": 3.396413803100586, "lr": 0.0002625364614695118, "tps": 105939, "wall": 8362.5} {"step": 13518, "train_loss": 3.458265781402588, "lr": 0.00026251784584433173, "tps": 105880, "wall": 8367.7} {"step": 13519, "train_loss": 3.263092517852783, "lr": 0.00026249922973750725, "tps": 105820, "wall": 8373.1} {"step": 13520, "train_loss": 3.398670196533203, "lr": 0.00026248061314924914, "tps": 105761, "wall": 8378.4} {"step": 13521, "train_loss": 3.4743576049804688, "lr": 0.0002624619960797683, "tps": 105702, "wall": 8383.7} {"step": 13522, "train_loss": 3.3360583782196045, "lr": 0.00026244337852927575, "tps": 105644, "wall": 8388.9} {"step": 13523, "train_loss": 3.387202262878418, "lr": 0.00026242476049798233, "tps": 105585, "wall": 8394.2} {"step": 13524, "train_loss": 3.4182801246643066, "lr": 0.00026240614198609895, "tps": 105527, "wall": 8399.5} {"step": 13525, "train_loss": 3.284977436065674, "lr": 0.0002623875229938364, "tps": 105468, "wall": 8404.7} {"step": 13526, "train_loss": 3.2529921531677246, "lr": 0.0002623689035214057, "tps": 105410, "wall": 8410.1} {"step": 13527, "train_loss": 3.323112964630127, "lr": 0.0002623502835690179, "tps": 105351, "wall": 8415.4} {"step": 13528, "train_loss": 3.383343458175659, "lr": 0.00026233166313688365, "tps": 105292, "wall": 8420.7} {"step": 13529, "train_loss": 3.489915370941162, "lr": 0.00026231304222521407, "tps": 105234, "wall": 8425.9} {"step": 13530, "train_loss": 3.4313883781433105, "lr": 0.0002622944208342201, "tps": 105175, "wall": 8431.3} {"step": 13531, "train_loss": 3.403988838195801, "lr": 0.0002622757989641126, "tps": 105117, "wall": 8436.6} {"step": 13532, "train_loss": 3.362931251525879, "lr": 0.00026225717661510254, "tps": 105059, "wall": 8441.9} {"step": 13533, "train_loss": 3.3879146575927734, "lr": 0.00026223855378740095, "tps": 105001, "wall": 8447.1} {"step": 13534, "train_loss": 3.3174707889556885, "lr": 0.00026221993048121877, "tps": 104943, "wall": 8452.4} {"step": 13535, "train_loss": 3.4242191314697266, "lr": 0.0002622013066967669, "tps": 104886, "wall": 8457.7} {"step": 13536, "train_loss": 3.30580997467041, "lr": 0.00026218268243425626, "tps": 104828, "wall": 8463.0} {"step": 13537, "train_loss": 3.375741481781006, "lr": 0.00026216405769389806, "tps": 104770, "wall": 8468.3} {"step": 13538, "train_loss": 3.391941547393799, "lr": 0.00026214543247590305, "tps": 104713, "wall": 8473.5} {"step": 13539, "train_loss": 3.3685595989227295, "lr": 0.00026212680678048227, "tps": 104656, "wall": 8478.8} {"step": 13540, "train_loss": 3.321927547454834, "lr": 0.0002621081806078468, "tps": 104598, "wall": 8484.1} {"step": 13541, "train_loss": 3.3671875, "lr": 0.00026208955395820756, "tps": 104539, "wall": 8489.5} {"step": 13542, "train_loss": 3.4562032222747803, "lr": 0.0002620709268317756, "tps": 104482, "wall": 8494.7} {"step": 13543, "train_loss": 3.388014554977417, "lr": 0.00026205229922876186, "tps": 104425, "wall": 8500.0} {"step": 13544, "train_loss": 3.3513150215148926, "lr": 0.00026203367114937745, "tps": 104368, "wall": 8505.3} {"step": 13545, "train_loss": 3.3917276859283447, "lr": 0.0002620150425938333, "tps": 104311, "wall": 8510.6} {"step": 13546, "train_loss": 3.3353817462921143, "lr": 0.0002619964135623405, "tps": 104254, "wall": 8515.8} {"step": 13547, "train_loss": 3.4301629066467285, "lr": 0.00026197778405511005, "tps": 104198, "wall": 8521.1} {"step": 13548, "train_loss": 3.356452465057373, "lr": 0.00026195915407235294, "tps": 104141, "wall": 8526.4} {"step": 13549, "train_loss": 3.4441943168640137, "lr": 0.0002619405236142803, "tps": 104084, "wall": 8531.7} {"step": 13550, "train_loss": 3.4375030994415283, "lr": 0.00026192189268110317, "tps": 104027, "wall": 8536.9} {"step": 13551, "train_loss": 3.4256393909454346, "lr": 0.0002619032612730326, "tps": 103971, "wall": 8542.2} {"step": 13552, "train_loss": 3.398698329925537, "lr": 0.0002618846293902795, "tps": 103914, "wall": 8547.5} {"step": 13553, "train_loss": 3.4248523712158203, "lr": 0.0002618659970330551, "tps": 103857, "wall": 8552.8} {"step": 13554, "train_loss": 3.391326427459717, "lr": 0.0002618473642015705, "tps": 103800, "wall": 8558.1} {"step": 13555, "train_loss": 3.4242448806762695, "lr": 0.0002618287308960366, "tps": 103744, "wall": 8563.4} {"step": 13556, "train_loss": 3.4626522064208984, "lr": 0.0002618100971166646, "tps": 103688, "wall": 8568.7} {"step": 13557, "train_loss": 3.3600358963012695, "lr": 0.0002617914628636656, "tps": 103632, "wall": 8573.9} {"step": 13558, "train_loss": 3.364345073699951, "lr": 0.0002617728281372506, "tps": 103576, "wall": 8579.2} {"step": 13559, "train_loss": 3.443126678466797, "lr": 0.00026175419293763077, "tps": 103520, "wall": 8584.4} {"step": 13560, "train_loss": 3.335090160369873, "lr": 0.00026173555726501715, "tps": 103464, "wall": 8589.7} {"step": 13561, "train_loss": 3.3038041591644287, "lr": 0.0002617169211196209, "tps": 103408, "wall": 8595.0} {"step": 13562, "train_loss": 3.3757593631744385, "lr": 0.0002616982845016531, "tps": 103352, "wall": 8600.3} {"step": 13563, "train_loss": 3.307279586791992, "lr": 0.00026167964741132487, "tps": 103297, "wall": 8605.5} {"step": 13564, "train_loss": 3.4238338470458984, "lr": 0.0002616610098488474, "tps": 103240, "wall": 8610.9} {"step": 13565, "train_loss": 3.4201066493988037, "lr": 0.0002616423718144317, "tps": 103185, "wall": 8616.2} {"step": 13566, "train_loss": 3.294353485107422, "lr": 0.000261623733308289, "tps": 103130, "wall": 8621.4} {"step": 13567, "train_loss": 3.4074208736419678, "lr": 0.0002616050943306303, "tps": 103074, "wall": 8626.7} {"step": 13568, "train_loss": 3.4047794342041016, "lr": 0.00026158645488166696, "tps": 103019, "wall": 8631.9} {"step": 13569, "train_loss": 3.4070887565612793, "lr": 0.00026156781496160995, "tps": 102964, "wall": 8637.2} {"step": 13570, "train_loss": 3.3289108276367188, "lr": 0.00026154917457067045, "tps": 102909, "wall": 8642.5} {"step": 13571, "train_loss": 3.4077439308166504, "lr": 0.00026153053370905975, "tps": 102854, "wall": 8647.7} {"step": 13572, "train_loss": 3.410330057144165, "lr": 0.00026151189237698884, "tps": 102799, "wall": 8653.0} {"step": 13573, "train_loss": 3.424561023712158, "lr": 0.000261493250574669, "tps": 102744, "wall": 8658.3} {"step": 13574, "train_loss": 3.397794723510742, "lr": 0.00026147460830231134, "tps": 102689, "wall": 8663.5} {"step": 13575, "train_loss": 3.4581546783447266, "lr": 0.00026145596556012714, "tps": 102633, "wall": 8668.9} {"step": 13576, "train_loss": 3.4649124145507812, "lr": 0.00026143732234832744, "tps": 102578, "wall": 8674.1} {"step": 13577, "train_loss": 3.4381840229034424, "lr": 0.0002614186786671236, "tps": 102523, "wall": 8679.4} {"step": 13578, "train_loss": 3.391591787338257, "lr": 0.0002614000345167266, "tps": 102469, "wall": 8684.7} {"step": 13579, "train_loss": 3.3549540042877197, "lr": 0.0002613813898973479, "tps": 102414, "wall": 8689.9} {"step": 13580, "train_loss": 3.395423412322998, "lr": 0.0002613627448091985, "tps": 102360, "wall": 8695.2} {"step": 13581, "train_loss": 3.381791591644287, "lr": 0.00026134409925248974, "tps": 102305, "wall": 8700.5} {"step": 13582, "train_loss": 3.3822872638702393, "lr": 0.0002613254532274327, "tps": 102251, "wall": 8705.7} {"step": 13583, "train_loss": 3.396409511566162, "lr": 0.00026130680673423876, "tps": 102197, "wall": 8711.0} {"step": 13584, "train_loss": 3.433659791946411, "lr": 0.0002612881597731191, "tps": 102143, "wall": 8716.3} {"step": 13585, "train_loss": 3.4107751846313477, "lr": 0.0002612695123442849, "tps": 102088, "wall": 8721.5} {"step": 13586, "train_loss": 3.374274492263794, "lr": 0.0002612508644479474, "tps": 102034, "wall": 8726.8} {"step": 13587, "train_loss": 3.504617214202881, "lr": 0.00026123221608431794, "tps": 101979, "wall": 8732.2} {"step": 13588, "train_loss": 3.3893775939941406, "lr": 0.0002612135672536077, "tps": 101925, "wall": 8737.5} {"step": 13589, "train_loss": 3.3357365131378174, "lr": 0.00026119491795602783, "tps": 101871, "wall": 8742.8} {"step": 13590, "train_loss": 3.4416441917419434, "lr": 0.0002611762681917898, "tps": 101817, "wall": 8748.0} {"step": 13591, "train_loss": 3.512319326400757, "lr": 0.0002611576179611048, "tps": 101763, "wall": 8753.3} {"step": 13592, "train_loss": 3.368130683898926, "lr": 0.000261138967264184, "tps": 101709, "wall": 8758.6} {"step": 13593, "train_loss": 3.401258945465088, "lr": 0.0002611203161012388, "tps": 101655, "wall": 8763.9} {"step": 13594, "train_loss": 3.379220962524414, "lr": 0.0002611016644724805, "tps": 101601, "wall": 8769.2} {"step": 13595, "train_loss": 3.3856871128082275, "lr": 0.0002610830123781202, "tps": 101547, "wall": 8774.5} {"step": 13596, "train_loss": 3.308220863342285, "lr": 0.0002610643598183693, "tps": 101494, "wall": 8779.8} {"step": 13597, "train_loss": 3.3620455265045166, "lr": 0.00026104570679343916, "tps": 101440, "wall": 8785.1} {"step": 13598, "train_loss": 3.4314708709716797, "lr": 0.0002610270533035411, "tps": 101386, "wall": 8790.4} {"step": 13599, "train_loss": 3.4437527656555176, "lr": 0.0002610083993488863, "tps": 101332, "wall": 8795.7} {"step": 13600, "train_loss": 3.4725780487060547, "lr": 0.00026098974492968607, "tps": 101279, "wall": 8801.0} {"step": 13601, "train_loss": 3.3824734687805176, "lr": 0.00026097109004615194, "tps": 101226, "wall": 8806.2} {"step": 13602, "train_loss": 3.4054453372955322, "lr": 0.000260952434698495, "tps": 101173, "wall": 8811.5} {"step": 13603, "train_loss": 3.32277774810791, "lr": 0.0002609337788869266, "tps": 101120, "wall": 8816.7} {"step": 13604, "train_loss": 3.5282766819000244, "lr": 0.00026091512261165826, "tps": 101067, "wall": 8822.0} {"step": 13605, "train_loss": 3.3516452312469482, "lr": 0.0002608964658729011, "tps": 101014, "wall": 8827.3} {"step": 13606, "train_loss": 3.3505845069885254, "lr": 0.0002608778086708666, "tps": 100961, "wall": 8832.5} {"step": 13607, "train_loss": 3.3637189865112305, "lr": 0.00026085915100576606, "tps": 100909, "wall": 8837.8} {"step": 13608, "train_loss": 3.4367213249206543, "lr": 0.00026084049287781097, "tps": 100856, "wall": 8843.1} {"step": 13609, "train_loss": 3.3177788257598877, "lr": 0.00026082183428721245, "tps": 100802, "wall": 8848.4} {"step": 13610, "train_loss": 3.4574763774871826, "lr": 0.00026080317523418197, "tps": 100750, "wall": 8853.7} {"step": 13611, "train_loss": 3.315986156463623, "lr": 0.00026078451571893095, "tps": 100697, "wall": 8859.0} {"step": 13612, "train_loss": 3.387728214263916, "lr": 0.00026076585574167076, "tps": 100644, "wall": 8864.3} {"step": 13613, "train_loss": 3.41581392288208, "lr": 0.00026074719530261265, "tps": 100592, "wall": 8869.6} {"step": 13614, "train_loss": 3.3569798469543457, "lr": 0.00026072853440196815, "tps": 100539, "wall": 8874.8} {"step": 13615, "train_loss": 3.336451768875122, "lr": 0.00026070987303994863, "tps": 100487, "wall": 8880.1} {"step": 13616, "train_loss": 3.284471035003662, "lr": 0.00026069121121676545, "tps": 100434, "wall": 8885.4} {"step": 13617, "train_loss": 3.3170042037963867, "lr": 0.00026067254893263, "tps": 100382, "wall": 8890.7} {"step": 13618, "train_loss": 3.4178671836853027, "lr": 0.0002606538861877538, "tps": 100330, "wall": 8896.0} {"step": 13619, "train_loss": 3.3800129890441895, "lr": 0.0002606352229823482, "tps": 100277, "wall": 8901.3} {"step": 13620, "train_loss": 3.474287509918213, "lr": 0.0002606165593166245, "tps": 100225, "wall": 8906.5} {"step": 13621, "train_loss": 3.386202812194824, "lr": 0.00026059789519079416, "tps": 100173, "wall": 8911.9} {"step": 13622, "train_loss": 3.3371589183807373, "lr": 0.0002605792306050688, "tps": 100121, "wall": 8917.1} {"step": 13623, "train_loss": 3.346311330795288, "lr": 0.00026056056555965966, "tps": 100069, "wall": 8922.4} {"step": 13624, "train_loss": 3.3299620151519775, "lr": 0.00026054190005477825, "tps": 100017, "wall": 8927.7} {"step": 13625, "train_loss": 3.2589457035064697, "lr": 0.00026052323409063606, "tps": 99965, "wall": 8933.0} {"step": 13626, "train_loss": 3.3856441974639893, "lr": 0.0002605045676674444, "tps": 99913, "wall": 8938.3} {"step": 13627, "train_loss": 3.501042366027832, "lr": 0.0002604859007854148, "tps": 99862, "wall": 8943.5} {"step": 13628, "train_loss": 3.3935508728027344, "lr": 0.00026046723344475876, "tps": 99809, "wall": 8948.9} {"step": 13629, "train_loss": 3.403956890106201, "lr": 0.00026044856564568777, "tps": 99758, "wall": 8954.2} {"step": 13630, "train_loss": 3.3213343620300293, "lr": 0.0002604298973884131, "tps": 99706, "wall": 8959.5} {"step": 13631, "train_loss": 3.442317008972168, "lr": 0.0002604112286731465, "tps": 99655, "wall": 8964.8} {"step": 13632, "train_loss": 3.4276885986328125, "lr": 0.00026039255950009927, "tps": 99603, "wall": 8970.1} {"step": 13633, "train_loss": 3.398130416870117, "lr": 0.00026037388986948295, "tps": 99551, "wall": 8975.4} {"step": 13634, "train_loss": 3.3422350883483887, "lr": 0.00026035521978150895, "tps": 99500, "wall": 8980.7} {"step": 13635, "train_loss": 3.3985493183135986, "lr": 0.0002603365492363889, "tps": 99449, "wall": 8986.0} {"step": 13636, "train_loss": 3.1956419944763184, "lr": 0.00026031787823433425, "tps": 99398, "wall": 8991.2} {"step": 13637, "train_loss": 3.441836357116699, "lr": 0.0002602992067755565, "tps": 99347, "wall": 8996.5} {"step": 13638, "train_loss": 3.3102688789367676, "lr": 0.000260280534860267, "tps": 99296, "wall": 9001.8} {"step": 13639, "train_loss": 3.421159505844116, "lr": 0.00026026186248867767, "tps": 99245, "wall": 9007.1} {"step": 13640, "train_loss": 3.387226104736328, "lr": 0.00026024318966099964, "tps": 99194, "wall": 9012.4} {"step": 13641, "train_loss": 3.3826684951782227, "lr": 0.0002602245163774446, "tps": 99143, "wall": 9017.6} {"step": 13642, "train_loss": 3.4000041484832764, "lr": 0.00026020584263822407, "tps": 99093, "wall": 9022.9} {"step": 13643, "train_loss": 3.3844833374023438, "lr": 0.0002601871684435496, "tps": 99041, "wall": 9028.2} {"step": 13644, "train_loss": 3.4147789478302, "lr": 0.00026016849379363263, "tps": 98990, "wall": 9033.6} {"step": 13645, "train_loss": 3.4468491077423096, "lr": 0.00026014981868868487, "tps": 98940, "wall": 9038.8} {"step": 13646, "train_loss": 3.3937149047851562, "lr": 0.00026013114312891777, "tps": 98889, "wall": 9044.1} {"step": 13647, "train_loss": 3.335509777069092, "lr": 0.00026011246711454285, "tps": 98839, "wall": 9049.4} {"step": 13648, "train_loss": 3.4360733032226562, "lr": 0.0002600937906457718, "tps": 98788, "wall": 9054.7} {"step": 13649, "train_loss": 3.41286563873291, "lr": 0.0002600751137228162, "tps": 98738, "wall": 9060.0} {"step": 13650, "train_loss": 3.4730536937713623, "lr": 0.0002600564363458874, "tps": 98687, "wall": 9065.3} {"step": 13651, "train_loss": 3.5161073207855225, "lr": 0.0002600377585151972, "tps": 98637, "wall": 9070.5} {"step": 13652, "train_loss": 3.396019458770752, "lr": 0.0002600190802309571, "tps": 98588, "wall": 9075.8} {"step": 13653, "train_loss": 3.439713954925537, "lr": 0.00026000040149337867, "tps": 98538, "wall": 9081.0} {"step": 13654, "train_loss": 3.4018609523773193, "lr": 0.00025998172230267346, "tps": 98487, "wall": 9086.4} {"step": 13655, "train_loss": 3.3660426139831543, "lr": 0.0002599630426590532, "tps": 98436, "wall": 9091.7} {"step": 13656, "train_loss": 3.308586597442627, "lr": 0.0002599443625627295, "tps": 98386, "wall": 9097.0} {"step": 13657, "train_loss": 3.296947479248047, "lr": 0.00025992568201391387, "tps": 98335, "wall": 9102.4} {"step": 13658, "train_loss": 3.3224053382873535, "lr": 0.0002599070010128179, "tps": 98285, "wall": 9107.7} {"step": 13659, "train_loss": 3.3791160583496094, "lr": 0.0002598883195596533, "tps": 98236, "wall": 9113.0} {"step": 13660, "train_loss": 3.2976131439208984, "lr": 0.00025986963765463165, "tps": 98186, "wall": 9118.2} {"step": 13661, "train_loss": 3.4230844974517822, "lr": 0.00025985095529796454, "tps": 98137, "wall": 9123.5} {"step": 13662, "train_loss": 3.45466947555542, "lr": 0.0002598322724898638, "tps": 98087, "wall": 9128.8} {"step": 13663, "train_loss": 3.4346399307250977, "lr": 0.00025981358923054073, "tps": 98037, "wall": 9134.1} {"step": 13664, "train_loss": 3.3676719665527344, "lr": 0.00025979490552020725, "tps": 97988, "wall": 9139.4} {"step": 13665, "train_loss": 3.488222360610962, "lr": 0.000259776221359075, "tps": 97938, "wall": 9144.7} {"step": 13666, "train_loss": 3.4020586013793945, "lr": 0.0002597575367473555, "tps": 97888, "wall": 9150.0} {"step": 13667, "train_loss": 3.3066699504852295, "lr": 0.00025973885168526043, "tps": 97838, "wall": 9155.3} {"step": 13668, "train_loss": 3.4275455474853516, "lr": 0.0002597201661730015, "tps": 97789, "wall": 9160.6} {"step": 13669, "train_loss": 3.3630783557891846, "lr": 0.0002597014802107905, "tps": 97740, "wall": 9165.9} {"step": 13670, "train_loss": 3.4236326217651367, "lr": 0.00025968279379883885, "tps": 97691, "wall": 9171.2} {"step": 13671, "train_loss": 3.3478102684020996, "lr": 0.0002596641069373584, "tps": 97642, "wall": 9176.5} {"step": 13672, "train_loss": 3.372757911682129, "lr": 0.0002596454196265608, "tps": 97592, "wall": 9181.8} {"step": 13673, "train_loss": 3.336822271347046, "lr": 0.0002596267318666578, "tps": 97544, "wall": 9187.0} {"step": 13674, "train_loss": 3.354424476623535, "lr": 0.000259608043657861, "tps": 97494, "wall": 9192.3} {"step": 13675, "train_loss": 3.373885154724121, "lr": 0.00025958935500038213, "tps": 97446, "wall": 9197.6} {"step": 13676, "train_loss": 3.4355826377868652, "lr": 0.00025957066589443295, "tps": 97397, "wall": 9202.9} {"step": 13677, "train_loss": 3.2777903079986572, "lr": 0.00025955197634022504, "tps": 97347, "wall": 9208.2} {"step": 13678, "train_loss": 3.433303117752075, "lr": 0.0002595332863379702, "tps": 97298, "wall": 9213.6} {"step": 13679, "train_loss": 3.333299160003662, "lr": 0.0002595145958878803, "tps": 97249, "wall": 9218.9} {"step": 13680, "train_loss": 3.2690773010253906, "lr": 0.0002594959049901668, "tps": 97201, "wall": 9224.2} {"step": 13681, "train_loss": 3.3964619636535645, "lr": 0.00025947721364504153, "tps": 97152, "wall": 9229.4} {"step": 13682, "train_loss": 3.386298656463623, "lr": 0.00025945852185271627, "tps": 97104, "wall": 9234.7} {"step": 13683, "train_loss": 3.3894453048706055, "lr": 0.0002594398296134028, "tps": 97056, "wall": 9240.0} {"step": 13684, "train_loss": 3.290651798248291, "lr": 0.00025942113692731277, "tps": 97007, "wall": 9245.2} {"step": 13685, "train_loss": 3.435134172439575, "lr": 0.0002594024437946579, "tps": 96959, "wall": 9250.5} {"step": 13686, "train_loss": 3.4139816761016846, "lr": 0.00025938375021565015, "tps": 96911, "wall": 9255.8} {"step": 13687, "train_loss": 3.413743495941162, "lr": 0.0002593650561905011, "tps": 96863, "wall": 9261.1} {"step": 13688, "train_loss": 3.3871681690216064, "lr": 0.0002593463617194225, "tps": 96815, "wall": 9266.3} {"step": 13689, "train_loss": 3.394366502761841, "lr": 0.00025932766680262625, "tps": 96766, "wall": 9271.7} {"step": 13690, "train_loss": 3.4000167846679688, "lr": 0.00025930897144032405, "tps": 96718, "wall": 9277.0} {"step": 13691, "train_loss": 3.3837461471557617, "lr": 0.00025929027563272765, "tps": 96670, "wall": 9282.2} {"step": 13692, "train_loss": 3.4267733097076416, "lr": 0.0002592715793800489, "tps": 96622, "wall": 9287.5} {"step": 13693, "train_loss": 3.361253499984741, "lr": 0.0002592528826824997, "tps": 96574, "wall": 9292.8} {"step": 13694, "train_loss": 3.3999345302581787, "lr": 0.0002592341855402916, "tps": 96527, "wall": 9298.1} {"step": 13695, "train_loss": 3.4169325828552246, "lr": 0.0002592154879536365, "tps": 96479, "wall": 9303.3} {"step": 13696, "train_loss": 3.3652732372283936, "lr": 0.00025919678992274625, "tps": 96431, "wall": 9308.7} {"step": 13697, "train_loss": 3.4364185333251953, "lr": 0.0002591780914478327, "tps": 96383, "wall": 9314.0} {"step": 13698, "train_loss": 3.447261333465576, "lr": 0.0002591593925291076, "tps": 96335, "wall": 9319.2} {"step": 13699, "train_loss": 3.3909401893615723, "lr": 0.00025914069316678264, "tps": 96288, "wall": 9324.5} {"step": 13700, "train_loss": 3.3748154640197754, "lr": 0.00025912199336106996, "tps": 96239, "wall": 9329.9} {"step": 13701, "train_loss": 3.3367879390716553, "lr": 0.0002591032931121812, "tps": 96192, "wall": 9335.2} {"step": 13702, "train_loss": 3.442052125930786, "lr": 0.0002590845924203282, "tps": 96145, "wall": 9340.4} {"step": 13703, "train_loss": 3.4181642532348633, "lr": 0.00025906589128572274, "tps": 96098, "wall": 9345.7} {"step": 13704, "train_loss": 3.4949569702148438, "lr": 0.0002590471897085769, "tps": 96050, "wall": 9351.0} {"step": 13705, "train_loss": 3.4334464073181152, "lr": 0.0002590284876891023, "tps": 96003, "wall": 9356.3} {"step": 13706, "train_loss": 3.391685962677002, "lr": 0.0002590097852275108, "tps": 95956, "wall": 9361.6} {"step": 13707, "train_loss": 3.3264994621276855, "lr": 0.0002589910823240145, "tps": 95909, "wall": 9366.8} {"step": 13708, "train_loss": 3.470130205154419, "lr": 0.00025897237897882505, "tps": 95862, "wall": 9372.1} {"step": 13709, "train_loss": 3.317445993423462, "lr": 0.00025895367519215433, "tps": 95815, "wall": 9377.4} {"step": 13710, "train_loss": 3.472127914428711, "lr": 0.00025893497096421436, "tps": 95768, "wall": 9382.6} {"step": 13711, "train_loss": 3.4173810482025146, "lr": 0.0002589162662952168, "tps": 95721, "wall": 9387.9} {"step": 13712, "train_loss": 3.4361400604248047, "lr": 0.00025889756118537374, "tps": 95673, "wall": 9393.3} {"step": 13713, "train_loss": 3.3830387592315674, "lr": 0.00025887885563489707, "tps": 95626, "wall": 9398.7} {"step": 13714, "train_loss": 3.4155943393707275, "lr": 0.00025886014964399855, "tps": 95579, "wall": 9404.0} {"step": 13715, "train_loss": 3.323498487472534, "lr": 0.0002588414432128902, "tps": 95533, "wall": 9409.2} {"step": 13716, "train_loss": 3.3327784538269043, "lr": 0.0002588227363417838, "tps": 95486, "wall": 9414.5} {"step": 13717, "train_loss": 3.281658172607422, "lr": 0.00025880402903089136, "tps": 95439, "wall": 9419.8} {"step": 13718, "train_loss": 3.4035325050354004, "lr": 0.00025878532128042483, "tps": 95393, "wall": 9425.0} {"step": 13719, "train_loss": 3.3507559299468994, "lr": 0.0002587666130905961, "tps": 95347, "wall": 9430.3} {"step": 13720, "train_loss": 3.2490367889404297, "lr": 0.000258747904461617, "tps": 95300, "wall": 9435.6} {"step": 13721, "train_loss": 3.3339929580688477, "lr": 0.0002587291953936996, "tps": 95254, "wall": 9440.9} {"step": 13722, "train_loss": 3.4193596839904785, "lr": 0.00025871048588705574, "tps": 95208, "wall": 9446.1} {"step": 13723, "train_loss": 3.2697367668151855, "lr": 0.0002586917759418974, "tps": 95161, "wall": 9451.5} {"step": 13724, "train_loss": 3.5199615955352783, "lr": 0.0002586730655584366, "tps": 95114, "wall": 9456.8} {"step": 13725, "train_loss": 3.228411912918091, "lr": 0.0002586543547368852, "tps": 95068, "wall": 9462.1} {"step": 13726, "train_loss": 3.506373882293701, "lr": 0.0002586356434774551, "tps": 95022, "wall": 9467.3} {"step": 13727, "train_loss": 3.3962221145629883, "lr": 0.0002586169317803584, "tps": 94976, "wall": 9472.6} {"step": 13728, "train_loss": 3.4144327640533447, "lr": 0.00025859821964580704, "tps": 94930, "wall": 9477.9} {"step": 13729, "train_loss": 3.342906951904297, "lr": 0.0002585795070740129, "tps": 94884, "wall": 9483.2} {"step": 13730, "train_loss": 3.346194267272949, "lr": 0.000258560794065188, "tps": 94838, "wall": 9488.5} {"step": 13731, "train_loss": 3.447553873062134, "lr": 0.0002585420806195444, "tps": 94793, "wall": 9493.7} {"step": 13732, "train_loss": 3.3877148628234863, "lr": 0.000258523366737294, "tps": 94747, "wall": 9499.0} {"step": 13733, "train_loss": 3.4961886405944824, "lr": 0.00025850465241864884, "tps": 94701, "wall": 9504.3} {"step": 13734, "train_loss": 3.4017953872680664, "lr": 0.0002584859376638209, "tps": 94654, "wall": 9509.7} {"step": 13735, "train_loss": 3.4212589263916016, "lr": 0.00025846722247302217, "tps": 94609, "wall": 9514.9} {"step": 13736, "train_loss": 3.3834023475646973, "lr": 0.0002584485068464646, "tps": 94563, "wall": 9520.3} {"step": 13737, "train_loss": 3.3918089866638184, "lr": 0.0002584297907843603, "tps": 94518, "wall": 9525.5} {"step": 13738, "train_loss": 3.3708386421203613, "lr": 0.0002584110742869213, "tps": 94472, "wall": 9530.8} {"step": 13739, "train_loss": 3.3769354820251465, "lr": 0.00025839235735435946, "tps": 94426, "wall": 9536.1} {"step": 13740, "train_loss": 3.4130189418792725, "lr": 0.000258373639986887, "tps": 94380, "wall": 9541.4} {"step": 13741, "train_loss": 3.356189489364624, "lr": 0.00025835492218471593, "tps": 94335, "wall": 9546.7} {"step": 13742, "train_loss": 3.3830270767211914, "lr": 0.0002583362039480581, "tps": 94290, "wall": 9552.0} {"step": 13743, "train_loss": 3.386566400527954, "lr": 0.00025831748527712576, "tps": 94245, "wall": 9557.3} {"step": 13744, "train_loss": 3.377486228942871, "lr": 0.00025829876617213085, "tps": 94199, "wall": 9562.6} {"step": 13745, "train_loss": 3.397080421447754, "lr": 0.00025828004663328545, "tps": 94154, "wall": 9567.9} {"step": 13746, "train_loss": 3.265091896057129, "lr": 0.00025826132666080157, "tps": 94108, "wall": 9573.2} {"step": 13747, "train_loss": 3.4130842685699463, "lr": 0.00025824260625489134, "tps": 94063, "wall": 9578.5} {"step": 13748, "train_loss": 3.278989553451538, "lr": 0.0002582238854157668, "tps": 94018, "wall": 9583.8} {"step": 13749, "train_loss": 3.368000030517578, "lr": 0.00025820516414364, "tps": 93973, "wall": 9589.1} {"step": 13750, "train_loss": 3.3738794326782227, "lr": 0.00025818644243872307, "tps": 93928, "wall": 9594.4} {"step": 13751, "train_loss": 3.3357632160186768, "lr": 0.00025816772030122807, "tps": 93883, "wall": 9599.7} {"step": 13752, "train_loss": 3.376958131790161, "lr": 0.000258148997731367, "tps": 93838, "wall": 9605.0} {"step": 13753, "train_loss": 3.427305221557617, "lr": 0.0002581302747293521, "tps": 93793, "wall": 9610.3} {"step": 13754, "train_loss": 3.5235753059387207, "lr": 0.00025811155129539534, "tps": 93748, "wall": 9615.6} {"step": 13755, "train_loss": 3.4229183197021484, "lr": 0.00025809282742970886, "tps": 93704, "wall": 9620.8} {"step": 13756, "train_loss": 3.349238872528076, "lr": 0.0002580741031325047, "tps": 93659, "wall": 9626.1} {"step": 13757, "train_loss": 3.3793654441833496, "lr": 0.0002580553784039952, "tps": 93614, "wall": 9631.5} {"step": 13758, "train_loss": 3.3538155555725098, "lr": 0.00025803665324439223, "tps": 93570, "wall": 9636.7} {"step": 13759, "train_loss": 3.4366090297698975, "lr": 0.00025801792765390793, "tps": 93525, "wall": 9642.0} {"step": 13760, "train_loss": 3.3524272441864014, "lr": 0.00025799920163275457, "tps": 93480, "wall": 9647.3} {"step": 13761, "train_loss": 3.4705350399017334, "lr": 0.0002579804751811442, "tps": 93436, "wall": 9652.7} {"step": 13762, "train_loss": 3.3317692279815674, "lr": 0.000257961748299289, "tps": 93391, "wall": 9657.9} {"step": 13763, "train_loss": 3.4039101600646973, "lr": 0.00025794302098740095, "tps": 93347, "wall": 9663.2} {"step": 13764, "train_loss": 3.381265878677368, "lr": 0.0002579242932456924, "tps": 93302, "wall": 9668.5} {"step": 13765, "train_loss": 3.3471755981445312, "lr": 0.0002579055650743753, "tps": 93258, "wall": 9673.8} {"step": 13766, "train_loss": 3.442068338394165, "lr": 0.00025788683647366196, "tps": 93214, "wall": 9679.1} {"step": 13767, "train_loss": 3.4142260551452637, "lr": 0.0002578681074437645, "tps": 93170, "wall": 9684.4} {"step": 13768, "train_loss": 3.3545949459075928, "lr": 0.00025784937798489506, "tps": 93125, "wall": 9689.8} {"step": 13769, "train_loss": 3.462373733520508, "lr": 0.0002578306480972658, "tps": 93081, "wall": 9695.1} {"step": 13770, "train_loss": 3.3979413509368896, "lr": 0.00025781191778108896, "tps": 93037, "wall": 9700.3} {"step": 13771, "train_loss": 3.2437236309051514, "lr": 0.0002577931870365767, "tps": 92993, "wall": 9705.6} {"step": 13772, "train_loss": 3.3230767250061035, "lr": 0.0002577744558639411, "tps": 92950, "wall": 9710.9} {"step": 13773, "train_loss": 3.4586944580078125, "lr": 0.0002577557242633944, "tps": 92906, "wall": 9716.2} {"step": 13774, "train_loss": 3.3127098083496094, "lr": 0.0002577369922351488, "tps": 92862, "wall": 9721.4} {"step": 13775, "train_loss": 3.4116098880767822, "lr": 0.0002577182597794166, "tps": 92818, "wall": 9726.7} {"step": 13776, "train_loss": 3.304556369781494, "lr": 0.00025769952689640987, "tps": 92775, "wall": 9732.0} {"step": 13777, "train_loss": 3.367276906967163, "lr": 0.00025768079358634094, "tps": 92731, "wall": 9737.3} {"step": 13778, "train_loss": 3.3786160945892334, "lr": 0.0002576620598494218, "tps": 92687, "wall": 9742.6} {"step": 13779, "train_loss": 3.300626754760742, "lr": 0.00025764332568586494, "tps": 92644, "wall": 9747.9} {"step": 13780, "train_loss": 3.277440071105957, "lr": 0.00025762459109588234, "tps": 92599, "wall": 9753.3} {"step": 13781, "train_loss": 3.453268527984619, "lr": 0.0002576058560796864, "tps": 92556, "wall": 9758.5} {"step": 13782, "train_loss": 3.3871495723724365, "lr": 0.00025758712063748924, "tps": 92513, "wall": 9763.8} {"step": 13783, "train_loss": 3.499131202697754, "lr": 0.00025756838476950316, "tps": 92470, "wall": 9769.1} {"step": 13784, "train_loss": 3.419450044631958, "lr": 0.0002575496484759404, "tps": 92427, "wall": 9774.3} {"step": 13785, "train_loss": 3.407216787338257, "lr": 0.0002575309117570132, "tps": 92383, "wall": 9779.6} {"step": 13786, "train_loss": 3.236649751663208, "lr": 0.00025751217461293376, "tps": 92340, "wall": 9785.0} {"step": 13787, "train_loss": 3.466197967529297, "lr": 0.00025749343704391443, "tps": 92296, "wall": 9790.3} {"step": 13788, "train_loss": 3.418651580810547, "lr": 0.0002574746990501674, "tps": 92254, "wall": 9795.5} {"step": 13789, "train_loss": 3.452028512954712, "lr": 0.00025745596063190494, "tps": 92210, "wall": 9800.8} {"step": 13790, "train_loss": 3.342478036880493, "lr": 0.0002574372217893393, "tps": 92167, "wall": 9806.1} {"step": 13791, "train_loss": 3.4288487434387207, "lr": 0.0002574184825226828, "tps": 92124, "wall": 9811.4} {"step": 13792, "train_loss": 3.38423228263855, "lr": 0.00025739974283214785, "tps": 92081, "wall": 9816.7} {"step": 13793, "train_loss": 3.345097541809082, "lr": 0.0002573810027179464, "tps": 92038, "wall": 9822.0} {"step": 13794, "train_loss": 3.41204833984375, "lr": 0.00025736226218029095, "tps": 91995, "wall": 9827.3} {"step": 13795, "train_loss": 3.47709321975708, "lr": 0.00025734352121939386, "tps": 91953, "wall": 9832.6} {"step": 13796, "train_loss": 3.3383421897888184, "lr": 0.0002573247798354673, "tps": 91910, "wall": 9837.9} {"step": 13797, "train_loss": 3.3583266735076904, "lr": 0.00025730603802872357, "tps": 91867, "wall": 9843.1} {"step": 13798, "train_loss": 3.2769551277160645, "lr": 0.0002572872957993751, "tps": 91824, "wall": 9848.5} {"step": 13799, "train_loss": 3.3352975845336914, "lr": 0.0002572685531476341, "tps": 91781, "wall": 9853.8} {"step": 13800, "train_loss": 3.3087782859802246, "lr": 0.0002572498100737129, "tps": 91738, "wall": 9859.1} {"step": 13801, "train_loss": 3.3411917686462402, "lr": 0.00025723106657782384, "tps": 91696, "wall": 9864.4} {"step": 13802, "train_loss": 3.410592794418335, "lr": 0.00025721232266017927, "tps": 91652, "wall": 9869.8} {"step": 13803, "train_loss": 3.3061251640319824, "lr": 0.0002571935783209915, "tps": 91610, "wall": 9875.1} {"step": 13804, "train_loss": 3.4499075412750244, "lr": 0.0002571748335604728, "tps": 91567, "wall": 9880.4} {"step": 13805, "train_loss": 3.342587471008301, "lr": 0.0002571560883788356, "tps": 91525, "wall": 9885.6} {"step": 13806, "train_loss": 3.419517755508423, "lr": 0.00025713734277629227, "tps": 91482, "wall": 9891.0} {"step": 13807, "train_loss": 3.4377918243408203, "lr": 0.0002571185967530551, "tps": 91440, "wall": 9896.2} {"step": 13808, "train_loss": 3.3053619861602783, "lr": 0.00025709985030933634, "tps": 91398, "wall": 9901.5} {"step": 13809, "train_loss": 3.376920461654663, "lr": 0.00025708110344534863, "tps": 91356, "wall": 9906.8} {"step": 13810, "train_loss": 3.3329834938049316, "lr": 0.0002570623561613041, "tps": 91314, "wall": 9912.1} {"step": 13811, "train_loss": 3.5145673751831055, "lr": 0.0002570436084574152, "tps": 91272, "wall": 9917.4} {"step": 13812, "train_loss": 3.4154715538024902, "lr": 0.0002570248603338943, "tps": 91229, "wall": 9922.7} {"step": 13813, "train_loss": 3.3100743293762207, "lr": 0.0002570061117909537, "tps": 91187, "wall": 9928.0} {"step": 13814, "train_loss": 3.3027853965759277, "lr": 0.000256987362828806, "tps": 91145, "wall": 9933.4} {"step": 13815, "train_loss": 3.398904800415039, "lr": 0.0002569686134476634, "tps": 91103, "wall": 9938.7} {"step": 13816, "train_loss": 3.4551968574523926, "lr": 0.0002569498636477383, "tps": 91061, "wall": 9944.0} {"step": 13817, "train_loss": 3.45169997215271, "lr": 0.00025693111342924317, "tps": 91019, "wall": 9949.3} {"step": 13818, "train_loss": 3.4842448234558105, "lr": 0.00025691236279239046, "tps": 90977, "wall": 9954.5} {"step": 13819, "train_loss": 3.3327364921569824, "lr": 0.0002568936117373924, "tps": 90936, "wall": 9959.8} {"step": 13820, "train_loss": 3.4727046489715576, "lr": 0.0002568748602644616, "tps": 90894, "wall": 9965.1} {"step": 13821, "train_loss": 3.428968906402588, "lr": 0.0002568561083738104, "tps": 90852, "wall": 9970.4} {"step": 13822, "train_loss": 3.3760361671447754, "lr": 0.00025683735606565113, "tps": 90811, "wall": 9975.7} {"step": 13823, "train_loss": 3.3575618267059326, "lr": 0.0002568186033401963, "tps": 90769, "wall": 9981.0} {"step": 13824, "train_loss": 3.3521745204925537, "lr": 0.00025679985019765836, "tps": 90728, "wall": 9986.3} {"step": 13825, "train_loss": 3.3498167991638184, "lr": 0.00025678109663824974, "tps": 90685, "wall": 9991.7} {"step": 13826, "train_loss": 3.426140785217285, "lr": 0.00025676234266218287, "tps": 90644, "wall": 9997.0} {"step": 13827, "train_loss": 3.329986572265625, "lr": 0.00025674358826967015, "tps": 90602, "wall": 10002.3} {"step": 13828, "train_loss": 3.239945888519287, "lr": 0.0002567248334609241, "tps": 90561, "wall": 10007.6} {"step": 13829, "train_loss": 3.36807918548584, "lr": 0.0002567060782361572, "tps": 90519, "wall": 10012.9} {"step": 13830, "train_loss": 3.3967206478118896, "lr": 0.0002566873225955818, "tps": 90478, "wall": 10018.2} {"step": 13831, "train_loss": 3.28197979927063, "lr": 0.0002566685665394104, "tps": 90437, "wall": 10023.4} {"step": 13832, "train_loss": 3.3930447101593018, "lr": 0.00025664981006785553, "tps": 90396, "wall": 10028.7} {"step": 13833, "train_loss": 3.4478800296783447, "lr": 0.0002566310531811297, "tps": 90354, "wall": 10034.1} {"step": 13834, "train_loss": 3.440013885498047, "lr": 0.0002566122958794452, "tps": 90313, "wall": 10039.4} {"step": 13835, "train_loss": 3.416700601577759, "lr": 0.00025659353816301475, "tps": 90271, "wall": 10044.7} {"step": 13836, "train_loss": 3.434767723083496, "lr": 0.00025657478003205064, "tps": 90229, "wall": 10050.1} {"step": 13837, "train_loss": 3.360146999359131, "lr": 0.00025655602148676545, "tps": 90188, "wall": 10055.5} {"step": 13838, "train_loss": 3.4528470039367676, "lr": 0.0002565372625273717, "tps": 90146, "wall": 10060.8} {"step": 13839, "train_loss": 3.314659595489502, "lr": 0.00025651850315408183, "tps": 90105, "wall": 10066.2} {"step": 13840, "train_loss": 3.3237428665161133, "lr": 0.0002564997433671084, "tps": 90063, "wall": 10071.6} {"step": 13841, "train_loss": 3.4373080730438232, "lr": 0.0002564809831666639, "tps": 90022, "wall": 10077.0} {"step": 13842, "train_loss": 3.450241804122925, "lr": 0.0002564622225529608, "tps": 89980, "wall": 10082.3} {"step": 13843, "train_loss": 3.3679909706115723, "lr": 0.00025644346152621175, "tps": 89939, "wall": 10087.7} {"step": 13844, "train_loss": 3.3198299407958984, "lr": 0.0002564247000866292, "tps": 89898, "wall": 10093.1} {"step": 13845, "train_loss": 3.4675912857055664, "lr": 0.0002564059382344256, "tps": 89856, "wall": 10098.4} {"step": 13846, "train_loss": 3.453049898147583, "lr": 0.00025638717596981365, "tps": 89815, "wall": 10103.8} {"step": 13847, "train_loss": 3.3910183906555176, "lr": 0.0002563684132930057, "tps": 89773, "wall": 10109.3} {"step": 13848, "train_loss": 3.3752663135528564, "lr": 0.0002563496502042145, "tps": 89732, "wall": 10114.6} {"step": 13849, "train_loss": 3.32550311088562, "lr": 0.00025633088670365243, "tps": 89691, "wall": 10120.0} {"step": 13850, "train_loss": 3.366673469543457, "lr": 0.0002563121227915321, "tps": 89650, "wall": 10125.3} {"step": 13851, "train_loss": 3.429734468460083, "lr": 0.0002562933584680661, "tps": 89609, "wall": 10130.7} {"step": 13852, "train_loss": 3.355013132095337, "lr": 0.000256274593733467, "tps": 89568, "wall": 10136.1} {"step": 13853, "train_loss": 3.3894400596618652, "lr": 0.0002562558285879473, "tps": 89527, "wall": 10141.5} {"step": 13854, "train_loss": 3.3010501861572266, "lr": 0.00025623706303171963, "tps": 89486, "wall": 10146.9} {"step": 13855, "train_loss": 3.4391562938690186, "lr": 0.0002562182970649965, "tps": 89445, "wall": 10152.2} {"step": 13856, "train_loss": 3.4705333709716797, "lr": 0.00025619953068799065, "tps": 89404, "wall": 10157.6} {"step": 13857, "train_loss": 3.255460262298584, "lr": 0.00025618076390091453, "tps": 89363, "wall": 10163.0} {"step": 13858, "train_loss": 3.316647529602051, "lr": 0.00025616199670398066, "tps": 89322, "wall": 10168.4} {"step": 13859, "train_loss": 3.467402935028076, "lr": 0.0002561432290974018, "tps": 89281, "wall": 10173.8} {"step": 13860, "train_loss": 3.2870051860809326, "lr": 0.0002561244610813905, "tps": 89240, "wall": 10179.2} {"step": 13861, "train_loss": 3.4544389247894287, "lr": 0.0002561056926561594, "tps": 89199, "wall": 10184.5} {"step": 13862, "train_loss": 3.384363889694214, "lr": 0.00025608692382192097, "tps": 89159, "wall": 10189.9} {"step": 13863, "train_loss": 3.386932611465454, "lr": 0.0002560681545788879, "tps": 89118, "wall": 10195.3} {"step": 13864, "train_loss": 3.380828380584717, "lr": 0.00025604938492727295, "tps": 89078, "wall": 10200.7} {"step": 13865, "train_loss": 3.356351613998413, "lr": 0.00025603061486728857, "tps": 89037, "wall": 10206.0} {"step": 13866, "train_loss": 3.284303665161133, "lr": 0.00025601184439914734, "tps": 88997, "wall": 10211.4} {"step": 13867, "train_loss": 3.308267116546631, "lr": 0.00025599307352306203, "tps": 88957, "wall": 10216.8} {"step": 13868, "train_loss": 3.4259071350097656, "lr": 0.00025597430223924525, "tps": 88917, "wall": 10222.1} {"step": 13869, "train_loss": 3.297149896621704, "lr": 0.0002559555305479097, "tps": 88877, "wall": 10227.4} {"step": 13870, "train_loss": 3.3835394382476807, "lr": 0.0002559367584492678, "tps": 88836, "wall": 10232.8} {"step": 13871, "train_loss": 3.3735435009002686, "lr": 0.00025591798594353253, "tps": 88797, "wall": 10238.1} {"step": 13872, "train_loss": 3.292895555496216, "lr": 0.0002558992130309163, "tps": 88757, "wall": 10243.4} {"step": 13873, "train_loss": 3.314643383026123, "lr": 0.00025588043971163174, "tps": 88717, "wall": 10248.7} {"step": 13874, "train_loss": 3.3008909225463867, "lr": 0.0002558616659858918, "tps": 88678, "wall": 10254.0} {"step": 13875, "train_loss": 3.4451797008514404, "lr": 0.0002558428918539088, "tps": 88638, "wall": 10259.3} {"step": 13876, "train_loss": 3.3034963607788086, "lr": 0.00025582411731589564, "tps": 88599, "wall": 10264.6} {"step": 13877, "train_loss": 3.441758632659912, "lr": 0.000255805342372065, "tps": 88560, "wall": 10269.9} {"step": 13878, "train_loss": 3.440901756286621, "lr": 0.00025578656702262946, "tps": 88521, "wall": 10275.2} {"step": 13879, "train_loss": 3.389193296432495, "lr": 0.0002557677912678017, "tps": 88481, "wall": 10280.5} {"step": 13880, "train_loss": 3.394289970397949, "lr": 0.00025574901510779457, "tps": 88442, "wall": 10285.8} {"step": 13881, "train_loss": 3.506394386291504, "lr": 0.0002557302385428206, "tps": 88403, "wall": 10291.2} {"step": 13882, "train_loss": 3.344985008239746, "lr": 0.00025571146157309256, "tps": 88363, "wall": 10296.5} {"step": 13883, "train_loss": 3.393630266189575, "lr": 0.00025569268419882316, "tps": 88325, "wall": 10301.7} {"step": 13884, "train_loss": 3.3861870765686035, "lr": 0.00025567390642022516, "tps": 88285, "wall": 10307.1} {"step": 13885, "train_loss": 3.538426637649536, "lr": 0.00025565512823751114, "tps": 88247, "wall": 10312.3} {"step": 13886, "train_loss": 3.3650827407836914, "lr": 0.0002556363496508939, "tps": 88208, "wall": 10317.6} {"step": 13887, "train_loss": 3.40112042427063, "lr": 0.0002556175706605862, "tps": 88169, "wall": 10322.9} {"step": 13888, "train_loss": 3.4526913166046143, "lr": 0.0002555987912668007, "tps": 88131, "wall": 10328.1} {"step": 13889, "train_loss": 3.3738439083099365, "lr": 0.00025558001146975016, "tps": 88092, "wall": 10333.4} {"step": 13890, "train_loss": 3.3611955642700195, "lr": 0.00025556123126964733, "tps": 88053, "wall": 10338.7} {"step": 13891, "train_loss": 3.280797243118286, "lr": 0.000255542450666705, "tps": 88015, "wall": 10344.0} {"step": 13892, "train_loss": 3.4123964309692383, "lr": 0.00025552366966113586, "tps": 87975, "wall": 10349.3} {"step": 13893, "train_loss": 3.3897337913513184, "lr": 0.0002555048882531526, "tps": 87937, "wall": 10354.6} {"step": 13894, "train_loss": 3.4232850074768066, "lr": 0.0002554861064429681, "tps": 87898, "wall": 10359.9} {"step": 13895, "train_loss": 3.395449161529541, "lr": 0.000255467324230795, "tps": 87860, "wall": 10365.2} {"step": 13896, "train_loss": 3.5150609016418457, "lr": 0.00025544854161684623, "tps": 87821, "wall": 10370.5} {"step": 13897, "train_loss": 3.388375759124756, "lr": 0.0002554297586013344, "tps": 87783, "wall": 10375.7} {"step": 13898, "train_loss": 3.3215749263763428, "lr": 0.00025541097518447237, "tps": 87745, "wall": 10381.0} {"step": 13899, "train_loss": 3.478346347808838, "lr": 0.00025539219136647286, "tps": 87706, "wall": 10386.3} {"step": 13900, "train_loss": 3.413341999053955, "lr": 0.00025537340714754873, "tps": 87668, "wall": 10391.7} {"step": 13901, "train_loss": 3.282214879989624, "lr": 0.00025535462252791275, "tps": 87629, "wall": 10396.9} {"step": 13902, "train_loss": 3.368861198425293, "lr": 0.00025533583750777763, "tps": 87591, "wall": 10402.2} {"step": 13903, "train_loss": 3.4736454486846924, "lr": 0.00025531705208735626, "tps": 87553, "wall": 10407.5} {"step": 13904, "train_loss": 3.348271369934082, "lr": 0.0002552982662668614, "tps": 87514, "wall": 10412.9} {"step": 13905, "train_loss": 3.3714492321014404, "lr": 0.00025527948004650593, "tps": 87476, "wall": 10418.2} {"step": 13906, "train_loss": 3.3207411766052246, "lr": 0.0002552606934265025, "tps": 87438, "wall": 10423.5} {"step": 13907, "train_loss": 3.3776979446411133, "lr": 0.0002552419064070641, "tps": 87400, "wall": 10428.7} {"step": 13908, "train_loss": 3.376077175140381, "lr": 0.0002552231189884035, "tps": 87362, "wall": 10434.0} {"step": 13909, "train_loss": 3.4691028594970703, "lr": 0.00025520433117073345, "tps": 87324, "wall": 10439.3} {"step": 13910, "train_loss": 3.3676252365112305, "lr": 0.00025518554295426684, "tps": 87286, "wall": 10444.6} {"step": 13911, "train_loss": 3.2913458347320557, "lr": 0.00025516675433921655, "tps": 87249, "wall": 10449.8} {"step": 13912, "train_loss": 3.3606557846069336, "lr": 0.0002551479653257953, "tps": 87211, "wall": 10455.1} {"step": 13913, "train_loss": 3.482977867126465, "lr": 0.00025512917591421596, "tps": 87172, "wall": 10460.5} {"step": 13914, "train_loss": 3.342574119567871, "lr": 0.0002551103861046916, "tps": 87134, "wall": 10465.8} {"step": 13915, "train_loss": 3.391179323196411, "lr": 0.0002550915958974347, "tps": 87096, "wall": 10471.1} {"step": 13916, "train_loss": 3.3133692741394043, "lr": 0.00025507280529265836, "tps": 87058, "wall": 10476.4} {"step": 13917, "train_loss": 3.3238625526428223, "lr": 0.0002550540142905754, "tps": 87020, "wall": 10481.7} {"step": 13918, "train_loss": 3.3431763648986816, "lr": 0.00025503522289139867, "tps": 86983, "wall": 10487.0} {"step": 13919, "train_loss": 3.253871202468872, "lr": 0.000255016431095341, "tps": 86945, "wall": 10492.3} {"step": 13920, "train_loss": 3.3686702251434326, "lr": 0.0002549976389026153, "tps": 86907, "wall": 10497.6} {"step": 13921, "train_loss": 3.38494873046875, "lr": 0.00025497884631343453, "tps": 86870, "wall": 10502.9} {"step": 13922, "train_loss": 3.3931407928466797, "lr": 0.0002549600533280114, "tps": 86833, "wall": 10508.2} {"step": 13923, "train_loss": 3.3602492809295654, "lr": 0.00025494125994655897, "tps": 86795, "wall": 10513.4} {"step": 13924, "train_loss": 3.312995433807373, "lr": 0.00025492246616929006, "tps": 86758, "wall": 10518.7} {"step": 13925, "train_loss": 3.2534475326538086, "lr": 0.0002549036719964175, "tps": 86721, "wall": 10524.0} {"step": 13926, "train_loss": 3.292901039123535, "lr": 0.0002548848774281543, "tps": 86682, "wall": 10529.4} {"step": 13927, "train_loss": 3.349679708480835, "lr": 0.0002548660824647133, "tps": 86645, "wall": 10534.7} {"step": 13928, "train_loss": 3.3602099418640137, "lr": 0.00025484728710630747, "tps": 86607, "wall": 10540.0} {"step": 13929, "train_loss": 3.4236488342285156, "lr": 0.00025482849135314965, "tps": 86570, "wall": 10545.3} {"step": 13930, "train_loss": 3.4397499561309814, "lr": 0.00025480969520545277, "tps": 86533, "wall": 10550.6} {"step": 13931, "train_loss": 3.355074644088745, "lr": 0.0002547908986634299, "tps": 86496, "wall": 10555.9} {"step": 13932, "train_loss": 3.308617115020752, "lr": 0.00025477210172729375, "tps": 86459, "wall": 10561.2} {"step": 13933, "train_loss": 3.3646199703216553, "lr": 0.0002547533043972573, "tps": 86422, "wall": 10566.5} {"step": 13934, "train_loss": 3.4798593521118164, "lr": 0.00025473450667353365, "tps": 86384, "wall": 10571.8} {"step": 13935, "train_loss": 3.431063652038574, "lr": 0.0002547157085563356, "tps": 86348, "wall": 10577.0} {"step": 13936, "train_loss": 3.354647397994995, "lr": 0.00025469691004587606, "tps": 86311, "wall": 10582.4} {"step": 13937, "train_loss": 3.43271803855896, "lr": 0.00025467811114236814, "tps": 86274, "wall": 10587.7} {"step": 13938, "train_loss": 3.403564691543579, "lr": 0.00025465931184602466, "tps": 86236, "wall": 10593.0} {"step": 13939, "train_loss": 3.425464391708374, "lr": 0.0002546405121570586, "tps": 86199, "wall": 10598.3} {"step": 13940, "train_loss": 3.411447763442993, "lr": 0.00025462171207568294, "tps": 86162, "wall": 10603.6} {"step": 13941, "train_loss": 3.2946877479553223, "lr": 0.0002546029116021107, "tps": 86125, "wall": 10608.9} {"step": 13942, "train_loss": 3.3558924198150635, "lr": 0.0002545841107365548, "tps": 86089, "wall": 10614.2} {"step": 13943, "train_loss": 3.360403299331665, "lr": 0.00025456530947922816, "tps": 86052, "wall": 10619.5} {"step": 13944, "train_loss": 3.307699680328369, "lr": 0.0002545465078303439, "tps": 86015, "wall": 10624.8} {"step": 13945, "train_loss": 3.306594133377075, "lr": 0.0002545277057901148, "tps": 85978, "wall": 10630.1} {"step": 13946, "train_loss": 3.3429815769195557, "lr": 0.00025450890335875414, "tps": 85942, "wall": 10635.4} {"step": 13947, "train_loss": 3.309147834777832, "lr": 0.00025449010053647466, "tps": 85905, "wall": 10640.7} {"step": 13948, "train_loss": 3.4016923904418945, "lr": 0.0002544712973234895, "tps": 85868, "wall": 10646.0} {"step": 13949, "train_loss": 3.3593082427978516, "lr": 0.0002544524937200116, "tps": 85831, "wall": 10651.4} {"step": 13950, "train_loss": 3.4364476203918457, "lr": 0.000254433689726254, "tps": 85795, "wall": 10656.6} {"step": 13951, "train_loss": 3.334869384765625, "lr": 0.0002544148853424297, "tps": 85759, "wall": 10661.9} {"step": 13952, "train_loss": 3.4108290672302246, "lr": 0.00025439608056875175, "tps": 85723, "wall": 10667.2} {"step": 13953, "train_loss": 3.2631216049194336, "lr": 0.00025437727540543307, "tps": 85686, "wall": 10672.5} {"step": 13954, "train_loss": 3.359405517578125, "lr": 0.00025435846985268675, "tps": 85650, "wall": 10677.8} {"step": 13955, "train_loss": 3.3235907554626465, "lr": 0.0002543396639107259, "tps": 85613, "wall": 10683.1} {"step": 13956, "train_loss": 3.356346607208252, "lr": 0.00025432085757976343, "tps": 85577, "wall": 10688.4} {"step": 13957, "train_loss": 3.327629327774048, "lr": 0.0002543020508600124, "tps": 85541, "wall": 10693.7} {"step": 13958, "train_loss": 3.3918566703796387, "lr": 0.00025428324375168594, "tps": 85504, "wall": 10699.0} {"step": 13959, "train_loss": 3.337019920349121, "lr": 0.00025426443625499706, "tps": 85468, "wall": 10704.3} {"step": 13960, "train_loss": 3.3944203853607178, "lr": 0.00025424562837015875, "tps": 85431, "wall": 10709.7} {"step": 13961, "train_loss": 3.361602783203125, "lr": 0.000254226820097384, "tps": 85395, "wall": 10715.0} {"step": 13962, "train_loss": 3.4758028984069824, "lr": 0.0002542080114368862, "tps": 85359, "wall": 10720.2} {"step": 13963, "train_loss": 3.321978807449341, "lr": 0.00025418920238887805, "tps": 85323, "wall": 10725.6} {"step": 13964, "train_loss": 3.3642067909240723, "lr": 0.0002541703929535728, "tps": 85287, "wall": 10730.9} {"step": 13965, "train_loss": 3.3406505584716797, "lr": 0.00025415158313118346, "tps": 85251, "wall": 10736.1} {"step": 13966, "train_loss": 3.3872733116149902, "lr": 0.0002541327729219232, "tps": 85216, "wall": 10741.4} {"step": 13967, "train_loss": 3.4005961418151855, "lr": 0.00025411396232600495, "tps": 85180, "wall": 10746.7} {"step": 13968, "train_loss": 3.257725715637207, "lr": 0.000254095151343642, "tps": 85143, "wall": 10752.1} {"step": 13969, "train_loss": 3.352132797241211, "lr": 0.0002540763399750473, "tps": 85107, "wall": 10757.4} {"step": 13970, "train_loss": 3.291706085205078, "lr": 0.00025405752822043394, "tps": 85072, "wall": 10762.7} {"step": 13971, "train_loss": 3.440009593963623, "lr": 0.00025403871608001505, "tps": 85036, "wall": 10767.9} {"step": 13972, "train_loss": 3.3016490936279297, "lr": 0.00025401990355400383, "tps": 85000, "wall": 10773.3} {"step": 13973, "train_loss": 3.4945602416992188, "lr": 0.0002540010906426132, "tps": 84964, "wall": 10778.7} {"step": 13974, "train_loss": 3.3759284019470215, "lr": 0.0002539822773460564, "tps": 84928, "wall": 10784.0} {"step": 13975, "train_loss": 3.3861026763916016, "lr": 0.0002539634636645466, "tps": 84892, "wall": 10789.3} {"step": 13976, "train_loss": 3.373893976211548, "lr": 0.00025394464959829674, "tps": 84856, "wall": 10794.6} {"step": 13977, "train_loss": 3.2917733192443848, "lr": 0.00025392583514752016, "tps": 84821, "wall": 10799.9} {"step": 13978, "train_loss": 3.4551355838775635, "lr": 0.0002539070203124298, "tps": 84785, "wall": 10805.2} {"step": 13979, "train_loss": 3.3147788047790527, "lr": 0.0002538882050932389, "tps": 84750, "wall": 10810.5} {"step": 13980, "train_loss": 3.388526201248169, "lr": 0.00025386938949016055, "tps": 84715, "wall": 10815.8} {"step": 13981, "train_loss": 3.325045108795166, "lr": 0.0002538505735034079, "tps": 84679, "wall": 10821.0} {"step": 13982, "train_loss": 3.404855251312256, "lr": 0.00025383175713319424, "tps": 84644, "wall": 10826.3} {"step": 13983, "train_loss": 3.340510368347168, "lr": 0.0002538129403797326, "tps": 84608, "wall": 10831.7} {"step": 13984, "train_loss": 3.3278822898864746, "lr": 0.00025379412324323604, "tps": 84573, "wall": 10837.0} {"step": 13985, "train_loss": 3.318678855895996, "lr": 0.0002537753057239179, "tps": 84537, "wall": 10842.3} {"step": 13986, "train_loss": 3.4340338706970215, "lr": 0.00025375648782199124, "tps": 84502, "wall": 10847.6} {"step": 13987, "train_loss": 3.4333114624023438, "lr": 0.00025373766953766926, "tps": 84467, "wall": 10852.9} {"step": 13988, "train_loss": 3.4528648853302, "lr": 0.0002537188508711651, "tps": 84432, "wall": 10858.2} {"step": 13989, "train_loss": 3.4276766777038574, "lr": 0.000253700031822692, "tps": 84396, "wall": 10863.5} {"step": 13990, "train_loss": 3.302426338195801, "lr": 0.00025368121239246317, "tps": 84361, "wall": 10868.9} {"step": 13991, "train_loss": 3.399035930633545, "lr": 0.0002536623925806916, "tps": 84325, "wall": 10874.2} {"step": 13992, "train_loss": 3.322211980819702, "lr": 0.00025364357238759073, "tps": 84290, "wall": 10879.5} {"step": 13993, "train_loss": 3.409590244293213, "lr": 0.0002536247518133737, "tps": 84255, "wall": 10884.8} {"step": 13994, "train_loss": 3.330777645111084, "lr": 0.00025360593085825366, "tps": 84220, "wall": 10890.2} {"step": 13995, "train_loss": 3.327638626098633, "lr": 0.00025358710952244374, "tps": 84185, "wall": 10895.5} {"step": 13996, "train_loss": 3.440499782562256, "lr": 0.00025356828780615724, "tps": 84150, "wall": 10900.8} {"step": 13997, "train_loss": 3.292522668838501, "lr": 0.0002535494657096073, "tps": 84115, "wall": 10906.1} {"step": 13998, "train_loss": 3.466655731201172, "lr": 0.0002535306432330073, "tps": 84081, "wall": 10911.4} {"step": 13999, "train_loss": 3.39461088180542, "lr": 0.0002535118203765704, "tps": 84046, "wall": 10916.6} {"step": 14000, "train_loss": 3.405421495437622, "lr": 0.00025349299714050967, "tps": 84011, "wall": 10921.9, "val_loss_monitor": 3.4716723763222825} {"step": 14001, "train_loss": 3.308936595916748, "lr": 0.0002534741735250385, "tps": 83710, "wall": 10962.0} {"step": 14002, "train_loss": 3.342855453491211, "lr": 0.00025345534953037, "tps": 83675, "wall": 10967.4} {"step": 14003, "train_loss": 3.293999433517456, "lr": 0.00025343652515671765, "tps": 83641, "wall": 10972.7} {"step": 14004, "train_loss": 3.4108974933624268, "lr": 0.00025341770040429443, "tps": 83606, "wall": 10978.0} {"step": 14005, "train_loss": 3.3342909812927246, "lr": 0.0002533988752733137, "tps": 83571, "wall": 10983.4} {"step": 14006, "train_loss": 3.4926347732543945, "lr": 0.00025338004976398876, "tps": 83536, "wall": 10988.7} {"step": 14007, "train_loss": 3.475794792175293, "lr": 0.0002533612238765328, "tps": 83502, "wall": 10994.0} {"step": 14008, "train_loss": 3.42829966545105, "lr": 0.00025334239761115905, "tps": 83467, "wall": 10999.4} {"step": 14009, "train_loss": 3.407097339630127, "lr": 0.00025332357096808077, "tps": 83432, "wall": 11004.8} {"step": 14010, "train_loss": 3.3169519901275635, "lr": 0.0002533047439475114, "tps": 83397, "wall": 11010.2} {"step": 14011, "train_loss": 3.427563428878784, "lr": 0.000253285916549664, "tps": 83363, "wall": 11015.5} {"step": 14012, "train_loss": 3.2156982421875, "lr": 0.0002532670887747519, "tps": 83328, "wall": 11020.9} {"step": 14013, "train_loss": 3.420809030532837, "lr": 0.00025324826062298855, "tps": 83294, "wall": 11026.2} {"step": 14014, "train_loss": 3.3753111362457275, "lr": 0.000253229432094587, "tps": 83259, "wall": 11031.6} {"step": 14015, "train_loss": 3.3379478454589844, "lr": 0.00025321060318976064, "tps": 83225, "wall": 11036.9} {"step": 14016, "train_loss": 3.3102245330810547, "lr": 0.00025319177390872285, "tps": 83191, "wall": 11042.3} {"step": 14017, "train_loss": 3.3532023429870605, "lr": 0.0002531729442516868, "tps": 83156, "wall": 11047.6} {"step": 14018, "train_loss": 3.310635566711426, "lr": 0.0002531541142188658, "tps": 83122, "wall": 11053.0} {"step": 14019, "train_loss": 3.399878740310669, "lr": 0.0002531352838104733, "tps": 83088, "wall": 11058.3} {"step": 14020, "train_loss": 3.423471689224243, "lr": 0.0002531164530267225, "tps": 83054, "wall": 11063.6} {"step": 14021, "train_loss": 3.5620696544647217, "lr": 0.00025309762186782664, "tps": 83019, "wall": 11069.0} {"step": 14022, "train_loss": 3.406468152999878, "lr": 0.0002530787903339992, "tps": 82985, "wall": 11074.3} {"step": 14023, "train_loss": 3.5242490768432617, "lr": 0.0002530599584254534, "tps": 82951, "wall": 11079.7} {"step": 14024, "train_loss": 3.4067792892456055, "lr": 0.00025304112614240264, "tps": 82917, "wall": 11085.0} {"step": 14025, "train_loss": 3.410750389099121, "lr": 0.0002530222934850602, "tps": 82883, "wall": 11090.3} {"step": 14026, "train_loss": 3.4567339420318604, "lr": 0.0002530034604536394, "tps": 82849, "wall": 11095.7} {"step": 14027, "train_loss": 3.3638999462127686, "lr": 0.00025298462704835366, "tps": 82815, "wall": 11101.0} {"step": 14028, "train_loss": 3.3627214431762695, "lr": 0.00025296579326941626, "tps": 82781, "wall": 11106.4} {"step": 14029, "train_loss": 3.403985023498535, "lr": 0.0002529469591170406, "tps": 82748, "wall": 11111.7} {"step": 14030, "train_loss": 3.3886961936950684, "lr": 0.00025292812459143995, "tps": 82714, "wall": 11117.0} {"step": 14031, "train_loss": 3.3782248497009277, "lr": 0.0002529092896928278, "tps": 82680, "wall": 11122.3} {"step": 14032, "train_loss": 3.5240321159362793, "lr": 0.00025289045442141735, "tps": 82647, "wall": 11127.6} {"step": 14033, "train_loss": 3.398103713989258, "lr": 0.00025287161877742204, "tps": 82613, "wall": 11133.0} {"step": 14034, "train_loss": 3.3300395011901855, "lr": 0.0002528527827610554, "tps": 82579, "wall": 11138.3} {"step": 14035, "train_loss": 3.3967785835266113, "lr": 0.0002528339463725305, "tps": 82546, "wall": 11143.6} {"step": 14036, "train_loss": 3.431246280670166, "lr": 0.00025281510961206095, "tps": 82512, "wall": 11148.9} {"step": 14037, "train_loss": 3.304577350616455, "lr": 0.0002527962724798601, "tps": 82479, "wall": 11154.2} {"step": 14038, "train_loss": 3.399045944213867, "lr": 0.00025277743497614124, "tps": 82446, "wall": 11159.5} {"step": 14039, "train_loss": 3.3975117206573486, "lr": 0.0002527585971011178, "tps": 82413, "wall": 11164.8} {"step": 14040, "train_loss": 3.3575429916381836, "lr": 0.00025273975885500323, "tps": 82379, "wall": 11170.2} {"step": 14041, "train_loss": 3.409440755844116, "lr": 0.00025272092023801096, "tps": 82346, "wall": 11175.4} {"step": 14042, "train_loss": 3.3336031436920166, "lr": 0.00025270208125035426, "tps": 82313, "wall": 11180.7} {"step": 14043, "train_loss": 3.3994905948638916, "lr": 0.00025268324189224665, "tps": 82280, "wall": 11186.0} {"step": 14044, "train_loss": 3.306300401687622, "lr": 0.0002526644021639015, "tps": 82246, "wall": 11191.4} {"step": 14045, "train_loss": 3.407240152359009, "lr": 0.0002526455620655322, "tps": 82213, "wall": 11196.7} {"step": 14046, "train_loss": 3.400813579559326, "lr": 0.0002526267215973523, "tps": 82180, "wall": 11202.0} {"step": 14047, "train_loss": 3.361607074737549, "lr": 0.0002526078807595751, "tps": 82147, "wall": 11207.3} {"step": 14048, "train_loss": 3.373476505279541, "lr": 0.000252589039552414, "tps": 82114, "wall": 11212.6} {"step": 14049, "train_loss": 3.425346851348877, "lr": 0.0002525701979760825, "tps": 82081, "wall": 11217.9} {"step": 14050, "train_loss": 3.357573986053467, "lr": 0.00025255135603079404, "tps": 82048, "wall": 11223.2} {"step": 14051, "train_loss": 3.5079216957092285, "lr": 0.0002525325137167621, "tps": 82015, "wall": 11228.5} {"step": 14052, "train_loss": 3.3795671463012695, "lr": 0.00025251367103420005, "tps": 81982, "wall": 11233.8} {"step": 14053, "train_loss": 3.3603262901306152, "lr": 0.00025249482798332136, "tps": 81949, "wall": 11239.1} {"step": 14054, "train_loss": 3.4110429286956787, "lr": 0.0002524759845643396, "tps": 81916, "wall": 11244.4} {"step": 14055, "train_loss": 3.3945465087890625, "lr": 0.00025245714077746806, "tps": 81883, "wall": 11249.8} {"step": 14056, "train_loss": 3.441113233566284, "lr": 0.00025243829662292025, "tps": 81851, "wall": 11255.0} {"step": 14057, "train_loss": 3.269853115081787, "lr": 0.00025241945210090975, "tps": 81818, "wall": 11260.3} {"step": 14058, "train_loss": 3.363426685333252, "lr": 0.00025240060721164984, "tps": 81786, "wall": 11265.6} {"step": 14059, "train_loss": 3.473759174346924, "lr": 0.00025238176195535415, "tps": 81753, "wall": 11270.9} {"step": 14060, "train_loss": 3.3590588569641113, "lr": 0.00025236291633223606, "tps": 81720, "wall": 11276.2} {"step": 14061, "train_loss": 3.4787096977233887, "lr": 0.0002523440703425092, "tps": 81688, "wall": 11281.5} {"step": 14062, "train_loss": 3.297696828842163, "lr": 0.0002523252239863869, "tps": 81656, "wall": 11286.8} {"step": 14063, "train_loss": 3.420598030090332, "lr": 0.00025230637726408265, "tps": 81623, "wall": 11292.1} {"step": 14064, "train_loss": 3.421626091003418, "lr": 0.0002522875301758102, "tps": 81591, "wall": 11297.4} {"step": 14065, "train_loss": 3.3155758380889893, "lr": 0.0002522686827217827, "tps": 81558, "wall": 11302.7} {"step": 14066, "train_loss": 3.4647579193115234, "lr": 0.0002522498349022138, "tps": 81526, "wall": 11308.0} {"step": 14067, "train_loss": 3.4170174598693848, "lr": 0.0002522309867173171, "tps": 81493, "wall": 11313.3} {"step": 14068, "train_loss": 3.459261417388916, "lr": 0.000252212138167306, "tps": 81461, "wall": 11318.5} {"step": 14069, "train_loss": 3.3560872077941895, "lr": 0.0002521932892523941, "tps": 81429, "wall": 11323.8} {"step": 14070, "train_loss": 3.4627790451049805, "lr": 0.0002521744399727948, "tps": 81397, "wall": 11329.1} {"step": 14071, "train_loss": 3.461648941040039, "lr": 0.0002521555903287219, "tps": 81364, "wall": 11334.4} {"step": 14072, "train_loss": 3.390024185180664, "lr": 0.0002521367403203885, "tps": 81332, "wall": 11339.7} {"step": 14073, "train_loss": 3.4192564487457275, "lr": 0.00025211788994800846, "tps": 81300, "wall": 11345.0} {"step": 14074, "train_loss": 3.445316791534424, "lr": 0.00025209903921179526, "tps": 81268, "wall": 11350.3} {"step": 14075, "train_loss": 3.3762333393096924, "lr": 0.0002520801881119624, "tps": 81236, "wall": 11355.5} {"step": 14076, "train_loss": 3.3842384815216064, "lr": 0.00025206133664872337, "tps": 81204, "wall": 11360.8} {"step": 14077, "train_loss": 3.345062255859375, "lr": 0.00025204248482229175, "tps": 81172, "wall": 11366.1} {"step": 14078, "train_loss": 3.5437088012695312, "lr": 0.0002520236326328813, "tps": 81139, "wall": 11371.5} {"step": 14079, "train_loss": 3.364384651184082, "lr": 0.0002520047800807052, "tps": 81108, "wall": 11376.7} {"step": 14080, "train_loss": 3.3494300842285156, "lr": 0.00025198592716597733, "tps": 81075, "wall": 11382.1} {"step": 14081, "train_loss": 3.423358917236328, "lr": 0.0002519670738889112, "tps": 81044, "wall": 11387.4} {"step": 14082, "train_loss": 3.3454599380493164, "lr": 0.00025194822024972026, "tps": 81012, "wall": 11392.6} {"step": 14083, "train_loss": 3.3256473541259766, "lr": 0.00025192936624861815, "tps": 80980, "wall": 11397.9} {"step": 14084, "train_loss": 3.4442248344421387, "lr": 0.0002519105118858185, "tps": 80948, "wall": 11403.2} {"step": 14085, "train_loss": 3.370288848876953, "lr": 0.00025189165716153473, "tps": 80917, "wall": 11408.5} {"step": 14086, "train_loss": 3.379108190536499, "lr": 0.00025187280207598066, "tps": 80885, "wall": 11413.8} {"step": 14087, "train_loss": 3.2724599838256836, "lr": 0.00025185394662936974, "tps": 80853, "wall": 11419.0} {"step": 14088, "train_loss": 3.4535341262817383, "lr": 0.00025183509082191553, "tps": 80821, "wall": 11424.4} {"step": 14089, "train_loss": 3.489983081817627, "lr": 0.00025181623465383177, "tps": 80789, "wall": 11429.7} {"step": 14090, "train_loss": 3.38680362701416, "lr": 0.00025179737812533194, "tps": 80757, "wall": 11435.0} {"step": 14091, "train_loss": 3.3682799339294434, "lr": 0.00025177852123662973, "tps": 80726, "wall": 11440.3} {"step": 14092, "train_loss": 3.500643253326416, "lr": 0.00025175966398793863, "tps": 80694, "wall": 11445.6} {"step": 14093, "train_loss": 3.379352569580078, "lr": 0.0002517408063794724, "tps": 80662, "wall": 11450.9} {"step": 14094, "train_loss": 3.417677402496338, "lr": 0.0002517219484114446, "tps": 80631, "wall": 11456.2} {"step": 14095, "train_loss": 3.4363129138946533, "lr": 0.0002517030900840688, "tps": 80600, "wall": 11461.5} {"step": 14096, "train_loss": 3.4124081134796143, "lr": 0.0002516842313975587, "tps": 80568, "wall": 11466.7} {"step": 14097, "train_loss": 3.38663911819458, "lr": 0.00025166537235212796, "tps": 80537, "wall": 11472.0} {"step": 14098, "train_loss": 3.438866376876831, "lr": 0.00025164651294799014, "tps": 80506, "wall": 11477.3} {"step": 14099, "train_loss": 3.334956645965576, "lr": 0.00025162765318535886, "tps": 80474, "wall": 11482.6} {"step": 14100, "train_loss": 3.382169246673584, "lr": 0.0002516087930644479, "tps": 80443, "wall": 11487.9} {"step": 14101, "train_loss": 3.3934028148651123, "lr": 0.0002515899325854708, "tps": 80411, "wall": 11493.3} {"step": 14102, "train_loss": 3.43196964263916, "lr": 0.00025157107174864123, "tps": 80379, "wall": 11498.6} {"step": 14103, "train_loss": 3.4133944511413574, "lr": 0.00025155221055417283, "tps": 80348, "wall": 11503.9} {"step": 14104, "train_loss": 3.355358839035034, "lr": 0.00025153334900227924, "tps": 80317, "wall": 11509.2} {"step": 14105, "train_loss": 3.4273853302001953, "lr": 0.00025151448709317427, "tps": 80285, "wall": 11514.5} {"step": 14106, "train_loss": 3.3662562370300293, "lr": 0.0002514956248270714, "tps": 80254, "wall": 11519.8} {"step": 14107, "train_loss": 3.275822639465332, "lr": 0.0002514767622041844, "tps": 80223, "wall": 11525.1} {"step": 14108, "train_loss": 3.297567129135132, "lr": 0.000251457899224727, "tps": 80192, "wall": 11530.4} {"step": 14109, "train_loss": 3.4284095764160156, "lr": 0.0002514390358889128, "tps": 80161, "wall": 11535.7} {"step": 14110, "train_loss": 3.4251058101654053, "lr": 0.00025142017219695545, "tps": 80129, "wall": 11541.0} {"step": 14111, "train_loss": 3.3225865364074707, "lr": 0.0002514013081490687, "tps": 80098, "wall": 11546.3} {"step": 14112, "train_loss": 3.3833606243133545, "lr": 0.0002513824437454662, "tps": 80067, "wall": 11551.7} {"step": 14113, "train_loss": 3.417302131652832, "lr": 0.00025136357898636173, "tps": 80036, "wall": 11557.0} {"step": 14114, "train_loss": 3.360280990600586, "lr": 0.000251344713871969, "tps": 80005, "wall": 11562.2} {"step": 14115, "train_loss": 3.464352607727051, "lr": 0.00025132584840250157, "tps": 79974, "wall": 11567.5} {"step": 14116, "train_loss": 3.2997424602508545, "lr": 0.00025130698257817325, "tps": 79943, "wall": 11572.8} {"step": 14117, "train_loss": 3.3828916549682617, "lr": 0.00025128811639919775, "tps": 79912, "wall": 11578.1} {"step": 14118, "train_loss": 3.5287909507751465, "lr": 0.00025126924986578874, "tps": 79881, "wall": 11583.4} {"step": 14119, "train_loss": 3.326864719390869, "lr": 0.00025125038297816004, "tps": 79850, "wall": 11588.7} {"step": 14120, "train_loss": 3.4570374488830566, "lr": 0.00025123151573652524, "tps": 79819, "wall": 11594.0} {"step": 14121, "train_loss": 3.4010255336761475, "lr": 0.0002512126481410982, "tps": 79789, "wall": 11599.3} {"step": 14122, "train_loss": 3.270984411239624, "lr": 0.0002511937801920926, "tps": 79758, "wall": 11604.6} {"step": 14123, "train_loss": 3.3761684894561768, "lr": 0.0002511749118897221, "tps": 79726, "wall": 11610.0} {"step": 14124, "train_loss": 3.3874948024749756, "lr": 0.0002511560432342005, "tps": 79696, "wall": 11615.3} {"step": 14125, "train_loss": 3.398226261138916, "lr": 0.0002511371742257416, "tps": 79665, "wall": 11620.5} {"step": 14126, "train_loss": 3.392181396484375, "lr": 0.00025111830486455915, "tps": 79635, "wall": 11625.8} {"step": 14127, "train_loss": 3.3927993774414062, "lr": 0.00025109943515086685, "tps": 79604, "wall": 11631.1} {"step": 14128, "train_loss": 3.380772590637207, "lr": 0.0002510805650848784, "tps": 79573, "wall": 11636.5} {"step": 14129, "train_loss": 3.351391077041626, "lr": 0.0002510616946668077, "tps": 79542, "wall": 11641.9} {"step": 14130, "train_loss": 3.425306558609009, "lr": 0.00025104282389686836, "tps": 79512, "wall": 11647.1} {"step": 14131, "train_loss": 3.4503419399261475, "lr": 0.00025102395277527427, "tps": 79481, "wall": 11652.5} {"step": 14132, "train_loss": 3.395531177520752, "lr": 0.00025100508130223925, "tps": 79450, "wall": 11657.8} {"step": 14133, "train_loss": 3.2881274223327637, "lr": 0.00025098620947797693, "tps": 79420, "wall": 11663.1} {"step": 14134, "train_loss": 3.358635425567627, "lr": 0.00025096733730270107, "tps": 79389, "wall": 11668.4} {"step": 14135, "train_loss": 3.4151554107666016, "lr": 0.0002509484647766256, "tps": 79358, "wall": 11673.8} {"step": 14136, "train_loss": 3.392124652862549, "lr": 0.00025092959189996426, "tps": 79328, "wall": 11679.0} {"step": 14137, "train_loss": 3.51670241355896, "lr": 0.0002509107186729308, "tps": 79298, "wall": 11684.4} {"step": 14138, "train_loss": 3.476846694946289, "lr": 0.0002508918450957391, "tps": 79267, "wall": 11689.6} {"step": 14139, "train_loss": 3.4052610397338867, "lr": 0.00025087297116860286, "tps": 79237, "wall": 11694.9} {"step": 14140, "train_loss": 3.3423657417297363, "lr": 0.00025085409689173596, "tps": 79207, "wall": 11700.2} {"step": 14141, "train_loss": 3.3206088542938232, "lr": 0.00025083522226535215, "tps": 79177, "wall": 11705.5} {"step": 14142, "train_loss": 3.390526294708252, "lr": 0.0002508163472896653, "tps": 79146, "wall": 11710.8} {"step": 14143, "train_loss": 3.3334507942199707, "lr": 0.0002507974719648892, "tps": 79116, "wall": 11716.1} {"step": 14144, "train_loss": 3.433534860610962, "lr": 0.0002507785962912377, "tps": 79086, "wall": 11721.5} {"step": 14145, "train_loss": 3.371702194213867, "lr": 0.0002507597202689245, "tps": 79056, "wall": 11726.8} {"step": 14146, "train_loss": 3.4296398162841797, "lr": 0.00025074084389816364, "tps": 79025, "wall": 11732.1} {"step": 14147, "train_loss": 3.551016330718994, "lr": 0.00025072196717916876, "tps": 78995, "wall": 11737.4} {"step": 14148, "train_loss": 3.43896746635437, "lr": 0.00025070309011215376, "tps": 78965, "wall": 11742.8} {"step": 14149, "train_loss": 3.3649613857269287, "lr": 0.00025068421269733255, "tps": 78934, "wall": 11748.1} {"step": 14150, "train_loss": 3.3644416332244873, "lr": 0.0002506653349349189, "tps": 78904, "wall": 11753.4} {"step": 14151, "train_loss": 3.31484317779541, "lr": 0.0002506464568251267, "tps": 78874, "wall": 11758.7} {"step": 14152, "train_loss": 3.4409420490264893, "lr": 0.0002506275783681697, "tps": 78845, "wall": 11764.0} {"step": 14153, "train_loss": 3.4035277366638184, "lr": 0.0002506086995642619, "tps": 78815, "wall": 11769.3} {"step": 14154, "train_loss": 3.4674770832061768, "lr": 0.00025058982041361715, "tps": 78785, "wall": 11774.5} {"step": 14155, "train_loss": 3.3684964179992676, "lr": 0.0002505709409164492, "tps": 78755, "wall": 11779.8} {"step": 14156, "train_loss": 3.416018486022949, "lr": 0.00025055206107297195, "tps": 78725, "wall": 11785.1} {"step": 14157, "train_loss": 3.402851104736328, "lr": 0.0002505331808833993, "tps": 78695, "wall": 11790.5} {"step": 14158, "train_loss": 3.3011903762817383, "lr": 0.00025051430034794516, "tps": 78665, "wall": 11795.8} {"step": 14159, "train_loss": 3.430675506591797, "lr": 0.00025049541946682336, "tps": 78636, "wall": 11801.1} {"step": 14160, "train_loss": 3.375051975250244, "lr": 0.0002504765382402478, "tps": 78606, "wall": 11806.3} {"step": 14161, "train_loss": 3.4719882011413574, "lr": 0.00025045765666843235, "tps": 78576, "wall": 11811.7} {"step": 14162, "train_loss": 3.372631072998047, "lr": 0.0002504387747515909, "tps": 78547, "wall": 11817.0} {"step": 14163, "train_loss": 3.3925976753234863, "lr": 0.0002504198924899374, "tps": 78517, "wall": 11822.2} {"step": 14164, "train_loss": 3.3848650455474854, "lr": 0.00025040100988368575, "tps": 78487, "wall": 11827.5} {"step": 14165, "train_loss": 3.3987536430358887, "lr": 0.00025038212693304974, "tps": 78458, "wall": 11832.8} {"step": 14166, "train_loss": 3.4159257411956787, "lr": 0.0002503632436382435, "tps": 78428, "wall": 11838.1} {"step": 14167, "train_loss": 3.319284677505493, "lr": 0.00025034435999948064, "tps": 78399, "wall": 11843.4} {"step": 14168, "train_loss": 3.3593273162841797, "lr": 0.0002503254760169752, "tps": 78369, "wall": 11848.8} {"step": 14169, "train_loss": 3.340672016143799, "lr": 0.00025030659169094125, "tps": 78339, "wall": 11854.1} {"step": 14170, "train_loss": 3.3224387168884277, "lr": 0.00025028770702159256, "tps": 78310, "wall": 11859.3} {"step": 14171, "train_loss": 3.440354824066162, "lr": 0.000250268822009143, "tps": 78280, "wall": 11864.6} {"step": 14172, "train_loss": 3.4081196784973145, "lr": 0.0002502499366538067, "tps": 78251, "wall": 11869.9} {"step": 14173, "train_loss": 3.340730905532837, "lr": 0.0002502310509557974, "tps": 78222, "wall": 11875.2} {"step": 14174, "train_loss": 3.449817657470703, "lr": 0.00025021216491532915, "tps": 78193, "wall": 11880.5} {"step": 14175, "train_loss": 3.3289146423339844, "lr": 0.00025019327853261587, "tps": 78164, "wall": 11885.7} {"step": 14176, "train_loss": 3.421489715576172, "lr": 0.0002501743918078715, "tps": 78135, "wall": 11891.0} {"step": 14177, "train_loss": 3.437230110168457, "lr": 0.00025015550474130995, "tps": 78105, "wall": 11896.3} {"step": 14178, "train_loss": 3.364790439605713, "lr": 0.00025013661733314525, "tps": 78076, "wall": 11901.6} {"step": 14179, "train_loss": 3.429365634918213, "lr": 0.0002501177295835913, "tps": 78047, "wall": 11906.9} {"step": 14180, "train_loss": 3.3976261615753174, "lr": 0.0002500988414928621, "tps": 78017, "wall": 11912.3} {"step": 14181, "train_loss": 3.337575912475586, "lr": 0.0002500799530611716, "tps": 77988, "wall": 11917.6} {"step": 14182, "train_loss": 3.385517120361328, "lr": 0.00025006106428873367, "tps": 77959, "wall": 11922.9} {"step": 14183, "train_loss": 3.3197689056396484, "lr": 0.0002500421751757625, "tps": 77930, "wall": 11928.2} {"step": 14184, "train_loss": 3.4209511280059814, "lr": 0.0002500232857224719, "tps": 77900, "wall": 11933.5} {"step": 14185, "train_loss": 3.4356472492218018, "lr": 0.0002500043959290759, "tps": 77871, "wall": 11938.8} {"step": 14186, "train_loss": 3.414323568344116, "lr": 0.00024998550579578843, "tps": 77843, "wall": 11944.0} {"step": 14187, "train_loss": 3.292872905731201, "lr": 0.0002499666153228236, "tps": 77814, "wall": 11949.3} {"step": 14188, "train_loss": 3.382326602935791, "lr": 0.00024994772451039524, "tps": 77785, "wall": 11954.6} {"step": 14189, "train_loss": 3.455268144607544, "lr": 0.00024992883335871755, "tps": 77756, "wall": 11959.8} {"step": 14190, "train_loss": 3.406764030456543, "lr": 0.00024990994186800436, "tps": 77727, "wall": 11965.1} {"step": 14191, "train_loss": 3.37809419631958, "lr": 0.00024989105003846976, "tps": 77698, "wall": 11970.5} {"step": 14192, "train_loss": 3.425229787826538, "lr": 0.00024987215787032765, "tps": 77669, "wall": 11975.7} {"step": 14193, "train_loss": 3.436107873916626, "lr": 0.0002498532653637922, "tps": 77641, "wall": 11981.0} {"step": 14194, "train_loss": 3.4224307537078857, "lr": 0.0002498343725190773, "tps": 77612, "wall": 11986.3} {"step": 14195, "train_loss": 3.3551483154296875, "lr": 0.00024981547933639704, "tps": 77583, "wall": 11991.5} {"step": 14196, "train_loss": 3.377962350845337, "lr": 0.0002497965858159654, "tps": 77555, "wall": 11996.8} {"step": 14197, "train_loss": 3.450270652770996, "lr": 0.00024977769195799645, "tps": 77526, "wall": 12002.0} {"step": 14198, "train_loss": 3.3411829471588135, "lr": 0.0002497587977627042, "tps": 77498, "wall": 12007.3} {"step": 14199, "train_loss": 3.455265522003174, "lr": 0.0002497399032303027, "tps": 77470, "wall": 12012.5} {"step": 14200, "train_loss": 3.3311023712158203, "lr": 0.00024972100836100585, "tps": 77441, "wall": 12017.8} {"step": 14201, "train_loss": 3.3924481868743896, "lr": 0.0002497021131550279, "tps": 77413, "wall": 12023.1} {"step": 14202, "train_loss": 3.440666913986206, "lr": 0.0002496832176125828, "tps": 77384, "wall": 12028.3} {"step": 14203, "train_loss": 3.405653715133667, "lr": 0.00024966432173388457, "tps": 77355, "wall": 12033.7} {"step": 14204, "train_loss": 3.3930609226226807, "lr": 0.0002496454255191473, "tps": 77327, "wall": 12038.9} {"step": 14205, "train_loss": 3.3971853256225586, "lr": 0.0002496265289685851, "tps": 77299, "wall": 12044.2} {"step": 14206, "train_loss": 3.393498420715332, "lr": 0.00024960763208241196, "tps": 77270, "wall": 12049.4} {"step": 14207, "train_loss": 3.3634378910064697, "lr": 0.0002495887348608419, "tps": 77242, "wall": 12054.7} {"step": 14208, "train_loss": 3.347219705581665, "lr": 0.0002495698373040892, "tps": 77214, "wall": 12059.9} {"step": 14209, "train_loss": 3.376896619796753, "lr": 0.00024955093941236763, "tps": 77185, "wall": 12065.2} {"step": 14210, "train_loss": 3.3701980113983154, "lr": 0.0002495320411858914, "tps": 77157, "wall": 12070.5} {"step": 14211, "train_loss": 3.3537395000457764, "lr": 0.00024951314262487473, "tps": 77129, "wall": 12075.8} {"step": 14212, "train_loss": 3.4119009971618652, "lr": 0.00024949424372953157, "tps": 77100, "wall": 12081.1} {"step": 14213, "train_loss": 3.4505109786987305, "lr": 0.0002494753445000759, "tps": 77072, "wall": 12086.3} {"step": 14214, "train_loss": 3.3279433250427246, "lr": 0.0002494564449367221, "tps": 77044, "wall": 12091.7} {"step": 14215, "train_loss": 3.373239517211914, "lr": 0.000249437545039684, "tps": 77016, "wall": 12096.9} {"step": 14216, "train_loss": 3.424651622772217, "lr": 0.0002494186448091758, "tps": 76988, "wall": 12102.2} {"step": 14217, "train_loss": 3.365729570388794, "lr": 0.00024939974424541164, "tps": 76959, "wall": 12107.5} {"step": 14218, "train_loss": 3.4036736488342285, "lr": 0.0002493808433486055, "tps": 76931, "wall": 12112.7} {"step": 14219, "train_loss": 3.31943416595459, "lr": 0.0002493619421189716, "tps": 76903, "wall": 12118.0} {"step": 14220, "train_loss": 3.3644118309020996, "lr": 0.00024934304055672406, "tps": 76875, "wall": 12123.3} {"step": 14221, "train_loss": 3.4710590839385986, "lr": 0.00024932413866207703, "tps": 76848, "wall": 12128.5} {"step": 14222, "train_loss": 3.3313565254211426, "lr": 0.00024930523643524455, "tps": 76819, "wall": 12133.8} {"step": 14223, "train_loss": 3.2087690830230713, "lr": 0.0002492863338764407, "tps": 76791, "wall": 12139.1} {"step": 14224, "train_loss": 3.323026657104492, "lr": 0.0002492674309858797, "tps": 76764, "wall": 12144.4} {"step": 14225, "train_loss": 3.375087022781372, "lr": 0.0002492485277637757, "tps": 76735, "wall": 12149.7} {"step": 14226, "train_loss": 3.439901351928711, "lr": 0.0002492296242103427, "tps": 76707, "wall": 12155.0} {"step": 14227, "train_loss": 3.3171451091766357, "lr": 0.000249210720325795, "tps": 76680, "wall": 12160.2} {"step": 14228, "train_loss": 3.532843828201294, "lr": 0.00024919181611034673, "tps": 76652, "wall": 12165.5} {"step": 14229, "train_loss": 3.3581910133361816, "lr": 0.0002491729115642119, "tps": 76624, "wall": 12170.8} {"step": 14230, "train_loss": 3.348534345626831, "lr": 0.0002491540066876048, "tps": 76596, "wall": 12176.1} {"step": 14231, "train_loss": 3.3370823860168457, "lr": 0.00024913510148073955, "tps": 76568, "wall": 12181.3} {"step": 14232, "train_loss": 3.265012502670288, "lr": 0.00024911619594383024, "tps": 76541, "wall": 12186.6} {"step": 14233, "train_loss": 3.252314567565918, "lr": 0.00024909729007709114, "tps": 76513, "wall": 12191.8} {"step": 14234, "train_loss": 3.4343862533569336, "lr": 0.0002490783838807363, "tps": 76485, "wall": 12197.1} {"step": 14235, "train_loss": 3.431417942047119, "lr": 0.00024905947735498, "tps": 76458, "wall": 12202.4} {"step": 14236, "train_loss": 3.3455235958099365, "lr": 0.00024904057050003633, "tps": 76430, "wall": 12207.6} {"step": 14237, "train_loss": 3.454543113708496, "lr": 0.0002490216633161195, "tps": 76402, "wall": 12213.0} {"step": 14238, "train_loss": 3.437882900238037, "lr": 0.0002490027558034438, "tps": 76374, "wall": 12218.2} {"step": 14239, "train_loss": 3.4490485191345215, "lr": 0.00024898384796222326, "tps": 76347, "wall": 12223.5} {"step": 14240, "train_loss": 3.454742431640625, "lr": 0.0002489649397926721, "tps": 76320, "wall": 12228.7} {"step": 14241, "train_loss": 3.388108730316162, "lr": 0.0002489460312950045, "tps": 76292, "wall": 12234.0} {"step": 14242, "train_loss": 3.414830207824707, "lr": 0.0002489271224694348, "tps": 76265, "wall": 12239.2} {"step": 14243, "train_loss": 3.461061477661133, "lr": 0.000248908213316177, "tps": 76237, "wall": 12244.5} {"step": 14244, "train_loss": 3.4156088829040527, "lr": 0.00024888930383544543, "tps": 76210, "wall": 12249.7} {"step": 14245, "train_loss": 3.333080530166626, "lr": 0.00024887039402745427, "tps": 76183, "wall": 12255.0} {"step": 14246, "train_loss": 3.3714818954467773, "lr": 0.00024885148389241775, "tps": 76156, "wall": 12260.2} {"step": 14247, "train_loss": 3.4379281997680664, "lr": 0.00024883257343054994, "tps": 76128, "wall": 12265.5} {"step": 14248, "train_loss": 3.359443187713623, "lr": 0.0002488136626420653, "tps": 76100, "wall": 12270.9} {"step": 14249, "train_loss": 3.4212520122528076, "lr": 0.0002487947515271779, "tps": 76073, "wall": 12276.1} {"step": 14250, "train_loss": 3.3506078720092773, "lr": 0.00024877584008610194, "tps": 76046, "wall": 12281.4} {"step": 14251, "train_loss": 3.4211549758911133, "lr": 0.00024875692831905177, "tps": 76019, "wall": 12286.6} {"step": 14252, "train_loss": 3.231375217437744, "lr": 0.00024873801622624157, "tps": 75991, "wall": 12291.9} {"step": 14253, "train_loss": 3.3335537910461426, "lr": 0.0002487191038078855, "tps": 75964, "wall": 12297.2} {"step": 14254, "train_loss": 3.4710912704467773, "lr": 0.0002487001910641979, "tps": 75937, "wall": 12302.4} {"step": 14255, "train_loss": 3.4505577087402344, "lr": 0.000248681277995393, "tps": 75910, "wall": 12307.7} {"step": 14256, "train_loss": 3.4301884174346924, "lr": 0.000248662364601685, "tps": 75883, "wall": 12313.0} {"step": 14257, "train_loss": 3.279690742492676, "lr": 0.0002486434508832882, "tps": 75855, "wall": 12318.3} {"step": 14258, "train_loss": 3.4509694576263428, "lr": 0.0002486245368404169, "tps": 75828, "wall": 12323.5} {"step": 14259, "train_loss": 3.397822856903076, "lr": 0.00024860562247328526, "tps": 75801, "wall": 12328.9} {"step": 14260, "train_loss": 3.2628977298736572, "lr": 0.0002485867077821075, "tps": 75773, "wall": 12334.2} {"step": 14261, "train_loss": 3.3488128185272217, "lr": 0.0002485677927670981, "tps": 75746, "wall": 12339.5} {"step": 14262, "train_loss": 3.4028520584106445, "lr": 0.0002485488774284711, "tps": 75719, "wall": 12344.7} {"step": 14263, "train_loss": 3.395071268081665, "lr": 0.0002485299617664409, "tps": 75693, "wall": 12350.0} {"step": 14264, "train_loss": 3.499821662902832, "lr": 0.0002485110457812218, "tps": 75666, "wall": 12355.2} {"step": 14265, "train_loss": 3.3920106887817383, "lr": 0.00024849212947302795, "tps": 75639, "wall": 12360.4} {"step": 14266, "train_loss": 3.3350963592529297, "lr": 0.00024847321284207375, "tps": 75612, "wall": 12365.7} {"step": 14267, "train_loss": 3.388475179672241, "lr": 0.0002484542958885734, "tps": 75585, "wall": 12370.9} {"step": 14268, "train_loss": 3.439692497253418, "lr": 0.00024843537861274134, "tps": 75559, "wall": 12376.2} {"step": 14269, "train_loss": 3.3780007362365723, "lr": 0.00024841646101479177, "tps": 75532, "wall": 12381.4} {"step": 14270, "train_loss": 3.4775800704956055, "lr": 0.0002483975430949389, "tps": 75505, "wall": 12386.7} {"step": 14271, "train_loss": 3.4496750831604004, "lr": 0.0002483786248533972, "tps": 75478, "wall": 12392.0} {"step": 14272, "train_loss": 3.3355305194854736, "lr": 0.0002483597062903809, "tps": 75451, "wall": 12397.3} {"step": 14273, "train_loss": 3.4027514457702637, "lr": 0.00024834078740610424, "tps": 75424, "wall": 12402.5} {"step": 14274, "train_loss": 3.413203239440918, "lr": 0.0002483218682007817, "tps": 75398, "wall": 12407.8} {"step": 14275, "train_loss": 3.307431936264038, "lr": 0.00024830294867462746, "tps": 75371, "wall": 12413.0} {"step": 14276, "train_loss": 3.303952217102051, "lr": 0.00024828402882785594, "tps": 75345, "wall": 12418.3} {"step": 14277, "train_loss": 3.4191150665283203, "lr": 0.0002482651086606813, "tps": 75318, "wall": 12423.6} {"step": 14278, "train_loss": 3.3026113510131836, "lr": 0.0002482461881733181, "tps": 75291, "wall": 12428.8} {"step": 14279, "train_loss": 3.435244560241699, "lr": 0.00024822726736598044, "tps": 75264, "wall": 12434.1} {"step": 14280, "train_loss": 3.3747122287750244, "lr": 0.00024820834623888287, "tps": 75238, "wall": 12439.4} {"step": 14281, "train_loss": 3.316315174102783, "lr": 0.00024818942479223953, "tps": 75212, "wall": 12444.6} {"step": 14282, "train_loss": 3.3967812061309814, "lr": 0.000248170503026265, "tps": 75185, "wall": 12449.9} {"step": 14283, "train_loss": 3.3760054111480713, "lr": 0.00024815158094117337, "tps": 75158, "wall": 12455.2} {"step": 14284, "train_loss": 3.349339008331299, "lr": 0.0002481326585371792, "tps": 75132, "wall": 12460.4} {"step": 14285, "train_loss": 3.45124888420105, "lr": 0.00024811373581449663, "tps": 75105, "wall": 12465.7} {"step": 14286, "train_loss": 3.4005751609802246, "lr": 0.00024809481277334025, "tps": 75079, "wall": 12471.0} {"step": 14287, "train_loss": 3.3519349098205566, "lr": 0.00024807588941392424, "tps": 75052, "wall": 12476.3} {"step": 14288, "train_loss": 3.4299376010894775, "lr": 0.00024805696573646305, "tps": 75026, "wall": 12481.5} {"step": 14289, "train_loss": 3.326539993286133, "lr": 0.0002480380417411711, "tps": 74999, "wall": 12486.8} {"step": 14290, "train_loss": 3.2723069190979004, "lr": 0.0002480191174282626, "tps": 74973, "wall": 12492.1} {"step": 14291, "train_loss": 3.317026138305664, "lr": 0.00024800019279795204, "tps": 74947, "wall": 12497.3} {"step": 14292, "train_loss": 3.4193267822265625, "lr": 0.0002479812678504538, "tps": 74920, "wall": 12502.6} {"step": 14293, "train_loss": 3.360163927078247, "lr": 0.00024796234258598227, "tps": 74894, "wall": 12507.9} {"step": 14294, "train_loss": 3.3964743614196777, "lr": 0.0002479434170047518, "tps": 74868, "wall": 12513.2} {"step": 14295, "train_loss": 3.4252185821533203, "lr": 0.0002479244911069767, "tps": 74842, "wall": 12518.4} {"step": 14296, "train_loss": 3.3622021675109863, "lr": 0.0002479055648928716, "tps": 74816, "wall": 12523.6} {"step": 14297, "train_loss": 3.4174323081970215, "lr": 0.00024788663836265067, "tps": 74789, "wall": 12528.9} {"step": 14298, "train_loss": 3.409773826599121, "lr": 0.00024786771151652845, "tps": 74763, "wall": 12534.1} {"step": 14299, "train_loss": 3.4231362342834473, "lr": 0.0002478487843547192, "tps": 74737, "wall": 12539.4} {"step": 14300, "train_loss": 3.4096524715423584, "lr": 0.00024782985687743747, "tps": 74711, "wall": 12544.7} {"step": 14301, "train_loss": 3.351973533630371, "lr": 0.00024781092908489756, "tps": 74683, "wall": 12550.2} {"step": 14302, "train_loss": 3.306882858276367, "lr": 0.000247792000977314, "tps": 74657, "wall": 12555.5} {"step": 14303, "train_loss": 3.366722822189331, "lr": 0.0002477730725549011, "tps": 74631, "wall": 12560.7} {"step": 14304, "train_loss": 3.3242223262786865, "lr": 0.0002477541438178734, "tps": 74605, "wall": 12566.0} {"step": 14305, "train_loss": 3.436829090118408, "lr": 0.0002477352147664452, "tps": 74578, "wall": 12571.4} {"step": 14306, "train_loss": 3.40230655670166, "lr": 0.00024771628540083105, "tps": 74552, "wall": 12576.6} {"step": 14307, "train_loss": 3.3912148475646973, "lr": 0.0002476973557212453, "tps": 74526, "wall": 12581.9} {"step": 14308, "train_loss": 3.352360963821411, "lr": 0.00024767842572790235, "tps": 74501, "wall": 12587.1} {"step": 14309, "train_loss": 3.4775285720825195, "lr": 0.0002476594954210167, "tps": 74475, "wall": 12592.4} {"step": 14310, "train_loss": 3.3454670906066895, "lr": 0.00024764056480080284, "tps": 74448, "wall": 12597.7} {"step": 14311, "train_loss": 3.352429151535034, "lr": 0.00024762163386747517, "tps": 74422, "wall": 12603.0} {"step": 14312, "train_loss": 3.3498215675354004, "lr": 0.0002476027026212481, "tps": 74396, "wall": 12608.3} {"step": 14313, "train_loss": 3.382753372192383, "lr": 0.0002475837710623361, "tps": 74370, "wall": 12613.6} {"step": 14314, "train_loss": 3.396937370300293, "lr": 0.0002475648391909537, "tps": 74344, "wall": 12618.9} {"step": 14315, "train_loss": 3.423858165740967, "lr": 0.0002475459070073153, "tps": 74318, "wall": 12624.2} {"step": 14316, "train_loss": 3.4544501304626465, "lr": 0.0002475269745116354, "tps": 74292, "wall": 12629.5} {"step": 14317, "train_loss": 3.3597445487976074, "lr": 0.00024750804170412834, "tps": 74266, "wall": 12634.8} {"step": 14318, "train_loss": 3.4527435302734375, "lr": 0.0002474891085850088, "tps": 74241, "wall": 12640.0} {"step": 14319, "train_loss": 3.440774917602539, "lr": 0.00024747017515449113, "tps": 74215, "wall": 12645.4} {"step": 14320, "train_loss": 3.3027820587158203, "lr": 0.0002474512414127898, "tps": 74189, "wall": 12650.6} {"step": 14321, "train_loss": 3.352891206741333, "lr": 0.00024743230736011936, "tps": 74163, "wall": 12655.9} {"step": 14322, "train_loss": 3.440937042236328, "lr": 0.0002474133729966942, "tps": 74137, "wall": 12661.2} {"step": 14323, "train_loss": 3.3645715713500977, "lr": 0.0002473944383227289, "tps": 74112, "wall": 12666.4} {"step": 14324, "train_loss": 3.4165334701538086, "lr": 0.00024737550333843797, "tps": 74086, "wall": 12671.7} {"step": 14325, "train_loss": 3.3779520988464355, "lr": 0.00024735656804403575, "tps": 74060, "wall": 12677.0} {"step": 14326, "train_loss": 3.430701732635498, "lr": 0.000247337632439737, "tps": 74035, "wall": 12682.3} {"step": 14327, "train_loss": 3.3287100791931152, "lr": 0.00024731869652575597, "tps": 74009, "wall": 12687.5} {"step": 14328, "train_loss": 3.3990025520324707, "lr": 0.00024729976030230726, "tps": 73983, "wall": 12692.9} {"step": 14329, "train_loss": 3.457017421722412, "lr": 0.00024728082376960543, "tps": 73958, "wall": 12698.2} {"step": 14330, "train_loss": 3.370270252227783, "lr": 0.0002472618869278649, "tps": 73932, "wall": 12703.4} {"step": 14331, "train_loss": 3.344176769256592, "lr": 0.00024724294977730027, "tps": 73907, "wall": 12708.7} {"step": 14332, "train_loss": 3.390486717224121, "lr": 0.000247224012318126, "tps": 73881, "wall": 12714.0} {"step": 14333, "train_loss": 3.358821153640747, "lr": 0.00024720507455055677, "tps": 73855, "wall": 12719.3} {"step": 14334, "train_loss": 3.343308687210083, "lr": 0.00024718613647480687, "tps": 73830, "wall": 12724.5} {"step": 14335, "train_loss": 3.3110060691833496, "lr": 0.0002471671980910909, "tps": 73804, "wall": 12729.9} {"step": 14336, "train_loss": 3.3606057167053223, "lr": 0.0002471482593996235, "tps": 73778, "wall": 12735.2} {"step": 14337, "train_loss": 3.403911590576172, "lr": 0.0002471293204006192, "tps": 73753, "wall": 12740.5} {"step": 14338, "train_loss": 3.372258424758911, "lr": 0.00024711038109429245, "tps": 73728, "wall": 12745.8} {"step": 14339, "train_loss": 3.4236021041870117, "lr": 0.00024709144148085785, "tps": 73702, "wall": 12751.2} {"step": 14340, "train_loss": 3.430433750152588, "lr": 0.00024707250156052985, "tps": 73676, "wall": 12756.4} {"step": 14341, "train_loss": 3.3055343627929688, "lr": 0.0002470535613335232, "tps": 73651, "wall": 12761.7} {"step": 14342, "train_loss": 3.348940134048462, "lr": 0.0002470346208000523, "tps": 73626, "wall": 12767.0} {"step": 14343, "train_loss": 3.3698859214782715, "lr": 0.00024701567996033175, "tps": 73600, "wall": 12772.3} {"step": 14344, "train_loss": 3.449751615524292, "lr": 0.0002469967388145761, "tps": 73575, "wall": 12777.6} {"step": 14345, "train_loss": 3.4590001106262207, "lr": 0.00024697779736299996, "tps": 73549, "wall": 12782.9} {"step": 14346, "train_loss": 3.405210018157959, "lr": 0.0002469588556058179, "tps": 73524, "wall": 12788.1} {"step": 14347, "train_loss": 3.314301013946533, "lr": 0.0002469399135432444, "tps": 73499, "wall": 12793.4} {"step": 14348, "train_loss": 3.4243288040161133, "lr": 0.00024692097117549416, "tps": 73474, "wall": 12798.7} {"step": 14349, "train_loss": 3.387864589691162, "lr": 0.00024690202850278164, "tps": 73448, "wall": 12804.0} {"step": 14350, "train_loss": 3.390854597091675, "lr": 0.0002468830855253215, "tps": 73423, "wall": 12809.4} {"step": 14351, "train_loss": 3.3400092124938965, "lr": 0.00024686414224332835, "tps": 73397, "wall": 12814.7} {"step": 14352, "train_loss": 3.4116101264953613, "lr": 0.0002468451986570167, "tps": 73372, "wall": 12820.0} {"step": 14353, "train_loss": 3.313640832901001, "lr": 0.0002468262547666012, "tps": 73347, "wall": 12825.3} {"step": 14354, "train_loss": 3.3961892127990723, "lr": 0.0002468073105722965, "tps": 73322, "wall": 12830.7} {"step": 14355, "train_loss": 3.390805244445801, "lr": 0.0002467883660743171, "tps": 73296, "wall": 12835.9} {"step": 14356, "train_loss": 3.394810676574707, "lr": 0.00024676942127287757, "tps": 73271, "wall": 12841.2} {"step": 14357, "train_loss": 3.3094677925109863, "lr": 0.00024675047616819267, "tps": 73246, "wall": 12846.5} {"step": 14358, "train_loss": 3.4032509326934814, "lr": 0.00024673153076047684, "tps": 73221, "wall": 12851.8} {"step": 14359, "train_loss": 3.2972328662872314, "lr": 0.00024671258504994486, "tps": 73196, "wall": 12857.1} {"step": 14360, "train_loss": 3.501394033432007, "lr": 0.0002466936390368113, "tps": 73171, "wall": 12862.4} {"step": 14361, "train_loss": 3.2865405082702637, "lr": 0.00024667469272129065, "tps": 73146, "wall": 12867.7} {"step": 14362, "train_loss": 3.332336664199829, "lr": 0.0002466557461035977, "tps": 73121, "wall": 12873.0} {"step": 14363, "train_loss": 3.323916435241699, "lr": 0.000246636799183947, "tps": 73096, "wall": 12878.3} {"step": 14364, "train_loss": 3.414217948913574, "lr": 0.0002466178519625532, "tps": 73071, "wall": 12883.6} {"step": 14365, "train_loss": 3.366927146911621, "lr": 0.00024659890443963094, "tps": 73046, "wall": 12888.9} {"step": 14366, "train_loss": 3.3705976009368896, "lr": 0.00024657995661539483, "tps": 73021, "wall": 12894.2} {"step": 14367, "train_loss": 3.4968302249908447, "lr": 0.00024656100849005963, "tps": 72996, "wall": 12899.5} {"step": 14368, "train_loss": 3.395747661590576, "lr": 0.00024654206006383985, "tps": 72972, "wall": 12904.7} {"step": 14369, "train_loss": 3.3101720809936523, "lr": 0.00024652311133695014, "tps": 72947, "wall": 12910.0} {"step": 14370, "train_loss": 3.304987668991089, "lr": 0.00024650416230960514, "tps": 72922, "wall": 12915.3} {"step": 14371, "train_loss": 3.4638919830322266, "lr": 0.00024648521298201967, "tps": 72898, "wall": 12920.6} {"step": 14372, "train_loss": 3.4494028091430664, "lr": 0.0002464662633544082, "tps": 72873, "wall": 12925.9} {"step": 14373, "train_loss": 3.488745927810669, "lr": 0.00024644731342698544, "tps": 72847, "wall": 12931.3} {"step": 14374, "train_loss": 3.3069586753845215, "lr": 0.0002464283631999662, "tps": 72823, "wall": 12936.5} {"step": 14375, "train_loss": 3.4273276329040527, "lr": 0.0002464094126735649, "tps": 72798, "wall": 12941.8} {"step": 14376, "train_loss": 3.284245729446411, "lr": 0.00024639046184799635, "tps": 72773, "wall": 12947.1} {"step": 14377, "train_loss": 3.411722421646118, "lr": 0.0002463715107234753, "tps": 72749, "wall": 12952.4} {"step": 14378, "train_loss": 3.4096031188964844, "lr": 0.0002463525593002163, "tps": 72724, "wall": 12957.7} {"step": 14379, "train_loss": 3.324720859527588, "lr": 0.0002463336075784341, "tps": 72699, "wall": 12963.0} {"step": 14380, "train_loss": 3.413677215576172, "lr": 0.00024631465555834337, "tps": 72675, "wall": 12968.3} {"step": 14381, "train_loss": 3.4566071033477783, "lr": 0.00024629570324015887, "tps": 72650, "wall": 12973.6} {"step": 14382, "train_loss": 3.463941812515259, "lr": 0.0002462767506240951, "tps": 72625, "wall": 12978.9} {"step": 14383, "train_loss": 3.4207582473754883, "lr": 0.00024625779771036694, "tps": 72601, "wall": 12984.2} {"step": 14384, "train_loss": 3.446409225463867, "lr": 0.000246238844499189, "tps": 72576, "wall": 12989.5} {"step": 14385, "train_loss": 3.4471123218536377, "lr": 0.000246219890990776, "tps": 72552, "wall": 12994.8} {"step": 14386, "train_loss": 3.447838068008423, "lr": 0.0002462009371853427, "tps": 72527, "wall": 13000.0} {"step": 14387, "train_loss": 3.337010383605957, "lr": 0.00024618198308310374, "tps": 72503, "wall": 13005.4} {"step": 14388, "train_loss": 3.389491558074951, "lr": 0.00024616302868427385, "tps": 72479, "wall": 13010.6} {"step": 14389, "train_loss": 3.3652474880218506, "lr": 0.00024614407398906775, "tps": 72454, "wall": 13015.9} {"step": 14390, "train_loss": 3.4101171493530273, "lr": 0.00024612511899770024, "tps": 72430, "wall": 13021.1} {"step": 14391, "train_loss": 3.4549405574798584, "lr": 0.0002461061637103859, "tps": 72406, "wall": 13026.4} {"step": 14392, "train_loss": 3.5308008193969727, "lr": 0.00024608720812733956, "tps": 72382, "wall": 13031.7} {"step": 14393, "train_loss": 3.3934097290039062, "lr": 0.00024606825224877585, "tps": 72357, "wall": 13036.9} {"step": 14394, "train_loss": 3.29496431350708, "lr": 0.0002460492960749097, "tps": 72333, "wall": 13042.2} {"step": 14395, "train_loss": 3.483407735824585, "lr": 0.00024603033960595555, "tps": 72309, "wall": 13047.5} {"step": 14396, "train_loss": 3.3320276737213135, "lr": 0.0002460113828421284, "tps": 72284, "wall": 13052.8} {"step": 14397, "train_loss": 3.3928732872009277, "lr": 0.0002459924257836428, "tps": 72260, "wall": 13058.1} {"step": 14398, "train_loss": 3.353865146636963, "lr": 0.00024597346843071373, "tps": 72236, "wall": 13063.4} {"step": 14399, "train_loss": 3.2634615898132324, "lr": 0.0002459545107835558, "tps": 72212, "wall": 13068.7} {"step": 14400, "train_loss": 3.30491304397583, "lr": 0.00024593555284238366, "tps": 72188, "wall": 13073.9} {"step": 14401, "train_loss": 3.4793906211853027, "lr": 0.0002459165946074123, "tps": 72164, "wall": 13079.2} {"step": 14402, "train_loss": 3.4028823375701904, "lr": 0.0002458976360788563, "tps": 72140, "wall": 13084.5} {"step": 14403, "train_loss": 3.407839298248291, "lr": 0.00024587867725693043, "tps": 72116, "wall": 13089.7} {"step": 14404, "train_loss": 3.360610008239746, "lr": 0.0002458597181418495, "tps": 72091, "wall": 13095.0} {"step": 14405, "train_loss": 3.499344825744629, "lr": 0.00024584075873382836, "tps": 72068, "wall": 13100.3} {"step": 14406, "train_loss": 3.3294014930725098, "lr": 0.00024582179903308163, "tps": 72043, "wall": 13105.6} {"step": 14407, "train_loss": 3.4200010299682617, "lr": 0.0002458028390398242, "tps": 72019, "wall": 13110.9} {"step": 14408, "train_loss": 3.435479164123535, "lr": 0.0002457838787542708, "tps": 71995, "wall": 13116.2} {"step": 14409, "train_loss": 3.424846649169922, "lr": 0.00024576491817663627, "tps": 71971, "wall": 13121.4} {"step": 14410, "train_loss": 3.3747401237487793, "lr": 0.0002457459573071353, "tps": 71948, "wall": 13126.7} {"step": 14411, "train_loss": 3.3948135375976562, "lr": 0.0002457269961459828, "tps": 71924, "wall": 13132.0} {"step": 14412, "train_loss": 3.270486831665039, "lr": 0.0002457080346933935, "tps": 71900, "wall": 13137.2} {"step": 14413, "train_loss": 3.2550745010375977, "lr": 0.0002456890729495821, "tps": 71876, "wall": 13142.5} {"step": 14414, "train_loss": 3.356649875640869, "lr": 0.0002456701109147635, "tps": 71852, "wall": 13147.7} {"step": 14415, "train_loss": 3.503591537475586, "lr": 0.0002456511485891526, "tps": 71829, "wall": 13153.0} {"step": 14416, "train_loss": 3.433746337890625, "lr": 0.00024563218597296394, "tps": 71805, "wall": 13158.3} {"step": 14417, "train_loss": 3.3963022232055664, "lr": 0.0002456132230664126, "tps": 71781, "wall": 13163.5} {"step": 14418, "train_loss": 3.40681529045105, "lr": 0.00024559425986971333, "tps": 71757, "wall": 13168.8} {"step": 14419, "train_loss": 3.290666341781616, "lr": 0.00024557529638308083, "tps": 71733, "wall": 13174.1} {"step": 14420, "train_loss": 3.330927848815918, "lr": 0.00024555633260673, "tps": 71710, "wall": 13179.4} {"step": 14421, "train_loss": 3.3625214099884033, "lr": 0.0002455373685408757, "tps": 71686, "wall": 13184.7} {"step": 14422, "train_loss": 3.4618911743164062, "lr": 0.00024551840418573264, "tps": 71662, "wall": 13189.9} {"step": 14423, "train_loss": 3.543734550476074, "lr": 0.00024549943954151564, "tps": 71639, "wall": 13195.2} {"step": 14424, "train_loss": 3.4369614124298096, "lr": 0.00024548047460843975, "tps": 71615, "wall": 13200.4} {"step": 14425, "train_loss": 3.372836112976074, "lr": 0.00024546150938671964, "tps": 71591, "wall": 13205.7} {"step": 14426, "train_loss": 3.3662524223327637, "lr": 0.00024544254387657015, "tps": 71568, "wall": 13211.0} {"step": 14427, "train_loss": 3.4616758823394775, "lr": 0.00024542357807820606, "tps": 71544, "wall": 13216.3} {"step": 14428, "train_loss": 3.4290666580200195, "lr": 0.00024540461199184247, "tps": 71520, "wall": 13221.6} {"step": 14429, "train_loss": 3.3799731731414795, "lr": 0.00024538564561769395, "tps": 71497, "wall": 13226.9} {"step": 14430, "train_loss": 3.319521903991699, "lr": 0.0002453666789559755, "tps": 71473, "wall": 13232.2} {"step": 14431, "train_loss": 3.4006152153015137, "lr": 0.00024534771200690193, "tps": 71449, "wall": 13237.5} {"step": 14432, "train_loss": 3.3710227012634277, "lr": 0.0002453287447706881, "tps": 71426, "wall": 13242.7} {"step": 14433, "train_loss": 3.424293279647827, "lr": 0.0002453097772475489, "tps": 71403, "wall": 13248.0} {"step": 14434, "train_loss": 3.3625364303588867, "lr": 0.0002452908094376991, "tps": 71379, "wall": 13253.2} {"step": 14435, "train_loss": 3.435502767562866, "lr": 0.00024527184134135377, "tps": 71356, "wall": 13258.5} {"step": 14436, "train_loss": 3.264876365661621, "lr": 0.0002452528729587276, "tps": 71333, "wall": 13263.7} {"step": 14437, "train_loss": 3.3920087814331055, "lr": 0.0002452339042900355, "tps": 71309, "wall": 13269.0} {"step": 14438, "train_loss": 3.444547414779663, "lr": 0.0002452149353354924, "tps": 71286, "wall": 13274.2} {"step": 14439, "train_loss": 3.414412498474121, "lr": 0.0002451959660953131, "tps": 71263, "wall": 13279.5} {"step": 14440, "train_loss": 3.3383548259735107, "lr": 0.00024517699656971255, "tps": 71240, "wall": 13284.7} {"step": 14441, "train_loss": 3.4365696907043457, "lr": 0.0002451580267589056, "tps": 71216, "wall": 13290.1} {"step": 14442, "train_loss": 3.369105577468872, "lr": 0.0002451390566631072, "tps": 71193, "wall": 13295.3} {"step": 14443, "train_loss": 3.399293899536133, "lr": 0.00024512008628253226, "tps": 71170, "wall": 13300.6} {"step": 14444, "train_loss": 3.460597515106201, "lr": 0.00024510111561739544, "tps": 71146, "wall": 13305.8} {"step": 14445, "train_loss": 3.3119757175445557, "lr": 0.000245082144667912, "tps": 71123, "wall": 13311.1} {"step": 14446, "train_loss": 3.429960250854492, "lr": 0.0002450631734342966, "tps": 71100, "wall": 13316.4} {"step": 14447, "train_loss": 3.412353515625, "lr": 0.00024504420191676427, "tps": 71076, "wall": 13321.7} {"step": 14448, "train_loss": 3.4171695709228516, "lr": 0.00024502523011552983, "tps": 71053, "wall": 13327.0} {"step": 14449, "train_loss": 3.478794813156128, "lr": 0.00024500625803080823, "tps": 71030, "wall": 13332.2} {"step": 14450, "train_loss": 3.2981066703796387, "lr": 0.00024498728566281437, "tps": 71007, "wall": 13337.5} {"step": 14451, "train_loss": 3.4016592502593994, "lr": 0.00024496831301176313, "tps": 70984, "wall": 13342.8} {"step": 14452, "train_loss": 3.3438377380371094, "lr": 0.0002449493400778697, "tps": 70961, "wall": 13348.0} {"step": 14453, "train_loss": 3.3808822631835938, "lr": 0.0002449303668613486, "tps": 70937, "wall": 13353.4} {"step": 14454, "train_loss": 3.43119740486145, "lr": 0.00024491139336241496, "tps": 70914, "wall": 13358.6} {"step": 14455, "train_loss": 3.3480963706970215, "lr": 0.00024489241958128375, "tps": 70891, "wall": 13363.9} {"step": 14456, "train_loss": 3.3809685707092285, "lr": 0.00024487344551816993, "tps": 70868, "wall": 13369.2} {"step": 14457, "train_loss": 3.357142925262451, "lr": 0.00024485447117328824, "tps": 70845, "wall": 13374.4} {"step": 14458, "train_loss": 3.463918924331665, "lr": 0.0002448354965468538, "tps": 70823, "wall": 13379.6} {"step": 14459, "train_loss": 3.492401599884033, "lr": 0.0002448165216390816, "tps": 70800, "wall": 13384.9} {"step": 14460, "train_loss": 3.310382604598999, "lr": 0.00024479754645018647, "tps": 70777, "wall": 13390.1} {"step": 14461, "train_loss": 3.3711299896240234, "lr": 0.00024477857098038333, "tps": 70754, "wall": 13395.4} {"step": 14462, "train_loss": 3.3518013954162598, "lr": 0.0002447595952298872, "tps": 70731, "wall": 13400.6} {"step": 14463, "train_loss": 3.307813882827759, "lr": 0.00024474061919891314, "tps": 70708, "wall": 13405.8} {"step": 14464, "train_loss": 3.448319911956787, "lr": 0.0002447216428876759, "tps": 70685, "wall": 13411.2} {"step": 14465, "train_loss": 3.439037799835205, "lr": 0.00024470266629639053, "tps": 70662, "wall": 13416.5} {"step": 14466, "train_loss": 3.3831136226654053, "lr": 0.0002446836894252722, "tps": 70639, "wall": 13421.8} {"step": 14467, "train_loss": 3.355759859085083, "lr": 0.0002446647122745355, "tps": 70617, "wall": 13427.0} {"step": 14468, "train_loss": 3.393380641937256, "lr": 0.00024464573484439566, "tps": 70594, "wall": 13432.3} {"step": 14469, "train_loss": 3.451866626739502, "lr": 0.0002446267571350677, "tps": 70571, "wall": 13437.5} {"step": 14470, "train_loss": 3.462582588195801, "lr": 0.0002446077791467664, "tps": 70548, "wall": 13442.8} {"step": 14471, "train_loss": 3.467266082763672, "lr": 0.0002445888008797068, "tps": 70526, "wall": 13448.0} {"step": 14472, "train_loss": 3.5141286849975586, "lr": 0.000244569822334104, "tps": 70503, "wall": 13453.3} {"step": 14473, "train_loss": 3.3734796047210693, "lr": 0.00024455084351017296, "tps": 70480, "wall": 13458.6} {"step": 14474, "train_loss": 3.4309303760528564, "lr": 0.0002445318644081286, "tps": 70457, "wall": 13463.9} {"step": 14475, "train_loss": 3.39058256149292, "lr": 0.00024451288502818594, "tps": 70434, "wall": 13469.2} {"step": 14476, "train_loss": 3.3980860710144043, "lr": 0.00024449390537056, "tps": 70412, "wall": 13474.5} {"step": 14477, "train_loss": 3.4461326599121094, "lr": 0.00024447492543546584, "tps": 70389, "wall": 13479.7} {"step": 14478, "train_loss": 3.4721102714538574, "lr": 0.00024445594522311834, "tps": 70366, "wall": 13485.0} {"step": 14479, "train_loss": 3.396364688873291, "lr": 0.00024443696473373257, "tps": 70344, "wall": 13490.2} {"step": 14480, "train_loss": 3.3543896675109863, "lr": 0.0002444179839675236, "tps": 70321, "wall": 13495.5} {"step": 14481, "train_loss": 3.436720371246338, "lr": 0.00024439900292470623, "tps": 70299, "wall": 13500.7} {"step": 14482, "train_loss": 3.387316942214966, "lr": 0.00024438002160549575, "tps": 70276, "wall": 13506.0} {"step": 14483, "train_loss": 3.347379684448242, "lr": 0.0002443610400101071, "tps": 70254, "wall": 13511.2} {"step": 14484, "train_loss": 3.265854835510254, "lr": 0.0002443420581387552, "tps": 70231, "wall": 13516.5} {"step": 14485, "train_loss": 3.4145257472991943, "lr": 0.0002443230759916552, "tps": 70209, "wall": 13521.7} {"step": 14486, "train_loss": 3.418667793273926, "lr": 0.00024430409356902203, "tps": 70187, "wall": 13527.0} {"step": 14487, "train_loss": 3.3627829551696777, "lr": 0.0002442851108710708, "tps": 70164, "wall": 13532.3} {"step": 14488, "train_loss": 3.457446336746216, "lr": 0.0002442661278980165, "tps": 70141, "wall": 13537.6} {"step": 14489, "train_loss": 3.2916688919067383, "lr": 0.0002442471446500742, "tps": 70119, "wall": 13542.8} {"step": 14490, "train_loss": 3.2395076751708984, "lr": 0.000244228161127459, "tps": 70097, "wall": 13548.1} {"step": 14491, "train_loss": 3.372147798538208, "lr": 0.0002442091773303858, "tps": 70074, "wall": 13553.4} {"step": 14492, "train_loss": 3.3461716175079346, "lr": 0.00024419019325906975, "tps": 70052, "wall": 13558.6} {"step": 14493, "train_loss": 3.391090154647827, "lr": 0.0002441712089137259, "tps": 70030, "wall": 13563.8} {"step": 14494, "train_loss": 3.4146008491516113, "lr": 0.0002441522242945693, "tps": 70008, "wall": 13569.1} {"step": 14495, "train_loss": 3.3439226150512695, "lr": 0.0002441332394018149, "tps": 69985, "wall": 13574.3} {"step": 14496, "train_loss": 3.317531108856201, "lr": 0.00024411425423567792, "tps": 69963, "wall": 13579.6} {"step": 14497, "train_loss": 3.3317649364471436, "lr": 0.0002440952687963734, "tps": 69941, "wall": 13584.9} {"step": 14498, "train_loss": 3.409968137741089, "lr": 0.00024407628308411634, "tps": 69918, "wall": 13590.2} {"step": 14499, "train_loss": 3.3938913345336914, "lr": 0.0002440572970991218, "tps": 69896, "wall": 13595.4} {"step": 14500, "train_loss": 3.400226593017578, "lr": 0.00024403831084160498, "tps": 69874, "wall": 13600.7} {"step": 14501, "train_loss": 3.3269474506378174, "lr": 0.00024401932431178085, "tps": 69851, "wall": 13606.1} {"step": 14502, "train_loss": 3.4219396114349365, "lr": 0.00024400033750986445, "tps": 69828, "wall": 13611.4} {"step": 14503, "train_loss": 3.410958766937256, "lr": 0.00024398135043607102, "tps": 69806, "wall": 13616.7} {"step": 14504, "train_loss": 3.3976540565490723, "lr": 0.0002439623630906155, "tps": 69784, "wall": 13622.0} {"step": 14505, "train_loss": 3.394721031188965, "lr": 0.00024394337547371304, "tps": 69762, "wall": 13627.2} {"step": 14506, "train_loss": 3.438755512237549, "lr": 0.00024392438758557875, "tps": 69740, "wall": 13632.5} {"step": 14507, "train_loss": 3.382406711578369, "lr": 0.00024390539942642766, "tps": 69718, "wall": 13637.7} {"step": 14508, "train_loss": 3.292433261871338, "lr": 0.00024388641099647496, "tps": 69695, "wall": 13643.0} {"step": 14509, "train_loss": 3.4769186973571777, "lr": 0.00024386742229593568, "tps": 69673, "wall": 13648.3} {"step": 14510, "train_loss": 3.3997225761413574, "lr": 0.00024384843332502496, "tps": 69651, "wall": 13653.6} {"step": 14511, "train_loss": 3.3426637649536133, "lr": 0.00024382944408395788, "tps": 69629, "wall": 13658.8} {"step": 14512, "train_loss": 3.430666923522949, "lr": 0.00024381045457294955, "tps": 69607, "wall": 13664.1} {"step": 14513, "train_loss": 3.350494861602783, "lr": 0.00024379146479221512, "tps": 69585, "wall": 13669.3} {"step": 14514, "train_loss": 3.2817604541778564, "lr": 0.0002437724747419697, "tps": 69563, "wall": 13674.6} {"step": 14515, "train_loss": 3.402477502822876, "lr": 0.00024375348442242842, "tps": 69541, "wall": 13679.8} {"step": 14516, "train_loss": 3.3940799236297607, "lr": 0.00024373449383380632, "tps": 69520, "wall": 13685.0} {"step": 14517, "train_loss": 3.3641910552978516, "lr": 0.0002437155029763187, "tps": 69498, "wall": 13690.3} {"step": 14518, "train_loss": 3.3399455547332764, "lr": 0.00024369651185018046, "tps": 69476, "wall": 13695.5} {"step": 14519, "train_loss": 3.43133807182312, "lr": 0.00024367752045560695, "tps": 69454, "wall": 13700.8} {"step": 14520, "train_loss": 3.3600168228149414, "lr": 0.00024365852879281317, "tps": 69432, "wall": 13706.0} {"step": 14521, "train_loss": 3.3541793823242188, "lr": 0.00024363953686201427, "tps": 69410, "wall": 13711.3} {"step": 14522, "train_loss": 3.399442672729492, "lr": 0.00024362054466342542, "tps": 69388, "wall": 13716.6} {"step": 14523, "train_loss": 3.4142045974731445, "lr": 0.00024360155219726185, "tps": 69367, "wall": 13721.9} {"step": 14524, "train_loss": 3.431011915206909, "lr": 0.00024358255946373847, "tps": 69345, "wall": 13727.1} {"step": 14525, "train_loss": 3.4279685020446777, "lr": 0.00024356356646307065, "tps": 69323, "wall": 13732.4} {"step": 14526, "train_loss": 3.3708724975585938, "lr": 0.00024354457319547348, "tps": 69301, "wall": 13737.6} {"step": 14527, "train_loss": 3.3924672603607178, "lr": 0.00024352557966116214, "tps": 69280, "wall": 13742.8} {"step": 14528, "train_loss": 3.458858013153076, "lr": 0.0002435065858603517, "tps": 69258, "wall": 13748.1} {"step": 14529, "train_loss": 3.3209643363952637, "lr": 0.00024348759179325743, "tps": 69236, "wall": 13753.3} {"step": 14530, "train_loss": 3.4443135261535645, "lr": 0.0002434685974600945, "tps": 69215, "wall": 13758.6} {"step": 14531, "train_loss": 3.4263906478881836, "lr": 0.00024344960286107795, "tps": 69193, "wall": 13763.8} {"step": 14532, "train_loss": 3.3842568397521973, "lr": 0.00024343060799642297, "tps": 69171, "wall": 13769.1} {"step": 14533, "train_loss": 3.290569305419922, "lr": 0.00024341161286634493, "tps": 69150, "wall": 13774.3} {"step": 14534, "train_loss": 3.37740159034729, "lr": 0.00024339261747105884, "tps": 69128, "wall": 13779.6} {"step": 14535, "train_loss": 3.354825973510742, "lr": 0.00024337362181077983, "tps": 69107, "wall": 13784.8} {"step": 14536, "train_loss": 3.3858439922332764, "lr": 0.00024335462588572326, "tps": 69086, "wall": 13790.0} {"step": 14537, "train_loss": 3.4235637187957764, "lr": 0.0002433356296961042, "tps": 69064, "wall": 13795.2} {"step": 14538, "train_loss": 3.4272780418395996, "lr": 0.00024331663324213788, "tps": 69043, "wall": 13800.4} {"step": 14539, "train_loss": 3.317760705947876, "lr": 0.00024329763652403946, "tps": 69021, "wall": 13805.7} {"step": 14540, "train_loss": 3.3973846435546875, "lr": 0.00024327863954202409, "tps": 69000, "wall": 13810.9} {"step": 14541, "train_loss": 3.2662901878356934, "lr": 0.0002432596422963071, "tps": 68979, "wall": 13816.1} {"step": 14542, "train_loss": 3.387960195541382, "lr": 0.00024324064478710363, "tps": 68957, "wall": 13821.3} {"step": 14543, "train_loss": 3.4827632904052734, "lr": 0.00024322164701462887, "tps": 68936, "wall": 13826.6} {"step": 14544, "train_loss": 3.4439239501953125, "lr": 0.00024320264897909803, "tps": 68914, "wall": 13831.9} {"step": 14545, "train_loss": 3.512521266937256, "lr": 0.0002431836506807263, "tps": 68893, "wall": 13837.1} {"step": 14546, "train_loss": 3.300872325897217, "lr": 0.0002431646521197289, "tps": 68872, "wall": 13842.4} {"step": 14547, "train_loss": 3.449770927429199, "lr": 0.00024314565329632112, "tps": 68850, "wall": 13847.6} {"step": 14548, "train_loss": 3.3115086555480957, "lr": 0.00024312665421071815, "tps": 68829, "wall": 13852.8} {"step": 14549, "train_loss": 3.4790496826171875, "lr": 0.00024310765486313516, "tps": 68808, "wall": 13858.1} {"step": 14550, "train_loss": 3.394887685775757, "lr": 0.0002430886552537874, "tps": 68786, "wall": 13863.3} {"step": 14551, "train_loss": 3.321823835372925, "lr": 0.00024306965538289013, "tps": 68765, "wall": 13868.5} {"step": 14552, "train_loss": 3.4403839111328125, "lr": 0.0002430506552506585, "tps": 68744, "wall": 13873.8} {"step": 14553, "train_loss": 3.3406972885131836, "lr": 0.0002430316548573078, "tps": 68722, "wall": 13879.1} {"step": 14554, "train_loss": 3.455049514770508, "lr": 0.00024301265420305338, "tps": 68701, "wall": 13884.3} {"step": 14555, "train_loss": 3.4305858612060547, "lr": 0.00024299365328811026, "tps": 68680, "wall": 13889.6} {"step": 14556, "train_loss": 3.3597750663757324, "lr": 0.00024297465211269378, "tps": 68658, "wall": 13894.9} {"step": 14557, "train_loss": 3.362175941467285, "lr": 0.00024295565067701923, "tps": 68637, "wall": 13900.1} {"step": 14558, "train_loss": 3.3463497161865234, "lr": 0.0002429366489813019, "tps": 68616, "wall": 13905.4} {"step": 14559, "train_loss": 3.290299654006958, "lr": 0.00024291764702575686, "tps": 68595, "wall": 13910.7} {"step": 14560, "train_loss": 3.3420450687408447, "lr": 0.00024289864481059952, "tps": 68574, "wall": 13915.9} {"step": 14561, "train_loss": 3.389538049697876, "lr": 0.00024287964233604516, "tps": 68552, "wall": 13921.1} {"step": 14562, "train_loss": 3.4753663539886475, "lr": 0.0002428606396023089, "tps": 68531, "wall": 13926.4} {"step": 14563, "train_loss": 3.362929344177246, "lr": 0.00024284163660960603, "tps": 68510, "wall": 13931.6} {"step": 14564, "train_loss": 3.394733190536499, "lr": 0.00024282263335815194, "tps": 68489, "wall": 13936.9} {"step": 14565, "train_loss": 3.412923574447632, "lr": 0.00024280362984816184, "tps": 68468, "wall": 13942.1} {"step": 14566, "train_loss": 3.424651622772217, "lr": 0.00024278462607985093, "tps": 68447, "wall": 13947.3} {"step": 14567, "train_loss": 3.401017427444458, "lr": 0.00024276562205343454, "tps": 68426, "wall": 13952.6} {"step": 14568, "train_loss": 3.4434783458709717, "lr": 0.000242746617769128, "tps": 68405, "wall": 13957.9} {"step": 14569, "train_loss": 3.424952983856201, "lr": 0.0002427276132271465, "tps": 68384, "wall": 13963.1} {"step": 14570, "train_loss": 3.369178295135498, "lr": 0.0002427086084277054, "tps": 68363, "wall": 13968.3} {"step": 14571, "train_loss": 3.415872097015381, "lr": 0.00024268960337101993, "tps": 68342, "wall": 13973.6} {"step": 14572, "train_loss": 3.29843807220459, "lr": 0.00024267059805730545, "tps": 68321, "wall": 13978.8} {"step": 14573, "train_loss": 3.4850568771362305, "lr": 0.00024265159248677715, "tps": 68301, "wall": 13984.0} {"step": 14574, "train_loss": 3.4141812324523926, "lr": 0.00024263258665965044, "tps": 68280, "wall": 13989.2} {"step": 14575, "train_loss": 3.353192090988159, "lr": 0.00024261358057614055, "tps": 68259, "wall": 13994.5} {"step": 14576, "train_loss": 3.353235960006714, "lr": 0.00024259457423646277, "tps": 68238, "wall": 13999.7} {"step": 14577, "train_loss": 3.3479204177856445, "lr": 0.00024257556764083237, "tps": 68217, "wall": 14005.0} {"step": 14578, "train_loss": 3.3634138107299805, "lr": 0.00024255656078946486, "tps": 68196, "wall": 14010.3} {"step": 14579, "train_loss": 3.3558692932128906, "lr": 0.00024253755368257532, "tps": 68175, "wall": 14015.5} {"step": 14580, "train_loss": 3.343487501144409, "lr": 0.00024251854632037918, "tps": 68154, "wall": 14020.7} {"step": 14581, "train_loss": 3.3924484252929688, "lr": 0.00024249953870309173, "tps": 68134, "wall": 14025.9} {"step": 14582, "train_loss": 3.4550559520721436, "lr": 0.00024248053083092828, "tps": 68113, "wall": 14031.2} {"step": 14583, "train_loss": 3.456273317337036, "lr": 0.00024246152270410414, "tps": 68092, "wall": 14036.4} {"step": 14584, "train_loss": 3.4146881103515625, "lr": 0.0002424425143228347, "tps": 68072, "wall": 14041.6} {"step": 14585, "train_loss": 3.3763651847839355, "lr": 0.00024242350568733523, "tps": 68051, "wall": 14046.8} {"step": 14586, "train_loss": 3.393047571182251, "lr": 0.00024240449679782105, "tps": 68030, "wall": 14052.1} {"step": 14587, "train_loss": 3.2977559566497803, "lr": 0.00024238548765450753, "tps": 68009, "wall": 14057.4} {"step": 14588, "train_loss": 3.37713360786438, "lr": 0.00024236647825761002, "tps": 67989, "wall": 14062.6} {"step": 14589, "train_loss": 3.349792003631592, "lr": 0.00024234746860734384, "tps": 67968, "wall": 14067.8} {"step": 14590, "train_loss": 3.5038204193115234, "lr": 0.00024232845870392425, "tps": 67947, "wall": 14073.1} {"step": 14591, "train_loss": 3.407803773880005, "lr": 0.00024230944854756667, "tps": 67926, "wall": 14078.4} {"step": 14592, "train_loss": 3.318424701690674, "lr": 0.00024229043813848655, "tps": 67906, "wall": 14083.7} {"step": 14593, "train_loss": 3.4634852409362793, "lr": 0.00024227142747689913, "tps": 67885, "wall": 14088.9} {"step": 14594, "train_loss": 3.3620705604553223, "lr": 0.00024225241656301969, "tps": 67865, "wall": 14094.1} {"step": 14595, "train_loss": 3.3009018898010254, "lr": 0.00024223340539706372, "tps": 67844, "wall": 14099.4} {"step": 14596, "train_loss": 3.3826847076416016, "lr": 0.0002422143939792465, "tps": 67823, "wall": 14104.6} {"step": 14597, "train_loss": 3.4625163078308105, "lr": 0.00024219538230978348, "tps": 67803, "wall": 14109.8} {"step": 14598, "train_loss": 3.479593515396118, "lr": 0.00024217637038888995, "tps": 67782, "wall": 14115.1} {"step": 14599, "train_loss": 3.407244920730591, "lr": 0.00024215735821678128, "tps": 67762, "wall": 14120.3} {"step": 14600, "train_loss": 3.446829319000244, "lr": 0.00024213834579367286, "tps": 67741, "wall": 14125.6} {"step": 14601, "train_loss": 3.396389961242676, "lr": 0.00024211933311978006, "tps": 67720, "wall": 14131.0} {"step": 14602, "train_loss": 3.3655917644500732, "lr": 0.0002421003201953183, "tps": 67700, "wall": 14136.2} {"step": 14603, "train_loss": 3.3290722370147705, "lr": 0.00024208130702050285, "tps": 67679, "wall": 14141.5} {"step": 14604, "train_loss": 3.452646017074585, "lr": 0.00024206229359554916, "tps": 67659, "wall": 14146.7} {"step": 14605, "train_loss": 3.4331045150756836, "lr": 0.00024204327992067271, "tps": 67638, "wall": 14152.0} {"step": 14606, "train_loss": 3.4407029151916504, "lr": 0.0002420242659960887, "tps": 67618, "wall": 14157.2} {"step": 14607, "train_loss": 3.3975441455841064, "lr": 0.00024200525182201265, "tps": 67597, "wall": 14162.5} {"step": 14608, "train_loss": 3.4666919708251953, "lr": 0.00024198623739865994, "tps": 67577, "wall": 14167.7} {"step": 14609, "train_loss": 3.3193979263305664, "lr": 0.0002419672227262459, "tps": 67556, "wall": 14173.0} {"step": 14610, "train_loss": 3.334057331085205, "lr": 0.00024194820780498594, "tps": 67536, "wall": 14178.2} {"step": 14611, "train_loss": 3.3709874153137207, "lr": 0.00024192919263509556, "tps": 67516, "wall": 14183.5} {"step": 14612, "train_loss": 3.3294239044189453, "lr": 0.0002419101772167901, "tps": 67495, "wall": 14188.7} {"step": 14613, "train_loss": 3.4220259189605713, "lr": 0.00024189116155028494, "tps": 67474, "wall": 14194.1} {"step": 14614, "train_loss": 3.4044647216796875, "lr": 0.0002418721456357955, "tps": 67454, "wall": 14199.3} {"step": 14615, "train_loss": 3.3791213035583496, "lr": 0.0002418531294735372, "tps": 67434, "wall": 14204.6} {"step": 14616, "train_loss": 3.3291420936584473, "lr": 0.00024183411306372555, "tps": 67413, "wall": 14209.9} {"step": 14617, "train_loss": 3.3227641582489014, "lr": 0.00024181509640657577, "tps": 67393, "wall": 14215.2} {"step": 14618, "train_loss": 3.393786907196045, "lr": 0.0002417960795023035, "tps": 67373, "wall": 14220.4} {"step": 14619, "train_loss": 3.4386181831359863, "lr": 0.000241777062351124, "tps": 67352, "wall": 14225.6} {"step": 14620, "train_loss": 3.522305488586426, "lr": 0.00024175804495325288, "tps": 67332, "wall": 14230.9} {"step": 14621, "train_loss": 3.3563578128814697, "lr": 0.00024173902730890528, "tps": 67312, "wall": 14236.2} {"step": 14622, "train_loss": 3.348489761352539, "lr": 0.00024172000941829688, "tps": 67291, "wall": 14241.5} {"step": 14623, "train_loss": 3.3554227352142334, "lr": 0.00024170099128164308, "tps": 67271, "wall": 14246.8} {"step": 14624, "train_loss": 3.2863688468933105, "lr": 0.00024168197289915923, "tps": 67250, "wall": 14252.1} {"step": 14625, "train_loss": 3.3953933715820312, "lr": 0.00024166295427106082, "tps": 67230, "wall": 14257.4} {"step": 14626, "train_loss": 3.2816572189331055, "lr": 0.00024164393539756332, "tps": 67209, "wall": 14262.7} {"step": 14627, "train_loss": 3.380852222442627, "lr": 0.00024162491627888208, "tps": 67189, "wall": 14268.0} {"step": 14628, "train_loss": 3.390101432800293, "lr": 0.00024160589691523266, "tps": 67169, "wall": 14273.2} {"step": 14629, "train_loss": 3.4042916297912598, "lr": 0.00024158687730683047, "tps": 67149, "wall": 14278.5} {"step": 14630, "train_loss": 3.343905448913574, "lr": 0.00024156785745389097, "tps": 67128, "wall": 14283.8} {"step": 14631, "train_loss": 3.398836612701416, "lr": 0.0002415488373566296, "tps": 67108, "wall": 14289.1} {"step": 14632, "train_loss": 3.382362127304077, "lr": 0.00024152981701526183, "tps": 67088, "wall": 14294.3} {"step": 14633, "train_loss": 3.324845314025879, "lr": 0.00024151079643000317, "tps": 67068, "wall": 14299.6} {"step": 14634, "train_loss": 3.3052399158477783, "lr": 0.000241491775601069, "tps": 67048, "wall": 14304.9} {"step": 14635, "train_loss": 3.42588472366333, "lr": 0.00024147275452867485, "tps": 67027, "wall": 14310.3} {"step": 14636, "train_loss": 3.2649948596954346, "lr": 0.00024145373321303622, "tps": 67007, "wall": 14315.5} {"step": 14637, "train_loss": 3.4188296794891357, "lr": 0.00024143471165436847, "tps": 66987, "wall": 14320.8} {"step": 14638, "train_loss": 3.3469016551971436, "lr": 0.0002414156898528872, "tps": 66967, "wall": 14326.1} {"step": 14639, "train_loss": 3.494364023208618, "lr": 0.00024139666780880777, "tps": 66947, "wall": 14331.3} {"step": 14640, "train_loss": 3.2863919734954834, "lr": 0.00024137764552234576, "tps": 66927, "wall": 14336.6} {"step": 14641, "train_loss": 3.438640594482422, "lr": 0.00024135862299371668, "tps": 66907, "wall": 14341.8} {"step": 14642, "train_loss": 3.245689630508423, "lr": 0.0002413396002231359, "tps": 66887, "wall": 14347.2} {"step": 14643, "train_loss": 3.283735752105713, "lr": 0.000241320577210819, "tps": 66867, "wall": 14352.5} {"step": 14644, "train_loss": 3.395449638366699, "lr": 0.00024130155395698144, "tps": 66847, "wall": 14357.8} {"step": 14645, "train_loss": 3.3596067428588867, "lr": 0.00024128253046183873, "tps": 66827, "wall": 14363.0} {"step": 14646, "train_loss": 3.290290594100952, "lr": 0.00024126350672560638, "tps": 66807, "wall": 14368.3} {"step": 14647, "train_loss": 3.3648734092712402, "lr": 0.00024124448274849984, "tps": 66786, "wall": 14373.7} {"step": 14648, "train_loss": 3.304403305053711, "lr": 0.00024122545853073462, "tps": 66766, "wall": 14378.9} {"step": 14649, "train_loss": 3.3863701820373535, "lr": 0.0002412064340725263, "tps": 66746, "wall": 14384.2} {"step": 14650, "train_loss": 3.3797621726989746, "lr": 0.00024118740937409037, "tps": 66727, "wall": 14389.5} {"step": 14651, "train_loss": 3.497608184814453, "lr": 0.00024116838443564227, "tps": 66707, "wall": 14394.8} {"step": 14652, "train_loss": 3.346332550048828, "lr": 0.00024114935925739764, "tps": 66687, "wall": 14400.0} {"step": 14653, "train_loss": 3.2918221950531006, "lr": 0.0002411303338395719, "tps": 66667, "wall": 14405.3} {"step": 14654, "train_loss": 3.3946614265441895, "lr": 0.0002411113081823805, "tps": 66647, "wall": 14410.6} {"step": 14655, "train_loss": 3.3269107341766357, "lr": 0.00024109228228603918, "tps": 66627, "wall": 14415.9} {"step": 14656, "train_loss": 3.350162982940674, "lr": 0.0002410732561507633, "tps": 66607, "wall": 14421.1} {"step": 14657, "train_loss": 3.352970600128174, "lr": 0.00024105422977676843, "tps": 66588, "wall": 14426.4} {"step": 14658, "train_loss": 3.4659478664398193, "lr": 0.00024103520316427011, "tps": 66568, "wall": 14431.7} {"step": 14659, "train_loss": 3.3759286403656006, "lr": 0.00024101617631348384, "tps": 66548, "wall": 14437.0} {"step": 14660, "train_loss": 3.32818603515625, "lr": 0.00024099714922462523, "tps": 66528, "wall": 14442.3} {"step": 14661, "train_loss": 3.3876776695251465, "lr": 0.00024097812189790974, "tps": 66508, "wall": 14447.6} {"step": 14662, "train_loss": 3.3949408531188965, "lr": 0.000240959094333553, "tps": 66488, "wall": 14452.9} {"step": 14663, "train_loss": 3.338151454925537, "lr": 0.00024094006653177052, "tps": 66469, "wall": 14458.1} {"step": 14664, "train_loss": 3.2992377281188965, "lr": 0.00024092103849277776, "tps": 66449, "wall": 14463.4} {"step": 14665, "train_loss": 3.3529341220855713, "lr": 0.00024090201021679036, "tps": 66429, "wall": 14468.7} {"step": 14666, "train_loss": 3.41085147857666, "lr": 0.00024088298170402386, "tps": 66410, "wall": 14473.9} {"step": 14667, "train_loss": 3.4435760974884033, "lr": 0.00024086395295469388, "tps": 66390, "wall": 14479.2} {"step": 14668, "train_loss": 3.405222177505493, "lr": 0.00024084492396901581, "tps": 66371, "wall": 14484.4} {"step": 14669, "train_loss": 3.2922611236572266, "lr": 0.00024082589474720535, "tps": 66351, "wall": 14489.8} {"step": 14670, "train_loss": 3.363938570022583, "lr": 0.0002408068652894781, "tps": 66331, "wall": 14495.0} {"step": 14671, "train_loss": 3.473543643951416, "lr": 0.00024078783559604948, "tps": 66312, "wall": 14500.3} {"step": 14672, "train_loss": 3.446223258972168, "lr": 0.00024076880566713515, "tps": 66292, "wall": 14505.5} {"step": 14673, "train_loss": 3.4493861198425293, "lr": 0.00024074977550295068, "tps": 66273, "wall": 14510.8} {"step": 14674, "train_loss": 3.5202138423919678, "lr": 0.00024073074510371162, "tps": 66253, "wall": 14516.0} {"step": 14675, "train_loss": 3.4040634632110596, "lr": 0.00024071171446963355, "tps": 66234, "wall": 14521.3} {"step": 14676, "train_loss": 3.341966152191162, "lr": 0.000240692683600932, "tps": 66214, "wall": 14526.5} {"step": 14677, "train_loss": 3.415851593017578, "lr": 0.00024067365249782273, "tps": 66195, "wall": 14531.8} {"step": 14678, "train_loss": 3.2753000259399414, "lr": 0.00024065462116052113, "tps": 66176, "wall": 14537.0} {"step": 14679, "train_loss": 3.3806238174438477, "lr": 0.00024063558958924288, "tps": 66156, "wall": 14542.3} {"step": 14680, "train_loss": 3.371830701828003, "lr": 0.00024061655778420362, "tps": 66137, "wall": 14547.6} {"step": 14681, "train_loss": 3.4393796920776367, "lr": 0.00024059752574561878, "tps": 66117, "wall": 14552.9} {"step": 14682, "train_loss": 3.402118682861328, "lr": 0.00024057849347370404, "tps": 66097, "wall": 14558.2} {"step": 14683, "train_loss": 3.395435094833374, "lr": 0.00024055946096867512, "tps": 66078, "wall": 14563.5} {"step": 14684, "train_loss": 3.4599790573120117, "lr": 0.00024054042823074746, "tps": 66059, "wall": 14568.7} {"step": 14685, "train_loss": 3.3555657863616943, "lr": 0.0002405213952601367, "tps": 66039, "wall": 14574.0} {"step": 14686, "train_loss": 3.3626599311828613, "lr": 0.00024050236205705843, "tps": 66020, "wall": 14579.2} {"step": 14687, "train_loss": 3.2754640579223633, "lr": 0.00024048332862172838, "tps": 66001, "wall": 14584.5} {"step": 14688, "train_loss": 3.483349323272705, "lr": 0.00024046429495436203, "tps": 65982, "wall": 14589.7} {"step": 14689, "train_loss": 3.394749402999878, "lr": 0.00024044526105517506, "tps": 65962, "wall": 14595.0} {"step": 14690, "train_loss": 3.4969277381896973, "lr": 0.00024042622692438306, "tps": 65943, "wall": 14600.2} {"step": 14691, "train_loss": 3.430781841278076, "lr": 0.0002404071925622016, "tps": 65924, "wall": 14605.5} {"step": 14692, "train_loss": 3.489084482192993, "lr": 0.00024038815796884646, "tps": 65904, "wall": 14610.9} {"step": 14693, "train_loss": 3.4406189918518066, "lr": 0.00024036912314453313, "tps": 65885, "wall": 14616.1} {"step": 14694, "train_loss": 3.377310276031494, "lr": 0.00024035008808947721, "tps": 65866, "wall": 14621.4} {"step": 14695, "train_loss": 3.445047378540039, "lr": 0.00024033105280389446, "tps": 65846, "wall": 14626.6} {"step": 14696, "train_loss": 3.464766025543213, "lr": 0.00024031201728800036, "tps": 65827, "wall": 14631.9} {"step": 14697, "train_loss": 3.3001749515533447, "lr": 0.00024029298154201075, "tps": 65808, "wall": 14637.1} {"step": 14698, "train_loss": 3.368469715118408, "lr": 0.0002402739455661411, "tps": 65789, "wall": 14642.4} {"step": 14699, "train_loss": 3.4083669185638428, "lr": 0.00024025490936060707, "tps": 65770, "wall": 14647.6} {"step": 14700, "train_loss": 3.391993761062622, "lr": 0.00024023587292562436, "tps": 65751, "wall": 14652.9} {"step": 14701, "train_loss": 3.3189220428466797, "lr": 0.00024021683626140856, "tps": 65731, "wall": 14658.2} {"step": 14702, "train_loss": 3.3683979511260986, "lr": 0.0002401977993681753, "tps": 65712, "wall": 14663.5} {"step": 14703, "train_loss": 3.3570218086242676, "lr": 0.00024017876224614036, "tps": 65693, "wall": 14668.7} {"step": 14704, "train_loss": 3.4097726345062256, "lr": 0.00024015972489551933, "tps": 65674, "wall": 14674.1} {"step": 14705, "train_loss": 3.402390241622925, "lr": 0.00024014068731652776, "tps": 65655, "wall": 14679.3} {"step": 14706, "train_loss": 3.292212963104248, "lr": 0.00024012164950938143, "tps": 65636, "wall": 14684.6} {"step": 14707, "train_loss": 3.488279342651367, "lr": 0.00024010261147429596, "tps": 65617, "wall": 14689.8} {"step": 14708, "train_loss": 3.36893892288208, "lr": 0.00024008357321148708, "tps": 65597, "wall": 14695.1} {"step": 14709, "train_loss": 3.3738512992858887, "lr": 0.00024006453472117035, "tps": 65578, "wall": 14700.4} {"step": 14710, "train_loss": 3.3585166931152344, "lr": 0.00024004549600356145, "tps": 65559, "wall": 14705.6} {"step": 14711, "train_loss": 3.424405336380005, "lr": 0.0002400264570588761, "tps": 65540, "wall": 14710.9} {"step": 14712, "train_loss": 3.4165072441101074, "lr": 0.00024000741788733, "tps": 65521, "wall": 14716.2} {"step": 14713, "train_loss": 3.38686466217041, "lr": 0.0002399883784891388, "tps": 65502, "wall": 14721.5} {"step": 14714, "train_loss": 3.406803607940674, "lr": 0.0002399693388645181, "tps": 65483, "wall": 14726.7} {"step": 14715, "train_loss": 3.2929975986480713, "lr": 0.00023995029901368366, "tps": 65464, "wall": 14732.0} {"step": 14716, "train_loss": 3.3996264934539795, "lr": 0.00023993125893685116, "tps": 65445, "wall": 14737.3} {"step": 14717, "train_loss": 3.4913737773895264, "lr": 0.00023991221863423631, "tps": 65426, "wall": 14742.5} {"step": 14718, "train_loss": 3.4087915420532227, "lr": 0.0002398931781060548, "tps": 65408, "wall": 14747.8} {"step": 14719, "train_loss": 3.3072566986083984, "lr": 0.00023987413735252223, "tps": 65389, "wall": 14753.0} {"step": 14720, "train_loss": 3.399426221847534, "lr": 0.0002398550963738544, "tps": 65370, "wall": 14758.2} {"step": 14721, "train_loss": 3.3125157356262207, "lr": 0.00023983605517026693, "tps": 65351, "wall": 14763.5} {"step": 14722, "train_loss": 3.3471121788024902, "lr": 0.00023981701374197557, "tps": 65332, "wall": 14768.8} {"step": 14723, "train_loss": 3.438476800918579, "lr": 0.00023979797208919593, "tps": 65314, "wall": 14774.0} {"step": 14724, "train_loss": 3.395578145980835, "lr": 0.0002397789302121439, "tps": 65295, "wall": 14779.3} {"step": 14725, "train_loss": 3.39935040473938, "lr": 0.00023975988811103505, "tps": 65276, "wall": 14784.6} {"step": 14726, "train_loss": 3.3212060928344727, "lr": 0.0002397408457860851, "tps": 65257, "wall": 14789.9} {"step": 14727, "train_loss": 3.378207206726074, "lr": 0.00023972180323750974, "tps": 65238, "wall": 14795.2} {"step": 14728, "train_loss": 3.3647758960723877, "lr": 0.0002397027604655248, "tps": 65219, "wall": 14800.4} {"step": 14729, "train_loss": 3.3149285316467285, "lr": 0.0002396837174703459, "tps": 65200, "wall": 14805.7} {"step": 14730, "train_loss": 3.3671391010284424, "lr": 0.00023966467425218878, "tps": 65182, "wall": 14811.0} {"step": 14731, "train_loss": 3.4477670192718506, "lr": 0.00023964563081126921, "tps": 65163, "wall": 14816.2} {"step": 14732, "train_loss": 3.426888942718506, "lr": 0.00023962658714780276, "tps": 65144, "wall": 14821.5} {"step": 14733, "train_loss": 3.4271278381347656, "lr": 0.00023960754326200534, "tps": 65125, "wall": 14826.8} {"step": 14734, "train_loss": 3.375847339630127, "lr": 0.0002395884991540926, "tps": 65107, "wall": 14832.1} {"step": 14735, "train_loss": 3.3850443363189697, "lr": 0.0002395694548242803, "tps": 65088, "wall": 14837.3} {"step": 14736, "train_loss": 3.39200758934021, "lr": 0.00023955041027278417, "tps": 65069, "wall": 14842.6} {"step": 14737, "train_loss": 3.3646974563598633, "lr": 0.00023953136549981988, "tps": 65051, "wall": 14847.8} {"step": 14738, "train_loss": 3.3018009662628174, "lr": 0.0002395123205056033, "tps": 65032, "wall": 14853.2} {"step": 14739, "train_loss": 3.3041763305664062, "lr": 0.00023949327529035005, "tps": 65013, "wall": 14858.4} {"step": 14740, "train_loss": 3.4081954956054688, "lr": 0.0002394742298542759, "tps": 64994, "wall": 14863.7} {"step": 14741, "train_loss": 3.4773309230804443, "lr": 0.00023945518419759667, "tps": 64976, "wall": 14869.0} {"step": 14742, "train_loss": 3.4238462448120117, "lr": 0.00023943613832052803, "tps": 64957, "wall": 14874.3} {"step": 14743, "train_loss": 3.3839333057403564, "lr": 0.00023941709222328577, "tps": 64939, "wall": 14879.5} {"step": 14744, "train_loss": 3.420180082321167, "lr": 0.00023939804590608561, "tps": 64920, "wall": 14884.8} {"step": 14745, "train_loss": 3.3294413089752197, "lr": 0.0002393789993691434, "tps": 64902, "wall": 14890.0} {"step": 14746, "train_loss": 3.439969539642334, "lr": 0.0002393599526126748, "tps": 64883, "wall": 14895.3} {"step": 14747, "train_loss": 3.3593969345092773, "lr": 0.0002393409056368956, "tps": 64864, "wall": 14900.6} {"step": 14748, "train_loss": 3.378438711166382, "lr": 0.0002393218584420216, "tps": 64846, "wall": 14905.8} {"step": 14749, "train_loss": 3.322567939758301, "lr": 0.0002393028110282685, "tps": 64827, "wall": 14911.1} {"step": 14750, "train_loss": 3.2861199378967285, "lr": 0.00023928376339585214, "tps": 64809, "wall": 14916.4} {"step": 14751, "train_loss": 3.3666110038757324, "lr": 0.00023926471554498827, "tps": 64791, "wall": 14921.6} {"step": 14752, "train_loss": 3.351140260696411, "lr": 0.00023924566747589266, "tps": 64772, "wall": 14926.9} {"step": 14753, "train_loss": 3.3575921058654785, "lr": 0.00023922661918878108, "tps": 64754, "wall": 14932.1} {"step": 14754, "train_loss": 3.3073480129241943, "lr": 0.00023920757068386932, "tps": 64735, "wall": 14937.4} {"step": 14755, "train_loss": 3.3936972618103027, "lr": 0.0002391885219613732, "tps": 64717, "wall": 14942.7} {"step": 14756, "train_loss": 3.4399542808532715, "lr": 0.00023916947302150842, "tps": 64699, "wall": 14947.9} {"step": 14757, "train_loss": 3.300161123275757, "lr": 0.00023915042386449077, "tps": 64680, "wall": 14953.1} {"step": 14758, "train_loss": 3.4429421424865723, "lr": 0.00023913137449053617, "tps": 64662, "wall": 14958.4} {"step": 14759, "train_loss": 3.378145694732666, "lr": 0.0002391123248998603, "tps": 64644, "wall": 14963.6} {"step": 14760, "train_loss": 3.3281776905059814, "lr": 0.00023909327509267895, "tps": 64625, "wall": 14968.9} {"step": 14761, "train_loss": 3.402791738510132, "lr": 0.00023907422506920796, "tps": 64607, "wall": 14974.2} {"step": 14762, "train_loss": 3.419092893600464, "lr": 0.00023905517482966312, "tps": 64588, "wall": 14979.5} {"step": 14763, "train_loss": 3.2725744247436523, "lr": 0.00023903612437426022, "tps": 64570, "wall": 14984.7} {"step": 14764, "train_loss": 3.374845266342163, "lr": 0.00023901707370321509, "tps": 64552, "wall": 14990.0} {"step": 14765, "train_loss": 3.400862693786621, "lr": 0.00023899802281674356, "tps": 64534, "wall": 14995.3} {"step": 14766, "train_loss": 3.3828701972961426, "lr": 0.00023897897171506132, "tps": 64515, "wall": 15000.5} {"step": 14767, "train_loss": 3.4130375385284424, "lr": 0.00023895992039838428, "tps": 64497, "wall": 15005.8} {"step": 14768, "train_loss": 3.3650588989257812, "lr": 0.00023894086886692831, "tps": 64479, "wall": 15011.0} {"step": 14769, "train_loss": 3.3887927532196045, "lr": 0.00023892181712090906, "tps": 64460, "wall": 15016.3} {"step": 14770, "train_loss": 3.3014841079711914, "lr": 0.00023890276516054244, "tps": 64442, "wall": 15021.6} {"step": 14771, "train_loss": 3.5145530700683594, "lr": 0.00023888371298604432, "tps": 64424, "wall": 15026.8} {"step": 14772, "train_loss": 3.319183111190796, "lr": 0.00023886466059763048, "tps": 64406, "wall": 15032.2} {"step": 14773, "train_loss": 3.293581485748291, "lr": 0.0002388456079955167, "tps": 64387, "wall": 15037.4} {"step": 14774, "train_loss": 3.3342442512512207, "lr": 0.00023882655517991886, "tps": 64369, "wall": 15042.7} {"step": 14775, "train_loss": 3.301060199737549, "lr": 0.00023880750215105287, "tps": 64351, "wall": 15047.9} {"step": 14776, "train_loss": 3.3127448558807373, "lr": 0.00023878844890913437, "tps": 64333, "wall": 15053.2} {"step": 14777, "train_loss": 3.40803861618042, "lr": 0.00023876939545437934, "tps": 64315, "wall": 15058.4} {"step": 14778, "train_loss": 3.417417049407959, "lr": 0.00023875034178700362, "tps": 64297, "wall": 15063.7} {"step": 14779, "train_loss": 3.3972480297088623, "lr": 0.000238731287907223, "tps": 64279, "wall": 15068.9} {"step": 14780, "train_loss": 3.2886159420013428, "lr": 0.0002387122338152533, "tps": 64261, "wall": 15074.2} {"step": 14781, "train_loss": 3.42240047454834, "lr": 0.00023869317951131044, "tps": 64243, "wall": 15079.4} {"step": 14782, "train_loss": 3.4357619285583496, "lr": 0.00023867412499561024, "tps": 64225, "wall": 15084.7} {"step": 14783, "train_loss": 3.254941463470459, "lr": 0.0002386550702683685, "tps": 64207, "wall": 15090.0} {"step": 14784, "train_loss": 3.436436891555786, "lr": 0.00023863601532980112, "tps": 64189, "wall": 15095.2} {"step": 14785, "train_loss": 3.4310898780822754, "lr": 0.00023861696018012398, "tps": 64171, "wall": 15100.5} {"step": 14786, "train_loss": 3.5101161003112793, "lr": 0.00023859790481955292, "tps": 64153, "wall": 15105.7} {"step": 14787, "train_loss": 3.338259220123291, "lr": 0.00023857884924830374, "tps": 64135, "wall": 15111.0} {"step": 14788, "train_loss": 3.492419958114624, "lr": 0.00023855979346659237, "tps": 64117, "wall": 15116.2} {"step": 14789, "train_loss": 3.4442291259765625, "lr": 0.00023854073747463467, "tps": 64099, "wall": 15121.5} {"step": 14790, "train_loss": 3.290454864501953, "lr": 0.0002385216812726465, "tps": 64081, "wall": 15126.7} {"step": 14791, "train_loss": 3.266097068786621, "lr": 0.0002385026248608437, "tps": 64063, "wall": 15132.0} {"step": 14792, "train_loss": 3.4193708896636963, "lr": 0.00023848356823944213, "tps": 64045, "wall": 15137.2} {"step": 14793, "train_loss": 3.445065975189209, "lr": 0.0002384645114086578, "tps": 64027, "wall": 15142.5} {"step": 14794, "train_loss": 3.3922362327575684, "lr": 0.00023844545436870642, "tps": 64010, "wall": 15147.7} {"step": 14795, "train_loss": 3.343419313430786, "lr": 0.00023842639711980392, "tps": 63991, "wall": 15153.0} {"step": 14796, "train_loss": 3.3818435668945312, "lr": 0.00023840733966216623, "tps": 63974, "wall": 15158.3} {"step": 14797, "train_loss": 3.3139660358428955, "lr": 0.00023838828199600917, "tps": 63956, "wall": 15163.5} {"step": 14798, "train_loss": 3.3334801197052, "lr": 0.00023836922412154868, "tps": 63938, "wall": 15168.8} {"step": 14799, "train_loss": 3.3752713203430176, "lr": 0.00023835016603900058, "tps": 63920, "wall": 15174.1} {"step": 14800, "train_loss": 3.381441116333008, "lr": 0.00023833110774858086, "tps": 63902, "wall": 15179.3} {"step": 14801, "train_loss": 3.347245693206787, "lr": 0.00023831204925050536, "tps": 63884, "wall": 15184.6} {"step": 14802, "train_loss": 3.3372366428375244, "lr": 0.00023829299054498995, "tps": 63867, "wall": 15189.8} {"step": 14803, "train_loss": 3.296426296234131, "lr": 0.00023827393163225057, "tps": 63849, "wall": 15195.1} {"step": 14804, "train_loss": 3.3490853309631348, "lr": 0.00023825487251250306, "tps": 63831, "wall": 15200.4} {"step": 14805, "train_loss": 3.471684455871582, "lr": 0.00023823581318596344, "tps": 63813, "wall": 15205.6} {"step": 14806, "train_loss": 3.268907308578491, "lr": 0.0002382167536528475, "tps": 63795, "wall": 15211.0} {"step": 14807, "train_loss": 3.4272499084472656, "lr": 0.00023819769391337118, "tps": 63777, "wall": 15216.2} {"step": 14808, "train_loss": 3.2562973499298096, "lr": 0.0002381786339677504, "tps": 63759, "wall": 15221.5} {"step": 14809, "train_loss": 3.419739246368408, "lr": 0.00023815957381620107, "tps": 63742, "wall": 15226.8} {"step": 14810, "train_loss": 3.414769172668457, "lr": 0.00023814051345893918, "tps": 63724, "wall": 15232.1} {"step": 14811, "train_loss": 3.3541321754455566, "lr": 0.00023812145289618046, "tps": 63706, "wall": 15237.3} {"step": 14812, "train_loss": 3.377991199493408, "lr": 0.00023810239212814098, "tps": 63689, "wall": 15242.6} {"step": 14813, "train_loss": 3.453657388687134, "lr": 0.00023808333115503665, "tps": 63671, "wall": 15247.8} {"step": 14814, "train_loss": 3.4988036155700684, "lr": 0.00023806426997708332, "tps": 63653, "wall": 15253.2} {"step": 14815, "train_loss": 3.2929811477661133, "lr": 0.000238045208594497, "tps": 63635, "wall": 15258.4} {"step": 14816, "train_loss": 3.4088759422302246, "lr": 0.00023802614700749365, "tps": 63618, "wall": 15263.7} {"step": 14817, "train_loss": 3.3311262130737305, "lr": 0.000238007085216289, "tps": 63600, "wall": 15269.0} {"step": 14818, "train_loss": 3.392561435699463, "lr": 0.00023798802322109916, "tps": 63582, "wall": 15274.2} {"step": 14819, "train_loss": 3.3980937004089355, "lr": 0.00023796896102214, "tps": 63565, "wall": 15279.5} {"step": 14820, "train_loss": 3.3590569496154785, "lr": 0.00023794989861962757, "tps": 63547, "wall": 15284.7} {"step": 14821, "train_loss": 3.5026283264160156, "lr": 0.00023793083601377762, "tps": 63530, "wall": 15289.9} {"step": 14822, "train_loss": 3.4123902320861816, "lr": 0.00023791177320480622, "tps": 63512, "wall": 15295.2} {"step": 14823, "train_loss": 3.4304234981536865, "lr": 0.0002378927101929293, "tps": 63495, "wall": 15300.4} {"step": 14824, "train_loss": 3.3439316749572754, "lr": 0.00023787364697836277, "tps": 63477, "wall": 15305.7} {"step": 14825, "train_loss": 3.2848334312438965, "lr": 0.00023785458356132263, "tps": 63460, "wall": 15310.9} {"step": 14826, "train_loss": 3.4018850326538086, "lr": 0.00023783551994202475, "tps": 63443, "wall": 15316.1} {"step": 14827, "train_loss": 3.371492385864258, "lr": 0.0002378164561206852, "tps": 63425, "wall": 15321.4} {"step": 14828, "train_loss": 3.3554725646972656, "lr": 0.00023779739209751978, "tps": 63407, "wall": 15326.7} {"step": 14829, "train_loss": 3.435256242752075, "lr": 0.00023777832787274462, "tps": 63389, "wall": 15332.1} {"step": 14830, "train_loss": 3.3857436180114746, "lr": 0.0002377592634465756, "tps": 63372, "wall": 15337.3} {"step": 14831, "train_loss": 3.409301996231079, "lr": 0.00023774019881922867, "tps": 63355, "wall": 15342.5} {"step": 14832, "train_loss": 3.4111342430114746, "lr": 0.00023772113399091977, "tps": 63337, "wall": 15347.8} {"step": 14833, "train_loss": 3.300797462463379, "lr": 0.00023770206896186493, "tps": 63320, "wall": 15353.1} {"step": 14834, "train_loss": 3.402643918991089, "lr": 0.00023768300373228014, "tps": 63303, "wall": 15358.3} {"step": 14835, "train_loss": 3.4567372798919678, "lr": 0.00023766393830238129, "tps": 63285, "wall": 15363.5} {"step": 14836, "train_loss": 3.4802517890930176, "lr": 0.00023764487267238432, "tps": 63268, "wall": 15368.8} {"step": 14837, "train_loss": 3.377629041671753, "lr": 0.00023762580684250537, "tps": 63251, "wall": 15374.0} {"step": 14838, "train_loss": 3.3735146522521973, "lr": 0.0002376067408129603, "tps": 63233, "wall": 15379.3} {"step": 14839, "train_loss": 3.4035234451293945, "lr": 0.0002375876745839651, "tps": 63216, "wall": 15384.5} {"step": 14840, "train_loss": 3.3964619636535645, "lr": 0.00023756860815573583, "tps": 63199, "wall": 15389.8} {"step": 14841, "train_loss": 3.3488450050354004, "lr": 0.00023754954152848838, "tps": 63181, "wall": 15395.0} {"step": 14842, "train_loss": 3.5356404781341553, "lr": 0.00023753047470243877, "tps": 63164, "wall": 15400.2} {"step": 14843, "train_loss": 3.327613115310669, "lr": 0.00023751140767780298, "tps": 63147, "wall": 15405.4} {"step": 14844, "train_loss": 3.3694562911987305, "lr": 0.000237492340454797, "tps": 63130, "wall": 15410.7} {"step": 14845, "train_loss": 3.3414816856384277, "lr": 0.00023747327303363686, "tps": 63113, "wall": 15415.9} {"step": 14846, "train_loss": 3.3956527709960938, "lr": 0.00023745420541453855, "tps": 63095, "wall": 15421.2} {"step": 14847, "train_loss": 3.3795504570007324, "lr": 0.00023743513759771808, "tps": 63078, "wall": 15426.4} {"step": 14848, "train_loss": 3.3728890419006348, "lr": 0.0002374160695833914, "tps": 63061, "wall": 15431.6} {"step": 14849, "train_loss": 3.4115004539489746, "lr": 0.00023739700137177452, "tps": 63044, "wall": 15436.9} {"step": 14850, "train_loss": 3.3428454399108887, "lr": 0.00023737793296308354, "tps": 63027, "wall": 15442.1} {"step": 14851, "train_loss": 3.376927137374878, "lr": 0.00023735886435753432, "tps": 63010, "wall": 15447.3} {"step": 14852, "train_loss": 3.37893009185791, "lr": 0.000237339795555343, "tps": 62992, "wall": 15452.7} {"step": 14853, "train_loss": 3.360191822052002, "lr": 0.0002373207265567255, "tps": 62975, "wall": 15458.0} {"step": 14854, "train_loss": 3.3565189838409424, "lr": 0.0002373016573618979, "tps": 62958, "wall": 15463.2} {"step": 14855, "train_loss": 3.351696729660034, "lr": 0.00023728258797107613, "tps": 62941, "wall": 15468.5} {"step": 14856, "train_loss": 3.361518383026123, "lr": 0.0002372635183844763, "tps": 62923, "wall": 15473.7} {"step": 14857, "train_loss": 3.3560290336608887, "lr": 0.00023724444860231448, "tps": 62906, "wall": 15478.9} {"step": 14858, "train_loss": 3.3377487659454346, "lr": 0.0002372253786248065, "tps": 62889, "wall": 15484.2} {"step": 14859, "train_loss": 3.3556277751922607, "lr": 0.00023720630845216857, "tps": 62872, "wall": 15489.4} {"step": 14860, "train_loss": 3.3407790660858154, "lr": 0.00023718723808461664, "tps": 62855, "wall": 15494.7} {"step": 14861, "train_loss": 3.4191014766693115, "lr": 0.0002371681675223667, "tps": 62838, "wall": 15499.9} {"step": 14862, "train_loss": 3.425851583480835, "lr": 0.00023714909676563487, "tps": 62821, "wall": 15505.2} {"step": 14863, "train_loss": 3.286308526992798, "lr": 0.00023713002581463713, "tps": 62804, "wall": 15510.5} {"step": 14864, "train_loss": 3.3811309337615967, "lr": 0.00023711095466958954, "tps": 62787, "wall": 15515.7} {"step": 14865, "train_loss": 3.3499691486358643, "lr": 0.0002370918833307081, "tps": 62770, "wall": 15520.9} {"step": 14866, "train_loss": 3.3560290336608887, "lr": 0.00023707281179820888, "tps": 62753, "wall": 15526.2} {"step": 14867, "train_loss": 3.4211859703063965, "lr": 0.000237053740072308, "tps": 62736, "wall": 15531.4} {"step": 14868, "train_loss": 3.4448447227478027, "lr": 0.00023703466815322134, "tps": 62719, "wall": 15536.6} {"step": 14869, "train_loss": 3.3206865787506104, "lr": 0.00023701559604116508, "tps": 62702, "wall": 15541.9} {"step": 14870, "train_loss": 3.3331658840179443, "lr": 0.00023699652373635526, "tps": 62686, "wall": 15547.1} {"step": 14871, "train_loss": 3.3390862941741943, "lr": 0.00023697745123900786, "tps": 62669, "wall": 15552.3} {"step": 14872, "train_loss": 3.454723358154297, "lr": 0.00023695837854933896, "tps": 62652, "wall": 15557.6} {"step": 14873, "train_loss": 3.3531763553619385, "lr": 0.00023693930566756467, "tps": 62635, "wall": 15562.8} {"step": 14874, "train_loss": 3.4161794185638428, "lr": 0.000236920232593901, "tps": 62618, "wall": 15568.0} {"step": 14875, "train_loss": 3.3605339527130127, "lr": 0.00023690115932856401, "tps": 62601, "wall": 15573.3} {"step": 14876, "train_loss": 3.31874418258667, "lr": 0.00023688208587176974, "tps": 62584, "wall": 15578.6} {"step": 14877, "train_loss": 3.3326735496520996, "lr": 0.0002368630122237343, "tps": 62567, "wall": 15583.8} {"step": 14878, "train_loss": 3.3865983486175537, "lr": 0.00023684393838467377, "tps": 62550, "wall": 15589.1} {"step": 14879, "train_loss": 3.4703431129455566, "lr": 0.0002368248643548042, "tps": 62533, "wall": 15594.3} {"step": 14880, "train_loss": 3.32327938079834, "lr": 0.00023680579013434164, "tps": 62517, "wall": 15599.6} {"step": 14881, "train_loss": 3.369626522064209, "lr": 0.00023678671572350223, "tps": 62500, "wall": 15604.8} {"step": 14882, "train_loss": 3.527034282684326, "lr": 0.00023676764112250194, "tps": 62483, "wall": 15610.1} {"step": 14883, "train_loss": 3.41121506690979, "lr": 0.00023674856633155688, "tps": 62466, "wall": 15615.3} {"step": 14884, "train_loss": 3.4087958335876465, "lr": 0.00023672949135088316, "tps": 62449, "wall": 15620.6} {"step": 14885, "train_loss": 3.37260103225708, "lr": 0.00023671041618069692, "tps": 62432, "wall": 15625.9} {"step": 14886, "train_loss": 3.350511074066162, "lr": 0.00023669134082121413, "tps": 62415, "wall": 15631.2} {"step": 14887, "train_loss": 3.365543842315674, "lr": 0.0002366722652726509, "tps": 62399, "wall": 15636.4} {"step": 14888, "train_loss": 3.3864262104034424, "lr": 0.00023665318953522345, "tps": 62382, "wall": 15641.6} {"step": 14889, "train_loss": 3.410466432571411, "lr": 0.00023663411360914767, "tps": 62365, "wall": 15646.9} {"step": 14890, "train_loss": 3.328369140625, "lr": 0.00023661503749463982, "tps": 62349, "wall": 15652.1} {"step": 14891, "train_loss": 3.338810682296753, "lr": 0.00023659596119191592, "tps": 62332, "wall": 15657.4} {"step": 14892, "train_loss": 3.439772367477417, "lr": 0.00023657688470119203, "tps": 62315, "wall": 15662.6} {"step": 14893, "train_loss": 3.4279024600982666, "lr": 0.00023655780802268428, "tps": 62299, "wall": 15667.8} {"step": 14894, "train_loss": 3.3992342948913574, "lr": 0.00023653873115660884, "tps": 62282, "wall": 15673.1} {"step": 14895, "train_loss": 3.3076865673065186, "lr": 0.00023651965410318172, "tps": 62265, "wall": 15678.3} {"step": 14896, "train_loss": 3.343630075454712, "lr": 0.00023650057686261912, "tps": 62249, "wall": 15683.6} {"step": 14897, "train_loss": 3.3815627098083496, "lr": 0.00023648149943513702, "tps": 62232, "wall": 15688.8} {"step": 14898, "train_loss": 3.4252829551696777, "lr": 0.00023646242182095168, "tps": 62215, "wall": 15694.1} {"step": 14899, "train_loss": 3.3534457683563232, "lr": 0.0002364433440202791, "tps": 62199, "wall": 15699.3} {"step": 14900, "train_loss": 3.4402501583099365, "lr": 0.0002364242660333354, "tps": 62182, "wall": 15704.5} {"step": 14901, "train_loss": 3.3861327171325684, "lr": 0.0002364051878603368, "tps": 62166, "wall": 15709.8} {"step": 14902, "train_loss": 3.409569501876831, "lr": 0.00023638610950149925, "tps": 62149, "wall": 15715.0} {"step": 14903, "train_loss": 3.37951397895813, "lr": 0.00023636703095703898, "tps": 62133, "wall": 15720.2} {"step": 14904, "train_loss": 3.4188826084136963, "lr": 0.0002363479522271721, "tps": 62116, "wall": 15725.5} {"step": 14905, "train_loss": 3.3606481552124023, "lr": 0.00023632887331211482, "tps": 62100, "wall": 15730.7} {"step": 14906, "train_loss": 3.310134172439575, "lr": 0.0002363097942120831, "tps": 62083, "wall": 15735.9} {"step": 14907, "train_loss": 3.406216859817505, "lr": 0.00023629071492729312, "tps": 62067, "wall": 15741.2} {"step": 14908, "train_loss": 3.373622417449951, "lr": 0.00023627163545796113, "tps": 62050, "wall": 15746.4} {"step": 14909, "train_loss": 3.267402172088623, "lr": 0.0002362525558043031, "tps": 62033, "wall": 15751.8} {"step": 14910, "train_loss": 3.460303783416748, "lr": 0.00023623347596653525, "tps": 62017, "wall": 15757.0} {"step": 14911, "train_loss": 3.306942939758301, "lr": 0.0002362143959448737, "tps": 62000, "wall": 15762.2} {"step": 14912, "train_loss": 3.3484058380126953, "lr": 0.00023619531573953472, "tps": 61984, "wall": 15767.5} {"step": 14913, "train_loss": 3.5439419746398926, "lr": 0.00023617623535073418, "tps": 61968, "wall": 15772.7} {"step": 14914, "train_loss": 3.342257499694824, "lr": 0.0002361571547786884, "tps": 61951, "wall": 15777.9} {"step": 14915, "train_loss": 3.331148624420166, "lr": 0.00023613807402361357, "tps": 61935, "wall": 15783.1} {"step": 14916, "train_loss": 3.3335227966308594, "lr": 0.00023611899308572566, "tps": 61919, "wall": 15788.4} {"step": 14917, "train_loss": 3.4019501209259033, "lr": 0.00023609991196524099, "tps": 61902, "wall": 15793.6} {"step": 14918, "train_loss": 3.376775026321411, "lr": 0.00023608083066237564, "tps": 61886, "wall": 15798.8} {"step": 14919, "train_loss": 3.2985925674438477, "lr": 0.00023606174917734576, "tps": 61869, "wall": 15804.1} {"step": 14920, "train_loss": 3.3508009910583496, "lr": 0.00023604266751036748, "tps": 61853, "wall": 15809.4} {"step": 14921, "train_loss": 3.272700786590576, "lr": 0.00023602358566165706, "tps": 61836, "wall": 15814.6} {"step": 14922, "train_loss": 3.4690542221069336, "lr": 0.00023600450363143059, "tps": 61820, "wall": 15819.8} {"step": 14923, "train_loss": 3.367572069168091, "lr": 0.0002359854214199042, "tps": 61804, "wall": 15825.1} {"step": 14924, "train_loss": 3.4181416034698486, "lr": 0.0002359663390272941, "tps": 61788, "wall": 15830.3} {"step": 14925, "train_loss": 3.2851991653442383, "lr": 0.00023594725645381646, "tps": 61771, "wall": 15835.6} {"step": 14926, "train_loss": 3.416109561920166, "lr": 0.00023592817369968741, "tps": 61755, "wall": 15840.8} {"step": 14927, "train_loss": 3.381669282913208, "lr": 0.00023590909076512317, "tps": 61739, "wall": 15846.0} {"step": 14928, "train_loss": 3.4022512435913086, "lr": 0.0002358900076503399, "tps": 61722, "wall": 15851.3} {"step": 14929, "train_loss": 3.4673473834991455, "lr": 0.00023587092435555375, "tps": 61706, "wall": 15856.5} {"step": 14930, "train_loss": 3.388984203338623, "lr": 0.0002358518408809809, "tps": 61690, "wall": 15861.8} {"step": 14931, "train_loss": 3.389766216278076, "lr": 0.00023583275722683755, "tps": 61673, "wall": 15867.1} {"step": 14932, "train_loss": 3.359691619873047, "lr": 0.00023581367339333987, "tps": 61657, "wall": 15872.4} {"step": 14933, "train_loss": 3.414146661758423, "lr": 0.000235794589380704, "tps": 61641, "wall": 15877.7} {"step": 14934, "train_loss": 3.3847532272338867, "lr": 0.00023577550518914618, "tps": 61624, "wall": 15882.9} {"step": 14935, "train_loss": 3.2988758087158203, "lr": 0.00023575642081888267, "tps": 61608, "wall": 15888.2} {"step": 14936, "train_loss": 3.340707540512085, "lr": 0.0002357373362701295, "tps": 61592, "wall": 15893.4} {"step": 14937, "train_loss": 3.3611695766448975, "lr": 0.00023571825154310294, "tps": 61575, "wall": 15898.7} {"step": 14938, "train_loss": 3.358645439147949, "lr": 0.0002356991666380192, "tps": 61559, "wall": 15904.0} {"step": 14939, "train_loss": 3.3550941944122314, "lr": 0.0002356800815550944, "tps": 61543, "wall": 15909.2} {"step": 14940, "train_loss": 3.4148287773132324, "lr": 0.00023566099629454486, "tps": 61527, "wall": 15914.5} {"step": 14941, "train_loss": 3.3560943603515625, "lr": 0.00023564191085658664, "tps": 61511, "wall": 15919.7} {"step": 14942, "train_loss": 3.371112823486328, "lr": 0.00023562282524143603, "tps": 61495, "wall": 15924.9} {"step": 14943, "train_loss": 3.3124468326568604, "lr": 0.0002356037394493092, "tps": 61478, "wall": 15930.3} {"step": 14944, "train_loss": 3.4168131351470947, "lr": 0.00023558465348042242, "tps": 61462, "wall": 15935.5} {"step": 14945, "train_loss": 3.3588075637817383, "lr": 0.0002355655673349918, "tps": 61446, "wall": 15940.7} {"step": 14946, "train_loss": 3.458071708679199, "lr": 0.0002355464810132336, "tps": 61430, "wall": 15945.9} {"step": 14947, "train_loss": 3.372530698776245, "lr": 0.00023552739451536398, "tps": 61414, "wall": 15951.2} {"step": 14948, "train_loss": 3.295151472091675, "lr": 0.0002355083078415992, "tps": 61398, "wall": 15956.4} {"step": 14949, "train_loss": 3.3792877197265625, "lr": 0.00023548922099215553, "tps": 61382, "wall": 15961.7} {"step": 14950, "train_loss": 3.382988929748535, "lr": 0.0002354701339672491, "tps": 61366, "wall": 15966.9} {"step": 14951, "train_loss": 3.357616901397705, "lr": 0.00023545104676709616, "tps": 61350, "wall": 15972.2} {"step": 14952, "train_loss": 3.389267921447754, "lr": 0.00023543195939191295, "tps": 61333, "wall": 15977.4} {"step": 14953, "train_loss": 3.4061644077301025, "lr": 0.0002354128718419156, "tps": 61317, "wall": 15982.7} {"step": 14954, "train_loss": 3.408125877380371, "lr": 0.00023539378411732047, "tps": 61302, "wall": 15987.9} {"step": 14955, "train_loss": 3.334784746170044, "lr": 0.00023537469621834372, "tps": 61285, "wall": 15993.2} {"step": 14956, "train_loss": 3.34724760055542, "lr": 0.00023535560814520151, "tps": 61269, "wall": 15998.5} {"step": 14957, "train_loss": 3.320655345916748, "lr": 0.00023533651989811016, "tps": 61253, "wall": 16003.8} {"step": 14958, "train_loss": 3.345196485519409, "lr": 0.00023531743147728594, "tps": 61237, "wall": 16009.0} {"step": 14959, "train_loss": 3.439858913421631, "lr": 0.000235298342882945, "tps": 61221, "wall": 16014.3} {"step": 14960, "train_loss": 3.402615547180176, "lr": 0.00023527925411530364, "tps": 61205, "wall": 16019.5} {"step": 14961, "train_loss": 3.4850659370422363, "lr": 0.000235260165174578, "tps": 61189, "wall": 16024.8} {"step": 14962, "train_loss": 3.374437093734741, "lr": 0.00023524107606098435, "tps": 61173, "wall": 16030.0} {"step": 14963, "train_loss": 3.332090377807617, "lr": 0.00023522198677473907, "tps": 61157, "wall": 16035.2} {"step": 14964, "train_loss": 3.405139684677124, "lr": 0.0002352028973160582, "tps": 61141, "wall": 16040.5} {"step": 14965, "train_loss": 3.3933379650115967, "lr": 0.00023518380768515815, "tps": 61125, "wall": 16045.8} {"step": 14966, "train_loss": 3.369874954223633, "lr": 0.00023516471788225513, "tps": 61109, "wall": 16051.1} {"step": 14967, "train_loss": 3.3316328525543213, "lr": 0.00023514562790756535, "tps": 61093, "wall": 16056.3} {"step": 14968, "train_loss": 3.3929941654205322, "lr": 0.000235126537761305, "tps": 61077, "wall": 16061.6} {"step": 14969, "train_loss": 3.2918143272399902, "lr": 0.00023510744744369047, "tps": 61062, "wall": 16066.8} {"step": 14970, "train_loss": 3.3799352645874023, "lr": 0.000235088356954938, "tps": 61046, "wall": 16072.0} {"step": 14971, "train_loss": 3.386399269104004, "lr": 0.00023506926629526372, "tps": 61030, "wall": 16077.3} {"step": 14972, "train_loss": 3.5140156745910645, "lr": 0.000235050175464884, "tps": 61014, "wall": 16082.5} {"step": 14973, "train_loss": 3.2680883407592773, "lr": 0.00023503108446401515, "tps": 60998, "wall": 16087.8} {"step": 14974, "train_loss": 3.355767011642456, "lr": 0.00023501199329287328, "tps": 60983, "wall": 16093.0} {"step": 14975, "train_loss": 3.518101215362549, "lr": 0.00023499290195167473, "tps": 60967, "wall": 16098.2} {"step": 14976, "train_loss": 3.327383041381836, "lr": 0.00023497381044063585, "tps": 60951, "wall": 16103.4} {"step": 14977, "train_loss": 3.410871982574463, "lr": 0.00023495471875997282, "tps": 60935, "wall": 16108.7} {"step": 14978, "train_loss": 3.3245785236358643, "lr": 0.00023493562690990184, "tps": 60919, "wall": 16114.0} {"step": 14979, "train_loss": 3.2806396484375, "lr": 0.00023491653489063935, "tps": 60904, "wall": 16119.3} {"step": 14980, "train_loss": 3.3903441429138184, "lr": 0.00023489744270240154, "tps": 60888, "wall": 16124.5} {"step": 14981, "train_loss": 3.4533443450927734, "lr": 0.0002348783503454047, "tps": 60872, "wall": 16129.7} {"step": 14982, "train_loss": 3.4483180046081543, "lr": 0.00023485925781986503, "tps": 60857, "wall": 16135.0} {"step": 14983, "train_loss": 3.3627235889434814, "lr": 0.000234840165125999, "tps": 60841, "wall": 16140.2} {"step": 14984, "train_loss": 3.366358518600464, "lr": 0.00023482107226402267, "tps": 60825, "wall": 16145.4} {"step": 14985, "train_loss": 3.3485708236694336, "lr": 0.00023480197923415254, "tps": 60809, "wall": 16150.7} {"step": 14986, "train_loss": 3.4737813472747803, "lr": 0.00023478288603660468, "tps": 60794, "wall": 16156.0} {"step": 14987, "train_loss": 3.382323741912842, "lr": 0.00023476379267159555, "tps": 60778, "wall": 16161.3} {"step": 14988, "train_loss": 3.395462989807129, "lr": 0.00023474469913934134, "tps": 60762, "wall": 16166.5} {"step": 14989, "train_loss": 3.3894381523132324, "lr": 0.00023472560544005836, "tps": 60746, "wall": 16171.9} {"step": 14990, "train_loss": 3.35006046295166, "lr": 0.000234706511573963, "tps": 60730, "wall": 16177.1} {"step": 14991, "train_loss": 3.407057285308838, "lr": 0.0002346874175412715, "tps": 60715, "wall": 16182.4} {"step": 14992, "train_loss": 3.451915979385376, "lr": 0.00023466832334220007, "tps": 60699, "wall": 16187.6} {"step": 14993, "train_loss": 3.4302520751953125, "lr": 0.0002346492289769651, "tps": 60684, "wall": 16192.8} {"step": 14994, "train_loss": 3.337618827819824, "lr": 0.00023463013444578284, "tps": 60668, "wall": 16198.1} {"step": 14995, "train_loss": 3.360236644744873, "lr": 0.00023461103974886966, "tps": 60652, "wall": 16203.3} {"step": 14996, "train_loss": 3.298424482345581, "lr": 0.00023459194488644177, "tps": 60637, "wall": 16208.6} {"step": 14997, "train_loss": 3.31227707862854, "lr": 0.00023457284985871563, "tps": 60621, "wall": 16213.8} {"step": 14998, "train_loss": 3.2823052406311035, "lr": 0.00023455375466590738, "tps": 60606, "wall": 16219.0} {"step": 14999, "train_loss": 3.3717026710510254, "lr": 0.00023453465930823347, "tps": 60590, "wall": 16224.3} {"step": 15000, "train_loss": 3.4074721336364746, "lr": 0.00023451556378591018, "tps": 60574, "wall": 16229.7, "val_loss_monitor": 3.4538085790105097, "val_loss_full": 3.470632591192862} {"step": 15001, "train_loss": 3.3772315979003906, "lr": 0.00023449646809915376, "tps": 60110, "wall": 16356.1} {"step": 15002, "train_loss": 3.351262092590332, "lr": 0.00023447737224818052, "tps": 60094, "wall": 16361.6} {"step": 15003, "train_loss": 3.3069770336151123, "lr": 0.00023445827623320685, "tps": 60078, "wall": 16367.0} {"step": 15004, "train_loss": 3.242124319076538, "lr": 0.00023443918005444908, "tps": 60062, "wall": 16372.4} {"step": 15005, "train_loss": 3.3468639850616455, "lr": 0.0002344200837121235, "tps": 60046, "wall": 16377.8} {"step": 15006, "train_loss": 3.337665319442749, "lr": 0.00023440098720644632, "tps": 60031, "wall": 16383.1} {"step": 15007, "train_loss": 3.4059040546417236, "lr": 0.0002343818905376341, "tps": 60015, "wall": 16388.6} {"step": 15008, "train_loss": 3.276202917098999, "lr": 0.000234362793705903, "tps": 59999, "wall": 16394.0} {"step": 15009, "train_loss": 3.4341578483581543, "lr": 0.00023434369671146942, "tps": 59983, "wall": 16399.4} {"step": 15010, "train_loss": 3.352328062057495, "lr": 0.00023432459955454964, "tps": 59967, "wall": 16404.8} {"step": 15011, "train_loss": 3.3150503635406494, "lr": 0.00023430550223536004, "tps": 59951, "wall": 16410.3} {"step": 15012, "train_loss": 3.3181915283203125, "lr": 0.00023428640475411694, "tps": 59935, "wall": 16415.7} {"step": 15013, "train_loss": 3.381321907043457, "lr": 0.00023426730711103666, "tps": 59920, "wall": 16421.1} {"step": 15014, "train_loss": 3.335904359817505, "lr": 0.00023424820930633558, "tps": 59904, "wall": 16426.5} {"step": 15015, "train_loss": 3.3526840209960938, "lr": 0.00023422911134023, "tps": 59889, "wall": 16431.8} {"step": 15016, "train_loss": 3.323453187942505, "lr": 0.00023421001321293622, "tps": 59873, "wall": 16437.2} {"step": 15017, "train_loss": 3.3918633460998535, "lr": 0.00023419091492467073, "tps": 59857, "wall": 16442.6} {"step": 15018, "train_loss": 3.4134724140167236, "lr": 0.0002341718164756497, "tps": 59842, "wall": 16448.0} {"step": 15019, "train_loss": 3.3548524379730225, "lr": 0.0002341527178660896, "tps": 59827, "wall": 16453.3} {"step": 15020, "train_loss": 3.3403608798980713, "lr": 0.0002341336190962068, "tps": 59811, "wall": 16458.7} {"step": 15021, "train_loss": 3.485854148864746, "lr": 0.00023411452016621756, "tps": 59796, "wall": 16464.0} {"step": 15022, "train_loss": 3.4603781700134277, "lr": 0.0002340954210763383, "tps": 59780, "wall": 16469.4} {"step": 15023, "train_loss": 3.337629795074463, "lr": 0.00023407632182678527, "tps": 59765, "wall": 16474.7} {"step": 15024, "train_loss": 3.405330181121826, "lr": 0.00023405722241777498, "tps": 59749, "wall": 16480.0} {"step": 15025, "train_loss": 3.3391659259796143, "lr": 0.00023403812284952368, "tps": 59734, "wall": 16485.4} {"step": 15026, "train_loss": 3.363562822341919, "lr": 0.00023401902312224774, "tps": 59719, "wall": 16490.7} {"step": 15027, "train_loss": 3.3969998359680176, "lr": 0.00023399992323616363, "tps": 59703, "wall": 16496.0} {"step": 15028, "train_loss": 3.350205659866333, "lr": 0.00023398082319148756, "tps": 59688, "wall": 16501.2} {"step": 15029, "train_loss": 3.2308013439178467, "lr": 0.00023396172298843597, "tps": 59673, "wall": 16506.5} {"step": 15030, "train_loss": 3.305708408355713, "lr": 0.0002339426226272253, "tps": 59658, "wall": 16511.8} {"step": 15031, "train_loss": 3.374063014984131, "lr": 0.00023392352210807179, "tps": 59643, "wall": 16517.1} {"step": 15032, "train_loss": 3.335198402404785, "lr": 0.00023390442143119184, "tps": 59628, "wall": 16522.4} {"step": 15033, "train_loss": 3.348968505859375, "lr": 0.00023388532059680185, "tps": 59613, "wall": 16527.7} {"step": 15034, "train_loss": 3.4785420894622803, "lr": 0.00023386621960511832, "tps": 59597, "wall": 16533.0} {"step": 15035, "train_loss": 3.391599655151367, "lr": 0.00023384711845635735, "tps": 59582, "wall": 16538.3} {"step": 15036, "train_loss": 3.345798969268799, "lr": 0.00023382801715073556, "tps": 59567, "wall": 16543.5} {"step": 15037, "train_loss": 3.3543343544006348, "lr": 0.00023380891568846926, "tps": 59552, "wall": 16548.8} {"step": 15038, "train_loss": 3.3479905128479004, "lr": 0.00023378981406977473, "tps": 59538, "wall": 16554.1} {"step": 15039, "train_loss": 3.314692974090576, "lr": 0.00023377071229486847, "tps": 59523, "wall": 16559.3} {"step": 15040, "train_loss": 3.443483591079712, "lr": 0.00023375161036396684, "tps": 59508, "wall": 16564.5} {"step": 15041, "train_loss": 3.4540960788726807, "lr": 0.00023373250827728629, "tps": 59493, "wall": 16569.8} {"step": 15042, "train_loss": 3.418776035308838, "lr": 0.00023371340603504313, "tps": 59478, "wall": 16575.0} {"step": 15043, "train_loss": 3.360367774963379, "lr": 0.0002336943036374537, "tps": 59463, "wall": 16580.2} {"step": 15044, "train_loss": 3.4175846576690674, "lr": 0.00023367520108473445, "tps": 59449, "wall": 16585.5} {"step": 15045, "train_loss": 3.370500326156616, "lr": 0.00023365609837710185, "tps": 59433, "wall": 16590.8} {"step": 15046, "train_loss": 3.2613131999969482, "lr": 0.0002336369955147722, "tps": 59418, "wall": 16596.1} {"step": 15047, "train_loss": 3.303725242614746, "lr": 0.0002336178924979619, "tps": 59404, "wall": 16601.3} {"step": 15048, "train_loss": 3.4193649291992188, "lr": 0.00023359878932688744, "tps": 59389, "wall": 16606.6} {"step": 15049, "train_loss": 3.326021671295166, "lr": 0.00023357968600176509, "tps": 59374, "wall": 16611.8} {"step": 15050, "train_loss": 3.3689627647399902, "lr": 0.00023356058252281135, "tps": 59359, "wall": 16617.0} {"step": 15051, "train_loss": 3.4284749031066895, "lr": 0.00023354147889024263, "tps": 59345, "wall": 16622.2} {"step": 15052, "train_loss": 3.3108437061309814, "lr": 0.00023352237510427523, "tps": 59330, "wall": 16627.4} {"step": 15053, "train_loss": 3.4081499576568604, "lr": 0.0002335032711651257, "tps": 59315, "wall": 16632.7} {"step": 15054, "train_loss": 3.450857639312744, "lr": 0.00023348416707301035, "tps": 59301, "wall": 16637.9} {"step": 15055, "train_loss": 3.3390705585479736, "lr": 0.00023346506282814563, "tps": 59286, "wall": 16643.1} {"step": 15056, "train_loss": 3.367701530456543, "lr": 0.00023344595843074797, "tps": 59271, "wall": 16648.3} {"step": 15057, "train_loss": 3.346947193145752, "lr": 0.0002334268538810337, "tps": 59256, "wall": 16653.6} {"step": 15058, "train_loss": 3.3561525344848633, "lr": 0.00023340774917921943, "tps": 59242, "wall": 16658.8} {"step": 15059, "train_loss": 3.4798471927642822, "lr": 0.00023338864432552133, "tps": 59227, "wall": 16664.1} {"step": 15060, "train_loss": 3.3287277221679688, "lr": 0.00023336953932015595, "tps": 59212, "wall": 16669.3} {"step": 15061, "train_loss": 3.351900339126587, "lr": 0.00023335043416333978, "tps": 59198, "wall": 16674.6} {"step": 15062, "train_loss": 3.3991174697875977, "lr": 0.00023333132885528914, "tps": 59183, "wall": 16679.8} {"step": 15063, "train_loss": 3.435720443725586, "lr": 0.00023331222339622047, "tps": 59168, "wall": 16685.0} {"step": 15064, "train_loss": 3.3277595043182373, "lr": 0.0002332931177863502, "tps": 59154, "wall": 16690.2} {"step": 15065, "train_loss": 3.355147361755371, "lr": 0.00023327401202589485, "tps": 59139, "wall": 16695.5} {"step": 15066, "train_loss": 3.3343005180358887, "lr": 0.0002332549061150707, "tps": 59124, "wall": 16700.8} {"step": 15067, "train_loss": 3.383577346801758, "lr": 0.00023323580005409428, "tps": 59110, "wall": 16706.0} {"step": 15068, "train_loss": 3.4653191566467285, "lr": 0.00023321669384318198, "tps": 59095, "wall": 16711.3} {"step": 15069, "train_loss": 3.348257541656494, "lr": 0.00023319758748255027, "tps": 59080, "wall": 16716.5} {"step": 15070, "train_loss": 3.3145692348480225, "lr": 0.00023317848097241558, "tps": 59066, "wall": 16721.7} {"step": 15071, "train_loss": 3.3845033645629883, "lr": 0.00023315937431299432, "tps": 59051, "wall": 16727.0} {"step": 15072, "train_loss": 3.478198528289795, "lr": 0.00023314026750450299, "tps": 59037, "wall": 16732.2} {"step": 15073, "train_loss": 3.374178171157837, "lr": 0.00023312116054715799, "tps": 59022, "wall": 16737.5} {"step": 15074, "train_loss": 3.299375057220459, "lr": 0.00023310205344117578, "tps": 59008, "wall": 16742.7} {"step": 15075, "train_loss": 3.308500051498413, "lr": 0.00023308294618677283, "tps": 58993, "wall": 16747.9} {"step": 15076, "train_loss": 3.4352612495422363, "lr": 0.00023306383878416548, "tps": 58979, "wall": 16753.2} {"step": 15077, "train_loss": 3.368391513824463, "lr": 0.00023304473123357026, "tps": 58964, "wall": 16758.4} {"step": 15078, "train_loss": 3.385866165161133, "lr": 0.0002330256235352037, "tps": 58949, "wall": 16763.7} {"step": 15079, "train_loss": 3.4120826721191406, "lr": 0.00023300651568928214, "tps": 58935, "wall": 16769.0} {"step": 15080, "train_loss": 3.3316214084625244, "lr": 0.00023298740769602203, "tps": 58920, "wall": 16774.3} {"step": 15081, "train_loss": 3.3307244777679443, "lr": 0.00023296829955563982, "tps": 58905, "wall": 16779.6} {"step": 15082, "train_loss": 3.443653106689453, "lr": 0.00023294919126835219, "tps": 58891, "wall": 16784.8} {"step": 15083, "train_loss": 3.3708088397979736, "lr": 0.00023293008283437522, "tps": 58876, "wall": 16790.0} {"step": 15084, "train_loss": 3.3162198066711426, "lr": 0.00023291097425392568, "tps": 58862, "wall": 16795.3} {"step": 15085, "train_loss": 3.4919519424438477, "lr": 0.0002328918655272199, "tps": 58847, "wall": 16800.6} {"step": 15086, "train_loss": 3.287666082382202, "lr": 0.0002328727566544744, "tps": 58833, "wall": 16805.8} {"step": 15087, "train_loss": 3.3998522758483887, "lr": 0.00023285364763590556, "tps": 58818, "wall": 16811.1} {"step": 15088, "train_loss": 3.4168574810028076, "lr": 0.00023283453847172992, "tps": 58804, "wall": 16816.4} {"step": 15089, "train_loss": 3.3837838172912598, "lr": 0.000232815429162164, "tps": 58789, "wall": 16821.7} {"step": 15090, "train_loss": 3.3119778633117676, "lr": 0.00023279631970742415, "tps": 58775, "wall": 16826.9} {"step": 15091, "train_loss": 3.475231170654297, "lr": 0.00023277721010772688, "tps": 58760, "wall": 16832.2} {"step": 15092, "train_loss": 3.339190721511841, "lr": 0.00023275810036328868, "tps": 58745, "wall": 16837.5} {"step": 15093, "train_loss": 3.4308390617370605, "lr": 0.0002327389904743261, "tps": 58731, "wall": 16842.8} {"step": 15094, "train_loss": 3.338876962661743, "lr": 0.00023271988044105548, "tps": 58716, "wall": 16848.1} {"step": 15095, "train_loss": 3.3854761123657227, "lr": 0.00023270077026369342, "tps": 58702, "wall": 16853.4} {"step": 15096, "train_loss": 3.5348358154296875, "lr": 0.0002326816599424563, "tps": 58687, "wall": 16858.7} {"step": 15097, "train_loss": 3.435521125793457, "lr": 0.00023266254947756064, "tps": 58672, "wall": 16864.0} {"step": 15098, "train_loss": 3.335249900817871, "lr": 0.00023264343886922296, "tps": 58658, "wall": 16869.3} {"step": 15099, "train_loss": 3.3072433471679688, "lr": 0.00023262432811765974, "tps": 58643, "wall": 16874.7} {"step": 15100, "train_loss": 3.3838891983032227, "lr": 0.00023260521722308743, "tps": 58629, "wall": 16880.0} {"step": 15101, "train_loss": 3.389157295227051, "lr": 0.0002325861061857225, "tps": 58614, "wall": 16885.3} {"step": 15102, "train_loss": 3.308314800262451, "lr": 0.0002325669950057815, "tps": 58599, "wall": 16890.8} {"step": 15103, "train_loss": 3.384237766265869, "lr": 0.00023254788368348096, "tps": 58584, "wall": 16896.1} {"step": 15104, "train_loss": 3.29933500289917, "lr": 0.00023252877221903724, "tps": 58570, "wall": 16901.5} {"step": 15105, "train_loss": 3.349522352218628, "lr": 0.00023250966061266697, "tps": 58555, "wall": 16906.8} {"step": 15106, "train_loss": 3.324251174926758, "lr": 0.00023249054886458653, "tps": 58540, "wall": 16912.1} {"step": 15107, "train_loss": 3.3379037380218506, "lr": 0.0002324714369750125, "tps": 58526, "wall": 16917.5} {"step": 15108, "train_loss": 3.2928922176361084, "lr": 0.00023245232494416133, "tps": 58511, "wall": 16922.8} {"step": 15109, "train_loss": 3.3945791721343994, "lr": 0.00023243321277224962, "tps": 58496, "wall": 16928.2} {"step": 15110, "train_loss": 3.4321298599243164, "lr": 0.0002324141004594938, "tps": 58482, "wall": 16933.5} {"step": 15111, "train_loss": 3.417943000793457, "lr": 0.0002323949880061103, "tps": 58467, "wall": 16938.9} {"step": 15112, "train_loss": 3.347161054611206, "lr": 0.00023237587541231577, "tps": 58453, "wall": 16944.3} {"step": 15113, "train_loss": 3.30326509475708, "lr": 0.0002323567626783266, "tps": 58437, "wall": 16949.8} {"step": 15114, "train_loss": 3.298614740371704, "lr": 0.00023233764980435938, "tps": 58423, "wall": 16955.1} {"step": 15115, "train_loss": 3.3731777667999268, "lr": 0.0002323185367906306, "tps": 58408, "wall": 16960.5} {"step": 15116, "train_loss": 3.394315719604492, "lr": 0.0002322994236373568, "tps": 58394, "wall": 16965.9} {"step": 15117, "train_loss": 3.350040912628174, "lr": 0.00023228031034475444, "tps": 58379, "wall": 16971.3} {"step": 15118, "train_loss": 3.3890883922576904, "lr": 0.00023226119691303998, "tps": 58365, "wall": 16976.6} {"step": 15119, "train_loss": 3.254002809524536, "lr": 0.00023224208334243014, "tps": 58350, "wall": 16981.9} {"step": 15120, "train_loss": 3.2623372077941895, "lr": 0.00023222296963314122, "tps": 58335, "wall": 16987.3} {"step": 15121, "train_loss": 3.2992019653320312, "lr": 0.00023220385578538993, "tps": 58321, "wall": 16992.7} {"step": 15122, "train_loss": 3.4439635276794434, "lr": 0.00023218474179939272, "tps": 58306, "wall": 16998.1} {"step": 15123, "train_loss": 3.3688924312591553, "lr": 0.00023216562767536597, "tps": 58291, "wall": 17003.5} {"step": 15124, "train_loss": 3.408379077911377, "lr": 0.00023214651341352637, "tps": 58277, "wall": 17008.9} {"step": 15125, "train_loss": 3.2997677326202393, "lr": 0.00023212739901409045, "tps": 58262, "wall": 17014.4} {"step": 15126, "train_loss": 3.4646143913269043, "lr": 0.00023210828447727474, "tps": 58247, "wall": 17019.8} {"step": 15127, "train_loss": 3.3588991165161133, "lr": 0.00023208916980329566, "tps": 58233, "wall": 17025.2} {"step": 15128, "train_loss": 3.495108127593994, "lr": 0.00023207005499236984, "tps": 58218, "wall": 17030.6} {"step": 15129, "train_loss": 3.405019998550415, "lr": 0.00023205094004471373, "tps": 58203, "wall": 17036.0} {"step": 15130, "train_loss": 3.457855701446533, "lr": 0.000232031824960544, "tps": 58189, "wall": 17041.4} {"step": 15131, "train_loss": 3.4702422618865967, "lr": 0.00023201270974007704, "tps": 58174, "wall": 17046.8} {"step": 15132, "train_loss": 3.3228347301483154, "lr": 0.00023199359438352946, "tps": 58159, "wall": 17052.3} {"step": 15133, "train_loss": 3.368203639984131, "lr": 0.00023197447889111784, "tps": 58144, "wall": 17057.8} {"step": 15134, "train_loss": 3.3398540019989014, "lr": 0.00023195536326305863, "tps": 58130, "wall": 17063.2} {"step": 15135, "train_loss": 3.3775181770324707, "lr": 0.00023193624749956842, "tps": 58115, "wall": 17068.5} {"step": 15136, "train_loss": 3.448530673980713, "lr": 0.0002319171316008638, "tps": 58101, "wall": 17074.0} {"step": 15137, "train_loss": 3.4288172721862793, "lr": 0.0002318980155671612, "tps": 58086, "wall": 17079.5} {"step": 15138, "train_loss": 3.3535711765289307, "lr": 0.00023187889939867726, "tps": 58071, "wall": 17084.9} {"step": 15139, "train_loss": 3.4179391860961914, "lr": 0.00023185978309562852, "tps": 58057, "wall": 17090.3} {"step": 15140, "train_loss": 3.409518003463745, "lr": 0.00023184066665823152, "tps": 58042, "wall": 17095.7} {"step": 15141, "train_loss": 3.271195411682129, "lr": 0.00023182155008670278, "tps": 58028, "wall": 17101.1} {"step": 15142, "train_loss": 3.3553028106689453, "lr": 0.00023180243338125886, "tps": 58013, "wall": 17106.6} {"step": 15143, "train_loss": 3.4262874126434326, "lr": 0.0002317833165421164, "tps": 57998, "wall": 17112.0} {"step": 15144, "train_loss": 3.296661853790283, "lr": 0.00023176419956949187, "tps": 57984, "wall": 17117.5} {"step": 15145, "train_loss": 3.3984620571136475, "lr": 0.00023174508246360186, "tps": 57969, "wall": 17123.0} {"step": 15146, "train_loss": 3.397519111633301, "lr": 0.00023172596522466287, "tps": 57954, "wall": 17128.4} {"step": 15147, "train_loss": 3.3974363803863525, "lr": 0.0002317068478528916, "tps": 57939, "wall": 17134.0} {"step": 15148, "train_loss": 3.4796502590179443, "lr": 0.00023168773034850447, "tps": 57925, "wall": 17139.4} {"step": 15149, "train_loss": 3.34067964553833, "lr": 0.00023166861271171806, "tps": 57910, "wall": 17144.9} {"step": 15150, "train_loss": 3.343043327331543, "lr": 0.00023164949494274906, "tps": 57895, "wall": 17150.4} {"step": 15151, "train_loss": 3.267693042755127, "lr": 0.00023163037704181392, "tps": 57881, "wall": 17155.9} {"step": 15152, "train_loss": 3.2709219455718994, "lr": 0.0002316112590091292, "tps": 57866, "wall": 17161.4} {"step": 15153, "train_loss": 3.3868656158447266, "lr": 0.00023159214084491155, "tps": 57851, "wall": 17166.9} {"step": 15154, "train_loss": 3.3772244453430176, "lr": 0.0002315730225493775, "tps": 57836, "wall": 17172.4} {"step": 15155, "train_loss": 3.35392427444458, "lr": 0.00023155390412274362, "tps": 57822, "wall": 17177.8} {"step": 15156, "train_loss": 3.3984055519104004, "lr": 0.00023153478556522643, "tps": 57807, "wall": 17183.4} {"step": 15157, "train_loss": 3.2742295265197754, "lr": 0.00023151566687704266, "tps": 57792, "wall": 17188.9} {"step": 15158, "train_loss": 3.4629502296447754, "lr": 0.00023149654805840872, "tps": 57777, "wall": 17194.5} {"step": 15159, "train_loss": 3.438772201538086, "lr": 0.00023147742910954126, "tps": 57763, "wall": 17199.9} {"step": 15160, "train_loss": 3.510211706161499, "lr": 0.00023145831003065697, "tps": 57748, "wall": 17205.5} {"step": 15161, "train_loss": 3.2797961235046387, "lr": 0.00023143919082197224, "tps": 57733, "wall": 17211.0} {"step": 15162, "train_loss": 3.48238468170166, "lr": 0.00023142007148370373, "tps": 57718, "wall": 17216.6} {"step": 15163, "train_loss": 3.526319980621338, "lr": 0.00023140095201606804, "tps": 57704, "wall": 17222.0} {"step": 15164, "train_loss": 3.4094438552856445, "lr": 0.0002313818324192818, "tps": 57689, "wall": 17227.6} {"step": 15165, "train_loss": 3.3772006034851074, "lr": 0.00023136271269356143, "tps": 57675, "wall": 17233.1} {"step": 15166, "train_loss": 3.3633182048797607, "lr": 0.00023134359283912375, "tps": 57660, "wall": 17238.6} {"step": 15167, "train_loss": 3.340125560760498, "lr": 0.00023132447285618518, "tps": 57645, "wall": 17244.2} {"step": 15168, "train_loss": 3.322791576385498, "lr": 0.00023130535274496237, "tps": 57630, "wall": 17249.8} {"step": 15169, "train_loss": 3.385136127471924, "lr": 0.00023128623250567195, "tps": 57616, "wall": 17255.2} {"step": 15170, "train_loss": 3.4301419258117676, "lr": 0.00023126711213853046, "tps": 57601, "wall": 17260.7} {"step": 15171, "train_loss": 3.305354595184326, "lr": 0.00023124799164375451, "tps": 57586, "wall": 17266.3} {"step": 15172, "train_loss": 3.3471360206604004, "lr": 0.00023122887102156067, "tps": 57572, "wall": 17271.8} {"step": 15173, "train_loss": 3.4056525230407715, "lr": 0.0002312097502721656, "tps": 57557, "wall": 17277.4} {"step": 15174, "train_loss": 3.2923378944396973, "lr": 0.0002311906293957859, "tps": 57542, "wall": 17283.0} {"step": 15175, "train_loss": 3.442948341369629, "lr": 0.00023117150839263814, "tps": 57528, "wall": 17288.5} {"step": 15176, "train_loss": 3.3830835819244385, "lr": 0.00023115238726293885, "tps": 57513, "wall": 17294.0} {"step": 15177, "train_loss": 3.3759889602661133, "lr": 0.0002311332660069048, "tps": 57499, "wall": 17299.5} {"step": 15178, "train_loss": 3.3841283321380615, "lr": 0.0002311141446247525, "tps": 57484, "wall": 17305.1} {"step": 15179, "train_loss": 3.3592276573181152, "lr": 0.00023109502311669853, "tps": 57469, "wall": 17310.7} {"step": 15180, "train_loss": 3.4366345405578613, "lr": 0.0002310759014829596, "tps": 57454, "wall": 17316.3} {"step": 15181, "train_loss": 3.396442413330078, "lr": 0.00023105677972375216, "tps": 57439, "wall": 17321.9} {"step": 15182, "train_loss": 3.2607288360595703, "lr": 0.00023103765783929298, "tps": 57425, "wall": 17327.4} {"step": 15183, "train_loss": 3.3600990772247314, "lr": 0.00023101853582979863, "tps": 57410, "wall": 17333.0} {"step": 15184, "train_loss": 3.3778181076049805, "lr": 0.0002309994136954857, "tps": 57396, "wall": 17338.5} {"step": 15185, "train_loss": 3.4041316509246826, "lr": 0.0002309802914365708, "tps": 57381, "wall": 17344.1} {"step": 15186, "train_loss": 3.4174294471740723, "lr": 0.00023096116905327055, "tps": 57367, "wall": 17349.6} {"step": 15187, "train_loss": 3.393615245819092, "lr": 0.00023094204654580165, "tps": 57352, "wall": 17355.2} {"step": 15188, "train_loss": 3.2826526165008545, "lr": 0.0002309229239143806, "tps": 57337, "wall": 17360.7} {"step": 15189, "train_loss": 3.392946243286133, "lr": 0.0002309038011592241, "tps": 57323, "wall": 17366.3} {"step": 15190, "train_loss": 3.3472819328308105, "lr": 0.00023088467828054877, "tps": 57308, "wall": 17371.9} {"step": 15191, "train_loss": 3.414778470993042, "lr": 0.0002308655552785712, "tps": 57293, "wall": 17377.5} {"step": 15192, "train_loss": 3.340284824371338, "lr": 0.00023084643215350793, "tps": 57279, "wall": 17383.1} {"step": 15193, "train_loss": 3.339583158493042, "lr": 0.00023082730890557583, "tps": 57264, "wall": 17388.6} {"step": 15194, "train_loss": 3.289706230163574, "lr": 0.00023080818553499133, "tps": 57250, "wall": 17394.1} {"step": 15195, "train_loss": 3.2871460914611816, "lr": 0.00023078906204197113, "tps": 57235, "wall": 17399.7} {"step": 15196, "train_loss": 3.4407742023468018, "lr": 0.00023076993842673186, "tps": 57221, "wall": 17405.3} {"step": 15197, "train_loss": 3.4842090606689453, "lr": 0.0002307508146894901, "tps": 57206, "wall": 17410.8} {"step": 15198, "train_loss": 3.4074158668518066, "lr": 0.00023073169083046255, "tps": 57192, "wall": 17416.4} {"step": 15199, "train_loss": 3.3099663257598877, "lr": 0.00023071256684986584, "tps": 57177, "wall": 17422.0} {"step": 15200, "train_loss": 3.362513780593872, "lr": 0.0002306934427479166, "tps": 57162, "wall": 17427.6} {"step": 15201, "train_loss": 3.324967384338379, "lr": 0.00023067431852483145, "tps": 57148, "wall": 17433.2} {"step": 15202, "train_loss": 3.3990464210510254, "lr": 0.00023065519418082704, "tps": 57133, "wall": 17438.8} {"step": 15203, "train_loss": 3.3016581535339355, "lr": 0.00023063606971612002, "tps": 57119, "wall": 17444.4} {"step": 15204, "train_loss": 3.340280532836914, "lr": 0.00023061694513092706, "tps": 57104, "wall": 17450.0} {"step": 15205, "train_loss": 3.4097588062286377, "lr": 0.00023059782042546476, "tps": 57090, "wall": 17455.6} {"step": 15206, "train_loss": 3.409931182861328, "lr": 0.00023057869559994974, "tps": 57075, "wall": 17461.2} {"step": 15207, "train_loss": 3.3836793899536133, "lr": 0.0002305595706545987, "tps": 57061, "wall": 17466.7} {"step": 15208, "train_loss": 3.4164743423461914, "lr": 0.0002305404455896283, "tps": 57046, "wall": 17472.3} {"step": 15209, "train_loss": 3.364220142364502, "lr": 0.00023052132040525506, "tps": 57032, "wall": 17477.8} {"step": 15210, "train_loss": 3.301436424255371, "lr": 0.0002305021951016958, "tps": 57018, "wall": 17483.4} {"step": 15211, "train_loss": 3.4374048709869385, "lr": 0.0002304830696791672, "tps": 57003, "wall": 17488.9} {"step": 15212, "train_loss": 3.391341209411621, "lr": 0.00023046394413788574, "tps": 56988, "wall": 17494.6} {"step": 15213, "train_loss": 3.2526092529296875, "lr": 0.0002304448184780681, "tps": 56974, "wall": 17500.2} {"step": 15214, "train_loss": 3.4395737648010254, "lr": 0.00023042569269993103, "tps": 56959, "wall": 17505.8} {"step": 15215, "train_loss": 3.2914984226226807, "lr": 0.00023040656680369117, "tps": 56945, "wall": 17511.4} {"step": 15216, "train_loss": 3.369114398956299, "lr": 0.00023038744078956517, "tps": 56931, "wall": 17517.0} {"step": 15217, "train_loss": 3.4604744911193848, "lr": 0.00023036831465776962, "tps": 56916, "wall": 17522.6} {"step": 15218, "train_loss": 3.295362949371338, "lr": 0.0002303491884085213, "tps": 56902, "wall": 17528.2} {"step": 15219, "train_loss": 3.3602640628814697, "lr": 0.00023033006204203676, "tps": 56887, "wall": 17533.7} {"step": 15220, "train_loss": 3.3884024620056152, "lr": 0.00023031093555853275, "tps": 56873, "wall": 17539.4} {"step": 15221, "train_loss": 3.428255796432495, "lr": 0.0002302918089582259, "tps": 56859, "wall": 17545.0} {"step": 15222, "train_loss": 3.474233865737915, "lr": 0.0002302726822413329, "tps": 56844, "wall": 17550.7} {"step": 15223, "train_loss": 3.3683438301086426, "lr": 0.0002302535554080704, "tps": 56829, "wall": 17556.3} {"step": 15224, "train_loss": 3.4103307723999023, "lr": 0.000230234428458655, "tps": 56815, "wall": 17561.9} {"step": 15225, "train_loss": 3.3143985271453857, "lr": 0.00023021530139330355, "tps": 56800, "wall": 17567.5} {"step": 15226, "train_loss": 3.3513827323913574, "lr": 0.00023019617421223253, "tps": 56786, "wall": 17573.1} {"step": 15227, "train_loss": 3.3661904335021973, "lr": 0.0002301770469156587, "tps": 56772, "wall": 17578.8} {"step": 15228, "train_loss": 3.34885311126709, "lr": 0.0002301579195037988, "tps": 56757, "wall": 17584.4} {"step": 15229, "train_loss": 3.481753349304199, "lr": 0.00023013879197686938, "tps": 56743, "wall": 17590.0} {"step": 15230, "train_loss": 3.398454427719116, "lr": 0.00023011966433508717, "tps": 56728, "wall": 17595.6} {"step": 15231, "train_loss": 3.3041038513183594, "lr": 0.00023010053657866885, "tps": 56714, "wall": 17601.2} {"step": 15232, "train_loss": 3.3428335189819336, "lr": 0.00023008140870783118, "tps": 56700, "wall": 17606.8} {"step": 15233, "train_loss": 3.3977909088134766, "lr": 0.0002300622807227907, "tps": 56685, "wall": 17612.6} {"step": 15234, "train_loss": 3.4116036891937256, "lr": 0.00023004315262376416, "tps": 56671, "wall": 17618.1} {"step": 15235, "train_loss": 3.420299530029297, "lr": 0.0002300240244109683, "tps": 56657, "wall": 17623.7} {"step": 15236, "train_loss": 3.3626785278320312, "lr": 0.0002300048960846197, "tps": 56642, "wall": 17629.3} {"step": 15237, "train_loss": 3.3767447471618652, "lr": 0.00022998576764493507, "tps": 56628, "wall": 17634.9} {"step": 15238, "train_loss": 3.510122537612915, "lr": 0.00022996663909213117, "tps": 56614, "wall": 17640.5} {"step": 15239, "train_loss": 3.3460941314697266, "lr": 0.00022994751042642464, "tps": 56599, "wall": 17646.2} {"step": 15240, "train_loss": 3.39507794380188, "lr": 0.00022992838164803217, "tps": 56585, "wall": 17651.8} {"step": 15241, "train_loss": 3.296262502670288, "lr": 0.0002299092527571704, "tps": 56571, "wall": 17657.4} {"step": 15242, "train_loss": 3.2850403785705566, "lr": 0.0002298901237540562, "tps": 56556, "wall": 17663.1} {"step": 15243, "train_loss": 3.365445852279663, "lr": 0.00022987099463890606, "tps": 56542, "wall": 17668.7} {"step": 15244, "train_loss": 3.324756145477295, "lr": 0.00022985186541193674, "tps": 56527, "wall": 17674.4} {"step": 15245, "train_loss": 3.3295657634735107, "lr": 0.000229832736073365, "tps": 56513, "wall": 17680.0} {"step": 15246, "train_loss": 3.2457056045532227, "lr": 0.00022981360662340748, "tps": 56499, "wall": 17685.7} {"step": 15247, "train_loss": 3.298623561859131, "lr": 0.00022979447706228086, "tps": 56485, "wall": 17691.3} {"step": 15248, "train_loss": 3.337388277053833, "lr": 0.00022977534739020193, "tps": 56470, "wall": 17696.9} {"step": 15249, "train_loss": 3.31781268119812, "lr": 0.00022975621760738734, "tps": 56456, "wall": 17702.6} {"step": 15250, "train_loss": 3.358344316482544, "lr": 0.00022973708771405375, "tps": 56442, "wall": 17708.2} {"step": 15251, "train_loss": 3.357971668243408, "lr": 0.0002297179577104179, "tps": 56427, "wall": 17713.9} {"step": 15252, "train_loss": 3.329468011856079, "lr": 0.00022969882759669652, "tps": 56413, "wall": 17719.5} {"step": 15253, "train_loss": 3.3250434398651123, "lr": 0.0002296796973731063, "tps": 56399, "wall": 17725.2} {"step": 15254, "train_loss": 3.502570390701294, "lr": 0.00022966056703986395, "tps": 56384, "wall": 17731.0} {"step": 15255, "train_loss": 3.403329610824585, "lr": 0.00022964143659718613, "tps": 56370, "wall": 17736.5} {"step": 15256, "train_loss": 3.339218854904175, "lr": 0.00022962230604528966, "tps": 56356, "wall": 17742.1} {"step": 15257, "train_loss": 3.3758068084716797, "lr": 0.0002296031753843911, "tps": 56342, "wall": 17747.7} {"step": 15258, "train_loss": 3.408339500427246, "lr": 0.0002295840446147073, "tps": 56328, "wall": 17753.3} {"step": 15259, "train_loss": 3.386805534362793, "lr": 0.00022956491373645496, "tps": 56314, "wall": 17759.0} {"step": 15260, "train_loss": 3.3931238651275635, "lr": 0.00022954578274985075, "tps": 56299, "wall": 17764.6} {"step": 15261, "train_loss": 3.3050875663757324, "lr": 0.00022952665165511133, "tps": 56285, "wall": 17770.3} {"step": 15262, "train_loss": 3.4820733070373535, "lr": 0.0002295075204524536, "tps": 56271, "wall": 17775.9} {"step": 15263, "train_loss": 3.41658091545105, "lr": 0.00022948838914209403, "tps": 56257, "wall": 17781.5} {"step": 15264, "train_loss": 3.3257219791412354, "lr": 0.00022946925772424952, "tps": 56243, "wall": 17787.1} {"step": 15265, "train_loss": 3.4149363040924072, "lr": 0.00022945012619913683, "tps": 56228, "wall": 17793.0} {"step": 15266, "train_loss": 3.4375157356262207, "lr": 0.00022943099456697246, "tps": 56214, "wall": 17798.6} {"step": 15267, "train_loss": 3.354245185852051, "lr": 0.00022941186282797332, "tps": 56200, "wall": 17804.3} {"step": 15268, "train_loss": 3.3411145210266113, "lr": 0.0002293927309823561, "tps": 56185, "wall": 17810.0} {"step": 15269, "train_loss": 3.4748775959014893, "lr": 0.00022937359903033762, "tps": 56171, "wall": 17815.7} {"step": 15270, "train_loss": 3.4013943672180176, "lr": 0.0002293544669721344, "tps": 56157, "wall": 17821.4} {"step": 15271, "train_loss": 3.4083034992218018, "lr": 0.00022933533480796325, "tps": 56143, "wall": 17827.0} {"step": 15272, "train_loss": 3.332165479660034, "lr": 0.00022931620253804097, "tps": 56129, "wall": 17832.6} {"step": 15273, "train_loss": 3.3612658977508545, "lr": 0.00022929707016258424, "tps": 56115, "wall": 17838.3} {"step": 15274, "train_loss": 3.364328145980835, "lr": 0.00022927793768180976, "tps": 56100, "wall": 17844.0} {"step": 15275, "train_loss": 3.363518238067627, "lr": 0.00022925880509593434, "tps": 56086, "wall": 17849.8} {"step": 15276, "train_loss": 3.3781819343566895, "lr": 0.00022923967240517462, "tps": 56072, "wall": 17855.5} {"step": 15277, "train_loss": 3.3510332107543945, "lr": 0.00022922053960974746, "tps": 56057, "wall": 17861.2} {"step": 15278, "train_loss": 3.342367649078369, "lr": 0.00022920140670986948, "tps": 56043, "wall": 17866.9} {"step": 15279, "train_loss": 3.359678268432617, "lr": 0.00022918227370575752, "tps": 56029, "wall": 17872.5} {"step": 15280, "train_loss": 3.398655652999878, "lr": 0.0002291631405976282, "tps": 56015, "wall": 17878.1} {"step": 15281, "train_loss": 3.405609130859375, "lr": 0.0002291440073856984, "tps": 56001, "wall": 17883.7} {"step": 15282, "train_loss": 3.2769393920898438, "lr": 0.00022912487407018476, "tps": 55987, "wall": 17889.4} {"step": 15283, "train_loss": 3.399524450302124, "lr": 0.00022910574065130402, "tps": 55973, "wall": 17895.0} {"step": 15284, "train_loss": 3.345454216003418, "lr": 0.00022908660712927294, "tps": 55959, "wall": 17900.7} {"step": 15285, "train_loss": 3.4831295013427734, "lr": 0.00022906747350430836, "tps": 55945, "wall": 17906.4} {"step": 15286, "train_loss": 3.3781661987304688, "lr": 0.00022904833977662695, "tps": 55931, "wall": 17912.1} {"step": 15287, "train_loss": 3.4331934452056885, "lr": 0.0002290292059464454, "tps": 55917, "wall": 17917.8} {"step": 15288, "train_loss": 3.3282041549682617, "lr": 0.0002290100720139805, "tps": 55903, "wall": 17923.4} {"step": 15289, "train_loss": 3.3518478870391846, "lr": 0.0002289909379794491, "tps": 55889, "wall": 17929.1} {"step": 15290, "train_loss": 3.469564914703369, "lr": 0.0002289718038430678, "tps": 55875, "wall": 17934.7} {"step": 15291, "train_loss": 3.3115668296813965, "lr": 0.0002289526696050534, "tps": 55861, "wall": 17940.3} {"step": 15292, "train_loss": 3.536630868911743, "lr": 0.00022893353526562277, "tps": 55848, "wall": 17945.9} {"step": 15293, "train_loss": 3.3179588317871094, "lr": 0.0002289144008249925, "tps": 55834, "wall": 17951.6} {"step": 15294, "train_loss": 3.3514297008514404, "lr": 0.0002288952662833794, "tps": 55820, "wall": 17957.2} {"step": 15295, "train_loss": 3.2807743549346924, "lr": 0.00022887613164100033, "tps": 55806, "wall": 17962.7} {"step": 15296, "train_loss": 3.2864205837249756, "lr": 0.00022885699689807187, "tps": 55792, "wall": 17968.4} {"step": 15297, "train_loss": 3.3459231853485107, "lr": 0.00022883786205481094, "tps": 55778, "wall": 17974.0} {"step": 15298, "train_loss": 3.3848001956939697, "lr": 0.0002288187271114342, "tps": 55765, "wall": 17979.6} {"step": 15299, "train_loss": 3.369877338409424, "lr": 0.0002287995920681584, "tps": 55751, "wall": 17985.3} {"step": 15300, "train_loss": 3.2544078826904297, "lr": 0.00022878045692520044, "tps": 55737, "wall": 17990.9} {"step": 15301, "train_loss": 3.3035030364990234, "lr": 0.00022876132168277692, "tps": 55723, "wall": 17996.5} {"step": 15302, "train_loss": 3.3330535888671875, "lr": 0.0002287421863411047, "tps": 55710, "wall": 18002.1} {"step": 15303, "train_loss": 3.3326196670532227, "lr": 0.0002287230509004005, "tps": 55696, "wall": 18007.6} {"step": 15304, "train_loss": 3.3534798622131348, "lr": 0.00022870391536088108, "tps": 55682, "wall": 18013.2} {"step": 15305, "train_loss": 3.3724365234375, "lr": 0.00022868477972276327, "tps": 55669, "wall": 18018.8} {"step": 15306, "train_loss": 3.3351311683654785, "lr": 0.00022866564398626378, "tps": 55655, "wall": 18024.4} {"step": 15307, "train_loss": 3.2694272994995117, "lr": 0.00022864650815159946, "tps": 55641, "wall": 18030.1} {"step": 15308, "train_loss": 3.434176206588745, "lr": 0.00022862737221898702, "tps": 55628, "wall": 18035.7} {"step": 15309, "train_loss": 3.351475715637207, "lr": 0.0002286082361886432, "tps": 55614, "wall": 18041.3} {"step": 15310, "train_loss": 3.3912782669067383, "lr": 0.00022858910006078484, "tps": 55600, "wall": 18046.9} {"step": 15311, "train_loss": 3.5356035232543945, "lr": 0.00022856996383562869, "tps": 55587, "wall": 18052.4} {"step": 15312, "train_loss": 3.295065402984619, "lr": 0.0002285508275133915, "tps": 55573, "wall": 18058.0} {"step": 15313, "train_loss": 3.3789422512054443, "lr": 0.0002285316910942901, "tps": 55560, "wall": 18063.5} {"step": 15314, "train_loss": 3.411991834640503, "lr": 0.00022851255457854124, "tps": 55547, "wall": 18069.1} {"step": 15315, "train_loss": 3.361083984375, "lr": 0.0002284934179663617, "tps": 55533, "wall": 18074.6} {"step": 15316, "train_loss": 3.392854690551758, "lr": 0.0002284742812579682, "tps": 55520, "wall": 18080.2} {"step": 15317, "train_loss": 3.318636417388916, "lr": 0.00022845514445357773, "tps": 55506, "wall": 18085.7} {"step": 15318, "train_loss": 3.3589513301849365, "lr": 0.00022843600755340679, "tps": 55493, "wall": 18091.3} {"step": 15319, "train_loss": 3.3335886001586914, "lr": 0.00022841687055767237, "tps": 55479, "wall": 18096.9} {"step": 15320, "train_loss": 3.5208334922790527, "lr": 0.00022839773346659118, "tps": 55466, "wall": 18102.5} {"step": 15321, "train_loss": 3.4479639530181885, "lr": 0.00022837859628038, "tps": 55452, "wall": 18108.0} {"step": 15322, "train_loss": 3.353782892227173, "lr": 0.00022835945899925557, "tps": 55439, "wall": 18113.6} {"step": 15323, "train_loss": 3.308743476867676, "lr": 0.0002283403216234348, "tps": 55426, "wall": 18119.1} {"step": 15324, "train_loss": 3.399764060974121, "lr": 0.0002283211841531344, "tps": 55412, "wall": 18124.7} {"step": 15325, "train_loss": 3.440333843231201, "lr": 0.00022830204658857116, "tps": 55399, "wall": 18130.2} {"step": 15326, "train_loss": 3.3752613067626953, "lr": 0.0002282829089299619, "tps": 55386, "wall": 18135.8} {"step": 15327, "train_loss": 3.3029444217681885, "lr": 0.00022826377117752343, "tps": 55372, "wall": 18141.3} {"step": 15328, "train_loss": 3.462023973464966, "lr": 0.0002282446333314725, "tps": 55359, "wall": 18146.9} {"step": 15329, "train_loss": 3.329216718673706, "lr": 0.00022822549539202585, "tps": 55345, "wall": 18152.5} {"step": 15330, "train_loss": 3.405867099761963, "lr": 0.00022820635735940043, "tps": 55332, "wall": 18158.0} {"step": 15331, "train_loss": 3.3756656646728516, "lr": 0.00022818721923381294, "tps": 55319, "wall": 18163.5} {"step": 15332, "train_loss": 3.3782689571380615, "lr": 0.00022816808101548013, "tps": 55306, "wall": 18169.0} {"step": 15333, "train_loss": 3.2955939769744873, "lr": 0.0002281489427046189, "tps": 55293, "wall": 18174.6} {"step": 15334, "train_loss": 3.3804237842559814, "lr": 0.00022812980430144607, "tps": 55279, "wall": 18180.1} {"step": 15335, "train_loss": 3.429741144180298, "lr": 0.0002281106658061783, "tps": 55266, "wall": 18185.6} {"step": 15336, "train_loss": 3.350731611251831, "lr": 0.0002280915272190324, "tps": 55253, "wall": 18191.1} {"step": 15337, "train_loss": 3.294440746307373, "lr": 0.0002280723885402254, "tps": 55240, "wall": 18196.6} {"step": 15338, "train_loss": 3.448772668838501, "lr": 0.0002280532497699738, "tps": 55227, "wall": 18202.1} {"step": 15339, "train_loss": 3.3789992332458496, "lr": 0.0002280341109084946, "tps": 55214, "wall": 18207.7} {"step": 15340, "train_loss": 3.3188586235046387, "lr": 0.0002280149719560046, "tps": 55201, "wall": 18213.2} {"step": 15341, "train_loss": 3.38038969039917, "lr": 0.00022799583291272053, "tps": 55187, "wall": 18218.8} {"step": 15342, "train_loss": 3.3793561458587646, "lr": 0.00022797669377885922, "tps": 55174, "wall": 18224.3} {"step": 15343, "train_loss": 3.350151538848877, "lr": 0.00022795755455463752, "tps": 55161, "wall": 18229.8} {"step": 15344, "train_loss": 3.461677074432373, "lr": 0.00022793841524027225, "tps": 55148, "wall": 18235.3} {"step": 15345, "train_loss": 3.424826145172119, "lr": 0.0002279192758359801, "tps": 55135, "wall": 18240.8} {"step": 15346, "train_loss": 3.2752747535705566, "lr": 0.00022790013634197797, "tps": 55122, "wall": 18246.4} {"step": 15347, "train_loss": 3.3918495178222656, "lr": 0.00022788099675848274, "tps": 55109, "wall": 18251.8} {"step": 15348, "train_loss": 3.34324049949646, "lr": 0.00022786185708571107, "tps": 55096, "wall": 18257.3} {"step": 15349, "train_loss": 3.3687920570373535, "lr": 0.00022784271732387987, "tps": 55083, "wall": 18262.8} {"step": 15350, "train_loss": 3.403658866882324, "lr": 0.00022782357747320604, "tps": 55070, "wall": 18268.3} {"step": 15351, "train_loss": 3.4960598945617676, "lr": 0.0002278044375339062, "tps": 55057, "wall": 18273.8} {"step": 15352, "train_loss": 3.387458324432373, "lr": 0.0002277852975061973, "tps": 55044, "wall": 18279.3} {"step": 15353, "train_loss": 3.3410112857818604, "lr": 0.00022776615739029615, "tps": 55031, "wall": 18284.8} {"step": 15354, "train_loss": 3.4015493392944336, "lr": 0.00022774701718641956, "tps": 55018, "wall": 18290.3} {"step": 15355, "train_loss": 3.4043123722076416, "lr": 0.00022772787689478427, "tps": 55005, "wall": 18295.8} {"step": 15356, "train_loss": 3.3238413333892822, "lr": 0.00022770873651560715, "tps": 54992, "wall": 18301.2} {"step": 15357, "train_loss": 3.2634153366088867, "lr": 0.00022768959604910517, "tps": 54979, "wall": 18306.7} {"step": 15358, "train_loss": 3.508765697479248, "lr": 0.00022767045549549494, "tps": 54966, "wall": 18312.3} {"step": 15359, "train_loss": 3.3067007064819336, "lr": 0.00022765131485499342, "tps": 54954, "wall": 18317.7} {"step": 15360, "train_loss": 3.373263359069824, "lr": 0.00022763217412781735, "tps": 54941, "wall": 18323.2} {"step": 15361, "train_loss": 3.3671748638153076, "lr": 0.00022761303331418368, "tps": 54928, "wall": 18328.7} {"step": 15362, "train_loss": 3.3832504749298096, "lr": 0.00022759389241430906, "tps": 54915, "wall": 18334.2} {"step": 15363, "train_loss": 3.3851242065429688, "lr": 0.00022757475142841046, "tps": 54902, "wall": 18339.7} {"step": 15364, "train_loss": 3.3843655586242676, "lr": 0.00022755561035670466, "tps": 54889, "wall": 18345.2} {"step": 15365, "train_loss": 3.242140293121338, "lr": 0.00022753646919940846, "tps": 54876, "wall": 18350.7} {"step": 15366, "train_loss": 3.329782247543335, "lr": 0.00022751732795673878, "tps": 54863, "wall": 18356.2} {"step": 15367, "train_loss": 3.3298819065093994, "lr": 0.0002274981866289124, "tps": 54851, "wall": 18361.6} {"step": 15368, "train_loss": 3.3452441692352295, "lr": 0.00022747904521614617, "tps": 54838, "wall": 18367.1} {"step": 15369, "train_loss": 3.3248839378356934, "lr": 0.00022745990371865688, "tps": 54825, "wall": 18372.6} {"step": 15370, "train_loss": 3.4313769340515137, "lr": 0.0002274407621366614, "tps": 54812, "wall": 18378.0} {"step": 15371, "train_loss": 3.3834948539733887, "lr": 0.00022742162047037655, "tps": 54800, "wall": 18383.5} {"step": 15372, "train_loss": 3.346125602722168, "lr": 0.0002274024787200192, "tps": 54787, "wall": 18389.0} {"step": 15373, "train_loss": 3.379049301147461, "lr": 0.00022738333688580617, "tps": 54774, "wall": 18394.6} {"step": 15374, "train_loss": 3.401926279067993, "lr": 0.00022736419496795432, "tps": 54761, "wall": 18400.1} {"step": 15375, "train_loss": 3.3526320457458496, "lr": 0.00022734505296668044, "tps": 54748, "wall": 18405.5} {"step": 15376, "train_loss": 3.3431613445281982, "lr": 0.0002273259108822014, "tps": 54736, "wall": 18410.9} {"step": 15377, "train_loss": 3.3982722759246826, "lr": 0.00022730676871473407, "tps": 54723, "wall": 18416.4} {"step": 15378, "train_loss": 3.400078773498535, "lr": 0.00022728762646449528, "tps": 54711, "wall": 18421.8} {"step": 15379, "train_loss": 3.2807719707489014, "lr": 0.00022726848413170183, "tps": 54698, "wall": 18427.3} {"step": 15380, "train_loss": 3.2668488025665283, "lr": 0.00022724934171657063, "tps": 54685, "wall": 18432.7} {"step": 15381, "train_loss": 3.2973546981811523, "lr": 0.00022723019921931848, "tps": 54673, "wall": 18438.2} {"step": 15382, "train_loss": 3.37801456451416, "lr": 0.00022721105664016224, "tps": 54660, "wall": 18443.7} {"step": 15383, "train_loss": 3.3711373805999756, "lr": 0.00022719191397931873, "tps": 54647, "wall": 18449.1} {"step": 15384, "train_loss": 3.4493746757507324, "lr": 0.00022717277123700486, "tps": 54635, "wall": 18454.7} {"step": 15385, "train_loss": 3.344506025314331, "lr": 0.0002271536284134375, "tps": 54622, "wall": 18460.1} {"step": 15386, "train_loss": 3.2965023517608643, "lr": 0.00022713448550883337, "tps": 54609, "wall": 18465.5} {"step": 15387, "train_loss": 3.2828338146209717, "lr": 0.00022711534252340939, "tps": 54597, "wall": 18471.0} {"step": 15388, "train_loss": 3.4620180130004883, "lr": 0.0002270961994573825, "tps": 54585, "wall": 18476.4} {"step": 15389, "train_loss": 3.2891578674316406, "lr": 0.00022707705631096943, "tps": 54572, "wall": 18481.8} {"step": 15390, "train_loss": 3.4626054763793945, "lr": 0.00022705791308438706, "tps": 54560, "wall": 18487.2} {"step": 15391, "train_loss": 3.3881542682647705, "lr": 0.0002270387697778523, "tps": 54547, "wall": 18492.7} {"step": 15392, "train_loss": 3.3438634872436523, "lr": 0.00022701962639158198, "tps": 54535, "wall": 18498.1} {"step": 15393, "train_loss": 3.3975911140441895, "lr": 0.00022700048292579296, "tps": 54522, "wall": 18503.5} {"step": 15394, "train_loss": 3.260941982269287, "lr": 0.0002269813393807021, "tps": 54509, "wall": 18509.1} {"step": 15395, "train_loss": 3.3347718715667725, "lr": 0.00022696219575652626, "tps": 54497, "wall": 18514.6} {"step": 15396, "train_loss": 3.399717330932617, "lr": 0.00022694305205348222, "tps": 54484, "wall": 18520.0} {"step": 15397, "train_loss": 3.38077974319458, "lr": 0.00022692390827178693, "tps": 54472, "wall": 18525.4} {"step": 15398, "train_loss": 3.3559346199035645, "lr": 0.0002269047644116573, "tps": 54459, "wall": 18530.9} {"step": 15399, "train_loss": 3.3386266231536865, "lr": 0.00022688562047331007, "tps": 54447, "wall": 18536.3} {"step": 15400, "train_loss": 3.3871729373931885, "lr": 0.00022686647645696217, "tps": 54434, "wall": 18541.8} {"step": 15401, "train_loss": 3.3961362838745117, "lr": 0.00022684733236283045, "tps": 54422, "wall": 18547.2} {"step": 15402, "train_loss": 3.408705472946167, "lr": 0.00022682818819113178, "tps": 54410, "wall": 18552.6} {"step": 15403, "train_loss": 3.372931718826294, "lr": 0.00022680904394208303, "tps": 54397, "wall": 18558.0} {"step": 15404, "train_loss": 3.335437774658203, "lr": 0.00022678989961590103, "tps": 54385, "wall": 18563.4} {"step": 15405, "train_loss": 3.3759970664978027, "lr": 0.00022677075521280275, "tps": 54373, "wall": 18568.9} {"step": 15406, "train_loss": 3.4131298065185547, "lr": 0.00022675161073300494, "tps": 54360, "wall": 18574.5} {"step": 15407, "train_loss": 3.4165613651275635, "lr": 0.0002267324661767245, "tps": 54347, "wall": 18579.9} {"step": 15408, "train_loss": 3.2723708152770996, "lr": 0.0002267133215441783, "tps": 54335, "wall": 18585.3} {"step": 15409, "train_loss": 3.356703281402588, "lr": 0.00022669417683558334, "tps": 54323, "wall": 18590.8} {"step": 15410, "train_loss": 3.349090814590454, "lr": 0.00022667503205115632, "tps": 54310, "wall": 18596.2} {"step": 15411, "train_loss": 3.3375957012176514, "lr": 0.00022665588719111414, "tps": 54298, "wall": 18601.6} {"step": 15412, "train_loss": 3.42592716217041, "lr": 0.00022663674225567376, "tps": 54286, "wall": 18607.1} {"step": 15413, "train_loss": 3.419762372970581, "lr": 0.00022661759724505197, "tps": 54273, "wall": 18612.5} {"step": 15414, "train_loss": 3.4323782920837402, "lr": 0.00022659845215946569, "tps": 54261, "wall": 18617.9} {"step": 15415, "train_loss": 3.294208526611328, "lr": 0.00022657930699913182, "tps": 54249, "wall": 18623.3} {"step": 15416, "train_loss": 3.301095962524414, "lr": 0.00022656016176426716, "tps": 54237, "wall": 18628.7} {"step": 15417, "train_loss": 3.3550095558166504, "lr": 0.00022654101645508865, "tps": 54224, "wall": 18634.2} {"step": 15418, "train_loss": 3.4757065773010254, "lr": 0.00022652187107181316, "tps": 54212, "wall": 18639.6} {"step": 15419, "train_loss": 3.291165351867676, "lr": 0.00022650272561465756, "tps": 54200, "wall": 18645.0} {"step": 15420, "train_loss": 3.361342191696167, "lr": 0.00022648358008383874, "tps": 54188, "wall": 18650.4} {"step": 15421, "train_loss": 3.394430160522461, "lr": 0.00022646443447957353, "tps": 54176, "wall": 18655.8} {"step": 15422, "train_loss": 3.2924818992614746, "lr": 0.00022644528880207894, "tps": 54163, "wall": 18661.1} {"step": 15423, "train_loss": 3.38437557220459, "lr": 0.00022642614305157165, "tps": 54151, "wall": 18666.6} {"step": 15424, "train_loss": 3.5296835899353027, "lr": 0.00022640699722826875, "tps": 54139, "wall": 18671.9} {"step": 15425, "train_loss": 3.2561967372894287, "lr": 0.00022638785133238703, "tps": 54127, "wall": 18677.3} {"step": 15426, "train_loss": 3.2655587196350098, "lr": 0.00022636870536414335, "tps": 54115, "wall": 18682.7} {"step": 15427, "train_loss": 3.4118874073028564, "lr": 0.00022634955932375467, "tps": 54103, "wall": 18688.2} {"step": 15428, "train_loss": 3.3247694969177246, "lr": 0.0002263304132114378, "tps": 54090, "wall": 18693.6} {"step": 15429, "train_loss": 3.341433525085449, "lr": 0.00022631126702740971, "tps": 54078, "wall": 18699.0} {"step": 15430, "train_loss": 3.3779492378234863, "lr": 0.00022629212077188724, "tps": 54066, "wall": 18704.4} {"step": 15431, "train_loss": 3.291332244873047, "lr": 0.00022627297444508725, "tps": 54054, "wall": 18709.8} {"step": 15432, "train_loss": 3.3373639583587646, "lr": 0.0002262538280472267, "tps": 54042, "wall": 18715.2} {"step": 15433, "train_loss": 3.3930773735046387, "lr": 0.00022623468157852242, "tps": 54030, "wall": 18720.6} {"step": 15434, "train_loss": 3.3338847160339355, "lr": 0.00022621553503919138, "tps": 54018, "wall": 18726.0} {"step": 15435, "train_loss": 3.318610668182373, "lr": 0.00022619638842945032, "tps": 54006, "wall": 18731.4} {"step": 15436, "train_loss": 3.4799067974090576, "lr": 0.00022617724174951636, "tps": 53994, "wall": 18736.7} {"step": 15437, "train_loss": 3.3645055294036865, "lr": 0.00022615809499960623, "tps": 53982, "wall": 18742.1} {"step": 15438, "train_loss": 3.3440937995910645, "lr": 0.00022613894817993685, "tps": 53970, "wall": 18747.6} {"step": 15439, "train_loss": 3.404418706893921, "lr": 0.00022611980129072512, "tps": 53957, "wall": 18753.0} {"step": 15440, "train_loss": 3.2213735580444336, "lr": 0.00022610065433218795, "tps": 53945, "wall": 18758.4} {"step": 15441, "train_loss": 3.3840975761413574, "lr": 0.00022608150730454228, "tps": 53934, "wall": 18763.8} {"step": 15442, "train_loss": 3.3566179275512695, "lr": 0.00022606236020800494, "tps": 53921, "wall": 18769.2} {"step": 15443, "train_loss": 3.3168764114379883, "lr": 0.00022604321304279284, "tps": 53910, "wall": 18774.6} {"step": 15444, "train_loss": 3.309236526489258, "lr": 0.00022602406580912292, "tps": 53898, "wall": 18780.0} {"step": 15445, "train_loss": 3.3686885833740234, "lr": 0.000226004918507212, "tps": 53885, "wall": 18785.4} {"step": 15446, "train_loss": 3.3534626960754395, "lr": 0.00022598577113727713, "tps": 53874, "wall": 18790.8} {"step": 15447, "train_loss": 3.402961015701294, "lr": 0.00022596662369953508, "tps": 53861, "wall": 18796.2} {"step": 15448, "train_loss": 3.3987159729003906, "lr": 0.00022594747619420277, "tps": 53849, "wall": 18801.6} {"step": 15449, "train_loss": 3.352175712585449, "lr": 0.00022592832862149714, "tps": 53837, "wall": 18807.1} {"step": 15450, "train_loss": 3.3323633670806885, "lr": 0.00022590918098163508, "tps": 53825, "wall": 18812.5} {"step": 15451, "train_loss": 3.3648626804351807, "lr": 0.00022589003327483354, "tps": 53813, "wall": 18817.9} {"step": 15452, "train_loss": 3.325042486190796, "lr": 0.00022587088550130933, "tps": 53801, "wall": 18823.3} {"step": 15453, "train_loss": 3.300281047821045, "lr": 0.00022585173766127942, "tps": 53789, "wall": 18828.7} {"step": 15454, "train_loss": 3.3889591693878174, "lr": 0.00022583258975496074, "tps": 53777, "wall": 18834.1} {"step": 15455, "train_loss": 3.3366620540618896, "lr": 0.00022581344178257014, "tps": 53766, "wall": 18839.5} {"step": 15456, "train_loss": 3.4733214378356934, "lr": 0.00022579429374432457, "tps": 53754, "wall": 18844.8} {"step": 15457, "train_loss": 3.379595994949341, "lr": 0.00022577514564044092, "tps": 53742, "wall": 18850.3} {"step": 15458, "train_loss": 3.2830810546875, "lr": 0.0002257559974711361, "tps": 53730, "wall": 18855.7} {"step": 15459, "train_loss": 3.4069290161132812, "lr": 0.0002257368492366271, "tps": 53718, "wall": 18861.1} {"step": 15460, "train_loss": 3.2980127334594727, "lr": 0.0002257177009371307, "tps": 53706, "wall": 18866.5} {"step": 15461, "train_loss": 3.3950228691101074, "lr": 0.00022569855257286383, "tps": 53694, "wall": 18872.0} {"step": 15462, "train_loss": 3.3591179847717285, "lr": 0.00022567940414404349, "tps": 53682, "wall": 18877.4} {"step": 15463, "train_loss": 3.3245089054107666, "lr": 0.0002256602556508866, "tps": 53670, "wall": 18882.8} {"step": 15464, "train_loss": 3.369382858276367, "lr": 0.00022564110709361003, "tps": 53658, "wall": 18888.2} {"step": 15465, "train_loss": 3.330681800842285, "lr": 0.00022562195847243061, "tps": 53646, "wall": 18893.6} {"step": 15466, "train_loss": 3.3494338989257812, "lr": 0.0002256028097875654, "tps": 53634, "wall": 18899.0} {"step": 15467, "train_loss": 3.436051368713379, "lr": 0.00022558366103923129, "tps": 53623, "wall": 18904.3} {"step": 15468, "train_loss": 3.3952300548553467, "lr": 0.00022556451222764502, "tps": 53611, "wall": 18909.7} {"step": 15469, "train_loss": 3.382728338241577, "lr": 0.00022554536335302373, "tps": 53599, "wall": 18915.1} {"step": 15470, "train_loss": 3.4815828800201416, "lr": 0.00022552621441558434, "tps": 53587, "wall": 18920.4} {"step": 15471, "train_loss": 3.3605380058288574, "lr": 0.0002255070654155436, "tps": 53576, "wall": 18925.8} {"step": 15472, "train_loss": 3.4544219970703125, "lr": 0.0002254879163531186, "tps": 53564, "wall": 18931.3} {"step": 15473, "train_loss": 3.3847641944885254, "lr": 0.0002254687672285262, "tps": 53552, "wall": 18936.7} {"step": 15474, "train_loss": 3.4432921409606934, "lr": 0.00022544961804198322, "tps": 53540, "wall": 18942.1} {"step": 15475, "train_loss": 3.321828842163086, "lr": 0.0002254304687937067, "tps": 53528, "wall": 18947.4} {"step": 15476, "train_loss": 3.422212600708008, "lr": 0.00022541131948391354, "tps": 53517, "wall": 18952.8} {"step": 15477, "train_loss": 3.303419351577759, "lr": 0.00022539217011282068, "tps": 53505, "wall": 18958.2} {"step": 15478, "train_loss": 3.434783697128296, "lr": 0.00022537302068064498, "tps": 53493, "wall": 18963.5} {"step": 15479, "train_loss": 3.381436824798584, "lr": 0.00022535387118760344, "tps": 53482, "wall": 18968.9} {"step": 15480, "train_loss": 3.4629788398742676, "lr": 0.00022533472163391297, "tps": 53470, "wall": 18974.3} {"step": 15481, "train_loss": 3.3902697563171387, "lr": 0.0002253155720197905, "tps": 53458, "wall": 18979.6} {"step": 15482, "train_loss": 3.4539871215820312, "lr": 0.00022529642234545287, "tps": 53446, "wall": 18985.1} {"step": 15483, "train_loss": 3.4011621475219727, "lr": 0.00022527727261111716, "tps": 53435, "wall": 18990.5} {"step": 15484, "train_loss": 3.318878412246704, "lr": 0.00022525812281700019, "tps": 53423, "wall": 18995.9} {"step": 15485, "train_loss": 3.3376054763793945, "lr": 0.0002252389729633189, "tps": 53411, "wall": 19001.2} {"step": 15486, "train_loss": 3.354275703430176, "lr": 0.00022521982305029025, "tps": 53400, "wall": 19006.6} {"step": 15487, "train_loss": 3.37699556350708, "lr": 0.00022520067307813118, "tps": 53388, "wall": 19011.9} {"step": 15488, "train_loss": 3.333784580230713, "lr": 0.0002251815230470586, "tps": 53376, "wall": 19017.3} {"step": 15489, "train_loss": 3.364288330078125, "lr": 0.00022516237295728942, "tps": 53365, "wall": 19022.7} {"step": 15490, "train_loss": 3.2695395946502686, "lr": 0.00022514322280904066, "tps": 53353, "wall": 19028.0} {"step": 15491, "train_loss": 3.38045072555542, "lr": 0.00022512407260252918, "tps": 53342, "wall": 19033.4} {"step": 15492, "train_loss": 3.4238152503967285, "lr": 0.00022510492233797185, "tps": 53330, "wall": 19038.8} {"step": 15493, "train_loss": 3.532292366027832, "lr": 0.00022508577201558571, "tps": 53318, "wall": 19044.2} {"step": 15494, "train_loss": 3.4233157634735107, "lr": 0.00022506662163558776, "tps": 53307, "wall": 19049.6} {"step": 15495, "train_loss": 3.352680206298828, "lr": 0.00022504747119819478, "tps": 53295, "wall": 19055.0} {"step": 15496, "train_loss": 3.3829562664031982, "lr": 0.0002250283207036237, "tps": 53283, "wall": 19060.4} {"step": 15497, "train_loss": 3.2297565937042236, "lr": 0.0002250091701520917, "tps": 53272, "wall": 19065.7} {"step": 15498, "train_loss": 3.4252758026123047, "lr": 0.0002249900195438154, "tps": 53260, "wall": 19071.2} {"step": 15499, "train_loss": 3.2693159580230713, "lr": 0.00022497086887901193, "tps": 53249, "wall": 19076.6} {"step": 15500, "train_loss": 3.403651237487793, "lr": 0.00022495171815789826, "tps": 53237, "wall": 19081.9} {"step": 15501, "train_loss": 3.418771743774414, "lr": 0.00022493256738069118, "tps": 53225, "wall": 19087.5} {"step": 15502, "train_loss": 3.3575961589813232, "lr": 0.00022491341654760772, "tps": 53213, "wall": 19092.9} {"step": 15503, "train_loss": 3.39274263381958, "lr": 0.0002248942656588648, "tps": 53202, "wall": 19098.3} {"step": 15504, "train_loss": 3.333897113800049, "lr": 0.00022487511471467944, "tps": 53190, "wall": 19103.6} {"step": 15505, "train_loss": 3.2696800231933594, "lr": 0.00022485596371526846, "tps": 53179, "wall": 19109.0} {"step": 15506, "train_loss": 3.352903366088867, "lr": 0.00022483681266084884, "tps": 53167, "wall": 19114.4} {"step": 15507, "train_loss": 3.4890832901000977, "lr": 0.00022481766155163762, "tps": 53156, "wall": 19119.8} {"step": 15508, "train_loss": 3.280646324157715, "lr": 0.0002247985103878516, "tps": 53144, "wall": 19125.1} {"step": 15509, "train_loss": 3.309931516647339, "lr": 0.00022477935916970782, "tps": 53133, "wall": 19130.5} {"step": 15510, "train_loss": 3.2932791709899902, "lr": 0.00022476020789742322, "tps": 53121, "wall": 19135.9} {"step": 15511, "train_loss": 3.2652924060821533, "lr": 0.00022474105657121474, "tps": 53110, "wall": 19141.2} {"step": 15512, "train_loss": 3.289001941680908, "lr": 0.0002247219051912993, "tps": 53098, "wall": 19146.6} {"step": 15513, "train_loss": 3.3712658882141113, "lr": 0.0002247027537578938, "tps": 53087, "wall": 19152.0} {"step": 15514, "train_loss": 3.3930916786193848, "lr": 0.0002246836022712153, "tps": 53075, "wall": 19157.4} {"step": 15515, "train_loss": 3.336716890335083, "lr": 0.00022466445073148075, "tps": 53064, "wall": 19162.8} {"step": 15516, "train_loss": 3.37595796585083, "lr": 0.00022464529913890697, "tps": 53052, "wall": 19168.1} {"step": 15517, "train_loss": 3.281405210494995, "lr": 0.00022462614749371102, "tps": 53040, "wall": 19173.6} {"step": 15518, "train_loss": 3.398526430130005, "lr": 0.00022460699579610985, "tps": 53029, "wall": 19179.0} {"step": 15519, "train_loss": 3.407576322555542, "lr": 0.00022458784404632033, "tps": 53018, "wall": 19184.3} {"step": 15520, "train_loss": 3.3267762660980225, "lr": 0.00022456869224455944, "tps": 53006, "wall": 19189.8} {"step": 15521, "train_loss": 3.367689371109009, "lr": 0.00022454954039104424, "tps": 52995, "wall": 19195.1} {"step": 15522, "train_loss": 3.3580164909362793, "lr": 0.0002245303884859916, "tps": 52983, "wall": 19200.5} {"step": 15523, "train_loss": 3.392754554748535, "lr": 0.0002245112365296184, "tps": 52972, "wall": 19205.8} {"step": 15524, "train_loss": 3.439492702484131, "lr": 0.0002244920845221417, "tps": 52961, "wall": 19211.2} {"step": 15525, "train_loss": 3.357692241668701, "lr": 0.00022447293246377842, "tps": 52949, "wall": 19216.6} {"step": 15526, "train_loss": 3.355971336364746, "lr": 0.00022445378035474556, "tps": 52938, "wall": 19222.0} {"step": 15527, "train_loss": 3.329484224319458, "lr": 0.00022443462819526002, "tps": 52926, "wall": 19227.3} {"step": 15528, "train_loss": 3.504422187805176, "lr": 0.00022441547598553877, "tps": 52915, "wall": 19232.8} {"step": 15529, "train_loss": 3.4018707275390625, "lr": 0.00022439632372579872, "tps": 52904, "wall": 19238.1} {"step": 15530, "train_loss": 3.3516030311584473, "lr": 0.0002243771714162569, "tps": 52892, "wall": 19243.4} {"step": 15531, "train_loss": 3.264179229736328, "lr": 0.0002243580190571303, "tps": 52881, "wall": 19248.7} {"step": 15532, "train_loss": 3.4137792587280273, "lr": 0.00022433886664863578, "tps": 52870, "wall": 19254.1} {"step": 15533, "train_loss": 3.2752017974853516, "lr": 0.00022431971419099034, "tps": 52859, "wall": 19259.5} {"step": 15534, "train_loss": 3.3111417293548584, "lr": 0.00022430056168441093, "tps": 52847, "wall": 19264.8} {"step": 15535, "train_loss": 3.2570700645446777, "lr": 0.00022428140912911454, "tps": 52836, "wall": 19270.2} {"step": 15536, "train_loss": 3.3356144428253174, "lr": 0.0002242622565253181, "tps": 52825, "wall": 19275.6} {"step": 15537, "train_loss": 3.4069528579711914, "lr": 0.00022424310387323862, "tps": 52813, "wall": 19281.0} {"step": 15538, "train_loss": 3.4286608695983887, "lr": 0.00022422395117309302, "tps": 52802, "wall": 19286.3} {"step": 15539, "train_loss": 3.397296905517578, "lr": 0.0002242047984250983, "tps": 52790, "wall": 19291.8} {"step": 15540, "train_loss": 3.4888577461242676, "lr": 0.00022418564562947136, "tps": 52779, "wall": 19297.1} {"step": 15541, "train_loss": 3.458160877227783, "lr": 0.00022416649278642924, "tps": 52768, "wall": 19302.5} {"step": 15542, "train_loss": 3.3675413131713867, "lr": 0.0002241473398961888, "tps": 52756, "wall": 19308.0} {"step": 15543, "train_loss": 3.3779447078704834, "lr": 0.00022412818695896709, "tps": 52745, "wall": 19313.3} {"step": 15544, "train_loss": 3.3382363319396973, "lr": 0.0002241090339749811, "tps": 52734, "wall": 19318.6} {"step": 15545, "train_loss": 3.3161773681640625, "lr": 0.0002240898809444477, "tps": 52723, "wall": 19324.0} {"step": 15546, "train_loss": 3.3259661197662354, "lr": 0.0002240707278675839, "tps": 52711, "wall": 19329.4} {"step": 15547, "train_loss": 3.358567714691162, "lr": 0.00022405157474460668, "tps": 52700, "wall": 19334.7} {"step": 15548, "train_loss": 3.1866509914398193, "lr": 0.0002240324215757331, "tps": 52689, "wall": 19340.1} {"step": 15549, "train_loss": 3.3674874305725098, "lr": 0.00022401326836117994, "tps": 52677, "wall": 19345.6} {"step": 15550, "train_loss": 3.217620372772217, "lr": 0.00022399411510116423, "tps": 52666, "wall": 19351.0} {"step": 15551, "train_loss": 3.454195499420166, "lr": 0.00022397496179590306, "tps": 52655, "wall": 19356.3} {"step": 15552, "train_loss": 3.36653470993042, "lr": 0.00022395580844561326, "tps": 52644, "wall": 19361.7} {"step": 15553, "train_loss": 3.344270706176758, "lr": 0.0002239366550505118, "tps": 52633, "wall": 19367.0} {"step": 15554, "train_loss": 3.370150327682495, "lr": 0.00022391750161081575, "tps": 52621, "wall": 19372.4} {"step": 15555, "train_loss": 3.3965744972229004, "lr": 0.00022389834812674205, "tps": 52610, "wall": 19377.7} {"step": 15556, "train_loss": 3.321958303451538, "lr": 0.00022387919459850763, "tps": 52599, "wall": 19383.1} {"step": 15557, "train_loss": 3.342940092086792, "lr": 0.0002238600410263294, "tps": 52588, "wall": 19388.4} {"step": 15558, "train_loss": 3.3314459323883057, "lr": 0.00022384088741042457, "tps": 52577, "wall": 19393.8} {"step": 15559, "train_loss": 3.384441614151001, "lr": 0.00022382173375100987, "tps": 52566, "wall": 19399.1} {"step": 15560, "train_loss": 3.3555257320404053, "lr": 0.00022380258004830235, "tps": 52555, "wall": 19404.4} {"step": 15561, "train_loss": 3.4307479858398438, "lr": 0.000223783426302519, "tps": 52543, "wall": 19409.9} {"step": 15562, "train_loss": 3.380148410797119, "lr": 0.00022376427251387683, "tps": 52532, "wall": 19415.2} {"step": 15563, "train_loss": 3.383049249649048, "lr": 0.00022374511868259277, "tps": 52521, "wall": 19420.6} {"step": 15564, "train_loss": 3.3985893726348877, "lr": 0.00022372596480888378, "tps": 52510, "wall": 19425.9} {"step": 15565, "train_loss": 3.300565481185913, "lr": 0.00022370681089296693, "tps": 52499, "wall": 19431.4} {"step": 15566, "train_loss": 3.4008431434631348, "lr": 0.00022368765693505903, "tps": 52488, "wall": 19436.7} {"step": 15567, "train_loss": 3.3288023471832275, "lr": 0.0002236685029353772, "tps": 52477, "wall": 19442.0} {"step": 15568, "train_loss": 3.3018531799316406, "lr": 0.00022364934889413838, "tps": 52466, "wall": 19447.4} {"step": 15569, "train_loss": 3.4591619968414307, "lr": 0.00022363019481155951, "tps": 52455, "wall": 19452.8} {"step": 15570, "train_loss": 3.2986574172973633, "lr": 0.00022361104068785762, "tps": 52443, "wall": 19458.1} {"step": 15571, "train_loss": 3.3283863067626953, "lr": 0.00022359188652324962, "tps": 52432, "wall": 19463.5} {"step": 15572, "train_loss": 3.3622934818267822, "lr": 0.00022357273231795262, "tps": 52421, "wall": 19468.9} {"step": 15573, "train_loss": 3.3204832077026367, "lr": 0.00022355357807218344, "tps": 52410, "wall": 19474.3} {"step": 15574, "train_loss": 3.2722697257995605, "lr": 0.00022353442378615914, "tps": 52399, "wall": 19479.6} {"step": 15575, "train_loss": 3.4588828086853027, "lr": 0.00022351526946009674, "tps": 52388, "wall": 19484.9} {"step": 15576, "train_loss": 3.3272485733032227, "lr": 0.00022349611509421316, "tps": 52377, "wall": 19490.3} {"step": 15577, "train_loss": 3.2839808464050293, "lr": 0.0002234769606887254, "tps": 52366, "wall": 19495.7} {"step": 15578, "train_loss": 3.310465097427368, "lr": 0.00022345780624385042, "tps": 52355, "wall": 19501.1} {"step": 15579, "train_loss": 3.4294960498809814, "lr": 0.00022343865175980524, "tps": 52344, "wall": 19506.4} {"step": 15580, "train_loss": 3.2620749473571777, "lr": 0.0002234194972368068, "tps": 52333, "wall": 19511.8} {"step": 15581, "train_loss": 3.3328909873962402, "lr": 0.00022340034267507214, "tps": 52322, "wall": 19517.1} {"step": 15582, "train_loss": 3.345871925354004, "lr": 0.00022338118807481823, "tps": 52311, "wall": 19522.5} {"step": 15583, "train_loss": 3.255887269973755, "lr": 0.000223362033436262, "tps": 52300, "wall": 19527.8} {"step": 15584, "train_loss": 3.366170644760132, "lr": 0.00022334287875962048, "tps": 52289, "wall": 19533.3} {"step": 15585, "train_loss": 3.3263981342315674, "lr": 0.0002233237240451107, "tps": 52278, "wall": 19538.6} {"step": 15586, "train_loss": 3.3065271377563477, "lr": 0.00022330456929294955, "tps": 52267, "wall": 19544.0} {"step": 15587, "train_loss": 3.3650600910186768, "lr": 0.00022328541450335405, "tps": 52256, "wall": 19549.3} {"step": 15588, "train_loss": 3.31518292427063, "lr": 0.0002232662596765412, "tps": 52245, "wall": 19554.7} {"step": 15589, "train_loss": 3.418138027191162, "lr": 0.00022324710481272798, "tps": 52234, "wall": 19560.0} {"step": 15590, "train_loss": 3.287195920944214, "lr": 0.00022322794991213143, "tps": 52223, "wall": 19565.4} {"step": 15591, "train_loss": 3.3589162826538086, "lr": 0.00022320879497496842, "tps": 52212, "wall": 19570.7} {"step": 15592, "train_loss": 3.423398017883301, "lr": 0.00022318964000145607, "tps": 52201, "wall": 19576.1} {"step": 15593, "train_loss": 3.3495054244995117, "lr": 0.00022317048499181124, "tps": 52190, "wall": 19581.4} {"step": 15594, "train_loss": 3.409904956817627, "lr": 0.00022315132994625106, "tps": 52179, "wall": 19586.8} {"step": 15595, "train_loss": 3.363673686981201, "lr": 0.00022313217486499235, "tps": 52168, "wall": 19592.2} {"step": 15596, "train_loss": 3.3481431007385254, "lr": 0.0002231130197482523, "tps": 52157, "wall": 19597.6} {"step": 15597, "train_loss": 3.3870534896850586, "lr": 0.00022309386459624776, "tps": 52146, "wall": 19603.0} {"step": 15598, "train_loss": 3.3544178009033203, "lr": 0.00022307470940919567, "tps": 52135, "wall": 19608.4} {"step": 15599, "train_loss": 3.363393545150757, "lr": 0.00022305555418731325, "tps": 52124, "wall": 19613.7} {"step": 15600, "train_loss": 3.2736361026763916, "lr": 0.0002230363989308172, "tps": 52113, "wall": 19619.1} {"step": 15601, "train_loss": 3.4228734970092773, "lr": 0.00022301724363992475, "tps": 52103, "wall": 19624.4} {"step": 15602, "train_loss": 3.3688669204711914, "lr": 0.0002229980883148528, "tps": 52092, "wall": 19629.8} {"step": 15603, "train_loss": 3.301030158996582, "lr": 0.0002229789329558183, "tps": 52081, "wall": 19635.2} {"step": 15604, "train_loss": 3.393411636352539, "lr": 0.00022295977756303832, "tps": 52070, "wall": 19640.6} {"step": 15605, "train_loss": 3.2909274101257324, "lr": 0.0002229406221367298, "tps": 52059, "wall": 19646.0} {"step": 15606, "train_loss": 3.3533313274383545, "lr": 0.00022292146667710977, "tps": 52048, "wall": 19651.4} {"step": 15607, "train_loss": 3.257828712463379, "lr": 0.00022290231118439523, "tps": 52037, "wall": 19656.8} {"step": 15608, "train_loss": 3.4389500617980957, "lr": 0.0002228831556588031, "tps": 52026, "wall": 19662.2} {"step": 15609, "train_loss": 3.3203563690185547, "lr": 0.00022286400010055045, "tps": 52015, "wall": 19667.5} {"step": 15610, "train_loss": 3.4469223022460938, "lr": 0.00022284484450985423, "tps": 52004, "wall": 19672.9} {"step": 15611, "train_loss": 3.3499484062194824, "lr": 0.00022282568888693148, "tps": 51993, "wall": 19678.3} {"step": 15612, "train_loss": 3.388930559158325, "lr": 0.0002228065332319992, "tps": 51982, "wall": 19683.7} {"step": 15613, "train_loss": 3.3614425659179688, "lr": 0.00022278737754527427, "tps": 51972, "wall": 19689.0} {"step": 15614, "train_loss": 3.330476760864258, "lr": 0.00022276822182697384, "tps": 51961, "wall": 19694.4} {"step": 15615, "train_loss": 3.3415284156799316, "lr": 0.00022274906607731488, "tps": 51950, "wall": 19699.8} {"step": 15616, "train_loss": 3.4079103469848633, "lr": 0.00022272991029651432, "tps": 51939, "wall": 19705.1} {"step": 15617, "train_loss": 3.355363130569458, "lr": 0.00022271075448478914, "tps": 51928, "wall": 19710.6} {"step": 15618, "train_loss": 3.328125, "lr": 0.00022269159864235643, "tps": 51917, "wall": 19715.9} {"step": 15619, "train_loss": 3.4128408432006836, "lr": 0.00022267244276943316, "tps": 51907, "wall": 19721.3} {"step": 15620, "train_loss": 3.4374241828918457, "lr": 0.0002226532868662363, "tps": 51896, "wall": 19726.6} {"step": 15621, "train_loss": 3.2001123428344727, "lr": 0.0002226341309329828, "tps": 51885, "wall": 19732.0} {"step": 15622, "train_loss": 3.342526435852051, "lr": 0.0002226149749698898, "tps": 51874, "wall": 19737.4} {"step": 15623, "train_loss": 3.2705764770507812, "lr": 0.00022259581897717424, "tps": 51863, "wall": 19742.7} {"step": 15624, "train_loss": 3.439664840698242, "lr": 0.00022257666295505307, "tps": 51853, "wall": 19748.1} {"step": 15625, "train_loss": 3.348013401031494, "lr": 0.00022255750690374328, "tps": 51842, "wall": 19753.6} {"step": 15626, "train_loss": 3.357579469680786, "lr": 0.00022253835082346196, "tps": 51831, "wall": 19758.9} {"step": 15627, "train_loss": 3.38248610496521, "lr": 0.00022251919471442605, "tps": 51820, "wall": 19764.3} {"step": 15628, "train_loss": 3.4069337844848633, "lr": 0.00022250003857685258, "tps": 51809, "wall": 19769.7} {"step": 15629, "train_loss": 3.3411736488342285, "lr": 0.00022248088241095854, "tps": 51798, "wall": 19775.1} {"step": 15630, "train_loss": 3.295872211456299, "lr": 0.0002224617262169609, "tps": 51787, "wall": 19780.6} {"step": 15631, "train_loss": 3.3776793479919434, "lr": 0.00022244256999507674, "tps": 51777, "wall": 19785.9} {"step": 15632, "train_loss": 3.318108558654785, "lr": 0.000222423413745523, "tps": 51766, "wall": 19791.3} {"step": 15633, "train_loss": 3.2507786750793457, "lr": 0.0002224042574685167, "tps": 51755, "wall": 19796.7} {"step": 15634, "train_loss": 3.300149917602539, "lr": 0.0002223851011642748, "tps": 51744, "wall": 19802.1} {"step": 15635, "train_loss": 3.3675036430358887, "lr": 0.00022236594483301437, "tps": 51734, "wall": 19807.4} {"step": 15636, "train_loss": 3.2946109771728516, "lr": 0.00022234678847495238, "tps": 51723, "wall": 19812.9} {"step": 15637, "train_loss": 3.3045389652252197, "lr": 0.00022232763209030588, "tps": 51712, "wall": 19818.3} {"step": 15638, "train_loss": 3.297786235809326, "lr": 0.00022230847567929177, "tps": 51701, "wall": 19823.7} {"step": 15639, "train_loss": 3.3655166625976562, "lr": 0.00022228931924212714, "tps": 51691, "wall": 19829.0} {"step": 15640, "train_loss": 3.406458616256714, "lr": 0.00022227016277902908, "tps": 51680, "wall": 19834.5} {"step": 15641, "train_loss": 3.359558582305908, "lr": 0.00022225100629021439, "tps": 51669, "wall": 19839.9} {"step": 15642, "train_loss": 3.3771042823791504, "lr": 0.00022223184977590018, "tps": 51658, "wall": 19845.3} {"step": 15643, "train_loss": 3.4242746829986572, "lr": 0.00022221269323630346, "tps": 51648, "wall": 19850.6} {"step": 15644, "train_loss": 3.3355233669281006, "lr": 0.00022219353667164127, "tps": 51637, "wall": 19856.0} {"step": 15645, "train_loss": 3.380147933959961, "lr": 0.00022217438008213054, "tps": 51626, "wall": 19861.4} {"step": 15646, "train_loss": 3.461638927459717, "lr": 0.00022215522346798837, "tps": 51615, "wall": 19866.8} {"step": 15647, "train_loss": 3.3744287490844727, "lr": 0.00022213606682943167, "tps": 51605, "wall": 19872.1} {"step": 15648, "train_loss": 3.4143412113189697, "lr": 0.00022211691016667747, "tps": 51594, "wall": 19877.5} {"step": 15649, "train_loss": 3.3782474994659424, "lr": 0.00022209775347994278, "tps": 51583, "wall": 19882.9} {"step": 15650, "train_loss": 3.4826886653900146, "lr": 0.00022207859676944477, "tps": 51573, "wall": 19888.3} {"step": 15651, "train_loss": 3.3943047523498535, "lr": 0.00022205944003540014, "tps": 51562, "wall": 19893.8} {"step": 15652, "train_loss": 3.438239812850952, "lr": 0.00022204028327802613, "tps": 51551, "wall": 19899.2} {"step": 15653, "train_loss": 3.4119925498962402, "lr": 0.00022202112649753964, "tps": 51540, "wall": 19904.6} {"step": 15654, "train_loss": 3.305896759033203, "lr": 0.0002220019696941578, "tps": 51530, "wall": 19910.1} {"step": 15655, "train_loss": 3.468783140182495, "lr": 0.00022198281286809745, "tps": 51519, "wall": 19915.4} {"step": 15656, "train_loss": 3.3630318641662598, "lr": 0.0002219636560195757, "tps": 51508, "wall": 19920.8} {"step": 15657, "train_loss": 3.324779987335205, "lr": 0.0002219444991488096, "tps": 51498, "wall": 19926.2} {"step": 15658, "train_loss": 3.307168960571289, "lr": 0.00022192534225601608, "tps": 51487, "wall": 19931.6} {"step": 15659, "train_loss": 3.381807327270508, "lr": 0.00022190618534141215, "tps": 51476, "wall": 19937.0} {"step": 15660, "train_loss": 3.309048891067505, "lr": 0.000221887028405215, "tps": 51466, "wall": 19942.4} {"step": 15661, "train_loss": 3.3240084648132324, "lr": 0.00022186787144764128, "tps": 51455, "wall": 19947.8} {"step": 15662, "train_loss": 3.3084957599639893, "lr": 0.00022184871446890832, "tps": 51444, "wall": 19953.3} {"step": 15663, "train_loss": 3.255178451538086, "lr": 0.000221829557469233, "tps": 51434, "wall": 19958.7} {"step": 15664, "train_loss": 3.367504119873047, "lr": 0.0002218104004488324, "tps": 51423, "wall": 19964.1} {"step": 15665, "train_loss": 3.386680841445923, "lr": 0.00022179124340792342, "tps": 51412, "wall": 19969.5} {"step": 15666, "train_loss": 3.492629289627075, "lr": 0.00022177208634672316, "tps": 51402, "wall": 19974.9} {"step": 15667, "train_loss": 3.2449588775634766, "lr": 0.00022175292926544863, "tps": 51391, "wall": 19980.3} {"step": 15668, "train_loss": 3.287243604660034, "lr": 0.00022173377216431678, "tps": 51380, "wall": 19985.7} {"step": 15669, "train_loss": 3.3826351165771484, "lr": 0.00022171461504354468, "tps": 51370, "wall": 19991.1} {"step": 15670, "train_loss": 3.455357789993286, "lr": 0.00022169545790334932, "tps": 51359, "wall": 19996.5} {"step": 15671, "train_loss": 3.378154754638672, "lr": 0.00022167630074394778, "tps": 51349, "wall": 20001.9} {"step": 15672, "train_loss": 3.3048806190490723, "lr": 0.00022165714356555695, "tps": 51338, "wall": 20007.4} {"step": 15673, "train_loss": 3.34665584564209, "lr": 0.00022163798636839395, "tps": 51327, "wall": 20012.9} {"step": 15674, "train_loss": 3.363473415374756, "lr": 0.00022161882915267578, "tps": 51316, "wall": 20018.3} {"step": 15675, "train_loss": 3.3159003257751465, "lr": 0.00022159967191861935, "tps": 51306, "wall": 20023.7} {"step": 15676, "train_loss": 3.367642402648926, "lr": 0.00022158051466644176, "tps": 51295, "wall": 20029.1} {"step": 15677, "train_loss": 3.487208127975464, "lr": 0.00022156135739636007, "tps": 51285, "wall": 20034.5} {"step": 15678, "train_loss": 3.368309736251831, "lr": 0.00022154220010859116, "tps": 51274, "wall": 20039.8} {"step": 15679, "train_loss": 3.3861732482910156, "lr": 0.00022152304280335217, "tps": 51264, "wall": 20045.2} {"step": 15680, "train_loss": 3.3326215744018555, "lr": 0.0002215038854808601, "tps": 51253, "wall": 20050.6} {"step": 15681, "train_loss": 3.309891700744629, "lr": 0.00022148472814133188, "tps": 51243, "wall": 20056.0} {"step": 15682, "train_loss": 3.387052536010742, "lr": 0.0002214655707849846, "tps": 51232, "wall": 20061.4} {"step": 15683, "train_loss": 3.300412654876709, "lr": 0.00022144641341203527, "tps": 51222, "wall": 20066.7} {"step": 15684, "train_loss": 3.312260866165161, "lr": 0.0002214272560227009, "tps": 51211, "wall": 20072.2} {"step": 15685, "train_loss": 3.27632474899292, "lr": 0.00022140809861719848, "tps": 51201, "wall": 20077.7} {"step": 15686, "train_loss": 3.326200246810913, "lr": 0.00022138894119574495, "tps": 51190, "wall": 20083.1} {"step": 15687, "train_loss": 3.28190279006958, "lr": 0.00022136978375855755, "tps": 51180, "wall": 20088.5} {"step": 15688, "train_loss": 3.274601459503174, "lr": 0.0002213506263058531, "tps": 51169, "wall": 20093.8} {"step": 15689, "train_loss": 3.2979683876037598, "lr": 0.0002213314688378487, "tps": 51159, "wall": 20099.2} {"step": 15690, "train_loss": 3.4605507850646973, "lr": 0.00022131231135476135, "tps": 51148, "wall": 20104.6} {"step": 15691, "train_loss": 3.3560104370117188, "lr": 0.0002212931538568081, "tps": 51138, "wall": 20110.0} {"step": 15692, "train_loss": 3.3964431285858154, "lr": 0.00022127399634420592, "tps": 51127, "wall": 20115.4} {"step": 15693, "train_loss": 3.340479850769043, "lr": 0.00022125483881717175, "tps": 51117, "wall": 20120.8} {"step": 15694, "train_loss": 3.3803634643554688, "lr": 0.00022123568127592282, "tps": 51107, "wall": 20126.2} {"step": 15695, "train_loss": 3.2756752967834473, "lr": 0.00022121652372067598, "tps": 51096, "wall": 20131.6} {"step": 15696, "train_loss": 3.279550552368164, "lr": 0.00022119736615164824, "tps": 51085, "wall": 20137.1} {"step": 15697, "train_loss": 3.304760456085205, "lr": 0.0002211782085690567, "tps": 51075, "wall": 20142.5} {"step": 15698, "train_loss": 3.3592350482940674, "lr": 0.00022115905097311843, "tps": 51064, "wall": 20147.9} {"step": 15699, "train_loss": 3.440302848815918, "lr": 0.00022113989336405032, "tps": 51054, "wall": 20153.3} {"step": 15700, "train_loss": 3.3638205528259277, "lr": 0.0002211207357420694, "tps": 51044, "wall": 20158.7} {"step": 15701, "train_loss": 3.4009783267974854, "lr": 0.00022110157810739276, "tps": 51033, "wall": 20164.0} {"step": 15702, "train_loss": 3.2758097648620605, "lr": 0.00022108242046023734, "tps": 51023, "wall": 20169.4} {"step": 15703, "train_loss": 3.448213577270508, "lr": 0.0002210632628008202, "tps": 51013, "wall": 20174.8} {"step": 15704, "train_loss": 3.357616424560547, "lr": 0.00022104410512935845, "tps": 51002, "wall": 20180.2} {"step": 15705, "train_loss": 3.2194125652313232, "lr": 0.00022102494744606898, "tps": 50992, "wall": 20185.6} {"step": 15706, "train_loss": 3.296605110168457, "lr": 0.00022100578975116876, "tps": 50981, "wall": 20191.1} {"step": 15707, "train_loss": 3.3308305740356445, "lr": 0.00022098663204487502, "tps": 50971, "wall": 20196.5} {"step": 15708, "train_loss": 3.3681366443634033, "lr": 0.0002209674743274046, "tps": 50960, "wall": 20201.9} {"step": 15709, "train_loss": 3.268303394317627, "lr": 0.00022094831659897458, "tps": 50950, "wall": 20207.4} {"step": 15710, "train_loss": 3.4381275177001953, "lr": 0.00022092915885980202, "tps": 50939, "wall": 20212.8} {"step": 15711, "train_loss": 3.249008893966675, "lr": 0.00022091000111010387, "tps": 50929, "wall": 20218.2} {"step": 15712, "train_loss": 3.282604217529297, "lr": 0.00022089084335009718, "tps": 50917, "wall": 20224.2} {"step": 15713, "train_loss": 3.3255157470703125, "lr": 0.00022087168557999895, "tps": 50905, "wall": 20230.1} {"step": 15714, "train_loss": 3.2908401489257812, "lr": 0.00022085252780002624, "tps": 50895, "wall": 20235.5} {"step": 15715, "train_loss": 3.3305952548980713, "lr": 0.00022083337001039603, "tps": 50885, "wall": 20240.9} {"step": 15716, "train_loss": 3.312417507171631, "lr": 0.0002208142122113254, "tps": 50875, "wall": 20246.3} {"step": 15717, "train_loss": 3.405989646911621, "lr": 0.00022079505440303132, "tps": 50864, "wall": 20251.7} {"step": 15718, "train_loss": 3.3908181190490723, "lr": 0.00022077589658573077, "tps": 50854, "wall": 20257.1} {"step": 15719, "train_loss": 3.309760570526123, "lr": 0.0002207567387596409, "tps": 50844, "wall": 20262.5} {"step": 15720, "train_loss": 3.341770887374878, "lr": 0.00022073758092497857, "tps": 50833, "wall": 20267.9} {"step": 15721, "train_loss": 3.3986682891845703, "lr": 0.00022071842308196091, "tps": 50823, "wall": 20273.3} {"step": 15722, "train_loss": 3.4134788513183594, "lr": 0.00022069926523080497, "tps": 50813, "wall": 20278.7} {"step": 15723, "train_loss": 3.444561719894409, "lr": 0.00022068010737172767, "tps": 50802, "wall": 20284.1} {"step": 15724, "train_loss": 3.4073266983032227, "lr": 0.00022066094950494604, "tps": 50792, "wall": 20289.5} {"step": 15725, "train_loss": 3.320859909057617, "lr": 0.0002206417916306772, "tps": 50782, "wall": 20294.9} {"step": 15726, "train_loss": 3.3984930515289307, "lr": 0.00022062263374913806, "tps": 50771, "wall": 20300.3} {"step": 15727, "train_loss": 3.336289644241333, "lr": 0.00022060347586054575, "tps": 50761, "wall": 20305.7} {"step": 15728, "train_loss": 3.3136544227600098, "lr": 0.00022058431796511717, "tps": 50751, "wall": 20311.2} {"step": 15729, "train_loss": 3.5083301067352295, "lr": 0.00022056516006306942, "tps": 50740, "wall": 20316.6} {"step": 15730, "train_loss": 3.358590602874756, "lr": 0.0002205460021546195, "tps": 50730, "wall": 20322.0} {"step": 15731, "train_loss": 3.4859421253204346, "lr": 0.00022052684423998448, "tps": 50720, "wall": 20327.4} {"step": 15732, "train_loss": 3.491420030593872, "lr": 0.00022050768631938134, "tps": 50709, "wall": 20332.9} {"step": 15733, "train_loss": 3.3661327362060547, "lr": 0.00022048852839302705, "tps": 50699, "wall": 20338.3} {"step": 15734, "train_loss": 3.26939058303833, "lr": 0.00022046937046113873, "tps": 50689, "wall": 20343.7} {"step": 15735, "train_loss": 3.421891689300537, "lr": 0.0002204502125239334, "tps": 50679, "wall": 20349.1} {"step": 15736, "train_loss": 3.3135321140289307, "lr": 0.00022043105458162794, "tps": 50668, "wall": 20354.5} {"step": 15737, "train_loss": 3.269514799118042, "lr": 0.00022041189663443952, "tps": 50658, "wall": 20359.9} {"step": 15738, "train_loss": 3.3696517944335938, "lr": 0.00022039273868258504, "tps": 50648, "wall": 20365.3} {"step": 15739, "train_loss": 3.333408832550049, "lr": 0.00022037358072628168, "tps": 50637, "wall": 20370.8} {"step": 15740, "train_loss": 3.324338674545288, "lr": 0.00022035442276574637, "tps": 50627, "wall": 20376.2} {"step": 15741, "train_loss": 3.310976505279541, "lr": 0.00022033526480119608, "tps": 50617, "wall": 20381.6} {"step": 15742, "train_loss": 3.383284568786621, "lr": 0.00022031610683284796, "tps": 50607, "wall": 20387.0} {"step": 15743, "train_loss": 3.3805482387542725, "lr": 0.00022029694886091896, "tps": 50597, "wall": 20392.5} {"step": 15744, "train_loss": 3.357182025909424, "lr": 0.00022027779088562607, "tps": 50586, "wall": 20397.9} {"step": 15745, "train_loss": 3.3271865844726562, "lr": 0.00022025863290718633, "tps": 50576, "wall": 20403.2} {"step": 15746, "train_loss": 3.317200183868408, "lr": 0.00022023947492581686, "tps": 50566, "wall": 20408.6} {"step": 15747, "train_loss": 3.4826340675354004, "lr": 0.00022022031694173455, "tps": 50556, "wall": 20414.0} {"step": 15748, "train_loss": 3.268939256668091, "lr": 0.00022020115895515647, "tps": 50546, "wall": 20419.4} {"step": 15749, "train_loss": 3.309382438659668, "lr": 0.00022018200096629974, "tps": 50536, "wall": 20424.8} {"step": 15750, "train_loss": 3.315122127532959, "lr": 0.00022016284297538116, "tps": 50525, "wall": 20430.3} {"step": 15751, "train_loss": 3.4020800590515137, "lr": 0.000220143684982618, "tps": 50515, "wall": 20435.7} {"step": 15752, "train_loss": 3.391416549682617, "lr": 0.00022012452698822715, "tps": 50505, "wall": 20441.1} {"step": 15753, "train_loss": 3.2477645874023438, "lr": 0.00022010536899242554, "tps": 50495, "wall": 20446.5} {"step": 15754, "train_loss": 3.3675665855407715, "lr": 0.0002200862109954304, "tps": 50485, "wall": 20451.9} {"step": 15755, "train_loss": 3.3556177616119385, "lr": 0.00022006705299745861, "tps": 50474, "wall": 20457.4} {"step": 15756, "train_loss": 3.3011646270751953, "lr": 0.00022004789499872733, "tps": 50464, "wall": 20462.8} {"step": 15757, "train_loss": 3.351285457611084, "lr": 0.00022002873699945342, "tps": 50454, "wall": 20468.2} {"step": 15758, "train_loss": 3.325279712677002, "lr": 0.00022000957899985396, "tps": 50444, "wall": 20473.6} {"step": 15759, "train_loss": 3.345000982284546, "lr": 0.00021999042100014608, "tps": 50434, "wall": 20479.1} {"step": 15760, "train_loss": 3.325265884399414, "lr": 0.00021997126300054665, "tps": 50424, "wall": 20484.5} {"step": 15761, "train_loss": 3.3061814308166504, "lr": 0.00021995210500127277, "tps": 50413, "wall": 20490.1} {"step": 15762, "train_loss": 3.2881808280944824, "lr": 0.00021993294700254143, "tps": 50403, "wall": 20495.5} {"step": 15763, "train_loss": 3.2618348598480225, "lr": 0.00021991378900456968, "tps": 50393, "wall": 20500.9} {"step": 15764, "train_loss": 3.3489532470703125, "lr": 0.0002198946310075745, "tps": 50383, "wall": 20506.4} {"step": 15765, "train_loss": 3.3790042400360107, "lr": 0.000219875473011773, "tps": 50372, "wall": 20511.8} {"step": 15766, "train_loss": 3.240756034851074, "lr": 0.00021985631501738215, "tps": 50362, "wall": 20517.2} {"step": 15767, "train_loss": 3.289234161376953, "lr": 0.00021983715702461894, "tps": 50352, "wall": 20522.7} {"step": 15768, "train_loss": 3.4733715057373047, "lr": 0.00021981799903370038, "tps": 50342, "wall": 20528.1} {"step": 15769, "train_loss": 3.3329660892486572, "lr": 0.00021979884104484355, "tps": 50332, "wall": 20533.5} {"step": 15770, "train_loss": 3.3554787635803223, "lr": 0.00021977968305826555, "tps": 50322, "wall": 20539.0} {"step": 15771, "train_loss": 3.3112974166870117, "lr": 0.00021976052507418327, "tps": 50312, "wall": 20544.5} {"step": 15772, "train_loss": 3.210916042327881, "lr": 0.00021974136709281372, "tps": 50301, "wall": 20550.0} {"step": 15773, "train_loss": 3.3228321075439453, "lr": 0.00021972220911437403, "tps": 50291, "wall": 20555.5} {"step": 15774, "train_loss": 3.3328585624694824, "lr": 0.00021970305113908114, "tps": 50281, "wall": 20560.9} {"step": 15775, "train_loss": 3.3034749031066895, "lr": 0.0002196838931671521, "tps": 50271, "wall": 20566.4} {"step": 15776, "train_loss": 3.416688919067383, "lr": 0.00021966473519880394, "tps": 50260, "wall": 20572.0} {"step": 15777, "train_loss": 3.371737480163574, "lr": 0.00021964557723425375, "tps": 50250, "wall": 20577.5} {"step": 15778, "train_loss": 3.361629009246826, "lr": 0.0002196264192737184, "tps": 50240, "wall": 20582.9} {"step": 15779, "train_loss": 3.4290285110473633, "lr": 0.00021960726131741503, "tps": 50230, "wall": 20588.4} {"step": 15780, "train_loss": 3.33323073387146, "lr": 0.0002195881033655606, "tps": 50219, "wall": 20594.0} {"step": 15781, "train_loss": 3.2879884243011475, "lr": 0.00021956894541837215, "tps": 50209, "wall": 20599.5} {"step": 15782, "train_loss": 3.358732223510742, "lr": 0.0002195497874760667, "tps": 50199, "wall": 20605.0} {"step": 15783, "train_loss": 3.3826072216033936, "lr": 0.00021953062953886137, "tps": 50188, "wall": 20610.7} {"step": 15784, "train_loss": 3.253647565841675, "lr": 0.00021951147160697302, "tps": 50178, "wall": 20616.2} {"step": 15785, "train_loss": 3.381977081298828, "lr": 0.00021949231368061876, "tps": 50168, "wall": 20621.7} {"step": 15786, "train_loss": 3.248729705810547, "lr": 0.00021947315576001554, "tps": 50157, "wall": 20627.3} {"step": 15787, "train_loss": 3.333117961883545, "lr": 0.00021945399784538053, "tps": 50147, "wall": 20632.8} {"step": 15788, "train_loss": 3.4371590614318848, "lr": 0.00021943483993693065, "tps": 50137, "wall": 20638.3} {"step": 15789, "train_loss": 3.3825080394744873, "lr": 0.0002194156820348829, "tps": 50126, "wall": 20643.9} {"step": 15790, "train_loss": 3.3516793251037598, "lr": 0.0002193965241394544, "tps": 50116, "wall": 20649.5} {"step": 15791, "train_loss": 3.28074049949646, "lr": 0.00021937736625086203, "tps": 50106, "wall": 20655.0} {"step": 15792, "train_loss": 3.287734031677246, "lr": 0.0002193582083693229, "tps": 50096, "wall": 20660.5} {"step": 15793, "train_loss": 3.3406615257263184, "lr": 0.00021933905049505406, "tps": 50085, "wall": 20666.1} {"step": 15794, "train_loss": 3.4162099361419678, "lr": 0.00021931989262827245, "tps": 50075, "wall": 20671.7} {"step": 15795, "train_loss": 3.409902811050415, "lr": 0.00021930073476919516, "tps": 50064, "wall": 20677.3} {"step": 15796, "train_loss": 3.287952423095703, "lr": 0.00021928157691803916, "tps": 50054, "wall": 20682.8} {"step": 15797, "train_loss": 3.290933132171631, "lr": 0.00021926241907502153, "tps": 50044, "wall": 20688.3} {"step": 15798, "train_loss": 3.2708780765533447, "lr": 0.00021924326124035922, "tps": 50034, "wall": 20693.9} {"step": 15799, "train_loss": 3.2865078449249268, "lr": 0.0002192241034142693, "tps": 50024, "wall": 20699.4} {"step": 15800, "train_loss": 3.3841893672943115, "lr": 0.00021920494559696878, "tps": 50013, "wall": 20705.0} {"step": 15801, "train_loss": 3.3590505123138428, "lr": 0.00021918578778867468, "tps": 50003, "wall": 20710.6} {"step": 15802, "train_loss": 3.326918125152588, "lr": 0.00021916662998960402, "tps": 49993, "wall": 20716.2} {"step": 15803, "train_loss": 3.3202691078186035, "lr": 0.00021914747219997383, "tps": 49982, "wall": 20721.8} {"step": 15804, "train_loss": 3.3519129753112793, "lr": 0.0002191283144200011, "tps": 49972, "wall": 20727.4} {"step": 15805, "train_loss": 3.2284114360809326, "lr": 0.00021910915664990287, "tps": 49961, "wall": 20733.1} {"step": 15806, "train_loss": 3.3226120471954346, "lr": 0.00021908999888989617, "tps": 49951, "wall": 20738.7} {"step": 15807, "train_loss": 3.2819225788116455, "lr": 0.00021907084114019805, "tps": 49941, "wall": 20744.3} {"step": 15808, "train_loss": 3.394336462020874, "lr": 0.00021905168340102544, "tps": 49930, "wall": 20749.9} {"step": 15809, "train_loss": 3.3379101753234863, "lr": 0.0002190325256725954, "tps": 49920, "wall": 20755.5} {"step": 15810, "train_loss": 3.4146223068237305, "lr": 0.00021901336795512503, "tps": 49910, "wall": 20761.0} {"step": 15811, "train_loss": 3.3553736209869385, "lr": 0.00021899421024883125, "tps": 49900, "wall": 20766.6} {"step": 15812, "train_loss": 3.3965024948120117, "lr": 0.0002189750525539311, "tps": 49889, "wall": 20772.2} {"step": 15813, "train_loss": 3.374699354171753, "lr": 0.0002189558948706416, "tps": 49879, "wall": 20777.9} {"step": 15814, "train_loss": 3.367072582244873, "lr": 0.00021893673719917983, "tps": 49869, "wall": 20783.5} {"step": 15815, "train_loss": 3.4296207427978516, "lr": 0.0002189175795397627, "tps": 49858, "wall": 20789.1} {"step": 15816, "train_loss": 3.2744574546813965, "lr": 0.0002188984218926073, "tps": 49848, "wall": 20794.8} {"step": 15817, "train_loss": 3.323181390762329, "lr": 0.0002188792642579307, "tps": 49837, "wall": 20800.5} {"step": 15818, "train_loss": 3.366708993911743, "lr": 0.00021886010663594977, "tps": 49827, "wall": 20806.1} {"step": 15819, "train_loss": 3.4548141956329346, "lr": 0.00021884094902688164, "tps": 49817, "wall": 20811.7} {"step": 15820, "train_loss": 3.353071689605713, "lr": 0.00021882179143094333, "tps": 49806, "wall": 20817.3} {"step": 15821, "train_loss": 3.4327380657196045, "lr": 0.0002188026338483518, "tps": 49796, "wall": 20823.0} {"step": 15822, "train_loss": 3.3389101028442383, "lr": 0.00021878347627932412, "tps": 49785, "wall": 20828.7} {"step": 15823, "train_loss": 3.3710172176361084, "lr": 0.00021876431872407722, "tps": 49775, "wall": 20834.3} {"step": 15824, "train_loss": 3.352450370788574, "lr": 0.00021874516118282827, "tps": 49765, "wall": 20840.0} {"step": 15825, "train_loss": 3.423243999481201, "lr": 0.00021872600365579418, "tps": 49754, "wall": 20845.6} {"step": 15826, "train_loss": 3.38919734954834, "lr": 0.00021870684614319193, "tps": 49744, "wall": 20851.4} {"step": 15827, "train_loss": 3.2600107192993164, "lr": 0.0002186876886452387, "tps": 49734, "wall": 20857.0} {"step": 15828, "train_loss": 3.4404373168945312, "lr": 0.00021866853116215133, "tps": 49723, "wall": 20862.7} {"step": 15829, "train_loss": 3.4970884323120117, "lr": 0.00021864937369414693, "tps": 49713, "wall": 20868.3} {"step": 15830, "train_loss": 3.418363094329834, "lr": 0.00021863021624144246, "tps": 49703, "wall": 20874.0} {"step": 15831, "train_loss": 3.2522315979003906, "lr": 0.00021861105880425504, "tps": 49692, "wall": 20879.7} {"step": 15832, "train_loss": 3.375225067138672, "lr": 0.0002185919013828016, "tps": 49682, "wall": 20885.4} {"step": 15833, "train_loss": 3.3770294189453125, "lr": 0.00021857274397729914, "tps": 49671, "wall": 20891.0} {"step": 15834, "train_loss": 3.3563168048858643, "lr": 0.0002185535865879648, "tps": 49661, "wall": 20896.7} {"step": 15835, "train_loss": 3.3033182621002197, "lr": 0.0002185344292150154, "tps": 49651, "wall": 20902.4} {"step": 15836, "train_loss": 3.326160430908203, "lr": 0.00021851527185866814, "tps": 49640, "wall": 20908.0} {"step": 15837, "train_loss": 3.3767383098602295, "lr": 0.00021849611451913998, "tps": 49630, "wall": 20913.8} {"step": 15838, "train_loss": 3.380735158920288, "lr": 0.00021847695719664784, "tps": 49619, "wall": 20919.5} {"step": 15839, "train_loss": 3.407787561416626, "lr": 0.00021845779989140883, "tps": 49609, "wall": 20925.2} {"step": 15840, "train_loss": 3.3616743087768555, "lr": 0.00021843864260363995, "tps": 49599, "wall": 20930.9} {"step": 15841, "train_loss": 3.33132266998291, "lr": 0.0002184194853335583, "tps": 49588, "wall": 20936.6} {"step": 15842, "train_loss": 3.4087624549865723, "lr": 0.00021840032808138072, "tps": 49578, "wall": 20942.2} {"step": 15843, "train_loss": 3.310053825378418, "lr": 0.00021838117084732427, "tps": 49568, "wall": 20947.9} {"step": 15844, "train_loss": 3.294438362121582, "lr": 0.00021836201363160612, "tps": 49557, "wall": 20953.6} {"step": 15845, "train_loss": 3.4043478965759277, "lr": 0.00021834285643444306, "tps": 49547, "wall": 20959.2} {"step": 15846, "train_loss": 3.3676397800445557, "lr": 0.00021832369925605226, "tps": 49537, "wall": 20965.0} {"step": 15847, "train_loss": 3.431696891784668, "lr": 0.0002183045420966507, "tps": 49526, "wall": 20970.8} {"step": 15848, "train_loss": 3.346376419067383, "lr": 0.00021828538495645536, "tps": 49516, "wall": 20976.5} {"step": 15849, "train_loss": 3.2694971561431885, "lr": 0.00021826622783568324, "tps": 49505, "wall": 20982.3} {"step": 15850, "train_loss": 3.206186056137085, "lr": 0.0002182470707345514, "tps": 49495, "wall": 20988.0} {"step": 15851, "train_loss": 3.2810561656951904, "lr": 0.0002182279136532769, "tps": 49485, "wall": 20993.7} {"step": 15852, "train_loss": 3.318460702896118, "lr": 0.00021820875659207665, "tps": 49474, "wall": 20999.4} {"step": 15853, "train_loss": 3.390089988708496, "lr": 0.00021818959955116767, "tps": 49464, "wall": 21005.1} {"step": 15854, "train_loss": 3.43928861618042, "lr": 0.00021817044253076703, "tps": 49454, "wall": 21010.8} {"step": 15855, "train_loss": 3.438568115234375, "lr": 0.00021815128553109175, "tps": 49443, "wall": 21016.6} {"step": 15856, "train_loss": 3.372704029083252, "lr": 0.00021813212855235876, "tps": 49433, "wall": 21022.3} {"step": 15857, "train_loss": 3.4401988983154297, "lr": 0.0002181129715947851, "tps": 49423, "wall": 21028.0} {"step": 15858, "train_loss": 3.3759260177612305, "lr": 0.00021809381465858784, "tps": 49412, "wall": 21033.8} {"step": 15859, "train_loss": 3.3374714851379395, "lr": 0.00021807465774398397, "tps": 49402, "wall": 21039.5} {"step": 15860, "train_loss": 3.345802068710327, "lr": 0.00021805550085119042, "tps": 49391, "wall": 21045.2} {"step": 15861, "train_loss": 3.2982678413391113, "lr": 0.00021803634398042431, "tps": 49381, "wall": 21051.0} {"step": 15862, "train_loss": 3.356163501739502, "lr": 0.0002180171871319026, "tps": 49371, "wall": 21056.7} {"step": 15863, "train_loss": 3.3707664012908936, "lr": 0.00021799803030584224, "tps": 49360, "wall": 21062.5} {"step": 15864, "train_loss": 3.325045585632324, "lr": 0.00021797887350246043, "tps": 49350, "wall": 21068.2} {"step": 15865, "train_loss": 3.3068246841430664, "lr": 0.00021795971672197392, "tps": 49340, "wall": 21073.9} {"step": 15866, "train_loss": 3.3785133361816406, "lr": 0.00021794055996459993, "tps": 49329, "wall": 21079.7} {"step": 15867, "train_loss": 3.3182616233825684, "lr": 0.00021792140323055535, "tps": 49319, "wall": 21085.4} {"step": 15868, "train_loss": 3.3933818340301514, "lr": 0.00021790224652005723, "tps": 49309, "wall": 21091.2} {"step": 15869, "train_loss": 3.426236629486084, "lr": 0.00021788308983332257, "tps": 49298, "wall": 21097.0} {"step": 15870, "train_loss": 3.348288059234619, "lr": 0.0002178639331705684, "tps": 49288, "wall": 21102.7} {"step": 15871, "train_loss": 3.372197389602661, "lr": 0.0002178447765320117, "tps": 49278, "wall": 21108.4} {"step": 15872, "train_loss": 3.368985176086426, "lr": 0.00021782561991786947, "tps": 49268, "wall": 21114.1} {"step": 15873, "train_loss": 3.3826651573181152, "lr": 0.0002178064633283588, "tps": 49257, "wall": 21119.8} {"step": 15874, "train_loss": 3.3242504596710205, "lr": 0.00021778730676369658, "tps": 49247, "wall": 21125.6} {"step": 15875, "train_loss": 3.326735258102417, "lr": 0.0002177681502240999, "tps": 49237, "wall": 21131.4} {"step": 15876, "train_loss": 3.344346046447754, "lr": 0.00021774899370978568, "tps": 49226, "wall": 21137.1} {"step": 15877, "train_loss": 3.359363555908203, "lr": 0.00021772983722097097, "tps": 49216, "wall": 21142.8} {"step": 15878, "train_loss": 3.2447762489318848, "lr": 0.00021771068075787287, "tps": 49206, "wall": 21148.6} {"step": 15879, "train_loss": 3.406022310256958, "lr": 0.00021769152432070827, "tps": 49195, "wall": 21154.4} {"step": 15880, "train_loss": 3.37627911567688, "lr": 0.0002176723679096942, "tps": 49185, "wall": 21160.2} {"step": 15881, "train_loss": 3.3880598545074463, "lr": 0.00021765321152504767, "tps": 49175, "wall": 21166.0} {"step": 15882, "train_loss": 3.431307792663574, "lr": 0.00021763405516698567, "tps": 49164, "wall": 21171.8} {"step": 15883, "train_loss": 3.327411651611328, "lr": 0.00021761489883572526, "tps": 49154, "wall": 21177.6} {"step": 15884, "train_loss": 3.347752094268799, "lr": 0.00021759574253148335, "tps": 49144, "wall": 21183.3} {"step": 15885, "train_loss": 3.3505263328552246, "lr": 0.00021757658625447704, "tps": 49133, "wall": 21189.1} {"step": 15886, "train_loss": 3.319517135620117, "lr": 0.00021755743000492333, "tps": 49123, "wall": 21194.9} {"step": 15887, "train_loss": 3.236215114593506, "lr": 0.0002175382737830391, "tps": 49113, "wall": 21200.6} {"step": 15888, "train_loss": 3.352050542831421, "lr": 0.0002175191175890415, "tps": 49103, "wall": 21206.4} {"step": 15889, "train_loss": 3.461581230163574, "lr": 0.00021749996142314743, "tps": 49092, "wall": 21212.3} {"step": 15890, "train_loss": 3.385178804397583, "lr": 0.00021748080528557394, "tps": 49082, "wall": 21218.1} {"step": 15891, "train_loss": 3.4038052558898926, "lr": 0.00021746164917653808, "tps": 49072, "wall": 21223.9} {"step": 15892, "train_loss": 3.3809032440185547, "lr": 0.00021744249309625673, "tps": 49061, "wall": 21229.6} {"step": 15893, "train_loss": 3.3507165908813477, "lr": 0.00021742333704494695, "tps": 49051, "wall": 21235.4} {"step": 15894, "train_loss": 3.3407866954803467, "lr": 0.00021740418102282578, "tps": 49041, "wall": 21241.2} {"step": 15895, "train_loss": 3.309915542602539, "lr": 0.0002173850250301102, "tps": 49030, "wall": 21247.0} {"step": 15896, "train_loss": 3.4185092449188232, "lr": 0.00021736586906701718, "tps": 49020, "wall": 21252.8} {"step": 15897, "train_loss": 3.3684821128845215, "lr": 0.00021734671313376373, "tps": 49010, "wall": 21258.6} {"step": 15898, "train_loss": 3.3209996223449707, "lr": 0.00021732755723056685, "tps": 48999, "wall": 21264.4} {"step": 15899, "train_loss": 3.314857006072998, "lr": 0.00021730840135764359, "tps": 48989, "wall": 21270.3} {"step": 15900, "train_loss": 3.371277332305908, "lr": 0.00021728924551521085, "tps": 48979, "wall": 21276.1} {"step": 15901, "train_loss": 3.2888946533203125, "lr": 0.00021727008970348575, "tps": 48968, "wall": 21281.9} {"step": 15902, "train_loss": 3.3348588943481445, "lr": 0.00021725093392268514, "tps": 48958, "wall": 21287.8} {"step": 15903, "train_loss": 3.158651113510132, "lr": 0.00021723177817302615, "tps": 48948, "wall": 21293.5} {"step": 15904, "train_loss": 3.337798595428467, "lr": 0.0002172126224547257, "tps": 48938, "wall": 21299.3} {"step": 15905, "train_loss": 3.319681167602539, "lr": 0.00021719346676800084, "tps": 48927, "wall": 21305.1} {"step": 15906, "train_loss": 3.3662571907043457, "lr": 0.00021717431111306854, "tps": 48917, "wall": 21310.9} {"step": 15907, "train_loss": 3.343430280685425, "lr": 0.0002171551554901458, "tps": 48907, "wall": 21316.8} {"step": 15908, "train_loss": 3.2878761291503906, "lr": 0.0002171359998994496, "tps": 48897, "wall": 21322.6} {"step": 15909, "train_loss": 3.49345064163208, "lr": 0.00021711684434119698, "tps": 48886, "wall": 21328.4} {"step": 15910, "train_loss": 3.326462984085083, "lr": 0.00021709768881560484, "tps": 48876, "wall": 21334.3} {"step": 15911, "train_loss": 3.433915615081787, "lr": 0.00021707853332289024, "tps": 48866, "wall": 21340.1} {"step": 15912, "train_loss": 3.395632266998291, "lr": 0.0002170593778632702, "tps": 48855, "wall": 21345.9} {"step": 15913, "train_loss": 3.3565189838409424, "lr": 0.0002170402224369617, "tps": 48845, "wall": 21351.7} {"step": 15914, "train_loss": 3.308518886566162, "lr": 0.00021702106704418167, "tps": 48835, "wall": 21357.5} {"step": 15915, "train_loss": 3.318168878555298, "lr": 0.00021700191168514725, "tps": 48825, "wall": 21363.3} {"step": 15916, "train_loss": 3.3612287044525146, "lr": 0.00021698275636007527, "tps": 48815, "wall": 21369.1} {"step": 15917, "train_loss": 3.5107929706573486, "lr": 0.00021696360106918276, "tps": 48804, "wall": 21375.0} {"step": 15918, "train_loss": 3.3362059593200684, "lr": 0.00021694444581268684, "tps": 48794, "wall": 21380.8} {"step": 15919, "train_loss": 3.415846586227417, "lr": 0.0002169252905908043, "tps": 48784, "wall": 21386.6} {"step": 15920, "train_loss": 3.3295063972473145, "lr": 0.00021690613540375226, "tps": 48773, "wall": 21392.5} {"step": 15921, "train_loss": 3.4350409507751465, "lr": 0.0002168869802517477, "tps": 48763, "wall": 21398.4} {"step": 15922, "train_loss": 3.4311017990112305, "lr": 0.00021686782513500764, "tps": 48753, "wall": 21404.2} {"step": 15923, "train_loss": 3.402554988861084, "lr": 0.00021684867005374896, "tps": 48743, "wall": 21410.0} {"step": 15924, "train_loss": 3.254716157913208, "lr": 0.00021682951500818874, "tps": 48732, "wall": 21415.9} {"step": 15925, "train_loss": 3.369410514831543, "lr": 0.00021681035999854395, "tps": 48722, "wall": 21421.7} {"step": 15926, "train_loss": 3.4674761295318604, "lr": 0.0002167912050250316, "tps": 48712, "wall": 21427.5} {"step": 15927, "train_loss": 3.407923698425293, "lr": 0.0002167720500878686, "tps": 48702, "wall": 21433.3} {"step": 15928, "train_loss": 3.2262332439422607, "lr": 0.00021675289518727212, "tps": 48692, "wall": 21439.1} {"step": 15929, "train_loss": 3.285656452178955, "lr": 0.00021673374032345888, "tps": 48682, "wall": 21445.0} {"step": 15930, "train_loss": 3.464214324951172, "lr": 0.00021671458549664605, "tps": 48671, "wall": 21451.0} {"step": 15931, "train_loss": 3.384726047515869, "lr": 0.00021669543070705055, "tps": 48661, "wall": 21456.8} {"step": 15932, "train_loss": 3.301191806793213, "lr": 0.0002166762759548894, "tps": 48651, "wall": 21462.6} {"step": 15933, "train_loss": 3.298862934112549, "lr": 0.00021665712124037962, "tps": 48641, "wall": 21468.5} {"step": 15934, "train_loss": 3.3766627311706543, "lr": 0.00021663796656373808, "tps": 48630, "wall": 21474.4} {"step": 15935, "train_loss": 3.259613275527954, "lr": 0.00021661881192518186, "tps": 48620, "wall": 21480.2} {"step": 15936, "train_loss": 3.4009714126586914, "lr": 0.0002165996573249279, "tps": 48610, "wall": 21486.0} {"step": 15937, "train_loss": 3.3063127994537354, "lr": 0.00021658050276319332, "tps": 48600, "wall": 21491.9} {"step": 15938, "train_loss": 3.2548270225524902, "lr": 0.00021656134824019483, "tps": 48590, "wall": 21497.7} {"step": 15939, "train_loss": 3.4189419746398926, "lr": 0.00021654219375614968, "tps": 48579, "wall": 21503.6} {"step": 15940, "train_loss": 3.317443609237671, "lr": 0.0002165230393112747, "tps": 48569, "wall": 21509.5} {"step": 15941, "train_loss": 3.3722071647644043, "lr": 0.00021650388490578694, "tps": 48559, "wall": 21515.3} {"step": 15942, "train_loss": 3.227731227874756, "lr": 0.00021648473053990333, "tps": 48549, "wall": 21521.2} {"step": 15943, "train_loss": 3.2860615253448486, "lr": 0.00021646557621384096, "tps": 48539, "wall": 21527.1} {"step": 15944, "train_loss": 3.3313140869140625, "lr": 0.00021644642192781665, "tps": 48528, "wall": 21533.0} {"step": 15945, "train_loss": 3.279918670654297, "lr": 0.00021642726768204747, "tps": 48518, "wall": 21538.8} {"step": 15946, "train_loss": 3.3087587356567383, "lr": 0.00021640811347675042, "tps": 48508, "wall": 21544.7} {"step": 15947, "train_loss": 3.2888286113739014, "lr": 0.0002163889593121425, "tps": 48498, "wall": 21550.6} {"step": 15948, "train_loss": 3.300515651702881, "lr": 0.00021636980518844058, "tps": 48488, "wall": 21556.4} {"step": 15949, "train_loss": 3.375401258468628, "lr": 0.00021635065110586172, "tps": 48478, "wall": 21562.3} {"step": 15950, "train_loss": 3.401120662689209, "lr": 0.00021633149706462291, "tps": 48468, "wall": 21568.1} {"step": 15951, "train_loss": 3.3986310958862305, "lr": 0.00021631234306494106, "tps": 48457, "wall": 21574.1} {"step": 15952, "train_loss": 3.2897839546203613, "lr": 0.00021629318910703317, "tps": 48447, "wall": 21580.0} {"step": 15953, "train_loss": 3.41040301322937, "lr": 0.0002162740351911163, "tps": 48437, "wall": 21585.8} {"step": 15954, "train_loss": 3.3081436157226562, "lr": 0.00021625488131740732, "tps": 48427, "wall": 21591.7} {"step": 15955, "train_loss": 3.395688056945801, "lr": 0.00021623572748612321, "tps": 48417, "wall": 21597.5} {"step": 15956, "train_loss": 3.357761859893799, "lr": 0.00021621657369748105, "tps": 48406, "wall": 21603.5} {"step": 15957, "train_loss": 3.2971925735473633, "lr": 0.00021619741995169774, "tps": 48396, "wall": 21609.3} {"step": 15958, "train_loss": 3.3933846950531006, "lr": 0.00021617826624899022, "tps": 48386, "wall": 21615.2} {"step": 15959, "train_loss": 3.2915964126586914, "lr": 0.00021615911258957552, "tps": 48376, "wall": 21621.0} {"step": 15960, "train_loss": 3.3407816886901855, "lr": 0.00021613995897367064, "tps": 48366, "wall": 21626.9} {"step": 15961, "train_loss": 3.2391157150268555, "lr": 0.0002161208054014925, "tps": 48356, "wall": 21632.8} {"step": 15962, "train_loss": 3.267536163330078, "lr": 0.00021610165187325805, "tps": 48346, "wall": 21638.7} {"step": 15963, "train_loss": 3.36301326751709, "lr": 0.00021608249838918432, "tps": 48336, "wall": 21644.6} {"step": 15964, "train_loss": 3.3650176525115967, "lr": 0.00021606334494948825, "tps": 48326, "wall": 21650.5} {"step": 15965, "train_loss": 3.442188024520874, "lr": 0.00021604419155438683, "tps": 48315, "wall": 21656.4} {"step": 15966, "train_loss": 3.409623384475708, "lr": 0.00021602503820409706, "tps": 48305, "wall": 21662.2} {"step": 15967, "train_loss": 3.2293076515197754, "lr": 0.00021600588489883586, "tps": 48295, "wall": 21668.1} {"step": 15968, "train_loss": 3.2759127616882324, "lr": 0.00021598673163882018, "tps": 48285, "wall": 21674.0} {"step": 15969, "train_loss": 3.2548365592956543, "lr": 0.000215967578424267, "tps": 48275, "wall": 21679.9} {"step": 15970, "train_loss": 3.3903775215148926, "lr": 0.00021594842525539339, "tps": 48265, "wall": 21685.8} {"step": 15971, "train_loss": 3.345360279083252, "lr": 0.00021592927213241617, "tps": 48255, "wall": 21691.7} {"step": 15972, "train_loss": 3.372194290161133, "lr": 0.00021591011905555237, "tps": 48245, "wall": 21697.6} {"step": 15973, "train_loss": 3.4351320266723633, "lr": 0.00021589096602501898, "tps": 48235, "wall": 21703.5} {"step": 15974, "train_loss": 3.271636724472046, "lr": 0.00021587181304103296, "tps": 48225, "wall": 21709.3} {"step": 15975, "train_loss": 3.260653018951416, "lr": 0.00021585266010381123, "tps": 48215, "wall": 21715.2} {"step": 15976, "train_loss": 3.4878242015838623, "lr": 0.00021583350721357083, "tps": 48205, "wall": 21721.1} {"step": 15977, "train_loss": 3.336151599884033, "lr": 0.0002158143543705287, "tps": 48195, "wall": 21727.0} {"step": 15978, "train_loss": 3.3643386363983154, "lr": 0.00021579520157490175, "tps": 48185, "wall": 21732.9} {"step": 15979, "train_loss": 3.4648256301879883, "lr": 0.000215776048826907, "tps": 48175, "wall": 21738.7} {"step": 15980, "train_loss": 3.3391244411468506, "lr": 0.00021575689612676145, "tps": 48165, "wall": 21744.6} {"step": 15981, "train_loss": 3.2683143615722656, "lr": 0.00021573774347468194, "tps": 48154, "wall": 21750.6} {"step": 15982, "train_loss": 3.407348394393921, "lr": 0.0002157185908708855, "tps": 48144, "wall": 21756.5} {"step": 15983, "train_loss": 3.3077878952026367, "lr": 0.00021569943831558912, "tps": 48134, "wall": 21762.4} {"step": 15984, "train_loss": 3.4003429412841797, "lr": 0.00021568028580900975, "tps": 48124, "wall": 21768.3} {"step": 15985, "train_loss": 3.2714099884033203, "lr": 0.0002156611333513643, "tps": 48114, "wall": 21774.1} {"step": 15986, "train_loss": 3.4004175662994385, "lr": 0.00021564198094286977, "tps": 48104, "wall": 21780.0} {"step": 15987, "train_loss": 3.2664623260498047, "lr": 0.00021562282858374315, "tps": 48095, "wall": 21785.8} {"step": 15988, "train_loss": 3.3496575355529785, "lr": 0.00021560367627420135, "tps": 48085, "wall": 21791.7} {"step": 15989, "train_loss": 3.3909478187561035, "lr": 0.0002155845240144613, "tps": 48075, "wall": 21797.5} {"step": 15990, "train_loss": 3.4021594524383545, "lr": 0.00021556537180474005, "tps": 48065, "wall": 21803.4} {"step": 15991, "train_loss": 3.3951773643493652, "lr": 0.0002155462196452545, "tps": 48055, "wall": 21809.3} {"step": 15992, "train_loss": 3.3340611457824707, "lr": 0.0002155270675362216, "tps": 48045, "wall": 21815.1} {"step": 15993, "train_loss": 3.2620232105255127, "lr": 0.00021550791547785832, "tps": 48035, "wall": 21821.0} {"step": 15994, "train_loss": 3.3388898372650146, "lr": 0.00021548876347038168, "tps": 48025, "wall": 21826.8} {"step": 15995, "train_loss": 3.3898749351501465, "lr": 0.00021546961151400852, "tps": 48015, "wall": 21832.6} {"step": 15996, "train_loss": 3.3289551734924316, "lr": 0.0002154504596089558, "tps": 48006, "wall": 21838.4} {"step": 15997, "train_loss": 3.323512554168701, "lr": 0.00021543130775544058, "tps": 47996, "wall": 21844.2} {"step": 15998, "train_loss": 3.411522388458252, "lr": 0.00021541215595367974, "tps": 47986, "wall": 21850.0} {"step": 15999, "train_loss": 3.372486114501953, "lr": 0.00021539300420389022, "tps": 47976, "wall": 21855.8} {"step": 16000, "train_loss": 3.306445598602295, "lr": 0.00021537385250628902, "tps": 47967, "wall": 21861.7, "val_loss_monitor": 3.436424881555407} {"step": 16001, "train_loss": 3.290085792541504, "lr": 0.00021535470086109308, "tps": 47876, "wall": 21904.6} {"step": 16002, "train_loss": 3.588639259338379, "lr": 0.00021533554926851935, "tps": 47866, "wall": 21910.4} {"step": 16003, "train_loss": 3.223283052444458, "lr": 0.00021531639772878473, "tps": 47856, "wall": 21916.2} {"step": 16004, "train_loss": 3.3977150917053223, "lr": 0.00021529724624210625, "tps": 47846, "wall": 21922.0} {"step": 16005, "train_loss": 3.346501588821411, "lr": 0.0002152780948087008, "tps": 47837, "wall": 21927.9} {"step": 16006, "train_loss": 3.335477828979492, "lr": 0.0002152589434287853, "tps": 47827, "wall": 21933.8} {"step": 16007, "train_loss": 3.29536771774292, "lr": 0.00021523979210257683, "tps": 47817, "wall": 21939.5} {"step": 16008, "train_loss": 3.3626770973205566, "lr": 0.0002152206408302922, "tps": 47808, "wall": 21945.4} {"step": 16009, "train_loss": 3.435455560684204, "lr": 0.00021520148961214842, "tps": 47798, "wall": 21951.2} {"step": 16010, "train_loss": 3.3693957328796387, "lr": 0.00021518233844836245, "tps": 47788, "wall": 21957.1} {"step": 16011, "train_loss": 3.3436756134033203, "lr": 0.00021516318733915118, "tps": 47778, "wall": 21962.9} {"step": 16012, "train_loss": 3.4818856716156006, "lr": 0.00021514403628473158, "tps": 47769, "wall": 21968.7} {"step": 16013, "train_loss": 3.308607578277588, "lr": 0.00021512488528532063, "tps": 47759, "wall": 21974.6} {"step": 16014, "train_loss": 3.3377785682678223, "lr": 0.00021510573434113526, "tps": 47749, "wall": 21980.4} {"step": 16015, "train_loss": 3.3398244380950928, "lr": 0.00021508658345239235, "tps": 47740, "wall": 21986.2} {"step": 16016, "train_loss": 3.3776965141296387, "lr": 0.00021506743261930886, "tps": 47730, "wall": 21992.1} {"step": 16017, "train_loss": 3.3408427238464355, "lr": 0.00021504828184210179, "tps": 47720, "wall": 21997.9} {"step": 16018, "train_loss": 3.3893589973449707, "lr": 0.00021502913112098814, "tps": 47711, "wall": 22003.8} {"step": 16019, "train_loss": 3.4337518215179443, "lr": 0.0002150099804561846, "tps": 47701, "wall": 22009.5} {"step": 16020, "train_loss": 3.3516030311584473, "lr": 0.00021499082984790838, "tps": 47691, "wall": 22015.3} {"step": 16021, "train_loss": 3.2913200855255127, "lr": 0.00021497167929637628, "tps": 47682, "wall": 22021.1} {"step": 16022, "train_loss": 3.337522268295288, "lr": 0.00021495252880180532, "tps": 47672, "wall": 22026.9} {"step": 16023, "train_loss": 3.3223042488098145, "lr": 0.0002149333783644123, "tps": 47663, "wall": 22032.6} {"step": 16024, "train_loss": 3.220320463180542, "lr": 0.0002149142279844143, "tps": 47653, "wall": 22038.4} {"step": 16025, "train_loss": 3.3815555572509766, "lr": 0.0002148950776620282, "tps": 47644, "wall": 22044.1} {"step": 16026, "train_loss": 3.4009437561035156, "lr": 0.00021487592739747094, "tps": 47634, "wall": 22049.9} {"step": 16027, "train_loss": 3.299360513687134, "lr": 0.0002148567771909594, "tps": 47625, "wall": 22055.8} {"step": 16028, "train_loss": 3.4297842979431152, "lr": 0.0002148376270427106, "tps": 47615, "wall": 22061.6} {"step": 16029, "train_loss": 3.4154608249664307, "lr": 0.00021481847695294147, "tps": 47606, "wall": 22067.3} {"step": 16030, "train_loss": 3.407961845397949, "lr": 0.00021479932692186884, "tps": 47596, "wall": 22073.1} {"step": 16031, "train_loss": 3.3507885932922363, "lr": 0.0002147801769497098, "tps": 47587, "wall": 22078.8} {"step": 16032, "train_loss": 3.3753604888916016, "lr": 0.00021476102703668116, "tps": 47577, "wall": 22084.6} {"step": 16033, "train_loss": 3.2184433937072754, "lr": 0.00021474187718299988, "tps": 47568, "wall": 22090.3} {"step": 16034, "train_loss": 3.403228282928467, "lr": 0.0002147227273888829, "tps": 47559, "wall": 22096.0} {"step": 16035, "train_loss": 3.4440321922302246, "lr": 0.0002147035776545472, "tps": 47550, "wall": 22101.7} {"step": 16036, "train_loss": 3.3663909435272217, "lr": 0.00021468442798020955, "tps": 47540, "wall": 22107.4} {"step": 16037, "train_loss": 3.331772804260254, "lr": 0.00021466527836608705, "tps": 47531, "wall": 22113.1} {"step": 16038, "train_loss": 3.313321352005005, "lr": 0.0002146461288123966, "tps": 47522, "wall": 22118.8} {"step": 16039, "train_loss": 3.3408451080322266, "lr": 0.00021462697931935506, "tps": 47512, "wall": 22124.5} {"step": 16040, "train_loss": 3.3468427658081055, "lr": 0.0002146078298871794, "tps": 47503, "wall": 22130.2} {"step": 16041, "train_loss": 3.317387342453003, "lr": 0.00021458868051608653, "tps": 47494, "wall": 22135.9} {"step": 16042, "train_loss": 3.3596348762512207, "lr": 0.00021456953120629337, "tps": 47485, "wall": 22141.5} {"step": 16043, "train_loss": 3.316030502319336, "lr": 0.00021455038195801685, "tps": 47475, "wall": 22147.2} {"step": 16044, "train_loss": 3.2891786098480225, "lr": 0.0002145312327714739, "tps": 47466, "wall": 22152.9} {"step": 16045, "train_loss": 3.3811593055725098, "lr": 0.00021451208364688148, "tps": 47457, "wall": 22158.6} {"step": 16046, "train_loss": 3.34710693359375, "lr": 0.0002144929345844564, "tps": 47448, "wall": 22164.2} {"step": 16047, "train_loss": 3.388664484024048, "lr": 0.0002144737855844157, "tps": 47439, "wall": 22169.9} {"step": 16048, "train_loss": 3.4108214378356934, "lr": 0.00021445463664697626, "tps": 47429, "wall": 22175.7} {"step": 16049, "train_loss": 3.476979970932007, "lr": 0.000214435487772355, "tps": 47420, "wall": 22181.4} {"step": 16050, "train_loss": 3.2974538803100586, "lr": 0.00021441633896076884, "tps": 47411, "wall": 22187.0} {"step": 16051, "train_loss": 3.2664670944213867, "lr": 0.00021439719021243468, "tps": 47402, "wall": 22192.6} {"step": 16052, "train_loss": 3.34749174118042, "lr": 0.00021437804152756943, "tps": 47393, "wall": 22198.3} {"step": 16053, "train_loss": 3.3161139488220215, "lr": 0.00021435889290639004, "tps": 47384, "wall": 22203.9} {"step": 16054, "train_loss": 3.3197176456451416, "lr": 0.00021433974434911343, "tps": 47375, "wall": 22209.5} {"step": 16055, "train_loss": 3.35886812210083, "lr": 0.00021432059585595653, "tps": 47366, "wall": 22215.2} {"step": 16056, "train_loss": 3.3671951293945312, "lr": 0.0002143014474271362, "tps": 47357, "wall": 22220.8} {"step": 16057, "train_loss": 3.347524404525757, "lr": 0.00021428229906286932, "tps": 47347, "wall": 22226.4} {"step": 16058, "train_loss": 3.3806991577148438, "lr": 0.00021426315076337297, "tps": 47338, "wall": 22232.1} {"step": 16059, "train_loss": 3.3299546241760254, "lr": 0.0002142440025288639, "tps": 47329, "wall": 22237.8} {"step": 16060, "train_loss": 3.2576189041137695, "lr": 0.0002142248543595591, "tps": 47320, "wall": 22243.4} {"step": 16061, "train_loss": 3.441135883331299, "lr": 0.00021420570625567544, "tps": 47311, "wall": 22249.0} {"step": 16062, "train_loss": 3.329829692840576, "lr": 0.00021418655821742988, "tps": 47302, "wall": 22254.7} {"step": 16063, "train_loss": 3.253141403198242, "lr": 0.00021416741024503927, "tps": 47293, "wall": 22260.3} {"step": 16064, "train_loss": 3.359307289123535, "lr": 0.0002141482623387206, "tps": 47284, "wall": 22265.9} {"step": 16065, "train_loss": 3.3968539237976074, "lr": 0.00021412911449869074, "tps": 47275, "wall": 22271.5} {"step": 16066, "train_loss": 3.2310619354248047, "lr": 0.00021410996672516653, "tps": 47266, "wall": 22277.1} {"step": 16067, "train_loss": 3.433138847351074, "lr": 0.0002140908190183649, "tps": 47257, "wall": 22282.7} {"step": 16068, "train_loss": 3.3112993240356445, "lr": 0.00021407167137850287, "tps": 47248, "wall": 22288.3} {"step": 16069, "train_loss": 3.3681282997131348, "lr": 0.00021405252380579727, "tps": 47239, "wall": 22294.0} {"step": 16070, "train_loss": 3.3641278743743896, "lr": 0.000214033376300465, "tps": 47230, "wall": 22299.6} {"step": 16071, "train_loss": 3.2957239151000977, "lr": 0.00021401422886272288, "tps": 47221, "wall": 22305.3} {"step": 16072, "train_loss": 3.2331385612487793, "lr": 0.00021399508149278802, "tps": 47212, "wall": 22310.9} {"step": 16073, "train_loss": 3.448172092437744, "lr": 0.00021397593419087715, "tps": 47203, "wall": 22316.5} {"step": 16074, "train_loss": 3.2075438499450684, "lr": 0.00021395678695720717, "tps": 47194, "wall": 22322.1} {"step": 16075, "train_loss": 3.372234582901001, "lr": 0.00021393763979199513, "tps": 47186, "wall": 22327.7} {"step": 16076, "train_loss": 3.3061535358428955, "lr": 0.0002139184926954578, "tps": 47177, "wall": 22333.3} {"step": 16077, "train_loss": 3.353938341140747, "lr": 0.0002138993456678121, "tps": 47168, "wall": 22338.9} {"step": 16078, "train_loss": 3.343573808670044, "lr": 0.00021388019870927492, "tps": 47159, "wall": 22344.5} {"step": 16079, "train_loss": 3.3777546882629395, "lr": 0.00021386105182006322, "tps": 47150, "wall": 22350.2} {"step": 16080, "train_loss": 3.3144373893737793, "lr": 0.00021384190500039384, "tps": 47141, "wall": 22355.8} {"step": 16081, "train_loss": 3.327132225036621, "lr": 0.00021382275825048366, "tps": 47132, "wall": 22361.5} {"step": 16082, "train_loss": 3.385739326477051, "lr": 0.0002138036115705497, "tps": 47123, "wall": 22367.0} {"step": 16083, "train_loss": 3.350647449493408, "lr": 0.0002137844649608087, "tps": 47114, "wall": 22372.7} {"step": 16084, "train_loss": 3.3999547958374023, "lr": 0.0002137653184214776, "tps": 47105, "wall": 22378.3} {"step": 16085, "train_loss": 3.293252944946289, "lr": 0.00021374617195277335, "tps": 47096, "wall": 22383.9} {"step": 16086, "train_loss": 3.269031286239624, "lr": 0.00021372702555491277, "tps": 47088, "wall": 22389.5} {"step": 16087, "train_loss": 3.3122317790985107, "lr": 0.00021370787922811278, "tps": 47079, "wall": 22395.1} {"step": 16088, "train_loss": 3.279083251953125, "lr": 0.00021368873297259033, "tps": 47070, "wall": 22400.7} {"step": 16089, "train_loss": 3.325730323791504, "lr": 0.0002136695867885622, "tps": 47061, "wall": 22406.3} {"step": 16090, "train_loss": 3.3473165035247803, "lr": 0.00021365044067624535, "tps": 47052, "wall": 22412.1} {"step": 16091, "train_loss": 3.3062493801116943, "lr": 0.00021363129463585666, "tps": 47043, "wall": 22417.7} {"step": 16092, "train_loss": 3.1457157135009766, "lr": 0.00021361214866761304, "tps": 47034, "wall": 22423.3} {"step": 16093, "train_loss": 3.341803550720215, "lr": 0.00021359300277173126, "tps": 47025, "wall": 22428.9} {"step": 16094, "train_loss": 3.313793182373047, "lr": 0.00021357385694842834, "tps": 47017, "wall": 22434.4} {"step": 16095, "train_loss": 3.2893621921539307, "lr": 0.00021355471119792116, "tps": 47008, "wall": 22439.9} {"step": 16096, "train_loss": 3.3610689640045166, "lr": 0.00021353556552042652, "tps": 46999, "wall": 22445.6} {"step": 16097, "train_loss": 3.207679033279419, "lr": 0.0002135164199161614, "tps": 46990, "wall": 22451.3} {"step": 16098, "train_loss": 3.4126200675964355, "lr": 0.00021349727438534254, "tps": 46981, "wall": 22456.9} {"step": 16099, "train_loss": 3.309466600418091, "lr": 0.0002134781289281869, "tps": 46972, "wall": 22462.5} {"step": 16100, "train_loss": 3.3082170486450195, "lr": 0.00021345898354491145, "tps": 46964, "wall": 22468.1} {"step": 16101, "train_loss": 3.3076443672180176, "lr": 0.00021343983823573291, "tps": 46955, "wall": 22473.9} {"step": 16102, "train_loss": 3.4487977027893066, "lr": 0.00021342069300086825, "tps": 46946, "wall": 22479.4} {"step": 16103, "train_loss": 3.2916183471679688, "lr": 0.0002134015478405344, "tps": 46937, "wall": 22485.0} {"step": 16104, "train_loss": 3.3587443828582764, "lr": 0.00021338240275494812, "tps": 46928, "wall": 22490.6} {"step": 16105, "train_loss": 3.3068861961364746, "lr": 0.00021336325774432634, "tps": 46920, "wall": 22496.1} {"step": 16106, "train_loss": 3.327758312225342, "lr": 0.0002133441128088859, "tps": 46911, "wall": 22501.7} {"step": 16107, "train_loss": 3.3155720233917236, "lr": 0.00021332496794884383, "tps": 46902, "wall": 22507.3} {"step": 16108, "train_loss": 3.466796875, "lr": 0.00021330582316441676, "tps": 46894, "wall": 22512.9} {"step": 16109, "train_loss": 3.307100296020508, "lr": 0.00021328667845582172, "tps": 46885, "wall": 22518.5} {"step": 16110, "train_loss": 3.4501724243164062, "lr": 0.0002132675338232756, "tps": 46876, "wall": 22524.1} {"step": 16111, "train_loss": 3.3564281463623047, "lr": 0.00021324838926699516, "tps": 46867, "wall": 22529.7} {"step": 16112, "train_loss": 3.358755111694336, "lr": 0.00021322924478719735, "tps": 46858, "wall": 22535.3} {"step": 16113, "train_loss": 3.389772415161133, "lr": 0.00021321010038409904, "tps": 46850, "wall": 22540.9} {"step": 16114, "train_loss": 3.266571044921875, "lr": 0.0002131909560579171, "tps": 46841, "wall": 22546.4} {"step": 16115, "train_loss": 3.321593761444092, "lr": 0.00021317181180886832, "tps": 46833, "wall": 22552.0} {"step": 16116, "train_loss": 3.3274991512298584, "lr": 0.00021315266763716962, "tps": 46824, "wall": 22557.6} {"step": 16117, "train_loss": 3.4393959045410156, "lr": 0.00021313352354303792, "tps": 46815, "wall": 22563.3} {"step": 16118, "train_loss": 3.3500757217407227, "lr": 0.00021311437952669003, "tps": 46806, "wall": 22568.9} {"step": 16119, "train_loss": 3.2388148307800293, "lr": 0.00021309523558834278, "tps": 46798, "wall": 22574.5} {"step": 16120, "train_loss": 3.2494897842407227, "lr": 0.0002130760917282131, "tps": 46789, "wall": 22580.0} {"step": 16121, "train_loss": 3.3942437171936035, "lr": 0.00021305694794651787, "tps": 46780, "wall": 22585.6} {"step": 16122, "train_loss": 3.3639845848083496, "lr": 0.0002130378042434739, "tps": 46771, "wall": 22591.2} {"step": 16123, "train_loss": 3.3141660690307617, "lr": 0.00021301866061929797, "tps": 46763, "wall": 22596.8} {"step": 16124, "train_loss": 3.3713088035583496, "lr": 0.00021299951707420714, "tps": 46754, "wall": 22602.3} {"step": 16125, "train_loss": 3.3528552055358887, "lr": 0.00021298037360841806, "tps": 46746, "wall": 22607.9} {"step": 16126, "train_loss": 3.341078519821167, "lr": 0.00021296123022214775, "tps": 46737, "wall": 22613.5} {"step": 16127, "train_loss": 3.3737142086029053, "lr": 0.00021294208691561303, "tps": 46729, "wall": 22619.0} {"step": 16128, "train_loss": 3.326038122177124, "lr": 0.00021292294368903067, "tps": 46720, "wall": 22624.6} {"step": 16129, "train_loss": 3.4857192039489746, "lr": 0.0002129038005426176, "tps": 46711, "wall": 22630.1} {"step": 16130, "train_loss": 3.3923821449279785, "lr": 0.00021288465747659068, "tps": 46703, "wall": 22635.7} {"step": 16131, "train_loss": 3.421825647354126, "lr": 0.00021286551449116673, "tps": 46694, "wall": 22641.2} {"step": 16132, "train_loss": 3.2778496742248535, "lr": 0.00021284637158656264, "tps": 46686, "wall": 22646.8} {"step": 16133, "train_loss": 3.381375312805176, "lr": 0.00021282722876299524, "tps": 46677, "wall": 22652.5} {"step": 16134, "train_loss": 3.368741035461426, "lr": 0.00021280808602068137, "tps": 46668, "wall": 22658.1} {"step": 16135, "train_loss": 3.3384270668029785, "lr": 0.0002127889433598379, "tps": 46660, "wall": 22663.7} {"step": 16136, "train_loss": 3.435587167739868, "lr": 0.00021276980078068161, "tps": 46651, "wall": 22669.2} {"step": 16137, "train_loss": 3.316502571105957, "lr": 0.0002127506582834295, "tps": 46643, "wall": 22674.8} {"step": 16138, "train_loss": 3.3682656288146973, "lr": 0.0002127315158682982, "tps": 46634, "wall": 22680.3} {"step": 16139, "train_loss": 3.38839054107666, "lr": 0.00021271237353550482, "tps": 46625, "wall": 22685.9} {"step": 16140, "train_loss": 3.3495376110076904, "lr": 0.00021269323128526594, "tps": 46617, "wall": 22691.5} {"step": 16141, "train_loss": 3.3996028900146484, "lr": 0.00021267408911779863, "tps": 46608, "wall": 22697.0} {"step": 16142, "train_loss": 3.4137673377990723, "lr": 0.00021265494703331963, "tps": 46600, "wall": 22702.6} {"step": 16143, "train_loss": 3.3388142585754395, "lr": 0.00021263580503204574, "tps": 46591, "wall": 22708.2} {"step": 16144, "train_loss": 3.3673291206359863, "lr": 0.00021261666311419387, "tps": 46582, "wall": 22713.9} {"step": 16145, "train_loss": 3.382378578186035, "lr": 0.00021259752127998085, "tps": 46574, "wall": 22719.5} {"step": 16146, "train_loss": 3.27205753326416, "lr": 0.0002125783795296235, "tps": 46565, "wall": 22725.0} {"step": 16147, "train_loss": 3.2867112159729004, "lr": 0.00021255923786333872, "tps": 46557, "wall": 22730.5} {"step": 16148, "train_loss": 3.449434757232666, "lr": 0.00021254009628134322, "tps": 46548, "wall": 22736.1} {"step": 16149, "train_loss": 3.299647808074951, "lr": 0.0002125209547838539, "tps": 46540, "wall": 22741.7} {"step": 16150, "train_loss": 3.4150772094726562, "lr": 0.0002125018133710876, "tps": 46531, "wall": 22747.2} {"step": 16151, "train_loss": 3.3273470401763916, "lr": 0.00021248267204326124, "tps": 46523, "wall": 22752.8} {"step": 16152, "train_loss": 3.3207430839538574, "lr": 0.00021246353080059155, "tps": 46515, "wall": 22758.3} {"step": 16153, "train_loss": 3.2083873748779297, "lr": 0.0002124443896432954, "tps": 46506, "wall": 22763.8} {"step": 16154, "train_loss": 3.344883918762207, "lr": 0.00021242524857158964, "tps": 46498, "wall": 22769.4} {"step": 16155, "train_loss": 3.399522066116333, "lr": 0.000212406107585691, "tps": 46489, "wall": 22775.0} {"step": 16156, "train_loss": 3.323606491088867, "lr": 0.0002123869666858164, "tps": 46480, "wall": 22780.6} {"step": 16157, "train_loss": 3.2580981254577637, "lr": 0.00021236782587218272, "tps": 46472, "wall": 22786.2} {"step": 16158, "train_loss": 3.3914825916290283, "lr": 0.00021234868514500668, "tps": 46464, "wall": 22791.7} {"step": 16159, "train_loss": 3.41770076751709, "lr": 0.00021232954450450508, "tps": 46455, "wall": 22797.3} {"step": 16160, "train_loss": 3.383009433746338, "lr": 0.00021231040395089487, "tps": 46447, "wall": 22802.8} {"step": 16161, "train_loss": 3.3226447105407715, "lr": 0.00021229126348439286, "tps": 46438, "wall": 22808.4} {"step": 16162, "train_loss": 3.3402342796325684, "lr": 0.00021227212310521578, "tps": 46430, "wall": 22814.0} {"step": 16163, "train_loss": 3.265535593032837, "lr": 0.00021225298281358056, "tps": 46421, "wall": 22819.6} {"step": 16164, "train_loss": 3.3595662117004395, "lr": 0.00021223384260970395, "tps": 46413, "wall": 22825.2} {"step": 16165, "train_loss": 3.4070816040039062, "lr": 0.00021221470249380278, "tps": 46404, "wall": 22830.9} {"step": 16166, "train_loss": 3.251835823059082, "lr": 0.00021219556246609384, "tps": 46396, "wall": 22836.4} {"step": 16167, "train_loss": 3.3242287635803223, "lr": 0.00021217642252679403, "tps": 46387, "wall": 22842.0} {"step": 16168, "train_loss": 3.2305359840393066, "lr": 0.00021215728267612015, "tps": 46379, "wall": 22847.5} {"step": 16169, "train_loss": 3.3645691871643066, "lr": 0.00021213814291428897, "tps": 46370, "wall": 22853.1} {"step": 16170, "train_loss": 3.3049426078796387, "lr": 0.00021211900324151733, "tps": 46362, "wall": 22858.7} {"step": 16171, "train_loss": 3.3418664932250977, "lr": 0.00021209986365802207, "tps": 46353, "wall": 22864.3} {"step": 16172, "train_loss": 3.264444351196289, "lr": 0.00021208072416401997, "tps": 46345, "wall": 22869.9} {"step": 16173, "train_loss": 3.3542442321777344, "lr": 0.00021206158475972782, "tps": 46337, "wall": 22875.4} {"step": 16174, "train_loss": 3.304588794708252, "lr": 0.00021204244544536255, "tps": 46328, "wall": 22881.0} {"step": 16175, "train_loss": 3.310671329498291, "lr": 0.00021202330622114085, "tps": 46320, "wall": 22886.5} {"step": 16176, "train_loss": 3.3590807914733887, "lr": 0.00021200416708727952, "tps": 46311, "wall": 22892.2} {"step": 16177, "train_loss": 3.315924644470215, "lr": 0.00021198502804399544, "tps": 46303, "wall": 22897.7} {"step": 16178, "train_loss": 3.3069093227386475, "lr": 0.00021196588909150546, "tps": 46294, "wall": 22903.3} {"step": 16179, "train_loss": 3.3365025520324707, "lr": 0.0002119467502300262, "tps": 46286, "wall": 22908.9} {"step": 16180, "train_loss": 3.3323817253112793, "lr": 0.0002119276114597747, "tps": 46278, "wall": 22914.5} {"step": 16181, "train_loss": 3.3322081565856934, "lr": 0.0002119084727809676, "tps": 46269, "wall": 22920.0} {"step": 16182, "train_loss": 3.3978939056396484, "lr": 0.00021188933419382178, "tps": 46261, "wall": 22925.5} {"step": 16183, "train_loss": 3.2684781551361084, "lr": 0.00021187019569855403, "tps": 46253, "wall": 22931.1} {"step": 16184, "train_loss": 3.353787899017334, "lr": 0.00021185105729538113, "tps": 46244, "wall": 22936.6} {"step": 16185, "train_loss": 3.3094568252563477, "lr": 0.00021183191898451988, "tps": 46236, "wall": 22942.2} {"step": 16186, "train_loss": 3.357940435409546, "lr": 0.0002118127807661871, "tps": 46228, "wall": 22947.8} {"step": 16187, "train_loss": 3.37455153465271, "lr": 0.0002117936426405996, "tps": 46219, "wall": 22953.4} {"step": 16188, "train_loss": 3.36979079246521, "lr": 0.00021177450460797416, "tps": 46211, "wall": 22958.9} {"step": 16189, "train_loss": 3.3274407386779785, "lr": 0.00021175536666852757, "tps": 46203, "wall": 22964.4} {"step": 16190, "train_loss": 3.3629541397094727, "lr": 0.00021173622882247664, "tps": 46194, "wall": 22970.0} {"step": 16191, "train_loss": 3.2763500213623047, "lr": 0.0002117170910700381, "tps": 46186, "wall": 22975.5} {"step": 16192, "train_loss": 3.341022491455078, "lr": 0.00021169795341142886, "tps": 46178, "wall": 22981.0} {"step": 16193, "train_loss": 3.3310115337371826, "lr": 0.00021167881584686563, "tps": 46169, "wall": 22986.6} {"step": 16194, "train_loss": 3.3691468238830566, "lr": 0.00021165967837656524, "tps": 46161, "wall": 22992.1} {"step": 16195, "train_loss": 3.402632236480713, "lr": 0.00021164054100074447, "tps": 46153, "wall": 22997.7} {"step": 16196, "train_loss": 3.338867425918579, "lr": 0.00021162140371962012, "tps": 46145, "wall": 23003.2} {"step": 16197, "train_loss": 3.3659636974334717, "lr": 0.0002116022665334089, "tps": 46136, "wall": 23008.8} {"step": 16198, "train_loss": 3.3335070610046387, "lr": 0.0002115831294423277, "tps": 46128, "wall": 23014.5} {"step": 16199, "train_loss": 3.4183976650238037, "lr": 0.00021156399244659326, "tps": 46119, "wall": 23020.0} {"step": 16200, "train_loss": 3.3253986835479736, "lr": 0.0002115448555464224, "tps": 46111, "wall": 23025.6} {"step": 16201, "train_loss": 3.453444242477417, "lr": 0.00021152571874203183, "tps": 46103, "wall": 23031.1} {"step": 16202, "train_loss": 3.426633358001709, "lr": 0.00021150658203363838, "tps": 46095, "wall": 23036.7} {"step": 16203, "train_loss": 3.307149887084961, "lr": 0.0002114874454214588, "tps": 46086, "wall": 23042.3} {"step": 16204, "train_loss": 3.3467226028442383, "lr": 0.00021146830890570993, "tps": 46078, "wall": 23047.8} {"step": 16205, "train_loss": 3.338279962539673, "lr": 0.00021144917248660855, "tps": 46070, "wall": 23053.3} {"step": 16206, "train_loss": 3.3934943675994873, "lr": 0.00021143003616437138, "tps": 46062, "wall": 23058.9} {"step": 16207, "train_loss": 3.332731246948242, "lr": 0.0002114108999392152, "tps": 46053, "wall": 23064.4} {"step": 16208, "train_loss": 3.313936233520508, "lr": 0.00021139176381135686, "tps": 46045, "wall": 23070.1} {"step": 16209, "train_loss": 3.386873960494995, "lr": 0.00021137262778101308, "tps": 46037, "wall": 23075.6} {"step": 16210, "train_loss": 3.386502265930176, "lr": 0.00021135349184840058, "tps": 46029, "wall": 23081.1} {"step": 16211, "train_loss": 3.3345723152160645, "lr": 0.00021133435601373627, "tps": 46020, "wall": 23086.7} {"step": 16212, "train_loss": 3.4076530933380127, "lr": 0.00021131522027723678, "tps": 46012, "wall": 23092.2} {"step": 16213, "train_loss": 3.30778169631958, "lr": 0.00021129608463911893, "tps": 46004, "wall": 23097.8} {"step": 16214, "train_loss": 3.3226184844970703, "lr": 0.00021127694909959957, "tps": 45996, "wall": 23103.3} {"step": 16215, "train_loss": 3.3698415756225586, "lr": 0.0002112578136588954, "tps": 45988, "wall": 23108.9} {"step": 16216, "train_loss": 3.344052791595459, "lr": 0.00021123867831722315, "tps": 45979, "wall": 23114.4} {"step": 16217, "train_loss": 3.456453323364258, "lr": 0.00021121954307479963, "tps": 45971, "wall": 23120.0} {"step": 16218, "train_loss": 3.3283066749572754, "lr": 0.00021120040793184166, "tps": 45963, "wall": 23125.5} {"step": 16219, "train_loss": 3.353576183319092, "lr": 0.00021118127288856587, "tps": 45955, "wall": 23131.2} {"step": 16220, "train_loss": 3.2612814903259277, "lr": 0.00021116213794518908, "tps": 45946, "wall": 23136.7} {"step": 16221, "train_loss": 3.3252739906311035, "lr": 0.00021114300310192815, "tps": 45938, "wall": 23142.2} {"step": 16222, "train_loss": 3.385680675506592, "lr": 0.00021112386835899974, "tps": 45930, "wall": 23147.7} {"step": 16223, "train_loss": 3.40006685256958, "lr": 0.00021110473371662057, "tps": 45922, "wall": 23153.3} {"step": 16224, "train_loss": 3.268561363220215, "lr": 0.0002110855991750075, "tps": 45914, "wall": 23158.9} {"step": 16225, "train_loss": 3.2826735973358154, "lr": 0.00021106646473437727, "tps": 45906, "wall": 23164.4} {"step": 16226, "train_loss": 3.3432669639587402, "lr": 0.0002110473303949466, "tps": 45897, "wall": 23169.9} {"step": 16227, "train_loss": 3.390226125717163, "lr": 0.0002110281961569322, "tps": 45889, "wall": 23175.5} {"step": 16228, "train_loss": 3.372471570968628, "lr": 0.00021100906202055098, "tps": 45881, "wall": 23181.1} {"step": 16229, "train_loss": 3.3364555835723877, "lr": 0.0002109899279860195, "tps": 45873, "wall": 23186.6} {"step": 16230, "train_loss": 3.2130415439605713, "lr": 0.00021097079405355462, "tps": 45865, "wall": 23192.2} {"step": 16231, "train_loss": 3.3710927963256836, "lr": 0.00021095166022337312, "tps": 45857, "wall": 23197.7} {"step": 16232, "train_loss": 3.283564329147339, "lr": 0.0002109325264956917, "tps": 45848, "wall": 23203.3} {"step": 16233, "train_loss": 3.3331046104431152, "lr": 0.00021091339287072707, "tps": 45840, "wall": 23208.8} {"step": 16234, "train_loss": 3.3290789127349854, "lr": 0.000210894259348696, "tps": 45832, "wall": 23214.4} {"step": 16235, "train_loss": 3.332862138748169, "lr": 0.0002108751259298153, "tps": 45824, "wall": 23219.9} {"step": 16236, "train_loss": 3.285306930541992, "lr": 0.00021085599261430168, "tps": 45816, "wall": 23225.4} {"step": 16237, "train_loss": 3.3650171756744385, "lr": 0.0002108368594023718, "tps": 45808, "wall": 23230.9} {"step": 16238, "train_loss": 3.391563892364502, "lr": 0.00021081772629424252, "tps": 45800, "wall": 23236.5} {"step": 16239, "train_loss": 3.325226306915283, "lr": 0.00021079859329013054, "tps": 45792, "wall": 23242.0} {"step": 16240, "train_loss": 3.338517904281616, "lr": 0.00021077946039025256, "tps": 45784, "wall": 23247.6} {"step": 16241, "train_loss": 3.396519184112549, "lr": 0.00021076032759482537, "tps": 45775, "wall": 23253.2} {"step": 16242, "train_loss": 3.272353410720825, "lr": 0.00021074119490406573, "tps": 45767, "wall": 23258.8} {"step": 16243, "train_loss": 3.37605357170105, "lr": 0.0002107220623181903, "tps": 45759, "wall": 23264.3} {"step": 16244, "train_loss": 3.327878475189209, "lr": 0.0002107029298374158, "tps": 45751, "wall": 23269.9} {"step": 16245, "train_loss": 3.390094757080078, "lr": 0.0002106837974619591, "tps": 45743, "wall": 23275.4} {"step": 16246, "train_loss": 3.2533469200134277, "lr": 0.00021066466519203676, "tps": 45735, "wall": 23281.0} {"step": 16247, "train_loss": 3.3649203777313232, "lr": 0.00021064553302786566, "tps": 45727, "wall": 23286.5} {"step": 16248, "train_loss": 3.33089542388916, "lr": 0.00021062640096966247, "tps": 45719, "wall": 23292.1} {"step": 16249, "train_loss": 3.303654670715332, "lr": 0.0002106072690176439, "tps": 45710, "wall": 23297.7} {"step": 16250, "train_loss": 3.3475470542907715, "lr": 0.0002105881371720267, "tps": 45702, "wall": 23303.2} {"step": 16251, "train_loss": 3.2501883506774902, "lr": 0.0002105690054330275, "tps": 45694, "wall": 23308.7} {"step": 16252, "train_loss": 3.389216899871826, "lr": 0.00021054987380086324, "tps": 45686, "wall": 23314.4} {"step": 16253, "train_loss": 3.348928689956665, "lr": 0.0002105307422757505, "tps": 45678, "wall": 23319.9} {"step": 16254, "train_loss": 3.3864922523498535, "lr": 0.00021051161085790598, "tps": 45670, "wall": 23325.4} {"step": 16255, "train_loss": 3.2826526165008545, "lr": 0.0002104924795475465, "tps": 45662, "wall": 23331.0} {"step": 16256, "train_loss": 3.364588975906372, "lr": 0.0002104733483448887, "tps": 45654, "wall": 23336.6} {"step": 16257, "train_loss": 3.3527324199676514, "lr": 0.00021045421725014932, "tps": 45646, "wall": 23342.1} {"step": 16258, "train_loss": 3.3362600803375244, "lr": 0.00021043508626354505, "tps": 45638, "wall": 23347.6} {"step": 16259, "train_loss": 3.419354200363159, "lr": 0.00021041595538529273, "tps": 45630, "wall": 23353.2} {"step": 16260, "train_loss": 3.413259267807007, "lr": 0.0002103968246156089, "tps": 45622, "wall": 23358.7} {"step": 16261, "train_loss": 3.3296544551849365, "lr": 0.00021037769395471035, "tps": 45614, "wall": 23364.3} {"step": 16262, "train_loss": 3.345461368560791, "lr": 0.00021035856340281388, "tps": 45606, "wall": 23369.9} {"step": 16263, "train_loss": 3.3045146465301514, "lr": 0.00021033943296013612, "tps": 45598, "wall": 23375.4} {"step": 16264, "train_loss": 3.2209339141845703, "lr": 0.0002103203026268937, "tps": 45590, "wall": 23380.9} {"step": 16265, "train_loss": 3.254460096359253, "lr": 0.00021030117240330352, "tps": 45582, "wall": 23386.5} {"step": 16266, "train_loss": 3.422903537750244, "lr": 0.00021028204228958216, "tps": 45574, "wall": 23392.0} {"step": 16267, "train_loss": 3.457123041152954, "lr": 0.00021026291228594634, "tps": 45566, "wall": 23397.6} {"step": 16268, "train_loss": 3.2615628242492676, "lr": 0.00021024378239261276, "tps": 45558, "wall": 23403.2} {"step": 16269, "train_loss": 3.3115601539611816, "lr": 0.00021022465260979814, "tps": 45550, "wall": 23408.7} {"step": 16270, "train_loss": 3.2184998989105225, "lr": 0.0002102055229377192, "tps": 45542, "wall": 23414.3} {"step": 16271, "train_loss": 3.3399441242218018, "lr": 0.00021018639337659262, "tps": 45534, "wall": 23419.8} {"step": 16272, "train_loss": 3.368110418319702, "lr": 0.00021016726392663509, "tps": 45526, "wall": 23425.4} {"step": 16273, "train_loss": 3.3423571586608887, "lr": 0.00021014813458806333, "tps": 45517, "wall": 23431.0} {"step": 16274, "train_loss": 3.320622205734253, "lr": 0.0002101290053610941, "tps": 45510, "wall": 23436.6} {"step": 16275, "train_loss": 3.365671157836914, "lr": 0.0002101098762459439, "tps": 45502, "wall": 23442.1} {"step": 16276, "train_loss": 3.3053712844848633, "lr": 0.00021009074724282964, "tps": 45494, "wall": 23447.6} {"step": 16277, "train_loss": 3.375912666320801, "lr": 0.00021007161835196792, "tps": 45486, "wall": 23453.1} {"step": 16278, "train_loss": 3.4085628986358643, "lr": 0.00021005248957357546, "tps": 45478, "wall": 23458.7} {"step": 16279, "train_loss": 3.3083927631378174, "lr": 0.0002100333609078689, "tps": 45470, "wall": 23464.2} {"step": 16280, "train_loss": 3.3509581089019775, "lr": 0.00021001423235506502, "tps": 45462, "wall": 23469.8} {"step": 16281, "train_loss": 3.358706474304199, "lr": 0.0002099951039153804, "tps": 45454, "wall": 23475.3} {"step": 16282, "train_loss": 3.3539328575134277, "lr": 0.0002099759755890318, "tps": 45446, "wall": 23480.9} {"step": 16283, "train_loss": 3.3644979000091553, "lr": 0.00020995684737623588, "tps": 45438, "wall": 23486.4} {"step": 16284, "train_loss": 3.228365898132324, "lr": 0.0002099377192772094, "tps": 45430, "wall": 23492.0} {"step": 16285, "train_loss": 3.2712934017181396, "lr": 0.00020991859129216892, "tps": 45422, "wall": 23497.6} {"step": 16286, "train_loss": 3.353209972381592, "lr": 0.0002098994634213312, "tps": 45414, "wall": 23503.1} {"step": 16287, "train_loss": 3.4580864906311035, "lr": 0.00020988033566491293, "tps": 45406, "wall": 23508.7} {"step": 16288, "train_loss": 3.3191752433776855, "lr": 0.00020986120802313072, "tps": 45398, "wall": 23514.3} {"step": 16289, "train_loss": 3.3335680961608887, "lr": 0.0002098420804962013, "tps": 45390, "wall": 23519.9} {"step": 16290, "train_loss": 3.29303240776062, "lr": 0.00020982295308434137, "tps": 45382, "wall": 23525.5} {"step": 16291, "train_loss": 3.4013712406158447, "lr": 0.00020980382578776756, "tps": 45374, "wall": 23531.0} {"step": 16292, "train_loss": 3.3947641849517822, "lr": 0.00020978469860669655, "tps": 45366, "wall": 23536.6} {"step": 16293, "train_loss": 3.261019706726074, "lr": 0.00020976557154134504, "tps": 45358, "wall": 23542.2} {"step": 16294, "train_loss": 3.3392529487609863, "lr": 0.00020974644459192973, "tps": 45350, "wall": 23547.7} {"step": 16295, "train_loss": 3.4018163681030273, "lr": 0.00020972731775866716, "tps": 45342, "wall": 23553.5} {"step": 16296, "train_loss": 3.4448232650756836, "lr": 0.00020970819104177416, "tps": 45334, "wall": 23559.1} {"step": 16297, "train_loss": 3.344247817993164, "lr": 0.00020968906444146734, "tps": 45326, "wall": 23564.7} {"step": 16298, "train_loss": 3.3360207080841064, "lr": 0.00020966993795796333, "tps": 45318, "wall": 23570.3} {"step": 16299, "train_loss": 3.3476552963256836, "lr": 0.00020965081159147876, "tps": 45310, "wall": 23576.0} {"step": 16300, "train_loss": 3.317078113555908, "lr": 0.00020963168534223042, "tps": 45302, "wall": 23581.6} {"step": 16301, "train_loss": 3.381082057952881, "lr": 0.00020961255921043496, "tps": 45294, "wall": 23587.2} {"step": 16302, "train_loss": 3.407512664794922, "lr": 0.00020959343319630887, "tps": 45286, "wall": 23592.8} {"step": 16303, "train_loss": 3.4208405017852783, "lr": 0.00020957430730006901, "tps": 45278, "wall": 23598.4} {"step": 16304, "train_loss": 3.305586814880371, "lr": 0.00020955518152193198, "tps": 45270, "wall": 23604.0} {"step": 16305, "train_loss": 3.3087732791900635, "lr": 0.0002095360558621144, "tps": 45262, "wall": 23609.7} {"step": 16306, "train_loss": 3.4040961265563965, "lr": 0.0002095169303208329, "tps": 45254, "wall": 23615.4} {"step": 16307, "train_loss": 3.3232839107513428, "lr": 0.00020949780489830423, "tps": 45246, "wall": 23620.9} {"step": 16308, "train_loss": 3.3862123489379883, "lr": 0.00020947867959474498, "tps": 45238, "wall": 23626.6} {"step": 16309, "train_loss": 3.4037530422210693, "lr": 0.0002094595544103718, "tps": 45230, "wall": 23632.3} {"step": 16310, "train_loss": 3.284621238708496, "lr": 0.00020944042934540135, "tps": 45222, "wall": 23638.0} {"step": 16311, "train_loss": 3.390922784805298, "lr": 0.00020942130440005033, "tps": 45213, "wall": 23643.7} {"step": 16312, "train_loss": 3.353724956512451, "lr": 0.00020940217957453533, "tps": 45205, "wall": 23649.4} {"step": 16313, "train_loss": 3.3587324619293213, "lr": 0.000209383054869073, "tps": 45197, "wall": 23655.1} {"step": 16314, "train_loss": 3.402177095413208, "lr": 0.00020936393028388005, "tps": 45189, "wall": 23660.8} {"step": 16315, "train_loss": 3.3698627948760986, "lr": 0.000209344805819173, "tps": 45181, "wall": 23666.4} {"step": 16316, "train_loss": 3.296833038330078, "lr": 0.0002093256814751686, "tps": 45173, "wall": 23672.2} {"step": 16317, "train_loss": 3.4358105659484863, "lr": 0.00020930655725208346, "tps": 45165, "wall": 23677.9} {"step": 16318, "train_loss": 3.3868675231933594, "lr": 0.00020928743315013423, "tps": 45157, "wall": 23683.5} {"step": 16319, "train_loss": 3.290881395339966, "lr": 0.0002092683091695375, "tps": 45149, "wall": 23689.2} {"step": 16320, "train_loss": 3.3470420837402344, "lr": 0.00020924918531050994, "tps": 45141, "wall": 23694.9} {"step": 16321, "train_loss": 3.3979272842407227, "lr": 0.0002092300615732682, "tps": 45132, "wall": 23700.6} {"step": 16322, "train_loss": 3.3768482208251953, "lr": 0.00020921093795802894, "tps": 45124, "wall": 23706.3} {"step": 16323, "train_loss": 3.4118382930755615, "lr": 0.00020919181446500874, "tps": 45116, "wall": 23712.0} {"step": 16324, "train_loss": 3.371218204498291, "lr": 0.00020917269109442424, "tps": 45108, "wall": 23717.7} {"step": 16325, "train_loss": 3.309424877166748, "lr": 0.00020915356784649206, "tps": 45100, "wall": 23723.4} {"step": 16326, "train_loss": 3.259913921356201, "lr": 0.0002091344447214289, "tps": 45092, "wall": 23729.1} {"step": 16327, "train_loss": 3.388159990310669, "lr": 0.0002091153217194513, "tps": 45084, "wall": 23734.9} {"step": 16328, "train_loss": 3.383378028869629, "lr": 0.000209096198840776, "tps": 45076, "wall": 23740.6} {"step": 16329, "train_loss": 3.3410675525665283, "lr": 0.00020907707608561947, "tps": 45068, "wall": 23746.3} {"step": 16330, "train_loss": 3.2418251037597656, "lr": 0.00020905795345419842, "tps": 45060, "wall": 23752.0} {"step": 16331, "train_loss": 3.3134782314300537, "lr": 0.0002090388309467295, "tps": 45052, "wall": 23757.7} {"step": 16332, "train_loss": 3.400378704071045, "lr": 0.00020901970856342924, "tps": 45043, "wall": 23763.4} {"step": 16333, "train_loss": 3.3382062911987305, "lr": 0.00020900058630451436, "tps": 45035, "wall": 23769.2} {"step": 16334, "train_loss": 3.4050092697143555, "lr": 0.00020898146417020144, "tps": 45027, "wall": 23775.0} {"step": 16335, "train_loss": 3.4716029167175293, "lr": 0.00020896234216070706, "tps": 45019, "wall": 23780.7} {"step": 16336, "train_loss": 3.3914337158203125, "lr": 0.00020894322027624785, "tps": 45011, "wall": 23786.5} {"step": 16337, "train_loss": 3.2700512409210205, "lr": 0.00020892409851704048, "tps": 45003, "wall": 23792.3} {"step": 16338, "train_loss": 3.329301357269287, "lr": 0.00020890497688330154, "tps": 44994, "wall": 23798.1} {"step": 16339, "train_loss": 3.3622989654541016, "lr": 0.00020888585537524756, "tps": 44986, "wall": 23803.8} {"step": 16340, "train_loss": 3.316288709640503, "lr": 0.00020886673399309524, "tps": 44978, "wall": 23809.6} {"step": 16341, "train_loss": 3.278902292251587, "lr": 0.0002088476127370612, "tps": 44970, "wall": 23815.4} {"step": 16342, "train_loss": 3.31069278717041, "lr": 0.00020882849160736196, "tps": 44962, "wall": 23821.1} {"step": 16343, "train_loss": 3.3112988471984863, "lr": 0.00020880937060421416, "tps": 44954, "wall": 23826.8} {"step": 16344, "train_loss": 3.256730079650879, "lr": 0.00020879024972783445, "tps": 44946, "wall": 23832.6} {"step": 16345, "train_loss": 3.361466646194458, "lr": 0.0002087711289784394, "tps": 44938, "wall": 23838.3} {"step": 16346, "train_loss": 3.3372597694396973, "lr": 0.00020875200835624553, "tps": 44930, "wall": 23844.1} {"step": 16347, "train_loss": 3.270059585571289, "lr": 0.00020873288786146956, "tps": 44921, "wall": 23849.9} {"step": 16348, "train_loss": 3.1936492919921875, "lr": 0.00020871376749432812, "tps": 44913, "wall": 23855.7} {"step": 16349, "train_loss": 3.2362797260284424, "lr": 0.00020869464725503764, "tps": 44905, "wall": 23861.5} {"step": 16350, "train_loss": 3.3353090286254883, "lr": 0.00020867552714381486, "tps": 44897, "wall": 23867.3} {"step": 16351, "train_loss": 3.371215343475342, "lr": 0.00020865640716087635, "tps": 44889, "wall": 23873.1} {"step": 16352, "train_loss": 3.322343349456787, "lr": 0.0002086372873064386, "tps": 44881, "wall": 23878.9} {"step": 16353, "train_loss": 3.2640011310577393, "lr": 0.0002086181675807183, "tps": 44873, "wall": 23884.6} {"step": 16354, "train_loss": 3.3870232105255127, "lr": 0.00020859904798393197, "tps": 44864, "wall": 23890.5} {"step": 16355, "train_loss": 3.376988410949707, "lr": 0.00020857992851629632, "tps": 44856, "wall": 23896.2} {"step": 16356, "train_loss": 3.385312080383301, "lr": 0.00020856080917802783, "tps": 44848, "wall": 23902.0} {"step": 16357, "train_loss": 3.2540781497955322, "lr": 0.0002085416899693431, "tps": 44840, "wall": 23907.8} {"step": 16358, "train_loss": 3.3010060787200928, "lr": 0.00020852257089045873, "tps": 44832, "wall": 23913.7} {"step": 16359, "train_loss": 3.313201665878296, "lr": 0.00020850345194159132, "tps": 44824, "wall": 23919.5} {"step": 16360, "train_loss": 3.3758442401885986, "lr": 0.00020848433312295738, "tps": 44816, "wall": 23925.2} {"step": 16361, "train_loss": 3.421945333480835, "lr": 0.00020846521443477364, "tps": 44807, "wall": 23931.0} {"step": 16362, "train_loss": 3.38291335105896, "lr": 0.00020844609587725645, "tps": 44799, "wall": 23936.8} {"step": 16363, "train_loss": 3.347280502319336, "lr": 0.00020842697745062258, "tps": 44791, "wall": 23942.6} {"step": 16364, "train_loss": 3.4207448959350586, "lr": 0.00020840785915508846, "tps": 44783, "wall": 23948.5} {"step": 16365, "train_loss": 3.282578945159912, "lr": 0.00020838874099087087, "tps": 44775, "wall": 23954.2} {"step": 16366, "train_loss": 3.225773811340332, "lr": 0.00020836962295818615, "tps": 44767, "wall": 23960.0} {"step": 16367, "train_loss": 3.2955892086029053, "lr": 0.000208350505057251, "tps": 44759, "wall": 23965.9} {"step": 16368, "train_loss": 3.309396266937256, "lr": 0.00020833138728828198, "tps": 44750, "wall": 23971.8} {"step": 16369, "train_loss": 3.3359317779541016, "lr": 0.0002083122696514956, "tps": 44742, "wall": 23977.6} {"step": 16370, "train_loss": 3.3201844692230225, "lr": 0.00020829315214710846, "tps": 44734, "wall": 23983.4} {"step": 16371, "train_loss": 3.3337998390197754, "lr": 0.00020827403477533717, "tps": 44726, "wall": 23989.2} {"step": 16372, "train_loss": 3.336498498916626, "lr": 0.00020825491753639818, "tps": 44718, "wall": 23995.0} {"step": 16373, "train_loss": 3.375251054763794, "lr": 0.00020823580043050814, "tps": 44710, "wall": 24000.8} {"step": 16374, "train_loss": 3.2644834518432617, "lr": 0.00020821668345788363, "tps": 44702, "wall": 24006.7} {"step": 16375, "train_loss": 3.226196765899658, "lr": 0.00020819756661874116, "tps": 44694, "wall": 24012.5} {"step": 16376, "train_loss": 3.3175814151763916, "lr": 0.00020817844991329726, "tps": 44686, "wall": 24018.3} {"step": 16377, "train_loss": 3.1451659202575684, "lr": 0.00020815933334176855, "tps": 44677, "wall": 24024.1} {"step": 16378, "train_loss": 3.3268964290618896, "lr": 0.00020814021690437158, "tps": 44669, "wall": 24030.0} {"step": 16379, "train_loss": 3.341726303100586, "lr": 0.00020812110060132279, "tps": 44661, "wall": 24036.0} {"step": 16380, "train_loss": 3.271247625350952, "lr": 0.00020810198443283885, "tps": 44653, "wall": 24041.8} {"step": 16381, "train_loss": 3.4330053329467773, "lr": 0.00020808286839913627, "tps": 44645, "wall": 24047.7} {"step": 16382, "train_loss": 3.4269843101501465, "lr": 0.00020806375250043165, "tps": 44636, "wall": 24053.6} {"step": 16383, "train_loss": 3.3233532905578613, "lr": 0.00020804463673694144, "tps": 44628, "wall": 24059.4} {"step": 16384, "train_loss": 3.440415859222412, "lr": 0.00020802552110888223, "tps": 44620, "wall": 24065.2} {"step": 16385, "train_loss": 3.2316248416900635, "lr": 0.00020800640561647061, "tps": 44611, "wall": 24071.6} {"step": 16386, "train_loss": 3.286426544189453, "lr": 0.00020798729025992306, "tps": 44602, "wall": 24077.8} {"step": 16387, "train_loss": 3.264141082763672, "lr": 0.00020796817503945607, "tps": 44594, "wall": 24083.6} {"step": 16388, "train_loss": 3.4008560180664062, "lr": 0.00020794905995528634, "tps": 44586, "wall": 24089.5} {"step": 16389, "train_loss": 3.27329421043396, "lr": 0.00020792994500763023, "tps": 44578, "wall": 24095.5} {"step": 16390, "train_loss": 3.4368762969970703, "lr": 0.0002079108301967044, "tps": 44570, "wall": 24101.3} {"step": 16391, "train_loss": 3.3083996772766113, "lr": 0.0002078917155227253, "tps": 44562, "wall": 24107.2} {"step": 16392, "train_loss": 3.3473355770111084, "lr": 0.0002078726009859096, "tps": 44553, "wall": 24113.1} {"step": 16393, "train_loss": 3.207056999206543, "lr": 0.00020785348658647365, "tps": 44545, "wall": 24119.0} {"step": 16394, "train_loss": 3.308467388153076, "lr": 0.00020783437232463404, "tps": 44537, "wall": 24124.8} {"step": 16395, "train_loss": 3.4131577014923096, "lr": 0.00020781525820060738, "tps": 44529, "wall": 24130.7} {"step": 16396, "train_loss": 3.2774152755737305, "lr": 0.0002077961442146101, "tps": 44521, "wall": 24136.6} {"step": 16397, "train_loss": 3.3202967643737793, "lr": 0.00020777703036685874, "tps": 44513, "wall": 24142.5} {"step": 16398, "train_loss": 3.419893503189087, "lr": 0.00020775791665756993, "tps": 44504, "wall": 24148.4} {"step": 16399, "train_loss": 3.366192579269409, "lr": 0.00020773880308696003, "tps": 44496, "wall": 24154.5} {"step": 16400, "train_loss": 3.3149545192718506, "lr": 0.00020771968965524563, "tps": 44488, "wall": 24160.3} {"step": 16401, "train_loss": 3.3472201824188232, "lr": 0.00020770057636264322, "tps": 44480, "wall": 24166.2} {"step": 16402, "train_loss": 3.302417516708374, "lr": 0.0002076814632093694, "tps": 44472, "wall": 24172.2} {"step": 16403, "train_loss": 3.3455159664154053, "lr": 0.00020766235019564064, "tps": 44463, "wall": 24178.1} {"step": 16404, "train_loss": 3.3077332973480225, "lr": 0.0002076432373216734, "tps": 44455, "wall": 24183.9} {"step": 16405, "train_loss": 3.380892515182495, "lr": 0.0002076241245876843, "tps": 44447, "wall": 24189.9} {"step": 16406, "train_loss": 3.2087063789367676, "lr": 0.00020760501199388972, "tps": 44439, "wall": 24195.7} {"step": 16407, "train_loss": 3.342334747314453, "lr": 0.00020758589954050628, "tps": 44431, "wall": 24201.6} {"step": 16408, "train_loss": 3.416463851928711, "lr": 0.0002075667872277504, "tps": 44423, "wall": 24207.5} {"step": 16409, "train_loss": 3.28568172454834, "lr": 0.00020754767505583869, "tps": 44414, "wall": 24213.6} {"step": 16410, "train_loss": 3.304359197616577, "lr": 0.0002075285630249875, "tps": 44406, "wall": 24219.6} {"step": 16411, "train_loss": 3.414659023284912, "lr": 0.00020750945113541346, "tps": 44398, "wall": 24225.5} {"step": 16412, "train_loss": 3.43967342376709, "lr": 0.00020749033938733308, "tps": 44390, "wall": 24231.5} {"step": 16413, "train_loss": 3.4027273654937744, "lr": 0.00020747122778096277, "tps": 44382, "wall": 24237.4} {"step": 16414, "train_loss": 3.4258859157562256, "lr": 0.00020745211631651906, "tps": 44373, "wall": 24243.4} {"step": 16415, "train_loss": 3.4367897510528564, "lr": 0.00020743300499421853, "tps": 44365, "wall": 24249.5} {"step": 16416, "train_loss": 3.374972105026245, "lr": 0.00020741389381427752, "tps": 44357, "wall": 24255.4} {"step": 16417, "train_loss": 3.4538965225219727, "lr": 0.0002073947827769126, "tps": 44349, "wall": 24261.3} {"step": 16418, "train_loss": 3.3069229125976562, "lr": 0.0002073756718823403, "tps": 44341, "wall": 24267.2} {"step": 16419, "train_loss": 3.421961784362793, "lr": 0.00020735656113077705, "tps": 44332, "wall": 24273.2} {"step": 16420, "train_loss": 3.330160140991211, "lr": 0.00020733745052243938, "tps": 44324, "wall": 24279.2} {"step": 16421, "train_loss": 3.281191349029541, "lr": 0.0002073183400575437, "tps": 44316, "wall": 24285.1} {"step": 16422, "train_loss": 3.48292875289917, "lr": 0.00020729922973630665, "tps": 44308, "wall": 24291.1} {"step": 16423, "train_loss": 3.301786422729492, "lr": 0.00020728011955894454, "tps": 44300, "wall": 24297.1} {"step": 16424, "train_loss": 3.3429884910583496, "lr": 0.00020726100952567396, "tps": 44291, "wall": 24303.0} {"step": 16425, "train_loss": 3.3366849422454834, "lr": 0.00020724189963671134, "tps": 44283, "wall": 24309.1} {"step": 16426, "train_loss": 3.3620927333831787, "lr": 0.00020722278989227313, "tps": 44275, "wall": 24315.0} {"step": 16427, "train_loss": 3.2442774772644043, "lr": 0.00020720368029257587, "tps": 44267, "wall": 24320.9} {"step": 16428, "train_loss": 3.3976922035217285, "lr": 0.00020718457083783603, "tps": 44259, "wall": 24326.8} {"step": 16429, "train_loss": 3.343597412109375, "lr": 0.0002071654615282701, "tps": 44251, "wall": 24332.9} {"step": 16430, "train_loss": 3.2586185932159424, "lr": 0.00020714635236409446, "tps": 44242, "wall": 24338.8} {"step": 16431, "train_loss": 3.3574421405792236, "lr": 0.00020712724334552563, "tps": 44234, "wall": 24344.8} {"step": 16432, "train_loss": 3.3147809505462646, "lr": 0.0002071081344727801, "tps": 44226, "wall": 24350.7} {"step": 16433, "train_loss": 3.3318042755126953, "lr": 0.00020708902574607434, "tps": 44218, "wall": 24356.6} {"step": 16434, "train_loss": 3.3564062118530273, "lr": 0.00020706991716562483, "tps": 44210, "wall": 24362.5} {"step": 16435, "train_loss": 3.290132522583008, "lr": 0.00020705080873164797, "tps": 44202, "wall": 24368.5} {"step": 16436, "train_loss": 3.354942798614502, "lr": 0.00020703170044436016, "tps": 44194, "wall": 24374.4} {"step": 16437, "train_loss": 3.36082124710083, "lr": 0.00020701259230397807, "tps": 44186, "wall": 24380.2} {"step": 16438, "train_loss": 3.3841490745544434, "lr": 0.00020699348431071796, "tps": 44178, "wall": 24386.3} {"step": 16439, "train_loss": 3.3573570251464844, "lr": 0.00020697437646479642, "tps": 44170, "wall": 24392.3} {"step": 16440, "train_loss": 3.1692614555358887, "lr": 0.00020695526876642983, "tps": 44162, "wall": 24398.1} {"step": 16441, "train_loss": 3.363049030303955, "lr": 0.0002069361612158346, "tps": 44154, "wall": 24404.1} {"step": 16442, "train_loss": 3.2979278564453125, "lr": 0.00020691705381322727, "tps": 44146, "wall": 24410.0} {"step": 16443, "train_loss": 3.3506622314453125, "lr": 0.00020689794655882432, "tps": 44138, "wall": 24416.0} {"step": 16444, "train_loss": 3.421886920928955, "lr": 0.0002068788394528421, "tps": 44130, "wall": 24421.9} {"step": 16445, "train_loss": 3.3351590633392334, "lr": 0.0002068597324954971, "tps": 44121, "wall": 24427.9} {"step": 16446, "train_loss": 3.383967876434326, "lr": 0.00020684062568700572, "tps": 44114, "wall": 24433.7} {"step": 16447, "train_loss": 3.388913869857788, "lr": 0.00020682151902758452, "tps": 44106, "wall": 24439.7} {"step": 16448, "train_loss": 3.296607494354248, "lr": 0.00020680241251744982, "tps": 44098, "wall": 24445.6} {"step": 16449, "train_loss": 3.3691279888153076, "lr": 0.00020678330615681812, "tps": 44089, "wall": 24451.6} {"step": 16450, "train_loss": 3.298067092895508, "lr": 0.00020676419994590582, "tps": 44081, "wall": 24457.5} {"step": 16451, "train_loss": 3.348801851272583, "lr": 0.00020674509388492939, "tps": 44073, "wall": 24463.5} {"step": 16452, "train_loss": 3.3363609313964844, "lr": 0.00020672598797410525, "tps": 44065, "wall": 24469.4} {"step": 16453, "train_loss": 3.4539988040924072, "lr": 0.00020670688221364984, "tps": 44057, "wall": 24475.3} {"step": 16454, "train_loss": 3.2863028049468994, "lr": 0.00020668777660377962, "tps": 44049, "wall": 24481.2} {"step": 16455, "train_loss": 3.321255922317505, "lr": 0.00020666867114471095, "tps": 44042, "wall": 24487.0} {"step": 16456, "train_loss": 3.2341017723083496, "lr": 0.0002066495658366603, "tps": 44034, "wall": 24493.0} {"step": 16457, "train_loss": 3.2713570594787598, "lr": 0.00020663046067984412, "tps": 44026, "wall": 24498.9} {"step": 16458, "train_loss": 3.317307472229004, "lr": 0.0002066113556744788, "tps": 44018, "wall": 24504.8} {"step": 16459, "train_loss": 3.3220510482788086, "lr": 0.00020659225082078072, "tps": 44010, "wall": 24510.8} {"step": 16460, "train_loss": 3.337287425994873, "lr": 0.00020657314611896633, "tps": 44002, "wall": 24516.7} {"step": 16461, "train_loss": 3.2890512943267822, "lr": 0.00020655404156925212, "tps": 43994, "wall": 24522.6} {"step": 16462, "train_loss": 3.3141539096832275, "lr": 0.00020653493717185444, "tps": 43986, "wall": 24528.6} {"step": 16463, "train_loss": 3.329998016357422, "lr": 0.0002065158329269897, "tps": 43978, "wall": 24534.5} {"step": 16464, "train_loss": 3.299123764038086, "lr": 0.00020649672883487442, "tps": 43970, "wall": 24540.4} {"step": 16465, "train_loss": 3.3597190380096436, "lr": 0.00020647762489572484, "tps": 43962, "wall": 24546.3} {"step": 16466, "train_loss": 3.3022284507751465, "lr": 0.00020645852110975747, "tps": 43954, "wall": 24552.3} {"step": 16467, "train_loss": 3.366556167602539, "lr": 0.00020643941747718874, "tps": 43946, "wall": 24558.2} {"step": 16468, "train_loss": 3.374983072280884, "lr": 0.00020642031399823498, "tps": 43938, "wall": 24564.1} {"step": 16469, "train_loss": 3.4139130115509033, "lr": 0.00020640121067311265, "tps": 43930, "wall": 24570.0} {"step": 16470, "train_loss": 3.3091835975646973, "lr": 0.00020638210750203816, "tps": 43922, "wall": 24576.0} {"step": 16471, "train_loss": 3.2238943576812744, "lr": 0.00020636300448522788, "tps": 43914, "wall": 24581.9} {"step": 16472, "train_loss": 3.457406997680664, "lr": 0.00020634390162289825, "tps": 43907, "wall": 24587.7} {"step": 16473, "train_loss": 3.4227967262268066, "lr": 0.0002063247989152656, "tps": 43899, "wall": 24593.5} {"step": 16474, "train_loss": 3.2651636600494385, "lr": 0.0002063056963625464, "tps": 43891, "wall": 24599.3} {"step": 16475, "train_loss": 3.303892135620117, "lr": 0.00020628659396495697, "tps": 43883, "wall": 24605.2} {"step": 16476, "train_loss": 3.3818068504333496, "lr": 0.00020626749172271378, "tps": 43876, "wall": 24611.0} {"step": 16477, "train_loss": 3.2888457775115967, "lr": 0.00020624838963603318, "tps": 43868, "wall": 24617.0} {"step": 16478, "train_loss": 3.2647223472595215, "lr": 0.00020622928770513155, "tps": 43860, "wall": 24622.8} {"step": 16479, "train_loss": 3.2658255100250244, "lr": 0.0002062101859302253, "tps": 43852, "wall": 24628.6} {"step": 16480, "train_loss": 3.2572262287139893, "lr": 0.0002061910843115308, "tps": 43844, "wall": 24634.6} {"step": 16481, "train_loss": 3.277824878692627, "lr": 0.00020617198284926454, "tps": 43837, "wall": 24640.5} {"step": 16482, "train_loss": 3.374603509902954, "lr": 0.0002061528815436427, "tps": 43829, "wall": 24646.2} {"step": 16483, "train_loss": 3.285430431365967, "lr": 0.00020613378039488177, "tps": 43821, "wall": 24652.1} {"step": 16484, "train_loss": 3.381625175476074, "lr": 0.00020611467940319814, "tps": 43814, "wall": 24657.9} {"step": 16485, "train_loss": 3.30010986328125, "lr": 0.0002060955785688082, "tps": 43806, "wall": 24663.8} {"step": 16486, "train_loss": 3.387260913848877, "lr": 0.00020607647789192828, "tps": 43798, "wall": 24669.6} {"step": 16487, "train_loss": 3.4239234924316406, "lr": 0.00020605737737277476, "tps": 43790, "wall": 24675.5} {"step": 16488, "train_loss": 3.391486644744873, "lr": 0.00020603827701156405, "tps": 43782, "wall": 24681.3} {"step": 16489, "train_loss": 3.410123586654663, "lr": 0.00020601917680851246, "tps": 43775, "wall": 24687.2} {"step": 16490, "train_loss": 3.346299171447754, "lr": 0.0002060000767638364, "tps": 43767, "wall": 24693.1} {"step": 16491, "train_loss": 3.188838005065918, "lr": 0.0002059809768777523, "tps": 43759, "wall": 24699.0} {"step": 16492, "train_loss": 3.3270201683044434, "lr": 0.00020596187715047636, "tps": 43752, "wall": 24704.8} {"step": 16493, "train_loss": 3.2653284072875977, "lr": 0.0002059427775822251, "tps": 43744, "wall": 24710.6} {"step": 16494, "train_loss": 3.4200692176818848, "lr": 0.0002059236781732148, "tps": 43736, "wall": 24716.4} {"step": 16495, "train_loss": 3.326490640640259, "lr": 0.00020590457892366178, "tps": 43729, "wall": 24722.2} {"step": 16496, "train_loss": 3.2595596313476562, "lr": 0.00020588547983378251, "tps": 43721, "wall": 24728.0} {"step": 16497, "train_loss": 3.2691125869750977, "lr": 0.00020586638090379323, "tps": 43714, "wall": 24733.8} {"step": 16498, "train_loss": 3.440624237060547, "lr": 0.00020584728213391041, "tps": 43706, "wall": 24739.6} {"step": 16499, "train_loss": 3.2980799674987793, "lr": 0.00020582818352435033, "tps": 43698, "wall": 24745.3} {"step": 16500, "train_loss": 3.351519823074341, "lr": 0.00020580908507532932, "tps": 43691, "wall": 24751.2} {"step": 16501, "train_loss": 3.414330005645752, "lr": 0.0002057899867870638, "tps": 43683, "wall": 24757.2} {"step": 16502, "train_loss": 3.3433213233947754, "lr": 0.0002057708886597701, "tps": 43675, "wall": 24762.9} {"step": 16503, "train_loss": 3.423553466796875, "lr": 0.0002057517906936645, "tps": 43668, "wall": 24768.7} {"step": 16504, "train_loss": 3.360752820968628, "lr": 0.00020573269288896338, "tps": 43660, "wall": 24774.4} {"step": 16505, "train_loss": 3.4381937980651855, "lr": 0.00020571359524588313, "tps": 43653, "wall": 24780.2} {"step": 16506, "train_loss": 3.302942991256714, "lr": 0.00020569449776464, "tps": 43645, "wall": 24785.9} {"step": 16507, "train_loss": 3.35811448097229, "lr": 0.00020567540044545037, "tps": 43638, "wall": 24791.6} {"step": 16508, "train_loss": 3.3067946434020996, "lr": 0.00020565630328853063, "tps": 43631, "wall": 24797.3} {"step": 16509, "train_loss": 3.285834789276123, "lr": 0.00020563720629409704, "tps": 43623, "wall": 24803.1} {"step": 16510, "train_loss": 3.3553626537323, "lr": 0.00020561810946236592, "tps": 43616, "wall": 24808.8} {"step": 16511, "train_loss": 3.410844326019287, "lr": 0.0002055990127935537, "tps": 43608, "wall": 24814.7} {"step": 16512, "train_loss": 3.392090320587158, "lr": 0.0002055799162878766, "tps": 43601, "wall": 24820.3} {"step": 16513, "train_loss": 3.2998127937316895, "lr": 0.000205560819945551, "tps": 43593, "wall": 24826.1} {"step": 16514, "train_loss": 3.364312171936035, "lr": 0.0002055417237667932, "tps": 43586, "wall": 24831.7} {"step": 16515, "train_loss": 3.4191389083862305, "lr": 0.00020552262775181955, "tps": 43579, "wall": 24837.5} {"step": 16516, "train_loss": 3.352978229522705, "lr": 0.00020550353190084634, "tps": 43571, "wall": 24843.2} {"step": 16517, "train_loss": 3.321800470352173, "lr": 0.0002054844362140899, "tps": 43564, "wall": 24848.9} {"step": 16518, "train_loss": 3.411036491394043, "lr": 0.0002054653406917666, "tps": 43556, "wall": 24854.6} {"step": 16519, "train_loss": 3.331768274307251, "lr": 0.0002054462453340926, "tps": 43549, "wall": 24860.3} {"step": 16520, "train_loss": 3.2515881061553955, "lr": 0.0002054271501412844, "tps": 43542, "wall": 24866.0} {"step": 16521, "train_loss": 3.3984060287475586, "lr": 0.00020540805511355824, "tps": 43534, "wall": 24871.9} {"step": 16522, "train_loss": 3.358279228210449, "lr": 0.00020538896025113043, "tps": 43527, "wall": 24877.6} {"step": 16523, "train_loss": 3.3563122749328613, "lr": 0.00020536986555421725, "tps": 43519, "wall": 24883.3} {"step": 16524, "train_loss": 3.358569622039795, "lr": 0.000205350771023035, "tps": 43512, "wall": 24889.0} {"step": 16525, "train_loss": 3.356044292449951, "lr": 0.00020533167665780005, "tps": 43505, "wall": 24894.7} {"step": 16526, "train_loss": 3.334949493408203, "lr": 0.00020531258245872863, "tps": 43497, "wall": 24900.3} {"step": 16527, "train_loss": 3.3275716304779053, "lr": 0.00020529348842603703, "tps": 43490, "wall": 24906.0} {"step": 16528, "train_loss": 3.419692039489746, "lr": 0.00020527439455994166, "tps": 43483, "wall": 24911.6} {"step": 16529, "train_loss": 3.408576726913452, "lr": 0.0002052553008606587, "tps": 43476, "wall": 24917.3} {"step": 16530, "train_loss": 3.3081703186035156, "lr": 0.00020523620732840452, "tps": 43468, "wall": 24923.0} {"step": 16531, "train_loss": 3.3516671657562256, "lr": 0.00020521711396339539, "tps": 43461, "wall": 24928.7} {"step": 16532, "train_loss": 3.4224114418029785, "lr": 0.0002051980207658476, "tps": 43454, "wall": 24934.5} {"step": 16533, "train_loss": 3.3079404830932617, "lr": 0.00020517892773597738, "tps": 43446, "wall": 24940.2} {"step": 16534, "train_loss": 3.336568832397461, "lr": 0.00020515983487400105, "tps": 43439, "wall": 24945.8} {"step": 16535, "train_loss": 3.3892822265625, "lr": 0.000205140742180135, "tps": 43432, "wall": 24951.5} {"step": 16536, "train_loss": 3.2622766494750977, "lr": 0.0002051216496545954, "tps": 43425, "wall": 24957.2} {"step": 16537, "train_loss": 3.2888479232788086, "lr": 0.0002051025572975985, "tps": 43417, "wall": 24962.9} {"step": 16538, "train_loss": 3.31723690032959, "lr": 0.00020508346510936072, "tps": 43410, "wall": 24968.5} {"step": 16539, "train_loss": 3.383918285369873, "lr": 0.0002050643730900982, "tps": 43403, "wall": 24974.2} {"step": 16540, "train_loss": 3.3834848403930664, "lr": 0.00020504528124002728, "tps": 43396, "wall": 24979.8} {"step": 16541, "train_loss": 3.33481502532959, "lr": 0.0002050261895593642, "tps": 43388, "wall": 24985.6} {"step": 16542, "train_loss": 3.3352084159851074, "lr": 0.00020500709804832526, "tps": 43381, "wall": 24991.2} {"step": 16543, "train_loss": 3.2716314792633057, "lr": 0.00020498800670712677, "tps": 43374, "wall": 24996.9} {"step": 16544, "train_loss": 3.3546597957611084, "lr": 0.00020496891553598495, "tps": 43367, "wall": 25002.5} {"step": 16545, "train_loss": 3.3322854042053223, "lr": 0.00020494982453511603, "tps": 43360, "wall": 25008.2} {"step": 16546, "train_loss": 3.3066117763519287, "lr": 0.00020493073370473632, "tps": 43352, "wall": 25013.8} {"step": 16547, "train_loss": 3.3328826427459717, "lr": 0.00020491164304506208, "tps": 43345, "wall": 25019.5} {"step": 16548, "train_loss": 3.3404736518859863, "lr": 0.0002048925525563096, "tps": 43338, "wall": 25025.1} {"step": 16549, "train_loss": 3.2734673023223877, "lr": 0.00020487346223869505, "tps": 43331, "wall": 25030.8} {"step": 16550, "train_loss": 3.3764872550964355, "lr": 0.00020485437209243475, "tps": 43324, "wall": 25036.5} {"step": 16551, "train_loss": 3.3433945178985596, "lr": 0.0002048352821177449, "tps": 43317, "wall": 25042.1} {"step": 16552, "train_loss": 3.404690742492676, "lr": 0.0002048161923148419, "tps": 43310, "wall": 25047.7} {"step": 16553, "train_loss": 3.2541394233703613, "lr": 0.00020479710268394178, "tps": 43302, "wall": 25053.4} {"step": 16554, "train_loss": 3.2988533973693848, "lr": 0.00020477801322526097, "tps": 43295, "wall": 25059.0} {"step": 16555, "train_loss": 3.3450300693511963, "lr": 0.00020475892393901566, "tps": 43288, "wall": 25064.6} {"step": 16556, "train_loss": 3.3054563999176025, "lr": 0.00020473983482542204, "tps": 43281, "wall": 25070.3} {"step": 16557, "train_loss": 3.37762713432312, "lr": 0.00020472074588469643, "tps": 43274, "wall": 25075.9} {"step": 16558, "train_loss": 3.4133660793304443, "lr": 0.00020470165711705506, "tps": 43267, "wall": 25081.5} {"step": 16559, "train_loss": 3.2813892364501953, "lr": 0.0002046825685227141, "tps": 43260, "wall": 25087.1} {"step": 16560, "train_loss": 3.3197946548461914, "lr": 0.00020466348010188986, "tps": 43253, "wall": 25092.8} {"step": 16561, "train_loss": 3.299187660217285, "lr": 0.0002046443918547985, "tps": 43246, "wall": 25098.4} {"step": 16562, "train_loss": 3.2709312438964844, "lr": 0.00020462530378165635, "tps": 43239, "wall": 25104.0} {"step": 16563, "train_loss": 3.3681020736694336, "lr": 0.0002046062158826796, "tps": 43231, "wall": 25109.6} {"step": 16564, "train_loss": 3.33504581451416, "lr": 0.0002045871281580844, "tps": 43224, "wall": 25115.3} {"step": 16565, "train_loss": 3.360017776489258, "lr": 0.00020456804060808712, "tps": 43217, "wall": 25120.9} {"step": 16566, "train_loss": 3.4599831104278564, "lr": 0.00020454895323290386, "tps": 43210, "wall": 25126.6} {"step": 16567, "train_loss": 3.3516502380371094, "lr": 0.00020452986603275092, "tps": 43203, "wall": 25132.2} {"step": 16568, "train_loss": 3.328871965408325, "lr": 0.00020451077900784448, "tps": 43196, "wall": 25137.7} {"step": 16569, "train_loss": 3.3122398853302, "lr": 0.0002044916921584008, "tps": 43189, "wall": 25143.4} {"step": 16570, "train_loss": 3.3518519401550293, "lr": 0.00020447260548463604, "tps": 43182, "wall": 25149.1} {"step": 16571, "train_loss": 3.339887857437134, "lr": 0.0002044535189867664, "tps": 43175, "wall": 25154.6} {"step": 16572, "train_loss": 3.25602388381958, "lr": 0.0002044344326650083, "tps": 43168, "wall": 25160.3} {"step": 16573, "train_loss": 3.429478645324707, "lr": 0.00020441534651957763, "tps": 43161, "wall": 25165.9} {"step": 16574, "train_loss": 3.3021905422210693, "lr": 0.00020439626055069078, "tps": 43154, "wall": 25171.6} {"step": 16575, "train_loss": 3.2818760871887207, "lr": 0.000204377174758564, "tps": 43147, "wall": 25177.2} {"step": 16576, "train_loss": 3.3844292163848877, "lr": 0.0002043580891434134, "tps": 43140, "wall": 25182.8} {"step": 16577, "train_loss": 3.3088371753692627, "lr": 0.00020433900370545516, "tps": 43133, "wall": 25188.5} {"step": 16578, "train_loss": 3.3226208686828613, "lr": 0.0002043199184449056, "tps": 43126, "wall": 25194.1} {"step": 16579, "train_loss": 3.3180055618286133, "lr": 0.00020430083336198088, "tps": 43119, "wall": 25199.7} {"step": 16580, "train_loss": 3.426581382751465, "lr": 0.00020428174845689708, "tps": 43112, "wall": 25205.3} {"step": 16581, "train_loss": 3.421700954437256, "lr": 0.00020426266372987052, "tps": 43105, "wall": 25210.9} {"step": 16582, "train_loss": 3.288672924041748, "lr": 0.00020424357918111738, "tps": 43098, "wall": 25216.4} {"step": 16583, "train_loss": 3.290731906890869, "lr": 0.00020422449481085378, "tps": 43091, "wall": 25222.1} {"step": 16584, "train_loss": 3.3460702896118164, "lr": 0.000204205410619296, "tps": 43084, "wall": 25227.6} {"step": 16585, "train_loss": 3.3432912826538086, "lr": 0.0002041863266066602, "tps": 43077, "wall": 25233.3} {"step": 16586, "train_loss": 3.2349138259887695, "lr": 0.0002041672427731625, "tps": 43070, "wall": 25238.9} {"step": 16587, "train_loss": 3.2956438064575195, "lr": 0.00020414815911901912, "tps": 43063, "wall": 25244.4} {"step": 16588, "train_loss": 3.1764912605285645, "lr": 0.00020412907564444627, "tps": 43056, "wall": 25250.0} {"step": 16589, "train_loss": 3.418102264404297, "lr": 0.00020410999234966016, "tps": 43049, "wall": 25255.6} {"step": 16590, "train_loss": 3.3095502853393555, "lr": 0.00020409090923487685, "tps": 43042, "wall": 25261.2} {"step": 16591, "train_loss": 3.3373985290527344, "lr": 0.0002040718263003126, "tps": 43035, "wall": 25266.8} {"step": 16592, "train_loss": 3.4306840896606445, "lr": 0.0002040527435461836, "tps": 43028, "wall": 25272.3} {"step": 16593, "train_loss": 3.3638336658477783, "lr": 0.00020403366097270596, "tps": 43021, "wall": 25277.9} {"step": 16594, "train_loss": 3.2738101482391357, "lr": 0.0002040145785800958, "tps": 43015, "wall": 25283.4} {"step": 16595, "train_loss": 3.3230504989624023, "lr": 0.00020399549636856943, "tps": 43008, "wall": 25289.0} {"step": 16596, "train_loss": 3.378223419189453, "lr": 0.00020397641433834296, "tps": 43001, "wall": 25294.7} {"step": 16597, "train_loss": 3.321363925933838, "lr": 0.00020395733248963248, "tps": 42994, "wall": 25300.3} {"step": 16598, "train_loss": 3.2874326705932617, "lr": 0.00020393825082265426, "tps": 42987, "wall": 25305.9} {"step": 16599, "train_loss": 3.2478604316711426, "lr": 0.00020391916933762438, "tps": 42980, "wall": 25311.4} {"step": 16600, "train_loss": 3.305978298187256, "lr": 0.00020390008803475903, "tps": 42973, "wall": 25317.0} {"step": 16601, "train_loss": 3.380305767059326, "lr": 0.00020388100691427435, "tps": 42966, "wall": 25322.6} {"step": 16602, "train_loss": 3.3470139503479004, "lr": 0.00020386192597638653, "tps": 42959, "wall": 25328.1} {"step": 16603, "train_loss": 3.3363354206085205, "lr": 0.00020384284522131165, "tps": 42953, "wall": 25333.7} {"step": 16604, "train_loss": 3.3147459030151367, "lr": 0.00020382376464926592, "tps": 42946, "wall": 25339.2} {"step": 16605, "train_loss": 3.250498056411743, "lr": 0.00020380468426046543, "tps": 42939, "wall": 25344.8} {"step": 16606, "train_loss": 3.3941152095794678, "lr": 0.0002037856040551263, "tps": 42932, "wall": 25350.5} {"step": 16607, "train_loss": 3.3583903312683105, "lr": 0.0002037665240334648, "tps": 42925, "wall": 25356.0} {"step": 16608, "train_loss": 3.430713176727295, "lr": 0.000203747444195697, "tps": 42918, "wall": 25361.6} {"step": 16609, "train_loss": 3.2483010292053223, "lr": 0.00020372836454203897, "tps": 42912, "wall": 25367.1} {"step": 16610, "train_loss": 3.2809698581695557, "lr": 0.00020370928507270692, "tps": 42905, "wall": 25372.7} {"step": 16611, "train_loss": 3.30612850189209, "lr": 0.000203690205787917, "tps": 42898, "wall": 25378.2} {"step": 16612, "train_loss": 3.368544578552246, "lr": 0.00020367112668788528, "tps": 42891, "wall": 25383.8} {"step": 16613, "train_loss": 3.359623670578003, "lr": 0.00020365204777282792, "tps": 42884, "wall": 25389.3} {"step": 16614, "train_loss": 3.413299798965454, "lr": 0.0002036329690429611, "tps": 42877, "wall": 25394.9} {"step": 16615, "train_loss": 3.245303153991699, "lr": 0.00020361389049850087, "tps": 42871, "wall": 25400.5} {"step": 16616, "train_loss": 3.4576988220214844, "lr": 0.0002035948121396633, "tps": 42864, "wall": 25406.0} {"step": 16617, "train_loss": 3.318444013595581, "lr": 0.0002035757339666647, "tps": 42857, "wall": 25411.7} {"step": 16618, "train_loss": 3.3303003311157227, "lr": 0.000203556655979721, "tps": 42850, "wall": 25417.2} {"step": 16619, "train_loss": 3.354074716567993, "lr": 0.00020353757817904842, "tps": 42843, "wall": 25422.8} {"step": 16620, "train_loss": 3.3654661178588867, "lr": 0.00020351850056486302, "tps": 42837, "wall": 25428.3} {"step": 16621, "train_loss": 3.418548107147217, "lr": 0.00020349942313738098, "tps": 42830, "wall": 25433.8} {"step": 16622, "train_loss": 3.3237719535827637, "lr": 0.00020348034589681832, "tps": 42823, "wall": 25439.4} {"step": 16623, "train_loss": 3.2603518962860107, "lr": 0.00020346126884339123, "tps": 42816, "wall": 25444.9} {"step": 16624, "train_loss": 3.35361385345459, "lr": 0.00020344219197731577, "tps": 42810, "wall": 25450.5} {"step": 16625, "train_loss": 3.350931167602539, "lr": 0.00020342311529880807, "tps": 42803, "wall": 25456.1} {"step": 16626, "train_loss": 3.351717948913574, "lr": 0.00020340403880808418, "tps": 42796, "wall": 25461.7} {"step": 16627, "train_loss": 3.359490394592285, "lr": 0.00020338496250536027, "tps": 42789, "wall": 25467.2} {"step": 16628, "train_loss": 3.4210753440856934, "lr": 0.0002033658863908524, "tps": 42782, "wall": 25472.9} {"step": 16629, "train_loss": 3.3679251670837402, "lr": 0.00020334681046477662, "tps": 42775, "wall": 25478.4} {"step": 16630, "train_loss": 3.4576499462127686, "lr": 0.00020332773472734914, "tps": 42769, "wall": 25484.0} {"step": 16631, "train_loss": 3.4629316329956055, "lr": 0.00020330865917878596, "tps": 42762, "wall": 25489.5} {"step": 16632, "train_loss": 3.438581943511963, "lr": 0.00020328958381930318, "tps": 42755, "wall": 25495.1} {"step": 16633, "train_loss": 3.338836193084717, "lr": 0.0002032705086491169, "tps": 42748, "wall": 25500.7} {"step": 16634, "train_loss": 3.2447667121887207, "lr": 0.00020325143366844325, "tps": 42742, "wall": 25506.2} {"step": 16635, "train_loss": 3.328591823577881, "lr": 0.00020323235887749822, "tps": 42735, "wall": 25511.8} {"step": 16636, "train_loss": 3.273963451385498, "lr": 0.0002032132842764979, "tps": 42728, "wall": 25517.3} {"step": 16637, "train_loss": 3.334120512008667, "lr": 0.00020319420986565848, "tps": 42721, "wall": 25522.9} {"step": 16638, "train_loss": 3.403562307357788, "lr": 0.00020317513564519591, "tps": 42715, "wall": 25528.4} {"step": 16639, "train_loss": 3.364989757537842, "lr": 0.0002031560616153263, "tps": 42708, "wall": 25534.1} {"step": 16640, "train_loss": 3.3012218475341797, "lr": 0.00020313698777626576, "tps": 42701, "wall": 25539.6} {"step": 16641, "train_loss": 3.3749725818634033, "lr": 0.00020311791412823036, "tps": 42695, "wall": 25545.1} {"step": 16642, "train_loss": 3.3947644233703613, "lr": 0.0002030988406714361, "tps": 42688, "wall": 25550.7} {"step": 16643, "train_loss": 3.3045997619628906, "lr": 0.0002030797674060991, "tps": 42681, "wall": 25556.2} {"step": 16644, "train_loss": 3.313523292541504, "lr": 0.00020306069433243543, "tps": 42674, "wall": 25561.8} {"step": 16645, "train_loss": 3.400932550430298, "lr": 0.0002030416214506611, "tps": 42668, "wall": 25567.3} {"step": 16646, "train_loss": 3.3093442916870117, "lr": 0.00020302254876099224, "tps": 42661, "wall": 25572.9} {"step": 16647, "train_loss": 3.4327845573425293, "lr": 0.0002030034762636448, "tps": 42654, "wall": 25578.4} {"step": 16648, "train_loss": 3.3068203926086426, "lr": 0.000202984403958835, "tps": 42648, "wall": 25584.0} {"step": 16649, "train_loss": 3.2994651794433594, "lr": 0.0002029653318467787, "tps": 42641, "wall": 25589.5} {"step": 16650, "train_loss": 3.4008803367614746, "lr": 0.00020294625992769207, "tps": 42634, "wall": 25595.3} {"step": 16651, "train_loss": 3.4211628437042236, "lr": 0.00020292718820179116, "tps": 42627, "wall": 25600.7} {"step": 16652, "train_loss": 3.370958089828491, "lr": 0.00020290811666929197, "tps": 42621, "wall": 25606.3} {"step": 16653, "train_loss": 3.4537739753723145, "lr": 0.00020288904533041056, "tps": 42614, "wall": 25611.8} {"step": 16654, "train_loss": 3.3181869983673096, "lr": 0.00020286997418536297, "tps": 42607, "wall": 25617.4} {"step": 16655, "train_loss": 3.3691234588623047, "lr": 0.0002028509032343652, "tps": 42601, "wall": 25622.9} {"step": 16656, "train_loss": 3.3782365322113037, "lr": 0.00020283183247763335, "tps": 42594, "wall": 25628.4} {"step": 16657, "train_loss": 3.3728439807891846, "lr": 0.0002028127619153834, "tps": 42587, "wall": 25634.0} {"step": 16658, "train_loss": 3.3813514709472656, "lr": 0.0002027936915478315, "tps": 42581, "wall": 25639.4} {"step": 16659, "train_loss": 3.41485333442688, "lr": 0.00020277462137519353, "tps": 42574, "wall": 25644.9} {"step": 16660, "train_loss": 3.3389744758605957, "lr": 0.0002027555513976856, "tps": 42568, "wall": 25650.6} {"step": 16661, "train_loss": 3.358372926712036, "lr": 0.0002027364816155237, "tps": 42561, "wall": 25656.1} {"step": 16662, "train_loss": 3.4302713871002197, "lr": 0.0002027174120289239, "tps": 42554, "wall": 25661.6} {"step": 16663, "train_loss": 3.253251552581787, "lr": 0.00020269834263810218, "tps": 42548, "wall": 25667.1} {"step": 16664, "train_loss": 3.3164048194885254, "lr": 0.00020267927344327458, "tps": 42541, "wall": 25672.7} {"step": 16665, "train_loss": 3.2655792236328125, "lr": 0.00020266020444465705, "tps": 42535, "wall": 25678.2} {"step": 16666, "train_loss": 3.3791110515594482, "lr": 0.00020264113564246575, "tps": 42528, "wall": 25683.7} {"step": 16667, "train_loss": 3.3536953926086426, "lr": 0.0002026220670369165, "tps": 42521, "wall": 25689.3} {"step": 16668, "train_loss": 3.374856948852539, "lr": 0.00020260299862822555, "tps": 42515, "wall": 25694.9} {"step": 16669, "train_loss": 3.3791441917419434, "lr": 0.00020258393041660866, "tps": 42508, "wall": 25700.5} {"step": 16670, "train_loss": 3.395235538482666, "lr": 0.00020256486240228196, "tps": 42501, "wall": 25706.0} {"step": 16671, "train_loss": 3.383942127227783, "lr": 0.0002025457945854615, "tps": 42494, "wall": 25711.6} {"step": 16672, "train_loss": 3.3704824447631836, "lr": 0.00020252672696636318, "tps": 42488, "wall": 25717.2} {"step": 16673, "train_loss": 3.326005220413208, "lr": 0.00020250765954520303, "tps": 42481, "wall": 25722.7} {"step": 16674, "train_loss": 3.274810314178467, "lr": 0.00020248859232219709, "tps": 42475, "wall": 25728.2} {"step": 16675, "train_loss": 3.2749247550964355, "lr": 0.00020246952529756132, "tps": 42468, "wall": 25733.7} {"step": 16676, "train_loss": 3.3155739307403564, "lr": 0.00020245045847151172, "tps": 42462, "wall": 25739.2} {"step": 16677, "train_loss": 3.4148566722869873, "lr": 0.00020243139184426422, "tps": 42455, "wall": 25744.8} {"step": 16678, "train_loss": 3.253775119781494, "lr": 0.00020241232541603492, "tps": 42449, "wall": 25750.3} {"step": 16679, "train_loss": 3.2593448162078857, "lr": 0.00020239325918703976, "tps": 42442, "wall": 25755.8} {"step": 16680, "train_loss": 3.2901864051818848, "lr": 0.00020237419315749468, "tps": 42435, "wall": 25761.4} {"step": 16681, "train_loss": 3.2341907024383545, "lr": 0.00020235512732761572, "tps": 42429, "wall": 25766.9} {"step": 16682, "train_loss": 3.3065409660339355, "lr": 0.00020233606169761884, "tps": 42422, "wall": 25772.5} {"step": 16683, "train_loss": 3.4147896766662598, "lr": 0.00020231699626771993, "tps": 42416, "wall": 25778.0} {"step": 16684, "train_loss": 3.4371402263641357, "lr": 0.0002022979310381351, "tps": 42409, "wall": 25783.6} {"step": 16685, "train_loss": 3.3605525493621826, "lr": 0.00020227886600908027, "tps": 42402, "wall": 25789.1} {"step": 16686, "train_loss": 3.306224822998047, "lr": 0.0002022598011807714, "tps": 42396, "wall": 25794.6} {"step": 16687, "train_loss": 3.367945432662964, "lr": 0.00020224073655342447, "tps": 42389, "wall": 25800.1} {"step": 16688, "train_loss": 3.3476438522338867, "lr": 0.00020222167212725545, "tps": 42383, "wall": 25805.6} {"step": 16689, "train_loss": 3.3645477294921875, "lr": 0.0002022026079024802, "tps": 42376, "wall": 25811.1} {"step": 16690, "train_loss": 3.347543954849243, "lr": 0.0002021835438793149, "tps": 42370, "wall": 25816.6} {"step": 16691, "train_loss": 3.4052915573120117, "lr": 0.0002021644800579753, "tps": 42364, "wall": 25822.1} {"step": 16692, "train_loss": 3.311161518096924, "lr": 0.00020214541643867744, "tps": 42357, "wall": 25827.6} {"step": 16693, "train_loss": 3.227133274078369, "lr": 0.00020212635302163724, "tps": 42350, "wall": 25833.2} {"step": 16694, "train_loss": 3.281313180923462, "lr": 0.00020210728980707074, "tps": 42344, "wall": 25838.7} {"step": 16695, "train_loss": 3.431584358215332, "lr": 0.00020208822679519382, "tps": 42337, "wall": 25844.2} {"step": 16696, "train_loss": 3.218559741973877, "lr": 0.00020206916398622245, "tps": 42331, "wall": 25849.7} {"step": 16697, "train_loss": 3.2891323566436768, "lr": 0.00020205010138037253, "tps": 42324, "wall": 25855.3} {"step": 16698, "train_loss": 3.4082484245300293, "lr": 0.00020203103897786003, "tps": 42318, "wall": 25860.8} {"step": 16699, "train_loss": 3.3551383018493652, "lr": 0.00020201197677890091, "tps": 42311, "wall": 25866.3} {"step": 16700, "train_loss": 3.38181209564209, "lr": 0.00020199291478371106, "tps": 42305, "wall": 25871.8} {"step": 16701, "train_loss": 3.290660858154297, "lr": 0.00020197385299250647, "tps": 42298, "wall": 25877.4} {"step": 16702, "train_loss": 3.3408493995666504, "lr": 0.00020195479140550307, "tps": 42292, "wall": 25882.9} {"step": 16703, "train_loss": 3.35162353515625, "lr": 0.00020193573002291672, "tps": 42285, "wall": 25888.4} {"step": 16704, "train_loss": 3.2554211616516113, "lr": 0.00020191666884496342, "tps": 42279, "wall": 25894.0} {"step": 16705, "train_loss": 3.253044605255127, "lr": 0.00020189760787185909, "tps": 42272, "wall": 25899.5} {"step": 16706, "train_loss": 3.2840471267700195, "lr": 0.00020187854710381959, "tps": 42266, "wall": 25905.1} {"step": 16707, "train_loss": 3.3441717624664307, "lr": 0.00020185948654106092, "tps": 42259, "wall": 25910.6} {"step": 16708, "train_loss": 3.3369712829589844, "lr": 0.000201840426183799, "tps": 42253, "wall": 25916.1} {"step": 16709, "train_loss": 3.3212082386016846, "lr": 0.00020182136603224965, "tps": 42246, "wall": 25921.5} {"step": 16710, "train_loss": 3.421229362487793, "lr": 0.0002018023060866289, "tps": 42240, "wall": 25927.1} {"step": 16711, "train_loss": 3.2494850158691406, "lr": 0.00020178324634715256, "tps": 42234, "wall": 25932.6} {"step": 16712, "train_loss": 3.300661087036133, "lr": 0.00020176418681403665, "tps": 42227, "wall": 25938.1} {"step": 16713, "train_loss": 3.371903896331787, "lr": 0.000201745127487497, "tps": 42221, "wall": 25943.6} {"step": 16714, "train_loss": 3.3073410987854004, "lr": 0.0002017260683677495, "tps": 42214, "wall": 25949.1} {"step": 16715, "train_loss": 3.403963804244995, "lr": 0.00020170700945501015, "tps": 42208, "wall": 25954.7} {"step": 16716, "train_loss": 3.396881580352783, "lr": 0.00020168795074949474, "tps": 42201, "wall": 25960.2} {"step": 16717, "train_loss": 3.2994558811187744, "lr": 0.00020166889225141921, "tps": 42195, "wall": 25965.7} {"step": 16718, "train_loss": 3.2518885135650635, "lr": 0.00020164983396099947, "tps": 42188, "wall": 25971.2} {"step": 16719, "train_loss": 3.3546648025512695, "lr": 0.0002016307758784514, "tps": 42182, "wall": 25976.7} {"step": 16720, "train_loss": 3.370945692062378, "lr": 0.00020161171800399088, "tps": 42176, "wall": 25982.2} {"step": 16721, "train_loss": 3.326308250427246, "lr": 0.00020159266033783384, "tps": 42169, "wall": 25987.7} {"step": 16722, "train_loss": 3.339975595474243, "lr": 0.00020157360288019618, "tps": 42163, "wall": 25993.2} {"step": 16723, "train_loss": 3.3988990783691406, "lr": 0.00020155454563129368, "tps": 42156, "wall": 25998.7} {"step": 16724, "train_loss": 3.3998396396636963, "lr": 0.00020153548859134227, "tps": 42150, "wall": 26004.2} {"step": 16725, "train_loss": 3.2839105129241943, "lr": 0.00020151643176055792, "tps": 42144, "wall": 26009.7} {"step": 16726, "train_loss": 3.2437572479248047, "lr": 0.00020149737513915636, "tps": 42137, "wall": 26015.3} {"step": 16727, "train_loss": 3.3475165367126465, "lr": 0.00020147831872735354, "tps": 42131, "wall": 26020.9} {"step": 16728, "train_loss": 3.331847667694092, "lr": 0.00020145926252536538, "tps": 42124, "wall": 26026.4} {"step": 16729, "train_loss": 3.3134384155273438, "lr": 0.00020144020653340764, "tps": 42118, "wall": 26031.8} {"step": 16730, "train_loss": 3.384336471557617, "lr": 0.00020142115075169628, "tps": 42112, "wall": 26037.3} {"step": 16731, "train_loss": 3.3432259559631348, "lr": 0.00020140209518044712, "tps": 42105, "wall": 26042.8} {"step": 16732, "train_loss": 3.462261915206909, "lr": 0.00020138303981987604, "tps": 42099, "wall": 26048.3} {"step": 16733, "train_loss": 3.3301053047180176, "lr": 0.0002013639846701989, "tps": 42092, "wall": 26053.8} {"step": 16734, "train_loss": 3.330961227416992, "lr": 0.00020134492973163153, "tps": 42086, "wall": 26059.3} {"step": 16735, "train_loss": 3.3924360275268555, "lr": 0.00020132587500438983, "tps": 42080, "wall": 26064.8} {"step": 16736, "train_loss": 3.3906989097595215, "lr": 0.00020130682048868955, "tps": 42073, "wall": 26070.4} {"step": 16737, "train_loss": 3.4389216899871826, "lr": 0.00020128776618474667, "tps": 42067, "wall": 26075.9} {"step": 16738, "train_loss": 3.2724480628967285, "lr": 0.00020126871209277702, "tps": 42061, "wall": 26081.3} {"step": 16739, "train_loss": 3.3465449810028076, "lr": 0.0002012496582129964, "tps": 42054, "wall": 26086.8} {"step": 16740, "train_loss": 3.326847553253174, "lr": 0.00020123060454562067, "tps": 42048, "wall": 26092.3} {"step": 16741, "train_loss": 3.4611666202545166, "lr": 0.0002012115510908656, "tps": 42041, "wall": 26097.8} {"step": 16742, "train_loss": 3.3870480060577393, "lr": 0.00020119249784894717, "tps": 42035, "wall": 26103.3} {"step": 16743, "train_loss": 3.4154601097106934, "lr": 0.00020117344482008113, "tps": 42029, "wall": 26108.8} {"step": 16744, "train_loss": 3.3214993476867676, "lr": 0.00020115439200448328, "tps": 42022, "wall": 26114.4} {"step": 16745, "train_loss": 3.2821483612060547, "lr": 0.00020113533940236956, "tps": 42016, "wall": 26119.9} {"step": 16746, "train_loss": 3.3189518451690674, "lr": 0.0002011162870139557, "tps": 42010, "wall": 26125.4} {"step": 16747, "train_loss": 3.183811902999878, "lr": 0.00020109723483945758, "tps": 42003, "wall": 26131.0} {"step": 16748, "train_loss": 3.348548412322998, "lr": 0.00020107818287909096, "tps": 41997, "wall": 26136.5} {"step": 16749, "train_loss": 3.3692235946655273, "lr": 0.0002010591311330718, "tps": 41991, "wall": 26141.9} {"step": 16750, "train_loss": 3.262209415435791, "lr": 0.00020104007960161573, "tps": 41984, "wall": 26147.5} {"step": 16751, "train_loss": 3.360013246536255, "lr": 0.0002010210282849387, "tps": 41978, "wall": 26153.0} {"step": 16752, "train_loss": 3.365182638168335, "lr": 0.00020100197718325654, "tps": 41971, "wall": 26158.6} {"step": 16753, "train_loss": 3.3411788940429688, "lr": 0.00020098292629678493, "tps": 41965, "wall": 26164.1} {"step": 16754, "train_loss": 3.271914482116699, "lr": 0.0002009638756257398, "tps": 41959, "wall": 26169.7} {"step": 16755, "train_loss": 3.2398200035095215, "lr": 0.0002009448251703369, "tps": 41952, "wall": 26175.2} {"step": 16756, "train_loss": 3.315812587738037, "lr": 0.00020092577493079205, "tps": 41946, "wall": 26180.7} {"step": 16757, "train_loss": 3.312119960784912, "lr": 0.0002009067249073211, "tps": 41940, "wall": 26186.2} {"step": 16758, "train_loss": 3.361264944076538, "lr": 0.00020088767510013976, "tps": 41933, "wall": 26191.8} {"step": 16759, "train_loss": 3.2844314575195312, "lr": 0.00020086862550946388, "tps": 41927, "wall": 26197.4} {"step": 16760, "train_loss": 3.3868515491485596, "lr": 0.00020084957613550924, "tps": 41920, "wall": 26203.0} {"step": 16761, "train_loss": 3.441222667694092, "lr": 0.00020083052697849162, "tps": 41914, "wall": 26208.5} {"step": 16762, "train_loss": 3.3828701972961426, "lr": 0.00020081147803862684, "tps": 41908, "wall": 26214.0} {"step": 16763, "train_loss": 3.3121132850646973, "lr": 0.0002007924293161307, "tps": 41901, "wall": 26219.6} {"step": 16764, "train_loss": 3.3030261993408203, "lr": 0.0002007733808112189, "tps": 41895, "wall": 26225.1} {"step": 16765, "train_loss": 3.4358768463134766, "lr": 0.00020075433252410733, "tps": 41888, "wall": 26230.7} {"step": 16766, "train_loss": 3.2709922790527344, "lr": 0.00020073528445501175, "tps": 41882, "wall": 26236.2} {"step": 16767, "train_loss": 3.3440089225769043, "lr": 0.00020071623660414788, "tps": 41876, "wall": 26241.8} {"step": 16768, "train_loss": 3.3834493160247803, "lr": 0.0002006971889717315, "tps": 41869, "wall": 26247.4} {"step": 16769, "train_loss": 3.402571678161621, "lr": 0.00020067814155797845, "tps": 41863, "wall": 26253.0} {"step": 16770, "train_loss": 3.3659019470214844, "lr": 0.0002006590943631044, "tps": 41857, "wall": 26258.5} {"step": 16771, "train_loss": 3.268296241760254, "lr": 0.0002006400473873253, "tps": 41850, "wall": 26264.1} {"step": 16772, "train_loss": 3.236429214477539, "lr": 0.0002006210006308567, "tps": 41844, "wall": 26269.7} {"step": 16773, "train_loss": 3.280097007751465, "lr": 0.00020060195409391446, "tps": 41837, "wall": 26275.2} {"step": 16774, "train_loss": 3.3752551078796387, "lr": 0.00020058290777671432, "tps": 41831, "wall": 26280.8} {"step": 16775, "train_loss": 3.3220338821411133, "lr": 0.00020056386167947206, "tps": 41825, "wall": 26286.3} {"step": 16776, "train_loss": 3.32267427444458, "lr": 0.00020054481580240342, "tps": 41818, "wall": 26291.9} {"step": 16777, "train_loss": 3.27937650680542, "lr": 0.0002005257701457242, "tps": 41812, "wall": 26297.4} {"step": 16778, "train_loss": 3.3265295028686523, "lr": 0.00020050672470965007, "tps": 41806, "wall": 26302.9} {"step": 16779, "train_loss": 3.377945899963379, "lr": 0.0002004876794943968, "tps": 41799, "wall": 26308.5} {"step": 16780, "train_loss": 3.2258737087249756, "lr": 0.00020046863450018019, "tps": 41793, "wall": 26314.2} {"step": 16781, "train_loss": 3.356705904006958, "lr": 0.00020044958972721593, "tps": 41787, "wall": 26319.8} {"step": 16782, "train_loss": 3.333559513092041, "lr": 0.00020043054517571976, "tps": 41780, "wall": 26325.3} {"step": 16783, "train_loss": 3.3638367652893066, "lr": 0.00020041150084590745, "tps": 41774, "wall": 26330.9} {"step": 16784, "train_loss": 3.55552339553833, "lr": 0.00020039245673799476, "tps": 41768, "wall": 26336.4} {"step": 16785, "train_loss": 3.37109637260437, "lr": 0.00020037341285219728, "tps": 41761, "wall": 26341.9} {"step": 16786, "train_loss": 3.335096597671509, "lr": 0.00020035436918873088, "tps": 41755, "wall": 26347.5} {"step": 16787, "train_loss": 3.2899398803710938, "lr": 0.00020033532574781132, "tps": 41749, "wall": 26353.1} {"step": 16788, "train_loss": 3.4697108268737793, "lr": 0.0002003162825296542, "tps": 41742, "wall": 26358.6} {"step": 16789, "train_loss": 3.294509172439575, "lr": 0.0002002972395344753, "tps": 41736, "wall": 26364.1} {"step": 16790, "train_loss": 3.2031288146972656, "lr": 0.0002002781967624903, "tps": 41730, "wall": 26369.6} {"step": 16791, "train_loss": 3.207930564880371, "lr": 0.000200259154213915, "tps": 41723, "wall": 26375.3} {"step": 16792, "train_loss": 3.2713377475738525, "lr": 0.00020024011188896505, "tps": 41717, "wall": 26380.8} {"step": 16793, "train_loss": 3.2888076305389404, "lr": 0.0002002210697878562, "tps": 41711, "wall": 26386.4} {"step": 16794, "train_loss": 3.2088844776153564, "lr": 0.00020020202791080417, "tps": 41705, "wall": 26391.9} {"step": 16795, "train_loss": 3.320596694946289, "lr": 0.00020018298625802455, "tps": 41698, "wall": 26397.3} {"step": 16796, "train_loss": 3.4752566814422607, "lr": 0.00020016394482973317, "tps": 41692, "wall": 26402.9} {"step": 16797, "train_loss": 3.36305570602417, "lr": 0.0002001449036261457, "tps": 41686, "wall": 26408.5} {"step": 16798, "train_loss": 3.281928539276123, "lr": 0.0002001258626474779, "tps": 41680, "wall": 26414.0} {"step": 16799, "train_loss": 3.349060535430908, "lr": 0.0002001068218939453, "tps": 41673, "wall": 26419.5} {"step": 16800, "train_loss": 3.24806809425354, "lr": 0.00020008778136576373, "tps": 41667, "wall": 26425.0} {"step": 16801, "train_loss": 3.3186848163604736, "lr": 0.0002000687410631489, "tps": 41661, "wall": 26430.6} {"step": 16802, "train_loss": 3.4285709857940674, "lr": 0.00020004970098631638, "tps": 41655, "wall": 26436.2} {"step": 16803, "train_loss": 3.2542686462402344, "lr": 0.00020003066113548194, "tps": 41648, "wall": 26441.7} {"step": 16804, "train_loss": 3.3330612182617188, "lr": 0.00020001162151086135, "tps": 41642, "wall": 26447.2} {"step": 16805, "train_loss": 3.3511078357696533, "lr": 0.00019999258211267007, "tps": 41636, "wall": 26452.8} {"step": 16806, "train_loss": 3.2838289737701416, "lr": 0.00019997354294112394, "tps": 41630, "wall": 26458.3} {"step": 16807, "train_loss": 3.2924678325653076, "lr": 0.0001999545039964386, "tps": 41623, "wall": 26463.8} {"step": 16808, "train_loss": 3.334545850753784, "lr": 0.00019993546527882975, "tps": 41617, "wall": 26469.4} {"step": 16809, "train_loss": 3.3509037494659424, "lr": 0.00019991642678851302, "tps": 41611, "wall": 26474.8} {"step": 16810, "train_loss": 3.282412528991699, "lr": 0.00019989738852570406, "tps": 41605, "wall": 26480.3} {"step": 16811, "train_loss": 3.307095766067505, "lr": 0.00019987835049061864, "tps": 41599, "wall": 26485.9} {"step": 16812, "train_loss": 3.3874785900115967, "lr": 0.00019985931268347228, "tps": 41592, "wall": 26491.5} {"step": 16813, "train_loss": 3.373600959777832, "lr": 0.00019984027510448074, "tps": 41586, "wall": 26497.0} {"step": 16814, "train_loss": 3.2874574661254883, "lr": 0.00019982123775385971, "tps": 41580, "wall": 26502.5} {"step": 16815, "train_loss": 3.354785680770874, "lr": 0.00019980220063182472, "tps": 41574, "wall": 26508.0} {"step": 16816, "train_loss": 3.370145797729492, "lr": 0.0001997831637385915, "tps": 41568, "wall": 26513.5} {"step": 16817, "train_loss": 3.4183552265167236, "lr": 0.00019976412707437571, "tps": 41561, "wall": 26519.1} {"step": 16818, "train_loss": 3.40146803855896, "lr": 0.000199745090639393, "tps": 41555, "wall": 26524.6} {"step": 16819, "train_loss": 3.231973648071289, "lr": 0.00019972605443385896, "tps": 41549, "wall": 26530.1} {"step": 16820, "train_loss": 3.147549629211426, "lr": 0.00019970701845798932, "tps": 41543, "wall": 26535.7} {"step": 16821, "train_loss": 3.370046377182007, "lr": 0.00019968798271199965, "tps": 41537, "wall": 26541.3} {"step": 16822, "train_loss": 3.259735107421875, "lr": 0.0001996689471961056, "tps": 41530, "wall": 26546.8} {"step": 16823, "train_loss": 3.343322277069092, "lr": 0.0001996499119105228, "tps": 41524, "wall": 26552.4} {"step": 16824, "train_loss": 3.2619831562042236, "lr": 0.00019963087685546694, "tps": 41518, "wall": 26557.9} {"step": 16825, "train_loss": 3.4147558212280273, "lr": 0.0001996118420311536, "tps": 41512, "wall": 26563.4} {"step": 16826, "train_loss": 3.2437686920166016, "lr": 0.0001995928074377984, "tps": 41506, "wall": 26569.0} {"step": 16827, "train_loss": 3.2855544090270996, "lr": 0.00019957377307561699, "tps": 41499, "wall": 26574.5} {"step": 16828, "train_loss": 3.258655309677124, "lr": 0.000199554738944825, "tps": 41493, "wall": 26580.0} {"step": 16829, "train_loss": 3.3235793113708496, "lr": 0.00019953570504563798, "tps": 41487, "wall": 26585.5} {"step": 16830, "train_loss": 3.367750406265259, "lr": 0.00019951667137827164, "tps": 41481, "wall": 26591.0} {"step": 16831, "train_loss": 3.3068766593933105, "lr": 0.0001994976379429416, "tps": 41475, "wall": 26596.4} {"step": 16832, "train_loss": 3.3439106941223145, "lr": 0.00019947860473986336, "tps": 41469, "wall": 26601.9} {"step": 16833, "train_loss": 3.2366132736206055, "lr": 0.00019945957176925258, "tps": 41463, "wall": 26607.5} {"step": 16834, "train_loss": 3.270918369293213, "lr": 0.00019944053903132495, "tps": 41456, "wall": 26613.1} {"step": 16835, "train_loss": 3.368009567260742, "lr": 0.00019942150652629598, "tps": 41450, "wall": 26618.6} {"step": 16836, "train_loss": 3.2419896125793457, "lr": 0.0001994024742543813, "tps": 41444, "wall": 26624.1} {"step": 16837, "train_loss": 3.404660701751709, "lr": 0.00019938344221579648, "tps": 41438, "wall": 26629.7} {"step": 16838, "train_loss": 3.3260257244110107, "lr": 0.00019936441041075716, "tps": 41432, "wall": 26635.2} {"step": 16839, "train_loss": 3.1882126331329346, "lr": 0.00019934537883947894, "tps": 41426, "wall": 26640.8} {"step": 16840, "train_loss": 3.381990432739258, "lr": 0.00019932634750217734, "tps": 41420, "wall": 26646.3} {"step": 16841, "train_loss": 3.3026177883148193, "lr": 0.00019930731639906802, "tps": 41413, "wall": 26651.8} {"step": 16842, "train_loss": 3.3137471675872803, "lr": 0.00019928828553036652, "tps": 41407, "wall": 26657.3} {"step": 16843, "train_loss": 3.418004035949707, "lr": 0.00019926925489628845, "tps": 41401, "wall": 26662.8} {"step": 16844, "train_loss": 3.38167142868042, "lr": 0.0001992502244970494, "tps": 41395, "wall": 26668.4} {"step": 16845, "train_loss": 3.1911308765411377, "lr": 0.0001992311943328649, "tps": 41389, "wall": 26674.0} {"step": 16846, "train_loss": 3.3845081329345703, "lr": 0.0001992121644039506, "tps": 41383, "wall": 26679.5} {"step": 16847, "train_loss": 3.2705631256103516, "lr": 0.00019919313471052194, "tps": 41377, "wall": 26685.0} {"step": 16848, "train_loss": 3.3190808296203613, "lr": 0.00019917410525279467, "tps": 41371, "wall": 26690.5} {"step": 16849, "train_loss": 3.3078317642211914, "lr": 0.0001991550760309842, "tps": 41364, "wall": 26696.1} {"step": 16850, "train_loss": 3.33804988861084, "lr": 0.00019913604704530617, "tps": 41358, "wall": 26701.6} {"step": 16851, "train_loss": 3.2617902755737305, "lr": 0.0001991170182959762, "tps": 41352, "wall": 26707.1} {"step": 16852, "train_loss": 3.2170333862304688, "lr": 0.00019909798978320965, "tps": 41346, "wall": 26712.6} {"step": 16853, "train_loss": 3.233633041381836, "lr": 0.0001990789615072223, "tps": 41340, "wall": 26718.1} {"step": 16854, "train_loss": 3.3812637329101562, "lr": 0.00019905993346822952, "tps": 41334, "wall": 26723.6} {"step": 16855, "train_loss": 3.339383125305176, "lr": 0.00019904090566644708, "tps": 41328, "wall": 26729.1} {"step": 16856, "train_loss": 3.478949546813965, "lr": 0.00019902187810209027, "tps": 41322, "wall": 26734.7} {"step": 16857, "train_loss": 3.233832836151123, "lr": 0.0001990028507753748, "tps": 41316, "wall": 26740.3} {"step": 16858, "train_loss": 3.3739774227142334, "lr": 0.0001989838236865162, "tps": 41310, "wall": 26745.8} {"step": 16859, "train_loss": 3.380575656890869, "lr": 0.00019896479683572996, "tps": 41304, "wall": 26751.2} {"step": 16860, "train_loss": 3.224790334701538, "lr": 0.00019894577022323162, "tps": 41298, "wall": 26756.7} {"step": 16861, "train_loss": 3.2637078762054443, "lr": 0.00019892674384923672, "tps": 41292, "wall": 26762.2} {"step": 16862, "train_loss": 3.354980707168579, "lr": 0.0001989077177139609, "tps": 41285, "wall": 26767.8} {"step": 16863, "train_loss": 3.2610275745391846, "lr": 0.0001988886918176195, "tps": 41279, "wall": 26773.3} {"step": 16864, "train_loss": 3.3083152770996094, "lr": 0.00019886966616042818, "tps": 41273, "wall": 26778.8} {"step": 16865, "train_loss": 3.2869744300842285, "lr": 0.00019885064074260243, "tps": 41267, "wall": 26784.3} {"step": 16866, "train_loss": 3.382504463195801, "lr": 0.00019883161556435774, "tps": 41261, "wall": 26789.8} {"step": 16867, "train_loss": 3.307766914367676, "lr": 0.00019881259062590968, "tps": 41255, "wall": 26795.4} {"step": 16868, "train_loss": 3.362962245941162, "lr": 0.00019879356592747373, "tps": 41249, "wall": 26800.8} {"step": 16869, "train_loss": 3.2871766090393066, "lr": 0.0001987745414692654, "tps": 41243, "wall": 26806.3} {"step": 16870, "train_loss": 3.387934684753418, "lr": 0.00019875551725150023, "tps": 41237, "wall": 26811.8} {"step": 16871, "train_loss": 3.372164726257324, "lr": 0.00019873649327439366, "tps": 41231, "wall": 26817.3} {"step": 16872, "train_loss": 3.3247735500335693, "lr": 0.00019871746953816134, "tps": 41225, "wall": 26822.8} {"step": 16873, "train_loss": 3.326103448867798, "lr": 0.00019869844604301863, "tps": 41219, "wall": 26828.3} {"step": 16874, "train_loss": 3.289785146713257, "lr": 0.00019867942278918105, "tps": 41213, "wall": 26833.8} {"step": 16875, "train_loss": 3.4170656204223633, "lr": 0.00019866039977686417, "tps": 41207, "wall": 26839.3} {"step": 16876, "train_loss": 3.3469839096069336, "lr": 0.00019864137700628337, "tps": 41201, "wall": 26844.8} {"step": 16877, "train_loss": 3.3634192943573, "lr": 0.00019862235447765426, "tps": 41195, "wall": 26850.4} {"step": 16878, "train_loss": 3.262946128845215, "lr": 0.0001986033321911923, "tps": 41189, "wall": 26855.9} {"step": 16879, "train_loss": 3.309999942779541, "lr": 0.0001985843101471129, "tps": 41183, "wall": 26861.4} {"step": 16880, "train_loss": 3.1972336769104004, "lr": 0.00019856528834563157, "tps": 41177, "wall": 26866.9} {"step": 16881, "train_loss": 3.3232884407043457, "lr": 0.00019854626678696385, "tps": 41171, "wall": 26872.4} {"step": 16882, "train_loss": 3.4312257766723633, "lr": 0.00019852724547132517, "tps": 41165, "wall": 26877.9} {"step": 16883, "train_loss": 3.2599258422851562, "lr": 0.00019850822439893104, "tps": 41159, "wall": 26883.4} {"step": 16884, "train_loss": 3.364764928817749, "lr": 0.00019848920356999687, "tps": 41153, "wall": 26888.9} {"step": 16885, "train_loss": 3.3017067909240723, "lr": 0.0001984701829847382, "tps": 41147, "wall": 26894.5} {"step": 16886, "train_loss": 3.3177645206451416, "lr": 0.00019845116264337044, "tps": 41141, "wall": 26899.9} {"step": 16887, "train_loss": 3.333737373352051, "lr": 0.00019843214254610904, "tps": 41135, "wall": 26905.4} {"step": 16888, "train_loss": 3.3103814125061035, "lr": 0.00019841312269316955, "tps": 41129, "wall": 26911.0} {"step": 16889, "train_loss": 3.3039495944976807, "lr": 0.0001983941030847674, "tps": 41123, "wall": 26916.5} {"step": 16890, "train_loss": 3.4310717582702637, "lr": 0.00019837508372111797, "tps": 41117, "wall": 26922.0} {"step": 16891, "train_loss": 3.285879611968994, "lr": 0.00019835606460243677, "tps": 41111, "wall": 26927.5} {"step": 16892, "train_loss": 3.373594045639038, "lr": 0.00019833704572893925, "tps": 41105, "wall": 26933.0} {"step": 16893, "train_loss": 3.348052978515625, "lr": 0.0001983180271008408, "tps": 41099, "wall": 26938.5} {"step": 16894, "train_loss": 3.2698988914489746, "lr": 0.000198299008718357, "tps": 41093, "wall": 26944.0} {"step": 16895, "train_loss": 3.384023904800415, "lr": 0.00019827999058170316, "tps": 41087, "wall": 26949.7} {"step": 16896, "train_loss": 3.367339611053467, "lr": 0.00019826097269109476, "tps": 41081, "wall": 26955.1} {"step": 16897, "train_loss": 3.3291025161743164, "lr": 0.0001982419550467472, "tps": 41075, "wall": 26960.6} {"step": 16898, "train_loss": 3.453415870666504, "lr": 0.00019822293764887596, "tps": 41069, "wall": 26966.2} {"step": 16899, "train_loss": 3.2803590297698975, "lr": 0.00019820392049769653, "tps": 41063, "wall": 26971.8} {"step": 16900, "train_loss": 3.311882257461548, "lr": 0.0001981849035934242, "tps": 41057, "wall": 26977.2} {"step": 16901, "train_loss": 3.327779531478882, "lr": 0.0001981658869362745, "tps": 41051, "wall": 26982.7} {"step": 16902, "train_loss": 3.3691611289978027, "lr": 0.0001981468705264628, "tps": 41045, "wall": 26988.2} {"step": 16903, "train_loss": 3.3278653621673584, "lr": 0.00019812785436420453, "tps": 41040, "wall": 26993.7} {"step": 16904, "train_loss": 3.328197717666626, "lr": 0.00019810883844971507, "tps": 41034, "wall": 26999.2} {"step": 16905, "train_loss": 3.3727829456329346, "lr": 0.00019808982278320998, "tps": 41028, "wall": 27004.6} {"step": 16906, "train_loss": 3.3644700050354004, "lr": 0.00019807080736490446, "tps": 41022, "wall": 27010.1} {"step": 16907, "train_loss": 3.2365705966949463, "lr": 0.00019805179219501407, "tps": 41016, "wall": 27015.6} {"step": 16908, "train_loss": 3.3413500785827637, "lr": 0.00019803277727375415, "tps": 41010, "wall": 27021.1} {"step": 16909, "train_loss": 3.2803754806518555, "lr": 0.00019801376260134013, "tps": 41004, "wall": 27026.6} {"step": 16910, "train_loss": 3.265333652496338, "lr": 0.0001979947481779874, "tps": 40998, "wall": 27032.2} {"step": 16911, "train_loss": 3.384033203125, "lr": 0.0001979757340039113, "tps": 40992, "wall": 27037.7} {"step": 16912, "train_loss": 3.402575969696045, "lr": 0.00019795672007932736, "tps": 40986, "wall": 27043.2} {"step": 16913, "train_loss": 3.331942081451416, "lr": 0.0001979377064044508, "tps": 40980, "wall": 27048.7} {"step": 16914, "train_loss": 3.3178892135620117, "lr": 0.00019791869297949713, "tps": 40974, "wall": 27054.2} {"step": 16915, "train_loss": 3.320047378540039, "lr": 0.00019789967980468173, "tps": 40968, "wall": 27059.7} {"step": 16916, "train_loss": 3.25827956199646, "lr": 0.00019788066688021996, "tps": 40963, "wall": 27065.2} {"step": 16917, "train_loss": 3.310356378555298, "lr": 0.00019786165420632715, "tps": 40957, "wall": 27070.7} {"step": 16918, "train_loss": 3.341592788696289, "lr": 0.00019784264178321869, "tps": 40951, "wall": 27076.2} {"step": 16919, "train_loss": 3.34365177154541, "lr": 0.0001978236296111101, "tps": 40945, "wall": 27081.6} {"step": 16920, "train_loss": 3.3253366947174072, "lr": 0.00019780461769021654, "tps": 40939, "wall": 27087.1} {"step": 16921, "train_loss": 3.284841299057007, "lr": 0.00019778560602075345, "tps": 40933, "wall": 27092.7} {"step": 16922, "train_loss": 3.3396711349487305, "lr": 0.0001977665946029363, "tps": 40927, "wall": 27098.2} {"step": 16923, "train_loss": 3.43681001663208, "lr": 0.00019774758343698033, "tps": 40921, "wall": 27103.6} {"step": 16924, "train_loss": 3.373955011367798, "lr": 0.00019772857252310094, "tps": 40916, "wall": 27109.1} {"step": 16925, "train_loss": 3.3097102642059326, "lr": 0.00019770956186151347, "tps": 40910, "wall": 27114.5} {"step": 16926, "train_loss": 3.4500677585601807, "lr": 0.0001976905514524333, "tps": 40904, "wall": 27120.0} {"step": 16927, "train_loss": 3.4675748348236084, "lr": 0.00019767154129607576, "tps": 40898, "wall": 27125.4} {"step": 16928, "train_loss": 3.3929500579833984, "lr": 0.00019765253139265623, "tps": 40892, "wall": 27130.9} {"step": 16929, "train_loss": 3.4575142860412598, "lr": 0.00019763352174239005, "tps": 40887, "wall": 27136.3} {"step": 16930, "train_loss": 3.335291862487793, "lr": 0.00019761451234549248, "tps": 40881, "wall": 27141.7} {"step": 16931, "train_loss": 3.298764944076538, "lr": 0.00019759550320217896, "tps": 40875, "wall": 27147.2} {"step": 16932, "train_loss": 3.3893990516662598, "lr": 0.00019757649431266484, "tps": 40869, "wall": 27152.8} {"step": 16933, "train_loss": 3.2516379356384277, "lr": 0.00019755748567716532, "tps": 40863, "wall": 27158.3} {"step": 16934, "train_loss": 3.3976213932037354, "lr": 0.00019753847729589582, "tps": 40857, "wall": 27163.7} {"step": 16935, "train_loss": 3.331634044647217, "lr": 0.00019751946916907173, "tps": 40852, "wall": 27169.1} {"step": 16936, "train_loss": 3.311908483505249, "lr": 0.00019750046129690828, "tps": 40846, "wall": 27174.6} {"step": 16937, "train_loss": 3.290677785873413, "lr": 0.00019748145367962084, "tps": 40840, "wall": 27180.1} {"step": 16938, "train_loss": 3.260047435760498, "lr": 0.00019746244631742464, "tps": 40834, "wall": 27185.5} {"step": 16939, "train_loss": 3.351688861846924, "lr": 0.00019744343921053518, "tps": 40829, "wall": 27191.0} {"step": 16940, "train_loss": 3.28436279296875, "lr": 0.00019742443235916765, "tps": 40823, "wall": 27196.3} {"step": 16941, "train_loss": 3.325047492980957, "lr": 0.00019740542576353733, "tps": 40817, "wall": 27201.8} {"step": 16942, "train_loss": 3.2550830841064453, "lr": 0.00019738641942385955, "tps": 40811, "wall": 27207.3} {"step": 16943, "train_loss": 3.3499526977539062, "lr": 0.00019736741334034963, "tps": 40805, "wall": 27212.8} {"step": 16944, "train_loss": 3.3460307121276855, "lr": 0.00019734840751322295, "tps": 40800, "wall": 27218.3} {"step": 16945, "train_loss": 3.3540432453155518, "lr": 0.00019732940194269464, "tps": 40794, "wall": 27223.7} {"step": 16946, "train_loss": 3.433365821838379, "lr": 0.0001973103966289801, "tps": 40788, "wall": 27229.2} {"step": 16947, "train_loss": 3.406104564666748, "lr": 0.0001972913915722947, "tps": 40782, "wall": 27234.6} {"step": 16948, "train_loss": 3.354065418243408, "lr": 0.00019727238677285356, "tps": 40777, "wall": 27240.1} {"step": 16949, "train_loss": 3.289346933364868, "lr": 0.00019725338223087205, "tps": 40771, "wall": 27245.5} {"step": 16950, "train_loss": 3.3059401512145996, "lr": 0.00019723437794656547, "tps": 40765, "wall": 27250.9} {"step": 16951, "train_loss": 3.357189893722534, "lr": 0.00019721537392014917, "tps": 40759, "wall": 27256.3} {"step": 16952, "train_loss": 3.1333038806915283, "lr": 0.00019719637015183829, "tps": 40754, "wall": 27261.7} {"step": 16953, "train_loss": 3.317570209503174, "lr": 0.0001971773666418481, "tps": 40748, "wall": 27267.2} {"step": 16954, "train_loss": 3.390317440032959, "lr": 0.00019715836339039404, "tps": 40742, "wall": 27272.8} {"step": 16955, "train_loss": 3.3149452209472656, "lr": 0.00019713936039769122, "tps": 40736, "wall": 27278.2} {"step": 16956, "train_loss": 3.2954208850860596, "lr": 0.00019712035766395497, "tps": 40731, "wall": 27283.6} {"step": 16957, "train_loss": 3.211940288543701, "lr": 0.0001971013551894005, "tps": 40725, "wall": 27289.1} {"step": 16958, "train_loss": 3.281895160675049, "lr": 0.0001970823529742432, "tps": 40719, "wall": 27294.5} {"step": 16959, "train_loss": 3.3548550605773926, "lr": 0.0001970633510186982, "tps": 40713, "wall": 27300.0} {"step": 16960, "train_loss": 3.3705101013183594, "lr": 0.00019704434932298076, "tps": 40708, "wall": 27305.5} {"step": 16961, "train_loss": 3.3033275604248047, "lr": 0.00019702534788730626, "tps": 40702, "wall": 27310.9} {"step": 16962, "train_loss": 3.405198812484741, "lr": 0.0001970063467118898, "tps": 40696, "wall": 27316.4} {"step": 16963, "train_loss": 3.354745388031006, "lr": 0.00019698734579694672, "tps": 40691, "wall": 27321.8} {"step": 16964, "train_loss": 3.309234619140625, "lr": 0.00019696834514269223, "tps": 40685, "wall": 27327.2} {"step": 16965, "train_loss": 3.335853099822998, "lr": 0.00019694934474934157, "tps": 40679, "wall": 27332.7} {"step": 16966, "train_loss": 3.309129476547241, "lr": 0.00019693034461710997, "tps": 40673, "wall": 27338.2} {"step": 16967, "train_loss": 3.3620617389678955, "lr": 0.00019691134474621267, "tps": 40668, "wall": 27343.6} {"step": 16968, "train_loss": 3.3331804275512695, "lr": 0.0001968923451368649, "tps": 40662, "wall": 27349.0} {"step": 16969, "train_loss": 3.339968204498291, "lr": 0.00019687334578928192, "tps": 40656, "wall": 27354.5} {"step": 16970, "train_loss": 3.3646063804626465, "lr": 0.00019685434670367892, "tps": 40651, "wall": 27359.9} {"step": 16971, "train_loss": 3.3137543201446533, "lr": 0.00019683534788027113, "tps": 40645, "wall": 27365.4} {"step": 16972, "train_loss": 3.387080192565918, "lr": 0.0001968163493192738, "tps": 40639, "wall": 27370.9} {"step": 16973, "train_loss": 3.3961217403411865, "lr": 0.00019679735102090206, "tps": 40633, "wall": 27376.3} {"step": 16974, "train_loss": 3.2963099479675293, "lr": 0.00019677835298537123, "tps": 40628, "wall": 27381.8} {"step": 16975, "train_loss": 3.3296263217926025, "lr": 0.00019675935521289644, "tps": 40622, "wall": 27387.3} {"step": 16976, "train_loss": 3.2758595943450928, "lr": 0.00019674035770369294, "tps": 40616, "wall": 27392.8} {"step": 16977, "train_loss": 3.181812047958374, "lr": 0.00019672136045797593, "tps": 40610, "wall": 27398.2} {"step": 16978, "train_loss": 3.2389183044433594, "lr": 0.00019670236347596066, "tps": 40605, "wall": 27403.7} {"step": 16979, "train_loss": 3.33609676361084, "lr": 0.0001966833667578622, "tps": 40599, "wall": 27409.1} {"step": 16980, "train_loss": 3.2618861198425293, "lr": 0.00019666437030389585, "tps": 40594, "wall": 27414.5} {"step": 16981, "train_loss": 3.3386735916137695, "lr": 0.00019664537411427681, "tps": 40588, "wall": 27420.0} {"step": 16982, "train_loss": 3.3631086349487305, "lr": 0.00019662637818922019, "tps": 40582, "wall": 27425.4} {"step": 16983, "train_loss": 3.3194477558135986, "lr": 0.00019660738252894126, "tps": 40577, "wall": 27430.8} {"step": 16984, "train_loss": 3.4200148582458496, "lr": 0.00019658838713365514, "tps": 40571, "wall": 27436.3} {"step": 16985, "train_loss": 3.354687213897705, "lr": 0.00019656939200357701, "tps": 40565, "wall": 27441.7} {"step": 16986, "train_loss": 3.420733690261841, "lr": 0.00019655039713892212, "tps": 40560, "wall": 27447.1} {"step": 16987, "train_loss": 3.3138818740844727, "lr": 0.00019653140253990558, "tps": 40554, "wall": 27452.6} {"step": 16988, "train_loss": 3.4249792098999023, "lr": 0.0001965124082067426, "tps": 40548, "wall": 27458.1} {"step": 16989, "train_loss": 3.342405319213867, "lr": 0.0001964934141396483, "tps": 40543, "wall": 27463.6} {"step": 16990, "train_loss": 3.315021514892578, "lr": 0.0001964744203388379, "tps": 40537, "wall": 27469.0} {"step": 16991, "train_loss": 3.296782970428467, "lr": 0.00019645542680452656, "tps": 40531, "wall": 27474.4} {"step": 16992, "train_loss": 3.375441551208496, "lr": 0.00019643643353692937, "tps": 40526, "wall": 27479.9} {"step": 16993, "train_loss": 3.268472671508789, "lr": 0.00019641744053626155, "tps": 40520, "wall": 27485.4} {"step": 16994, "train_loss": 3.174405336380005, "lr": 0.00019639844780273825, "tps": 40514, "wall": 27490.8} {"step": 16995, "train_loss": 3.27296781539917, "lr": 0.00019637945533657462, "tps": 40509, "wall": 27496.2} {"step": 16996, "train_loss": 3.4160046577453613, "lr": 0.0001963604631379858, "tps": 40503, "wall": 27501.6} {"step": 16997, "train_loss": 3.417449474334717, "lr": 0.0001963414712071869, "tps": 40497, "wall": 27507.1} {"step": 16998, "train_loss": 3.256612539291382, "lr": 0.00019632247954439312, "tps": 40492, "wall": 27512.6} {"step": 16999, "train_loss": 3.3442466259002686, "lr": 0.00019630348814981952, "tps": 40486, "wall": 27518.0} {"step": 17000, "train_loss": 3.3576858043670654, "lr": 0.00019628449702368137, "tps": 40480, "wall": 27523.5, "val_loss_monitor": 3.424180444699837} {"step": 17001, "train_loss": 3.399872303009033, "lr": 0.00019626550616619367, "tps": 40423, "wall": 27564.2} {"step": 17002, "train_loss": 3.3402457237243652, "lr": 0.00019624651557757162, "tps": 40417, "wall": 27569.7} {"step": 17003, "train_loss": 3.3950307369232178, "lr": 0.0001962275252580303, "tps": 40412, "wall": 27575.3} {"step": 17004, "train_loss": 3.276221513748169, "lr": 0.00019620853520778487, "tps": 40406, "wall": 27580.8} {"step": 17005, "train_loss": 3.4211230278015137, "lr": 0.0001961895454270505, "tps": 40400, "wall": 27586.2} {"step": 17006, "train_loss": 3.3971807956695557, "lr": 0.0001961705559160422, "tps": 40395, "wall": 27591.7} {"step": 17007, "train_loss": 3.254828929901123, "lr": 0.0001961515666749751, "tps": 40389, "wall": 27597.2} {"step": 17008, "train_loss": 3.334136486053467, "lr": 0.0001961325777040644, "tps": 40383, "wall": 27602.7} {"step": 17009, "train_loss": 3.2562918663024902, "lr": 0.0001961135890035251, "tps": 40378, "wall": 27608.2} {"step": 17010, "train_loss": 3.3571395874023438, "lr": 0.00019609460057357238, "tps": 40372, "wall": 27613.7} {"step": 17011, "train_loss": 3.351902961730957, "lr": 0.00019607561241442127, "tps": 40366, "wall": 27619.1} {"step": 17012, "train_loss": 3.406043767929077, "lr": 0.000196056624526287, "tps": 40361, "wall": 27624.6} {"step": 17013, "train_loss": 3.362670660018921, "lr": 0.00019603763690938456, "tps": 40355, "wall": 27630.2} {"step": 17014, "train_loss": 3.308431625366211, "lr": 0.00019601864956392905, "tps": 40349, "wall": 27635.8} {"step": 17015, "train_loss": 3.255410671234131, "lr": 0.0001959996624901356, "tps": 40344, "wall": 27641.2} {"step": 17016, "train_loss": 3.2858166694641113, "lr": 0.0001959806756882192, "tps": 40338, "wall": 27646.7} {"step": 17017, "train_loss": 3.2910337448120117, "lr": 0.00019596168915839507, "tps": 40332, "wall": 27652.2} {"step": 17018, "train_loss": 3.2401559352874756, "lr": 0.00019594270290087824, "tps": 40327, "wall": 27657.7} {"step": 17019, "train_loss": 3.331136703491211, "lr": 0.0001959237169158837, "tps": 40321, "wall": 27663.2} {"step": 17020, "train_loss": 3.3606925010681152, "lr": 0.00019590473120362667, "tps": 40315, "wall": 27668.7} {"step": 17021, "train_loss": 3.3222200870513916, "lr": 0.0001958857457643221, "tps": 40310, "wall": 27674.2} {"step": 17022, "train_loss": 3.3709442615509033, "lr": 0.00019586676059818513, "tps": 40304, "wall": 27679.7} {"step": 17023, "train_loss": 3.3334786891937256, "lr": 0.0001958477757054308, "tps": 40298, "wall": 27685.3} {"step": 17024, "train_loss": 3.25112247467041, "lr": 0.00019582879108627417, "tps": 40293, "wall": 27690.9} {"step": 17025, "train_loss": 3.3268074989318848, "lr": 0.00019580980674093032, "tps": 40287, "wall": 27696.4} {"step": 17026, "train_loss": 3.3325774669647217, "lr": 0.00019579082266961426, "tps": 40281, "wall": 27701.9} {"step": 17027, "train_loss": 3.2233707904815674, "lr": 0.00019577183887254109, "tps": 40276, "wall": 27707.3} {"step": 17028, "train_loss": 3.370504856109619, "lr": 0.00019575285534992584, "tps": 40270, "wall": 27712.8} {"step": 17029, "train_loss": 3.3307254314422607, "lr": 0.00019573387210198356, "tps": 40265, "wall": 27718.2} {"step": 17030, "train_loss": 3.3321609497070312, "lr": 0.00019571488912892925, "tps": 40259, "wall": 27723.7} {"step": 17031, "train_loss": 3.2734646797180176, "lr": 0.000195695906430978, "tps": 40254, "wall": 27729.1} {"step": 17032, "train_loss": 3.4176290035247803, "lr": 0.00019567692400834487, "tps": 40248, "wall": 27734.5} {"step": 17033, "train_loss": 3.366271495819092, "lr": 0.00019565794186124485, "tps": 40242, "wall": 27740.1} {"step": 17034, "train_loss": 3.336345672607422, "lr": 0.00019563895998989296, "tps": 40237, "wall": 27745.6} {"step": 17035, "train_loss": 3.332052230834961, "lr": 0.00019561997839450426, "tps": 40231, "wall": 27751.1} {"step": 17036, "train_loss": 3.208075761795044, "lr": 0.00019560099707529376, "tps": 40226, "wall": 27756.6} {"step": 17037, "train_loss": 3.272113561630249, "lr": 0.00019558201603247653, "tps": 40220, "wall": 27762.1} {"step": 17038, "train_loss": 3.2873027324676514, "lr": 0.00019556303526626744, "tps": 40214, "wall": 27767.6} {"step": 17039, "train_loss": 3.3066763877868652, "lr": 0.00019554405477688173, "tps": 40209, "wall": 27773.0} {"step": 17040, "train_loss": 3.329591751098633, "lr": 0.0001955250745645342, "tps": 40203, "wall": 27778.5} {"step": 17041, "train_loss": 3.363126039505005, "lr": 0.00019550609462944, "tps": 40198, "wall": 27784.0} {"step": 17042, "train_loss": 3.3160221576690674, "lr": 0.0001954871149718141, "tps": 40192, "wall": 27789.4} {"step": 17043, "train_loss": 3.3470513820648193, "lr": 0.00019546813559187144, "tps": 40187, "wall": 27794.8} {"step": 17044, "train_loss": 3.3056161403656006, "lr": 0.00019544915648982706, "tps": 40181, "wall": 27800.3} {"step": 17045, "train_loss": 3.414405584335327, "lr": 0.00019543017766589604, "tps": 40176, "wall": 27805.8} {"step": 17046, "train_loss": 3.2218995094299316, "lr": 0.0001954111991202932, "tps": 40170, "wall": 27811.3} {"step": 17047, "train_loss": 3.292731761932373, "lr": 0.00019539222085323367, "tps": 40164, "wall": 27816.8} {"step": 17048, "train_loss": 3.201259136199951, "lr": 0.00019537324286493242, "tps": 40159, "wall": 27822.3} {"step": 17049, "train_loss": 3.3185479640960693, "lr": 0.0001953542651556044, "tps": 40153, "wall": 27827.7} {"step": 17050, "train_loss": 3.480846405029297, "lr": 0.00019533528772546456, "tps": 40148, "wall": 27833.2} {"step": 17051, "train_loss": 3.2950220108032227, "lr": 0.0001953163105747279, "tps": 40142, "wall": 27838.6} {"step": 17052, "train_loss": 3.3466267585754395, "lr": 0.0001952973337036095, "tps": 40137, "wall": 27844.1} {"step": 17053, "train_loss": 3.3395681381225586, "lr": 0.00019527835711232415, "tps": 40131, "wall": 27849.6} {"step": 17054, "train_loss": 3.2688536643981934, "lr": 0.00019525938080108696, "tps": 40126, "wall": 27855.1} {"step": 17055, "train_loss": 3.404536247253418, "lr": 0.0001952404047701128, "tps": 40120, "wall": 27860.5} {"step": 17056, "train_loss": 3.3169422149658203, "lr": 0.00019522142901961674, "tps": 40115, "wall": 27866.0} {"step": 17057, "train_loss": 3.334714651107788, "lr": 0.0001952024535498136, "tps": 40109, "wall": 27871.6} {"step": 17058, "train_loss": 3.3152916431427, "lr": 0.00019518347836091843, "tps": 40103, "wall": 27877.2} {"step": 17059, "train_loss": 3.550335645675659, "lr": 0.00019516450345314617, "tps": 40098, "wall": 27882.6} {"step": 17060, "train_loss": 3.3161489963531494, "lr": 0.00019514552882671175, "tps": 40092, "wall": 27888.1} {"step": 17061, "train_loss": 3.3701887130737305, "lr": 0.00019512655448183014, "tps": 40087, "wall": 27893.6} {"step": 17062, "train_loss": 3.400636672973633, "lr": 0.00019510758041871632, "tps": 40081, "wall": 27899.1} {"step": 17063, "train_loss": 3.262010335922241, "lr": 0.00019508860663758508, "tps": 40075, "wall": 27904.7} {"step": 17064, "train_loss": 3.2700161933898926, "lr": 0.00019506963313865145, "tps": 40070, "wall": 27910.2} {"step": 17065, "train_loss": 3.384964942932129, "lr": 0.0001950506599221304, "tps": 40064, "wall": 27915.8} {"step": 17066, "train_loss": 3.3708677291870117, "lr": 0.00019503168698823683, "tps": 40059, "wall": 27921.3} {"step": 17067, "train_loss": 3.3529276847839355, "lr": 0.0001950127143371857, "tps": 40053, "wall": 27926.9} {"step": 17068, "train_loss": 3.410770893096924, "lr": 0.0001949937419691918, "tps": 40047, "wall": 27932.4} {"step": 17069, "train_loss": 3.2871713638305664, "lr": 0.00019497476988447022, "tps": 40042, "wall": 27938.0} {"step": 17070, "train_loss": 3.304048538208008, "lr": 0.00019495579808323578, "tps": 40036, "wall": 27943.6} {"step": 17071, "train_loss": 3.24355411529541, "lr": 0.0001949368265657034, "tps": 40030, "wall": 27949.1} {"step": 17072, "train_loss": 3.325833797454834, "lr": 0.00019491785533208802, "tps": 40025, "wall": 27954.6} {"step": 17073, "train_loss": 3.318660020828247, "lr": 0.00019489888438260452, "tps": 40019, "wall": 27960.2} {"step": 17074, "train_loss": 3.3496627807617188, "lr": 0.0001948799137174678, "tps": 40014, "wall": 27965.8} {"step": 17075, "train_loss": 3.286679267883301, "lr": 0.00019486094333689277, "tps": 40008, "wall": 27971.3} {"step": 17076, "train_loss": 3.400801658630371, "lr": 0.0001948419732410944, "tps": 40002, "wall": 27976.9} {"step": 17077, "train_loss": 3.364030599594116, "lr": 0.0001948230034302875, "tps": 39997, "wall": 27982.5} {"step": 17078, "train_loss": 3.3117895126342773, "lr": 0.00019480403390468692, "tps": 39991, "wall": 27988.0} {"step": 17079, "train_loss": 3.35849666595459, "lr": 0.00019478506466450766, "tps": 39986, "wall": 27993.7} {"step": 17080, "train_loss": 3.256398916244507, "lr": 0.00019476609570996453, "tps": 39980, "wall": 27999.3} {"step": 17081, "train_loss": 3.3851466178894043, "lr": 0.00019474712704127244, "tps": 39974, "wall": 28004.9} {"step": 17082, "train_loss": 3.3921895027160645, "lr": 0.00019472815865864625, "tps": 39969, "wall": 28010.5} {"step": 17083, "train_loss": 3.2587432861328125, "lr": 0.00019470919056230085, "tps": 39963, "wall": 28016.0} {"step": 17084, "train_loss": 3.1604719161987305, "lr": 0.0001946902227524511, "tps": 39957, "wall": 28021.6} {"step": 17085, "train_loss": 3.4000959396362305, "lr": 0.0001946712552293119, "tps": 39952, "wall": 28027.1} {"step": 17086, "train_loss": 3.3766229152679443, "lr": 0.00019465228799309808, "tps": 39946, "wall": 28032.8} {"step": 17087, "train_loss": 3.2978460788726807, "lr": 0.00019463332104402455, "tps": 39940, "wall": 28038.3} {"step": 17088, "train_loss": 3.2706871032714844, "lr": 0.00019461435438230607, "tps": 39935, "wall": 28044.0} {"step": 17089, "train_loss": 3.2687244415283203, "lr": 0.0001945953880081576, "tps": 39929, "wall": 28049.6} {"step": 17090, "train_loss": 3.290897846221924, "lr": 0.0001945764219217939, "tps": 39923, "wall": 28055.3} {"step": 17091, "train_loss": 3.3266215324401855, "lr": 0.0001945574561234299, "tps": 39918, "wall": 28061.0} {"step": 17092, "train_loss": 3.290980100631714, "lr": 0.00019453849061328038, "tps": 39912, "wall": 28066.5} {"step": 17093, "train_loss": 3.2986583709716797, "lr": 0.0001945195253915603, "tps": 39906, "wall": 28072.2} {"step": 17094, "train_loss": 3.3676657676696777, "lr": 0.00019450056045848432, "tps": 39901, "wall": 28077.7} {"step": 17095, "train_loss": 3.28220796585083, "lr": 0.00019448159581426743, "tps": 39895, "wall": 28083.3} {"step": 17096, "train_loss": 3.411081314086914, "lr": 0.00019446263145912442, "tps": 39890, "wall": 28089.0} {"step": 17097, "train_loss": 3.256608009338379, "lr": 0.00019444366739327005, "tps": 39884, "wall": 28094.6} {"step": 17098, "train_loss": 3.3056516647338867, "lr": 0.0001944247036169192, "tps": 39878, "wall": 28100.2} {"step": 17099, "train_loss": 3.3518857955932617, "lr": 0.00019440574013028674, "tps": 39873, "wall": 28105.8} {"step": 17100, "train_loss": 3.3150064945220947, "lr": 0.00019438677693358738, "tps": 39867, "wall": 28111.5} {"step": 17101, "train_loss": 3.248790979385376, "lr": 0.00019436781402703602, "tps": 39861, "wall": 28117.1} {"step": 17102, "train_loss": 3.362299919128418, "lr": 0.00019434885141084745, "tps": 39855, "wall": 28122.8} {"step": 17103, "train_loss": 3.3897171020507812, "lr": 0.00019432988908523648, "tps": 39850, "wall": 28128.5} {"step": 17104, "train_loss": 3.2001118659973145, "lr": 0.00019431092705041793, "tps": 39844, "wall": 28134.1} {"step": 17105, "train_loss": 3.3142411708831787, "lr": 0.00019429196530660657, "tps": 39838, "wall": 28139.8} {"step": 17106, "train_loss": 3.30391263961792, "lr": 0.00019427300385401725, "tps": 39833, "wall": 28145.4} {"step": 17107, "train_loss": 3.284151554107666, "lr": 0.0001942540426928647, "tps": 39827, "wall": 28151.1} {"step": 17108, "train_loss": 3.3918561935424805, "lr": 0.0001942350818233638, "tps": 39821, "wall": 28156.7} {"step": 17109, "train_loss": 3.3867714405059814, "lr": 0.00019421612124572923, "tps": 39816, "wall": 28162.3} {"step": 17110, "train_loss": 3.377399444580078, "lr": 0.00019419716096017586, "tps": 39810, "wall": 28168.0} {"step": 17111, "train_loss": 3.419487953186035, "lr": 0.00019417820096691846, "tps": 39804, "wall": 28173.7} {"step": 17112, "train_loss": 3.2903692722320557, "lr": 0.00019415924126617174, "tps": 39799, "wall": 28179.4} {"step": 17113, "train_loss": 3.3402152061462402, "lr": 0.00019414028185815054, "tps": 39793, "wall": 28185.1} {"step": 17114, "train_loss": 3.357806444168091, "lr": 0.0001941213227430697, "tps": 39787, "wall": 28190.8} {"step": 17115, "train_loss": 3.4086785316467285, "lr": 0.00019410236392114385, "tps": 39782, "wall": 28196.5} {"step": 17116, "train_loss": 3.2427468299865723, "lr": 0.00019408340539258783, "tps": 39776, "wall": 28202.1} {"step": 17117, "train_loss": 3.3124592304229736, "lr": 0.00019406444715761639, "tps": 39770, "wall": 28207.8} {"step": 17118, "train_loss": 3.291949510574341, "lr": 0.00019404548921644432, "tps": 39765, "wall": 28213.5} {"step": 17119, "train_loss": 3.302151679992676, "lr": 0.0001940265315692863, "tps": 39759, "wall": 28219.1} {"step": 17120, "train_loss": 3.2714085578918457, "lr": 0.0001940075742163572, "tps": 39753, "wall": 28224.8} {"step": 17121, "train_loss": 3.252617359161377, "lr": 0.0001939886171578717, "tps": 39747, "wall": 28230.6} {"step": 17122, "train_loss": 3.3852367401123047, "lr": 0.0001939696603940445, "tps": 39742, "wall": 28236.3} {"step": 17123, "train_loss": 3.249678611755371, "lr": 0.00019395070392509042, "tps": 39736, "wall": 28242.0} {"step": 17124, "train_loss": 3.3863847255706787, "lr": 0.00019393174775122422, "tps": 39730, "wall": 28247.7} {"step": 17125, "train_loss": 3.2814579010009766, "lr": 0.0001939127918726605, "tps": 39725, "wall": 28253.4} {"step": 17126, "train_loss": 3.1860315799713135, "lr": 0.00019389383628961416, "tps": 39719, "wall": 28259.2} {"step": 17127, "train_loss": 3.2888710498809814, "lr": 0.00019387488100229983, "tps": 39713, "wall": 28264.8} {"step": 17128, "train_loss": 3.2647311687469482, "lr": 0.0001938559260109323, "tps": 39708, "wall": 28270.5} {"step": 17129, "train_loss": 3.377695083618164, "lr": 0.0001938369713157262, "tps": 39702, "wall": 28276.2} {"step": 17130, "train_loss": 3.342120885848999, "lr": 0.00019381801691689633, "tps": 39696, "wall": 28282.0} {"step": 17131, "train_loss": 3.3604516983032227, "lr": 0.0001937990628146574, "tps": 39690, "wall": 28287.7} {"step": 17132, "train_loss": 3.5622007846832275, "lr": 0.00019378010900922407, "tps": 39684, "wall": 28293.5} {"step": 17133, "train_loss": 3.2962052822113037, "lr": 0.00019376115550081107, "tps": 39679, "wall": 28299.2} {"step": 17134, "train_loss": 3.3753600120544434, "lr": 0.00019374220228963318, "tps": 39673, "wall": 28305.0} {"step": 17135, "train_loss": 3.251585006713867, "lr": 0.00019372324937590496, "tps": 39667, "wall": 28310.7} {"step": 17136, "train_loss": 3.285971164703369, "lr": 0.00019370429675984126, "tps": 39662, "wall": 28316.4} {"step": 17137, "train_loss": 3.3434207439422607, "lr": 0.0001936853444416567, "tps": 39656, "wall": 28322.2} {"step": 17138, "train_loss": 3.332407236099243, "lr": 0.00019366639242156594, "tps": 39650, "wall": 28327.9} {"step": 17139, "train_loss": 3.218682050704956, "lr": 0.00019364744069978377, "tps": 39644, "wall": 28333.7} {"step": 17140, "train_loss": 3.3138632774353027, "lr": 0.00019362848927652478, "tps": 39639, "wall": 28339.4} {"step": 17141, "train_loss": 3.295393228530884, "lr": 0.0001936095381520037, "tps": 39633, "wall": 28345.2} {"step": 17142, "train_loss": 3.3165009021759033, "lr": 0.0001935905873264352, "tps": 39627, "wall": 28351.0} {"step": 17143, "train_loss": 3.3879594802856445, "lr": 0.00019357163680003395, "tps": 39621, "wall": 28356.7} {"step": 17144, "train_loss": 3.1786670684814453, "lr": 0.0001935526865730146, "tps": 39616, "wall": 28362.5} {"step": 17145, "train_loss": 3.463125228881836, "lr": 0.0001935337366455919, "tps": 39610, "wall": 28368.2} {"step": 17146, "train_loss": 3.2359964847564697, "lr": 0.00019351478701798045, "tps": 39604, "wall": 28374.0} {"step": 17147, "train_loss": 3.2613067626953125, "lr": 0.0001934958376903949, "tps": 39599, "wall": 28379.7} {"step": 17148, "train_loss": 3.3497700691223145, "lr": 0.00019347688866304998, "tps": 39593, "wall": 28385.4} {"step": 17149, "train_loss": 3.331149101257324, "lr": 0.00019345793993616025, "tps": 39587, "wall": 28391.2} {"step": 17150, "train_loss": 3.294168710708618, "lr": 0.00019343899150994044, "tps": 39582, "wall": 28396.9} {"step": 17151, "train_loss": 3.379441738128662, "lr": 0.00019342004338460518, "tps": 39576, "wall": 28402.7} {"step": 17152, "train_loss": 3.246779441833496, "lr": 0.00019340109556036908, "tps": 39570, "wall": 28408.4} {"step": 17153, "train_loss": 3.4006521701812744, "lr": 0.00019338214803744678, "tps": 39564, "wall": 28414.3} {"step": 17154, "train_loss": 3.370234489440918, "lr": 0.000193363200816053, "tps": 39559, "wall": 28420.0} {"step": 17155, "train_loss": 3.394052028656006, "lr": 0.00019334425389640235, "tps": 39553, "wall": 28425.7} {"step": 17156, "train_loss": 3.2611420154571533, "lr": 0.0001933253072787094, "tps": 39547, "wall": 28431.5} {"step": 17157, "train_loss": 3.392193555831909, "lr": 0.0001933063609631888, "tps": 39542, "wall": 28437.2} {"step": 17158, "train_loss": 3.355959177017212, "lr": 0.00019328741495005521, "tps": 39536, "wall": 28443.0} {"step": 17159, "train_loss": 3.3733887672424316, "lr": 0.0001932684692395232, "tps": 39530, "wall": 28448.8} {"step": 17160, "train_loss": 3.2722935676574707, "lr": 0.0001932495238318074, "tps": 39524, "wall": 28454.6} {"step": 17161, "train_loss": 3.2535955905914307, "lr": 0.00019323057872712248, "tps": 39519, "wall": 28460.4} {"step": 17162, "train_loss": 3.2739789485931396, "lr": 0.000193211633925683, "tps": 39513, "wall": 28466.2} {"step": 17163, "train_loss": 3.2267534732818604, "lr": 0.00019319268942770358, "tps": 39507, "wall": 28472.1} {"step": 17164, "train_loss": 3.317082405090332, "lr": 0.00019317374523339882, "tps": 39501, "wall": 28477.9} {"step": 17165, "train_loss": 3.3077847957611084, "lr": 0.0001931548013429833, "tps": 39495, "wall": 28483.7} {"step": 17166, "train_loss": 3.339139461517334, "lr": 0.00019313585775667172, "tps": 39490, "wall": 28489.5} {"step": 17167, "train_loss": 3.228217124938965, "lr": 0.0001931169144746785, "tps": 39484, "wall": 28495.2} {"step": 17168, "train_loss": 3.3434317111968994, "lr": 0.0001930979714972184, "tps": 39478, "wall": 28501.0} {"step": 17169, "train_loss": 3.2163455486297607, "lr": 0.00019307902882450596, "tps": 39473, "wall": 28506.8} {"step": 17170, "train_loss": 3.2817344665527344, "lr": 0.00019306008645675565, "tps": 39467, "wall": 28512.6} {"step": 17171, "train_loss": 3.3542346954345703, "lr": 0.00019304114439418216, "tps": 39461, "wall": 28518.4} {"step": 17172, "train_loss": 3.308580160140991, "lr": 0.0001930222026370001, "tps": 39456, "wall": 28524.1} {"step": 17173, "train_loss": 3.308513641357422, "lr": 0.00019300326118542395, "tps": 39450, "wall": 28530.0} {"step": 17174, "train_loss": 3.3428659439086914, "lr": 0.0001929843200396683, "tps": 39444, "wall": 28535.8} {"step": 17175, "train_loss": 3.3853142261505127, "lr": 0.00019296537919994778, "tps": 39438, "wall": 28541.6} {"step": 17176, "train_loss": 3.372661828994751, "lr": 0.00019294643866647686, "tps": 39433, "wall": 28547.4} {"step": 17177, "train_loss": 3.3877487182617188, "lr": 0.00019292749843947014, "tps": 39427, "wall": 28553.2} {"step": 17178, "train_loss": 3.1871390342712402, "lr": 0.00019290855851914222, "tps": 39421, "wall": 28559.1} {"step": 17179, "train_loss": 3.478788375854492, "lr": 0.00019288961890570762, "tps": 39415, "wall": 28564.9} {"step": 17180, "train_loss": 3.3640313148498535, "lr": 0.00019287067959938083, "tps": 39410, "wall": 28570.7} {"step": 17181, "train_loss": 3.3121042251586914, "lr": 0.00019285174060037648, "tps": 39404, "wall": 28576.5} {"step": 17182, "train_loss": 3.3722939491271973, "lr": 0.00019283280190890914, "tps": 39398, "wall": 28582.3} {"step": 17183, "train_loss": 3.307474136352539, "lr": 0.0001928138635251932, "tps": 39392, "wall": 28588.1} {"step": 17184, "train_loss": 3.3015971183776855, "lr": 0.0001927949254494433, "tps": 39387, "wall": 28594.0} {"step": 17185, "train_loss": 3.3133585453033447, "lr": 0.00019277598768187404, "tps": 39381, "wall": 28599.8} {"step": 17186, "train_loss": 3.287092924118042, "lr": 0.00019275705022269978, "tps": 39375, "wall": 28605.6} {"step": 17187, "train_loss": 3.3599863052368164, "lr": 0.00019273811307213512, "tps": 39370, "wall": 28611.4} {"step": 17188, "train_loss": 3.2546298503875732, "lr": 0.0001927191762303947, "tps": 39364, "wall": 28617.3} {"step": 17189, "train_loss": 3.2829995155334473, "lr": 0.00019270023969769281, "tps": 39358, "wall": 28623.1} {"step": 17190, "train_loss": 3.3144640922546387, "lr": 0.0001926813034742441, "tps": 39352, "wall": 28628.9} {"step": 17191, "train_loss": 3.281999111175537, "lr": 0.00019266236756026306, "tps": 39347, "wall": 28634.7} {"step": 17192, "train_loss": 3.3091650009155273, "lr": 0.00019264343195596423, "tps": 39341, "wall": 28640.6} {"step": 17193, "train_loss": 3.3721604347229004, "lr": 0.0001926244966615621, "tps": 39335, "wall": 28646.4} {"step": 17194, "train_loss": 3.2976813316345215, "lr": 0.00019260556167727112, "tps": 39329, "wall": 28652.3} {"step": 17195, "train_loss": 3.2550580501556396, "lr": 0.00019258662700330582, "tps": 39324, "wall": 28658.0} {"step": 17196, "train_loss": 3.3347177505493164, "lr": 0.0001925676926398807, "tps": 39318, "wall": 28663.8} {"step": 17197, "train_loss": 3.350043296813965, "lr": 0.00019254875858721023, "tps": 39312, "wall": 28669.7} {"step": 17198, "train_loss": 3.457948684692383, "lr": 0.0001925298248455089, "tps": 39307, "wall": 28675.5} {"step": 17199, "train_loss": 3.4199700355529785, "lr": 0.00019251089141499126, "tps": 39301, "wall": 28681.3} {"step": 17200, "train_loss": 3.3915486335754395, "lr": 0.00019249195829587165, "tps": 39295, "wall": 28687.1} {"step": 17201, "train_loss": 3.2902419567108154, "lr": 0.00019247302548836465, "tps": 39290, "wall": 28692.9} {"step": 17202, "train_loss": 3.373732089996338, "lr": 0.00019245409299268476, "tps": 39284, "wall": 28698.8} {"step": 17203, "train_loss": 3.226916790008545, "lr": 0.00019243516080904636, "tps": 39278, "wall": 28704.5} {"step": 17204, "train_loss": 3.29089093208313, "lr": 0.0001924162289376639, "tps": 39273, "wall": 28710.4} {"step": 17205, "train_loss": 3.452681064605713, "lr": 0.00019239729737875196, "tps": 39267, "wall": 28716.4} {"step": 17206, "train_loss": 3.2873778343200684, "lr": 0.0001923783661325249, "tps": 39261, "wall": 28722.1} {"step": 17207, "train_loss": 3.473128318786621, "lr": 0.0001923594351991972, "tps": 39256, "wall": 28727.9} {"step": 17208, "train_loss": 3.3097987174987793, "lr": 0.00019234050457898332, "tps": 39250, "wall": 28733.7} {"step": 17209, "train_loss": 3.3131513595581055, "lr": 0.00019232157427209772, "tps": 39244, "wall": 28739.5} {"step": 17210, "train_loss": 3.317068576812744, "lr": 0.00019230264427875477, "tps": 39239, "wall": 28745.3} {"step": 17211, "train_loss": 3.3103528022766113, "lr": 0.00019228371459916902, "tps": 39233, "wall": 28751.2} {"step": 17212, "train_loss": 3.328371286392212, "lr": 0.00019226478523355484, "tps": 39227, "wall": 28756.9} {"step": 17213, "train_loss": 3.2849836349487305, "lr": 0.00019224585618212662, "tps": 39222, "wall": 28762.7} {"step": 17214, "train_loss": 3.322507858276367, "lr": 0.00019222692744509892, "tps": 39216, "wall": 28768.5} {"step": 17215, "train_loss": 3.3612449169158936, "lr": 0.00019220799902268607, "tps": 39210, "wall": 28774.4} {"step": 17216, "train_loss": 3.392240047454834, "lr": 0.00019218907091510246, "tps": 39205, "wall": 28780.1} {"step": 17217, "train_loss": 3.3452959060668945, "lr": 0.0001921701431225626, "tps": 39199, "wall": 28785.9} {"step": 17218, "train_loss": 3.3165693283081055, "lr": 0.00019215121564528084, "tps": 39194, "wall": 28791.7} {"step": 17219, "train_loss": 3.3143234252929688, "lr": 0.00019213228848347167, "tps": 39188, "wall": 28797.4} {"step": 17220, "train_loss": 3.317539691925049, "lr": 0.00019211336163734937, "tps": 39182, "wall": 28803.2} {"step": 17221, "train_loss": 3.341012477874756, "lr": 0.00019209443510712846, "tps": 39177, "wall": 28809.0} {"step": 17222, "train_loss": 3.3140506744384766, "lr": 0.00019207550889302334, "tps": 39171, "wall": 28814.7} {"step": 17223, "train_loss": 3.4258229732513428, "lr": 0.00019205658299524826, "tps": 39166, "wall": 28820.5} {"step": 17224, "train_loss": 3.3444831371307373, "lr": 0.00019203765741401777, "tps": 39160, "wall": 28826.2} {"step": 17225, "train_loss": 3.171278953552246, "lr": 0.00019201873214954622, "tps": 39155, "wall": 28832.0} {"step": 17226, "train_loss": 3.358245849609375, "lr": 0.000191999807202048, "tps": 39149, "wall": 28837.7} {"step": 17227, "train_loss": 3.4779484272003174, "lr": 0.00019198088257173747, "tps": 39144, "wall": 28843.5} {"step": 17228, "train_loss": 3.247622489929199, "lr": 0.00019196195825882896, "tps": 39138, "wall": 28849.2} {"step": 17229, "train_loss": 3.3024964332580566, "lr": 0.00019194303426353702, "tps": 39133, "wall": 28854.9} {"step": 17230, "train_loss": 3.2641661167144775, "lr": 0.0001919241105860758, "tps": 39127, "wall": 28860.6} {"step": 17231, "train_loss": 3.2080280780792236, "lr": 0.00019190518722665982, "tps": 39122, "wall": 28866.3} {"step": 17232, "train_loss": 3.3544602394104004, "lr": 0.00019188626418550344, "tps": 39116, "wall": 28871.9} {"step": 17233, "train_loss": 3.3449275493621826, "lr": 0.00019186734146282088, "tps": 39111, "wall": 28877.6} {"step": 17234, "train_loss": 3.31461238861084, "lr": 0.00019184841905882664, "tps": 39106, "wall": 28883.3} {"step": 17235, "train_loss": 3.3687541484832764, "lr": 0.00019182949697373506, "tps": 39100, "wall": 28889.0} {"step": 17236, "train_loss": 3.303664207458496, "lr": 0.00019181057520776043, "tps": 39095, "wall": 28894.8} {"step": 17237, "train_loss": 3.2975244522094727, "lr": 0.00019179165376111718, "tps": 39089, "wall": 28900.4} {"step": 17238, "train_loss": 3.305525779724121, "lr": 0.00019177273263401952, "tps": 39084, "wall": 28906.2} {"step": 17239, "train_loss": 3.3354663848876953, "lr": 0.00019175381182668196, "tps": 39078, "wall": 28911.8} {"step": 17240, "train_loss": 3.3098342418670654, "lr": 0.0001917348913393187, "tps": 39073, "wall": 28917.5} {"step": 17241, "train_loss": 3.290449380874634, "lr": 0.00019171597117214413, "tps": 39068, "wall": 28923.2} {"step": 17242, "train_loss": 3.3307595252990723, "lr": 0.00019169705132537253, "tps": 39062, "wall": 28928.9} {"step": 17243, "train_loss": 3.303709030151367, "lr": 0.00019167813179921833, "tps": 39057, "wall": 28934.5} {"step": 17244, "train_loss": 3.383336067199707, "lr": 0.00019165921259389572, "tps": 39051, "wall": 28940.2} {"step": 17245, "train_loss": 3.3240532875061035, "lr": 0.0001916402937096191, "tps": 39046, "wall": 28946.0} {"step": 17246, "train_loss": 3.305820941925049, "lr": 0.0001916213751466028, "tps": 39040, "wall": 28951.7} {"step": 17247, "train_loss": 3.3454761505126953, "lr": 0.0001916024569050611, "tps": 39035, "wall": 28957.4} {"step": 17248, "train_loss": 3.432353973388672, "lr": 0.00019158353898520827, "tps": 39030, "wall": 28963.1} {"step": 17249, "train_loss": 3.3413047790527344, "lr": 0.0001915646213872587, "tps": 39024, "wall": 28968.8} {"step": 17250, "train_loss": 3.36568546295166, "lr": 0.00019154570411142658, "tps": 39019, "wall": 28974.4} {"step": 17251, "train_loss": 3.262296199798584, "lr": 0.00019152678715792627, "tps": 39013, "wall": 28980.0} {"step": 17252, "train_loss": 3.3225972652435303, "lr": 0.0001915078705269721, "tps": 39008, "wall": 28985.6} {"step": 17253, "train_loss": 3.2468199729919434, "lr": 0.0001914889542187783, "tps": 39003, "wall": 28991.2} {"step": 17254, "train_loss": 3.29934024810791, "lr": 0.00019147003823355912, "tps": 38998, "wall": 28996.8} {"step": 17255, "train_loss": 3.385798692703247, "lr": 0.0001914511225715289, "tps": 38992, "wall": 29002.5} {"step": 17256, "train_loss": 3.2547333240509033, "lr": 0.00019143220723290196, "tps": 38987, "wall": 29008.1} {"step": 17257, "train_loss": 3.2804946899414062, "lr": 0.0001914132922178925, "tps": 38981, "wall": 29014.0} {"step": 17258, "train_loss": 3.353564739227295, "lr": 0.00019139437752671476, "tps": 38976, "wall": 29019.7} {"step": 17259, "train_loss": 3.262834072113037, "lr": 0.00019137546315958312, "tps": 38971, "wall": 29025.4} {"step": 17260, "train_loss": 3.402611494064331, "lr": 0.0001913565491167118, "tps": 38965, "wall": 29031.0} {"step": 17261, "train_loss": 3.397700786590576, "lr": 0.00019133763539831496, "tps": 38960, "wall": 29036.6} {"step": 17262, "train_loss": 3.2958579063415527, "lr": 0.00019131872200460695, "tps": 38955, "wall": 29042.3} {"step": 17263, "train_loss": 3.3313519954681396, "lr": 0.0001912998089358021, "tps": 38949, "wall": 29047.8} {"step": 17264, "train_loss": 3.2357797622680664, "lr": 0.00019128089619211452, "tps": 38944, "wall": 29053.5} {"step": 17265, "train_loss": 3.386575222015381, "lr": 0.00019126198377375844, "tps": 38939, "wall": 29059.2} {"step": 17266, "train_loss": 3.3828351497650146, "lr": 0.00019124307168094827, "tps": 38933, "wall": 29064.9} {"step": 17267, "train_loss": 3.3519303798675537, "lr": 0.00019122415991389805, "tps": 38928, "wall": 29070.5} {"step": 17268, "train_loss": 3.2658262252807617, "lr": 0.00019120524847282213, "tps": 38923, "wall": 29076.2} {"step": 17269, "train_loss": 3.2598578929901123, "lr": 0.00019118633735793478, "tps": 38918, "wall": 29081.8} {"step": 17270, "train_loss": 3.2923974990844727, "lr": 0.00019116742656945005, "tps": 38912, "wall": 29087.4} {"step": 17271, "train_loss": 3.322037696838379, "lr": 0.00019114851610758232, "tps": 38907, "wall": 29093.0} {"step": 17272, "train_loss": 3.3439931869506836, "lr": 0.00019112960597254578, "tps": 38902, "wall": 29098.7} {"step": 17273, "train_loss": 3.382354497909546, "lr": 0.0001911106961645546, "tps": 38896, "wall": 29104.4} {"step": 17274, "train_loss": 3.2820539474487305, "lr": 0.00019109178668382301, "tps": 38891, "wall": 29110.0} {"step": 17275, "train_loss": 3.353931188583374, "lr": 0.00019107287753056525, "tps": 38886, "wall": 29115.6} {"step": 17276, "train_loss": 3.406589984893799, "lr": 0.00019105396870499548, "tps": 38881, "wall": 29121.2} {"step": 17277, "train_loss": 3.26646089553833, "lr": 0.00019103506020732796, "tps": 38875, "wall": 29126.9} {"step": 17278, "train_loss": 3.243277072906494, "lr": 0.00019101615203777686, "tps": 38870, "wall": 29132.6} {"step": 17279, "train_loss": 3.3625497817993164, "lr": 0.00019099724419655627, "tps": 38865, "wall": 29138.2} {"step": 17280, "train_loss": 3.270930767059326, "lr": 0.00019097833668388047, "tps": 38859, "wall": 29143.9} {"step": 17281, "train_loss": 3.2710893154144287, "lr": 0.0001909594294999637, "tps": 38854, "wall": 29149.4} {"step": 17282, "train_loss": 3.2811989784240723, "lr": 0.00019094052264502005, "tps": 38849, "wall": 29155.1} {"step": 17283, "train_loss": 3.3178160190582275, "lr": 0.00019092161611926375, "tps": 38844, "wall": 29160.7} {"step": 17284, "train_loss": 3.3563456535339355, "lr": 0.000190902709922909, "tps": 38838, "wall": 29166.3} {"step": 17285, "train_loss": 3.3302955627441406, "lr": 0.00019088380405616983, "tps": 38833, "wall": 29171.9} {"step": 17286, "train_loss": 3.3999733924865723, "lr": 0.00019086489851926052, "tps": 38828, "wall": 29177.4} {"step": 17287, "train_loss": 3.3274898529052734, "lr": 0.00019084599331239526, "tps": 38823, "wall": 29183.0} {"step": 17288, "train_loss": 3.4970293045043945, "lr": 0.00019082708843578815, "tps": 38818, "wall": 29188.6} {"step": 17289, "train_loss": 3.3188185691833496, "lr": 0.0001908081838896534, "tps": 38813, "wall": 29194.3} {"step": 17290, "train_loss": 3.3055596351623535, "lr": 0.000190789279674205, "tps": 38807, "wall": 29199.8} {"step": 17291, "train_loss": 3.3644649982452393, "lr": 0.00019077037578965739, "tps": 38802, "wall": 29205.4} {"step": 17292, "train_loss": 3.3054141998291016, "lr": 0.00019075147223622443, "tps": 38797, "wall": 29211.0} {"step": 17293, "train_loss": 3.2975218296051025, "lr": 0.00019073256901412034, "tps": 38792, "wall": 29216.6} {"step": 17294, "train_loss": 3.3091378211975098, "lr": 0.00019071366612355938, "tps": 38787, "wall": 29222.2} {"step": 17295, "train_loss": 3.2433316707611084, "lr": 0.00019069476356475557, "tps": 38782, "wall": 29227.7} {"step": 17296, "train_loss": 3.3108677864074707, "lr": 0.00019067586133792306, "tps": 38776, "wall": 29233.3} {"step": 17297, "train_loss": 3.303311347961426, "lr": 0.00019065695944327592, "tps": 38771, "wall": 29239.0} {"step": 17298, "train_loss": 3.2859039306640625, "lr": 0.00019063805788102842, "tps": 38766, "wall": 29244.5} {"step": 17299, "train_loss": 3.3625030517578125, "lr": 0.00019061915665139455, "tps": 38761, "wall": 29250.1} {"step": 17300, "train_loss": 3.299501895904541, "lr": 0.00019060025575458846, "tps": 38756, "wall": 29255.7} {"step": 17301, "train_loss": 3.293928861618042, "lr": 0.00019058135519082434, "tps": 38750, "wall": 29261.3} {"step": 17302, "train_loss": 3.3268351554870605, "lr": 0.00019056245496031613, "tps": 38745, "wall": 29267.0} {"step": 17303, "train_loss": 3.373138904571533, "lr": 0.00019054355506327802, "tps": 38740, "wall": 29272.6} {"step": 17304, "train_loss": 3.3135733604431152, "lr": 0.00019052465549992414, "tps": 38735, "wall": 29278.1} {"step": 17305, "train_loss": 3.3882007598876953, "lr": 0.00019050575627046858, "tps": 38730, "wall": 29283.6} {"step": 17306, "train_loss": 3.4823992252349854, "lr": 0.00019048685737512537, "tps": 38725, "wall": 29289.2} {"step": 17307, "train_loss": 3.2376980781555176, "lr": 0.00019046795881410859, "tps": 38720, "wall": 29294.8} {"step": 17308, "train_loss": 3.441707134246826, "lr": 0.00019044906058763246, "tps": 38714, "wall": 29300.4} {"step": 17309, "train_loss": 3.32588529586792, "lr": 0.00019043016269591097, "tps": 38709, "wall": 29306.0} {"step": 17310, "train_loss": 3.404160499572754, "lr": 0.00019041126513915814, "tps": 38704, "wall": 29311.7} {"step": 17311, "train_loss": 3.3491506576538086, "lr": 0.00019039236791758816, "tps": 38699, "wall": 29317.2} {"step": 17312, "train_loss": 3.358639717102051, "lr": 0.000190373471031415, "tps": 38694, "wall": 29322.8} {"step": 17313, "train_loss": 3.3708620071411133, "lr": 0.00019035457448085273, "tps": 38689, "wall": 29328.4} {"step": 17314, "train_loss": 3.3218984603881836, "lr": 0.00019033567826611547, "tps": 38683, "wall": 29334.0} {"step": 17315, "train_loss": 3.244821786880493, "lr": 0.00019031678238741733, "tps": 38678, "wall": 29339.6} {"step": 17316, "train_loss": 3.337031602859497, "lr": 0.00019029788684497216, "tps": 38673, "wall": 29345.2} {"step": 17317, "train_loss": 3.287250518798828, "lr": 0.00019027899163899417, "tps": 38668, "wall": 29350.7} {"step": 17318, "train_loss": 3.279155969619751, "lr": 0.00019026009676969744, "tps": 38663, "wall": 29356.2} {"step": 17319, "train_loss": 3.307568073272705, "lr": 0.0001902412022372959, "tps": 38658, "wall": 29361.8} {"step": 17320, "train_loss": 3.252952814102173, "lr": 0.0001902223080420036, "tps": 38653, "wall": 29367.4} {"step": 17321, "train_loss": 3.3593204021453857, "lr": 0.00019020341418403468, "tps": 38648, "wall": 29373.0} {"step": 17322, "train_loss": 3.2133090496063232, "lr": 0.00019018452066360303, "tps": 38643, "wall": 29378.6} {"step": 17323, "train_loss": 3.334596633911133, "lr": 0.00019016562748092275, "tps": 38638, "wall": 29384.1} {"step": 17324, "train_loss": 3.3798794746398926, "lr": 0.00019014673463620786, "tps": 38633, "wall": 29389.7} {"step": 17325, "train_loss": 3.2675180435180664, "lr": 0.0001901278421296724, "tps": 38627, "wall": 29395.2} {"step": 17326, "train_loss": 3.282320499420166, "lr": 0.0001901089499615303, "tps": 38622, "wall": 29400.8} {"step": 17327, "train_loss": 3.2595510482788086, "lr": 0.00019009005813199568, "tps": 38617, "wall": 29406.3} {"step": 17328, "train_loss": 3.3575587272644043, "lr": 0.00019007116664128252, "tps": 38612, "wall": 29411.9} {"step": 17329, "train_loss": 3.2221713066101074, "lr": 0.00019005227548960475, "tps": 38607, "wall": 29417.5} {"step": 17330, "train_loss": 3.3194727897644043, "lr": 0.00019003338467717647, "tps": 38602, "wall": 29423.1} {"step": 17331, "train_loss": 3.366574287414551, "lr": 0.00019001449420421156, "tps": 38597, "wall": 29428.6} {"step": 17332, "train_loss": 3.4428250789642334, "lr": 0.00018999560407092418, "tps": 38592, "wall": 29434.2} {"step": 17333, "train_loss": 3.3911614418029785, "lr": 0.00018997671427752817, "tps": 38587, "wall": 29439.8} {"step": 17334, "train_loss": 3.3330063819885254, "lr": 0.00018995782482423757, "tps": 38582, "wall": 29445.3} {"step": 17335, "train_loss": 3.297356605529785, "lr": 0.00018993893571126632, "tps": 38577, "wall": 29450.9} {"step": 17336, "train_loss": 3.2925782203674316, "lr": 0.00018992004693882847, "tps": 38572, "wall": 29456.4} {"step": 17337, "train_loss": 3.310312032699585, "lr": 0.00018990115850713797, "tps": 38567, "wall": 29462.0} {"step": 17338, "train_loss": 3.3666605949401855, "lr": 0.00018988227041640877, "tps": 38562, "wall": 29467.5} {"step": 17339, "train_loss": 3.3000969886779785, "lr": 0.00018986338266685482, "tps": 38557, "wall": 29473.0} {"step": 17340, "train_loss": 3.297529458999634, "lr": 0.00018984449525869006, "tps": 38552, "wall": 29478.6} {"step": 17341, "train_loss": 3.2925915718078613, "lr": 0.00018982560819212854, "tps": 38546, "wall": 29484.2} {"step": 17342, "train_loss": 3.334688425064087, "lr": 0.0001898067214673842, "tps": 38541, "wall": 29489.7} {"step": 17343, "train_loss": 3.2716712951660156, "lr": 0.00018978783508467092, "tps": 38536, "wall": 29495.4} {"step": 17344, "train_loss": 3.3183133602142334, "lr": 0.00018976894904420264, "tps": 38531, "wall": 29501.0} {"step": 17345, "train_loss": 3.2726781368255615, "lr": 0.0001897500633461934, "tps": 38526, "wall": 29506.5} {"step": 17346, "train_loss": 3.3915913105010986, "lr": 0.00018973117799085706, "tps": 38521, "wall": 29512.1} {"step": 17347, "train_loss": 3.372891664505005, "lr": 0.00018971229297840751, "tps": 38516, "wall": 29517.6} {"step": 17348, "train_loss": 3.232443332672119, "lr": 0.00018969340830905882, "tps": 38511, "wall": 29523.1} {"step": 17349, "train_loss": 3.3629565238952637, "lr": 0.00018967452398302483, "tps": 38506, "wall": 29528.7} {"step": 17350, "train_loss": 3.3930020332336426, "lr": 0.00018965564000051943, "tps": 38501, "wall": 29534.2} {"step": 17351, "train_loss": 3.3205862045288086, "lr": 0.00018963675636175662, "tps": 38496, "wall": 29539.7} {"step": 17352, "train_loss": 3.344967842102051, "lr": 0.00018961787306695028, "tps": 38491, "wall": 29545.3} {"step": 17353, "train_loss": 3.3840103149414062, "lr": 0.0001895989901163143, "tps": 38486, "wall": 29550.9} {"step": 17354, "train_loss": 3.3125975131988525, "lr": 0.00018958010751006258, "tps": 38481, "wall": 29556.5} {"step": 17355, "train_loss": 3.2793211936950684, "lr": 0.0001895612252484091, "tps": 38476, "wall": 29562.0} {"step": 17356, "train_loss": 3.41804575920105, "lr": 0.0001895423433315677, "tps": 38471, "wall": 29567.5} {"step": 17357, "train_loss": 3.268984794616699, "lr": 0.00018952346175975224, "tps": 38466, "wall": 29573.1} {"step": 17358, "train_loss": 3.2786941528320312, "lr": 0.00018950458053317669, "tps": 38461, "wall": 29578.6} {"step": 17359, "train_loss": 3.310311794281006, "lr": 0.0001894856996520549, "tps": 38456, "wall": 29584.2} {"step": 17360, "train_loss": 3.2178587913513184, "lr": 0.00018946681911660072, "tps": 38451, "wall": 29589.7} {"step": 17361, "train_loss": 3.2335243225097656, "lr": 0.0001894479389270281, "tps": 38446, "wall": 29595.2} {"step": 17362, "train_loss": 3.1894586086273193, "lr": 0.00018942905908355092, "tps": 38441, "wall": 29600.8} {"step": 17363, "train_loss": 3.3458919525146484, "lr": 0.00018941017958638292, "tps": 38436, "wall": 29606.4} {"step": 17364, "train_loss": 3.376948833465576, "lr": 0.00018939130043573813, "tps": 38431, "wall": 29612.0} {"step": 17365, "train_loss": 3.300670862197876, "lr": 0.00018937242163183035, "tps": 38426, "wall": 29617.5} {"step": 17366, "train_loss": 3.261094093322754, "lr": 0.00018935354317487337, "tps": 38421, "wall": 29623.1} {"step": 17367, "train_loss": 3.310072660446167, "lr": 0.00018933466506508112, "tps": 38416, "wall": 29628.6} {"step": 17368, "train_loss": 3.4051413536071777, "lr": 0.00018931578730266746, "tps": 38411, "wall": 29634.1} {"step": 17369, "train_loss": 3.323910713195801, "lr": 0.00018929690988784629, "tps": 38406, "wall": 29639.7} {"step": 17370, "train_loss": 3.3172428607940674, "lr": 0.0001892780328208313, "tps": 38401, "wall": 29645.2} {"step": 17371, "train_loss": 3.2774572372436523, "lr": 0.00018925915610183643, "tps": 38396, "wall": 29650.7} {"step": 17372, "train_loss": 3.3875865936279297, "lr": 0.00018924027973107554, "tps": 38391, "wall": 29656.2} {"step": 17373, "train_loss": 3.386049747467041, "lr": 0.00018922140370876238, "tps": 38386, "wall": 29661.8} {"step": 17374, "train_loss": 3.308506727218628, "lr": 0.00018920252803511086, "tps": 38381, "wall": 29667.3} {"step": 17375, "train_loss": 3.228544235229492, "lr": 0.00018918365271033478, "tps": 38376, "wall": 29673.0} {"step": 17376, "train_loss": 3.242244243621826, "lr": 0.00018916477773464786, "tps": 38371, "wall": 29678.5} {"step": 17377, "train_loss": 3.3186848163604736, "lr": 0.00018914590310826408, "tps": 38366, "wall": 29684.0} {"step": 17378, "train_loss": 3.330282211303711, "lr": 0.00018912702883139716, "tps": 38362, "wall": 29689.5} {"step": 17379, "train_loss": 3.1851627826690674, "lr": 0.000189108154904261, "tps": 38357, "wall": 29695.0} {"step": 17380, "train_loss": 3.369081735610962, "lr": 0.00018908928132706923, "tps": 38352, "wall": 29700.6} {"step": 17381, "train_loss": 3.296355962753296, "lr": 0.00018907040810003576, "tps": 38347, "wall": 29706.1} {"step": 17382, "train_loss": 3.293177604675293, "lr": 0.0001890515352233744, "tps": 38342, "wall": 29711.5} {"step": 17383, "train_loss": 3.307802677154541, "lr": 0.00018903266269729895, "tps": 38337, "wall": 29717.1} {"step": 17384, "train_loss": 3.3373231887817383, "lr": 0.0001890137905220232, "tps": 38332, "wall": 29722.6} {"step": 17385, "train_loss": 3.2627925872802734, "lr": 0.00018899491869776082, "tps": 38327, "wall": 29728.1} {"step": 17386, "train_loss": 3.3369436264038086, "lr": 0.00018897604722472577, "tps": 38322, "wall": 29733.8} {"step": 17387, "train_loss": 3.4428274631500244, "lr": 0.00018895717610313163, "tps": 38317, "wall": 29739.3} {"step": 17388, "train_loss": 3.2411465644836426, "lr": 0.00018893830533319234, "tps": 38312, "wall": 29744.8} {"step": 17389, "train_loss": 3.399531126022339, "lr": 0.00018891943491512164, "tps": 38307, "wall": 29750.4} {"step": 17390, "train_loss": 3.4636168479919434, "lr": 0.00018890056484913324, "tps": 38302, "wall": 29755.9} {"step": 17391, "train_loss": 3.214501142501831, "lr": 0.0001888816951354409, "tps": 38298, "wall": 29761.4} {"step": 17392, "train_loss": 3.271228075027466, "lr": 0.0001888628257742584, "tps": 38293, "wall": 29766.9} {"step": 17393, "train_loss": 3.394998073577881, "lr": 0.0001888439567657995, "tps": 38288, "wall": 29772.4} {"step": 17394, "train_loss": 3.2555439472198486, "lr": 0.00018882508811027794, "tps": 38283, "wall": 29777.9} {"step": 17395, "train_loss": 3.2943646907806396, "lr": 0.00018880621980790747, "tps": 38278, "wall": 29783.4} {"step": 17396, "train_loss": 3.3109025955200195, "lr": 0.00018878735185890187, "tps": 38273, "wall": 29789.0} {"step": 17397, "train_loss": 3.41007137298584, "lr": 0.0001887684842634748, "tps": 38268, "wall": 29794.6} {"step": 17398, "train_loss": 3.298072576522827, "lr": 0.00018874961702184, "tps": 38263, "wall": 29800.1} {"step": 17399, "train_loss": 3.4596121311187744, "lr": 0.0001887307501342113, "tps": 38258, "wall": 29805.6} {"step": 17400, "train_loss": 3.314267158508301, "lr": 0.0001887118836008023, "tps": 38253, "wall": 29811.1} {"step": 17401, "train_loss": 3.279855251312256, "lr": 0.0001886930174218268, "tps": 38249, "wall": 29816.6} {"step": 17402, "train_loss": 3.2951087951660156, "lr": 0.00018867415159749847, "tps": 38244, "wall": 29822.1} {"step": 17403, "train_loss": 3.214564085006714, "lr": 0.00018865528612803107, "tps": 38239, "wall": 29827.6} {"step": 17404, "train_loss": 3.331519603729248, "lr": 0.00018863642101363826, "tps": 38234, "wall": 29833.1} {"step": 17405, "train_loss": 3.3450264930725098, "lr": 0.00018861755625453375, "tps": 38229, "wall": 29838.6} {"step": 17406, "train_loss": 3.29459285736084, "lr": 0.00018859869185093136, "tps": 38224, "wall": 29844.2} {"step": 17407, "train_loss": 3.3906617164611816, "lr": 0.00018857982780304462, "tps": 38219, "wall": 29849.7} {"step": 17408, "train_loss": 3.2900006771087646, "lr": 0.00018856096411108727, "tps": 38214, "wall": 29855.3} {"step": 17409, "train_loss": 3.4082813262939453, "lr": 0.00018854210077527307, "tps": 38209, "wall": 29860.8} {"step": 17410, "train_loss": 3.3365256786346436, "lr": 0.00018852323779581557, "tps": 38205, "wall": 29866.4} {"step": 17411, "train_loss": 3.2672195434570312, "lr": 0.0001885043751729286, "tps": 38200, "wall": 29871.9} {"step": 17412, "train_loss": 3.3625376224517822, "lr": 0.00018848551290682574, "tps": 38195, "wall": 29877.3} {"step": 17413, "train_loss": 3.309541702270508, "lr": 0.00018846665099772074, "tps": 38190, "wall": 29882.9} {"step": 17414, "train_loss": 3.331386089324951, "lr": 0.00018844778944582718, "tps": 38185, "wall": 29888.4} {"step": 17415, "train_loss": 3.322033405303955, "lr": 0.00018842892825135881, "tps": 38180, "wall": 29893.9} {"step": 17416, "train_loss": 3.287747859954834, "lr": 0.00018841006741452927, "tps": 38175, "wall": 29899.4} {"step": 17417, "train_loss": 3.298417568206787, "lr": 0.00018839120693555216, "tps": 38171, "wall": 29904.9} {"step": 17418, "train_loss": 3.3625991344451904, "lr": 0.00018837234681464112, "tps": 38166, "wall": 29910.4} {"step": 17419, "train_loss": 3.339409351348877, "lr": 0.00018835348705200993, "tps": 38161, "wall": 29916.0} {"step": 17420, "train_loss": 3.359954833984375, "lr": 0.0001883346276478721, "tps": 38156, "wall": 29921.5} {"step": 17421, "train_loss": 3.401210069656372, "lr": 0.00018831576860244126, "tps": 38151, "wall": 29927.0} {"step": 17422, "train_loss": 3.3093652725219727, "lr": 0.00018829690991593122, "tps": 38146, "wall": 29932.5} {"step": 17423, "train_loss": 3.355649948120117, "lr": 0.00018827805158855548, "tps": 38142, "wall": 29938.0} {"step": 17424, "train_loss": 3.315129518508911, "lr": 0.00018825919362052763, "tps": 38137, "wall": 29943.4} {"step": 17425, "train_loss": 3.236693859100342, "lr": 0.00018824033601206138, "tps": 38132, "wall": 29949.0} {"step": 17426, "train_loss": 3.3096914291381836, "lr": 0.00018822147876337036, "tps": 38127, "wall": 29954.5} {"step": 17427, "train_loss": 3.2098612785339355, "lr": 0.0001882026218746681, "tps": 38122, "wall": 29960.0} {"step": 17428, "train_loss": 3.3240346908569336, "lr": 0.00018818376534616827, "tps": 38118, "wall": 29965.5} {"step": 17429, "train_loss": 3.3182950019836426, "lr": 0.00018816490917808446, "tps": 38113, "wall": 29971.1} {"step": 17430, "train_loss": 3.254732370376587, "lr": 0.0001881460533706303, "tps": 38108, "wall": 29976.6} {"step": 17431, "train_loss": 3.374021530151367, "lr": 0.00018812719792401933, "tps": 38103, "wall": 29982.1} {"step": 17432, "train_loss": 3.3718063831329346, "lr": 0.0001881083428384652, "tps": 38098, "wall": 29987.6} {"step": 17433, "train_loss": 3.3262412548065186, "lr": 0.00018808948811418157, "tps": 38093, "wall": 29993.1} {"step": 17434, "train_loss": 3.331233501434326, "lr": 0.00018807063375138187, "tps": 38089, "wall": 29998.6} {"step": 17435, "train_loss": 3.218076229095459, "lr": 0.00018805177975027973, "tps": 38084, "wall": 30004.1} {"step": 17436, "train_loss": 3.3969380855560303, "lr": 0.00018803292611108886, "tps": 38079, "wall": 30009.7} {"step": 17437, "train_loss": 3.2740213871002197, "lr": 0.00018801407283402263, "tps": 38074, "wall": 30015.3} {"step": 17438, "train_loss": 3.2925901412963867, "lr": 0.00018799521991929473, "tps": 38069, "wall": 30020.7} {"step": 17439, "train_loss": 3.4410223960876465, "lr": 0.00018797636736711873, "tps": 38064, "wall": 30026.2} {"step": 17440, "train_loss": 3.2427451610565186, "lr": 0.0001879575151777082, "tps": 38060, "wall": 30031.9} {"step": 17441, "train_loss": 3.2351999282836914, "lr": 0.00018793866335127665, "tps": 38055, "wall": 30037.4} {"step": 17442, "train_loss": 3.213071346282959, "lr": 0.00018791981188803764, "tps": 38050, "wall": 30042.9} {"step": 17443, "train_loss": 3.250119686126709, "lr": 0.0001879009607882048, "tps": 38045, "wall": 30048.4} {"step": 17444, "train_loss": 3.389240264892578, "lr": 0.00018788211005199156, "tps": 38040, "wall": 30053.8} {"step": 17445, "train_loss": 3.369171142578125, "lr": 0.0001878632596796115, "tps": 38036, "wall": 30059.3} {"step": 17446, "train_loss": 3.35213041305542, "lr": 0.00018784440967127824, "tps": 38031, "wall": 30064.8} {"step": 17447, "train_loss": 3.3510119915008545, "lr": 0.0001878255600272052, "tps": 38026, "wall": 30070.3} {"step": 17448, "train_loss": 3.359250545501709, "lr": 0.00018780671074760598, "tps": 38021, "wall": 30075.9} {"step": 17449, "train_loss": 3.2404978275299072, "lr": 0.00018778786183269405, "tps": 38016, "wall": 30081.4} {"step": 17450, "train_loss": 3.2764382362365723, "lr": 0.00018776901328268296, "tps": 38012, "wall": 30086.8} {"step": 17451, "train_loss": 3.4256443977355957, "lr": 0.00018775016509778626, "tps": 38007, "wall": 30092.4} {"step": 17452, "train_loss": 3.3353123664855957, "lr": 0.0001877313172782174, "tps": 38002, "wall": 30097.9} {"step": 17453, "train_loss": 3.3629629611968994, "lr": 0.00018771246982418992, "tps": 37997, "wall": 30103.4} {"step": 17454, "train_loss": 3.38543701171875, "lr": 0.00018769362273591736, "tps": 37993, "wall": 30108.9} {"step": 17455, "train_loss": 3.2911694049835205, "lr": 0.00018767477601361318, "tps": 37988, "wall": 30114.3} {"step": 17456, "train_loss": 3.2983450889587402, "lr": 0.00018765592965749091, "tps": 37983, "wall": 30119.8} {"step": 17457, "train_loss": 3.3737921714782715, "lr": 0.00018763708366776393, "tps": 37978, "wall": 30125.3} {"step": 17458, "train_loss": 3.296414375305176, "lr": 0.00018761823804464594, "tps": 37974, "wall": 30130.8} {"step": 17459, "train_loss": 3.2920713424682617, "lr": 0.00018759939278835023, "tps": 37969, "wall": 30136.3} {"step": 17460, "train_loss": 3.245206832885742, "lr": 0.00018758054789909037, "tps": 37964, "wall": 30141.8} {"step": 17461, "train_loss": 3.419356107711792, "lr": 0.0001875617033770798, "tps": 37959, "wall": 30147.3} {"step": 17462, "train_loss": 3.277618408203125, "lr": 0.00018754285922253203, "tps": 37955, "wall": 30152.8} {"step": 17463, "train_loss": 3.3947815895080566, "lr": 0.00018752401543566048, "tps": 37950, "wall": 30158.3} {"step": 17464, "train_loss": 3.370878219604492, "lr": 0.00018750517201667863, "tps": 37945, "wall": 30163.8} {"step": 17465, "train_loss": 3.4127984046936035, "lr": 0.0001874863289658, "tps": 37940, "wall": 30169.3} {"step": 17466, "train_loss": 3.3204185962677, "lr": 0.00018746748628323796, "tps": 37936, "wall": 30174.8} {"step": 17467, "train_loss": 3.281338691711426, "lr": 0.00018744864396920597, "tps": 37931, "wall": 30180.2} {"step": 17468, "train_loss": 3.303668975830078, "lr": 0.00018742980202391757, "tps": 37926, "wall": 30185.7} {"step": 17469, "train_loss": 3.278820037841797, "lr": 0.00018741096044758607, "tps": 37922, "wall": 30191.2} {"step": 17470, "train_loss": 3.330907106399536, "lr": 0.00018739211924042505, "tps": 37917, "wall": 30196.7} {"step": 17471, "train_loss": 3.2852227687835693, "lr": 0.00018737327840264784, "tps": 37912, "wall": 30202.1} {"step": 17472, "train_loss": 3.271801471710205, "lr": 0.0001873544379344679, "tps": 37907, "wall": 30207.7} {"step": 17473, "train_loss": 3.2542614936828613, "lr": 0.00018733559783609859, "tps": 37903, "wall": 30213.2} {"step": 17474, "train_loss": 3.290848970413208, "lr": 0.00018731675810775342, "tps": 37898, "wall": 30218.7} {"step": 17475, "train_loss": 3.388767719268799, "lr": 0.00018729791874964584, "tps": 37893, "wall": 30224.3} {"step": 17476, "train_loss": 3.4125664234161377, "lr": 0.00018727907976198913, "tps": 37888, "wall": 30229.7} {"step": 17477, "train_loss": 3.37164044380188, "lr": 0.0001872602411449968, "tps": 37884, "wall": 30235.2} {"step": 17478, "train_loss": 3.3091421127319336, "lr": 0.00018724140289888224, "tps": 37879, "wall": 30240.7} {"step": 17479, "train_loss": 3.3499085903167725, "lr": 0.00018722256502385885, "tps": 37874, "wall": 30246.2} {"step": 17480, "train_loss": 3.226158618927002, "lr": 0.00018720372752014001, "tps": 37870, "wall": 30251.6} {"step": 17481, "train_loss": 3.219829559326172, "lr": 0.0001871848903879391, "tps": 37865, "wall": 30257.1} {"step": 17482, "train_loss": 3.1742608547210693, "lr": 0.00018716605362746957, "tps": 37860, "wall": 30262.6} {"step": 17483, "train_loss": 3.2723238468170166, "lr": 0.00018714721723894472, "tps": 37856, "wall": 30268.1} {"step": 17484, "train_loss": 3.3891067504882812, "lr": 0.00018712838122257798, "tps": 37851, "wall": 30273.7} {"step": 17485, "train_loss": 3.354435920715332, "lr": 0.00018710954557858275, "tps": 37846, "wall": 30279.2} {"step": 17486, "train_loss": 3.2978110313415527, "lr": 0.00018709071030717232, "tps": 37841, "wall": 30284.7} {"step": 17487, "train_loss": 3.3934359550476074, "lr": 0.0001870718754085601, "tps": 37837, "wall": 30290.2} {"step": 17488, "train_loss": 3.335469961166382, "lr": 0.00018705304088295952, "tps": 37832, "wall": 30295.7} {"step": 17489, "train_loss": 3.2582316398620605, "lr": 0.00018703420673058378, "tps": 37827, "wall": 30301.2} {"step": 17490, "train_loss": 3.284785032272339, "lr": 0.00018701537295164638, "tps": 37823, "wall": 30306.7} {"step": 17491, "train_loss": 3.3532142639160156, "lr": 0.00018699653954636062, "tps": 37818, "wall": 30312.2} {"step": 17492, "train_loss": 3.3485865592956543, "lr": 0.00018697770651493985, "tps": 37813, "wall": 30317.6} {"step": 17493, "train_loss": 3.3253979682922363, "lr": 0.0001869588738575974, "tps": 37809, "wall": 30323.1} {"step": 17494, "train_loss": 3.3150582313537598, "lr": 0.00018694004157454664, "tps": 37804, "wall": 30328.6} {"step": 17495, "train_loss": 3.3424577713012695, "lr": 0.00018692120966600086, "tps": 37799, "wall": 30334.1} {"step": 17496, "train_loss": 3.266228675842285, "lr": 0.0001869023781321734, "tps": 37794, "wall": 30339.6} {"step": 17497, "train_loss": 3.384899377822876, "lr": 0.00018688354697327756, "tps": 37790, "wall": 30345.1} {"step": 17498, "train_loss": 3.302802801132202, "lr": 0.00018686471618952676, "tps": 37785, "wall": 30350.6} {"step": 17499, "train_loss": 3.265537738800049, "lr": 0.0001868458857811342, "tps": 37780, "wall": 30356.1} {"step": 17500, "train_loss": 3.3606059551239014, "lr": 0.00018682705574831325, "tps": 37776, "wall": 30361.5} {"step": 17501, "train_loss": 3.362248420715332, "lr": 0.00018680822609127716, "tps": 37771, "wall": 30367.2} {"step": 17502, "train_loss": 3.2718095779418945, "lr": 0.0001867893968102394, "tps": 37766, "wall": 30372.7} {"step": 17503, "train_loss": 3.189624786376953, "lr": 0.00018677056790541302, "tps": 37762, "wall": 30378.1} {"step": 17504, "train_loss": 3.333641529083252, "lr": 0.00018675173937701152, "tps": 37757, "wall": 30383.6} {"step": 17505, "train_loss": 3.1930580139160156, "lr": 0.00018673291122524814, "tps": 37752, "wall": 30389.1} {"step": 17506, "train_loss": 3.329075813293457, "lr": 0.00018671408345033607, "tps": 37747, "wall": 30394.7} {"step": 17507, "train_loss": 3.3324267864227295, "lr": 0.0001866952560524887, "tps": 37743, "wall": 30400.2} {"step": 17508, "train_loss": 3.3565220832824707, "lr": 0.00018667642903191927, "tps": 37738, "wall": 30405.7} {"step": 17509, "train_loss": 3.300300359725952, "lr": 0.00018665760238884108, "tps": 37734, "wall": 30411.1} {"step": 17510, "train_loss": 3.22896409034729, "lr": 0.00018663877612346726, "tps": 37729, "wall": 30416.5} {"step": 17511, "train_loss": 3.3079898357391357, "lr": 0.0001866199502360113, "tps": 37724, "wall": 30422.0} {"step": 17512, "train_loss": 3.231184482574463, "lr": 0.00018660112472668633, "tps": 37720, "wall": 30427.5} {"step": 17513, "train_loss": 3.4255106449127197, "lr": 0.0001865822995957056, "tps": 37715, "wall": 30432.9} {"step": 17514, "train_loss": 3.3050966262817383, "lr": 0.0001865634748432824, "tps": 37711, "wall": 30438.4} {"step": 17515, "train_loss": 3.2524642944335938, "lr": 0.00018654465046962998, "tps": 37706, "wall": 30443.8} {"step": 17516, "train_loss": 3.293985605239868, "lr": 0.00018652582647496154, "tps": 37701, "wall": 30449.4} {"step": 17517, "train_loss": 3.281505584716797, "lr": 0.00018650700285949038, "tps": 37696, "wall": 30454.9} {"step": 17518, "train_loss": 3.263841152191162, "lr": 0.00018648817962342972, "tps": 37692, "wall": 30460.4} {"step": 17519, "train_loss": 3.352452278137207, "lr": 0.00018646935676699275, "tps": 37687, "wall": 30465.9} {"step": 17520, "train_loss": 3.349669933319092, "lr": 0.0001864505342903927, "tps": 37683, "wall": 30471.4} {"step": 17521, "train_loss": 3.3968324661254883, "lr": 0.0001864317121938428, "tps": 37678, "wall": 30476.9} {"step": 17522, "train_loss": 3.3450660705566406, "lr": 0.0001864128904775564, "tps": 37673, "wall": 30482.4} {"step": 17523, "train_loss": 3.2460880279541016, "lr": 0.00018639406914174646, "tps": 37669, "wall": 30487.8} {"step": 17524, "train_loss": 3.1594927310943604, "lr": 0.00018637524818662632, "tps": 37664, "wall": 30493.3} {"step": 17525, "train_loss": 3.249204635620117, "lr": 0.00018635642761240928, "tps": 37659, "wall": 30498.8} {"step": 17526, "train_loss": 3.2344770431518555, "lr": 0.0001863376074193084, "tps": 37655, "wall": 30504.3} {"step": 17527, "train_loss": 3.3362977504730225, "lr": 0.0001863187876075369, "tps": 37650, "wall": 30509.7} {"step": 17528, "train_loss": 3.3161745071411133, "lr": 0.000186299968177308, "tps": 37646, "wall": 30515.3} {"step": 17529, "train_loss": 3.2333693504333496, "lr": 0.00018628114912883493, "tps": 37641, "wall": 30520.8} {"step": 17530, "train_loss": 3.351651668548584, "lr": 0.0001862623304623308, "tps": 37636, "wall": 30526.2} {"step": 17531, "train_loss": 3.316096782684326, "lr": 0.0001862435121780088, "tps": 37632, "wall": 30531.7} {"step": 17532, "train_loss": 3.343425750732422, "lr": 0.00018622469427608218, "tps": 37627, "wall": 30537.2} {"step": 17533, "train_loss": 3.348513126373291, "lr": 0.000186205876756764, "tps": 37622, "wall": 30542.8} {"step": 17534, "train_loss": 3.42368221282959, "lr": 0.0001861870596202675, "tps": 37618, "wall": 30548.3} {"step": 17535, "train_loss": 3.2739014625549316, "lr": 0.0001861682428668058, "tps": 37613, "wall": 30553.8} {"step": 17536, "train_loss": 3.3573503494262695, "lr": 0.0001861494264965921, "tps": 37608, "wall": 30559.3} {"step": 17537, "train_loss": 3.318913459777832, "lr": 0.0001861306105098395, "tps": 37604, "wall": 30564.8} {"step": 17538, "train_loss": 3.4050827026367188, "lr": 0.00018611179490676114, "tps": 37599, "wall": 30570.3} {"step": 17539, "train_loss": 3.3914918899536133, "lr": 0.00018609297968757028, "tps": 37595, "wall": 30575.8} {"step": 17540, "train_loss": 3.3047077655792236, "lr": 0.00018607416485247991, "tps": 37590, "wall": 30581.3} {"step": 17541, "train_loss": 3.3077054023742676, "lr": 0.00018605535040170325, "tps": 37585, "wall": 30586.8} {"step": 17542, "train_loss": 3.3625450134277344, "lr": 0.00018603653633545347, "tps": 37581, "wall": 30592.3} {"step": 17543, "train_loss": 3.287637710571289, "lr": 0.0001860177226539436, "tps": 37576, "wall": 30597.8} {"step": 17544, "train_loss": 3.1512069702148438, "lr": 0.00018599890935738685, "tps": 37572, "wall": 30603.3} {"step": 17545, "train_loss": 3.284815788269043, "lr": 0.00018598009644599627, "tps": 37567, "wall": 30608.8} {"step": 17546, "train_loss": 3.367490768432617, "lr": 0.00018596128391998497, "tps": 37562, "wall": 30614.2} {"step": 17547, "train_loss": 3.2730984687805176, "lr": 0.0001859424717795661, "tps": 37558, "wall": 30619.7} {"step": 17548, "train_loss": 3.295414924621582, "lr": 0.00018592366002495277, "tps": 37553, "wall": 30625.1} {"step": 17549, "train_loss": 3.3361053466796875, "lr": 0.00018590484865635808, "tps": 37549, "wall": 30630.6} {"step": 17550, "train_loss": 3.3498167991638184, "lr": 0.00018588603767399504, "tps": 37544, "wall": 30636.1} {"step": 17551, "train_loss": 3.244354724884033, "lr": 0.00018586722707807684, "tps": 37540, "wall": 30641.6} {"step": 17552, "train_loss": 3.264899730682373, "lr": 0.0001858484168688166, "tps": 37535, "wall": 30647.0} {"step": 17553, "train_loss": 3.3462138175964355, "lr": 0.00018582960704642724, "tps": 37531, "wall": 30652.5} {"step": 17554, "train_loss": 3.425701379776001, "lr": 0.000185810797611122, "tps": 37526, "wall": 30657.9} {"step": 17555, "train_loss": 3.334200859069824, "lr": 0.00018579198856311387, "tps": 37522, "wall": 30663.3} {"step": 17556, "train_loss": 3.293783187866211, "lr": 0.00018577317990261597, "tps": 37517, "wall": 30668.8} {"step": 17557, "train_loss": 3.3494153022766113, "lr": 0.00018575437162984132, "tps": 37512, "wall": 30674.2} {"step": 17558, "train_loss": 3.4155352115631104, "lr": 0.000185735563745003, "tps": 37508, "wall": 30679.7} {"step": 17559, "train_loss": 3.2991738319396973, "lr": 0.0001857167562483141, "tps": 37503, "wall": 30685.1} {"step": 17560, "train_loss": 3.3351194858551025, "lr": 0.0001856979491399876, "tps": 37499, "wall": 30690.6} {"step": 17561, "train_loss": 3.217557907104492, "lr": 0.0001856791424202366, "tps": 37494, "wall": 30696.1} {"step": 17562, "train_loss": 3.355081796646118, "lr": 0.00018566033608927418, "tps": 37490, "wall": 30701.6} {"step": 17563, "train_loss": 3.37477445602417, "lr": 0.0001856415301473133, "tps": 37485, "wall": 30707.1} {"step": 17564, "train_loss": 3.2933566570281982, "lr": 0.00018562272459456697, "tps": 37481, "wall": 30712.5} {"step": 17565, "train_loss": 3.2591476440429688, "lr": 0.00018560391943124832, "tps": 37476, "wall": 30718.0} {"step": 17566, "train_loss": 3.359121561050415, "lr": 0.00018558511465757032, "tps": 37472, "wall": 30723.5} {"step": 17567, "train_loss": 3.3858845233917236, "lr": 0.00018556631027374603, "tps": 37467, "wall": 30728.9} {"step": 17568, "train_loss": 3.283545970916748, "lr": 0.00018554750627998838, "tps": 37463, "wall": 30734.3} {"step": 17569, "train_loss": 3.378444194793701, "lr": 0.00018552870267651055, "tps": 37458, "wall": 30739.8} {"step": 17570, "train_loss": 3.2261605262756348, "lr": 0.00018550989946352532, "tps": 37453, "wall": 30745.3} {"step": 17571, "train_loss": 3.2348761558532715, "lr": 0.0001854910966412459, "tps": 37449, "wall": 30750.8} {"step": 17572, "train_loss": 3.3921968936920166, "lr": 0.00018547229420988516, "tps": 37444, "wall": 30756.2} {"step": 17573, "train_loss": 3.338009834289551, "lr": 0.0001854534921696562, "tps": 37440, "wall": 30761.7} {"step": 17574, "train_loss": 3.3516993522644043, "lr": 0.00018543469052077188, "tps": 37435, "wall": 30767.2} {"step": 17575, "train_loss": 3.2767441272735596, "lr": 0.00018541588926344527, "tps": 37431, "wall": 30772.6} {"step": 17576, "train_loss": 3.2977709770202637, "lr": 0.00018539708839788936, "tps": 37426, "wall": 30778.1} {"step": 17577, "train_loss": 3.3304715156555176, "lr": 0.0001853782879243171, "tps": 37422, "wall": 30783.6} {"step": 17578, "train_loss": 3.275026798248291, "lr": 0.00018535948784294143, "tps": 37417, "wall": 30789.0} {"step": 17579, "train_loss": 3.365190029144287, "lr": 0.00018534068815397544, "tps": 37413, "wall": 30794.5} {"step": 17580, "train_loss": 3.306044578552246, "lr": 0.00018532188885763188, "tps": 37408, "wall": 30799.9} {"step": 17581, "train_loss": 3.3547186851501465, "lr": 0.00018530308995412393, "tps": 37404, "wall": 30805.3} {"step": 17582, "train_loss": 3.2668066024780273, "lr": 0.00018528429144366442, "tps": 37399, "wall": 30810.8} {"step": 17583, "train_loss": 3.3821377754211426, "lr": 0.00018526549332646637, "tps": 37395, "wall": 30816.3} {"step": 17584, "train_loss": 3.499657154083252, "lr": 0.0001852466956027427, "tps": 37390, "wall": 30821.7} {"step": 17585, "train_loss": 3.286339044570923, "lr": 0.00018522789827270627, "tps": 37386, "wall": 30827.2} {"step": 17586, "train_loss": 3.3295953273773193, "lr": 0.00018520910133657017, "tps": 37381, "wall": 30832.7} {"step": 17587, "train_loss": 3.3757565021514893, "lr": 0.00018519030479454717, "tps": 37377, "wall": 30838.1} {"step": 17588, "train_loss": 3.326961040496826, "lr": 0.00018517150864685037, "tps": 37372, "wall": 30843.5} {"step": 17589, "train_loss": 3.3535807132720947, "lr": 0.00018515271289369257, "tps": 37368, "wall": 30849.0} {"step": 17590, "train_loss": 3.407144546508789, "lr": 0.00018513391753528669, "tps": 37363, "wall": 30854.5} {"step": 17591, "train_loss": 3.313596725463867, "lr": 0.00018511512257184568, "tps": 37359, "wall": 30859.9} {"step": 17592, "train_loss": 3.300367832183838, "lr": 0.00018509632800358246, "tps": 37355, "wall": 30865.3} {"step": 17593, "train_loss": 3.305218458175659, "lr": 0.00018507753383071, "tps": 37350, "wall": 30870.9} {"step": 17594, "train_loss": 3.371342182159424, "lr": 0.00018505874005344102, "tps": 37345, "wall": 30876.4} {"step": 17595, "train_loss": 3.2817883491516113, "lr": 0.00018503994667198854, "tps": 37341, "wall": 30881.8} {"step": 17596, "train_loss": 3.376190185546875, "lr": 0.00018502115368656548, "tps": 37336, "wall": 30887.3} {"step": 17597, "train_loss": 3.266514778137207, "lr": 0.0001850023610973847, "tps": 37332, "wall": 30892.7} {"step": 17598, "train_loss": 3.3082032203674316, "lr": 0.00018498356890465903, "tps": 37328, "wall": 30898.1} {"step": 17599, "train_loss": 3.331700325012207, "lr": 0.00018496477710860135, "tps": 37323, "wall": 30903.6} {"step": 17600, "train_loss": 3.3131566047668457, "lr": 0.00018494598570942462, "tps": 37319, "wall": 30909.0} {"step": 17601, "train_loss": 3.302583932876587, "lr": 0.00018492719470734165, "tps": 37314, "wall": 30914.5} {"step": 17602, "train_loss": 3.273590326309204, "lr": 0.0001849084041025653, "tps": 37310, "wall": 30920.0} {"step": 17603, "train_loss": 3.2951223850250244, "lr": 0.0001848896138953085, "tps": 37305, "wall": 30925.4} {"step": 17604, "train_loss": 3.3718228340148926, "lr": 0.00018487082408578397, "tps": 37301, "wall": 30931.0} {"step": 17605, "train_loss": 3.289097785949707, "lr": 0.0001848520346742047, "tps": 37296, "wall": 30936.5} {"step": 17606, "train_loss": 3.2216126918792725, "lr": 0.0001848332456607835, "tps": 37292, "wall": 30941.9} {"step": 17607, "train_loss": 3.2698540687561035, "lr": 0.00018481445704573312, "tps": 37287, "wall": 30947.4} {"step": 17608, "train_loss": 3.224013566970825, "lr": 0.00018479566882926652, "tps": 37283, "wall": 30952.8} {"step": 17609, "train_loss": 3.4700708389282227, "lr": 0.0001847768810115965, "tps": 37278, "wall": 30958.3} {"step": 17610, "train_loss": 3.3328442573547363, "lr": 0.00018475809359293587, "tps": 37274, "wall": 30963.7} {"step": 17611, "train_loss": 3.4598264694213867, "lr": 0.00018473930657349747, "tps": 37269, "wall": 30969.2} {"step": 17612, "train_loss": 3.3007171154022217, "lr": 0.00018472051995349409, "tps": 37265, "wall": 30974.6} {"step": 17613, "train_loss": 3.333179473876953, "lr": 0.00018470173373313862, "tps": 37261, "wall": 30980.1} {"step": 17614, "train_loss": 3.2109322547912598, "lr": 0.00018468294791264378, "tps": 37256, "wall": 30985.6} {"step": 17615, "train_loss": 3.2793095111846924, "lr": 0.00018466416249222247, "tps": 37252, "wall": 30991.1} {"step": 17616, "train_loss": 3.4038965702056885, "lr": 0.00018464537747208738, "tps": 37247, "wall": 30996.5} {"step": 17617, "train_loss": 3.3807756900787354, "lr": 0.0001846265928524513, "tps": 37243, "wall": 31002.0} {"step": 17618, "train_loss": 3.3103036880493164, "lr": 0.00018460780863352723, "tps": 37238, "wall": 31007.4} {"step": 17619, "train_loss": 3.276362419128418, "lr": 0.00018458902481552776, "tps": 37234, "wall": 31012.9} {"step": 17620, "train_loss": 3.2826082706451416, "lr": 0.00018457024139866568, "tps": 37229, "wall": 31018.3} {"step": 17621, "train_loss": 3.4120898246765137, "lr": 0.0001845514583831539, "tps": 37225, "wall": 31023.8} {"step": 17622, "train_loss": 3.3281078338623047, "lr": 0.00018453267576920505, "tps": 37221, "wall": 31029.2} {"step": 17623, "train_loss": 3.144167900085449, "lr": 0.000184513893557032, "tps": 37216, "wall": 31034.6} {"step": 17624, "train_loss": 3.293865203857422, "lr": 0.0001844951117468475, "tps": 37212, "wall": 31040.1} {"step": 17625, "train_loss": 3.2668306827545166, "lr": 0.00018447633033886427, "tps": 37207, "wall": 31045.7} {"step": 17626, "train_loss": 3.2591395378112793, "lr": 0.0001844575493332951, "tps": 37203, "wall": 31051.2} {"step": 17627, "train_loss": 3.337618827819824, "lr": 0.00018443876873035274, "tps": 37198, "wall": 31056.7} {"step": 17628, "train_loss": 3.279792070388794, "lr": 0.0001844199885302499, "tps": 37194, "wall": 31062.1} {"step": 17629, "train_loss": 3.319112777709961, "lr": 0.0001844012087331994, "tps": 37189, "wall": 31067.5} {"step": 17630, "train_loss": 3.344693183898926, "lr": 0.0001843824293394139, "tps": 37185, "wall": 31072.9} {"step": 17631, "train_loss": 3.3855984210968018, "lr": 0.00018436365034910624, "tps": 37181, "wall": 31078.3} {"step": 17632, "train_loss": 3.2366018295288086, "lr": 0.000184344871762489, "tps": 37176, "wall": 31083.8} {"step": 17633, "train_loss": 3.269463300704956, "lr": 0.00018432609357977496, "tps": 37172, "wall": 31089.3} {"step": 17634, "train_loss": 3.4458868503570557, "lr": 0.0001843073158011769, "tps": 37167, "wall": 31094.7} {"step": 17635, "train_loss": 3.2617244720458984, "lr": 0.00018428853842690753, "tps": 37163, "wall": 31100.2} {"step": 17636, "train_loss": 3.236279010772705, "lr": 0.00018426976145717946, "tps": 37159, "wall": 31105.6} {"step": 17637, "train_loss": 3.3446364402770996, "lr": 0.0001842509848922055, "tps": 37154, "wall": 31111.2} {"step": 17638, "train_loss": 3.2747488021850586, "lr": 0.00018423220873219832, "tps": 37150, "wall": 31116.6} {"step": 17639, "train_loss": 3.3000612258911133, "lr": 0.00018421343297737064, "tps": 37145, "wall": 31122.1} {"step": 17640, "train_loss": 3.3722755908966064, "lr": 0.00018419465762793506, "tps": 37141, "wall": 31127.6} {"step": 17641, "train_loss": 3.2971274852752686, "lr": 0.00018417588268410437, "tps": 37136, "wall": 31133.0} {"step": 17642, "train_loss": 3.339914321899414, "lr": 0.0001841571081460913, "tps": 37132, "wall": 31138.5} {"step": 17643, "train_loss": 3.3622310161590576, "lr": 0.00018413833401410834, "tps": 37128, "wall": 31144.0} {"step": 17644, "train_loss": 3.3731911182403564, "lr": 0.0001841195602883683, "tps": 37123, "wall": 31149.5} {"step": 17645, "train_loss": 3.345364570617676, "lr": 0.00018410078696908384, "tps": 37119, "wall": 31155.0} {"step": 17646, "train_loss": 3.3764867782592773, "lr": 0.0001840820140564676, "tps": 37114, "wall": 31160.5} {"step": 17647, "train_loss": 3.302710771560669, "lr": 0.00018406324155073223, "tps": 37110, "wall": 31165.9} {"step": 17648, "train_loss": 3.367325782775879, "lr": 0.00018404446945209042, "tps": 37105, "wall": 31171.5} {"step": 17649, "train_loss": 3.3697285652160645, "lr": 0.0001840256977607548, "tps": 37101, "wall": 31176.9} {"step": 17650, "train_loss": 3.3186087608337402, "lr": 0.00018400692647693801, "tps": 37097, "wall": 31182.4} {"step": 17651, "train_loss": 3.389061450958252, "lr": 0.0001839881556008527, "tps": 37092, "wall": 31187.8} {"step": 17652, "train_loss": 3.274629831314087, "lr": 0.0001839693851327116, "tps": 37088, "wall": 31193.3} {"step": 17653, "train_loss": 3.279550075531006, "lr": 0.00018395061507272712, "tps": 37084, "wall": 31198.7} {"step": 17654, "train_loss": 3.3116817474365234, "lr": 0.00018393184542111213, "tps": 37079, "wall": 31204.1} {"step": 17655, "train_loss": 3.4347643852233887, "lr": 0.0001839130761780791, "tps": 37075, "wall": 31209.6} {"step": 17656, "train_loss": 3.2547545433044434, "lr": 0.0001838943073438407, "tps": 37070, "wall": 31215.0} {"step": 17657, "train_loss": 3.326385021209717, "lr": 0.00018387553891860954, "tps": 37066, "wall": 31220.5} {"step": 17658, "train_loss": 3.3963522911071777, "lr": 0.00018385677090259822, "tps": 37062, "wall": 31225.9} {"step": 17659, "train_loss": 3.377307653427124, "lr": 0.00018383800329601938, "tps": 37057, "wall": 31231.4} {"step": 17660, "train_loss": 3.3084752559661865, "lr": 0.0001838192360990856, "tps": 37053, "wall": 31236.9} {"step": 17661, "train_loss": 3.3068323135375977, "lr": 0.00018380046931200942, "tps": 37048, "wall": 31242.3} {"step": 17662, "train_loss": 3.3349528312683105, "lr": 0.00018378170293500352, "tps": 37044, "wall": 31247.8} {"step": 17663, "train_loss": 3.4074456691741943, "lr": 0.0001837629369682804, "tps": 37040, "wall": 31253.3} {"step": 17664, "train_loss": 3.2497658729553223, "lr": 0.00018374417141205275, "tps": 37035, "wall": 31258.7} {"step": 17665, "train_loss": 3.3369522094726562, "lr": 0.0001837254062665331, "tps": 37031, "wall": 31264.2} {"step": 17666, "train_loss": 3.304971933364868, "lr": 0.00018370664153193392, "tps": 37027, "wall": 31269.6} {"step": 17667, "train_loss": 3.33624267578125, "lr": 0.00018368787720846795, "tps": 37022, "wall": 31275.1} {"step": 17668, "train_loss": 3.2986021041870117, "lr": 0.00018366911329634758, "tps": 37018, "wall": 31280.6} {"step": 17669, "train_loss": 3.3169779777526855, "lr": 0.0001836503497957856, "tps": 37014, "wall": 31286.0} {"step": 17670, "train_loss": 3.3346645832061768, "lr": 0.00018363158670699434, "tps": 37009, "wall": 31291.6} {"step": 17671, "train_loss": 3.3501524925231934, "lr": 0.00018361282403018642, "tps": 37005, "wall": 31297.0} {"step": 17672, "train_loss": 3.354757785797119, "lr": 0.00018359406176557448, "tps": 37000, "wall": 31302.4} {"step": 17673, "train_loss": 3.304281234741211, "lr": 0.00018357529991337086, "tps": 36996, "wall": 31307.9} {"step": 17674, "train_loss": 3.323209524154663, "lr": 0.0001835565384737883, "tps": 36992, "wall": 31313.3} {"step": 17675, "train_loss": 3.3278298377990723, "lr": 0.00018353777744703923, "tps": 36987, "wall": 31318.7} {"step": 17676, "train_loss": 3.309673309326172, "lr": 0.00018351901683333615, "tps": 36983, "wall": 31324.1} {"step": 17677, "train_loss": 3.29638671875, "lr": 0.00018350025663289166, "tps": 36979, "wall": 31329.6} {"step": 17678, "train_loss": 3.2476019859313965, "lr": 0.0001834814968459182, "tps": 36974, "wall": 31335.0} {"step": 17679, "train_loss": 3.383965492248535, "lr": 0.00018346273747262836, "tps": 36970, "wall": 31340.5} {"step": 17680, "train_loss": 3.314100980758667, "lr": 0.00018344397851323462, "tps": 36966, "wall": 31346.0} {"step": 17681, "train_loss": 3.3967630863189697, "lr": 0.00018342521996794937, "tps": 36961, "wall": 31351.5} {"step": 17682, "train_loss": 3.2583436965942383, "lr": 0.00018340646183698532, "tps": 36957, "wall": 31356.9} {"step": 17683, "train_loss": 3.451998233795166, "lr": 0.00018338770412055483, "tps": 36953, "wall": 31362.3} {"step": 17684, "train_loss": 3.37783145904541, "lr": 0.00018336894681887035, "tps": 36948, "wall": 31367.7} {"step": 17685, "train_loss": 3.2761783599853516, "lr": 0.00018335018993214446, "tps": 36944, "wall": 31373.2} {"step": 17686, "train_loss": 3.323791027069092, "lr": 0.00018333143346058962, "tps": 36940, "wall": 31378.7} {"step": 17687, "train_loss": 3.34700083732605, "lr": 0.0001833126774044182, "tps": 36936, "wall": 31384.0} {"step": 17688, "train_loss": 3.420077085494995, "lr": 0.00018329392176384283, "tps": 36931, "wall": 31389.4} {"step": 17689, "train_loss": 3.215048313140869, "lr": 0.0001832751665390759, "tps": 36927, "wall": 31394.9} {"step": 17690, "train_loss": 3.251572608947754, "lr": 0.0001832564117303299, "tps": 36923, "wall": 31400.4} {"step": 17691, "train_loss": 3.387392520904541, "lr": 0.00018323765733781717, "tps": 36918, "wall": 31405.8} {"step": 17692, "train_loss": 3.3189902305603027, "lr": 0.00018321890336175036, "tps": 36914, "wall": 31411.3} {"step": 17693, "train_loss": 3.212893486022949, "lr": 0.00018320014980234168, "tps": 36910, "wall": 31416.7} {"step": 17694, "train_loss": 3.367670774459839, "lr": 0.00018318139665980372, "tps": 36905, "wall": 31422.2} {"step": 17695, "train_loss": 3.3190855979919434, "lr": 0.0001831626439343489, "tps": 36901, "wall": 31427.7} {"step": 17696, "train_loss": 3.31264591217041, "lr": 0.00018314389162618974, "tps": 36897, "wall": 31433.1} {"step": 17697, "train_loss": 3.2595465183258057, "lr": 0.00018312513973553845, "tps": 36892, "wall": 31438.6} {"step": 17698, "train_loss": 3.349957227706909, "lr": 0.00018310638826260763, "tps": 36888, "wall": 31444.0} {"step": 17699, "train_loss": 3.375227451324463, "lr": 0.0001830876372076096, "tps": 36884, "wall": 31449.5} {"step": 17700, "train_loss": 3.3796918392181396, "lr": 0.00018306888657075682, "tps": 36879, "wall": 31454.9} {"step": 17701, "train_loss": 3.265174388885498, "lr": 0.00018305013635226173, "tps": 36875, "wall": 31460.4} {"step": 17702, "train_loss": 3.2724316120147705, "lr": 0.00018303138655233667, "tps": 36871, "wall": 31465.8} {"step": 17703, "train_loss": 3.2749311923980713, "lr": 0.0001830126371711941, "tps": 36866, "wall": 31471.4} {"step": 17704, "train_loss": 3.251011848449707, "lr": 0.00018299388820904627, "tps": 36862, "wall": 31476.8} {"step": 17705, "train_loss": 3.298353672027588, "lr": 0.00018297513966610576, "tps": 36858, "wall": 31482.3} {"step": 17706, "train_loss": 3.1896138191223145, "lr": 0.00018295639154258488, "tps": 36853, "wall": 31487.8} {"step": 17707, "train_loss": 3.2547779083251953, "lr": 0.00018293764383869597, "tps": 36849, "wall": 31493.2} {"step": 17708, "train_loss": 3.30220365524292, "lr": 0.00018291889655465147, "tps": 36845, "wall": 31498.7} {"step": 17709, "train_loss": 3.2891087532043457, "lr": 0.00018290014969066367, "tps": 36840, "wall": 31504.1} {"step": 17710, "train_loss": 3.297424793243408, "lr": 0.00018288140324694498, "tps": 36836, "wall": 31509.6} {"step": 17711, "train_loss": 3.266411781311035, "lr": 0.0001828626572237078, "tps": 36832, "wall": 31515.1} {"step": 17712, "train_loss": 3.2879135608673096, "lr": 0.00018284391162116443, "tps": 36828, "wall": 31520.5} {"step": 17713, "train_loss": 3.300584316253662, "lr": 0.00018282516643952724, "tps": 36823, "wall": 31526.0} {"step": 17714, "train_loss": 3.27768611907959, "lr": 0.0001828064216790086, "tps": 36819, "wall": 31531.6} {"step": 17715, "train_loss": 3.338456630706787, "lr": 0.00018278767733982077, "tps": 36815, "wall": 31537.0} {"step": 17716, "train_loss": 3.285581350326538, "lr": 0.00018276893342217618, "tps": 36810, "wall": 31542.4} {"step": 17717, "train_loss": 3.3260817527770996, "lr": 0.00018275018992628712, "tps": 36806, "wall": 31547.9} {"step": 17718, "train_loss": 3.3701975345611572, "lr": 0.00018273144685236595, "tps": 36802, "wall": 31553.2} {"step": 17719, "train_loss": 3.30580735206604, "lr": 0.00018271270420062497, "tps": 36798, "wall": 31558.7} {"step": 17720, "train_loss": 3.284308433532715, "lr": 0.00018269396197127642, "tps": 36793, "wall": 31564.1} {"step": 17721, "train_loss": 3.4025073051452637, "lr": 0.00018267522016453275, "tps": 36789, "wall": 31569.6} {"step": 17722, "train_loss": 3.2639994621276855, "lr": 0.00018265647878060618, "tps": 36785, "wall": 31575.1} {"step": 17723, "train_loss": 3.405906915664673, "lr": 0.00018263773781970906, "tps": 36780, "wall": 31580.5} {"step": 17724, "train_loss": 3.270336627960205, "lr": 0.00018261899728205366, "tps": 36776, "wall": 31585.9} {"step": 17725, "train_loss": 3.275515556335449, "lr": 0.00018260025716785227, "tps": 36772, "wall": 31591.5} {"step": 17726, "train_loss": 3.2855255603790283, "lr": 0.0001825815174773172, "tps": 36768, "wall": 31596.9} {"step": 17727, "train_loss": 3.264547109603882, "lr": 0.0001825627782106607, "tps": 36763, "wall": 31602.2} {"step": 17728, "train_loss": 3.239974021911621, "lr": 0.0001825440393680951, "tps": 36759, "wall": 31607.7} {"step": 17729, "train_loss": 3.3864598274230957, "lr": 0.00018252530094983266, "tps": 36755, "wall": 31613.1} {"step": 17730, "train_loss": 3.3725743293762207, "lr": 0.00018250656295608564, "tps": 36751, "wall": 31618.6} {"step": 17731, "train_loss": 3.2693514823913574, "lr": 0.00018248782538706623, "tps": 36746, "wall": 31624.0} {"step": 17732, "train_loss": 3.3000268936157227, "lr": 0.00018246908824298683, "tps": 36742, "wall": 31629.3} {"step": 17733, "train_loss": 3.349609136581421, "lr": 0.00018245035152405966, "tps": 36738, "wall": 31634.8} {"step": 17734, "train_loss": 3.3319952487945557, "lr": 0.00018243161523049688, "tps": 36734, "wall": 31640.2} {"step": 17735, "train_loss": 3.363654613494873, "lr": 0.0001824128793625108, "tps": 36730, "wall": 31645.6} {"step": 17736, "train_loss": 3.3661680221557617, "lr": 0.00018239414392031366, "tps": 36725, "wall": 31651.1} {"step": 17737, "train_loss": 3.2168521881103516, "lr": 0.00018237540890411768, "tps": 36721, "wall": 31656.5} {"step": 17738, "train_loss": 3.2617502212524414, "lr": 0.00018235667431413513, "tps": 36717, "wall": 31661.9} {"step": 17739, "train_loss": 3.26139497756958, "lr": 0.0001823379401505782, "tps": 36713, "wall": 31667.4} {"step": 17740, "train_loss": 3.305797576904297, "lr": 0.00018231920641365913, "tps": 36708, "wall": 31672.8} {"step": 17741, "train_loss": 3.4088377952575684, "lr": 0.00018230047310359012, "tps": 36704, "wall": 31678.3} {"step": 17742, "train_loss": 3.394880533218384, "lr": 0.00018228174022058338, "tps": 36700, "wall": 31683.7} {"step": 17743, "train_loss": 3.345757484436035, "lr": 0.00018226300776485118, "tps": 36696, "wall": 31689.1} {"step": 17744, "train_loss": 3.335212230682373, "lr": 0.00018224427573660564, "tps": 36691, "wall": 31694.6} {"step": 17745, "train_loss": 3.2439844608306885, "lr": 0.00018222554413605894, "tps": 36687, "wall": 31699.9} {"step": 17746, "train_loss": 3.324012279510498, "lr": 0.00018220681296342338, "tps": 36683, "wall": 31705.4} {"step": 17747, "train_loss": 3.302123785018921, "lr": 0.00018218808221891108, "tps": 36679, "wall": 31710.9} {"step": 17748, "train_loss": 3.283205270767212, "lr": 0.00018216935190273418, "tps": 36675, "wall": 31716.3} {"step": 17749, "train_loss": 3.2088775634765625, "lr": 0.00018215062201510493, "tps": 36670, "wall": 31721.7} {"step": 17750, "train_loss": 3.3541226387023926, "lr": 0.0001821318925562355, "tps": 36666, "wall": 31727.2} {"step": 17751, "train_loss": 3.289177894592285, "lr": 0.00018211316352633806, "tps": 36662, "wall": 31732.6} {"step": 17752, "train_loss": 3.304871082305908, "lr": 0.0001820944349256247, "tps": 36658, "wall": 31738.0} {"step": 17753, "train_loss": 3.398251533508301, "lr": 0.0001820757067543077, "tps": 36654, "wall": 31743.4} {"step": 17754, "train_loss": 3.3361101150512695, "lr": 0.0001820569790125991, "tps": 36649, "wall": 31748.9} {"step": 17755, "train_loss": 3.2702317237854004, "lr": 0.00018203825170071104, "tps": 36645, "wall": 31754.3} {"step": 17756, "train_loss": 3.359081745147705, "lr": 0.00018201952481885583, "tps": 36641, "wall": 31759.7} {"step": 17757, "train_loss": 3.279372453689575, "lr": 0.00018200079836724542, "tps": 36637, "wall": 31765.1} {"step": 17758, "train_loss": 3.332791566848755, "lr": 0.000181982072346092, "tps": 36633, "wall": 31770.5} {"step": 17759, "train_loss": 3.251636505126953, "lr": 0.0001819633467556078, "tps": 36628, "wall": 31776.0} {"step": 17760, "train_loss": 3.247255325317383, "lr": 0.00018194462159600488, "tps": 36624, "wall": 31781.4} {"step": 17761, "train_loss": 3.332611083984375, "lr": 0.00018192589686749525, "tps": 36620, "wall": 31786.8} {"step": 17762, "train_loss": 3.2131619453430176, "lr": 0.00018190717257029118, "tps": 36616, "wall": 31792.2} {"step": 17763, "train_loss": 3.343045234680176, "lr": 0.00018188844870460473, "tps": 36612, "wall": 31797.7} {"step": 17764, "train_loss": 3.3052520751953125, "lr": 0.00018186972527064796, "tps": 36607, "wall": 31803.1} {"step": 17765, "train_loss": 3.22037410736084, "lr": 0.000181851002268633, "tps": 36603, "wall": 31808.5} {"step": 17766, "train_loss": 3.4096312522888184, "lr": 0.000181832279698772, "tps": 36599, "wall": 31813.8} {"step": 17767, "train_loss": 3.260596752166748, "lr": 0.00018181355756127695, "tps": 36595, "wall": 31819.3} {"step": 17768, "train_loss": 3.314100742340088, "lr": 0.00018179483585635997, "tps": 36591, "wall": 31824.7} {"step": 17769, "train_loss": 3.2466814517974854, "lr": 0.0001817761145842332, "tps": 36587, "wall": 31830.2} {"step": 17770, "train_loss": 3.274503231048584, "lr": 0.0001817573937451087, "tps": 36582, "wall": 31835.7} {"step": 17771, "train_loss": 3.354381799697876, "lr": 0.00018173867333919844, "tps": 36578, "wall": 31841.1} {"step": 17772, "train_loss": 3.321424722671509, "lr": 0.00018171995336671462, "tps": 36574, "wall": 31846.5} {"step": 17773, "train_loss": 3.386190891265869, "lr": 0.00018170123382786924, "tps": 36570, "wall": 31852.0} {"step": 17774, "train_loss": 3.350559711456299, "lr": 0.00018168251472287428, "tps": 36566, "wall": 31857.4} {"step": 17775, "train_loss": 3.2205727100372314, "lr": 0.00018166379605194193, "tps": 36561, "wall": 31862.9} {"step": 17776, "train_loss": 3.282203197479248, "lr": 0.00018164507781528414, "tps": 36557, "wall": 31868.3} {"step": 17777, "train_loss": 3.2934813499450684, "lr": 0.00018162636001311304, "tps": 36553, "wall": 31873.8} {"step": 17778, "train_loss": 3.226726770401001, "lr": 0.00018160764264564053, "tps": 36549, "wall": 31879.2} {"step": 17779, "train_loss": 3.217466354370117, "lr": 0.00018158892571307873, "tps": 36545, "wall": 31884.6} {"step": 17780, "train_loss": 3.2535476684570312, "lr": 0.00018157020921563972, "tps": 36541, "wall": 31890.1} {"step": 17781, "train_loss": 3.3364481925964355, "lr": 0.0001815514931535354, "tps": 36536, "wall": 31895.6} {"step": 17782, "train_loss": 3.3295490741729736, "lr": 0.0001815327775269779, "tps": 36532, "wall": 31901.0} {"step": 17783, "train_loss": 3.370826005935669, "lr": 0.0001815140623361792, "tps": 36528, "wall": 31906.5} {"step": 17784, "train_loss": 3.285703659057617, "lr": 0.00018149534758135123, "tps": 36524, "wall": 31911.9} {"step": 17785, "train_loss": 3.355664014816284, "lr": 0.00018147663326270608, "tps": 36520, "wall": 31917.4} {"step": 17786, "train_loss": 3.25044846534729, "lr": 0.00018145791938045566, "tps": 36515, "wall": 31922.8} {"step": 17787, "train_loss": 3.2151334285736084, "lr": 0.00018143920593481205, "tps": 36511, "wall": 31928.2} {"step": 17788, "train_loss": 3.349184989929199, "lr": 0.0001814204929259872, "tps": 36507, "wall": 31933.6} {"step": 17789, "train_loss": 3.306765079498291, "lr": 0.00018140178035419305, "tps": 36503, "wall": 31939.0} {"step": 17790, "train_loss": 3.329857110977173, "lr": 0.00018138306821964165, "tps": 36499, "wall": 31944.4} {"step": 17791, "train_loss": 3.4033751487731934, "lr": 0.00018136435652254496, "tps": 36495, "wall": 31949.8} {"step": 17792, "train_loss": 3.2994582653045654, "lr": 0.0001813456452631149, "tps": 36491, "wall": 31955.3} {"step": 17793, "train_loss": 3.183783769607544, "lr": 0.00018132693444156348, "tps": 36486, "wall": 31960.7} {"step": 17794, "train_loss": 3.3597702980041504, "lr": 0.0001813082240581026, "tps": 36482, "wall": 31966.2} {"step": 17795, "train_loss": 3.3909213542938232, "lr": 0.0001812895141129443, "tps": 36478, "wall": 31971.6} {"step": 17796, "train_loss": 3.3695123195648193, "lr": 0.00018127080460630048, "tps": 36474, "wall": 31977.0} {"step": 17797, "train_loss": 3.2673439979553223, "lr": 0.00018125209553838305, "tps": 36470, "wall": 31982.5} {"step": 17798, "train_loss": 3.3312220573425293, "lr": 0.000181233386909404, "tps": 36466, "wall": 31987.9} {"step": 17799, "train_loss": 3.355426788330078, "lr": 0.00018121467871957522, "tps": 36461, "wall": 31993.3} {"step": 17800, "train_loss": 3.3207340240478516, "lr": 0.00018119597096910868, "tps": 36457, "wall": 31998.7} {"step": 17801, "train_loss": 3.317756175994873, "lr": 0.00018117726365821625, "tps": 36453, "wall": 32004.2} {"step": 17802, "train_loss": 3.3751206398010254, "lr": 0.0001811585567871099, "tps": 36449, "wall": 32009.6} {"step": 17803, "train_loss": 3.298834800720215, "lr": 0.00018113985035600152, "tps": 36445, "wall": 32015.1} {"step": 17804, "train_loss": 3.3349456787109375, "lr": 0.00018112114436510298, "tps": 36441, "wall": 32020.6} {"step": 17805, "train_loss": 3.274669647216797, "lr": 0.0001811024388146263, "tps": 36437, "wall": 32026.0} {"step": 17806, "train_loss": 3.337412118911743, "lr": 0.00018108373370478328, "tps": 36432, "wall": 32031.5} {"step": 17807, "train_loss": 3.2512588500976562, "lr": 0.00018106502903578577, "tps": 36428, "wall": 32036.9} {"step": 17808, "train_loss": 3.2869882583618164, "lr": 0.00018104632480784574, "tps": 36424, "wall": 32042.3} {"step": 17809, "train_loss": 3.4007198810577393, "lr": 0.00018102762102117508, "tps": 36420, "wall": 32047.8} {"step": 17810, "train_loss": 3.328373670578003, "lr": 0.00018100891767598557, "tps": 36416, "wall": 32053.2} {"step": 17811, "train_loss": 3.4154458045959473, "lr": 0.0001809902147724892, "tps": 36412, "wall": 32058.6} {"step": 17812, "train_loss": 3.3726067543029785, "lr": 0.00018097151231089785, "tps": 36408, "wall": 32064.1} {"step": 17813, "train_loss": 3.344099521636963, "lr": 0.00018095281029142322, "tps": 36403, "wall": 32069.5} {"step": 17814, "train_loss": 3.3230717182159424, "lr": 0.0001809341087142773, "tps": 36399, "wall": 32075.0} {"step": 17815, "train_loss": 3.264186143875122, "lr": 0.00018091540757967192, "tps": 36395, "wall": 32080.5} {"step": 17816, "train_loss": 3.234532356262207, "lr": 0.0001808967068878189, "tps": 36391, "wall": 32085.9} {"step": 17817, "train_loss": 3.3797316551208496, "lr": 0.00018087800663893009, "tps": 36387, "wall": 32091.4} {"step": 17818, "train_loss": 3.2419538497924805, "lr": 0.0001808593068332174, "tps": 36383, "wall": 32096.9} {"step": 17819, "train_loss": 3.3547730445861816, "lr": 0.00018084060747089255, "tps": 36379, "wall": 32102.3} {"step": 17820, "train_loss": 3.323437452316284, "lr": 0.0001808219085521674, "tps": 36374, "wall": 32107.8} {"step": 17821, "train_loss": 3.3937408924102783, "lr": 0.0001808032100772538, "tps": 36370, "wall": 32113.3} {"step": 17822, "train_loss": 3.283226490020752, "lr": 0.00018078451204636358, "tps": 36366, "wall": 32118.7} {"step": 17823, "train_loss": 3.3084449768066406, "lr": 0.0001807658144597085, "tps": 36362, "wall": 32124.2} {"step": 17824, "train_loss": 3.328490734100342, "lr": 0.00018074711731750042, "tps": 36358, "wall": 32129.7} {"step": 17825, "train_loss": 3.326939821243286, "lr": 0.0001807284206199511, "tps": 36354, "wall": 32135.2} {"step": 17826, "train_loss": 3.3902969360351562, "lr": 0.00018070972436727242, "tps": 36349, "wall": 32140.8} {"step": 17827, "train_loss": 3.271711826324463, "lr": 0.000180691028559676, "tps": 36345, "wall": 32146.3} {"step": 17828, "train_loss": 3.337604284286499, "lr": 0.00018067233319737377, "tps": 36341, "wall": 32151.7} {"step": 17829, "train_loss": 3.324551582336426, "lr": 0.00018065363828057755, "tps": 36337, "wall": 32157.2} {"step": 17830, "train_loss": 3.3689446449279785, "lr": 0.00018063494380949897, "tps": 36333, "wall": 32162.7} {"step": 17831, "train_loss": 3.2663490772247314, "lr": 0.0001806162497843499, "tps": 36329, "wall": 32168.1} {"step": 17832, "train_loss": 3.345050811767578, "lr": 0.0001805975562053421, "tps": 36324, "wall": 32173.5} {"step": 17833, "train_loss": 3.3598551750183105, "lr": 0.00018057886307268727, "tps": 36320, "wall": 32179.1} {"step": 17834, "train_loss": 3.254776954650879, "lr": 0.00018056017038659724, "tps": 36316, "wall": 32184.6} {"step": 17835, "train_loss": 3.2924022674560547, "lr": 0.00018054147814728375, "tps": 36312, "wall": 32190.1} {"step": 17836, "train_loss": 3.4285006523132324, "lr": 0.00018052278635495852, "tps": 36308, "wall": 32195.6} {"step": 17837, "train_loss": 3.3444290161132812, "lr": 0.00018050409500983326, "tps": 36303, "wall": 32201.2} {"step": 17838, "train_loss": 3.326244831085205, "lr": 0.00018048540411211978, "tps": 36299, "wall": 32206.7} {"step": 17839, "train_loss": 3.3627660274505615, "lr": 0.0001804667136620298, "tps": 36295, "wall": 32212.2} {"step": 17840, "train_loss": 3.3143796920776367, "lr": 0.00018044802365977503, "tps": 36291, "wall": 32217.8} {"step": 17841, "train_loss": 3.2965450286865234, "lr": 0.00018042933410556712, "tps": 36287, "wall": 32223.3} {"step": 17842, "train_loss": 3.2634060382843018, "lr": 0.00018041064499961794, "tps": 36282, "wall": 32228.9} {"step": 17843, "train_loss": 3.252103805541992, "lr": 0.00018039195634213907, "tps": 36278, "wall": 32234.4} {"step": 17844, "train_loss": 3.212486982345581, "lr": 0.00018037326813334222, "tps": 36274, "wall": 32240.0} {"step": 17845, "train_loss": 3.2602529525756836, "lr": 0.00018035458037343922, "tps": 36270, "wall": 32245.6} {"step": 17846, "train_loss": 3.3738954067230225, "lr": 0.00018033589306264163, "tps": 36265, "wall": 32251.2} {"step": 17847, "train_loss": 3.2601399421691895, "lr": 0.0001803172062011612, "tps": 36261, "wall": 32256.8} {"step": 17848, "train_loss": 3.296731948852539, "lr": 0.00018029851978920957, "tps": 36257, "wall": 32262.3} {"step": 17849, "train_loss": 3.416247606277466, "lr": 0.0001802798338269985, "tps": 36253, "wall": 32267.9} {"step": 17850, "train_loss": 3.2782464027404785, "lr": 0.00018026114831473967, "tps": 36249, "wall": 32273.4} {"step": 17851, "train_loss": 3.2293894290924072, "lr": 0.00018024246325264458, "tps": 36244, "wall": 32279.0} {"step": 17852, "train_loss": 3.2377545833587646, "lr": 0.0001802237786409251, "tps": 36240, "wall": 32284.5} {"step": 17853, "train_loss": 3.2236714363098145, "lr": 0.0001802050944797928, "tps": 36236, "wall": 32290.1} {"step": 17854, "train_loss": 3.280900239944458, "lr": 0.0001801864107694593, "tps": 36232, "wall": 32295.6} {"step": 17855, "train_loss": 3.2639827728271484, "lr": 0.0001801677275101363, "tps": 36228, "wall": 32301.2} {"step": 17856, "train_loss": 3.400684118270874, "lr": 0.00018014904470203548, "tps": 36223, "wall": 32306.9} {"step": 17857, "train_loss": 3.3950986862182617, "lr": 0.00018013036234536842, "tps": 36219, "wall": 32312.5} {"step": 17858, "train_loss": 3.2624478340148926, "lr": 0.00018011168044034675, "tps": 36215, "wall": 32318.1} {"step": 17859, "train_loss": 3.3632164001464844, "lr": 0.0001800929989871822, "tps": 36211, "wall": 32323.7} {"step": 17860, "train_loss": 3.201169490814209, "lr": 0.0001800743179860862, "tps": 36206, "wall": 32329.3} {"step": 17861, "train_loss": 3.29697847366333, "lr": 0.00018005563743727057, "tps": 36202, "wall": 32334.9} {"step": 17862, "train_loss": 3.3377881050109863, "lr": 0.0001800369573409468, "tps": 36198, "wall": 32340.5} {"step": 17863, "train_loss": 3.305372476577759, "lr": 0.00018001827769732653, "tps": 36193, "wall": 32346.2} {"step": 17864, "train_loss": 3.243867874145508, "lr": 0.0001799995985066214, "tps": 36189, "wall": 32351.8} {"step": 17865, "train_loss": 3.3872218132019043, "lr": 0.00017998091976904296, "tps": 36185, "wall": 32357.4} {"step": 17866, "train_loss": 3.397158622741699, "lr": 0.00017996224148480287, "tps": 36181, "wall": 32363.0} {"step": 17867, "train_loss": 3.3167519569396973, "lr": 0.00017994356365411265, "tps": 36176, "wall": 32368.7} {"step": 17868, "train_loss": 3.249363660812378, "lr": 0.0001799248862771839, "tps": 36172, "wall": 32374.4} {"step": 17869, "train_loss": 3.2853245735168457, "lr": 0.00017990620935422823, "tps": 36168, "wall": 32380.0} {"step": 17870, "train_loss": 3.2155609130859375, "lr": 0.00017988753288545714, "tps": 36163, "wall": 32385.7} {"step": 17871, "train_loss": 3.3091602325439453, "lr": 0.00017986885687108227, "tps": 36159, "wall": 32391.2} {"step": 17872, "train_loss": 3.295095443725586, "lr": 0.0001798501813113152, "tps": 36155, "wall": 32396.8} {"step": 17873, "train_loss": 3.3249595165252686, "lr": 0.00017983150620636738, "tps": 36151, "wall": 32402.5} {"step": 17874, "train_loss": 3.2402517795562744, "lr": 0.0001798128315564505, "tps": 36147, "wall": 32408.1} {"step": 17875, "train_loss": 3.3303680419921875, "lr": 0.00017979415736177597, "tps": 36142, "wall": 32413.7} {"step": 17876, "train_loss": 3.2845990657806396, "lr": 0.00017977548362255546, "tps": 36138, "wall": 32419.3} {"step": 17877, "train_loss": 3.237611770629883, "lr": 0.00017975681033900043, "tps": 36134, "wall": 32425.0} {"step": 17878, "train_loss": 3.3579485416412354, "lr": 0.00017973813751132238, "tps": 36129, "wall": 32430.7} {"step": 17879, "train_loss": 3.3703298568725586, "lr": 0.00017971946513973297, "tps": 36125, "wall": 32436.4} {"step": 17880, "train_loss": 3.3367502689361572, "lr": 0.00017970079322444363, "tps": 36121, "wall": 32442.1} {"step": 17881, "train_loss": 3.3216071128845215, "lr": 0.00017968212176566582, "tps": 36116, "wall": 32447.8} {"step": 17882, "train_loss": 3.257495880126953, "lr": 0.0001796634507636111, "tps": 36112, "wall": 32453.5} {"step": 17883, "train_loss": 3.3193273544311523, "lr": 0.00017964478021849107, "tps": 36108, "wall": 32459.2} {"step": 17884, "train_loss": 3.32771635055542, "lr": 0.00017962611013051712, "tps": 36104, "wall": 32464.8} {"step": 17885, "train_loss": 3.2281851768493652, "lr": 0.00017960744049990077, "tps": 36099, "wall": 32470.5} {"step": 17886, "train_loss": 3.3330795764923096, "lr": 0.00017958877132685355, "tps": 36095, "wall": 32476.2} {"step": 17887, "train_loss": 3.3096976280212402, "lr": 0.0001795701026115869, "tps": 36091, "wall": 32481.9} {"step": 17888, "train_loss": 3.30251145362854, "lr": 0.00017955143435431227, "tps": 36086, "wall": 32487.6} {"step": 17889, "train_loss": 3.208854913711548, "lr": 0.00017953276655524128, "tps": 36082, "wall": 32493.4} {"step": 17890, "train_loss": 3.230337381362915, "lr": 0.00017951409921458523, "tps": 36077, "wall": 32499.2} {"step": 17891, "train_loss": 3.408658981323242, "lr": 0.00017949543233255564, "tps": 36073, "wall": 32504.8} {"step": 17892, "train_loss": 3.3859686851501465, "lr": 0.000179476765909364, "tps": 36069, "wall": 32510.6} {"step": 17893, "train_loss": 3.296496868133545, "lr": 0.0001794580999452218, "tps": 36065, "wall": 32516.3} {"step": 17894, "train_loss": 3.2565064430236816, "lr": 0.00017943943444034032, "tps": 36060, "wall": 32521.9} {"step": 17895, "train_loss": 3.3572356700897217, "lr": 0.0001794207693949312, "tps": 36056, "wall": 32527.7} {"step": 17896, "train_loss": 3.268275499343872, "lr": 0.00017940210480920583, "tps": 36052, "wall": 32533.5} {"step": 17897, "train_loss": 3.2996439933776855, "lr": 0.00017938344068337556, "tps": 36047, "wall": 32539.3} {"step": 17898, "train_loss": 3.431969165802002, "lr": 0.0001793647770176519, "tps": 36043, "wall": 32544.9} {"step": 17899, "train_loss": 3.412971019744873, "lr": 0.0001793461138122462, "tps": 36038, "wall": 32550.7} {"step": 17900, "train_loss": 3.265596628189087, "lr": 0.00017932745106736996, "tps": 36034, "wall": 32556.5} {"step": 17901, "train_loss": 3.3302483558654785, "lr": 0.0001793087887832346, "tps": 36030, "wall": 32562.2} {"step": 17902, "train_loss": 3.3364243507385254, "lr": 0.00017929012696005136, "tps": 36025, "wall": 32567.9} {"step": 17903, "train_loss": 3.307730197906494, "lr": 0.00017927146559803186, "tps": 36021, "wall": 32573.6} {"step": 17904, "train_loss": 3.25429630279541, "lr": 0.00017925280469738736, "tps": 36017, "wall": 32579.3} {"step": 17905, "train_loss": 3.288271188735962, "lr": 0.0001792341442583293, "tps": 36013, "wall": 32585.1} {"step": 17906, "train_loss": 3.303589344024658, "lr": 0.00017921548428106912, "tps": 36008, "wall": 32590.8} {"step": 17907, "train_loss": 3.28971266746521, "lr": 0.00017919682476581804, "tps": 36004, "wall": 32596.5} {"step": 17908, "train_loss": 3.2892231941223145, "lr": 0.0001791781657127876, "tps": 36000, "wall": 32602.3} {"step": 17909, "train_loss": 3.2705636024475098, "lr": 0.00017915950712218907, "tps": 35995, "wall": 32608.0} {"step": 17910, "train_loss": 3.3087985515594482, "lr": 0.00017914084899423393, "tps": 35991, "wall": 32613.9} {"step": 17911, "train_loss": 3.3126044273376465, "lr": 0.0001791221913291334, "tps": 35986, "wall": 32619.7} {"step": 17912, "train_loss": 3.2278661727905273, "lr": 0.00017910353412709887, "tps": 35982, "wall": 32625.5} {"step": 17913, "train_loss": 3.399601936340332, "lr": 0.00017908487738834178, "tps": 35978, "wall": 32631.3} {"step": 17914, "train_loss": 3.282632827758789, "lr": 0.00017906622111307335, "tps": 35973, "wall": 32637.0} {"step": 17915, "train_loss": 3.3058581352233887, "lr": 0.00017904756530150504, "tps": 35969, "wall": 32642.7} {"step": 17916, "train_loss": 3.243274211883545, "lr": 0.00017902890995384816, "tps": 35965, "wall": 32648.4} {"step": 17917, "train_loss": 3.332031488418579, "lr": 0.0001790102550703139, "tps": 35960, "wall": 32654.2} {"step": 17918, "train_loss": 3.2527971267700195, "lr": 0.00017899160065111373, "tps": 35956, "wall": 32659.9} {"step": 17919, "train_loss": 3.274261474609375, "lr": 0.00017897294669645892, "tps": 35952, "wall": 32665.7} {"step": 17920, "train_loss": 3.2562990188598633, "lr": 0.00017895429320656083, "tps": 35947, "wall": 32671.5} {"step": 17921, "train_loss": 3.3422093391418457, "lr": 0.00017893564018163068, "tps": 35943, "wall": 32677.3} {"step": 17922, "train_loss": 3.353890895843506, "lr": 0.00017891698762187983, "tps": 35939, "wall": 32683.1} {"step": 17923, "train_loss": 3.3609375953674316, "lr": 0.0001788983355275196, "tps": 35934, "wall": 32688.8} {"step": 17924, "train_loss": 3.4296650886535645, "lr": 0.00017887968389876125, "tps": 35930, "wall": 32694.7} {"step": 17925, "train_loss": 3.290973663330078, "lr": 0.000178861032735816, "tps": 35926, "wall": 32700.4} {"step": 17926, "train_loss": 3.304051637649536, "lr": 0.00017884238203889528, "tps": 35921, "wall": 32706.3} {"step": 17927, "train_loss": 3.284149646759033, "lr": 0.00017882373180821021, "tps": 35917, "wall": 32712.1} {"step": 17928, "train_loss": 3.2527337074279785, "lr": 0.00017880508204397213, "tps": 35913, "wall": 32717.8} {"step": 17929, "train_loss": 3.3094029426574707, "lr": 0.00017878643274639236, "tps": 35908, "wall": 32723.6} {"step": 17930, "train_loss": 3.263477325439453, "lr": 0.0001787677839156821, "tps": 35904, "wall": 32729.4} {"step": 17931, "train_loss": 3.309843063354492, "lr": 0.00017874913555205262, "tps": 35899, "wall": 32735.3} {"step": 17932, "train_loss": 3.390538215637207, "lr": 0.00017873048765571512, "tps": 35895, "wall": 32741.1} {"step": 17933, "train_loss": 3.268028974533081, "lr": 0.00017871184022688095, "tps": 35891, "wall": 32747.0} {"step": 17934, "train_loss": 3.3194382190704346, "lr": 0.00017869319326576126, "tps": 35886, "wall": 32752.8} {"step": 17935, "train_loss": 3.2313289642333984, "lr": 0.00017867454677256728, "tps": 35882, "wall": 32758.5} {"step": 17936, "train_loss": 3.175218105316162, "lr": 0.00017865590074751027, "tps": 35878, "wall": 32764.3} {"step": 17937, "train_loss": 3.30471134185791, "lr": 0.0001786372551908015, "tps": 35873, "wall": 32770.1} {"step": 17938, "train_loss": 3.2824854850769043, "lr": 0.00017861861010265212, "tps": 35869, "wall": 32775.9} {"step": 17939, "train_loss": 3.230288505554199, "lr": 0.00017859996548327337, "tps": 35865, "wall": 32781.6} {"step": 17940, "train_loss": 3.3412556648254395, "lr": 0.00017858132133287646, "tps": 35860, "wall": 32787.4} {"step": 17941, "train_loss": 3.4113430976867676, "lr": 0.00017856267765167254, "tps": 35856, "wall": 32793.2} {"step": 17942, "train_loss": 3.3534889221191406, "lr": 0.00017854403443987287, "tps": 35852, "wall": 32799.0} {"step": 17943, "train_loss": 3.3144845962524414, "lr": 0.00017852539169768865, "tps": 35847, "wall": 32804.8} {"step": 17944, "train_loss": 3.3770065307617188, "lr": 0.000178506749425331, "tps": 35843, "wall": 32810.7} {"step": 17945, "train_loss": 3.3148486614227295, "lr": 0.00017848810762301115, "tps": 35838, "wall": 32816.5} {"step": 17946, "train_loss": 3.358591318130493, "lr": 0.00017846946629094027, "tps": 35834, "wall": 32822.4} {"step": 17947, "train_loss": 3.4114303588867188, "lr": 0.00017845082542932952, "tps": 35830, "wall": 32828.1} {"step": 17948, "train_loss": 3.378844738006592, "lr": 0.00017843218503839006, "tps": 35825, "wall": 32834.0} {"step": 17949, "train_loss": 3.2847766876220703, "lr": 0.00017841354511833303, "tps": 35821, "wall": 32839.7} {"step": 17950, "train_loss": 3.229088306427002, "lr": 0.00017839490566936967, "tps": 35817, "wall": 32845.6} {"step": 17951, "train_loss": 3.368741035461426, "lr": 0.00017837626669171103, "tps": 35812, "wall": 32851.5} {"step": 17952, "train_loss": 3.4402523040771484, "lr": 0.00017835762818556837, "tps": 35808, "wall": 32857.3} {"step": 17953, "train_loss": 3.1803178787231445, "lr": 0.0001783389901511527, "tps": 35804, "wall": 32863.1} {"step": 17954, "train_loss": 3.382486343383789, "lr": 0.00017832035258867515, "tps": 35799, "wall": 32869.0} {"step": 17955, "train_loss": 3.29079270362854, "lr": 0.00017830171549834697, "tps": 35795, "wall": 32874.9} {"step": 17956, "train_loss": 3.2306623458862305, "lr": 0.00017828307888037917, "tps": 35790, "wall": 32880.7} {"step": 17957, "train_loss": 3.2763166427612305, "lr": 0.00017826444273498292, "tps": 35786, "wall": 32886.5} {"step": 17958, "train_loss": 3.1882944107055664, "lr": 0.00017824580706236933, "tps": 35782, "wall": 32892.4} {"step": 17959, "train_loss": 3.2409915924072266, "lr": 0.00017822717186274947, "tps": 35777, "wall": 32898.2} {"step": 17960, "train_loss": 3.386021614074707, "lr": 0.0001782085371363345, "tps": 35773, "wall": 32904.0} {"step": 17961, "train_loss": 3.3585636615753174, "lr": 0.00017818990288333546, "tps": 35769, "wall": 32909.9} {"step": 17962, "train_loss": 3.267086982727051, "lr": 0.00017817126910396348, "tps": 35764, "wall": 32915.8} {"step": 17963, "train_loss": 3.3446083068847656, "lr": 0.0001781526357984296, "tps": 35760, "wall": 32921.6} {"step": 17964, "train_loss": 3.3056399822235107, "lr": 0.00017813400296694493, "tps": 35756, "wall": 32927.5} {"step": 17965, "train_loss": 3.2308850288391113, "lr": 0.00017811537060972058, "tps": 35751, "wall": 32933.3} {"step": 17966, "train_loss": 3.390324115753174, "lr": 0.00017809673872696755, "tps": 35747, "wall": 32939.2} {"step": 17967, "train_loss": 3.2696657180786133, "lr": 0.0001780781073188969, "tps": 35742, "wall": 32945.2} {"step": 17968, "train_loss": 3.223780632019043, "lr": 0.00017805947638571977, "tps": 35738, "wall": 32951.0} {"step": 17969, "train_loss": 3.2718818187713623, "lr": 0.00017804084592764713, "tps": 35734, "wall": 32956.8} {"step": 17970, "train_loss": 3.3618359565734863, "lr": 0.00017802221594489005, "tps": 35729, "wall": 32962.7} {"step": 17971, "train_loss": 3.233823299407959, "lr": 0.0001780035864376596, "tps": 35725, "wall": 32968.5} {"step": 17972, "train_loss": 3.261176109313965, "lr": 0.0001779849574061668, "tps": 35721, "wall": 32974.4} {"step": 17973, "train_loss": 3.3060812950134277, "lr": 0.00017796632885062262, "tps": 35716, "wall": 32980.2} {"step": 17974, "train_loss": 3.3434648513793945, "lr": 0.00017794770077123818, "tps": 35712, "wall": 32986.1} {"step": 17975, "train_loss": 3.2842557430267334, "lr": 0.0001779290731682245, "tps": 35707, "wall": 32991.9} {"step": 17976, "train_loss": 3.288910388946533, "lr": 0.0001779104460417925, "tps": 35703, "wall": 32997.8} {"step": 17977, "train_loss": 3.2633304595947266, "lr": 0.00017789181939215326, "tps": 35699, "wall": 33003.7} {"step": 17978, "train_loss": 3.349508285522461, "lr": 0.0001778731932195178, "tps": 35694, "wall": 33009.5} {"step": 17979, "train_loss": 3.4139156341552734, "lr": 0.00017785456752409705, "tps": 35690, "wall": 33015.4} {"step": 17980, "train_loss": 3.3841636180877686, "lr": 0.00017783594230610207, "tps": 35686, "wall": 33021.3} {"step": 17981, "train_loss": 3.2503457069396973, "lr": 0.00017781731756574373, "tps": 35681, "wall": 33027.1} {"step": 17982, "train_loss": 3.168947696685791, "lr": 0.00017779869330323322, "tps": 35677, "wall": 33033.1} {"step": 17983, "train_loss": 3.3441903591156006, "lr": 0.00017778006951878132, "tps": 35673, "wall": 33038.9} {"step": 17984, "train_loss": 3.4365618228912354, "lr": 0.00017776144621259906, "tps": 35668, "wall": 33044.8} {"step": 17985, "train_loss": 3.3562865257263184, "lr": 0.0001777428233848975, "tps": 35664, "wall": 33050.7} {"step": 17986, "train_loss": 3.5050342082977295, "lr": 0.00017772420103588746, "tps": 35659, "wall": 33056.6} {"step": 17987, "train_loss": 3.3213679790496826, "lr": 0.00017770557916577996, "tps": 35655, "wall": 33062.4} {"step": 17988, "train_loss": 3.33836030960083, "lr": 0.00017768695777478595, "tps": 35651, "wall": 33068.3} {"step": 17989, "train_loss": 3.295523166656494, "lr": 0.00017766833686311642, "tps": 35646, "wall": 33074.2} {"step": 17990, "train_loss": 3.2844431400299072, "lr": 0.00017764971643098224, "tps": 35642, "wall": 33080.0} {"step": 17991, "train_loss": 3.2973814010620117, "lr": 0.00017763109647859433, "tps": 35638, "wall": 33085.9} {"step": 17992, "train_loss": 3.3297324180603027, "lr": 0.00017761247700616371, "tps": 35633, "wall": 33091.9} {"step": 17993, "train_loss": 3.2081451416015625, "lr": 0.0001775938580139012, "tps": 35629, "wall": 33097.7} {"step": 17994, "train_loss": 3.2512288093566895, "lr": 0.00017757523950201774, "tps": 35625, "wall": 33103.5} {"step": 17995, "train_loss": 3.2100210189819336, "lr": 0.00017755662147072432, "tps": 35620, "wall": 33109.4} {"step": 17996, "train_loss": 3.309614419937134, "lr": 0.0001775380039202317, "tps": 35616, "wall": 33115.2} {"step": 17997, "train_loss": 3.241241216659546, "lr": 0.00017751938685075093, "tps": 35612, "wall": 33121.1} {"step": 17998, "train_loss": 3.3460803031921387, "lr": 0.00017750077026249284, "tps": 35607, "wall": 33126.9} {"step": 17999, "train_loss": 3.329948902130127, "lr": 0.00017748215415566834, "tps": 35603, "wall": 33132.7} {"step": 18000, "train_loss": 3.321746349334717, "lr": 0.00017746353853048826, "tps": 35599, "wall": 33138.5, "val_loss_monitor": 3.409449970709997} {"step": 18001, "train_loss": 3.2144365310668945, "lr": 0.00017744492338716352, "tps": 35555, "wall": 33181.5} {"step": 18002, "train_loss": 3.339214563369751, "lr": 0.00017742630872590503, "tps": 35551, "wall": 33187.3} {"step": 18003, "train_loss": 3.264885902404785, "lr": 0.00017740769454692359, "tps": 35546, "wall": 33193.2} {"step": 18004, "train_loss": 3.315762758255005, "lr": 0.00017738908085043008, "tps": 35542, "wall": 33199.1} {"step": 18005, "train_loss": 3.306199073791504, "lr": 0.0001773704676366354, "tps": 35538, "wall": 33204.9} {"step": 18006, "train_loss": 3.3781540393829346, "lr": 0.00017735185490575038, "tps": 35533, "wall": 33210.8} {"step": 18007, "train_loss": 3.28287410736084, "lr": 0.0001773332426579858, "tps": 35529, "wall": 33216.7} {"step": 18008, "train_loss": 3.3375797271728516, "lr": 0.00017731463089355255, "tps": 35525, "wall": 33222.5} {"step": 18009, "train_loss": 3.344796895980835, "lr": 0.00017729601961266153, "tps": 35520, "wall": 33228.5} {"step": 18010, "train_loss": 3.322826385498047, "lr": 0.00017727740881552347, "tps": 35516, "wall": 33234.3} {"step": 18011, "train_loss": 3.3276965618133545, "lr": 0.00017725879850234922, "tps": 35512, "wall": 33240.1} {"step": 18012, "train_loss": 3.3898236751556396, "lr": 0.00017724018867334968, "tps": 35508, "wall": 33245.9} {"step": 18013, "train_loss": 3.283310890197754, "lr": 0.00017722157932873557, "tps": 35503, "wall": 33251.8} {"step": 18014, "train_loss": 3.238295316696167, "lr": 0.0001772029704687177, "tps": 35499, "wall": 33257.6} {"step": 18015, "train_loss": 3.3388726711273193, "lr": 0.0001771843620935069, "tps": 35495, "wall": 33263.4} {"step": 18016, "train_loss": 3.3373007774353027, "lr": 0.00017716575420331397, "tps": 35491, "wall": 33269.3} {"step": 18017, "train_loss": 3.260819911956787, "lr": 0.00017714714679834966, "tps": 35486, "wall": 33275.2} {"step": 18018, "train_loss": 3.3255224227905273, "lr": 0.0001771285398788248, "tps": 35482, "wall": 33281.0} {"step": 18019, "train_loss": 3.3488893508911133, "lr": 0.00017710993344495024, "tps": 35478, "wall": 33286.7} {"step": 18020, "train_loss": 3.208933115005493, "lr": 0.00017709132749693657, "tps": 35474, "wall": 33292.5} {"step": 18021, "train_loss": 3.218567132949829, "lr": 0.00017707272203499472, "tps": 35469, "wall": 33298.3} {"step": 18022, "train_loss": 3.361983299255371, "lr": 0.0001770541170593354, "tps": 35465, "wall": 33304.1} {"step": 18023, "train_loss": 3.317814588546753, "lr": 0.0001770355125701693, "tps": 35461, "wall": 33309.9} {"step": 18024, "train_loss": 3.409630060195923, "lr": 0.00017701690856770732, "tps": 35457, "wall": 33315.7} {"step": 18025, "train_loss": 3.281360626220703, "lr": 0.00017699830505216006, "tps": 35453, "wall": 33321.4} {"step": 18026, "train_loss": 3.3439533710479736, "lr": 0.0001769797020237384, "tps": 35449, "wall": 33327.2} {"step": 18027, "train_loss": 3.377045154571533, "lr": 0.00017696109948265294, "tps": 35444, "wall": 33333.0} {"step": 18028, "train_loss": 3.262965440750122, "lr": 0.0001769424974291145, "tps": 35440, "wall": 33338.7} {"step": 18029, "train_loss": 3.316462516784668, "lr": 0.00017692389586333377, "tps": 35436, "wall": 33344.5} {"step": 18030, "train_loss": 3.2709901332855225, "lr": 0.00017690529478552147, "tps": 35432, "wall": 33350.3} {"step": 18031, "train_loss": 3.327732801437378, "lr": 0.00017688669419588834, "tps": 35428, "wall": 33356.1} {"step": 18032, "train_loss": 3.265453577041626, "lr": 0.00017686809409464508, "tps": 35424, "wall": 33361.8} {"step": 18033, "train_loss": 3.240640640258789, "lr": 0.00017684949448200236, "tps": 35419, "wall": 33367.5} {"step": 18034, "train_loss": 3.283475399017334, "lr": 0.0001768308953581709, "tps": 35415, "wall": 33373.2} {"step": 18035, "train_loss": 3.296173572540283, "lr": 0.00017681229672336136, "tps": 35411, "wall": 33379.0} {"step": 18036, "train_loss": 3.4053049087524414, "lr": 0.00017679369857778453, "tps": 35407, "wall": 33384.7} {"step": 18037, "train_loss": 3.289982795715332, "lr": 0.000176775100921651, "tps": 35403, "wall": 33390.4} {"step": 18038, "train_loss": 3.327817916870117, "lr": 0.00017675650375517145, "tps": 35399, "wall": 33396.2} {"step": 18039, "train_loss": 3.2740554809570312, "lr": 0.0001767379070785566, "tps": 35395, "wall": 33401.9} {"step": 18040, "train_loss": 3.311636209487915, "lr": 0.00017671931089201706, "tps": 35391, "wall": 33407.6} {"step": 18041, "train_loss": 3.307114601135254, "lr": 0.00017670071519576346, "tps": 35387, "wall": 33413.3} {"step": 18042, "train_loss": 3.2075085639953613, "lr": 0.0001766821199900065, "tps": 35383, "wall": 33419.0} {"step": 18043, "train_loss": 3.334268808364868, "lr": 0.00017666352527495688, "tps": 35378, "wall": 33424.7} {"step": 18044, "train_loss": 3.4141228199005127, "lr": 0.00017664493105082517, "tps": 35374, "wall": 33430.3} {"step": 18045, "train_loss": 3.418132781982422, "lr": 0.00017662633731782204, "tps": 35370, "wall": 33436.0} {"step": 18046, "train_loss": 3.2857749462127686, "lr": 0.00017660774407615812, "tps": 35366, "wall": 33441.7} {"step": 18047, "train_loss": 3.3439018726348877, "lr": 0.00017658915132604398, "tps": 35362, "wall": 33447.3} {"step": 18048, "train_loss": 3.2969772815704346, "lr": 0.0001765705590676903, "tps": 35358, "wall": 33453.0} {"step": 18049, "train_loss": 3.2858972549438477, "lr": 0.0001765519673013077, "tps": 35354, "wall": 33458.7} {"step": 18050, "train_loss": 3.3423752784729004, "lr": 0.00017653337602710676, "tps": 35350, "wall": 33464.3} {"step": 18051, "train_loss": 3.356631278991699, "lr": 0.00017651478524529805, "tps": 35346, "wall": 33470.0} {"step": 18052, "train_loss": 3.3518776893615723, "lr": 0.00017649619495609223, "tps": 35342, "wall": 33475.6} {"step": 18053, "train_loss": 3.320277214050293, "lr": 0.0001764776051596999, "tps": 35338, "wall": 33481.3} {"step": 18054, "train_loss": 3.3022608757019043, "lr": 0.00017645901585633156, "tps": 35334, "wall": 33486.9} {"step": 18055, "train_loss": 3.1968460083007812, "lr": 0.00017644042704619784, "tps": 35330, "wall": 33492.5} {"step": 18056, "train_loss": 3.367680549621582, "lr": 0.00017642183872950939, "tps": 35326, "wall": 33498.1} {"step": 18057, "train_loss": 3.2271058559417725, "lr": 0.00017640325090647666, "tps": 35322, "wall": 33503.7} {"step": 18058, "train_loss": 3.2681162357330322, "lr": 0.00017638466357731023, "tps": 35318, "wall": 33509.4} {"step": 18059, "train_loss": 3.242452621459961, "lr": 0.00017636607674222074, "tps": 35314, "wall": 33515.2} {"step": 18060, "train_loss": 3.26339054107666, "lr": 0.00017634749040141868, "tps": 35310, "wall": 33520.8} {"step": 18061, "train_loss": 3.210629940032959, "lr": 0.0001763289045551146, "tps": 35306, "wall": 33526.5} {"step": 18062, "train_loss": 3.2934913635253906, "lr": 0.00017631031920351906, "tps": 35302, "wall": 33532.2} {"step": 18063, "train_loss": 3.254911422729492, "lr": 0.0001762917343468426, "tps": 35298, "wall": 33537.7} {"step": 18064, "train_loss": 3.3888955116271973, "lr": 0.0001762731499852957, "tps": 35294, "wall": 33543.4} {"step": 18065, "train_loss": 3.3865034580230713, "lr": 0.00017625456611908895, "tps": 35290, "wall": 33549.0} {"step": 18066, "train_loss": 3.233501672744751, "lr": 0.00017623598274843288, "tps": 35286, "wall": 33554.6} {"step": 18067, "train_loss": 3.1719908714294434, "lr": 0.00017621739987353787, "tps": 35283, "wall": 33560.2} {"step": 18068, "train_loss": 3.3447699546813965, "lr": 0.0001761988174946146, "tps": 35279, "wall": 33565.7} {"step": 18069, "train_loss": 3.4031059741973877, "lr": 0.00017618023561187345, "tps": 35275, "wall": 33571.4} {"step": 18070, "train_loss": 3.249630928039551, "lr": 0.00017616165422552503, "tps": 35271, "wall": 33577.0} {"step": 18071, "train_loss": 3.2691917419433594, "lr": 0.00017614307333577967, "tps": 35267, "wall": 33582.6} {"step": 18072, "train_loss": 3.268627166748047, "lr": 0.00017612449294284797, "tps": 35263, "wall": 33588.2} {"step": 18073, "train_loss": 3.273336410522461, "lr": 0.00017610591304694046, "tps": 35259, "wall": 33593.8} {"step": 18074, "train_loss": 3.3474059104919434, "lr": 0.00017608733364826747, "tps": 35255, "wall": 33599.4} {"step": 18075, "train_loss": 3.259047269821167, "lr": 0.00017606875474703956, "tps": 35251, "wall": 33605.0} {"step": 18076, "train_loss": 3.238644599914551, "lr": 0.00017605017634346722, "tps": 35247, "wall": 33610.5} {"step": 18077, "train_loss": 3.3565967082977295, "lr": 0.00017603159843776077, "tps": 35243, "wall": 33616.2} {"step": 18078, "train_loss": 3.316490411758423, "lr": 0.00017601302103013077, "tps": 35239, "wall": 33621.7} {"step": 18079, "train_loss": 3.3574633598327637, "lr": 0.00017599444412078768, "tps": 35235, "wall": 33627.3} {"step": 18080, "train_loss": 3.316918134689331, "lr": 0.00017597586770994194, "tps": 35232, "wall": 33632.9} {"step": 18081, "train_loss": 3.3166415691375732, "lr": 0.00017595729179780388, "tps": 35228, "wall": 33638.5} {"step": 18082, "train_loss": 3.334343433380127, "lr": 0.00017593871638458403, "tps": 35224, "wall": 33644.2} {"step": 18083, "train_loss": 3.4221482276916504, "lr": 0.00017592014147049283, "tps": 35220, "wall": 33649.8} {"step": 18084, "train_loss": 3.3705170154571533, "lr": 0.0001759015670557406, "tps": 35216, "wall": 33655.4} {"step": 18085, "train_loss": 3.178288459777832, "lr": 0.00017588299314053783, "tps": 35212, "wall": 33661.0} {"step": 18086, "train_loss": 3.2807693481445312, "lr": 0.0001758644197250949, "tps": 35208, "wall": 33666.6} {"step": 18087, "train_loss": 3.241391897201538, "lr": 0.0001758458468096222, "tps": 35204, "wall": 33672.2} {"step": 18088, "train_loss": 3.2969322204589844, "lr": 0.0001758272743943301, "tps": 35200, "wall": 33677.8} {"step": 18089, "train_loss": 3.387061834335327, "lr": 0.00017580870247942905, "tps": 35196, "wall": 33683.3} {"step": 18090, "train_loss": 3.2932651042938232, "lr": 0.00017579013106512945, "tps": 35192, "wall": 33688.9} {"step": 18091, "train_loss": 3.327665090560913, "lr": 0.0001757715601516416, "tps": 35189, "wall": 33694.5} {"step": 18092, "train_loss": 3.3894553184509277, "lr": 0.00017575298973917586, "tps": 35185, "wall": 33700.1} {"step": 18093, "train_loss": 3.335697889328003, "lr": 0.00017573441982794274, "tps": 35181, "wall": 33705.7} {"step": 18094, "train_loss": 3.3463237285614014, "lr": 0.00017571585041815246, "tps": 35177, "wall": 33711.3} {"step": 18095, "train_loss": 3.2839043140411377, "lr": 0.00017569728151001543, "tps": 35173, "wall": 33717.0} {"step": 18096, "train_loss": 3.3770532608032227, "lr": 0.00017567871310374198, "tps": 35169, "wall": 33722.6} {"step": 18097, "train_loss": 3.4041571617126465, "lr": 0.0001756601451995425, "tps": 35165, "wall": 33728.1} {"step": 18098, "train_loss": 3.302070140838623, "lr": 0.00017564157779762724, "tps": 35161, "wall": 33733.8} {"step": 18099, "train_loss": 3.3134827613830566, "lr": 0.0001756230108982066, "tps": 35157, "wall": 33739.4} {"step": 18100, "train_loss": 3.218252658843994, "lr": 0.00017560444450149095, "tps": 35153, "wall": 33745.0} {"step": 18101, "train_loss": 3.2924089431762695, "lr": 0.0001755858786076905, "tps": 35150, "wall": 33750.5} {"step": 18102, "train_loss": 3.3229494094848633, "lr": 0.00017556731321701565, "tps": 35146, "wall": 33756.2} {"step": 18103, "train_loss": 3.3471877574920654, "lr": 0.00017554874832967666, "tps": 35142, "wall": 33761.7} {"step": 18104, "train_loss": 3.2818522453308105, "lr": 0.00017553018394588388, "tps": 35138, "wall": 33767.2} {"step": 18105, "train_loss": 3.4030613899230957, "lr": 0.00017551162006584754, "tps": 35134, "wall": 33772.8} {"step": 18106, "train_loss": 3.274329662322998, "lr": 0.000175493056689778, "tps": 35130, "wall": 33778.4} {"step": 18107, "train_loss": 3.422163486480713, "lr": 0.00017547449381788552, "tps": 35126, "wall": 33783.9} {"step": 18108, "train_loss": 3.3423399925231934, "lr": 0.00017545593145038035, "tps": 35123, "wall": 33789.6} {"step": 18109, "train_loss": 3.203655242919922, "lr": 0.00017543736958747284, "tps": 35119, "wall": 33795.2} {"step": 18110, "train_loss": 3.271188259124756, "lr": 0.00017541880822937323, "tps": 35115, "wall": 33800.7} {"step": 18111, "train_loss": 3.320460557937622, "lr": 0.00017540024737629171, "tps": 35111, "wall": 33806.4} {"step": 18112, "train_loss": 3.401315212249756, "lr": 0.00017538168702843865, "tps": 35107, "wall": 33812.0} {"step": 18113, "train_loss": 3.1896815299987793, "lr": 0.00017536312718602427, "tps": 35103, "wall": 33817.6} {"step": 18114, "train_loss": 3.2947375774383545, "lr": 0.00017534456784925876, "tps": 35099, "wall": 33823.1} {"step": 18115, "train_loss": 3.3146772384643555, "lr": 0.0001753260090183524, "tps": 35095, "wall": 33828.7} {"step": 18116, "train_loss": 3.3377182483673096, "lr": 0.00017530745069351542, "tps": 35092, "wall": 33834.3} {"step": 18117, "train_loss": 3.359889030456543, "lr": 0.00017528889287495814, "tps": 35088, "wall": 33839.8} {"step": 18118, "train_loss": 3.224485158920288, "lr": 0.0001752703355628906, "tps": 35084, "wall": 33845.4} {"step": 18119, "train_loss": 3.266143560409546, "lr": 0.00017525177875752314, "tps": 35080, "wall": 33851.0} {"step": 18120, "train_loss": 3.2339653968811035, "lr": 0.00017523322245906604, "tps": 35076, "wall": 33856.6} {"step": 18121, "train_loss": 3.4452321529388428, "lr": 0.00017521466666772933, "tps": 35072, "wall": 33862.2} {"step": 18122, "train_loss": 3.391068458557129, "lr": 0.0001751961113837233, "tps": 35068, "wall": 33867.8} {"step": 18123, "train_loss": 3.2526583671569824, "lr": 0.00017517755660725816, "tps": 35065, "wall": 33873.4} {"step": 18124, "train_loss": 3.3059136867523193, "lr": 0.0001751590023385441, "tps": 35061, "wall": 33878.9} {"step": 18125, "train_loss": 3.331662654876709, "lr": 0.0001751404485777913, "tps": 35057, "wall": 33884.4} {"step": 18126, "train_loss": 3.336276054382324, "lr": 0.00017512189532520984, "tps": 35053, "wall": 33890.0} {"step": 18127, "train_loss": 3.227879285812378, "lr": 0.00017510334258101008, "tps": 35049, "wall": 33895.6} {"step": 18128, "train_loss": 3.176924467086792, "lr": 0.000175084790345402, "tps": 35046, "wall": 33901.1} {"step": 18129, "train_loss": 3.3299267292022705, "lr": 0.0001750662386185959, "tps": 35042, "wall": 33906.7} {"step": 18130, "train_loss": 3.40669322013855, "lr": 0.00017504768740080184, "tps": 35038, "wall": 33912.3} {"step": 18131, "train_loss": 3.3286290168762207, "lr": 0.00017502913669223, "tps": 35034, "wall": 33917.8} {"step": 18132, "train_loss": 3.4339241981506348, "lr": 0.0001750105864930906, "tps": 35030, "wall": 33923.4} {"step": 18133, "train_loss": 3.2838404178619385, "lr": 0.00017499203680359363, "tps": 35027, "wall": 33928.9} {"step": 18134, "train_loss": 3.2424936294555664, "lr": 0.00017497348762394936, "tps": 35023, "wall": 33934.5} {"step": 18135, "train_loss": 3.3162240982055664, "lr": 0.00017495493895436788, "tps": 35019, "wall": 33940.1} {"step": 18136, "train_loss": 3.2638955116271973, "lr": 0.00017493639079505923, "tps": 35015, "wall": 33945.7} {"step": 18137, "train_loss": 3.2060093879699707, "lr": 0.0001749178431462336, "tps": 35011, "wall": 33951.2} {"step": 18138, "train_loss": 3.286386251449585, "lr": 0.00017489929600810112, "tps": 35007, "wall": 33956.8} {"step": 18139, "train_loss": 3.355283260345459, "lr": 0.0001748807493808718, "tps": 35004, "wall": 33962.3} {"step": 18140, "train_loss": 3.2803544998168945, "lr": 0.00017486220326475577, "tps": 35000, "wall": 33967.8} {"step": 18141, "train_loss": 3.226062774658203, "lr": 0.0001748436576599632, "tps": 34996, "wall": 33973.4} {"step": 18142, "train_loss": 3.296046733856201, "lr": 0.00017482511256670412, "tps": 34992, "wall": 33979.0} {"step": 18143, "train_loss": 3.2700746059417725, "lr": 0.0001748065679851886, "tps": 34988, "wall": 33984.6} {"step": 18144, "train_loss": 3.2676022052764893, "lr": 0.00017478802391562666, "tps": 34985, "wall": 33990.1} {"step": 18145, "train_loss": 3.307661294937134, "lr": 0.00017476948035822853, "tps": 34981, "wall": 33995.8} {"step": 18146, "train_loss": 3.3551228046417236, "lr": 0.0001747509373132041, "tps": 34977, "wall": 34001.3} {"step": 18147, "train_loss": 3.2459161281585693, "lr": 0.00017473239478076353, "tps": 34973, "wall": 34006.9} {"step": 18148, "train_loss": 3.391061305999756, "lr": 0.00017471385276111683, "tps": 34969, "wall": 34012.4} {"step": 18149, "train_loss": 3.23262619972229, "lr": 0.00017469531125447407, "tps": 34966, "wall": 34018.0} {"step": 18150, "train_loss": 3.2843856811523438, "lr": 0.0001746767702610453, "tps": 34962, "wall": 34023.5} {"step": 18151, "train_loss": 3.170712947845459, "lr": 0.0001746582297810405, "tps": 34958, "wall": 34029.0} {"step": 18152, "train_loss": 3.3634543418884277, "lr": 0.0001746396898146697, "tps": 34954, "wall": 34034.5} {"step": 18153, "train_loss": 3.270345687866211, "lr": 0.00017462115036214298, "tps": 34951, "wall": 34040.1} {"step": 18154, "train_loss": 3.2368977069854736, "lr": 0.00017460261142367029, "tps": 34947, "wall": 34045.6} {"step": 18155, "train_loss": 3.334301471710205, "lr": 0.00017458407299946176, "tps": 34943, "wall": 34051.2} {"step": 18156, "train_loss": 3.3245699405670166, "lr": 0.00017456553508972723, "tps": 34939, "wall": 34056.7} {"step": 18157, "train_loss": 3.314213752746582, "lr": 0.0001745469976946768, "tps": 34936, "wall": 34062.3} {"step": 18158, "train_loss": 3.383495807647705, "lr": 0.00017452846081452038, "tps": 34932, "wall": 34067.9} {"step": 18159, "train_loss": 3.2381129264831543, "lr": 0.0001745099244494681, "tps": 34928, "wall": 34073.4} {"step": 18160, "train_loss": 3.3723788261413574, "lr": 0.00017449138859972982, "tps": 34924, "wall": 34078.9} {"step": 18161, "train_loss": 3.308727741241455, "lr": 0.00017447285326551554, "tps": 34921, "wall": 34084.5} {"step": 18162, "train_loss": 3.3240644931793213, "lr": 0.0001744543184470353, "tps": 34917, "wall": 34090.0} {"step": 18163, "train_loss": 3.245957851409912, "lr": 0.00017443578414449897, "tps": 34913, "wall": 34095.5} {"step": 18164, "train_loss": 3.2340211868286133, "lr": 0.00017441725035811652, "tps": 34909, "wall": 34101.0} {"step": 18165, "train_loss": 3.289949417114258, "lr": 0.00017439871708809797, "tps": 34906, "wall": 34106.6} {"step": 18166, "train_loss": 3.290156364440918, "lr": 0.00017438018433465317, "tps": 34902, "wall": 34112.3} {"step": 18167, "train_loss": 3.2718124389648438, "lr": 0.00017436165209799208, "tps": 34898, "wall": 34117.8} {"step": 18168, "train_loss": 3.376845121383667, "lr": 0.00017434312037832475, "tps": 34894, "wall": 34123.3} {"step": 18169, "train_loss": 3.303300380706787, "lr": 0.00017432458917586102, "tps": 34890, "wall": 34128.9} {"step": 18170, "train_loss": 3.208824634552002, "lr": 0.0001743060584908107, "tps": 34887, "wall": 34134.4} {"step": 18171, "train_loss": 3.3626084327697754, "lr": 0.00017428752832338392, "tps": 34883, "wall": 34139.9} {"step": 18172, "train_loss": 3.24410343170166, "lr": 0.00017426899867379052, "tps": 34879, "wall": 34145.4} {"step": 18173, "train_loss": 3.3070127964019775, "lr": 0.0001742504695422403, "tps": 34876, "wall": 34151.0} {"step": 18174, "train_loss": 3.285130739212036, "lr": 0.00017423194092894327, "tps": 34872, "wall": 34156.5} {"step": 18175, "train_loss": 3.294466972351074, "lr": 0.0001742134128341093, "tps": 34868, "wall": 34162.0} {"step": 18176, "train_loss": 3.3308162689208984, "lr": 0.0001741948852579483, "tps": 34864, "wall": 34167.5} {"step": 18177, "train_loss": 3.3479275703430176, "lr": 0.00017417635820067, "tps": 34861, "wall": 34173.2} {"step": 18178, "train_loss": 3.293458938598633, "lr": 0.00017415783166248446, "tps": 34857, "wall": 34178.8} {"step": 18179, "train_loss": 3.302016258239746, "lr": 0.00017413930564360154, "tps": 34853, "wall": 34184.3} {"step": 18180, "train_loss": 3.382131576538086, "lr": 0.00017412078014423097, "tps": 34849, "wall": 34189.9} {"step": 18181, "train_loss": 3.3317885398864746, "lr": 0.0001741022551645827, "tps": 34846, "wall": 34195.4} {"step": 18182, "train_loss": 3.2673702239990234, "lr": 0.0001740837307048666, "tps": 34842, "wall": 34201.0} {"step": 18183, "train_loss": 3.342672348022461, "lr": 0.00017406520676529246, "tps": 34838, "wall": 34206.5} {"step": 18184, "train_loss": 3.193946123123169, "lr": 0.00017404668334607015, "tps": 34834, "wall": 34212.0} {"step": 18185, "train_loss": 3.2947049140930176, "lr": 0.00017402816044740944, "tps": 34831, "wall": 34217.5} {"step": 18186, "train_loss": 3.3150577545166016, "lr": 0.0001740096380695203, "tps": 34827, "wall": 34223.0} {"step": 18187, "train_loss": 3.2921996116638184, "lr": 0.0001739911162126124, "tps": 34823, "wall": 34228.5} {"step": 18188, "train_loss": 3.368511199951172, "lr": 0.00017397259487689568, "tps": 34819, "wall": 34234.2} {"step": 18189, "train_loss": 3.4068989753723145, "lr": 0.0001739540740625799, "tps": 34816, "wall": 34239.7} {"step": 18190, "train_loss": 3.3805465698242188, "lr": 0.0001739355537698748, "tps": 34812, "wall": 34245.3} {"step": 18191, "train_loss": 3.2816529273986816, "lr": 0.00017391703399899028, "tps": 34808, "wall": 34250.8} {"step": 18192, "train_loss": 3.3669166564941406, "lr": 0.0001738985147501361, "tps": 34805, "wall": 34256.4} {"step": 18193, "train_loss": 3.2678210735321045, "lr": 0.000173879996023522, "tps": 34801, "wall": 34261.9} {"step": 18194, "train_loss": 3.2528624534606934, "lr": 0.00017386147781935782, "tps": 34797, "wall": 34267.3} {"step": 18195, "train_loss": 3.3065452575683594, "lr": 0.0001738429601378533, "tps": 34794, "wall": 34272.8} {"step": 18196, "train_loss": 3.3205652236938477, "lr": 0.00017382444297921827, "tps": 34790, "wall": 34278.4} {"step": 18197, "train_loss": 3.308495044708252, "lr": 0.0001738059263436624, "tps": 34786, "wall": 34283.9} {"step": 18198, "train_loss": 3.3350090980529785, "lr": 0.0001737874102313955, "tps": 34782, "wall": 34289.5} {"step": 18199, "train_loss": 3.3370184898376465, "lr": 0.00017376889464262738, "tps": 34779, "wall": 34295.2} {"step": 18200, "train_loss": 3.4199507236480713, "lr": 0.00017375037957756764, "tps": 34775, "wall": 34300.7} {"step": 18201, "train_loss": 3.3441052436828613, "lr": 0.00017373186503642614, "tps": 34771, "wall": 34306.2} {"step": 18202, "train_loss": 3.286381244659424, "lr": 0.00017371335101941257, "tps": 34767, "wall": 34311.8} {"step": 18203, "train_loss": 3.224344491958618, "lr": 0.00017369483752673666, "tps": 34764, "wall": 34317.3} {"step": 18204, "train_loss": 3.3694167137145996, "lr": 0.00017367632455860812, "tps": 34760, "wall": 34322.9} {"step": 18205, "train_loss": 3.3506808280944824, "lr": 0.0001736578121152367, "tps": 34756, "wall": 34328.3} {"step": 18206, "train_loss": 3.3114681243896484, "lr": 0.0001736393001968321, "tps": 34753, "wall": 34333.9} {"step": 18207, "train_loss": 3.292949676513672, "lr": 0.000173620788803604, "tps": 34749, "wall": 34339.4} {"step": 18208, "train_loss": 3.2052533626556396, "lr": 0.00017360227793576213, "tps": 34745, "wall": 34344.9} {"step": 18209, "train_loss": 3.353775978088379, "lr": 0.00017358376759351617, "tps": 34742, "wall": 34350.4} {"step": 18210, "train_loss": 3.3817262649536133, "lr": 0.0001735652577770758, "tps": 34738, "wall": 34356.0} {"step": 18211, "train_loss": 3.3290903568267822, "lr": 0.00017354674848665068, "tps": 34734, "wall": 34361.4} {"step": 18212, "train_loss": 3.299384593963623, "lr": 0.00017352823972245052, "tps": 34731, "wall": 34366.9} {"step": 18213, "train_loss": 3.320136785507202, "lr": 0.00017350973148468497, "tps": 34727, "wall": 34372.5} {"step": 18214, "train_loss": 3.308607578277588, "lr": 0.0001734912237735637, "tps": 34723, "wall": 34378.0} {"step": 18215, "train_loss": 3.258418083190918, "lr": 0.00017347271658929635, "tps": 34720, "wall": 34383.5} {"step": 18216, "train_loss": 3.3956239223480225, "lr": 0.00017345420993209265, "tps": 34716, "wall": 34389.0} {"step": 18217, "train_loss": 3.3637046813964844, "lr": 0.0001734357038021621, "tps": 34712, "wall": 34394.5} {"step": 18218, "train_loss": 3.247368812561035, "lr": 0.00017341719819971444, "tps": 34709, "wall": 34400.0} {"step": 18219, "train_loss": 3.3359529972076416, "lr": 0.0001733986931249593, "tps": 34705, "wall": 34405.5} {"step": 18220, "train_loss": 3.3221113681793213, "lr": 0.00017338018857810625, "tps": 34701, "wall": 34411.1} {"step": 18221, "train_loss": 3.2928590774536133, "lr": 0.00017336168455936495, "tps": 34698, "wall": 34416.7} {"step": 18222, "train_loss": 3.358996629714966, "lr": 0.00017334318106894503, "tps": 34694, "wall": 34422.1} {"step": 18223, "train_loss": 3.2669804096221924, "lr": 0.00017332467810705606, "tps": 34690, "wall": 34427.6} {"step": 18224, "train_loss": 3.339211940765381, "lr": 0.0001733061756739077, "tps": 34687, "wall": 34433.1} {"step": 18225, "train_loss": 3.298675060272217, "lr": 0.00017328767376970948, "tps": 34683, "wall": 34438.6} {"step": 18226, "train_loss": 3.2577569484710693, "lr": 0.00017326917239467103, "tps": 34680, "wall": 34444.1} {"step": 18227, "train_loss": 3.275155544281006, "lr": 0.00017325067154900188, "tps": 34676, "wall": 34449.6} {"step": 18228, "train_loss": 3.3406667709350586, "lr": 0.0001732321712329117, "tps": 34672, "wall": 34455.1} {"step": 18229, "train_loss": 3.24838924407959, "lr": 0.00017321367144660998, "tps": 34669, "wall": 34460.6} {"step": 18230, "train_loss": 3.3791561126708984, "lr": 0.00017319517219030638, "tps": 34665, "wall": 34466.1} {"step": 18231, "train_loss": 3.295015335083008, "lr": 0.00017317667346421033, "tps": 34661, "wall": 34471.7} {"step": 18232, "train_loss": 3.2664613723754883, "lr": 0.00017315817526853148, "tps": 34658, "wall": 34477.2} {"step": 18233, "train_loss": 3.316331386566162, "lr": 0.0001731396776034794, "tps": 34654, "wall": 34482.7} {"step": 18234, "train_loss": 3.2177891731262207, "lr": 0.0001731211804692635, "tps": 34650, "wall": 34488.2} {"step": 18235, "train_loss": 3.3411831855773926, "lr": 0.00017310268386609346, "tps": 34647, "wall": 34493.7} {"step": 18236, "train_loss": 3.400786876678467, "lr": 0.00017308418779417875, "tps": 34643, "wall": 34499.2} {"step": 18237, "train_loss": 3.204880714416504, "lr": 0.00017306569225372892, "tps": 34640, "wall": 34504.7} {"step": 18238, "train_loss": 3.2668581008911133, "lr": 0.0001730471972449534, "tps": 34636, "wall": 34510.2} {"step": 18239, "train_loss": 3.2138428688049316, "lr": 0.0001730287027680618, "tps": 34632, "wall": 34515.7} {"step": 18240, "train_loss": 3.3228583335876465, "lr": 0.00017301020882326364, "tps": 34629, "wall": 34521.1} {"step": 18241, "train_loss": 3.3699264526367188, "lr": 0.0001729917154107683, "tps": 34625, "wall": 34526.6} {"step": 18242, "train_loss": 3.3198649883270264, "lr": 0.0001729732225307854, "tps": 34621, "wall": 34532.3} {"step": 18243, "train_loss": 3.330003261566162, "lr": 0.00017295473018352441, "tps": 34618, "wall": 34537.7} {"step": 18244, "train_loss": 3.204507350921631, "lr": 0.00017293623836919472, "tps": 34614, "wall": 34543.2} {"step": 18245, "train_loss": 3.4114015102386475, "lr": 0.0001729177470880059, "tps": 34611, "wall": 34548.8} {"step": 18246, "train_loss": 3.4008960723876953, "lr": 0.00017289925634016742, "tps": 34607, "wall": 34554.3} {"step": 18247, "train_loss": 3.3548030853271484, "lr": 0.00017288076612588865, "tps": 34603, "wall": 34559.8} {"step": 18248, "train_loss": 3.3445816040039062, "lr": 0.00017286227644537915, "tps": 34600, "wall": 34565.3} {"step": 18249, "train_loss": 3.2832655906677246, "lr": 0.0001728437872988483, "tps": 34596, "wall": 34570.8} {"step": 18250, "train_loss": 3.24932861328125, "lr": 0.00017282529868650558, "tps": 34593, "wall": 34576.2} {"step": 18251, "train_loss": 3.249906539916992, "lr": 0.00017280681060856048, "tps": 34589, "wall": 34581.7} {"step": 18252, "train_loss": 3.382761001586914, "lr": 0.00017278832306522233, "tps": 34585, "wall": 34587.2} {"step": 18253, "train_loss": 3.300360679626465, "lr": 0.00017276983605670068, "tps": 34582, "wall": 34592.9} {"step": 18254, "train_loss": 3.3866729736328125, "lr": 0.0001727513495832048, "tps": 34578, "wall": 34598.4} {"step": 18255, "train_loss": 3.363593101501465, "lr": 0.00017273286364494417, "tps": 34574, "wall": 34603.9} {"step": 18256, "train_loss": 3.26888108253479, "lr": 0.0001727143782421283, "tps": 34571, "wall": 34609.4} {"step": 18257, "train_loss": 3.458411693572998, "lr": 0.0001726958933749665, "tps": 34567, "wall": 34614.8} {"step": 18258, "train_loss": 3.183320999145508, "lr": 0.00017267740904366812, "tps": 34564, "wall": 34620.3} {"step": 18259, "train_loss": 3.3006386756896973, "lr": 0.00017265892524844265, "tps": 34560, "wall": 34625.8} {"step": 18260, "train_loss": 3.3390767574310303, "lr": 0.00017264044198949944, "tps": 34556, "wall": 34631.3} {"step": 18261, "train_loss": 3.292001247406006, "lr": 0.00017262195926704785, "tps": 34553, "wall": 34636.7} {"step": 18262, "train_loss": 3.3931217193603516, "lr": 0.0001726034770812973, "tps": 34549, "wall": 34642.2} {"step": 18263, "train_loss": 3.3920843601226807, "lr": 0.00017258499543245712, "tps": 34546, "wall": 34647.7} {"step": 18264, "train_loss": 3.290618896484375, "lr": 0.00017256651432073664, "tps": 34542, "wall": 34653.3} {"step": 18265, "train_loss": 3.2606468200683594, "lr": 0.00017254803374634525, "tps": 34539, "wall": 34658.8} {"step": 18266, "train_loss": 3.312070608139038, "lr": 0.00017252955370949233, "tps": 34535, "wall": 34664.3} {"step": 18267, "train_loss": 3.2379581928253174, "lr": 0.00017251107421038716, "tps": 34531, "wall": 34669.8} {"step": 18268, "train_loss": 3.2399368286132812, "lr": 0.00017249259524923914, "tps": 34528, "wall": 34675.2} {"step": 18269, "train_loss": 3.3151631355285645, "lr": 0.0001724741168262576, "tps": 34524, "wall": 34680.7} {"step": 18270, "train_loss": 3.311277389526367, "lr": 0.0001724556389416518, "tps": 34521, "wall": 34686.2} {"step": 18271, "train_loss": 3.3301830291748047, "lr": 0.0001724371615956311, "tps": 34517, "wall": 34691.6} {"step": 18272, "train_loss": 3.3165907859802246, "lr": 0.0001724186847884048, "tps": 34514, "wall": 34697.1} {"step": 18273, "train_loss": 3.3278284072875977, "lr": 0.0001724002085201822, "tps": 34510, "wall": 34702.6} {"step": 18274, "train_loss": 3.335273027420044, "lr": 0.00017238173279117262, "tps": 34506, "wall": 34708.1} {"step": 18275, "train_loss": 3.303813934326172, "lr": 0.00017236325760158536, "tps": 34503, "wall": 34713.6} {"step": 18276, "train_loss": 3.3319995403289795, "lr": 0.0001723447829516297, "tps": 34499, "wall": 34719.0} {"step": 18277, "train_loss": 3.36191463470459, "lr": 0.00017232630884151493, "tps": 34496, "wall": 34724.6} {"step": 18278, "train_loss": 3.2964835166931152, "lr": 0.00017230783527145027, "tps": 34492, "wall": 34730.0} {"step": 18279, "train_loss": 3.202000617980957, "lr": 0.00017228936224164505, "tps": 34489, "wall": 34735.5} {"step": 18280, "train_loss": 3.3282923698425293, "lr": 0.00017227088975230856, "tps": 34485, "wall": 34741.0} {"step": 18281, "train_loss": 3.3257837295532227, "lr": 0.00017225241780364993, "tps": 34482, "wall": 34746.5} {"step": 18282, "train_loss": 3.356765031814575, "lr": 0.00017223394639587856, "tps": 34478, "wall": 34752.0} {"step": 18283, "train_loss": 3.2242469787597656, "lr": 0.00017221547552920358, "tps": 34474, "wall": 34757.4} {"step": 18284, "train_loss": 3.2882254123687744, "lr": 0.00017219700520383432, "tps": 34471, "wall": 34762.9} {"step": 18285, "train_loss": 3.301478624343872, "lr": 0.00017217853541997994, "tps": 34467, "wall": 34768.4} {"step": 18286, "train_loss": 3.333573579788208, "lr": 0.0001721600661778497, "tps": 34464, "wall": 34774.0} {"step": 18287, "train_loss": 3.2949204444885254, "lr": 0.0001721415974776529, "tps": 34460, "wall": 34779.5} {"step": 18288, "train_loss": 3.32645320892334, "lr": 0.00017212312931959853, "tps": 34457, "wall": 34785.0} {"step": 18289, "train_loss": 3.302039623260498, "lr": 0.00017210466170389612, "tps": 34453, "wall": 34790.5} {"step": 18290, "train_loss": 3.2567758560180664, "lr": 0.00017208619463075455, "tps": 34449, "wall": 34796.0} {"step": 18291, "train_loss": 3.2526090145111084, "lr": 0.0001720677281003832, "tps": 34446, "wall": 34801.5} {"step": 18292, "train_loss": 3.3369617462158203, "lr": 0.00017204926211299122, "tps": 34442, "wall": 34807.0} {"step": 18293, "train_loss": 3.399101972579956, "lr": 0.0001720307966687878, "tps": 34439, "wall": 34812.4} {"step": 18294, "train_loss": 3.4271914958953857, "lr": 0.00017201233176798207, "tps": 34435, "wall": 34818.0} {"step": 18295, "train_loss": 3.2259483337402344, "lr": 0.00017199386741078332, "tps": 34432, "wall": 34823.5} {"step": 18296, "train_loss": 3.3140716552734375, "lr": 0.00017197540359740056, "tps": 34428, "wall": 34829.0} {"step": 18297, "train_loss": 3.3583242893218994, "lr": 0.00017195694032804304, "tps": 34424, "wall": 34834.5} {"step": 18298, "train_loss": 3.276942491531372, "lr": 0.0001719384776029199, "tps": 34421, "wall": 34840.0} {"step": 18299, "train_loss": 3.20481014251709, "lr": 0.00017192001542224036, "tps": 34417, "wall": 34845.5} {"step": 18300, "train_loss": 3.3362021446228027, "lr": 0.00017190155378621339, "tps": 34414, "wall": 34851.0} {"step": 18301, "train_loss": 3.295285701751709, "lr": 0.00017188309269504829, "tps": 34410, "wall": 34856.5} {"step": 18302, "train_loss": 3.2638094425201416, "lr": 0.0001718646321489541, "tps": 34407, "wall": 34862.0} {"step": 18303, "train_loss": 3.2786896228790283, "lr": 0.00017184617214813992, "tps": 34403, "wall": 34867.4} {"step": 18304, "train_loss": 3.2428319454193115, "lr": 0.0001718277126928149, "tps": 34400, "wall": 34873.0} {"step": 18305, "train_loss": 3.2320189476013184, "lr": 0.0001718092537831882, "tps": 34396, "wall": 34878.5} {"step": 18306, "train_loss": 3.2488088607788086, "lr": 0.0001717907954194689, "tps": 34393, "wall": 34884.0} {"step": 18307, "train_loss": 3.3199825286865234, "lr": 0.00017177233760186603, "tps": 34389, "wall": 34889.4} {"step": 18308, "train_loss": 3.4008820056915283, "lr": 0.00017175388033058875, "tps": 34385, "wall": 34895.0} {"step": 18309, "train_loss": 3.303903579711914, "lr": 0.0001717354236058461, "tps": 34382, "wall": 34900.5} {"step": 18310, "train_loss": 3.259772539138794, "lr": 0.00017171696742784723, "tps": 34378, "wall": 34906.0} {"step": 18311, "train_loss": 3.1758642196655273, "lr": 0.00017169851179680111, "tps": 34375, "wall": 34911.5} {"step": 18312, "train_loss": 3.3955471515655518, "lr": 0.00017168005671291692, "tps": 34371, "wall": 34917.0} {"step": 18313, "train_loss": 3.2641937732696533, "lr": 0.0001716616021764036, "tps": 34368, "wall": 34922.5} {"step": 18314, "train_loss": 3.3363335132598877, "lr": 0.0001716431481874703, "tps": 34364, "wall": 34927.9} {"step": 18315, "train_loss": 3.191500663757324, "lr": 0.00017162469474632608, "tps": 34361, "wall": 34933.4} {"step": 18316, "train_loss": 3.284203052520752, "lr": 0.00017160624185317985, "tps": 34357, "wall": 34938.9} {"step": 18317, "train_loss": 3.2413511276245117, "lr": 0.00017158778950824078, "tps": 34354, "wall": 34944.4} {"step": 18318, "train_loss": 3.414473533630371, "lr": 0.0001715693377117178, "tps": 34350, "wall": 34949.9} {"step": 18319, "train_loss": 3.2581262588500977, "lr": 0.00017155088646382004, "tps": 34347, "wall": 34955.5} {"step": 18320, "train_loss": 3.3061466217041016, "lr": 0.00017153243576475643, "tps": 34343, "wall": 34961.0} {"step": 18321, "train_loss": 3.3386902809143066, "lr": 0.00017151398561473605, "tps": 34340, "wall": 34966.4} {"step": 18322, "train_loss": 3.294386386871338, "lr": 0.00017149553601396783, "tps": 34336, "wall": 34972.0} {"step": 18323, "train_loss": 3.3625385761260986, "lr": 0.00017147708696266077, "tps": 34333, "wall": 34977.5} {"step": 18324, "train_loss": 3.2947609424591064, "lr": 0.00017145863846102392, "tps": 34329, "wall": 34983.0} {"step": 18325, "train_loss": 3.248469829559326, "lr": 0.00017144019050926624, "tps": 34325, "wall": 34988.5} {"step": 18326, "train_loss": 3.253847122192383, "lr": 0.00017142174310759675, "tps": 34322, "wall": 34993.9} {"step": 18327, "train_loss": 3.219245195388794, "lr": 0.00017140329625622434, "tps": 34318, "wall": 34999.4} {"step": 18328, "train_loss": 3.344221591949463, "lr": 0.000171384849955358, "tps": 34315, "wall": 35004.9} {"step": 18329, "train_loss": 3.2940139770507812, "lr": 0.00017136640420520677, "tps": 34311, "wall": 35010.4} {"step": 18330, "train_loss": 3.2666091918945312, "lr": 0.0001713479590059795, "tps": 34308, "wall": 35016.0} {"step": 18331, "train_loss": 3.4074172973632812, "lr": 0.0001713295143578852, "tps": 34304, "wall": 35021.5} {"step": 18332, "train_loss": 3.3407928943634033, "lr": 0.00017131107026113277, "tps": 34301, "wall": 35027.0} {"step": 18333, "train_loss": 3.265237808227539, "lr": 0.0001712926267159312, "tps": 34297, "wall": 35032.5} {"step": 18334, "train_loss": 3.359034299850464, "lr": 0.00017127418372248938, "tps": 34294, "wall": 35038.0} {"step": 18335, "train_loss": 3.219836711883545, "lr": 0.0001712557412810162, "tps": 34290, "wall": 35043.5} {"step": 18336, "train_loss": 3.332345485687256, "lr": 0.0001712372993917207, "tps": 34287, "wall": 35049.0} {"step": 18337, "train_loss": 3.264024496078491, "lr": 0.00017121885805481166, "tps": 34283, "wall": 35054.5} {"step": 18338, "train_loss": 3.2475080490112305, "lr": 0.00017120041727049804, "tps": 34280, "wall": 35060.0} {"step": 18339, "train_loss": 3.490668773651123, "lr": 0.00017118197703898876, "tps": 34276, "wall": 35065.4} {"step": 18340, "train_loss": 3.395756244659424, "lr": 0.00017116353736049264, "tps": 34273, "wall": 35070.9} {"step": 18341, "train_loss": 3.314272165298462, "lr": 0.0001711450982352186, "tps": 34269, "wall": 35076.4} {"step": 18342, "train_loss": 3.280367851257324, "lr": 0.0001711266596633756, "tps": 34266, "wall": 35081.9} {"step": 18343, "train_loss": 3.213721752166748, "lr": 0.00017110822164517243, "tps": 34262, "wall": 35087.3} {"step": 18344, "train_loss": 3.3790712356567383, "lr": 0.00017108978418081794, "tps": 34259, "wall": 35092.8} {"step": 18345, "train_loss": 3.251997947692871, "lr": 0.00017107134727052098, "tps": 34255, "wall": 35098.2} {"step": 18346, "train_loss": 3.2832088470458984, "lr": 0.00017105291091449053, "tps": 34252, "wall": 35103.7} {"step": 18347, "train_loss": 3.340398073196411, "lr": 0.0001710344751129353, "tps": 34249, "wall": 35109.1} {"step": 18348, "train_loss": 3.2273030281066895, "lr": 0.00017101603986606422, "tps": 34245, "wall": 35114.6} {"step": 18349, "train_loss": 3.2650184631347656, "lr": 0.00017099760517408607, "tps": 34242, "wall": 35120.1} {"step": 18350, "train_loss": 3.260772228240967, "lr": 0.00017097917103720968, "tps": 34238, "wall": 35125.6} {"step": 18351, "train_loss": 3.2289047241210938, "lr": 0.00017096073745564394, "tps": 34235, "wall": 35131.1} {"step": 18352, "train_loss": 3.332343578338623, "lr": 0.0001709423044295976, "tps": 34231, "wall": 35136.6} {"step": 18353, "train_loss": 3.2738430500030518, "lr": 0.00017092387195927948, "tps": 34228, "wall": 35142.1} {"step": 18354, "train_loss": 3.328486680984497, "lr": 0.0001709054400448984, "tps": 34224, "wall": 35147.6} {"step": 18355, "train_loss": 3.3333213329315186, "lr": 0.0001708870086866631, "tps": 34221, "wall": 35153.1} {"step": 18356, "train_loss": 3.333066940307617, "lr": 0.0001708685778847825, "tps": 34217, "wall": 35158.5} {"step": 18357, "train_loss": 3.3353285789489746, "lr": 0.00017085014763946527, "tps": 34214, "wall": 35164.0} {"step": 18358, "train_loss": 3.2973759174346924, "lr": 0.00017083171795092024, "tps": 34210, "wall": 35169.5} {"step": 18359, "train_loss": 3.207852602005005, "lr": 0.0001708132888193562, "tps": 34207, "wall": 35175.0} {"step": 18360, "train_loss": 3.2665884494781494, "lr": 0.00017079486024498182, "tps": 34203, "wall": 35180.5} {"step": 18361, "train_loss": 3.3361735343933105, "lr": 0.00017077643222800597, "tps": 34200, "wall": 35185.9} {"step": 18362, "train_loss": 3.3765273094177246, "lr": 0.00017075800476863733, "tps": 34196, "wall": 35191.5} {"step": 18363, "train_loss": 3.301906108856201, "lr": 0.0001707395778670847, "tps": 34193, "wall": 35196.9} {"step": 18364, "train_loss": 3.321913719177246, "lr": 0.00017072115152355676, "tps": 34189, "wall": 35202.4} {"step": 18365, "train_loss": 3.28365159034729, "lr": 0.0001707027257382623, "tps": 34186, "wall": 35207.9} {"step": 18366, "train_loss": 3.338723659515381, "lr": 0.00017068430051141005, "tps": 34182, "wall": 35213.5} {"step": 18367, "train_loss": 3.2630388736724854, "lr": 0.0001706658758432087, "tps": 34179, "wall": 35219.0} {"step": 18368, "train_loss": 3.220872163772583, "lr": 0.00017064745173386693, "tps": 34176, "wall": 35224.4} {"step": 18369, "train_loss": 3.303575038909912, "lr": 0.0001706290281835936, "tps": 34172, "wall": 35229.8} {"step": 18370, "train_loss": 3.279275894165039, "lr": 0.00017061060519259723, "tps": 34169, "wall": 35235.3} {"step": 18371, "train_loss": 3.285712480545044, "lr": 0.00017059218276108663, "tps": 34165, "wall": 35240.7} {"step": 18372, "train_loss": 3.268820285797119, "lr": 0.00017057376088927044, "tps": 34162, "wall": 35246.2} {"step": 18373, "train_loss": 3.203049898147583, "lr": 0.00017055533957735736, "tps": 34158, "wall": 35251.8} {"step": 18374, "train_loss": 3.342586040496826, "lr": 0.00017053691882555608, "tps": 34155, "wall": 35257.3} {"step": 18375, "train_loss": 3.2508604526519775, "lr": 0.00017051849863407523, "tps": 34151, "wall": 35262.8} {"step": 18376, "train_loss": 3.2109591960906982, "lr": 0.00017050007900312357, "tps": 34148, "wall": 35268.3} {"step": 18377, "train_loss": 3.2818660736083984, "lr": 0.00017048165993290964, "tps": 34144, "wall": 35273.8} {"step": 18378, "train_loss": 3.331605911254883, "lr": 0.00017046324142364213, "tps": 34141, "wall": 35279.2} {"step": 18379, "train_loss": 3.2105040550231934, "lr": 0.00017044482347552972, "tps": 34138, "wall": 35284.7} {"step": 18380, "train_loss": 3.2741854190826416, "lr": 0.00017042640608878106, "tps": 34134, "wall": 35290.3} {"step": 18381, "train_loss": 3.342322826385498, "lr": 0.0001704079892636047, "tps": 34131, "wall": 35295.7} {"step": 18382, "train_loss": 3.361706018447876, "lr": 0.00017038957300020933, "tps": 34127, "wall": 35301.2} {"step": 18383, "train_loss": 3.325900077819824, "lr": 0.00017037115729880365, "tps": 34124, "wall": 35306.6} {"step": 18384, "train_loss": 3.2626514434814453, "lr": 0.00017035274215959607, "tps": 34120, "wall": 35312.1} {"step": 18385, "train_loss": 3.238935947418213, "lr": 0.00017033432758279538, "tps": 34117, "wall": 35317.5} {"step": 18386, "train_loss": 3.260960102081299, "lr": 0.0001703159135686101, "tps": 34114, "wall": 35323.0} {"step": 18387, "train_loss": 3.3081583976745605, "lr": 0.00017029750011724883, "tps": 34110, "wall": 35328.5} {"step": 18388, "train_loss": 3.2740979194641113, "lr": 0.00017027908722892017, "tps": 34107, "wall": 35334.0} {"step": 18389, "train_loss": 3.2324116230010986, "lr": 0.00017026067490383268, "tps": 34103, "wall": 35339.4} {"step": 18390, "train_loss": 3.2609567642211914, "lr": 0.000170242263142195, "tps": 34100, "wall": 35344.9} {"step": 18391, "train_loss": 3.2545266151428223, "lr": 0.00017022385194421559, "tps": 34096, "wall": 35350.3} {"step": 18392, "train_loss": 3.342465400695801, "lr": 0.0001702054413101031, "tps": 34093, "wall": 35355.8} {"step": 18393, "train_loss": 3.27315616607666, "lr": 0.00017018703124006615, "tps": 34090, "wall": 35361.2} {"step": 18394, "train_loss": 3.2599244117736816, "lr": 0.00017016862173431312, "tps": 34086, "wall": 35366.6} {"step": 18395, "train_loss": 3.268589973449707, "lr": 0.00017015021279305264, "tps": 34083, "wall": 35372.2} {"step": 18396, "train_loss": 3.2681844234466553, "lr": 0.00017013180441649328, "tps": 34079, "wall": 35377.6} {"step": 18397, "train_loss": 3.290562629699707, "lr": 0.0001701133966048435, "tps": 34076, "wall": 35383.0} {"step": 18398, "train_loss": 3.3422534465789795, "lr": 0.00017009498935831188, "tps": 34073, "wall": 35388.5} {"step": 18399, "train_loss": 3.320258617401123, "lr": 0.0001700765826771069, "tps": 34069, "wall": 35394.0} {"step": 18400, "train_loss": 3.2769923210144043, "lr": 0.00017005817656143716, "tps": 34066, "wall": 35399.4} {"step": 18401, "train_loss": 3.346144676208496, "lr": 0.00017003977101151104, "tps": 34062, "wall": 35404.9} {"step": 18402, "train_loss": 3.377190589904785, "lr": 0.0001700213660275371, "tps": 34059, "wall": 35410.4} {"step": 18403, "train_loss": 3.241992950439453, "lr": 0.00017000296160972383, "tps": 34056, "wall": 35415.8} {"step": 18404, "train_loss": 3.3756866455078125, "lr": 0.00016998455775827975, "tps": 34052, "wall": 35421.3} {"step": 18405, "train_loss": 3.288404941558838, "lr": 0.00016996615447341327, "tps": 34049, "wall": 35426.7} {"step": 18406, "train_loss": 3.2846574783325195, "lr": 0.00016994775175533292, "tps": 34045, "wall": 35432.2} {"step": 18407, "train_loss": 3.227569818496704, "lr": 0.00016992934960424711, "tps": 34042, "wall": 35437.7} {"step": 18408, "train_loss": 3.3359198570251465, "lr": 0.00016991094802036436, "tps": 34039, "wall": 35443.1} {"step": 18409, "train_loss": 3.298671245574951, "lr": 0.0001698925470038931, "tps": 34035, "wall": 35448.6} {"step": 18410, "train_loss": 3.3175888061523438, "lr": 0.0001698741465550418, "tps": 34032, "wall": 35454.1} {"step": 18411, "train_loss": 3.315912961959839, "lr": 0.00016985574667401884, "tps": 34028, "wall": 35459.5} {"step": 18412, "train_loss": 3.1927051544189453, "lr": 0.00016983734736103273, "tps": 34025, "wall": 35465.0} {"step": 18413, "train_loss": 3.275238513946533, "lr": 0.00016981894861629187, "tps": 34022, "wall": 35470.4} {"step": 18414, "train_loss": 3.321451187133789, "lr": 0.00016980055044000465, "tps": 34018, "wall": 35475.9} {"step": 18415, "train_loss": 3.3005499839782715, "lr": 0.00016978215283237948, "tps": 34015, "wall": 35481.3} {"step": 18416, "train_loss": 3.301631450653076, "lr": 0.00016976375579362484, "tps": 34011, "wall": 35486.8} {"step": 18417, "train_loss": 3.2480552196502686, "lr": 0.00016974535932394908, "tps": 34008, "wall": 35492.5} {"step": 18418, "train_loss": 3.340456008911133, "lr": 0.00016972696342356064, "tps": 34005, "wall": 35497.9} {"step": 18419, "train_loss": 3.489142894744873, "lr": 0.00016970856809266782, "tps": 34001, "wall": 35503.5} {"step": 18420, "train_loss": 3.2409794330596924, "lr": 0.00016969017333147912, "tps": 33998, "wall": 35508.9} {"step": 18421, "train_loss": 3.3144478797912598, "lr": 0.0001696717791402028, "tps": 33994, "wall": 35514.3} {"step": 18422, "train_loss": 3.294245719909668, "lr": 0.00016965338551904732, "tps": 33991, "wall": 35519.8} {"step": 18423, "train_loss": 3.2358505725860596, "lr": 0.00016963499246822105, "tps": 33988, "wall": 35525.3} {"step": 18424, "train_loss": 3.3507065773010254, "lr": 0.00016961659998793226, "tps": 33984, "wall": 35530.8} {"step": 18425, "train_loss": 3.3965463638305664, "lr": 0.00016959820807838934, "tps": 33981, "wall": 35536.3} {"step": 18426, "train_loss": 3.242771863937378, "lr": 0.00016957981673980065, "tps": 33977, "wall": 35541.7} {"step": 18427, "train_loss": 3.236872673034668, "lr": 0.00016956142597237457, "tps": 33974, "wall": 35547.2} {"step": 18428, "train_loss": 3.2645952701568604, "lr": 0.00016954303577631933, "tps": 33970, "wall": 35552.9} {"step": 18429, "train_loss": 3.28279447555542, "lr": 0.00016952464615184335, "tps": 33967, "wall": 35558.4} {"step": 18430, "train_loss": 3.274725914001465, "lr": 0.00016950625709915494, "tps": 33964, "wall": 35563.9} {"step": 18431, "train_loss": 3.26017165184021, "lr": 0.0001694878686184623, "tps": 33960, "wall": 35569.3} {"step": 18432, "train_loss": 3.259938955307007, "lr": 0.00016946948070997383, "tps": 33957, "wall": 35574.7} {"step": 18433, "train_loss": 3.2393195629119873, "lr": 0.00016945109337389788, "tps": 33953, "wall": 35580.2} {"step": 18434, "train_loss": 3.3308539390563965, "lr": 0.00016943270661044264, "tps": 33950, "wall": 35585.7} {"step": 18435, "train_loss": 3.3104288578033447, "lr": 0.0001694143204198164, "tps": 33947, "wall": 35591.2} {"step": 18436, "train_loss": 3.2746353149414062, "lr": 0.00016939593480222752, "tps": 33943, "wall": 35596.7} {"step": 18437, "train_loss": 3.25761079788208, "lr": 0.00016937754975788422, "tps": 33940, "wall": 35602.2} {"step": 18438, "train_loss": 3.2445826530456543, "lr": 0.00016935916528699476, "tps": 33936, "wall": 35607.7} {"step": 18439, "train_loss": 3.315126895904541, "lr": 0.00016934078138976743, "tps": 33933, "wall": 35613.3} {"step": 18440, "train_loss": 3.287963390350342, "lr": 0.00016932239806641047, "tps": 33930, "wall": 35618.9} {"step": 18441, "train_loss": 3.20753812789917, "lr": 0.00016930401531713214, "tps": 33926, "wall": 35624.4} {"step": 18442, "train_loss": 3.1855227947235107, "lr": 0.00016928563314214063, "tps": 33923, "wall": 35629.9} {"step": 18443, "train_loss": 3.1584243774414062, "lr": 0.0001692672515416442, "tps": 33919, "wall": 35635.5} {"step": 18444, "train_loss": 3.2822189331054688, "lr": 0.00016924887051585118, "tps": 33916, "wall": 35641.1} {"step": 18445, "train_loss": 3.2360434532165527, "lr": 0.00016923049006496962, "tps": 33912, "wall": 35646.6} {"step": 18446, "train_loss": 3.242009162902832, "lr": 0.00016921211018920782, "tps": 33909, "wall": 35652.2} {"step": 18447, "train_loss": 3.235664129257202, "lr": 0.00016919373088877405, "tps": 33905, "wall": 35657.7} {"step": 18448, "train_loss": 3.278254747390747, "lr": 0.00016917535216387635, "tps": 33902, "wall": 35663.3} {"step": 18449, "train_loss": 3.1986489295959473, "lr": 0.00016915697401472305, "tps": 33899, "wall": 35668.8} {"step": 18450, "train_loss": 3.2932281494140625, "lr": 0.00016913859644152236, "tps": 33895, "wall": 35674.4} {"step": 18451, "train_loss": 3.270684003829956, "lr": 0.00016912021944448231, "tps": 33892, "wall": 35679.9} {"step": 18452, "train_loss": 3.2681539058685303, "lr": 0.00016910184302381117, "tps": 33888, "wall": 35685.5} {"step": 18453, "train_loss": 3.285393714904785, "lr": 0.00016908346717971716, "tps": 33885, "wall": 35691.0} {"step": 18454, "train_loss": 3.31315279006958, "lr": 0.00016906509191240838, "tps": 33881, "wall": 35696.6} {"step": 18455, "train_loss": 3.1876912117004395, "lr": 0.00016904671722209295, "tps": 33878, "wall": 35702.1} {"step": 18456, "train_loss": 3.2923011779785156, "lr": 0.0001690283431089791, "tps": 33874, "wall": 35707.7} {"step": 18457, "train_loss": 3.341675281524658, "lr": 0.00016900996957327496, "tps": 33871, "wall": 35713.3} {"step": 18458, "train_loss": 3.348743438720703, "lr": 0.00016899159661518863, "tps": 33868, "wall": 35718.8} {"step": 18459, "train_loss": 3.289264678955078, "lr": 0.00016897322423492828, "tps": 33864, "wall": 35724.4} {"step": 18460, "train_loss": 3.2008838653564453, "lr": 0.00016895485243270195, "tps": 33861, "wall": 35730.0} {"step": 18461, "train_loss": 3.2276487350463867, "lr": 0.0001689364812087178, "tps": 33857, "wall": 35735.7} {"step": 18462, "train_loss": 3.2723355293273926, "lr": 0.00016891811056318404, "tps": 33854, "wall": 35741.4} {"step": 18463, "train_loss": 3.406083106994629, "lr": 0.00016889974049630858, "tps": 33850, "wall": 35747.0} {"step": 18464, "train_loss": 3.293287992477417, "lr": 0.00016888137100829967, "tps": 33847, "wall": 35752.7} {"step": 18465, "train_loss": 3.2626047134399414, "lr": 0.00016886300209936539, "tps": 33843, "wall": 35758.3} {"step": 18466, "train_loss": 3.3154940605163574, "lr": 0.00016884463376971374, "tps": 33840, "wall": 35763.9} {"step": 18467, "train_loss": 3.359792709350586, "lr": 0.00016882626601955283, "tps": 33836, "wall": 35769.4} {"step": 18468, "train_loss": 3.207937717437744, "lr": 0.0001688078988490908, "tps": 33833, "wall": 35775.0} {"step": 18469, "train_loss": 3.3163955211639404, "lr": 0.00016878953225853564, "tps": 33829, "wall": 35780.6} {"step": 18470, "train_loss": 3.240553379058838, "lr": 0.00016877116624809544, "tps": 33826, "wall": 35786.2} {"step": 18471, "train_loss": 3.220874786376953, "lr": 0.00016875280081797821, "tps": 33822, "wall": 35791.9} {"step": 18472, "train_loss": 3.3221893310546875, "lr": 0.00016873443596839206, "tps": 33819, "wall": 35797.6} {"step": 18473, "train_loss": 3.2585883140563965, "lr": 0.00016871607169954497, "tps": 33815, "wall": 35803.2} {"step": 18474, "train_loss": 3.323632001876831, "lr": 0.00016869770801164496, "tps": 33812, "wall": 35808.9} {"step": 18475, "train_loss": 3.348066806793213, "lr": 0.0001686793449049002, "tps": 33808, "wall": 35814.6} {"step": 18476, "train_loss": 3.167362928390503, "lr": 0.00016866098237951847, "tps": 33805, "wall": 35820.2} {"step": 18477, "train_loss": 3.2929677963256836, "lr": 0.00016864262043570798, "tps": 33801, "wall": 35825.9} {"step": 18478, "train_loss": 3.2708613872528076, "lr": 0.00016862425907367663, "tps": 33798, "wall": 35831.6} {"step": 18479, "train_loss": 3.3507094383239746, "lr": 0.0001686058982936325, "tps": 33794, "wall": 35837.2} {"step": 18480, "train_loss": 3.401202917098999, "lr": 0.0001685875380957835, "tps": 33791, "wall": 35843.0} {"step": 18481, "train_loss": 3.2025258541107178, "lr": 0.00016856917848033764, "tps": 33787, "wall": 35848.6} {"step": 18482, "train_loss": 3.28385591506958, "lr": 0.00016855081944750294, "tps": 33783, "wall": 35854.4} {"step": 18483, "train_loss": 3.3321175575256348, "lr": 0.0001685324609974873, "tps": 33780, "wall": 35860.1} {"step": 18484, "train_loss": 3.276959180831909, "lr": 0.00016851410313049872, "tps": 33776, "wall": 35865.8} {"step": 18485, "train_loss": 3.276797294616699, "lr": 0.00016849574584674518, "tps": 33773, "wall": 35871.5} {"step": 18486, "train_loss": 3.282719135284424, "lr": 0.00016847738914643471, "tps": 33769, "wall": 35877.2} {"step": 18487, "train_loss": 3.290553569793701, "lr": 0.00016845903302977505, "tps": 33766, "wall": 35882.9} {"step": 18488, "train_loss": 3.3111250400543213, "lr": 0.00016844067749697427, "tps": 33762, "wall": 35888.5} {"step": 18489, "train_loss": 3.2938902378082275, "lr": 0.00016842232254824036, "tps": 33759, "wall": 35894.2} {"step": 18490, "train_loss": 3.369549512863159, "lr": 0.0001684039681837811, "tps": 33755, "wall": 35900.0} {"step": 18491, "train_loss": 3.2984871864318848, "lr": 0.00016838561440380448, "tps": 33752, "wall": 35905.6} {"step": 18492, "train_loss": 3.309227466583252, "lr": 0.00016836726120851843, "tps": 33748, "wall": 35911.4} {"step": 18493, "train_loss": 3.321200370788574, "lr": 0.00016834890859813086, "tps": 33744, "wall": 35917.2} {"step": 18494, "train_loss": 3.2187085151672363, "lr": 0.00016833055657284959, "tps": 33741, "wall": 35922.9} {"step": 18495, "train_loss": 3.30112361907959, "lr": 0.00016831220513288263, "tps": 33737, "wall": 35928.5} {"step": 18496, "train_loss": 3.337491750717163, "lr": 0.00016829385427843775, "tps": 33734, "wall": 35934.2} {"step": 18497, "train_loss": 3.3120014667510986, "lr": 0.00016827550400972294, "tps": 33730, "wall": 35939.9} {"step": 18498, "train_loss": 3.2975192070007324, "lr": 0.00016825715432694594, "tps": 33727, "wall": 35945.5} {"step": 18499, "train_loss": 3.226135730743408, "lr": 0.00016823880523031482, "tps": 33723, "wall": 35951.4} {"step": 18500, "train_loss": 3.3659534454345703, "lr": 0.0001682204567200372, "tps": 33720, "wall": 35957.1} {"step": 18501, "train_loss": 3.1935157775878906, "lr": 0.00016820210879632107, "tps": 33716, "wall": 35962.9} {"step": 18502, "train_loss": 3.3623523712158203, "lr": 0.00016818376145937434, "tps": 33713, "wall": 35968.7} {"step": 18503, "train_loss": 3.3829617500305176, "lr": 0.0001681654147094047, "tps": 33709, "wall": 35974.5} {"step": 18504, "train_loss": 3.22503924369812, "lr": 0.00016814706854662, "tps": 33705, "wall": 35980.2} {"step": 18505, "train_loss": 3.3413264751434326, "lr": 0.00016812872297122816, "tps": 33702, "wall": 35986.0} {"step": 18506, "train_loss": 3.3384931087493896, "lr": 0.000168110377983437, "tps": 33698, "wall": 35991.7} {"step": 18507, "train_loss": 3.291365146636963, "lr": 0.0001680920335834542, "tps": 33695, "wall": 35997.5} {"step": 18508, "train_loss": 3.3362700939178467, "lr": 0.00016807368977148768, "tps": 33691, "wall": 36003.2} {"step": 18509, "train_loss": 3.333364248275757, "lr": 0.00016805534654774524, "tps": 33688, "wall": 36008.9} {"step": 18510, "train_loss": 3.339656352996826, "lr": 0.0001680370039124346, "tps": 33684, "wall": 36014.7} {"step": 18511, "train_loss": 3.2970266342163086, "lr": 0.0001680186618657636, "tps": 33680, "wall": 36020.4} {"step": 18512, "train_loss": 3.342665672302246, "lr": 0.00016800032040794003, "tps": 33677, "wall": 36026.1} {"step": 18513, "train_loss": 3.3614425659179688, "lr": 0.00016798197953917163, "tps": 33673, "wall": 36032.0} {"step": 18514, "train_loss": 3.272768497467041, "lr": 0.00016796363925966618, "tps": 33670, "wall": 36037.8} {"step": 18515, "train_loss": 3.2926487922668457, "lr": 0.00016794529956963146, "tps": 33666, "wall": 36043.5} {"step": 18516, "train_loss": 3.2452006340026855, "lr": 0.0001679269604692752, "tps": 33663, "wall": 36049.3} {"step": 18517, "train_loss": 3.260312795639038, "lr": 0.00016790862195880513, "tps": 33659, "wall": 36055.0} {"step": 18518, "train_loss": 3.2532262802124023, "lr": 0.000167890284038429, "tps": 33656, "wall": 36060.8} {"step": 18519, "train_loss": 3.370978355407715, "lr": 0.00016787194670835463, "tps": 33652, "wall": 36066.6} {"step": 18520, "train_loss": 3.31874942779541, "lr": 0.00016785360996878957, "tps": 33648, "wall": 36072.3} {"step": 18521, "train_loss": 3.4012622833251953, "lr": 0.00016783527381994165, "tps": 33645, "wall": 36078.1} {"step": 18522, "train_loss": 3.269343376159668, "lr": 0.00016781693826201858, "tps": 33641, "wall": 36083.9} {"step": 18523, "train_loss": 3.3633511066436768, "lr": 0.00016779860329522813, "tps": 33638, "wall": 36089.7} {"step": 18524, "train_loss": 3.19504976272583, "lr": 0.00016778026891977783, "tps": 33634, "wall": 36095.5} {"step": 18525, "train_loss": 3.181607246398926, "lr": 0.0001677619351358755, "tps": 33630, "wall": 36101.3} {"step": 18526, "train_loss": 3.281984567642212, "lr": 0.0001677436019437288, "tps": 33627, "wall": 36107.2} {"step": 18527, "train_loss": 3.2791712284088135, "lr": 0.00016772526934354543, "tps": 33623, "wall": 36113.0} {"step": 18528, "train_loss": 3.250795841217041, "lr": 0.00016770693733553297, "tps": 33620, "wall": 36118.7} {"step": 18529, "train_loss": 3.312105178833008, "lr": 0.00016768860591989925, "tps": 33616, "wall": 36124.6} {"step": 18530, "train_loss": 3.344473361968994, "lr": 0.00016767027509685174, "tps": 33612, "wall": 36130.4} {"step": 18531, "train_loss": 3.1808905601501465, "lr": 0.00016765194486659826, "tps": 33609, "wall": 36136.1} {"step": 18532, "train_loss": 3.2146222591400146, "lr": 0.0001676336152293463, "tps": 33605, "wall": 36141.9} {"step": 18533, "train_loss": 3.311790943145752, "lr": 0.00016761528618530367, "tps": 33602, "wall": 36147.8} {"step": 18534, "train_loss": 3.3629307746887207, "lr": 0.00016759695773467783, "tps": 33598, "wall": 36153.6} {"step": 18535, "train_loss": 3.301605224609375, "lr": 0.00016757862987767648, "tps": 33594, "wall": 36159.4} {"step": 18536, "train_loss": 3.243983745574951, "lr": 0.00016756030261450735, "tps": 33591, "wall": 36165.2} {"step": 18537, "train_loss": 3.2577812671661377, "lr": 0.00016754197594537787, "tps": 33587, "wall": 36171.1} {"step": 18538, "train_loss": 3.2974019050598145, "lr": 0.0001675236498704957, "tps": 33584, "wall": 36176.9} {"step": 18539, "train_loss": 3.3535327911376953, "lr": 0.00016750532439006852, "tps": 33580, "wall": 36182.7} {"step": 18540, "train_loss": 3.4004502296447754, "lr": 0.0001674869995043039, "tps": 33577, "wall": 36188.5} {"step": 18541, "train_loss": 3.340034008026123, "lr": 0.00016746867521340926, "tps": 33573, "wall": 36194.3} {"step": 18542, "train_loss": 3.3594985008239746, "lr": 0.00016745035151759238, "tps": 33569, "wall": 36200.1} {"step": 18543, "train_loss": 3.384888172149658, "lr": 0.00016743202841706082, "tps": 33566, "wall": 36205.9} {"step": 18544, "train_loss": 3.400822639465332, "lr": 0.00016741370591202202, "tps": 33562, "wall": 36211.8} {"step": 18545, "train_loss": 3.238086700439453, "lr": 0.0001673953840026836, "tps": 33559, "wall": 36217.7} {"step": 18546, "train_loss": 3.3325045108795166, "lr": 0.0001673770626892532, "tps": 33555, "wall": 36223.5} {"step": 18547, "train_loss": 3.304778575897217, "lr": 0.0001673587419719382, "tps": 33551, "wall": 36229.3} {"step": 18548, "train_loss": 3.345946788787842, "lr": 0.00016734042185094622, "tps": 33548, "wall": 36235.1} {"step": 18549, "train_loss": 3.247925281524658, "lr": 0.00016732210232648476, "tps": 33544, "wall": 36241.0} {"step": 18550, "train_loss": 3.3712217807769775, "lr": 0.00016730378339876144, "tps": 33541, "wall": 36246.8} {"step": 18551, "train_loss": 3.2873048782348633, "lr": 0.00016728546506798373, "tps": 33537, "wall": 36252.6} {"step": 18552, "train_loss": 3.306924819946289, "lr": 0.00016726714733435904, "tps": 33533, "wall": 36258.5} {"step": 18553, "train_loss": 3.3516807556152344, "lr": 0.00016724883019809505, "tps": 33530, "wall": 36264.4} {"step": 18554, "train_loss": 3.24130916595459, "lr": 0.0001672305136593991, "tps": 33526, "wall": 36270.2} {"step": 18555, "train_loss": 3.2857632637023926, "lr": 0.00016721219771847877, "tps": 33522, "wall": 36276.2} {"step": 18556, "train_loss": 3.310685157775879, "lr": 0.0001671938823755415, "tps": 33519, "wall": 36282.0} {"step": 18557, "train_loss": 3.352957248687744, "lr": 0.0001671755676307948, "tps": 33515, "wall": 36287.9} {"step": 18558, "train_loss": 3.2241926193237305, "lr": 0.0001671572534844461, "tps": 33512, "wall": 36293.7} {"step": 18559, "train_loss": 3.2527098655700684, "lr": 0.00016713893993670293, "tps": 33508, "wall": 36299.5} {"step": 18560, "train_loss": 3.2331528663635254, "lr": 0.00016712062698777272, "tps": 33505, "wall": 36305.4} {"step": 18561, "train_loss": 3.320922374725342, "lr": 0.00016710231463786288, "tps": 33501, "wall": 36311.2} {"step": 18562, "train_loss": 3.2589054107666016, "lr": 0.00016708400288718088, "tps": 33497, "wall": 36317.0} {"step": 18563, "train_loss": 3.365165948867798, "lr": 0.0001670656917359342, "tps": 33494, "wall": 36322.9} {"step": 18564, "train_loss": 3.2533118724823, "lr": 0.0001670473811843302, "tps": 33490, "wall": 36328.7} {"step": 18565, "train_loss": 3.299196720123291, "lr": 0.0001670290712325763, "tps": 33487, "wall": 36334.6} {"step": 18566, "train_loss": 3.2970173358917236, "lr": 0.00016701076188087996, "tps": 33483, "wall": 36340.4} {"step": 18567, "train_loss": 3.3084139823913574, "lr": 0.00016699245312944863, "tps": 33480, "wall": 36346.2} {"step": 18568, "train_loss": 3.325615882873535, "lr": 0.00016697414497848957, "tps": 33476, "wall": 36352.0} {"step": 18569, "train_loss": 3.345881462097168, "lr": 0.00016695583742821032, "tps": 33472, "wall": 36357.8} {"step": 18570, "train_loss": 3.1898701190948486, "lr": 0.00016693753047881824, "tps": 33469, "wall": 36363.7} {"step": 18571, "train_loss": 3.2784042358398438, "lr": 0.00016691922413052064, "tps": 33465, "wall": 36369.5} {"step": 18572, "train_loss": 3.2794528007507324, "lr": 0.00016690091838352493, "tps": 33462, "wall": 36375.3} {"step": 18573, "train_loss": 3.283961296081543, "lr": 0.00016688261323803856, "tps": 33458, "wall": 36381.1} {"step": 18574, "train_loss": 3.423656463623047, "lr": 0.00016686430869426874, "tps": 33455, "wall": 36386.9} {"step": 18575, "train_loss": 3.324018716812134, "lr": 0.0001668460047524229, "tps": 33451, "wall": 36392.8} {"step": 18576, "train_loss": 3.330735921859741, "lr": 0.0001668277014127084, "tps": 33448, "wall": 36398.6} {"step": 18577, "train_loss": 3.3201160430908203, "lr": 0.00016680939867533265, "tps": 33444, "wall": 36404.4} {"step": 18578, "train_loss": 3.1829490661621094, "lr": 0.00016679109654050284, "tps": 33440, "wall": 36410.2} {"step": 18579, "train_loss": 3.291492462158203, "lr": 0.0001667727950084264, "tps": 33437, "wall": 36416.0} {"step": 18580, "train_loss": 3.345083713531494, "lr": 0.00016675449407931066, "tps": 33433, "wall": 36421.8} {"step": 18581, "train_loss": 3.342933177947998, "lr": 0.0001667361937533628, "tps": 33430, "wall": 36427.6} {"step": 18582, "train_loss": 3.3009305000305176, "lr": 0.00016671789403079025, "tps": 33426, "wall": 36433.4} {"step": 18583, "train_loss": 3.267301559448242, "lr": 0.00016669959491180035, "tps": 33423, "wall": 36439.2} {"step": 18584, "train_loss": 3.394282341003418, "lr": 0.0001666812963966002, "tps": 33419, "wall": 36445.0} {"step": 18585, "train_loss": 3.234792470932007, "lr": 0.00016666299848539727, "tps": 33416, "wall": 36450.8} {"step": 18586, "train_loss": 3.337181329727173, "lr": 0.0001666447011783988, "tps": 33412, "wall": 36456.7} {"step": 18587, "train_loss": 3.2339749336242676, "lr": 0.00016662640447581204, "tps": 33409, "wall": 36462.5} {"step": 18588, "train_loss": 3.2271881103515625, "lr": 0.00016660810837784422, "tps": 33405, "wall": 36468.3} {"step": 18589, "train_loss": 3.301753520965576, "lr": 0.00016658981288470264, "tps": 33402, "wall": 36474.1} {"step": 18590, "train_loss": 3.3152389526367188, "lr": 0.00016657151799659458, "tps": 33398, "wall": 36479.9} {"step": 18591, "train_loss": 3.407529830932617, "lr": 0.00016655322371372723, "tps": 33395, "wall": 36485.7} {"step": 18592, "train_loss": 3.3798863887786865, "lr": 0.00016653493003630784, "tps": 33391, "wall": 36491.5} {"step": 18593, "train_loss": 3.309436559677124, "lr": 0.00016651663696454368, "tps": 33388, "wall": 36497.2} {"step": 18594, "train_loss": 3.2163591384887695, "lr": 0.00016649834449864197, "tps": 33384, "wall": 36503.0} {"step": 18595, "train_loss": 3.3166098594665527, "lr": 0.00016648005263880986, "tps": 33381, "wall": 36508.8} {"step": 18596, "train_loss": 3.322575330734253, "lr": 0.00016646176138525464, "tps": 33377, "wall": 36514.7} {"step": 18597, "train_loss": 3.268651247024536, "lr": 0.0001664434707381835, "tps": 33374, "wall": 36520.4} {"step": 18598, "train_loss": 3.2677090167999268, "lr": 0.00016642518069780358, "tps": 33370, "wall": 36526.2} {"step": 18599, "train_loss": 3.211937427520752, "lr": 0.0001664068912643221, "tps": 33367, "wall": 36531.9} {"step": 18600, "train_loss": 3.450532913208008, "lr": 0.00016638860243794632, "tps": 33363, "wall": 36537.7} {"step": 18601, "train_loss": 3.1087491512298584, "lr": 0.00016637031421888333, "tps": 33360, "wall": 36543.5} {"step": 18602, "train_loss": 3.329669952392578, "lr": 0.00016635202660734026, "tps": 33356, "wall": 36549.2} {"step": 18603, "train_loss": 3.2534573078155518, "lr": 0.00016633373960352437, "tps": 33353, "wall": 36555.0} {"step": 18604, "train_loss": 3.3123583793640137, "lr": 0.00016631545320764282, "tps": 33349, "wall": 36560.7} {"step": 18605, "train_loss": 3.3585901260375977, "lr": 0.0001662971674199027, "tps": 33346, "wall": 36566.5} {"step": 18606, "train_loss": 3.329070568084717, "lr": 0.00016627888224051112, "tps": 33342, "wall": 36572.3} {"step": 18607, "train_loss": 3.232715606689453, "lr": 0.00016626059766967533, "tps": 33339, "wall": 36578.0} {"step": 18608, "train_loss": 3.333375930786133, "lr": 0.0001662423137076024, "tps": 33336, "wall": 36583.7} {"step": 18609, "train_loss": 3.3139822483062744, "lr": 0.00016622403035449943, "tps": 33332, "wall": 36589.5} {"step": 18610, "train_loss": 3.3017048835754395, "lr": 0.00016620574761057357, "tps": 33329, "wall": 36595.3} {"step": 18611, "train_loss": 3.2131264209747314, "lr": 0.00016618746547603186, "tps": 33325, "wall": 36601.0} {"step": 18612, "train_loss": 3.288370132446289, "lr": 0.0001661691839510815, "tps": 33322, "wall": 36606.6} {"step": 18613, "train_loss": 3.240161418914795, "lr": 0.00016615090303592948, "tps": 33319, "wall": 36612.3} {"step": 18614, "train_loss": 3.3863463401794434, "lr": 0.00016613262273078302, "tps": 33315, "wall": 36618.0} {"step": 18615, "train_loss": 3.1823904514312744, "lr": 0.0001661143430358491, "tps": 33312, "wall": 36623.7} {"step": 18616, "train_loss": 3.3182504177093506, "lr": 0.00016609606395133478, "tps": 33308, "wall": 36629.4} {"step": 18617, "train_loss": 3.3724966049194336, "lr": 0.00016607778547744726, "tps": 33305, "wall": 36635.1} {"step": 18618, "train_loss": 3.2433812618255615, "lr": 0.00016605950761439337, "tps": 33302, "wall": 36640.8} {"step": 18619, "train_loss": 3.308586597442627, "lr": 0.00016604123036238034, "tps": 33298, "wall": 36646.5} {"step": 18620, "train_loss": 3.208296537399292, "lr": 0.00016602295372161524, "tps": 33295, "wall": 36652.2} {"step": 18621, "train_loss": 3.303217887878418, "lr": 0.000166004677692305, "tps": 33291, "wall": 36657.9} {"step": 18622, "train_loss": 3.167543411254883, "lr": 0.00016598640227465667, "tps": 33288, "wall": 36663.5} {"step": 18623, "train_loss": 3.4079525470733643, "lr": 0.0001659681274688773, "tps": 33285, "wall": 36669.2} {"step": 18624, "train_loss": 3.2893714904785156, "lr": 0.00016594985327517394, "tps": 33281, "wall": 36674.9} {"step": 18625, "train_loss": 3.3706107139587402, "lr": 0.0001659315796937535, "tps": 33278, "wall": 36680.6} {"step": 18626, "train_loss": 3.3038253784179688, "lr": 0.00016591330672482317, "tps": 33275, "wall": 36686.3} {"step": 18627, "train_loss": 3.1979281902313232, "lr": 0.00016589503436858976, "tps": 33271, "wall": 36692.1} {"step": 18628, "train_loss": 3.277763605117798, "lr": 0.00016587676262526027, "tps": 33268, "wall": 36697.8} {"step": 18629, "train_loss": 3.233137369155884, "lr": 0.00016585849149504183, "tps": 33264, "wall": 36703.5} {"step": 18630, "train_loss": 3.228846549987793, "lr": 0.0001658402209781413, "tps": 33261, "wall": 36709.3} {"step": 18631, "train_loss": 3.343069553375244, "lr": 0.00016582195107476565, "tps": 33258, "wall": 36715.0} {"step": 18632, "train_loss": 3.357837438583374, "lr": 0.00016580368178512194, "tps": 33254, "wall": 36720.6} {"step": 18633, "train_loss": 3.297884941101074, "lr": 0.00016578541310941693, "tps": 33251, "wall": 36726.3} {"step": 18634, "train_loss": 3.290708541870117, "lr": 0.00016576714504785777, "tps": 33248, "wall": 36731.9} {"step": 18635, "train_loss": 3.3125202655792236, "lr": 0.00016574887760065137, "tps": 33244, "wall": 36737.6} {"step": 18636, "train_loss": 3.2781946659088135, "lr": 0.0001657306107680045, "tps": 33241, "wall": 36743.2} {"step": 18637, "train_loss": 3.335210084915161, "lr": 0.00016571234455012426, "tps": 33238, "wall": 36748.9} {"step": 18638, "train_loss": 3.312157154083252, "lr": 0.00016569407894721753, "tps": 33234, "wall": 36754.6} {"step": 18639, "train_loss": 3.1618072986602783, "lr": 0.00016567581395949125, "tps": 33231, "wall": 36760.3} {"step": 18640, "train_loss": 3.2770917415618896, "lr": 0.00016565754958715223, "tps": 33227, "wall": 36765.9} {"step": 18641, "train_loss": 3.199028730392456, "lr": 0.00016563928583040744, "tps": 33224, "wall": 36771.6} {"step": 18642, "train_loss": 3.2844161987304688, "lr": 0.0001656210226894638, "tps": 33221, "wall": 36777.3} {"step": 18643, "train_loss": 3.293830394744873, "lr": 0.0001656027601645281, "tps": 33217, "wall": 36783.0} {"step": 18644, "train_loss": 3.328395128250122, "lr": 0.00016558449825580728, "tps": 33214, "wall": 36788.6} {"step": 18645, "train_loss": 3.2300214767456055, "lr": 0.00016556623696350827, "tps": 33211, "wall": 36794.3} {"step": 18646, "train_loss": 3.202002763748169, "lr": 0.00016554797628783784, "tps": 33207, "wall": 36800.0} {"step": 18647, "train_loss": 3.3574347496032715, "lr": 0.00016552971622900287, "tps": 33204, "wall": 36805.6} {"step": 18648, "train_loss": 3.2606072425842285, "lr": 0.0001655114567872102, "tps": 33201, "wall": 36811.4} {"step": 18649, "train_loss": 3.296104907989502, "lr": 0.00016549319796266672, "tps": 33197, "wall": 36817.1} {"step": 18650, "train_loss": 3.2287862300872803, "lr": 0.00016547493975557927, "tps": 33194, "wall": 36822.8} {"step": 18651, "train_loss": 3.2505812644958496, "lr": 0.0001654566821661546, "tps": 33191, "wall": 36828.5} {"step": 18652, "train_loss": 3.287048816680908, "lr": 0.0001654384251945996, "tps": 33187, "wall": 36834.2} {"step": 18653, "train_loss": 3.2917745113372803, "lr": 0.00016542016884112107, "tps": 33184, "wall": 36839.7} {"step": 18654, "train_loss": 3.1802167892456055, "lr": 0.0001654019131059258, "tps": 33181, "wall": 36845.4} {"step": 18655, "train_loss": 3.2631194591522217, "lr": 0.00016538365798922068, "tps": 33177, "wall": 36851.0} {"step": 18656, "train_loss": 3.231221914291382, "lr": 0.0001653654034912124, "tps": 33174, "wall": 36856.7} {"step": 18657, "train_loss": 3.3649954795837402, "lr": 0.00016534714961210776, "tps": 33171, "wall": 36862.3} {"step": 18658, "train_loss": 3.3074049949645996, "lr": 0.0001653288963521136, "tps": 33167, "wall": 36868.0} {"step": 18659, "train_loss": 3.3143465518951416, "lr": 0.00016531064371143667, "tps": 33164, "wall": 36873.7} {"step": 18660, "train_loss": 3.22331166267395, "lr": 0.00016529239169028368, "tps": 33161, "wall": 36879.3} {"step": 18661, "train_loss": 3.327293872833252, "lr": 0.00016527414028886148, "tps": 33158, "wall": 36885.0} {"step": 18662, "train_loss": 3.2400753498077393, "lr": 0.0001652558895073768, "tps": 33154, "wall": 36890.6} {"step": 18663, "train_loss": 3.300703525543213, "lr": 0.00016523763934603628, "tps": 33151, "wall": 36896.2} {"step": 18664, "train_loss": 3.3519396781921387, "lr": 0.00016521938980504678, "tps": 33148, "wall": 36901.8} {"step": 18665, "train_loss": 3.2877938747406006, "lr": 0.00016520114088461503, "tps": 33144, "wall": 36907.4} {"step": 18666, "train_loss": 3.284628391265869, "lr": 0.00016518289258494773, "tps": 33141, "wall": 36913.0} {"step": 18667, "train_loss": 3.28536057472229, "lr": 0.0001651646449062515, "tps": 33138, "wall": 36918.6} {"step": 18668, "train_loss": 3.245480537414551, "lr": 0.00016514639784873323, "tps": 33135, "wall": 36924.2} {"step": 18669, "train_loss": 3.3292737007141113, "lr": 0.0001651281514125995, "tps": 33132, "wall": 36929.8} {"step": 18670, "train_loss": 3.25125789642334, "lr": 0.00016510990559805703, "tps": 33128, "wall": 36935.5} {"step": 18671, "train_loss": 3.2162868976593018, "lr": 0.00016509166040531254, "tps": 33125, "wall": 36941.1} {"step": 18672, "train_loss": 3.408080577850342, "lr": 0.00016507341583457262, "tps": 33122, "wall": 36946.8} {"step": 18673, "train_loss": 3.3477554321289062, "lr": 0.0001650551718860441, "tps": 33118, "wall": 36952.4} {"step": 18674, "train_loss": 3.1921212673187256, "lr": 0.00016503692855993353, "tps": 33115, "wall": 36958.0} {"step": 18675, "train_loss": 3.194967031478882, "lr": 0.00016501868585644763, "tps": 33112, "wall": 36963.6} {"step": 18676, "train_loss": 3.218679904937744, "lr": 0.00016500044377579305, "tps": 33109, "wall": 36969.2} {"step": 18677, "train_loss": 3.232320785522461, "lr": 0.00016498220231817636, "tps": 33105, "wall": 36974.8} {"step": 18678, "train_loss": 3.2077503204345703, "lr": 0.00016496396148380423, "tps": 33102, "wall": 36980.4} {"step": 18679, "train_loss": 3.1005842685699463, "lr": 0.0001649457212728834, "tps": 33099, "wall": 36986.0} {"step": 18680, "train_loss": 3.2304351329803467, "lr": 0.00016492748168562041, "tps": 33096, "wall": 36991.6} {"step": 18681, "train_loss": 3.2631454467773438, "lr": 0.00016490924272222185, "tps": 33092, "wall": 36997.3} {"step": 18682, "train_loss": 3.2585856914520264, "lr": 0.0001648910043828944, "tps": 33089, "wall": 37003.0} {"step": 18683, "train_loss": 3.3695099353790283, "lr": 0.00016487276666784468, "tps": 33086, "wall": 37008.8} {"step": 18684, "train_loss": 3.262420177459717, "lr": 0.00016485452957727917, "tps": 33082, "wall": 37014.6} {"step": 18685, "train_loss": 3.220637321472168, "lr": 0.00016483629311140452, "tps": 33079, "wall": 37020.3} {"step": 18686, "train_loss": 3.240936040878296, "lr": 0.0001648180572704274, "tps": 33075, "wall": 37026.1} {"step": 18687, "train_loss": 3.2173240184783936, "lr": 0.0001647998220545542, "tps": 33072, "wall": 37031.8} {"step": 18688, "train_loss": 3.358034133911133, "lr": 0.00016478158746399167, "tps": 33069, "wall": 37037.6} {"step": 18689, "train_loss": 3.3848390579223633, "lr": 0.00016476335349894635, "tps": 33065, "wall": 37043.3} {"step": 18690, "train_loss": 3.2722270488739014, "lr": 0.00016474512015962468, "tps": 33062, "wall": 37049.0} {"step": 18691, "train_loss": 3.454043388366699, "lr": 0.00016472688744623327, "tps": 33059, "wall": 37054.7} {"step": 18692, "train_loss": 3.3610196113586426, "lr": 0.00016470865535897868, "tps": 33056, "wall": 37060.3} {"step": 18693, "train_loss": 3.225160837173462, "lr": 0.0001646904238980675, "tps": 33052, "wall": 37065.9} {"step": 18694, "train_loss": 3.3659486770629883, "lr": 0.00016467219306370612, "tps": 33049, "wall": 37071.5} {"step": 18695, "train_loss": 3.2663121223449707, "lr": 0.00016465396285610115, "tps": 33046, "wall": 37077.1} {"step": 18696, "train_loss": 3.300581693649292, "lr": 0.00016463573327545912, "tps": 33043, "wall": 37082.7} {"step": 18697, "train_loss": 3.323943614959717, "lr": 0.00016461750432198645, "tps": 33039, "wall": 37088.3} {"step": 18698, "train_loss": 3.245048999786377, "lr": 0.0001645992759958897, "tps": 33036, "wall": 37093.9} {"step": 18699, "train_loss": 3.223906993865967, "lr": 0.0001645810482973753, "tps": 33033, "wall": 37099.5} {"step": 18700, "train_loss": 3.300398826599121, "lr": 0.0001645628212266499, "tps": 33030, "wall": 37105.1} {"step": 18701, "train_loss": 3.288785696029663, "lr": 0.0001645445947839198, "tps": 33027, "wall": 37110.7} {"step": 18702, "train_loss": 3.3169217109680176, "lr": 0.0001645263689693915, "tps": 33023, "wall": 37116.4} {"step": 18703, "train_loss": 3.311556816101074, "lr": 0.00016450814378327153, "tps": 33020, "wall": 37121.9} {"step": 18704, "train_loss": 3.3512115478515625, "lr": 0.00016448991922576628, "tps": 33017, "wall": 37127.5} {"step": 18705, "train_loss": 3.2222447395324707, "lr": 0.00016447169529708222, "tps": 33014, "wall": 37133.2} {"step": 18706, "train_loss": 3.369150400161743, "lr": 0.00016445347199742588, "tps": 33010, "wall": 37138.8} {"step": 18707, "train_loss": 3.301290512084961, "lr": 0.0001644352493270035, "tps": 33007, "wall": 37144.4} {"step": 18708, "train_loss": 3.2622978687286377, "lr": 0.0001644170272860217, "tps": 33004, "wall": 37150.0} {"step": 18709, "train_loss": 3.2041358947753906, "lr": 0.00016439880587468676, "tps": 33001, "wall": 37155.5} {"step": 18710, "train_loss": 3.2676022052764893, "lr": 0.00016438058509320524, "tps": 32998, "wall": 37161.1} {"step": 18711, "train_loss": 3.1457977294921875, "lr": 0.0001643623649417834, "tps": 32994, "wall": 37166.6} {"step": 18712, "train_loss": 3.232025623321533, "lr": 0.00016434414542062774, "tps": 32991, "wall": 37172.2} {"step": 18713, "train_loss": 3.3423218727111816, "lr": 0.00016432592652994461, "tps": 32988, "wall": 37177.8} {"step": 18714, "train_loss": 3.3501200675964355, "lr": 0.00016430770826994038, "tps": 32985, "wall": 37183.4} {"step": 18715, "train_loss": 3.27860164642334, "lr": 0.0001642894906408214, "tps": 32982, "wall": 37188.9} {"step": 18716, "train_loss": 3.2496745586395264, "lr": 0.00016427127364279412, "tps": 32978, "wall": 37194.5} {"step": 18717, "train_loss": 3.297149419784546, "lr": 0.00016425305727606491, "tps": 32975, "wall": 37200.0} {"step": 18718, "train_loss": 3.168149948120117, "lr": 0.00016423484154084, "tps": 32972, "wall": 37205.6} {"step": 18719, "train_loss": 3.2827327251434326, "lr": 0.00016421662643732586, "tps": 32969, "wall": 37211.1} {"step": 18720, "train_loss": 3.2189247608184814, "lr": 0.00016419841196572884, "tps": 32966, "wall": 37216.7} {"step": 18721, "train_loss": 3.2045302391052246, "lr": 0.00016418019812625514, "tps": 32963, "wall": 37222.3} {"step": 18722, "train_loss": 3.251706123352051, "lr": 0.00016416198491911126, "tps": 32960, "wall": 37227.8} {"step": 18723, "train_loss": 3.343980550765991, "lr": 0.0001641437723445034, "tps": 32956, "wall": 37233.5} {"step": 18724, "train_loss": 3.353087902069092, "lr": 0.0001641255604026379, "tps": 32953, "wall": 37239.1} {"step": 18725, "train_loss": 3.2749314308166504, "lr": 0.00016410734909372106, "tps": 32950, "wall": 37244.6} {"step": 18726, "train_loss": 3.158555030822754, "lr": 0.00016408913841795922, "tps": 32947, "wall": 37250.2} {"step": 18727, "train_loss": 3.289630889892578, "lr": 0.00016407092837555863, "tps": 32944, "wall": 37255.7} {"step": 18728, "train_loss": 3.1846554279327393, "lr": 0.00016405271896672563, "tps": 32940, "wall": 37261.3} {"step": 18729, "train_loss": 3.386566400527954, "lr": 0.0001640345101916664, "tps": 32937, "wall": 37266.8} {"step": 18730, "train_loss": 3.293381690979004, "lr": 0.0001640163020505873, "tps": 32934, "wall": 37272.4} {"step": 18731, "train_loss": 3.380640983581543, "lr": 0.00016399809454369457, "tps": 32931, "wall": 37277.9} {"step": 18732, "train_loss": 3.3545970916748047, "lr": 0.00016397988767119439, "tps": 32928, "wall": 37283.5} {"step": 18733, "train_loss": 3.3144524097442627, "lr": 0.00016396168143329316, "tps": 32925, "wall": 37289.0} {"step": 18734, "train_loss": 3.2093775272369385, "lr": 0.00016394347583019697, "tps": 32922, "wall": 37294.7} {"step": 18735, "train_loss": 3.270474433898926, "lr": 0.00016392527086211213, "tps": 32918, "wall": 37300.3} {"step": 18736, "train_loss": 3.2226150035858154, "lr": 0.00016390706652924487, "tps": 32915, "wall": 37305.8} {"step": 18737, "train_loss": 3.262742757797241, "lr": 0.00016388886283180142, "tps": 32912, "wall": 37311.3} {"step": 18738, "train_loss": 3.2677001953125, "lr": 0.0001638706597699879, "tps": 32909, "wall": 37316.9} {"step": 18739, "train_loss": 3.274665355682373, "lr": 0.00016385245734401065, "tps": 32906, "wall": 37322.4} {"step": 18740, "train_loss": 3.3067870140075684, "lr": 0.00016383425555407578, "tps": 32903, "wall": 37328.0} {"step": 18741, "train_loss": 3.287095546722412, "lr": 0.00016381605440038944, "tps": 32900, "wall": 37333.5} {"step": 18742, "train_loss": 3.2417778968811035, "lr": 0.00016379785388315792, "tps": 32896, "wall": 37339.1} {"step": 18743, "train_loss": 3.2242956161499023, "lr": 0.0001637796540025874, "tps": 32893, "wall": 37344.6} {"step": 18744, "train_loss": 3.2872934341430664, "lr": 0.00016376145475888393, "tps": 32890, "wall": 37350.2} {"step": 18745, "train_loss": 3.2946150302886963, "lr": 0.00016374325615225378, "tps": 32887, "wall": 37355.8} {"step": 18746, "train_loss": 3.201535224914551, "lr": 0.00016372505818290306, "tps": 32884, "wall": 37361.4} {"step": 18747, "train_loss": 3.2012832164764404, "lr": 0.00016370686085103792, "tps": 32881, "wall": 37367.0} {"step": 18748, "train_loss": 3.480952739715576, "lr": 0.0001636886641568645, "tps": 32877, "wall": 37372.6} {"step": 18749, "train_loss": 3.2634639739990234, "lr": 0.00016367046810058895, "tps": 32874, "wall": 37378.1} {"step": 18750, "train_loss": 3.3643405437469482, "lr": 0.00016365227268241742, "tps": 32871, "wall": 37383.7} {"step": 18751, "train_loss": 3.283128023147583, "lr": 0.00016363407790255595, "tps": 32868, "wall": 37389.2} {"step": 18752, "train_loss": 3.2155635356903076, "lr": 0.00016361588376121068, "tps": 32865, "wall": 37394.8} {"step": 18753, "train_loss": 3.217808723449707, "lr": 0.00016359769025858775, "tps": 32862, "wall": 37400.3} {"step": 18754, "train_loss": 3.2433865070343018, "lr": 0.0001635794973948933, "tps": 32859, "wall": 37405.9} {"step": 18755, "train_loss": 3.303863763809204, "lr": 0.00016356130517033326, "tps": 32856, "wall": 37411.5} {"step": 18756, "train_loss": 3.2410359382629395, "lr": 0.00016354311358511385, "tps": 32852, "wall": 37417.0} {"step": 18757, "train_loss": 3.401421546936035, "lr": 0.00016352492263944107, "tps": 32849, "wall": 37422.6} {"step": 18758, "train_loss": 3.2347474098205566, "lr": 0.00016350673233352108, "tps": 32846, "wall": 37428.1} {"step": 18759, "train_loss": 3.276048183441162, "lr": 0.00016348854266755983, "tps": 32843, "wall": 37433.6} {"step": 18760, "train_loss": 3.2715485095977783, "lr": 0.00016347035364176347, "tps": 32840, "wall": 37439.2} {"step": 18761, "train_loss": 3.2301406860351562, "lr": 0.00016345216525633799, "tps": 32837, "wall": 37444.7} {"step": 18762, "train_loss": 3.3252077102661133, "lr": 0.0001634339775114894, "tps": 32834, "wall": 37450.3} {"step": 18763, "train_loss": 3.293156147003174, "lr": 0.0001634157904074238, "tps": 32831, "wall": 37455.8} {"step": 18764, "train_loss": 3.2997591495513916, "lr": 0.00016339760394434716, "tps": 32828, "wall": 37461.4} {"step": 18765, "train_loss": 3.288442611694336, "lr": 0.0001633794181224656, "tps": 32824, "wall": 37466.9} {"step": 18766, "train_loss": 3.2041587829589844, "lr": 0.000163361232941985, "tps": 32821, "wall": 37472.6} {"step": 18767, "train_loss": 3.264054775238037, "lr": 0.00016334304840311142, "tps": 32818, "wall": 37478.1} {"step": 18768, "train_loss": 3.338310480117798, "lr": 0.00016332486450605088, "tps": 32815, "wall": 37483.6} {"step": 18769, "train_loss": 3.345778226852417, "lr": 0.0001633066812510093, "tps": 32812, "wall": 37489.1} {"step": 18770, "train_loss": 3.342616319656372, "lr": 0.00016328849863819276, "tps": 32809, "wall": 37494.7} {"step": 18771, "train_loss": 3.2781052589416504, "lr": 0.00016327031666780713, "tps": 32806, "wall": 37500.2} {"step": 18772, "train_loss": 3.288740634918213, "lr": 0.0001632521353400584, "tps": 32803, "wall": 37505.7} {"step": 18773, "train_loss": 3.1811327934265137, "lr": 0.00016323395465515255, "tps": 32800, "wall": 37511.2} {"step": 18774, "train_loss": 3.26798939704895, "lr": 0.00016321577461329563, "tps": 32797, "wall": 37516.8} {"step": 18775, "train_loss": 3.214177131652832, "lr": 0.00016319759521469339, "tps": 32793, "wall": 37522.3} {"step": 18776, "train_loss": 3.3696045875549316, "lr": 0.00016317941645955188, "tps": 32790, "wall": 37527.8} {"step": 18777, "train_loss": 3.3163981437683105, "lr": 0.00016316123834807705, "tps": 32787, "wall": 37533.4} {"step": 18778, "train_loss": 3.235015392303467, "lr": 0.00016314306088047474, "tps": 32784, "wall": 37538.9} {"step": 18779, "train_loss": 3.37852144241333, "lr": 0.00016312488405695094, "tps": 32781, "wall": 37544.4} {"step": 18780, "train_loss": 3.257260322570801, "lr": 0.00016310670787771155, "tps": 32778, "wall": 37550.0} {"step": 18781, "train_loss": 3.237067699432373, "lr": 0.00016308853234296242, "tps": 32775, "wall": 37555.5} {"step": 18782, "train_loss": 3.2540602684020996, "lr": 0.00016307035745290947, "tps": 32772, "wall": 37561.1} {"step": 18783, "train_loss": 3.4122776985168457, "lr": 0.0001630521832077586, "tps": 32769, "wall": 37566.7} {"step": 18784, "train_loss": 3.297353982925415, "lr": 0.0001630340096077157, "tps": 32766, "wall": 37572.2} {"step": 18785, "train_loss": 3.296924591064453, "lr": 0.00016301583665298658, "tps": 32762, "wall": 37577.8} {"step": 18786, "train_loss": 3.2894158363342285, "lr": 0.00016299766434377716, "tps": 32759, "wall": 37583.3} {"step": 18787, "train_loss": 3.299731969833374, "lr": 0.00016297949268029334, "tps": 32756, "wall": 37588.9} {"step": 18788, "train_loss": 3.1906867027282715, "lr": 0.00016296132166274086, "tps": 32753, "wall": 37594.5} {"step": 18789, "train_loss": 3.314174175262451, "lr": 0.00016294315129132558, "tps": 32750, "wall": 37600.1} {"step": 18790, "train_loss": 3.3542401790618896, "lr": 0.0001629249815662534, "tps": 32747, "wall": 37605.6} {"step": 18791, "train_loss": 3.2362093925476074, "lr": 0.00016290681248773016, "tps": 32744, "wall": 37611.2} {"step": 18792, "train_loss": 3.3519585132598877, "lr": 0.00016288864405596161, "tps": 32741, "wall": 37616.7} {"step": 18793, "train_loss": 3.3257317543029785, "lr": 0.00016287047627115358, "tps": 32738, "wall": 37622.2} {"step": 18794, "train_loss": 3.329648971557617, "lr": 0.00016285230913351187, "tps": 32735, "wall": 37627.7} {"step": 18795, "train_loss": 3.425309419631958, "lr": 0.0001628341426432424, "tps": 32732, "wall": 37633.3} {"step": 18796, "train_loss": 3.3189682960510254, "lr": 0.00016281597680055073, "tps": 32728, "wall": 37638.8} {"step": 18797, "train_loss": 3.266388416290283, "lr": 0.00016279781160564278, "tps": 32725, "wall": 37644.4} {"step": 18798, "train_loss": 3.3324451446533203, "lr": 0.00016277964705872436, "tps": 32722, "wall": 37649.9} {"step": 18799, "train_loss": 3.3139495849609375, "lr": 0.0001627614831600012, "tps": 32719, "wall": 37655.5} {"step": 18800, "train_loss": 3.448518753051758, "lr": 0.000162743319909679, "tps": 32716, "wall": 37661.0} {"step": 18801, "train_loss": 3.1877756118774414, "lr": 0.0001627251573079636, "tps": 32713, "wall": 37666.5} {"step": 18802, "train_loss": 3.3476076126098633, "lr": 0.0001627069953550607, "tps": 32710, "wall": 37672.0} {"step": 18803, "train_loss": 3.2361485958099365, "lr": 0.00016268883405117608, "tps": 32707, "wall": 37677.5} {"step": 18804, "train_loss": 3.294386863708496, "lr": 0.0001626706733965154, "tps": 32704, "wall": 37683.1} {"step": 18805, "train_loss": 3.2978200912475586, "lr": 0.00016265251339128448, "tps": 32701, "wall": 37688.6} {"step": 18806, "train_loss": 3.2498106956481934, "lr": 0.00016263435403568902, "tps": 32698, "wall": 37694.2} {"step": 18807, "train_loss": 3.344907760620117, "lr": 0.00016261619532993463, "tps": 32695, "wall": 37699.8} {"step": 18808, "train_loss": 3.2732038497924805, "lr": 0.0001625980372742271, "tps": 32692, "wall": 37705.3} {"step": 18809, "train_loss": 3.3310818672180176, "lr": 0.00016257987986877215, "tps": 32689, "wall": 37710.9} {"step": 18810, "train_loss": 3.360835075378418, "lr": 0.0001625617231137754, "tps": 32685, "wall": 37716.6} {"step": 18811, "train_loss": 3.150599718093872, "lr": 0.00016254356700944254, "tps": 32682, "wall": 37722.1} {"step": 18812, "train_loss": 3.239227771759033, "lr": 0.00016252541155597933, "tps": 32679, "wall": 37727.7} {"step": 18813, "train_loss": 3.2896804809570312, "lr": 0.00016250725675359128, "tps": 32676, "wall": 37733.2} {"step": 18814, "train_loss": 3.3761157989501953, "lr": 0.0001624891026024842, "tps": 32673, "wall": 37738.8} {"step": 18815, "train_loss": 3.1881520748138428, "lr": 0.0001624709491028636, "tps": 32670, "wall": 37744.3} {"step": 18816, "train_loss": 3.288996934890747, "lr": 0.00016245279625493527, "tps": 32667, "wall": 37749.9} {"step": 18817, "train_loss": 3.3835437297821045, "lr": 0.00016243464405890477, "tps": 32664, "wall": 37755.4} {"step": 18818, "train_loss": 3.316389560699463, "lr": 0.00016241649251497772, "tps": 32661, "wall": 37760.9} {"step": 18819, "train_loss": 3.307246208190918, "lr": 0.0001623983416233598, "tps": 32658, "wall": 37766.4} {"step": 18820, "train_loss": 3.2314605712890625, "lr": 0.0001623801913842565, "tps": 32655, "wall": 37772.0} {"step": 18821, "train_loss": 3.4001617431640625, "lr": 0.00016236204179787355, "tps": 32652, "wall": 37777.5} {"step": 18822, "train_loss": 3.307708740234375, "lr": 0.00016234389286441653, "tps": 32649, "wall": 37783.1} {"step": 18823, "train_loss": 3.350688934326172, "lr": 0.00016232574458409103, "tps": 32646, "wall": 37788.6} {"step": 18824, "train_loss": 3.229829788208008, "lr": 0.00016230759695710253, "tps": 32643, "wall": 37794.1} {"step": 18825, "train_loss": 3.2518415451049805, "lr": 0.00016228944998365673, "tps": 32640, "wall": 37799.6} {"step": 18826, "train_loss": 3.348165512084961, "lr": 0.0001622713036639592, "tps": 32637, "wall": 37805.1} {"step": 18827, "train_loss": 3.3595495223999023, "lr": 0.00016225315799821543, "tps": 32634, "wall": 37810.5} {"step": 18828, "train_loss": 3.410961389541626, "lr": 0.00016223501298663102, "tps": 32631, "wall": 37816.1} {"step": 18829, "train_loss": 3.2595155239105225, "lr": 0.00016221686862941153, "tps": 32628, "wall": 37821.6} {"step": 18830, "train_loss": 3.281923294067383, "lr": 0.00016219872492676248, "tps": 32624, "wall": 37827.1} {"step": 18831, "train_loss": 3.2710189819335938, "lr": 0.00016218058187888933, "tps": 32621, "wall": 37832.7} {"step": 18832, "train_loss": 3.2534642219543457, "lr": 0.0001621624394859977, "tps": 32618, "wall": 37838.2} {"step": 18833, "train_loss": 3.371805191040039, "lr": 0.00016214429774829317, "tps": 32615, "wall": 37843.7} {"step": 18834, "train_loss": 3.288796901702881, "lr": 0.0001621261566659811, "tps": 32612, "wall": 37849.2} {"step": 18835, "train_loss": 3.3127198219299316, "lr": 0.000162108016239267, "tps": 32609, "wall": 37854.7} {"step": 18836, "train_loss": 3.385472297668457, "lr": 0.00016208987646835655, "tps": 32606, "wall": 37860.2} {"step": 18837, "train_loss": 3.217128276824951, "lr": 0.000162071737353455, "tps": 32603, "wall": 37865.8} {"step": 18838, "train_loss": 3.3010425567626953, "lr": 0.000162053598894768, "tps": 32600, "wall": 37871.4} {"step": 18839, "train_loss": 3.267608165740967, "lr": 0.000162035461092501, "tps": 32597, "wall": 37876.9} {"step": 18840, "train_loss": 3.3417840003967285, "lr": 0.00016201732394685939, "tps": 32594, "wall": 37882.4} {"step": 18841, "train_loss": 3.2518811225891113, "lr": 0.00016199918745804864, "tps": 32591, "wall": 37888.0} {"step": 18842, "train_loss": 3.2269153594970703, "lr": 0.00016198105162627425, "tps": 32588, "wall": 37893.6} {"step": 18843, "train_loss": 3.292102575302124, "lr": 0.00016196291645174168, "tps": 32585, "wall": 37899.1} {"step": 18844, "train_loss": 3.310220956802368, "lr": 0.0001619447819346563, "tps": 32582, "wall": 37904.7} {"step": 18845, "train_loss": 3.397653341293335, "lr": 0.0001619266480752236, "tps": 32579, "wall": 37910.2} {"step": 18846, "train_loss": 3.2621665000915527, "lr": 0.00016190851487364895, "tps": 32576, "wall": 37915.7} {"step": 18847, "train_loss": 3.3131561279296875, "lr": 0.00016189038233013777, "tps": 32573, "wall": 37921.2} {"step": 18848, "train_loss": 3.263040781021118, "lr": 0.0001618722504448955, "tps": 32570, "wall": 37926.7} {"step": 18849, "train_loss": 3.2205374240875244, "lr": 0.00016185411921812754, "tps": 32567, "wall": 37932.2} {"step": 18850, "train_loss": 3.1698219776153564, "lr": 0.00016183598865003926, "tps": 32564, "wall": 37937.7} {"step": 18851, "train_loss": 3.233157157897949, "lr": 0.000161817858740836, "tps": 32561, "wall": 37943.3} {"step": 18852, "train_loss": 3.2645249366760254, "lr": 0.00016179972949072324, "tps": 32558, "wall": 37948.9} {"step": 18853, "train_loss": 3.217489004135132, "lr": 0.00016178160089990628, "tps": 32555, "wall": 37954.4} {"step": 18854, "train_loss": 3.302126407623291, "lr": 0.0001617634729685905, "tps": 32552, "wall": 37960.0} {"step": 18855, "train_loss": 3.335249423980713, "lr": 0.00016174534569698122, "tps": 32549, "wall": 37965.5} {"step": 18856, "train_loss": 3.2961268424987793, "lr": 0.00016172721908528384, "tps": 32546, "wall": 37971.1} {"step": 18857, "train_loss": 3.34037184715271, "lr": 0.00016170909313370366, "tps": 32543, "wall": 37976.5} {"step": 18858, "train_loss": 3.362516403198242, "lr": 0.000161690967842446, "tps": 32540, "wall": 37982.1} {"step": 18859, "train_loss": 3.4291605949401855, "lr": 0.00016167284321171624, "tps": 32537, "wall": 37987.5} {"step": 18860, "train_loss": 3.3270998001098633, "lr": 0.0001616547192417197, "tps": 32534, "wall": 37993.0} {"step": 18861, "train_loss": 3.265577554702759, "lr": 0.0001616365959326616, "tps": 32531, "wall": 37998.6} {"step": 18862, "train_loss": 3.3852853775024414, "lr": 0.00016161847328474734, "tps": 32528, "wall": 38004.1} {"step": 18863, "train_loss": 3.3135416507720947, "lr": 0.00016160035129818217, "tps": 32525, "wall": 38009.6} {"step": 18864, "train_loss": 3.329043388366699, "lr": 0.00016158222997317138, "tps": 32522, "wall": 38015.2} {"step": 18865, "train_loss": 3.309065818786621, "lr": 0.00016156410930992022, "tps": 32519, "wall": 38020.6} {"step": 18866, "train_loss": 3.355266571044922, "lr": 0.00016154598930863404, "tps": 32516, "wall": 38026.2} {"step": 18867, "train_loss": 3.3686177730560303, "lr": 0.00016152786996951802, "tps": 32513, "wall": 38031.7} {"step": 18868, "train_loss": 3.337627649307251, "lr": 0.00016150975129277742, "tps": 32510, "wall": 38037.2} {"step": 18869, "train_loss": 3.355752944946289, "lr": 0.00016149163327861755, "tps": 32507, "wall": 38042.8} {"step": 18870, "train_loss": 3.1460013389587402, "lr": 0.00016147351592724367, "tps": 32504, "wall": 38048.3} {"step": 18871, "train_loss": 3.3237948417663574, "lr": 0.0001614553992388609, "tps": 32501, "wall": 38053.7} {"step": 18872, "train_loss": 3.367544651031494, "lr": 0.00016143728321367458, "tps": 32498, "wall": 38059.2} {"step": 18873, "train_loss": 3.2392737865448, "lr": 0.00016141916785188988, "tps": 32495, "wall": 38064.8} {"step": 18874, "train_loss": 3.309793472290039, "lr": 0.00016140105315371202, "tps": 32492, "wall": 38070.3} {"step": 18875, "train_loss": 3.3803763389587402, "lr": 0.00016138293911934618, "tps": 32489, "wall": 38076.0} {"step": 18876, "train_loss": 3.1755449771881104, "lr": 0.0001613648257489976, "tps": 32486, "wall": 38081.6} {"step": 18877, "train_loss": 3.3389475345611572, "lr": 0.00016134671304287142, "tps": 32483, "wall": 38087.1} {"step": 18878, "train_loss": 3.332838535308838, "lr": 0.00016132860100117284, "tps": 32480, "wall": 38092.6} {"step": 18879, "train_loss": 3.287264823913574, "lr": 0.00016131048962410703, "tps": 32477, "wall": 38098.1} {"step": 18880, "train_loss": 3.322584629058838, "lr": 0.0001612923789118792, "tps": 32474, "wall": 38103.6} {"step": 18881, "train_loss": 3.319404125213623, "lr": 0.00016127426886469447, "tps": 32471, "wall": 38109.1} {"step": 18882, "train_loss": 3.3384854793548584, "lr": 0.000161256159482758, "tps": 32468, "wall": 38114.6} {"step": 18883, "train_loss": 3.2469305992126465, "lr": 0.00016123805076627496, "tps": 32465, "wall": 38120.1} {"step": 18884, "train_loss": 3.2660696506500244, "lr": 0.00016121994271545042, "tps": 32462, "wall": 38125.6} {"step": 18885, "train_loss": 3.220698356628418, "lr": 0.00016120183533048957, "tps": 32459, "wall": 38131.1} {"step": 18886, "train_loss": 3.298936367034912, "lr": 0.0001611837286115975, "tps": 32456, "wall": 38136.6} {"step": 18887, "train_loss": 3.3194594383239746, "lr": 0.00016116562255897936, "tps": 32453, "wall": 38142.2} {"step": 18888, "train_loss": 3.2441694736480713, "lr": 0.0001611475171728402, "tps": 32450, "wall": 38147.7} {"step": 18889, "train_loss": 3.291886329650879, "lr": 0.00016112941245338512, "tps": 32447, "wall": 38153.2} {"step": 18890, "train_loss": 3.274033546447754, "lr": 0.00016111130840081928, "tps": 32444, "wall": 38158.7} {"step": 18891, "train_loss": 3.287175178527832, "lr": 0.00016109320501534775, "tps": 32441, "wall": 38164.2} {"step": 18892, "train_loss": 3.300769805908203, "lr": 0.00016107510229717553, "tps": 32438, "wall": 38169.6} {"step": 18893, "train_loss": 3.212906837463379, "lr": 0.0001610570002465078, "tps": 32435, "wall": 38175.1} {"step": 18894, "train_loss": 3.3279612064361572, "lr": 0.00016103889886354952, "tps": 32432, "wall": 38180.6} {"step": 18895, "train_loss": 3.2515058517456055, "lr": 0.00016102079814850576, "tps": 32429, "wall": 38186.1} {"step": 18896, "train_loss": 3.372224807739258, "lr": 0.00016100269810158163, "tps": 32426, "wall": 38191.6} {"step": 18897, "train_loss": 3.4386775493621826, "lr": 0.0001609845987229821, "tps": 32423, "wall": 38197.2} {"step": 18898, "train_loss": 3.2728729248046875, "lr": 0.00016096650001291228, "tps": 32420, "wall": 38202.8} {"step": 18899, "train_loss": 3.2455224990844727, "lr": 0.00016094840197157707, "tps": 32417, "wall": 38208.3} {"step": 18900, "train_loss": 3.2582743167877197, "lr": 0.0001609303045991816, "tps": 32414, "wall": 38213.7} {"step": 18901, "train_loss": 3.323538303375244, "lr": 0.0001609122078959308, "tps": 32411, "wall": 38219.3} {"step": 18902, "train_loss": 3.2610082626342773, "lr": 0.00016089411186202975, "tps": 32408, "wall": 38224.8} {"step": 18903, "train_loss": 3.348294973373413, "lr": 0.00016087601649768338, "tps": 32406, "wall": 38230.3} {"step": 18904, "train_loss": 3.3217365741729736, "lr": 0.0001608579218030967, "tps": 32403, "wall": 38235.8} {"step": 18905, "train_loss": 3.2605457305908203, "lr": 0.00016083982777847467, "tps": 32400, "wall": 38241.2} {"step": 18906, "train_loss": 3.329455852508545, "lr": 0.00016082173442402223, "tps": 32397, "wall": 38246.7} {"step": 18907, "train_loss": 3.272019147872925, "lr": 0.00016080364173994447, "tps": 32394, "wall": 38252.3} {"step": 18908, "train_loss": 3.264260768890381, "lr": 0.00016078554972644623, "tps": 32391, "wall": 38257.9} {"step": 18909, "train_loss": 3.258702516555786, "lr": 0.00016076745838373245, "tps": 32387, "wall": 38264.3} {"step": 18910, "train_loss": 3.2049386501312256, "lr": 0.00016074936771200818, "tps": 32384, "wall": 38270.0} {"step": 18911, "train_loss": 3.2539007663726807, "lr": 0.00016073127771147817, "tps": 32381, "wall": 38275.5} {"step": 18912, "train_loss": 3.351121425628662, "lr": 0.00016071318838234753, "tps": 32378, "wall": 38281.1} {"step": 18913, "train_loss": 3.320775270462036, "lr": 0.00016069509972482107, "tps": 32375, "wall": 38286.6} {"step": 18914, "train_loss": 3.277881383895874, "lr": 0.00016067701173910374, "tps": 32372, "wall": 38292.2} {"step": 18915, "train_loss": 3.2588367462158203, "lr": 0.00016065892442540048, "tps": 32369, "wall": 38297.7} {"step": 18916, "train_loss": 3.2740402221679688, "lr": 0.000160640837783916, "tps": 32366, "wall": 38303.3} {"step": 18917, "train_loss": 3.264834403991699, "lr": 0.00016062275181485548, "tps": 32363, "wall": 38308.8} {"step": 18918, "train_loss": 3.182255744934082, "lr": 0.00016060466651842355, "tps": 32360, "wall": 38314.4} {"step": 18919, "train_loss": 3.26220440864563, "lr": 0.00016058658189482515, "tps": 32357, "wall": 38319.9} {"step": 18920, "train_loss": 3.4188268184661865, "lr": 0.00016056849794426526, "tps": 32354, "wall": 38325.4} {"step": 18921, "train_loss": 3.3261327743530273, "lr": 0.00016055041466694854, "tps": 32351, "wall": 38331.0} {"step": 18922, "train_loss": 3.353269577026367, "lr": 0.00016053233206307996, "tps": 32348, "wall": 38336.5} {"step": 18923, "train_loss": 3.327414035797119, "lr": 0.00016051425013286435, "tps": 32345, "wall": 38342.0} {"step": 18924, "train_loss": 3.2909791469573975, "lr": 0.00016049616887650657, "tps": 32342, "wall": 38347.5} {"step": 18925, "train_loss": 3.2589402198791504, "lr": 0.0001604780882942114, "tps": 32339, "wall": 38353.0} {"step": 18926, "train_loss": 3.2551846504211426, "lr": 0.0001604600083861836, "tps": 32337, "wall": 38358.5} {"step": 18927, "train_loss": 3.397188425064087, "lr": 0.0001604419291526281, "tps": 32334, "wall": 38364.0} {"step": 18928, "train_loss": 3.258768081665039, "lr": 0.00016042385059374966, "tps": 32331, "wall": 38369.5} {"step": 18929, "train_loss": 3.266935110092163, "lr": 0.00016040577270975303, "tps": 32328, "wall": 38375.1} {"step": 18930, "train_loss": 3.403502941131592, "lr": 0.00016038769550084307, "tps": 32325, "wall": 38380.6} {"step": 18931, "train_loss": 3.2889366149902344, "lr": 0.00016036961896722448, "tps": 32322, "wall": 38386.2} {"step": 18932, "train_loss": 3.3463146686553955, "lr": 0.00016035154310910205, "tps": 32319, "wall": 38391.6} {"step": 18933, "train_loss": 3.3122434616088867, "lr": 0.00016033346792668064, "tps": 32316, "wall": 38397.2} {"step": 18934, "train_loss": 3.337571144104004, "lr": 0.0001603153934201649, "tps": 32313, "wall": 38402.7} {"step": 18935, "train_loss": 3.279264450073242, "lr": 0.0001602973195897596, "tps": 32310, "wall": 38408.2} {"step": 18936, "train_loss": 3.3058414459228516, "lr": 0.0001602792464356695, "tps": 32307, "wall": 38413.7} {"step": 18937, "train_loss": 3.2329869270324707, "lr": 0.00016026117395809934, "tps": 32304, "wall": 38419.3} {"step": 18938, "train_loss": 3.3102893829345703, "lr": 0.0001602431021572538, "tps": 32301, "wall": 38424.7} {"step": 18939, "train_loss": 3.3012478351593018, "lr": 0.00016022503103333766, "tps": 32298, "wall": 38430.2} {"step": 18940, "train_loss": 3.393547534942627, "lr": 0.0001602069605865556, "tps": 32295, "wall": 38435.8} {"step": 18941, "train_loss": 3.2306113243103027, "lr": 0.00016018889081711234, "tps": 32292, "wall": 38441.3} {"step": 18942, "train_loss": 3.309706211090088, "lr": 0.0001601708217252125, "tps": 32290, "wall": 38446.8} {"step": 18943, "train_loss": 3.2771430015563965, "lr": 0.00016015275331106085, "tps": 32287, "wall": 38452.3} {"step": 18944, "train_loss": 3.2737390995025635, "lr": 0.00016013468557486213, "tps": 32284, "wall": 38457.8} {"step": 18945, "train_loss": 3.2200798988342285, "lr": 0.00016011661851682085, "tps": 32281, "wall": 38463.3} {"step": 18946, "train_loss": 3.201727867126465, "lr": 0.0001600985521371418, "tps": 32278, "wall": 38468.9} {"step": 18947, "train_loss": 3.3345088958740234, "lr": 0.00016008048643602956, "tps": 32275, "wall": 38474.3} {"step": 18948, "train_loss": 3.2457306385040283, "lr": 0.00016006242141368882, "tps": 32272, "wall": 38479.9} {"step": 18949, "train_loss": 3.3118276596069336, "lr": 0.00016004435707032418, "tps": 32269, "wall": 38485.4} {"step": 18950, "train_loss": 3.1808102130889893, "lr": 0.00016002629340614033, "tps": 32266, "wall": 38490.9} {"step": 18951, "train_loss": 3.3271658420562744, "lr": 0.0001600082304213419, "tps": 32263, "wall": 38496.4} {"step": 18952, "train_loss": 3.2224478721618652, "lr": 0.00015999016811613345, "tps": 32260, "wall": 38501.9} {"step": 18953, "train_loss": 3.2402777671813965, "lr": 0.00015997210649071962, "tps": 32257, "wall": 38507.4} {"step": 18954, "train_loss": 3.259046792984009, "lr": 0.00015995404554530507, "tps": 32254, "wall": 38513.0} {"step": 18955, "train_loss": 3.338949203491211, "lr": 0.00015993598528009427, "tps": 32252, "wall": 38518.4} {"step": 18956, "train_loss": 3.324990749359131, "lr": 0.00015991792569529188, "tps": 32249, "wall": 38523.9} {"step": 18957, "train_loss": 3.2060317993164062, "lr": 0.00015989986679110257, "tps": 32246, "wall": 38529.4} {"step": 18958, "train_loss": 3.3575186729431152, "lr": 0.0001598818085677307, "tps": 32243, "wall": 38534.9} {"step": 18959, "train_loss": 3.2544021606445312, "lr": 0.00015986375102538102, "tps": 32240, "wall": 38540.4} {"step": 18960, "train_loss": 3.3537609577178955, "lr": 0.00015984569416425802, "tps": 32237, "wall": 38545.8} {"step": 18961, "train_loss": 3.380034923553467, "lr": 0.00015982763798456624, "tps": 32234, "wall": 38551.3} {"step": 18962, "train_loss": 3.276510238647461, "lr": 0.00015980958248651024, "tps": 32231, "wall": 38556.9} {"step": 18963, "train_loss": 3.232665777206421, "lr": 0.0001597915276702945, "tps": 32228, "wall": 38562.4} {"step": 18964, "train_loss": 3.3278307914733887, "lr": 0.00015977347353612374, "tps": 32226, "wall": 38567.9} {"step": 18965, "train_loss": 3.3050758838653564, "lr": 0.00015975542008420218, "tps": 32223, "wall": 38573.4} {"step": 18966, "train_loss": 3.3762950897216797, "lr": 0.00015973736731473456, "tps": 32220, "wall": 38578.9} {"step": 18967, "train_loss": 3.1976187229156494, "lr": 0.00015971931522792526, "tps": 32217, "wall": 38584.3} {"step": 18968, "train_loss": 3.304874897003174, "lr": 0.0001597012638239788, "tps": 32214, "wall": 38589.8} {"step": 18969, "train_loss": 3.3601484298706055, "lr": 0.00015968321310309976, "tps": 32211, "wall": 38595.3} {"step": 18970, "train_loss": 3.3344790935516357, "lr": 0.00015966516306549245, "tps": 32208, "wall": 38600.8} {"step": 18971, "train_loss": 3.2652742862701416, "lr": 0.0001596471137113615, "tps": 32205, "wall": 38606.3} {"step": 18972, "train_loss": 3.240476608276367, "lr": 0.0001596290650409113, "tps": 32202, "wall": 38611.9} {"step": 18973, "train_loss": 3.2760634422302246, "lr": 0.00015961101705434628, "tps": 32200, "wall": 38617.4} {"step": 18974, "train_loss": 3.3621246814727783, "lr": 0.00015959296975187094, "tps": 32197, "wall": 38622.8} {"step": 18975, "train_loss": 3.249769687652588, "lr": 0.00015957492313368974, "tps": 32194, "wall": 38628.3} {"step": 18976, "train_loss": 3.3349764347076416, "lr": 0.00015955687720000706, "tps": 32191, "wall": 38633.8} {"step": 18977, "train_loss": 3.247504472732544, "lr": 0.00015953883195102736, "tps": 32188, "wall": 38639.2} {"step": 18978, "train_loss": 3.323943853378296, "lr": 0.000159520787386955, "tps": 32185, "wall": 38644.7} {"step": 18979, "train_loss": 3.285463809967041, "lr": 0.0001595027435079945, "tps": 32182, "wall": 38650.3} {"step": 18980, "train_loss": 3.468031883239746, "lr": 0.00015948470031435018, "tps": 32179, "wall": 38655.8} {"step": 18981, "train_loss": 3.319120407104492, "lr": 0.00015946665780622635, "tps": 32176, "wall": 38661.3} {"step": 18982, "train_loss": 3.350393772125244, "lr": 0.00015944861598382758, "tps": 32174, "wall": 38666.8} {"step": 18983, "train_loss": 3.3148205280303955, "lr": 0.00015943057484735823, "tps": 32171, "wall": 38672.4} {"step": 18984, "train_loss": 3.3292431831359863, "lr": 0.00015941253439702248, "tps": 32168, "wall": 38677.8} {"step": 18985, "train_loss": 3.292109489440918, "lr": 0.00015939449463302485, "tps": 32165, "wall": 38683.3} {"step": 18986, "train_loss": 3.1733951568603516, "lr": 0.00015937645555556972, "tps": 32162, "wall": 38688.8} {"step": 18987, "train_loss": 3.2915797233581543, "lr": 0.00015935841716486132, "tps": 32159, "wall": 38694.3} {"step": 18988, "train_loss": 3.3773694038391113, "lr": 0.0001593403794611041, "tps": 32156, "wall": 38699.8} {"step": 18989, "train_loss": 3.315549850463867, "lr": 0.00015932234244450227, "tps": 32153, "wall": 38705.4} {"step": 18990, "train_loss": 3.244450092315674, "lr": 0.0001593043061152603, "tps": 32151, "wall": 38710.9} {"step": 18991, "train_loss": 3.2777762413024902, "lr": 0.00015928627047358238, "tps": 32148, "wall": 38716.4} {"step": 18992, "train_loss": 3.2829771041870117, "lr": 0.0001592682355196729, "tps": 32145, "wall": 38721.9} {"step": 18993, "train_loss": 3.369065999984741, "lr": 0.00015925020125373616, "tps": 32142, "wall": 38727.5} {"step": 18994, "train_loss": 3.372170925140381, "lr": 0.00015923216767597638, "tps": 32139, "wall": 38733.2} {"step": 18995, "train_loss": 3.3566040992736816, "lr": 0.0001592141347865979, "tps": 32136, "wall": 38738.7} {"step": 18996, "train_loss": 3.3499717712402344, "lr": 0.00015919610258580504, "tps": 32133, "wall": 38744.2} {"step": 18997, "train_loss": 3.293452262878418, "lr": 0.00015917807107380195, "tps": 32130, "wall": 38749.7} {"step": 18998, "train_loss": 3.405949592590332, "lr": 0.00015916004025079297, "tps": 32127, "wall": 38755.2} {"step": 18999, "train_loss": 3.2872540950775146, "lr": 0.0001591420101169824, "tps": 32124, "wall": 38760.7} {"step": 19000, "train_loss": 3.327084541320801, "lr": 0.0001591239806725744, "tps": 32121, "wall": 38766.3, "val_loss_monitor": 3.3972543815995433} {"step": 19001, "train_loss": 3.2931623458862305, "lr": 0.00015910595191777325, "tps": 32089, "wall": 38807.6} {"step": 19002, "train_loss": 3.343639850616455, "lr": 0.00015908792385278315, "tps": 32086, "wall": 38813.1} {"step": 19003, "train_loss": 3.2295312881469727, "lr": 0.00015906989647780835, "tps": 32083, "wall": 38818.7} {"step": 19004, "train_loss": 3.29473614692688, "lr": 0.00015905186979305307, "tps": 32080, "wall": 38824.2} {"step": 19005, "train_loss": 3.3235177993774414, "lr": 0.00015903384379872145, "tps": 32077, "wall": 38829.8} {"step": 19006, "train_loss": 3.2376034259796143, "lr": 0.00015901581849501786, "tps": 32074, "wall": 38835.4} {"step": 19007, "train_loss": 3.275933265686035, "lr": 0.0001589977938821463, "tps": 32071, "wall": 38841.0} {"step": 19008, "train_loss": 3.3220973014831543, "lr": 0.00015897976996031104, "tps": 32069, "wall": 38846.6} {"step": 19009, "train_loss": 3.3269784450531006, "lr": 0.00015896174672971625, "tps": 32066, "wall": 38852.3} {"step": 19010, "train_loss": 3.3753538131713867, "lr": 0.00015894372419056612, "tps": 32063, "wall": 38857.8} {"step": 19011, "train_loss": 3.3060920238494873, "lr": 0.00015892570234306473, "tps": 32060, "wall": 38863.4} {"step": 19012, "train_loss": 3.229063034057617, "lr": 0.0001589076811874163, "tps": 32057, "wall": 38869.0} {"step": 19013, "train_loss": 3.263545513153076, "lr": 0.000158889660723825, "tps": 32054, "wall": 38874.6} {"step": 19014, "train_loss": 3.3270363807678223, "lr": 0.0001588716409524949, "tps": 32051, "wall": 38880.3} {"step": 19015, "train_loss": 3.2750680446624756, "lr": 0.0001588536218736302, "tps": 32048, "wall": 38885.8} {"step": 19016, "train_loss": 3.2421255111694336, "lr": 0.00015883560348743493, "tps": 32045, "wall": 38891.5} {"step": 19017, "train_loss": 3.2713193893432617, "lr": 0.0001588175857941133, "tps": 32042, "wall": 38897.1} {"step": 19018, "train_loss": 3.309597969055176, "lr": 0.0001587995687938693, "tps": 32039, "wall": 38902.6} {"step": 19019, "train_loss": 3.229414939880371, "lr": 0.00015878155248690715, "tps": 32036, "wall": 38908.2} {"step": 19020, "train_loss": 3.2306323051452637, "lr": 0.00015876353687343086, "tps": 32033, "wall": 38913.9} {"step": 19021, "train_loss": 3.3610472679138184, "lr": 0.00015874552195364454, "tps": 32030, "wall": 38919.4} {"step": 19022, "train_loss": 3.3269004821777344, "lr": 0.00015872750772775226, "tps": 32028, "wall": 38925.0} {"step": 19023, "train_loss": 3.305514335632324, "lr": 0.0001587094941959581, "tps": 32025, "wall": 38930.5} {"step": 19024, "train_loss": 3.2687602043151855, "lr": 0.0001586914813584661, "tps": 32022, "wall": 38936.1} {"step": 19025, "train_loss": 3.422844171524048, "lr": 0.00015867346921548032, "tps": 32019, "wall": 38941.7} {"step": 19026, "train_loss": 3.257946729660034, "lr": 0.00015865545776720484, "tps": 32016, "wall": 38947.3} {"step": 19027, "train_loss": 3.284372329711914, "lr": 0.0001586374470138436, "tps": 32013, "wall": 38952.8} {"step": 19028, "train_loss": 3.293916702270508, "lr": 0.00015861943695560067, "tps": 32010, "wall": 38958.6} {"step": 19029, "train_loss": 3.2749080657958984, "lr": 0.00015860142759268006, "tps": 32007, "wall": 38964.1} {"step": 19030, "train_loss": 3.3734347820281982, "lr": 0.0001585834189252859, "tps": 32004, "wall": 38969.7} {"step": 19031, "train_loss": 3.232024669647217, "lr": 0.00015856541095362201, "tps": 32001, "wall": 38975.4} {"step": 19032, "train_loss": 3.3933024406433105, "lr": 0.00015854740367789245, "tps": 31998, "wall": 38980.9} {"step": 19033, "train_loss": 3.1784605979919434, "lr": 0.00015852939709830132, "tps": 31995, "wall": 38986.5} {"step": 19034, "train_loss": 3.3946619033813477, "lr": 0.00015851139121505242, "tps": 31993, "wall": 38992.1} {"step": 19035, "train_loss": 3.299239158630371, "lr": 0.00015849338602834983, "tps": 31990, "wall": 38997.7} {"step": 19036, "train_loss": 3.2876505851745605, "lr": 0.00015847538153839752, "tps": 31987, "wall": 39003.3} {"step": 19037, "train_loss": 3.2800533771514893, "lr": 0.0001584573777453994, "tps": 31984, "wall": 39008.8} {"step": 19038, "train_loss": 3.284242630004883, "lr": 0.00015843937464955941, "tps": 31981, "wall": 39014.3} {"step": 19039, "train_loss": 3.2688918113708496, "lr": 0.00015842137225108153, "tps": 31978, "wall": 39019.9} {"step": 19040, "train_loss": 3.178799867630005, "lr": 0.0001584033705501697, "tps": 31975, "wall": 39025.4} {"step": 19041, "train_loss": 3.269247531890869, "lr": 0.00015838536954702778, "tps": 31973, "wall": 39030.9} {"step": 19042, "train_loss": 3.2360589504241943, "lr": 0.00015836736924185974, "tps": 31970, "wall": 39036.5} {"step": 19043, "train_loss": 3.1903433799743652, "lr": 0.00015834936963486952, "tps": 31967, "wall": 39042.1} {"step": 19044, "train_loss": 3.220862865447998, "lr": 0.0001583313707262609, "tps": 31964, "wall": 39047.6} {"step": 19045, "train_loss": 3.3907065391540527, "lr": 0.00015831337251623787, "tps": 31961, "wall": 39053.1} {"step": 19046, "train_loss": 3.395695686340332, "lr": 0.0001582953750050043, "tps": 31958, "wall": 39058.7} {"step": 19047, "train_loss": 3.2657957077026367, "lr": 0.0001582773781927641, "tps": 31955, "wall": 39064.2} {"step": 19048, "train_loss": 3.3002262115478516, "lr": 0.00015825938207972103, "tps": 31953, "wall": 39069.7} {"step": 19049, "train_loss": 3.222304344177246, "lr": 0.00015824138666607906, "tps": 31950, "wall": 39075.2} {"step": 19050, "train_loss": 3.2656991481781006, "lr": 0.00015822339195204204, "tps": 31947, "wall": 39080.8} {"step": 19051, "train_loss": 3.2881956100463867, "lr": 0.00015820539793781372, "tps": 31944, "wall": 39086.3} {"step": 19052, "train_loss": 3.3251233100891113, "lr": 0.000158187404623598, "tps": 31941, "wall": 39092.0} {"step": 19053, "train_loss": 3.1820712089538574, "lr": 0.00015816941200959877, "tps": 31938, "wall": 39097.6} {"step": 19054, "train_loss": 3.3824214935302734, "lr": 0.00015815142009601972, "tps": 31935, "wall": 39103.1} {"step": 19055, "train_loss": 3.2716102600097656, "lr": 0.00015813342888306475, "tps": 31932, "wall": 39108.7} {"step": 19056, "train_loss": 3.2448084354400635, "lr": 0.0001581154383709376, "tps": 31930, "wall": 39114.2} {"step": 19057, "train_loss": 3.3082499504089355, "lr": 0.00015809744855984218, "tps": 31927, "wall": 39119.8} {"step": 19058, "train_loss": 3.184889793395996, "lr": 0.0001580794594499822, "tps": 31924, "wall": 39125.3} {"step": 19059, "train_loss": 3.1339595317840576, "lr": 0.00015806147104156136, "tps": 31921, "wall": 39130.8} {"step": 19060, "train_loss": 3.2960333824157715, "lr": 0.00015804348333478365, "tps": 31918, "wall": 39136.3} {"step": 19061, "train_loss": 3.250018358230591, "lr": 0.00015802549632985263, "tps": 31915, "wall": 39141.9} {"step": 19062, "train_loss": 3.2955007553100586, "lr": 0.00015800751002697217, "tps": 31913, "wall": 39147.4} {"step": 19063, "train_loss": 3.277435779571533, "lr": 0.00015798952442634603, "tps": 31910, "wall": 39153.0} {"step": 19064, "train_loss": 3.3174257278442383, "lr": 0.00015797153952817788, "tps": 31907, "wall": 39158.5} {"step": 19065, "train_loss": 3.17726731300354, "lr": 0.00015795355533267146, "tps": 31904, "wall": 39164.0} {"step": 19066, "train_loss": 3.3106327056884766, "lr": 0.0001579355718400305, "tps": 31901, "wall": 39169.5} {"step": 19067, "train_loss": 3.1995272636413574, "lr": 0.00015791758905045887, "tps": 31898, "wall": 39175.1} {"step": 19068, "train_loss": 3.332252025604248, "lr": 0.00015789960696416003, "tps": 31896, "wall": 39180.6} {"step": 19069, "train_loss": 3.2683444023132324, "lr": 0.00015788162558133783, "tps": 31893, "wall": 39186.1} {"step": 19070, "train_loss": 3.2252578735351562, "lr": 0.00015786364490219597, "tps": 31890, "wall": 39191.6} {"step": 19071, "train_loss": 3.17984938621521, "lr": 0.00015784566492693807, "tps": 31887, "wall": 39197.1} {"step": 19072, "train_loss": 3.4274802207946777, "lr": 0.00015782768565576784, "tps": 31884, "wall": 39202.6} {"step": 19073, "train_loss": 3.315756320953369, "lr": 0.00015780970708888893, "tps": 31881, "wall": 39208.2} {"step": 19074, "train_loss": 3.392282009124756, "lr": 0.00015779172922650506, "tps": 31879, "wall": 39213.7} {"step": 19075, "train_loss": 3.2932889461517334, "lr": 0.00015777375206881984, "tps": 31876, "wall": 39219.2} {"step": 19076, "train_loss": 3.2990517616271973, "lr": 0.00015775577561603693, "tps": 31873, "wall": 39224.8} {"step": 19077, "train_loss": 3.2523372173309326, "lr": 0.0001577377998683599, "tps": 31870, "wall": 39230.4} {"step": 19078, "train_loss": 3.2767624855041504, "lr": 0.0001577198248259925, "tps": 31867, "wall": 39235.9} {"step": 19079, "train_loss": 3.2249653339385986, "lr": 0.0001577018504891383, "tps": 31864, "wall": 39241.4} {"step": 19080, "train_loss": 3.3646974563598633, "lr": 0.0001576838768580009, "tps": 31862, "wall": 39247.0} {"step": 19081, "train_loss": 3.4423141479492188, "lr": 0.0001576659039327839, "tps": 31859, "wall": 39252.5} {"step": 19082, "train_loss": 3.275193929672241, "lr": 0.00015764793171369092, "tps": 31856, "wall": 39258.0} {"step": 19083, "train_loss": 3.3811638355255127, "lr": 0.00015762996020092556, "tps": 31853, "wall": 39263.5} {"step": 19084, "train_loss": 3.2374472618103027, "lr": 0.00015761198939469133, "tps": 31850, "wall": 39269.1} {"step": 19085, "train_loss": 3.305875301361084, "lr": 0.0001575940192951919, "tps": 31847, "wall": 39274.7} {"step": 19086, "train_loss": 3.348079204559326, "lr": 0.00015757604990263078, "tps": 31845, "wall": 39280.2} {"step": 19087, "train_loss": 3.313793897628784, "lr": 0.00015755808121721158, "tps": 31842, "wall": 39285.8} {"step": 19088, "train_loss": 3.3788352012634277, "lr": 0.00015754011323913778, "tps": 31839, "wall": 39291.3} {"step": 19089, "train_loss": 3.2271087169647217, "lr": 0.00015752214596861296, "tps": 31836, "wall": 39296.8} {"step": 19090, "train_loss": 3.274301528930664, "lr": 0.00015750417940584068, "tps": 31833, "wall": 39302.4} {"step": 19091, "train_loss": 3.273083209991455, "lr": 0.0001574862135510244, "tps": 31831, "wall": 39307.9} {"step": 19092, "train_loss": 3.3448359966278076, "lr": 0.00015746824840436765, "tps": 31828, "wall": 39313.4} {"step": 19093, "train_loss": 3.2193443775177, "lr": 0.000157450283966074, "tps": 31825, "wall": 39318.9} {"step": 19094, "train_loss": 3.3067846298217773, "lr": 0.00015743232023634693, "tps": 31822, "wall": 39324.4} {"step": 19095, "train_loss": 3.274873733520508, "lr": 0.00015741435721538993, "tps": 31819, "wall": 39329.9} {"step": 19096, "train_loss": 3.309372663497925, "lr": 0.00015739639490340644, "tps": 31817, "wall": 39335.5} {"step": 19097, "train_loss": 3.1590890884399414, "lr": 0.0001573784333006, "tps": 31814, "wall": 39341.0} {"step": 19098, "train_loss": 3.318789482116699, "lr": 0.00015736047240717403, "tps": 31811, "wall": 39346.6} {"step": 19099, "train_loss": 3.1925148963928223, "lr": 0.00015734251222333204, "tps": 31808, "wall": 39352.1} {"step": 19100, "train_loss": 3.2853000164031982, "lr": 0.00015732455274927745, "tps": 31805, "wall": 39357.7} {"step": 19101, "train_loss": 3.2757279872894287, "lr": 0.00015730659398521373, "tps": 31802, "wall": 39363.2} {"step": 19102, "train_loss": 3.2649381160736084, "lr": 0.00015728863593134432, "tps": 31800, "wall": 39368.8} {"step": 19103, "train_loss": 3.259089469909668, "lr": 0.0001572706785878726, "tps": 31797, "wall": 39374.3} {"step": 19104, "train_loss": 3.277730941772461, "lr": 0.00015725272195500205, "tps": 31794, "wall": 39379.8} {"step": 19105, "train_loss": 3.434211015701294, "lr": 0.00015723476603293608, "tps": 31791, "wall": 39385.3} {"step": 19106, "train_loss": 3.3239171504974365, "lr": 0.000157216810821878, "tps": 31788, "wall": 39390.9} {"step": 19107, "train_loss": 3.2888617515563965, "lr": 0.00015719885632203132, "tps": 31786, "wall": 39396.5} {"step": 19108, "train_loss": 3.3119094371795654, "lr": 0.00015718090253359943, "tps": 31783, "wall": 39402.0} {"step": 19109, "train_loss": 3.2869250774383545, "lr": 0.00015716294945678562, "tps": 31780, "wall": 39407.5} {"step": 19110, "train_loss": 3.247893810272217, "lr": 0.00015714499709179337, "tps": 31777, "wall": 39413.1} {"step": 19111, "train_loss": 3.333721876144409, "lr": 0.00015712704543882598, "tps": 31774, "wall": 39418.6} {"step": 19112, "train_loss": 3.276550769805908, "lr": 0.00015710909449808677, "tps": 31772, "wall": 39424.1} {"step": 19113, "train_loss": 3.2918953895568848, "lr": 0.00015709114426977916, "tps": 31769, "wall": 39429.6} {"step": 19114, "train_loss": 3.323925256729126, "lr": 0.00015707319475410656, "tps": 31766, "wall": 39435.1} {"step": 19115, "train_loss": 3.389309883117676, "lr": 0.0001570552459512721, "tps": 31763, "wall": 39440.7} {"step": 19116, "train_loss": 3.275747060775757, "lr": 0.00015703729786147928, "tps": 31761, "wall": 39446.2} {"step": 19117, "train_loss": 3.296902894973755, "lr": 0.00015701935048493138, "tps": 31758, "wall": 39451.8} {"step": 19118, "train_loss": 3.2785980701446533, "lr": 0.00015700140382183162, "tps": 31755, "wall": 39457.3} {"step": 19119, "train_loss": 3.2789885997772217, "lr": 0.00015698345787238334, "tps": 31752, "wall": 39462.8} {"step": 19120, "train_loss": 3.326702356338501, "lr": 0.00015696551263678988, "tps": 31749, "wall": 39468.3} {"step": 19121, "train_loss": 3.4005215167999268, "lr": 0.00015694756811525457, "tps": 31747, "wall": 39473.9} {"step": 19122, "train_loss": 3.2975003719329834, "lr": 0.00015692962430798063, "tps": 31744, "wall": 39479.5} {"step": 19123, "train_loss": 3.3142356872558594, "lr": 0.0001569116812151712, "tps": 31741, "wall": 39485.0} {"step": 19124, "train_loss": 3.238348960876465, "lr": 0.00015689373883702977, "tps": 31738, "wall": 39490.5} {"step": 19125, "train_loss": 3.3352584838867188, "lr": 0.0001568757971737594, "tps": 31735, "wall": 39496.0} {"step": 19126, "train_loss": 3.1421849727630615, "lr": 0.00015685785622556345, "tps": 31733, "wall": 39501.6} {"step": 19127, "train_loss": 3.267849922180176, "lr": 0.0001568399159926451, "tps": 31730, "wall": 39507.1} {"step": 19128, "train_loss": 3.256359100341797, "lr": 0.00015682197647520768, "tps": 31727, "wall": 39512.7} {"step": 19129, "train_loss": 3.298898696899414, "lr": 0.00015680403767345425, "tps": 31724, "wall": 39518.2} {"step": 19130, "train_loss": 3.338132381439209, "lr": 0.0001567860995875881, "tps": 31721, "wall": 39523.7} {"step": 19131, "train_loss": 3.314054012298584, "lr": 0.0001567681622178125, "tps": 31719, "wall": 39529.3} {"step": 19132, "train_loss": 3.2887980937957764, "lr": 0.00015675022556433058, "tps": 31716, "wall": 39534.8} {"step": 19133, "train_loss": 3.2756850719451904, "lr": 0.00015673228962734544, "tps": 31713, "wall": 39540.4} {"step": 19134, "train_loss": 3.307370185852051, "lr": 0.00015671435440706038, "tps": 31710, "wall": 39545.9} {"step": 19135, "train_loss": 3.329258441925049, "lr": 0.00015669641990367854, "tps": 31707, "wall": 39551.5} {"step": 19136, "train_loss": 3.3150811195373535, "lr": 0.0001566784861174031, "tps": 31705, "wall": 39557.1} {"step": 19137, "train_loss": 3.249953031539917, "lr": 0.00015666055304843716, "tps": 31702, "wall": 39562.7} {"step": 19138, "train_loss": 3.370518922805786, "lr": 0.00015664262069698393, "tps": 31699, "wall": 39568.3} {"step": 19139, "train_loss": 3.215883255004883, "lr": 0.00015662468906324652, "tps": 31696, "wall": 39573.9} {"step": 19140, "train_loss": 3.289255142211914, "lr": 0.00015660675814742805, "tps": 31693, "wall": 39579.4} {"step": 19141, "train_loss": 3.328583002090454, "lr": 0.00015658882794973165, "tps": 31691, "wall": 39584.9} {"step": 19142, "train_loss": 3.3648669719696045, "lr": 0.00015657089847036045, "tps": 31688, "wall": 39590.5} {"step": 19143, "train_loss": 3.3335022926330566, "lr": 0.00015655296970951756, "tps": 31685, "wall": 39595.9} {"step": 19144, "train_loss": 3.3612823486328125, "lr": 0.00015653504166740598, "tps": 31682, "wall": 39601.5} {"step": 19145, "train_loss": 3.1884920597076416, "lr": 0.00015651711434422894, "tps": 31680, "wall": 39607.0} {"step": 19146, "train_loss": 3.256930351257324, "lr": 0.0001564991877401895, "tps": 31677, "wall": 39612.5} {"step": 19147, "train_loss": 3.289824962615967, "lr": 0.00015648126185549064, "tps": 31674, "wall": 39618.0} {"step": 19148, "train_loss": 3.361264705657959, "lr": 0.0001564633366903355, "tps": 31671, "wall": 39623.6} {"step": 19149, "train_loss": 3.3318333625793457, "lr": 0.00015644541224492712, "tps": 31669, "wall": 39629.1} {"step": 19150, "train_loss": 3.2736897468566895, "lr": 0.00015642748851946853, "tps": 31666, "wall": 39634.7} {"step": 19151, "train_loss": 3.2999491691589355, "lr": 0.00015640956551416283, "tps": 31663, "wall": 39640.2} {"step": 19152, "train_loss": 3.2904624938964844, "lr": 0.00015639164322921295, "tps": 31660, "wall": 39645.8} {"step": 19153, "train_loss": 3.3231863975524902, "lr": 0.00015637372166482205, "tps": 31657, "wall": 39651.3} {"step": 19154, "train_loss": 3.281893730163574, "lr": 0.000156355800821193, "tps": 31655, "wall": 39656.8} {"step": 19155, "train_loss": 3.2943716049194336, "lr": 0.0001563378806985289, "tps": 31652, "wall": 39662.3} {"step": 19156, "train_loss": 3.2305805683135986, "lr": 0.00015631996129703278, "tps": 31649, "wall": 39667.8} {"step": 19157, "train_loss": 3.1634979248046875, "lr": 0.00015630204261690754, "tps": 31646, "wall": 39673.4} {"step": 19158, "train_loss": 3.3528521060943604, "lr": 0.00015628412465835623, "tps": 31644, "wall": 39678.9} {"step": 19159, "train_loss": 3.245387554168701, "lr": 0.0001562662074215818, "tps": 31641, "wall": 39684.4} {"step": 19160, "train_loss": 3.30136775970459, "lr": 0.00015624829090678718, "tps": 31638, "wall": 39689.9} {"step": 19161, "train_loss": 3.2983384132385254, "lr": 0.0001562303751141754, "tps": 31635, "wall": 39695.4} {"step": 19162, "train_loss": 3.2649171352386475, "lr": 0.00015621246004394942, "tps": 31633, "wall": 39700.9} {"step": 19163, "train_loss": 3.3367388248443604, "lr": 0.0001561945456963121, "tps": 31630, "wall": 39706.4} {"step": 19164, "train_loss": 3.3012967109680176, "lr": 0.00015617663207146643, "tps": 31627, "wall": 39711.9} {"step": 19165, "train_loss": 3.2458930015563965, "lr": 0.00015615871916961532, "tps": 31624, "wall": 39717.5} {"step": 19166, "train_loss": 3.237873077392578, "lr": 0.0001561408069909617, "tps": 31622, "wall": 39723.0} {"step": 19167, "train_loss": 3.2058205604553223, "lr": 0.0001561228955357085, "tps": 31619, "wall": 39728.4} {"step": 19168, "train_loss": 3.1934022903442383, "lr": 0.00015610498480405851, "tps": 31616, "wall": 39733.9} {"step": 19169, "train_loss": 3.2856736183166504, "lr": 0.00015608707479621473, "tps": 31614, "wall": 39739.4} {"step": 19170, "train_loss": 3.1836864948272705, "lr": 0.0001560691655123801, "tps": 31611, "wall": 39744.9} {"step": 19171, "train_loss": 3.2906432151794434, "lr": 0.00015605125695275737, "tps": 31608, "wall": 39750.3} {"step": 19172, "train_loss": 3.2163898944854736, "lr": 0.00015603334911754946, "tps": 31605, "wall": 39755.9} {"step": 19173, "train_loss": 3.264240026473999, "lr": 0.00015601544200695923, "tps": 31603, "wall": 39761.4} {"step": 19174, "train_loss": 3.3191614151000977, "lr": 0.00015599753562118952, "tps": 31600, "wall": 39766.8} {"step": 19175, "train_loss": 3.316237688064575, "lr": 0.00015597962996044323, "tps": 31597, "wall": 39772.3} {"step": 19176, "train_loss": 3.2731220722198486, "lr": 0.00015596172502492313, "tps": 31595, "wall": 39777.8} {"step": 19177, "train_loss": 3.245758056640625, "lr": 0.00015594382081483209, "tps": 31592, "wall": 39783.3} {"step": 19178, "train_loss": 3.272575616836548, "lr": 0.00015592591733037289, "tps": 31589, "wall": 39788.7} {"step": 19179, "train_loss": 3.2465755939483643, "lr": 0.00015590801457174836, "tps": 31586, "wall": 39794.2} {"step": 19180, "train_loss": 3.306239604949951, "lr": 0.00015589011253916137, "tps": 31584, "wall": 39799.7} {"step": 19181, "train_loss": 3.1889805793762207, "lr": 0.0001558722112328146, "tps": 31581, "wall": 39805.2} {"step": 19182, "train_loss": 3.2127814292907715, "lr": 0.0001558543106529109, "tps": 31578, "wall": 39810.7} {"step": 19183, "train_loss": 3.29893159866333, "lr": 0.00015583641079965305, "tps": 31576, "wall": 39816.2} {"step": 19184, "train_loss": 3.3676869869232178, "lr": 0.0001558185116732438, "tps": 31573, "wall": 39821.7} {"step": 19185, "train_loss": 3.3122711181640625, "lr": 0.00015580061327388588, "tps": 31570, "wall": 39827.1} {"step": 19186, "train_loss": 3.2350668907165527, "lr": 0.00015578271560178216, "tps": 31568, "wall": 39832.6} {"step": 19187, "train_loss": 3.3332481384277344, "lr": 0.0001557648186571353, "tps": 31565, "wall": 39838.1} {"step": 19188, "train_loss": 3.326456308364868, "lr": 0.00015574692244014798, "tps": 31562, "wall": 39843.5} {"step": 19189, "train_loss": 3.1628963947296143, "lr": 0.00015572902695102308, "tps": 31559, "wall": 39849.1} {"step": 19190, "train_loss": 3.3109989166259766, "lr": 0.00015571113218996319, "tps": 31557, "wall": 39854.6} {"step": 19191, "train_loss": 3.3767762184143066, "lr": 0.00015569323815717108, "tps": 31554, "wall": 39860.0} {"step": 19192, "train_loss": 3.330260992050171, "lr": 0.00015567534485284946, "tps": 31551, "wall": 39865.5} {"step": 19193, "train_loss": 3.3056933879852295, "lr": 0.00015565745227720106, "tps": 31549, "wall": 39871.0} {"step": 19194, "train_loss": 3.327162265777588, "lr": 0.00015563956043042842, "tps": 31546, "wall": 39876.5} {"step": 19195, "train_loss": 3.2930188179016113, "lr": 0.0001556216693127344, "tps": 31543, "wall": 39882.0} {"step": 19196, "train_loss": 3.2244391441345215, "lr": 0.0001556037789243215, "tps": 31541, "wall": 39887.5} {"step": 19197, "train_loss": 3.265977382659912, "lr": 0.00015558588926539263, "tps": 31538, "wall": 39892.9} {"step": 19198, "train_loss": 3.359527349472046, "lr": 0.00015556800033615016, "tps": 31535, "wall": 39898.4} {"step": 19199, "train_loss": 3.3213882446289062, "lr": 0.0001555501121367969, "tps": 31533, "wall": 39903.8} {"step": 19200, "train_loss": 3.3079938888549805, "lr": 0.00015553222466753547, "tps": 31530, "wall": 39909.3} {"step": 19201, "train_loss": 3.3131566047668457, "lr": 0.0001555143379285685, "tps": 31527, "wall": 39914.8} {"step": 19202, "train_loss": 3.282294273376465, "lr": 0.00015549645192009854, "tps": 31525, "wall": 39920.3} {"step": 19203, "train_loss": 3.353969097137451, "lr": 0.00015547856664232837, "tps": 31522, "wall": 39925.7} {"step": 19204, "train_loss": 3.3187143802642822, "lr": 0.00015546068209546041, "tps": 31519, "wall": 39931.2} {"step": 19205, "train_loss": 3.3449435234069824, "lr": 0.00015544279827969733, "tps": 31516, "wall": 39936.8} {"step": 19206, "train_loss": 3.260563373565674, "lr": 0.0001554249151952417, "tps": 31514, "wall": 39942.3} {"step": 19207, "train_loss": 3.324951648712158, "lr": 0.0001554070328422962, "tps": 31511, "wall": 39947.7} {"step": 19208, "train_loss": 3.2441468238830566, "lr": 0.00015538915122106329, "tps": 31508, "wall": 39953.2} {"step": 19209, "train_loss": 3.3578667640686035, "lr": 0.00015537127033174556, "tps": 31506, "wall": 39958.7} {"step": 19210, "train_loss": 3.3279216289520264, "lr": 0.0001553533901745456, "tps": 31503, "wall": 39964.2} {"step": 19211, "train_loss": 3.2379910945892334, "lr": 0.0001553355107496659, "tps": 31500, "wall": 39969.7} {"step": 19212, "train_loss": 3.2623095512390137, "lr": 0.00015531763205730906, "tps": 31498, "wall": 39975.2} {"step": 19213, "train_loss": 3.3852334022521973, "lr": 0.00015529975409767758, "tps": 31495, "wall": 39980.6} {"step": 19214, "train_loss": 3.2824959754943848, "lr": 0.00015528187687097403, "tps": 31492, "wall": 39986.1} {"step": 19215, "train_loss": 3.2673487663269043, "lr": 0.00015526400037740076, "tps": 31490, "wall": 39991.7} {"step": 19216, "train_loss": 3.3059051036834717, "lr": 0.0001552461246171605, "tps": 31487, "wall": 39997.2} {"step": 19217, "train_loss": 3.275714874267578, "lr": 0.0001552282495904556, "tps": 31484, "wall": 40002.7} {"step": 19218, "train_loss": 3.296567440032959, "lr": 0.0001552103752974886, "tps": 31481, "wall": 40008.2} {"step": 19219, "train_loss": 3.25217342376709, "lr": 0.000155192501738462, "tps": 31479, "wall": 40013.6} {"step": 19220, "train_loss": 3.337610960006714, "lr": 0.0001551746289135782, "tps": 31476, "wall": 40019.2} {"step": 19221, "train_loss": 3.2820115089416504, "lr": 0.00015515675682303975, "tps": 31473, "wall": 40024.7} {"step": 19222, "train_loss": 3.345453977584839, "lr": 0.00015513888546704903, "tps": 31471, "wall": 40030.2} {"step": 19223, "train_loss": 3.2930870056152344, "lr": 0.0001551210148458085, "tps": 31468, "wall": 40035.6} {"step": 19224, "train_loss": 3.2335264682769775, "lr": 0.00015510314495952073, "tps": 31465, "wall": 40041.1} {"step": 19225, "train_loss": 3.245060682296753, "lr": 0.00015508527580838797, "tps": 31463, "wall": 40046.6} {"step": 19226, "train_loss": 3.285071849822998, "lr": 0.00015506740739261275, "tps": 31460, "wall": 40052.2} {"step": 19227, "train_loss": 3.3360352516174316, "lr": 0.00015504953971239745, "tps": 31457, "wall": 40057.7} {"step": 19228, "train_loss": 3.24576735496521, "lr": 0.00015503167276794444, "tps": 31455, "wall": 40063.2} {"step": 19229, "train_loss": 3.360050678253174, "lr": 0.00015501380655945615, "tps": 31452, "wall": 40068.7} {"step": 19230, "train_loss": 3.3491077423095703, "lr": 0.00015499594108713503, "tps": 31449, "wall": 40074.2} {"step": 19231, "train_loss": 3.312839984893799, "lr": 0.00015497807635118336, "tps": 31447, "wall": 40079.7} {"step": 19232, "train_loss": 3.316079616546631, "lr": 0.00015496021235180362, "tps": 31444, "wall": 40085.2} {"step": 19233, "train_loss": 3.3510358333587646, "lr": 0.00015494234908919801, "tps": 31441, "wall": 40090.8} {"step": 19234, "train_loss": 3.2734978199005127, "lr": 0.0001549244865635691, "tps": 31439, "wall": 40096.2} {"step": 19235, "train_loss": 3.2318687438964844, "lr": 0.00015490662477511905, "tps": 31436, "wall": 40101.7} {"step": 19236, "train_loss": 3.2057011127471924, "lr": 0.00015488876372405028, "tps": 31433, "wall": 40107.2} {"step": 19237, "train_loss": 3.2524921894073486, "lr": 0.00015487090341056517, "tps": 31430, "wall": 40112.8} {"step": 19238, "train_loss": 3.3931102752685547, "lr": 0.00015485304383486596, "tps": 31428, "wall": 40118.3} {"step": 19239, "train_loss": 3.1811344623565674, "lr": 0.000154835184997155, "tps": 31425, "wall": 40123.8} {"step": 19240, "train_loss": 3.241189956665039, "lr": 0.0001548173268976346, "tps": 31422, "wall": 40129.2} {"step": 19241, "train_loss": 3.2412736415863037, "lr": 0.000154799469536507, "tps": 31420, "wall": 40134.7} {"step": 19242, "train_loss": 3.239086389541626, "lr": 0.00015478161291397453, "tps": 31417, "wall": 40140.2} {"step": 19243, "train_loss": 3.2244067192077637, "lr": 0.0001547637570302395, "tps": 31414, "wall": 40145.7} {"step": 19244, "train_loss": 3.3715007305145264, "lr": 0.0001547459018855042, "tps": 31412, "wall": 40151.1} {"step": 19245, "train_loss": 3.35166597366333, "lr": 0.00015472804747997083, "tps": 31409, "wall": 40156.6} {"step": 19246, "train_loss": 3.3079752922058105, "lr": 0.00015471019381384165, "tps": 31407, "wall": 40162.1} {"step": 19247, "train_loss": 3.3045594692230225, "lr": 0.00015469234088731897, "tps": 31404, "wall": 40167.5} {"step": 19248, "train_loss": 3.267380714416504, "lr": 0.00015467448870060496, "tps": 31401, "wall": 40173.1} {"step": 19249, "train_loss": 3.2398715019226074, "lr": 0.00015465663725390186, "tps": 31398, "wall": 40178.6} {"step": 19250, "train_loss": 3.293649196624756, "lr": 0.00015463878654741194, "tps": 31396, "wall": 40184.1} {"step": 19251, "train_loss": 3.319558620452881, "lr": 0.00015462093658133737, "tps": 31393, "wall": 40189.6} {"step": 19252, "train_loss": 3.277608871459961, "lr": 0.00015460308735588033, "tps": 31391, "wall": 40195.1} {"step": 19253, "train_loss": 3.335028886795044, "lr": 0.00015458523887124307, "tps": 31388, "wall": 40200.6} {"step": 19254, "train_loss": 3.2686710357666016, "lr": 0.0001545673911276278, "tps": 31385, "wall": 40206.1} {"step": 19255, "train_loss": 3.292576313018799, "lr": 0.00015454954412523665, "tps": 31383, "wall": 40211.6} {"step": 19256, "train_loss": 3.3482677936553955, "lr": 0.00015453169786427178, "tps": 31380, "wall": 40217.1} {"step": 19257, "train_loss": 3.3458306789398193, "lr": 0.00015451385234493544, "tps": 31377, "wall": 40222.6} {"step": 19258, "train_loss": 3.2884738445281982, "lr": 0.00015449600756742963, "tps": 31375, "wall": 40228.1} {"step": 19259, "train_loss": 3.2935383319854736, "lr": 0.00015447816353195663, "tps": 31372, "wall": 40233.7} {"step": 19260, "train_loss": 3.2086167335510254, "lr": 0.00015446032023871853, "tps": 31369, "wall": 40239.1} {"step": 19261, "train_loss": 3.2640490531921387, "lr": 0.0001544424776879175, "tps": 31367, "wall": 40244.6} {"step": 19262, "train_loss": 3.20025372505188, "lr": 0.00015442463587975565, "tps": 31364, "wall": 40250.1} {"step": 19263, "train_loss": 3.3209338188171387, "lr": 0.000154406794814435, "tps": 31361, "wall": 40255.5} {"step": 19264, "train_loss": 3.134740114212036, "lr": 0.00015438895449215777, "tps": 31359, "wall": 40261.0} {"step": 19265, "train_loss": 3.2842061519622803, "lr": 0.00015437111491312604, "tps": 31356, "wall": 40266.4} {"step": 19266, "train_loss": 3.3395066261291504, "lr": 0.00015435327607754177, "tps": 31353, "wall": 40271.9} {"step": 19267, "train_loss": 3.2325010299682617, "lr": 0.00015433543798560727, "tps": 31351, "wall": 40277.4} {"step": 19268, "train_loss": 3.27331805229187, "lr": 0.0001543176006375244, "tps": 31348, "wall": 40282.9} {"step": 19269, "train_loss": 3.297729969024658, "lr": 0.00015429976403349532, "tps": 31345, "wall": 40288.4} {"step": 19270, "train_loss": 3.285407543182373, "lr": 0.00015428192817372205, "tps": 31343, "wall": 40294.0} {"step": 19271, "train_loss": 3.3337349891662598, "lr": 0.00015426409305840667, "tps": 31340, "wall": 40299.4} {"step": 19272, "train_loss": 3.299520492553711, "lr": 0.0001542462586877512, "tps": 31337, "wall": 40305.0} {"step": 19273, "train_loss": 3.2366793155670166, "lr": 0.00015422842506195768, "tps": 31335, "wall": 40310.4} {"step": 19274, "train_loss": 3.3025362491607666, "lr": 0.0001542105921812281, "tps": 31332, "wall": 40316.0} {"step": 19275, "train_loss": 3.253617286682129, "lr": 0.00015419276004576452, "tps": 31330, "wall": 40321.4} {"step": 19276, "train_loss": 3.2918386459350586, "lr": 0.00015417492865576885, "tps": 31327, "wall": 40326.9} {"step": 19277, "train_loss": 3.2335009574890137, "lr": 0.0001541570980114432, "tps": 31324, "wall": 40332.4} {"step": 19278, "train_loss": 3.1939592361450195, "lr": 0.00015413926811298954, "tps": 31322, "wall": 40337.8} {"step": 19279, "train_loss": 3.307574510574341, "lr": 0.00015412143896060973, "tps": 31319, "wall": 40343.3} {"step": 19280, "train_loss": 3.3131022453308105, "lr": 0.00015410361055450585, "tps": 31316, "wall": 40348.8} {"step": 19281, "train_loss": 3.2920782566070557, "lr": 0.0001540857828948799, "tps": 31314, "wall": 40354.3} {"step": 19282, "train_loss": 3.3532028198242188, "lr": 0.0001540679559819337, "tps": 31311, "wall": 40359.8} {"step": 19283, "train_loss": 3.146125316619873, "lr": 0.0001540501298158693, "tps": 31309, "wall": 40365.2} {"step": 19284, "train_loss": 3.2881991863250732, "lr": 0.00015403230439688857, "tps": 31306, "wall": 40370.7} {"step": 19285, "train_loss": 3.2442619800567627, "lr": 0.00015401447972519344, "tps": 31303, "wall": 40376.2} {"step": 19286, "train_loss": 3.28310489654541, "lr": 0.0001539966558009859, "tps": 31301, "wall": 40381.7} {"step": 19287, "train_loss": 3.302700996398926, "lr": 0.0001539788326244678, "tps": 31298, "wall": 40387.2} {"step": 19288, "train_loss": 3.2620182037353516, "lr": 0.0001539610101958411, "tps": 31295, "wall": 40392.7} {"step": 19289, "train_loss": 3.15799617767334, "lr": 0.00015394318851530758, "tps": 31293, "wall": 40398.2} {"step": 19290, "train_loss": 3.216590642929077, "lr": 0.0001539253675830692, "tps": 31290, "wall": 40403.6} {"step": 19291, "train_loss": 3.2054967880249023, "lr": 0.00015390754739932785, "tps": 31287, "wall": 40409.1} {"step": 19292, "train_loss": 3.293755054473877, "lr": 0.00015388972796428539, "tps": 31285, "wall": 40414.7} {"step": 19293, "train_loss": 3.3031115531921387, "lr": 0.00015387190927814364, "tps": 31282, "wall": 40420.3} {"step": 19294, "train_loss": 3.232404947280884, "lr": 0.0001538540913411045, "tps": 31280, "wall": 40425.7} {"step": 19295, "train_loss": 3.2870521545410156, "lr": 0.0001538362741533698, "tps": 31277, "wall": 40431.2} {"step": 19296, "train_loss": 3.2455544471740723, "lr": 0.00015381845771514133, "tps": 31274, "wall": 40436.6} {"step": 19297, "train_loss": 3.273984909057617, "lr": 0.00015380064202662097, "tps": 31272, "wall": 40442.1} {"step": 19298, "train_loss": 3.339639186859131, "lr": 0.00015378282708801053, "tps": 31269, "wall": 40447.6} {"step": 19299, "train_loss": 3.3302009105682373, "lr": 0.0001537650128995118, "tps": 31266, "wall": 40453.1} {"step": 19300, "train_loss": 3.249879837036133, "lr": 0.00015374719946132656, "tps": 31264, "wall": 40458.5} {"step": 19301, "train_loss": 3.3176586627960205, "lr": 0.0001537293867736567, "tps": 31261, "wall": 40464.0} {"step": 19302, "train_loss": 3.1851093769073486, "lr": 0.0001537115748367039, "tps": 31259, "wall": 40469.5} {"step": 19303, "train_loss": 3.217674970626831, "lr": 0.00015369376365066998, "tps": 31256, "wall": 40475.0} {"step": 19304, "train_loss": 3.2614989280700684, "lr": 0.00015367595321575666, "tps": 31253, "wall": 40480.5} {"step": 19305, "train_loss": 3.24798583984375, "lr": 0.0001536581435321657, "tps": 31251, "wall": 40485.9} {"step": 19306, "train_loss": 3.162879228591919, "lr": 0.00015364033460009896, "tps": 31248, "wall": 40491.4} {"step": 19307, "train_loss": 3.228691339492798, "lr": 0.00015362252641975803, "tps": 31246, "wall": 40496.9} {"step": 19308, "train_loss": 3.331429958343506, "lr": 0.0001536047189913447, "tps": 31243, "wall": 40502.5} {"step": 19309, "train_loss": 3.3057026863098145, "lr": 0.00015358691231506078, "tps": 31240, "wall": 40507.9} {"step": 19310, "train_loss": 3.2596662044525146, "lr": 0.00015356910639110786, "tps": 31238, "wall": 40513.4} {"step": 19311, "train_loss": 3.1515612602233887, "lr": 0.00015355130121968774, "tps": 31235, "wall": 40518.9} {"step": 19312, "train_loss": 3.318681240081787, "lr": 0.000153533496801002, "tps": 31233, "wall": 40524.3} {"step": 19313, "train_loss": 3.151768922805786, "lr": 0.00015351569313525246, "tps": 31230, "wall": 40529.8} {"step": 19314, "train_loss": 3.1696557998657227, "lr": 0.00015349789022264072, "tps": 31227, "wall": 40535.4} {"step": 19315, "train_loss": 3.212691307067871, "lr": 0.00015348008806336847, "tps": 31225, "wall": 40540.8} {"step": 19316, "train_loss": 3.3899056911468506, "lr": 0.00015346228665763745, "tps": 31222, "wall": 40546.3} {"step": 19317, "train_loss": 3.2317190170288086, "lr": 0.0001534444860056492, "tps": 31219, "wall": 40551.8} {"step": 19318, "train_loss": 3.306708335876465, "lr": 0.00015342668610760537, "tps": 31217, "wall": 40557.3} {"step": 19319, "train_loss": 3.213970184326172, "lr": 0.00015340888696370773, "tps": 31214, "wall": 40562.8} {"step": 19320, "train_loss": 3.2606375217437744, "lr": 0.00015339108857415776, "tps": 31212, "wall": 40568.3} {"step": 19321, "train_loss": 3.288520097732544, "lr": 0.00015337329093915712, "tps": 31209, "wall": 40573.8} {"step": 19322, "train_loss": 3.2881360054016113, "lr": 0.00015335549405890748, "tps": 31206, "wall": 40579.3} {"step": 19323, "train_loss": 3.348921298980713, "lr": 0.00015333769793361043, "tps": 31204, "wall": 40584.8} {"step": 19324, "train_loss": 3.314725399017334, "lr": 0.0001533199025634675, "tps": 31201, "wall": 40590.2} {"step": 19325, "train_loss": 3.2932558059692383, "lr": 0.00015330210794868037, "tps": 31199, "wall": 40595.8} {"step": 19326, "train_loss": 3.3554131984710693, "lr": 0.00015328431408945053, "tps": 31196, "wall": 40601.3} {"step": 19327, "train_loss": 3.254103899002075, "lr": 0.0001532665209859796, "tps": 31193, "wall": 40606.8} {"step": 19328, "train_loss": 3.3128015995025635, "lr": 0.00015324872863846912, "tps": 31191, "wall": 40612.2} {"step": 19329, "train_loss": 3.206716299057007, "lr": 0.00015323093704712064, "tps": 31188, "wall": 40617.7} {"step": 19330, "train_loss": 3.228066921234131, "lr": 0.0001532131462121358, "tps": 31186, "wall": 40623.2} {"step": 19331, "train_loss": 3.2928626537323, "lr": 0.00015319535613371595, "tps": 31183, "wall": 40628.7} {"step": 19332, "train_loss": 3.2143313884735107, "lr": 0.00015317756681206275, "tps": 31180, "wall": 40634.2} {"step": 19333, "train_loss": 3.306760787963867, "lr": 0.00015315977824737774, "tps": 31178, "wall": 40639.6} {"step": 19334, "train_loss": 3.41326904296875, "lr": 0.00015314199043986232, "tps": 31175, "wall": 40645.1} {"step": 19335, "train_loss": 3.3405094146728516, "lr": 0.00015312420338971805, "tps": 31173, "wall": 40650.5} {"step": 19336, "train_loss": 3.3427934646606445, "lr": 0.00015310641709714647, "tps": 31170, "wall": 40656.1} {"step": 19337, "train_loss": 3.2808916568756104, "lr": 0.00015308863156234898, "tps": 31167, "wall": 40661.6} {"step": 19338, "train_loss": 3.353853225708008, "lr": 0.00015307084678552708, "tps": 31165, "wall": 40667.1} {"step": 19339, "train_loss": 3.2607693672180176, "lr": 0.00015305306276688224, "tps": 31162, "wall": 40672.6} {"step": 19340, "train_loss": 3.391017436981201, "lr": 0.00015303527950661603, "tps": 31160, "wall": 40678.1} {"step": 19341, "train_loss": 3.309129238128662, "lr": 0.0001530174970049297, "tps": 31157, "wall": 40683.6} {"step": 19342, "train_loss": 3.316345691680908, "lr": 0.00015299971526202478, "tps": 31154, "wall": 40689.1} {"step": 19343, "train_loss": 3.3223867416381836, "lr": 0.00015298193427810278, "tps": 31152, "wall": 40694.6} {"step": 19344, "train_loss": 3.1963658332824707, "lr": 0.00015296415405336502, "tps": 31149, "wall": 40700.1} {"step": 19345, "train_loss": 3.248049736022949, "lr": 0.00015294637458801292, "tps": 31147, "wall": 40705.6} {"step": 19346, "train_loss": 3.3110761642456055, "lr": 0.00015292859588224796, "tps": 31144, "wall": 40711.1} {"step": 19347, "train_loss": 3.4287986755371094, "lr": 0.00015291081793627145, "tps": 31141, "wall": 40716.6} {"step": 19348, "train_loss": 3.3667938709259033, "lr": 0.00015289304075028482, "tps": 31139, "wall": 40722.1} {"step": 19349, "train_loss": 3.300607919692993, "lr": 0.0001528752643244895, "tps": 31136, "wall": 40727.6} {"step": 19350, "train_loss": 3.2700448036193848, "lr": 0.00015285748865908683, "tps": 31134, "wall": 40733.1} {"step": 19351, "train_loss": 3.198819160461426, "lr": 0.00015283971375427808, "tps": 31131, "wall": 40738.6} {"step": 19352, "train_loss": 3.3297438621520996, "lr": 0.00015282193961026476, "tps": 31128, "wall": 40744.1} {"step": 19353, "train_loss": 3.3353123664855957, "lr": 0.00015280416622724815, "tps": 31126, "wall": 40749.6} {"step": 19354, "train_loss": 3.2071340084075928, "lr": 0.0001527863936054295, "tps": 31123, "wall": 40755.1} {"step": 19355, "train_loss": 3.292158603668213, "lr": 0.00015276862174501025, "tps": 31121, "wall": 40760.6} {"step": 19356, "train_loss": 3.3644676208496094, "lr": 0.0001527508506461917, "tps": 31118, "wall": 40766.0} {"step": 19357, "train_loss": 3.3213939666748047, "lr": 0.0001527330803091752, "tps": 31115, "wall": 40771.5} {"step": 19358, "train_loss": 3.319431781768799, "lr": 0.00015271531073416194, "tps": 31113, "wall": 40777.0} {"step": 19359, "train_loss": 3.2338461875915527, "lr": 0.0001526975419213533, "tps": 31110, "wall": 40782.5} {"step": 19360, "train_loss": 3.2597150802612305, "lr": 0.00015267977387095058, "tps": 31108, "wall": 40787.9} {"step": 19361, "train_loss": 3.1564083099365234, "lr": 0.000152662006583155, "tps": 31105, "wall": 40793.4} {"step": 19362, "train_loss": 3.3337326049804688, "lr": 0.00015264424005816785, "tps": 31103, "wall": 40798.9} {"step": 19363, "train_loss": 3.363290309906006, "lr": 0.0001526264742961904, "tps": 31100, "wall": 40804.4} {"step": 19364, "train_loss": 3.2489383220672607, "lr": 0.00015260870929742387, "tps": 31098, "wall": 40809.8} {"step": 19365, "train_loss": 3.274351119995117, "lr": 0.0001525909450620695, "tps": 31095, "wall": 40815.3} {"step": 19366, "train_loss": 3.2628908157348633, "lr": 0.00015257318159032858, "tps": 31092, "wall": 40820.8} {"step": 19367, "train_loss": 3.4742653369903564, "lr": 0.00015255541888240233, "tps": 31090, "wall": 40826.3} {"step": 19368, "train_loss": 3.394963026046753, "lr": 0.00015253765693849195, "tps": 31087, "wall": 40831.9} {"step": 19369, "train_loss": 3.318368434906006, "lr": 0.0001525198957587986, "tps": 31085, "wall": 40837.4} {"step": 19370, "train_loss": 3.2724609375, "lr": 0.00015250213534352355, "tps": 31082, "wall": 40842.9} {"step": 19371, "train_loss": 3.302043914794922, "lr": 0.00015248437569286794, "tps": 31079, "wall": 40848.4} {"step": 19372, "train_loss": 3.2850630283355713, "lr": 0.000152466616807033, "tps": 31077, "wall": 40853.9} {"step": 19373, "train_loss": 3.235370635986328, "lr": 0.0001524488586862199, "tps": 31074, "wall": 40859.4} {"step": 19374, "train_loss": 3.226166009902954, "lr": 0.00015243110133062975, "tps": 31072, "wall": 40864.9} {"step": 19375, "train_loss": 3.2309820652008057, "lr": 0.00015241334474046375, "tps": 31069, "wall": 40870.4} {"step": 19376, "train_loss": 3.3178861141204834, "lr": 0.000152395588915923, "tps": 31067, "wall": 40875.8} {"step": 19377, "train_loss": 3.3276913166046143, "lr": 0.00015237783385720874, "tps": 31064, "wall": 40881.3} {"step": 19378, "train_loss": 3.280856132507324, "lr": 0.000152360079564522, "tps": 31061, "wall": 40886.8} {"step": 19379, "train_loss": 3.2590010166168213, "lr": 0.0001523423260380639, "tps": 31059, "wall": 40892.4} {"step": 19380, "train_loss": 3.3035502433776855, "lr": 0.00015232457327803565, "tps": 31056, "wall": 40897.8} {"step": 19381, "train_loss": 3.2957634925842285, "lr": 0.00015230682128463828, "tps": 31054, "wall": 40903.3} {"step": 19382, "train_loss": 3.251070499420166, "lr": 0.0001522890700580729, "tps": 31051, "wall": 40908.8} {"step": 19383, "train_loss": 3.2490649223327637, "lr": 0.00015227131959854058, "tps": 31049, "wall": 40914.3} {"step": 19384, "train_loss": 3.3085532188415527, "lr": 0.00015225356990624243, "tps": 31046, "wall": 40919.7} {"step": 19385, "train_loss": 3.2684552669525146, "lr": 0.0001522358209813795, "tps": 31043, "wall": 40925.2} {"step": 19386, "train_loss": 3.2285284996032715, "lr": 0.00015221807282415285, "tps": 31041, "wall": 40930.7} {"step": 19387, "train_loss": 3.2754335403442383, "lr": 0.00015220032543476357, "tps": 31038, "wall": 40936.2} {"step": 19388, "train_loss": 3.2153120040893555, "lr": 0.00015218257881341267, "tps": 31036, "wall": 40941.7} {"step": 19389, "train_loss": 3.347874879837036, "lr": 0.00015216483296030115, "tps": 31033, "wall": 40947.2} {"step": 19390, "train_loss": 3.2462987899780273, "lr": 0.0001521470878756301, "tps": 31031, "wall": 40952.7} {"step": 19391, "train_loss": 3.246488094329834, "lr": 0.00015212934355960048, "tps": 31028, "wall": 40958.2} {"step": 19392, "train_loss": 3.277585029602051, "lr": 0.00015211160001241334, "tps": 31026, "wall": 40963.7} {"step": 19393, "train_loss": 3.3103432655334473, "lr": 0.00015209385723426966, "tps": 31023, "wall": 40969.1} {"step": 19394, "train_loss": 3.3266749382019043, "lr": 0.00015207611522537046, "tps": 31020, "wall": 40974.6} {"step": 19395, "train_loss": 3.301054000854492, "lr": 0.00015205837398591673, "tps": 31018, "wall": 40980.1} {"step": 19396, "train_loss": 3.293452739715576, "lr": 0.0001520406335161093, "tps": 31015, "wall": 40985.5} {"step": 19397, "train_loss": 3.217705249786377, "lr": 0.00015202289381614938, "tps": 31013, "wall": 40991.0} {"step": 19398, "train_loss": 3.2430708408355713, "lr": 0.00015200515488623774, "tps": 31010, "wall": 40996.5} {"step": 19399, "train_loss": 3.344778537750244, "lr": 0.0001519874167265754, "tps": 31008, "wall": 41001.9} {"step": 19400, "train_loss": 3.2791898250579834, "lr": 0.00015196967933736328, "tps": 31005, "wall": 41007.4} {"step": 19401, "train_loss": 3.2729332447052, "lr": 0.00015195194271880232, "tps": 31003, "wall": 41013.0} {"step": 19402, "train_loss": 3.2436978816986084, "lr": 0.0001519342068710934, "tps": 31000, "wall": 41018.5} {"step": 19403, "train_loss": 3.2745816707611084, "lr": 0.00015191647179443746, "tps": 30998, "wall": 41023.9} {"step": 19404, "train_loss": 3.218029260635376, "lr": 0.00015189873748903545, "tps": 30995, "wall": 41029.4} {"step": 19405, "train_loss": 3.295010805130005, "lr": 0.0001518810039550882, "tps": 30992, "wall": 41034.9} {"step": 19406, "train_loss": 3.343026638031006, "lr": 0.00015186327119279662, "tps": 30990, "wall": 41040.4} {"step": 19407, "train_loss": 3.303455352783203, "lr": 0.00015184553920236161, "tps": 30987, "wall": 41045.9} {"step": 19408, "train_loss": 3.319826602935791, "lr": 0.00015182780798398405, "tps": 30985, "wall": 41051.3} {"step": 19409, "train_loss": 3.235551595687866, "lr": 0.00015181007753786472, "tps": 30982, "wall": 41056.9} {"step": 19410, "train_loss": 3.314380168914795, "lr": 0.00015179234786420452, "tps": 30980, "wall": 41062.3} {"step": 19411, "train_loss": 3.2698497772216797, "lr": 0.00015177461896320434, "tps": 30977, "wall": 41067.8} {"step": 19412, "train_loss": 3.2448837757110596, "lr": 0.00015175689083506494, "tps": 30975, "wall": 41073.4} {"step": 19413, "train_loss": 3.30320143699646, "lr": 0.00015173916347998713, "tps": 30972, "wall": 41078.9} {"step": 19414, "train_loss": 3.3158297538757324, "lr": 0.0001517214368981718, "tps": 30969, "wall": 41084.4} {"step": 19415, "train_loss": 3.231013774871826, "lr": 0.00015170371108981975, "tps": 30967, "wall": 41089.9} {"step": 19416, "train_loss": 3.196329116821289, "lr": 0.00015168598605513176, "tps": 30964, "wall": 41095.4} {"step": 19417, "train_loss": 3.2470312118530273, "lr": 0.0001516682617943086, "tps": 30962, "wall": 41100.9} {"step": 19418, "train_loss": 3.2593274116516113, "lr": 0.00015165053830755104, "tps": 30959, "wall": 41106.4} {"step": 19419, "train_loss": 3.242290496826172, "lr": 0.00015163281559505987, "tps": 30957, "wall": 41111.9} {"step": 19420, "train_loss": 3.2895610332489014, "lr": 0.00015161509365703587, "tps": 30954, "wall": 41117.3} {"step": 19421, "train_loss": 3.36444354057312, "lr": 0.0001515973724936799, "tps": 30952, "wall": 41122.8} {"step": 19422, "train_loss": 3.1490652561187744, "lr": 0.00015157965210519248, "tps": 30949, "wall": 41128.3} {"step": 19423, "train_loss": 3.146388053894043, "lr": 0.00015156193249177445, "tps": 30947, "wall": 41133.9} {"step": 19424, "train_loss": 3.2700371742248535, "lr": 0.00015154421365362662, "tps": 30944, "wall": 41139.4} {"step": 19425, "train_loss": 3.3359758853912354, "lr": 0.00015152649559094963, "tps": 30941, "wall": 41144.9} {"step": 19426, "train_loss": 3.4030137062072754, "lr": 0.00015150877830394417, "tps": 30939, "wall": 41150.4} {"step": 19427, "train_loss": 3.375260829925537, "lr": 0.000151491061792811, "tps": 30936, "wall": 41155.8} {"step": 19428, "train_loss": 3.3223211765289307, "lr": 0.0001514733460577508, "tps": 30934, "wall": 41161.4} {"step": 19429, "train_loss": 3.356027364730835, "lr": 0.00015145563109896418, "tps": 30931, "wall": 41166.8} {"step": 19430, "train_loss": 3.3023464679718018, "lr": 0.0001514379169166519, "tps": 30929, "wall": 41172.3} {"step": 19431, "train_loss": 3.2611989974975586, "lr": 0.00015142020351101464, "tps": 30926, "wall": 41177.8} {"step": 19432, "train_loss": 3.325857162475586, "lr": 0.00015140249088225303, "tps": 30924, "wall": 41183.3} {"step": 19433, "train_loss": 3.311455488204956, "lr": 0.00015138477903056766, "tps": 30921, "wall": 41188.7} {"step": 19434, "train_loss": 3.3680949211120605, "lr": 0.00015136706795615927, "tps": 30919, "wall": 41194.3} {"step": 19435, "train_loss": 3.2373905181884766, "lr": 0.00015134935765922846, "tps": 30916, "wall": 41199.8} {"step": 19436, "train_loss": 3.344386577606201, "lr": 0.0001513316481399758, "tps": 30914, "wall": 41205.3} {"step": 19437, "train_loss": 3.428748846054077, "lr": 0.00015131393939860194, "tps": 30911, "wall": 41210.8} {"step": 19438, "train_loss": 3.2443292140960693, "lr": 0.00015129623143530756, "tps": 30908, "wall": 41216.3} {"step": 19439, "train_loss": 3.39154052734375, "lr": 0.00015127852425029313, "tps": 30906, "wall": 41221.8} {"step": 19440, "train_loss": 3.377790927886963, "lr": 0.0001512608178437593, "tps": 30903, "wall": 41227.2} {"step": 19441, "train_loss": 3.1876015663146973, "lr": 0.00015124311221590667, "tps": 30901, "wall": 41232.7} {"step": 19442, "train_loss": 3.286966323852539, "lr": 0.00015122540736693573, "tps": 30898, "wall": 41238.3} {"step": 19443, "train_loss": 3.3065738677978516, "lr": 0.00015120770329704714, "tps": 30896, "wall": 41243.8} {"step": 19444, "train_loss": 3.2993905544281006, "lr": 0.0001511900000064414, "tps": 30893, "wall": 41249.2} {"step": 19445, "train_loss": 3.3515987396240234, "lr": 0.00015117229749531905, "tps": 30891, "wall": 41254.8} {"step": 19446, "train_loss": 3.3916101455688477, "lr": 0.00015115459576388064, "tps": 30888, "wall": 41260.3} {"step": 19447, "train_loss": 3.363297939300537, "lr": 0.0001511368948123267, "tps": 30886, "wall": 41265.8} {"step": 19448, "train_loss": 3.3132591247558594, "lr": 0.00015111919464085775, "tps": 30883, "wall": 41271.3} {"step": 19449, "train_loss": 3.3006088733673096, "lr": 0.00015110149524967428, "tps": 30881, "wall": 41276.8} {"step": 19450, "train_loss": 3.314162254333496, "lr": 0.00015108379663897678, "tps": 30878, "wall": 41282.3} {"step": 19451, "train_loss": 3.3154215812683105, "lr": 0.00015106609880896583, "tps": 30876, "wall": 41287.8} {"step": 19452, "train_loss": 3.2925186157226562, "lr": 0.0001510484017598418, "tps": 30873, "wall": 41293.3} {"step": 19453, "train_loss": 3.1790859699249268, "lr": 0.00015103070549180516, "tps": 30871, "wall": 41298.7} {"step": 19454, "train_loss": 3.1914265155792236, "lr": 0.0001510130100050565, "tps": 30868, "wall": 41304.3} {"step": 19455, "train_loss": 3.197751998901367, "lr": 0.00015099531529979613, "tps": 30866, "wall": 41309.8} {"step": 19456, "train_loss": 3.2490406036376953, "lr": 0.00015097762137622456, "tps": 30863, "wall": 41315.3} {"step": 19457, "train_loss": 3.119410991668701, "lr": 0.00015095992823454228, "tps": 30860, "wall": 41320.8} {"step": 19458, "train_loss": 3.1709954738616943, "lr": 0.00015094223587494966, "tps": 30858, "wall": 41326.3} {"step": 19459, "train_loss": 3.211256504058838, "lr": 0.00015092454429764705, "tps": 30855, "wall": 41331.9} {"step": 19460, "train_loss": 3.2400267124176025, "lr": 0.00015090685350283503, "tps": 30853, "wall": 41337.3} {"step": 19461, "train_loss": 3.3540639877319336, "lr": 0.0001508891634907139, "tps": 30850, "wall": 41342.8} {"step": 19462, "train_loss": 3.3234758377075195, "lr": 0.00015087147426148402, "tps": 30848, "wall": 41348.3} {"step": 19463, "train_loss": 3.3476107120513916, "lr": 0.00015085378581534587, "tps": 30845, "wall": 41353.9} {"step": 19464, "train_loss": 3.3065268993377686, "lr": 0.0001508360981524997, "tps": 30843, "wall": 41359.4} {"step": 19465, "train_loss": 3.3036608695983887, "lr": 0.000150818411273146, "tps": 30840, "wall": 41365.0} {"step": 19466, "train_loss": 3.2085201740264893, "lr": 0.0001508007251774851, "tps": 30838, "wall": 41370.6} {"step": 19467, "train_loss": 3.2972240447998047, "lr": 0.0001507830398657173, "tps": 30835, "wall": 41376.2} {"step": 19468, "train_loss": 3.2671499252319336, "lr": 0.000150765355338043, "tps": 30832, "wall": 41381.7} {"step": 19469, "train_loss": 3.247130870819092, "lr": 0.00015074767159466246, "tps": 30830, "wall": 41387.2} {"step": 19470, "train_loss": 3.36484956741333, "lr": 0.0001507299886357761, "tps": 30827, "wall": 41392.7} {"step": 19471, "train_loss": 3.270048141479492, "lr": 0.00015071230646158417, "tps": 30825, "wall": 41398.1} {"step": 19472, "train_loss": 3.3797202110290527, "lr": 0.00015069462507228694, "tps": 30822, "wall": 41403.6} {"step": 19473, "train_loss": 3.237886428833008, "lr": 0.00015067694446808475, "tps": 30820, "wall": 41409.1} {"step": 19474, "train_loss": 3.2440762519836426, "lr": 0.00015065926464917788, "tps": 30817, "wall": 41414.6} {"step": 19475, "train_loss": 3.2419774532318115, "lr": 0.00015064158561576662, "tps": 30815, "wall": 41420.1} {"step": 19476, "train_loss": 3.387967586517334, "lr": 0.00015062390736805123, "tps": 30812, "wall": 41425.6} {"step": 19477, "train_loss": 3.3709702491760254, "lr": 0.00015060622990623198, "tps": 30810, "wall": 41431.0} {"step": 19478, "train_loss": 3.2676079273223877, "lr": 0.0001505885532305091, "tps": 30807, "wall": 41436.7} {"step": 19479, "train_loss": 3.182772159576416, "lr": 0.00015057087734108286, "tps": 30805, "wall": 41442.1} {"step": 19480, "train_loss": 3.286428213119507, "lr": 0.00015055320223815346, "tps": 30802, "wall": 41447.6} {"step": 19481, "train_loss": 3.2896969318389893, "lr": 0.0001505355279219211, "tps": 30800, "wall": 41453.2} {"step": 19482, "train_loss": 3.2666122913360596, "lr": 0.00015051785439258608, "tps": 30797, "wall": 41458.6} {"step": 19483, "train_loss": 3.1749658584594727, "lr": 0.00015050018165034862, "tps": 30795, "wall": 41464.2} {"step": 19484, "train_loss": 3.220731735229492, "lr": 0.00015048250969540878, "tps": 30792, "wall": 41469.6} {"step": 19485, "train_loss": 3.2212016582489014, "lr": 0.00015046483852796687, "tps": 30790, "wall": 41475.2} {"step": 19486, "train_loss": 3.19962215423584, "lr": 0.00015044716814822305, "tps": 30787, "wall": 41480.6} {"step": 19487, "train_loss": 3.3434882164001465, "lr": 0.0001504294985563774, "tps": 30785, "wall": 41486.1} {"step": 19488, "train_loss": 3.297008514404297, "lr": 0.0001504118297526302, "tps": 30782, "wall": 41491.5} {"step": 19489, "train_loss": 3.2008306980133057, "lr": 0.00015039416173718157, "tps": 30780, "wall": 41497.1} {"step": 19490, "train_loss": 3.336630344390869, "lr": 0.00015037649451023164, "tps": 30777, "wall": 41502.6} {"step": 19491, "train_loss": 3.314985513687134, "lr": 0.0001503588280719805, "tps": 30775, "wall": 41508.1} {"step": 19492, "train_loss": 3.3089375495910645, "lr": 0.00015034116242262834, "tps": 30772, "wall": 41513.6} {"step": 19493, "train_loss": 3.3283987045288086, "lr": 0.00015032349756237534, "tps": 30770, "wall": 41519.1} {"step": 19494, "train_loss": 3.3072078227996826, "lr": 0.00015030583349142144, "tps": 30767, "wall": 41524.5} {"step": 19495, "train_loss": 3.2448782920837402, "lr": 0.00015028817020996686, "tps": 30765, "wall": 41530.0} {"step": 19496, "train_loss": 3.2972655296325684, "lr": 0.00015027050771821164, "tps": 30762, "wall": 41535.5} {"step": 19497, "train_loss": 3.212987184524536, "lr": 0.00015025284601635593, "tps": 30760, "wall": 41541.0} {"step": 19498, "train_loss": 3.262439250946045, "lr": 0.00015023518510459967, "tps": 30757, "wall": 41546.5} {"step": 19499, "train_loss": 3.2380361557006836, "lr": 0.00015021752498314305, "tps": 30755, "wall": 41552.1} {"step": 19500, "train_loss": 3.2940759658813477, "lr": 0.00015019986565218614, "tps": 30752, "wall": 41557.6} {"step": 19501, "train_loss": 3.332580804824829, "lr": 0.00015018220711192885, "tps": 30750, "wall": 41563.2} {"step": 19502, "train_loss": 3.2329623699188232, "lr": 0.00015016454936257132, "tps": 30747, "wall": 41568.7} {"step": 19503, "train_loss": 3.335236072540283, "lr": 0.00015014689240431354, "tps": 30745, "wall": 41574.2} {"step": 19504, "train_loss": 3.2871100902557373, "lr": 0.0001501292362373556, "tps": 30742, "wall": 41579.6} {"step": 19505, "train_loss": 3.301130771636963, "lr": 0.00015011158086189737, "tps": 30740, "wall": 41585.2} {"step": 19506, "train_loss": 3.1701860427856445, "lr": 0.00015009392627813898, "tps": 30737, "wall": 41590.7} {"step": 19507, "train_loss": 3.2337779998779297, "lr": 0.0001500762724862804, "tps": 30735, "wall": 41596.3} {"step": 19508, "train_loss": 3.285865545272827, "lr": 0.00015005861948652155, "tps": 30732, "wall": 41601.8} {"step": 19509, "train_loss": 3.3224518299102783, "lr": 0.0001500409672790624, "tps": 30730, "wall": 41607.3} {"step": 19510, "train_loss": 3.2673282623291016, "lr": 0.00015002331586410304, "tps": 30727, "wall": 41612.8} {"step": 19511, "train_loss": 3.2424983978271484, "lr": 0.00015000566524184326, "tps": 30725, "wall": 41618.3} {"step": 19512, "train_loss": 3.223768711090088, "lr": 0.00014998801541248318, "tps": 30722, "wall": 41623.8} {"step": 19513, "train_loss": 3.2611031532287598, "lr": 0.0001499703663762226, "tps": 30720, "wall": 41629.3} {"step": 19514, "train_loss": 3.2087559700012207, "lr": 0.00014995271813326148, "tps": 30717, "wall": 41634.8} {"step": 19515, "train_loss": 3.3237996101379395, "lr": 0.00014993507068379976, "tps": 30715, "wall": 41640.2} {"step": 19516, "train_loss": 3.379551649093628, "lr": 0.00014991742402803738, "tps": 30713, "wall": 41645.8} {"step": 19517, "train_loss": 3.2589645385742188, "lr": 0.0001498997781661742, "tps": 30710, "wall": 41651.3} {"step": 19518, "train_loss": 3.282656669616699, "lr": 0.00014988213309841014, "tps": 30708, "wall": 41656.8} {"step": 19519, "train_loss": 3.336493968963623, "lr": 0.00014986448882494505, "tps": 30705, "wall": 41662.3} {"step": 19520, "train_loss": 3.0856752395629883, "lr": 0.00014984684534597887, "tps": 30703, "wall": 41667.7} {"step": 19521, "train_loss": 3.2758917808532715, "lr": 0.00014982920266171137, "tps": 30700, "wall": 41673.3} {"step": 19522, "train_loss": 3.3260629177093506, "lr": 0.00014981156077234248, "tps": 30698, "wall": 41678.8} {"step": 19523, "train_loss": 3.2043046951293945, "lr": 0.00014979391967807204, "tps": 30695, "wall": 41684.2} {"step": 19524, "train_loss": 3.172360420227051, "lr": 0.00014977627937909986, "tps": 30693, "wall": 41689.7} {"step": 19525, "train_loss": 3.3065128326416016, "lr": 0.00014975863987562576, "tps": 30690, "wall": 41695.2} {"step": 19526, "train_loss": 3.3060824871063232, "lr": 0.0001497410011678496, "tps": 30688, "wall": 41700.7} {"step": 19527, "train_loss": 3.2976839542388916, "lr": 0.0001497233632559712, "tps": 30685, "wall": 41706.2} {"step": 19528, "train_loss": 3.2435436248779297, "lr": 0.00014970572614019033, "tps": 30683, "wall": 41711.6} {"step": 19529, "train_loss": 3.3140084743499756, "lr": 0.0001496880898207068, "tps": 30680, "wall": 41717.2} {"step": 19530, "train_loss": 3.2668962478637695, "lr": 0.0001496704542977204, "tps": 30678, "wall": 41722.7} {"step": 19531, "train_loss": 3.303755760192871, "lr": 0.00014965281957143089, "tps": 30675, "wall": 41728.1} {"step": 19532, "train_loss": 3.3230791091918945, "lr": 0.00014963518564203802, "tps": 30673, "wall": 41733.8} {"step": 19533, "train_loss": 3.2662353515625, "lr": 0.00014961755250974163, "tps": 30670, "wall": 41739.2} {"step": 19534, "train_loss": 3.3474135398864746, "lr": 0.00014959992017474138, "tps": 30668, "wall": 41744.7} {"step": 19535, "train_loss": 3.1755716800689697, "lr": 0.00014958228863723701, "tps": 30666, "wall": 41750.1} {"step": 19536, "train_loss": 3.2179770469665527, "lr": 0.00014956465789742836, "tps": 30663, "wall": 41755.6} {"step": 19537, "train_loss": 3.298224687576294, "lr": 0.00014954702795551503, "tps": 30661, "wall": 41761.2} {"step": 19538, "train_loss": 3.217893362045288, "lr": 0.00014952939881169677, "tps": 30658, "wall": 41766.7} {"step": 19539, "train_loss": 3.223154067993164, "lr": 0.0001495117704661733, "tps": 30656, "wall": 41772.2} {"step": 19540, "train_loss": 3.218649387359619, "lr": 0.00014949414291914436, "tps": 30653, "wall": 41777.6} {"step": 19541, "train_loss": 3.2137980461120605, "lr": 0.00014947651617080952, "tps": 30651, "wall": 41783.1} {"step": 19542, "train_loss": 3.2398204803466797, "lr": 0.0001494588902213685, "tps": 30648, "wall": 41788.6} {"step": 19543, "train_loss": 3.3340187072753906, "lr": 0.00014944126507102104, "tps": 30646, "wall": 41794.2} {"step": 19544, "train_loss": 3.221714496612549, "lr": 0.00014942364071996673, "tps": 30643, "wall": 41799.6} {"step": 19545, "train_loss": 3.224534273147583, "lr": 0.00014940601716840522, "tps": 30641, "wall": 41805.2} {"step": 19546, "train_loss": 3.350226879119873, "lr": 0.0001493883944165362, "tps": 30638, "wall": 41810.7} {"step": 19547, "train_loss": 3.2855913639068604, "lr": 0.00014937077246455927, "tps": 30636, "wall": 41816.1} {"step": 19548, "train_loss": 3.2205193042755127, "lr": 0.00014935315131267402, "tps": 30633, "wall": 41821.6} {"step": 19549, "train_loss": 3.261655330657959, "lr": 0.0001493355309610801, "tps": 30631, "wall": 41827.1} {"step": 19550, "train_loss": 3.2120165824890137, "lr": 0.00014931791140997716, "tps": 30629, "wall": 41832.6} {"step": 19551, "train_loss": 3.3737094402313232, "lr": 0.00014930029265956466, "tps": 30626, "wall": 41838.0} {"step": 19552, "train_loss": 3.2441205978393555, "lr": 0.0001492826747100423, "tps": 30624, "wall": 41843.5} {"step": 19553, "train_loss": 3.3380398750305176, "lr": 0.0001492650575616096, "tps": 30621, "wall": 41849.0} {"step": 19554, "train_loss": 3.2786026000976562, "lr": 0.00014924744121446625, "tps": 30619, "wall": 41854.5} {"step": 19555, "train_loss": 3.185913562774658, "lr": 0.0001492298256688116, "tps": 30616, "wall": 41860.0} {"step": 19556, "train_loss": 3.2134766578674316, "lr": 0.00014921221092484537, "tps": 30614, "wall": 41865.5} {"step": 19557, "train_loss": 3.1990556716918945, "lr": 0.0001491945969827671, "tps": 30611, "wall": 41871.0} {"step": 19558, "train_loss": 3.2391741275787354, "lr": 0.0001491769838427762, "tps": 30609, "wall": 41876.4} {"step": 19559, "train_loss": 3.234529495239258, "lr": 0.00014915937150507223, "tps": 30607, "wall": 41881.9} {"step": 19560, "train_loss": 3.2740957736968994, "lr": 0.0001491417599698548, "tps": 30604, "wall": 41887.4} {"step": 19561, "train_loss": 3.1892597675323486, "lr": 0.0001491241492373233, "tps": 30602, "wall": 41892.9} {"step": 19562, "train_loss": 3.277804136276245, "lr": 0.0001491065393076773, "tps": 30599, "wall": 41898.4} {"step": 19563, "train_loss": 3.243875026702881, "lr": 0.0001490889301811162, "tps": 30597, "wall": 41903.8} {"step": 19564, "train_loss": 3.220797300338745, "lr": 0.00014907132185783958, "tps": 30594, "wall": 41909.3} {"step": 19565, "train_loss": 3.2967047691345215, "lr": 0.00014905371433804687, "tps": 30592, "wall": 41914.9} {"step": 19566, "train_loss": 3.252764940261841, "lr": 0.0001490361076219375, "tps": 30589, "wall": 41920.4} {"step": 19567, "train_loss": 3.0769190788269043, "lr": 0.000149018501709711, "tps": 30587, "wall": 41925.9} {"step": 19568, "train_loss": 3.2859809398651123, "lr": 0.00014900089660156672, "tps": 30585, "wall": 41931.3} {"step": 19569, "train_loss": 3.3074817657470703, "lr": 0.0001489832922977041, "tps": 30582, "wall": 41936.8} {"step": 19570, "train_loss": 3.2740588188171387, "lr": 0.00014896568879832253, "tps": 30580, "wall": 41942.3} {"step": 19571, "train_loss": 3.3070108890533447, "lr": 0.0001489480861036216, "tps": 30577, "wall": 41947.8} {"step": 19572, "train_loss": 3.1922764778137207, "lr": 0.00014893048421380054, "tps": 30575, "wall": 41953.2} {"step": 19573, "train_loss": 3.1709489822387695, "lr": 0.00014891288312905875, "tps": 30572, "wall": 41958.7} {"step": 19574, "train_loss": 3.2436070442199707, "lr": 0.00014889528284959579, "tps": 30570, "wall": 41964.2} {"step": 19575, "train_loss": 3.188694477081299, "lr": 0.00014887768337561082, "tps": 30568, "wall": 41969.7} {"step": 19576, "train_loss": 3.2744479179382324, "lr": 0.0001488600847073033, "tps": 30565, "wall": 41975.3} {"step": 19577, "train_loss": 3.2868847846984863, "lr": 0.00014884248684487265, "tps": 30563, "wall": 41980.9} {"step": 19578, "train_loss": 3.3015336990356445, "lr": 0.0001488248897885181, "tps": 30560, "wall": 41986.3} {"step": 19579, "train_loss": 3.241790533065796, "lr": 0.00014880729353843907, "tps": 30558, "wall": 41991.8} {"step": 19580, "train_loss": 3.2935619354248047, "lr": 0.00014878969809483484, "tps": 30555, "wall": 41997.3} {"step": 19581, "train_loss": 3.2945549488067627, "lr": 0.00014877210345790482, "tps": 30553, "wall": 42002.8} {"step": 19582, "train_loss": 3.3304409980773926, "lr": 0.00014875450962784824, "tps": 30550, "wall": 42008.2} {"step": 19583, "train_loss": 3.2710812091827393, "lr": 0.0001487369166048644, "tps": 30548, "wall": 42013.7} {"step": 19584, "train_loss": 3.2372632026672363, "lr": 0.0001487193243891527, "tps": 30546, "wall": 42019.2} {"step": 19585, "train_loss": 3.1647355556488037, "lr": 0.00014870173298091226, "tps": 30543, "wall": 42024.7} {"step": 19586, "train_loss": 3.272887945175171, "lr": 0.00014868414238034246, "tps": 30541, "wall": 42030.2} {"step": 19587, "train_loss": 3.1668038368225098, "lr": 0.00014866655258764263, "tps": 30538, "wall": 42035.7} {"step": 19588, "train_loss": 3.304546356201172, "lr": 0.0001486489636030119, "tps": 30536, "wall": 42041.2} {"step": 19589, "train_loss": 3.199666976928711, "lr": 0.00014863137542664955, "tps": 30533, "wall": 42046.7} {"step": 19590, "train_loss": 3.2658421993255615, "lr": 0.00014861378805875486, "tps": 30531, "wall": 42052.2} {"step": 19591, "train_loss": 3.3333301544189453, "lr": 0.00014859620149952702, "tps": 30529, "wall": 42057.6} {"step": 19592, "train_loss": 3.2137951850891113, "lr": 0.00014857861574916532, "tps": 30526, "wall": 42063.1} {"step": 19593, "train_loss": 3.2323906421661377, "lr": 0.00014856103080786889, "tps": 30524, "wall": 42068.6} {"step": 19594, "train_loss": 3.4205334186553955, "lr": 0.000148543446675837, "tps": 30521, "wall": 42074.1} {"step": 19595, "train_loss": 3.2122955322265625, "lr": 0.00014852586335326878, "tps": 30519, "wall": 42079.6} {"step": 19596, "train_loss": 3.259521245956421, "lr": 0.00014850828084036347, "tps": 30516, "wall": 42085.1} {"step": 19597, "train_loss": 3.251445770263672, "lr": 0.00014849069913732015, "tps": 30514, "wall": 42090.6} {"step": 19598, "train_loss": 3.2922534942626953, "lr": 0.00014847311824433814, "tps": 30512, "wall": 42096.2} {"step": 19599, "train_loss": 3.242374897003174, "lr": 0.00014845553816161648, "tps": 30509, "wall": 42101.7} {"step": 19600, "train_loss": 3.3168230056762695, "lr": 0.00014843795888935438, "tps": 30507, "wall": 42107.1} {"step": 19601, "train_loss": 3.302354335784912, "lr": 0.00014842038042775095, "tps": 30504, "wall": 42112.6} {"step": 19602, "train_loss": 3.224797248840332, "lr": 0.00014840280277700528, "tps": 30502, "wall": 42118.1} {"step": 19603, "train_loss": 3.163759231567383, "lr": 0.00014838522593731658, "tps": 30499, "wall": 42123.6} {"step": 19604, "train_loss": 3.2986552715301514, "lr": 0.00014836764990888392, "tps": 30497, "wall": 42129.1} {"step": 19605, "train_loss": 3.2292044162750244, "lr": 0.0001483500746919064, "tps": 30495, "wall": 42134.5} {"step": 19606, "train_loss": 3.1946966648101807, "lr": 0.00014833250028658306, "tps": 30492, "wall": 42140.0} {"step": 19607, "train_loss": 3.266845226287842, "lr": 0.000148314926693113, "tps": 30490, "wall": 42145.5} {"step": 19608, "train_loss": 3.2944016456604004, "lr": 0.00014829735391169545, "tps": 30487, "wall": 42151.0} {"step": 19609, "train_loss": 3.3794164657592773, "lr": 0.00014827978194252928, "tps": 30485, "wall": 42156.6} {"step": 19610, "train_loss": 3.2027676105499268, "lr": 0.00014826221078581363, "tps": 30483, "wall": 42162.0} {"step": 19611, "train_loss": 3.3528268337249756, "lr": 0.00014824464044174755, "tps": 30480, "wall": 42167.5} {"step": 19612, "train_loss": 3.3370275497436523, "lr": 0.00014822707091053004, "tps": 30478, "wall": 42172.9} {"step": 19613, "train_loss": 3.2537643909454346, "lr": 0.00014820950219236018, "tps": 30475, "wall": 42178.5} {"step": 19614, "train_loss": 3.262540817260742, "lr": 0.00014819193428743698, "tps": 30473, "wall": 42184.0} {"step": 19615, "train_loss": 3.3514561653137207, "lr": 0.00014817436719595937, "tps": 30470, "wall": 42189.5} {"step": 19616, "train_loss": 3.257861614227295, "lr": 0.00014815680091812645, "tps": 30468, "wall": 42195.0} {"step": 19617, "train_loss": 3.2273788452148438, "lr": 0.00014813923545413716, "tps": 30466, "wall": 42200.5} {"step": 19618, "train_loss": 3.2642016410827637, "lr": 0.00014812167080419054, "tps": 30463, "wall": 42206.0} {"step": 19619, "train_loss": 3.301724433898926, "lr": 0.0001481041069684855, "tps": 30461, "wall": 42211.4} {"step": 19620, "train_loss": 3.244076728820801, "lr": 0.000148086543947221, "tps": 30458, "wall": 42217.0} {"step": 19621, "train_loss": 3.256540298461914, "lr": 0.00014806898174059608, "tps": 30456, "wall": 42222.4} {"step": 19622, "train_loss": 3.243992328643799, "lr": 0.00014805142034880956, "tps": 30454, "wall": 42228.0} {"step": 19623, "train_loss": 3.1773428916931152, "lr": 0.00014803385977206048, "tps": 30451, "wall": 42233.5} {"step": 19624, "train_loss": 3.303575038909912, "lr": 0.0001480163000105477, "tps": 30449, "wall": 42239.0} {"step": 19625, "train_loss": 3.212258815765381, "lr": 0.00014799874106447022, "tps": 30446, "wall": 42244.5} {"step": 19626, "train_loss": 3.338017463684082, "lr": 0.00014798118293402683, "tps": 30444, "wall": 42250.1} {"step": 19627, "train_loss": 3.195488452911377, "lr": 0.00014796362561941652, "tps": 30441, "wall": 42255.6} {"step": 19628, "train_loss": 3.3636105060577393, "lr": 0.0001479460691208382, "tps": 30439, "wall": 42261.1} {"step": 19629, "train_loss": 3.313666820526123, "lr": 0.00014792851343849067, "tps": 30437, "wall": 42266.6} {"step": 19630, "train_loss": 3.2683568000793457, "lr": 0.0001479109585725728, "tps": 30434, "wall": 42272.2} {"step": 19631, "train_loss": 3.3172481060028076, "lr": 0.0001478934045232836, "tps": 30432, "wall": 42277.7} {"step": 19632, "train_loss": 3.233254909515381, "lr": 0.00014787585129082172, "tps": 30429, "wall": 42283.2} {"step": 19633, "train_loss": 3.1546101570129395, "lr": 0.00014785829887538614, "tps": 30427, "wall": 42288.7} {"step": 19634, "train_loss": 3.30013108253479, "lr": 0.00014784074727717557, "tps": 30424, "wall": 42294.2} {"step": 19635, "train_loss": 3.2229883670806885, "lr": 0.00014782319649638904, "tps": 30422, "wall": 42299.7} {"step": 19636, "train_loss": 3.324504852294922, "lr": 0.0001478056465332252, "tps": 30420, "wall": 42305.3} {"step": 19637, "train_loss": 3.2811312675476074, "lr": 0.00014778809738788288, "tps": 30417, "wall": 42310.8} {"step": 19638, "train_loss": 3.192333698272705, "lr": 0.000147770549060561, "tps": 30415, "wall": 42316.3} {"step": 19639, "train_loss": 3.2196080684661865, "lr": 0.00014775300155145816, "tps": 30412, "wall": 42321.8} {"step": 19640, "train_loss": 3.2414698600769043, "lr": 0.00014773545486077323, "tps": 30410, "wall": 42327.2} {"step": 19641, "train_loss": 3.287306547164917, "lr": 0.00014771790898870495, "tps": 30408, "wall": 42332.8} {"step": 19642, "train_loss": 3.2590067386627197, "lr": 0.00014770036393545213, "tps": 30405, "wall": 42338.3} {"step": 19643, "train_loss": 3.2412972450256348, "lr": 0.00014768281970121354, "tps": 30403, "wall": 42343.7} {"step": 19644, "train_loss": 3.1906304359436035, "lr": 0.00014766527628618778, "tps": 30400, "wall": 42349.1} {"step": 19645, "train_loss": 3.3179407119750977, "lr": 0.00014764773369057375, "tps": 30398, "wall": 42354.6} {"step": 19646, "train_loss": 3.2676544189453125, "lr": 0.0001476301919145701, "tps": 30396, "wall": 42360.1} {"step": 19647, "train_loss": 3.3628480434417725, "lr": 0.0001476126509583756, "tps": 30393, "wall": 42365.6} {"step": 19648, "train_loss": 3.237570285797119, "lr": 0.0001475951108221888, "tps": 30391, "wall": 42371.0} {"step": 19649, "train_loss": 3.3018369674682617, "lr": 0.00014757757150620857, "tps": 30389, "wall": 42376.5} {"step": 19650, "train_loss": 3.240723133087158, "lr": 0.00014756003301063356, "tps": 30386, "wall": 42381.9} {"step": 19651, "train_loss": 3.3309788703918457, "lr": 0.00014754249533566234, "tps": 30384, "wall": 42387.4} {"step": 19652, "train_loss": 3.2783069610595703, "lr": 0.00014752495848149367, "tps": 30381, "wall": 42392.9} {"step": 19653, "train_loss": 3.196470022201538, "lr": 0.00014750742244832625, "tps": 30379, "wall": 42398.4} {"step": 19654, "train_loss": 3.3234071731567383, "lr": 0.00014748988723635862, "tps": 30377, "wall": 42403.9} {"step": 19655, "train_loss": 3.2684004306793213, "lr": 0.00014747235284578948, "tps": 30374, "wall": 42409.3} {"step": 19656, "train_loss": 3.3165197372436523, "lr": 0.0001474548192768175, "tps": 30372, "wall": 42414.8} {"step": 19657, "train_loss": 3.3003053665161133, "lr": 0.00014743728652964118, "tps": 30370, "wall": 42420.3} {"step": 19658, "train_loss": 3.1493988037109375, "lr": 0.0001474197546044592, "tps": 30367, "wall": 42425.9} {"step": 19659, "train_loss": 3.1912972927093506, "lr": 0.00014740222350147016, "tps": 30365, "wall": 42431.4} {"step": 19660, "train_loss": 3.281886577606201, "lr": 0.0001473846932208727, "tps": 30362, "wall": 42436.8} {"step": 19661, "train_loss": 3.202544689178467, "lr": 0.00014736716376286538, "tps": 30360, "wall": 42442.3} {"step": 19662, "train_loss": 3.2139153480529785, "lr": 0.0001473496351276467, "tps": 30358, "wall": 42447.8} {"step": 19663, "train_loss": 3.257885456085205, "lr": 0.0001473321073154154, "tps": 30355, "wall": 42453.3} {"step": 19664, "train_loss": 3.218661308288574, "lr": 0.0001473145803263698, "tps": 30353, "wall": 42458.8} {"step": 19665, "train_loss": 3.400300979614258, "lr": 0.00014729705416070856, "tps": 30350, "wall": 42464.4} {"step": 19666, "train_loss": 3.3550119400024414, "lr": 0.0001472795288186303, "tps": 30348, "wall": 42469.8} {"step": 19667, "train_loss": 3.262239933013916, "lr": 0.00014726200430033345, "tps": 30346, "wall": 42475.3} {"step": 19668, "train_loss": 3.2695114612579346, "lr": 0.00014724448060601653, "tps": 30343, "wall": 42480.8} {"step": 19669, "train_loss": 3.2144408226013184, "lr": 0.00014722695773587802, "tps": 30341, "wall": 42486.3} {"step": 19670, "train_loss": 3.220755100250244, "lr": 0.0001472094356901166, "tps": 30339, "wall": 42491.7} {"step": 19671, "train_loss": 3.2391011714935303, "lr": 0.00014719191446893053, "tps": 30336, "wall": 42497.2} {"step": 19672, "train_loss": 3.354048728942871, "lr": 0.0001471743940725184, "tps": 30334, "wall": 42502.7} {"step": 19673, "train_loss": 3.3090476989746094, "lr": 0.00014715687450107874, "tps": 30331, "wall": 42508.1} {"step": 19674, "train_loss": 3.297261953353882, "lr": 0.00014713935575480988, "tps": 30329, "wall": 42513.7} {"step": 19675, "train_loss": 3.1854195594787598, "lr": 0.00014712183783391035, "tps": 30327, "wall": 42519.2} {"step": 19676, "train_loss": 3.197314500808716, "lr": 0.00014710432073857858, "tps": 30324, "wall": 42524.6} {"step": 19677, "train_loss": 3.32273530960083, "lr": 0.00014708680446901307, "tps": 30322, "wall": 42530.1} {"step": 19678, "train_loss": 3.209461212158203, "lr": 0.00014706928902541208, "tps": 30320, "wall": 42535.6} {"step": 19679, "train_loss": 3.379115104675293, "lr": 0.0001470517744079742, "tps": 30317, "wall": 42541.1} {"step": 19680, "train_loss": 3.2936394214630127, "lr": 0.0001470342606168978, "tps": 30315, "wall": 42546.5} {"step": 19681, "train_loss": 3.375101089477539, "lr": 0.00014701674765238117, "tps": 30313, "wall": 42552.0} {"step": 19682, "train_loss": 3.2680466175079346, "lr": 0.00014699923551462276, "tps": 30310, "wall": 42557.5} {"step": 19683, "train_loss": 3.2353549003601074, "lr": 0.00014698172420382104, "tps": 30308, "wall": 42563.0} {"step": 19684, "train_loss": 3.296454429626465, "lr": 0.00014696421372017423, "tps": 30305, "wall": 42568.4} {"step": 19685, "train_loss": 3.258790969848633, "lr": 0.00014694670406388072, "tps": 30303, "wall": 42574.1} {"step": 19686, "train_loss": 3.30655574798584, "lr": 0.000146929195235139, "tps": 30301, "wall": 42579.6} {"step": 19687, "train_loss": 3.2360243797302246, "lr": 0.0001469116872341473, "tps": 30298, "wall": 42585.0} {"step": 19688, "train_loss": 3.2679905891418457, "lr": 0.0001468941800611039, "tps": 30296, "wall": 42590.5} {"step": 19689, "train_loss": 3.180107831954956, "lr": 0.0001468766737162072, "tps": 30294, "wall": 42596.0} {"step": 19690, "train_loss": 3.3774237632751465, "lr": 0.00014685916819965554, "tps": 30291, "wall": 42601.4} {"step": 19691, "train_loss": 3.3125994205474854, "lr": 0.00014684166351164714, "tps": 30289, "wall": 42606.9} {"step": 19692, "train_loss": 3.1235127449035645, "lr": 0.00014682415965238033, "tps": 30286, "wall": 42612.4} {"step": 19693, "train_loss": 3.274972915649414, "lr": 0.00014680665662205345, "tps": 30284, "wall": 42618.0} {"step": 19694, "train_loss": 3.18826961517334, "lr": 0.00014678915442086464, "tps": 30282, "wall": 42623.5} {"step": 19695, "train_loss": 3.35050892829895, "lr": 0.00014677165304901227, "tps": 30279, "wall": 42628.9} {"step": 19696, "train_loss": 3.136640787124634, "lr": 0.0001467541525066946, "tps": 30277, "wall": 42634.5} {"step": 19697, "train_loss": 3.171475887298584, "lr": 0.0001467366527941099, "tps": 30275, "wall": 42640.0} {"step": 19698, "train_loss": 3.234858989715576, "lr": 0.0001467191539114563, "tps": 30272, "wall": 42645.5} {"step": 19699, "train_loss": 3.3697433471679688, "lr": 0.00014670165585893208, "tps": 30270, "wall": 42651.0} {"step": 19700, "train_loss": 3.2336463928222656, "lr": 0.00014668415863673554, "tps": 30267, "wall": 42656.5} {"step": 19701, "train_loss": 3.2515788078308105, "lr": 0.00014666666224506472, "tps": 30265, "wall": 42662.0} {"step": 19702, "train_loss": 3.2217419147491455, "lr": 0.00014664916668411798, "tps": 30263, "wall": 42667.6} {"step": 19703, "train_loss": 3.259579658508301, "lr": 0.0001466316719540934, "tps": 30260, "wall": 42673.0} {"step": 19704, "train_loss": 3.175273895263672, "lr": 0.00014661417805518923, "tps": 30258, "wall": 42678.5} {"step": 19705, "train_loss": 3.3391575813293457, "lr": 0.00014659668498760367, "tps": 30256, "wall": 42684.0} {"step": 19706, "train_loss": 3.326857089996338, "lr": 0.00014657919275153477, "tps": 30253, "wall": 42689.5} {"step": 19707, "train_loss": 3.370872974395752, "lr": 0.00014656170134718082, "tps": 30251, "wall": 42695.1} {"step": 19708, "train_loss": 3.226245403289795, "lr": 0.0001465442107747398, "tps": 30249, "wall": 42700.5} {"step": 19709, "train_loss": 3.314473867416382, "lr": 0.00014652672103440998, "tps": 30246, "wall": 42706.1} {"step": 19710, "train_loss": 3.296868324279785, "lr": 0.00014650923212638944, "tps": 30244, "wall": 42711.6} {"step": 19711, "train_loss": 3.3090810775756836, "lr": 0.00014649174405087625, "tps": 30241, "wall": 42717.1} {"step": 19712, "train_loss": 3.2689027786254883, "lr": 0.00014647425680806863, "tps": 30239, "wall": 42722.6} {"step": 19713, "train_loss": 3.3317885398864746, "lr": 0.00014645677039816456, "tps": 30237, "wall": 42728.1} {"step": 19714, "train_loss": 3.2845966815948486, "lr": 0.0001464392848213622, "tps": 30234, "wall": 42733.7} {"step": 19715, "train_loss": 3.344714641571045, "lr": 0.0001464218000778596, "tps": 30232, "wall": 42739.1} {"step": 19716, "train_loss": 3.2582404613494873, "lr": 0.00014640431616785483, "tps": 30230, "wall": 42744.6} {"step": 19717, "train_loss": 3.211615562438965, "lr": 0.00014638683309154592, "tps": 30227, "wall": 42750.1} {"step": 19718, "train_loss": 3.2989468574523926, "lr": 0.00014636935084913098, "tps": 30225, "wall": 42755.7} {"step": 19719, "train_loss": 3.254636764526367, "lr": 0.00014635186944080797, "tps": 30222, "wall": 42761.2} {"step": 19720, "train_loss": 3.340949535369873, "lr": 0.00014633438886677507, "tps": 30220, "wall": 42766.7} {"step": 19721, "train_loss": 3.3262336254119873, "lr": 0.0001463169091272301, "tps": 30218, "wall": 42772.2} {"step": 19722, "train_loss": 3.301487922668457, "lr": 0.00014629943022237115, "tps": 30215, "wall": 42777.7} {"step": 19723, "train_loss": 3.2361690998077393, "lr": 0.0001462819521523963, "tps": 30213, "wall": 42783.2} {"step": 19724, "train_loss": 3.300776481628418, "lr": 0.0001462644749175035, "tps": 30211, "wall": 42788.7} {"step": 19725, "train_loss": 3.3255066871643066, "lr": 0.00014624699851789065, "tps": 30208, "wall": 42794.2} {"step": 19726, "train_loss": 3.3891775608062744, "lr": 0.00014622952295375585, "tps": 30206, "wall": 42799.7} {"step": 19727, "train_loss": 3.3236210346221924, "lr": 0.00014621204822529702, "tps": 30204, "wall": 42805.2} {"step": 19728, "train_loss": 3.363586664199829, "lr": 0.00014619457433271205, "tps": 30201, "wall": 42810.7} {"step": 19729, "train_loss": 3.1380677223205566, "lr": 0.0001461771012761989, "tps": 30199, "wall": 42816.3} {"step": 19730, "train_loss": 3.192871570587158, "lr": 0.0001461596290559556, "tps": 30197, "wall": 42821.8} {"step": 19731, "train_loss": 3.3521666526794434, "lr": 0.00014614215767218, "tps": 30194, "wall": 42827.3} {"step": 19732, "train_loss": 3.326570749282837, "lr": 0.00014612468712507006, "tps": 30192, "wall": 42832.8} {"step": 19733, "train_loss": 3.246021270751953, "lr": 0.00014610721741482364, "tps": 30189, "wall": 42838.3} {"step": 19734, "train_loss": 3.218324661254883, "lr": 0.00014608974854163868, "tps": 30187, "wall": 42843.7} {"step": 19735, "train_loss": 3.3422117233276367, "lr": 0.000146072280505713, "tps": 30185, "wall": 42849.2} {"step": 19736, "train_loss": 3.29036283493042, "lr": 0.00014605481330724458, "tps": 30183, "wall": 42854.7} {"step": 19737, "train_loss": 3.2739169597625732, "lr": 0.0001460373469464312, "tps": 30180, "wall": 42860.2} {"step": 19738, "train_loss": 3.2666056156158447, "lr": 0.00014601988142347078, "tps": 30178, "wall": 42865.7} {"step": 19739, "train_loss": 3.2859978675842285, "lr": 0.0001460024167385611, "tps": 30176, "wall": 42871.1} {"step": 19740, "train_loss": 3.350907325744629, "lr": 0.0001459849528919001, "tps": 30173, "wall": 42876.7} {"step": 19741, "train_loss": 3.2120087146759033, "lr": 0.00014596748988368553, "tps": 30171, "wall": 42882.2} {"step": 19742, "train_loss": 3.1816890239715576, "lr": 0.0001459500277141152, "tps": 30168, "wall": 42887.7} {"step": 19743, "train_loss": 3.2603108882904053, "lr": 0.00014593256638338703, "tps": 30166, "wall": 42893.1} {"step": 19744, "train_loss": 3.1902945041656494, "lr": 0.00014591510589169872, "tps": 30164, "wall": 42898.6} {"step": 19745, "train_loss": 3.173125982284546, "lr": 0.0001458976462392481, "tps": 30162, "wall": 42904.1} {"step": 19746, "train_loss": 3.3205184936523438, "lr": 0.00014588018742623296, "tps": 30159, "wall": 42909.5} {"step": 19747, "train_loss": 3.275271415710449, "lr": 0.0001458627294528511, "tps": 30157, "wall": 42915.0} {"step": 19748, "train_loss": 3.3030123710632324, "lr": 0.00014584527231930022, "tps": 30155, "wall": 42920.5} {"step": 19749, "train_loss": 3.2986416816711426, "lr": 0.00014582781602577808, "tps": 30152, "wall": 42926.0} {"step": 19750, "train_loss": 3.293318033218384, "lr": 0.00014581036057248245, "tps": 30150, "wall": 42931.5} {"step": 19751, "train_loss": 3.3974266052246094, "lr": 0.00014579290595961113, "tps": 30148, "wall": 42937.0} {"step": 19752, "train_loss": 3.2500500679016113, "lr": 0.00014577545218736178, "tps": 30145, "wall": 42942.5} {"step": 19753, "train_loss": 3.279092788696289, "lr": 0.00014575799925593206, "tps": 30143, "wall": 42948.1} {"step": 19754, "train_loss": 3.237809181213379, "lr": 0.00014574054716551976, "tps": 30141, "wall": 42953.6} {"step": 19755, "train_loss": 3.310473918914795, "lr": 0.00014572309591632257, "tps": 30138, "wall": 42959.0} {"step": 19756, "train_loss": 3.278822660446167, "lr": 0.0001457056455085382, "tps": 30136, "wall": 42964.5} {"step": 19757, "train_loss": 3.2728092670440674, "lr": 0.00014568819594236424, "tps": 30134, "wall": 42970.0} {"step": 19758, "train_loss": 3.356719493865967, "lr": 0.00014567074721799847, "tps": 30131, "wall": 42975.5} {"step": 19759, "train_loss": 3.2488718032836914, "lr": 0.00014565329933563848, "tps": 30129, "wall": 42981.0} {"step": 19760, "train_loss": 3.2787139415740967, "lr": 0.00014563585229548194, "tps": 30127, "wall": 42986.5} {"step": 19761, "train_loss": 3.223820209503174, "lr": 0.00014561840609772646, "tps": 30124, "wall": 42992.0} {"step": 19762, "train_loss": 3.186143159866333, "lr": 0.00014560096074256972, "tps": 30122, "wall": 42997.5} {"step": 19763, "train_loss": 3.298649549484253, "lr": 0.00014558351623020931, "tps": 30120, "wall": 43003.0} {"step": 19764, "train_loss": 3.36873197555542, "lr": 0.00014556607256084288, "tps": 30117, "wall": 43008.5} {"step": 19765, "train_loss": 3.245983362197876, "lr": 0.00014554862973466799, "tps": 30115, "wall": 43014.0} {"step": 19766, "train_loss": 3.2622475624084473, "lr": 0.00014553118775188225, "tps": 30113, "wall": 43019.5} {"step": 19767, "train_loss": 3.2837326526641846, "lr": 0.00014551374661268325, "tps": 30110, "wall": 43025.0} {"step": 19768, "train_loss": 3.272071123123169, "lr": 0.00014549630631726857, "tps": 30108, "wall": 43030.5} {"step": 19769, "train_loss": 3.3037760257720947, "lr": 0.00014547886686583575, "tps": 30106, "wall": 43036.0} {"step": 19770, "train_loss": 3.243029832839966, "lr": 0.00014546142825858232, "tps": 30103, "wall": 43041.5} {"step": 19771, "train_loss": 3.21376895904541, "lr": 0.00014544399049570595, "tps": 30101, "wall": 43047.0} {"step": 19772, "train_loss": 3.2484993934631348, "lr": 0.00014542655357740398, "tps": 30099, "wall": 43052.6} {"step": 19773, "train_loss": 3.2227816581726074, "lr": 0.00014540911750387408, "tps": 30096, "wall": 43058.1} {"step": 19774, "train_loss": 3.1814475059509277, "lr": 0.0001453916822753138, "tps": 30094, "wall": 43063.6} {"step": 19775, "train_loss": 3.257676124572754, "lr": 0.00014537424789192054, "tps": 30092, "wall": 43069.1} {"step": 19776, "train_loss": 3.2101263999938965, "lr": 0.00014535681435389182, "tps": 30089, "wall": 43074.6} {"step": 19777, "train_loss": 3.2541580200195312, "lr": 0.00014533938166142512, "tps": 30087, "wall": 43080.1} {"step": 19778, "train_loss": 3.1726815700531006, "lr": 0.00014532194981471802, "tps": 30085, "wall": 43085.6} {"step": 19779, "train_loss": 3.3047215938568115, "lr": 0.00014530451881396785, "tps": 30082, "wall": 43091.1} {"step": 19780, "train_loss": 3.3325345516204834, "lr": 0.00014528708865937215, "tps": 30080, "wall": 43096.7} {"step": 19781, "train_loss": 3.299774646759033, "lr": 0.00014526965935112836, "tps": 30078, "wall": 43102.2} {"step": 19782, "train_loss": 3.3055691719055176, "lr": 0.0001452522308894339, "tps": 30075, "wall": 43107.7} {"step": 19783, "train_loss": 3.3403677940368652, "lr": 0.00014523480327448623, "tps": 30073, "wall": 43113.3} {"step": 19784, "train_loss": 3.2627971172332764, "lr": 0.00014521737650648273, "tps": 30071, "wall": 43118.7} {"step": 19785, "train_loss": 3.3327293395996094, "lr": 0.00014519995058562087, "tps": 30068, "wall": 43124.2} {"step": 19786, "train_loss": 3.2664313316345215, "lr": 0.000145182525512098, "tps": 30066, "wall": 43129.7} {"step": 19787, "train_loss": 3.294508934020996, "lr": 0.0001451651012861115, "tps": 30064, "wall": 43135.1} {"step": 19788, "train_loss": 3.2942311763763428, "lr": 0.0001451476779078588, "tps": 30061, "wall": 43140.6} {"step": 19789, "train_loss": 3.310823678970337, "lr": 0.00014513025537753725, "tps": 30059, "wall": 43146.1} {"step": 19790, "train_loss": 3.320016860961914, "lr": 0.00014511283369534423, "tps": 30057, "wall": 43151.7} {"step": 19791, "train_loss": 3.2269866466522217, "lr": 0.00014509541286147708, "tps": 30055, "wall": 43157.1} {"step": 19792, "train_loss": 3.155287265777588, "lr": 0.00014507799287613314, "tps": 30052, "wall": 43162.6} {"step": 19793, "train_loss": 3.419534921646118, "lr": 0.00014506057373950978, "tps": 30050, "wall": 43168.1} {"step": 19794, "train_loss": 3.317603349685669, "lr": 0.00014504315545180423, "tps": 30047, "wall": 43173.8} {"step": 19795, "train_loss": 3.2979087829589844, "lr": 0.0001450257380132139, "tps": 30045, "wall": 43179.2} {"step": 19796, "train_loss": 3.2446603775024414, "lr": 0.00014500832142393612, "tps": 30043, "wall": 43184.8} {"step": 19797, "train_loss": 3.2655467987060547, "lr": 0.00014499090568416802, "tps": 30041, "wall": 43190.3} {"step": 19798, "train_loss": 3.2753350734710693, "lr": 0.0001449734907941071, "tps": 30038, "wall": 43195.8} {"step": 19799, "train_loss": 3.1600379943847656, "lr": 0.00014495607675395043, "tps": 30036, "wall": 43201.3} {"step": 19800, "train_loss": 3.3129467964172363, "lr": 0.00014493866356389548, "tps": 30034, "wall": 43206.8} {"step": 19801, "train_loss": 3.2305383682250977, "lr": 0.0001449212512241394, "tps": 30031, "wall": 43212.3} {"step": 19802, "train_loss": 3.190772533416748, "lr": 0.0001449038397348794, "tps": 30029, "wall": 43217.7} {"step": 19803, "train_loss": 3.294245719909668, "lr": 0.00014488642909631284, "tps": 30027, "wall": 43223.2} {"step": 19804, "train_loss": 3.2087013721466064, "lr": 0.00014486901930863683, "tps": 30024, "wall": 43228.7} {"step": 19805, "train_loss": 3.204373836517334, "lr": 0.00014485161037204857, "tps": 30022, "wall": 43234.2} {"step": 19806, "train_loss": 3.318129539489746, "lr": 0.00014483420228674545, "tps": 30020, "wall": 43239.7} {"step": 19807, "train_loss": 3.3331832885742188, "lr": 0.0001448167950529245, "tps": 30018, "wall": 43245.2} {"step": 19808, "train_loss": 3.236159324645996, "lr": 0.00014479938867078298, "tps": 30015, "wall": 43250.7} {"step": 19809, "train_loss": 3.2131760120391846, "lr": 0.00014478198314051807, "tps": 30013, "wall": 43256.1} {"step": 19810, "train_loss": 3.1281280517578125, "lr": 0.00014476457846232684, "tps": 30011, "wall": 43261.6} {"step": 19811, "train_loss": 3.180098056793213, "lr": 0.0001447471746364066, "tps": 30008, "wall": 43267.1} {"step": 19812, "train_loss": 3.2610793113708496, "lr": 0.00014472977166295444, "tps": 30006, "wall": 43272.6} {"step": 19813, "train_loss": 3.3122644424438477, "lr": 0.0001447123695421674, "tps": 30004, "wall": 43278.1} {"step": 19814, "train_loss": 3.3396854400634766, "lr": 0.00014469496827424286, "tps": 30002, "wall": 43283.6} {"step": 19815, "train_loss": 3.274744987487793, "lr": 0.00014467756785937775, "tps": 29999, "wall": 43289.1} {"step": 19816, "train_loss": 3.1478142738342285, "lr": 0.00014466016829776913, "tps": 29997, "wall": 43294.6} {"step": 19817, "train_loss": 3.311347723007202, "lr": 0.0001446427695896143, "tps": 29995, "wall": 43300.1} {"step": 19818, "train_loss": 3.1449897289276123, "lr": 0.00014462537173511023, "tps": 29992, "wall": 43305.5} {"step": 19819, "train_loss": 3.260280132293701, "lr": 0.00014460797473445398, "tps": 29990, "wall": 43311.0} {"step": 19820, "train_loss": 3.2072088718414307, "lr": 0.00014459057858784275, "tps": 29988, "wall": 43316.5} {"step": 19821, "train_loss": 3.3762736320495605, "lr": 0.0001445731832954735, "tps": 29986, "wall": 43322.0} {"step": 19822, "train_loss": 3.2652153968811035, "lr": 0.00014455578885754324, "tps": 29983, "wall": 43327.5} {"step": 19823, "train_loss": 3.343561887741089, "lr": 0.00014453839527424917, "tps": 29981, "wall": 43333.0} {"step": 19824, "train_loss": 3.2060580253601074, "lr": 0.00014452100254578815, "tps": 29979, "wall": 43338.5} {"step": 19825, "train_loss": 3.377046585083008, "lr": 0.0001445036106723574, "tps": 29976, "wall": 43344.0} {"step": 19826, "train_loss": 3.3240132331848145, "lr": 0.00014448621965415382, "tps": 29974, "wall": 43349.5} {"step": 19827, "train_loss": 3.1865477561950684, "lr": 0.00014446882949137435, "tps": 29972, "wall": 43355.0} {"step": 19828, "train_loss": 3.2735166549682617, "lr": 0.00014445144018421612, "tps": 29969, "wall": 43360.5} {"step": 19829, "train_loss": 3.320219039916992, "lr": 0.00014443405173287607, "tps": 29967, "wall": 43366.0} {"step": 19830, "train_loss": 3.3143672943115234, "lr": 0.0001444166641375511, "tps": 29965, "wall": 43371.5} {"step": 19831, "train_loss": 3.1994423866271973, "lr": 0.00014439927739843834, "tps": 29963, "wall": 43377.0} {"step": 19832, "train_loss": 3.2460052967071533, "lr": 0.00014438189151573467, "tps": 29960, "wall": 43382.5} {"step": 19833, "train_loss": 3.267503499984741, "lr": 0.00014436450648963692, "tps": 29958, "wall": 43388.0} {"step": 19834, "train_loss": 3.225374698638916, "lr": 0.00014434712232034222, "tps": 29956, "wall": 43393.6} {"step": 19835, "train_loss": 3.3786067962646484, "lr": 0.00014432973900804742, "tps": 29953, "wall": 43399.0} {"step": 19836, "train_loss": 3.2031397819519043, "lr": 0.0001443123565529493, "tps": 29951, "wall": 43404.6} {"step": 19837, "train_loss": 3.3271429538726807, "lr": 0.00014429497495524503, "tps": 29949, "wall": 43410.0} {"step": 19838, "train_loss": 3.3647611141204834, "lr": 0.00014427759421513137, "tps": 29947, "wall": 43415.6} {"step": 19839, "train_loss": 3.3279433250427246, "lr": 0.00014426021433280512, "tps": 29944, "wall": 43421.1} {"step": 19840, "train_loss": 3.2574424743652344, "lr": 0.00014424283530846337, "tps": 29942, "wall": 43426.6} {"step": 19841, "train_loss": 3.2968218326568604, "lr": 0.00014422545714230277, "tps": 29940, "wall": 43432.1} {"step": 19842, "train_loss": 3.2582454681396484, "lr": 0.0001442080798345204, "tps": 29937, "wall": 43437.6} {"step": 19843, "train_loss": 3.3320741653442383, "lr": 0.00014419070338531298, "tps": 29935, "wall": 43443.1} {"step": 19844, "train_loss": 3.2779760360717773, "lr": 0.0001441733277948773, "tps": 29933, "wall": 43448.6} {"step": 19845, "train_loss": 3.298903465270996, "lr": 0.00014415595306341031, "tps": 29931, "wall": 43454.1} {"step": 19846, "train_loss": 3.237694025039673, "lr": 0.00014413857919110882, "tps": 29928, "wall": 43459.6} {"step": 19847, "train_loss": 3.2050702571868896, "lr": 0.00014412120617816955, "tps": 29926, "wall": 43465.1} {"step": 19848, "train_loss": 3.2472739219665527, "lr": 0.00014410383402478942, "tps": 29924, "wall": 43470.6} {"step": 19849, "train_loss": 3.222498655319214, "lr": 0.00014408646273116516, "tps": 29921, "wall": 43476.2} {"step": 19850, "train_loss": 3.251920223236084, "lr": 0.00014406909229749352, "tps": 29919, "wall": 43481.7} {"step": 19851, "train_loss": 3.2692558765411377, "lr": 0.00014405172272397132, "tps": 29917, "wall": 43487.1} {"step": 19852, "train_loss": 3.243978500366211, "lr": 0.00014403435401079534, "tps": 29915, "wall": 43492.6} {"step": 19853, "train_loss": 3.2146987915039062, "lr": 0.00014401698615816225, "tps": 29912, "wall": 43498.1} {"step": 19854, "train_loss": 3.2028419971466064, "lr": 0.00014399961916626892, "tps": 29910, "wall": 43503.6} {"step": 19855, "train_loss": 3.294003963470459, "lr": 0.00014398225303531201, "tps": 29908, "wall": 43509.1} {"step": 19856, "train_loss": 3.250540256500244, "lr": 0.0001439648877654882, "tps": 29905, "wall": 43514.7} {"step": 19857, "train_loss": 3.297781229019165, "lr": 0.00014394752335699428, "tps": 29903, "wall": 43520.2} {"step": 19858, "train_loss": 3.1886844635009766, "lr": 0.00014393015981002688, "tps": 29901, "wall": 43525.7} {"step": 19859, "train_loss": 3.17960262298584, "lr": 0.0001439127971247828, "tps": 29899, "wall": 43531.2} {"step": 19860, "train_loss": 3.325645923614502, "lr": 0.00014389543530145867, "tps": 29896, "wall": 43536.8} {"step": 19861, "train_loss": 3.303798198699951, "lr": 0.0001438780743402511, "tps": 29894, "wall": 43542.3} {"step": 19862, "train_loss": 3.384634494781494, "lr": 0.00014386071424135697, "tps": 29892, "wall": 43547.8} {"step": 19863, "train_loss": 3.282144784927368, "lr": 0.0001438433550049727, "tps": 29889, "wall": 43553.3} {"step": 19864, "train_loss": 3.335423469543457, "lr": 0.00014382599663129497, "tps": 29887, "wall": 43558.8} {"step": 19865, "train_loss": 3.279094934463501, "lr": 0.00014380863912052055, "tps": 29885, "wall": 43564.3} {"step": 19866, "train_loss": 3.2350425720214844, "lr": 0.00014379128247284597, "tps": 29883, "wall": 43569.9} {"step": 19867, "train_loss": 3.233579158782959, "lr": 0.00014377392668846786, "tps": 29880, "wall": 43575.4} {"step": 19868, "train_loss": 3.292586088180542, "lr": 0.00014375657176758283, "tps": 29878, "wall": 43580.9} {"step": 19869, "train_loss": 3.3607630729675293, "lr": 0.00014373921771038747, "tps": 29876, "wall": 43586.4} {"step": 19870, "train_loss": 3.2796788215637207, "lr": 0.00014372186451707837, "tps": 29873, "wall": 43592.0} {"step": 19871, "train_loss": 3.2332069873809814, "lr": 0.00014370451218785214, "tps": 29871, "wall": 43597.5} {"step": 19872, "train_loss": 3.2355871200561523, "lr": 0.00014368716072290534, "tps": 29869, "wall": 43603.0} {"step": 19873, "train_loss": 3.3757693767547607, "lr": 0.00014366981012243444, "tps": 29867, "wall": 43608.6} {"step": 19874, "train_loss": 3.0996596813201904, "lr": 0.00014365246038663612, "tps": 29864, "wall": 43614.1} {"step": 19875, "train_loss": 3.234123468399048, "lr": 0.0001436351115157069, "tps": 29862, "wall": 43619.6} {"step": 19876, "train_loss": 3.3134279251098633, "lr": 0.00014361776350984315, "tps": 29860, "wall": 43625.2} {"step": 19877, "train_loss": 3.337057590484619, "lr": 0.00014360041636924162, "tps": 29857, "wall": 43630.7} {"step": 19878, "train_loss": 3.2907888889312744, "lr": 0.0001435830700940986, "tps": 29855, "wall": 43636.3} {"step": 19879, "train_loss": 3.192751169204712, "lr": 0.0001435657246846108, "tps": 29853, "wall": 43641.8} {"step": 19880, "train_loss": 3.274069309234619, "lr": 0.00014354838014097457, "tps": 29851, "wall": 43647.4} {"step": 19881, "train_loss": 3.3508481979370117, "lr": 0.00014353103646338634, "tps": 29848, "wall": 43653.0} {"step": 19882, "train_loss": 3.26104474067688, "lr": 0.0001435136936520428, "tps": 29846, "wall": 43658.5} {"step": 19883, "train_loss": 3.2797515392303467, "lr": 0.00014349635170714026, "tps": 29844, "wall": 43664.0} {"step": 19884, "train_loss": 3.3476996421813965, "lr": 0.00014347901062887507, "tps": 29841, "wall": 43669.6} {"step": 19885, "train_loss": 3.2803707122802734, "lr": 0.0001434616704174439, "tps": 29839, "wall": 43675.1} {"step": 19886, "train_loss": 3.2863316535949707, "lr": 0.00014344433107304306, "tps": 29837, "wall": 43680.6} {"step": 19887, "train_loss": 3.2449212074279785, "lr": 0.00014342699259586888, "tps": 29835, "wall": 43686.2} {"step": 19888, "train_loss": 3.284470558166504, "lr": 0.00014340965498611796, "tps": 29832, "wall": 43691.7} {"step": 19889, "train_loss": 3.3532941341400146, "lr": 0.0001433923182439866, "tps": 29830, "wall": 43697.3} {"step": 19890, "train_loss": 3.400052070617676, "lr": 0.0001433749823696712, "tps": 29828, "wall": 43702.8} {"step": 19891, "train_loss": 3.2501461505889893, "lr": 0.00014335764736336811, "tps": 29825, "wall": 43708.3} {"step": 19892, "train_loss": 3.2498934268951416, "lr": 0.00014334031322527384, "tps": 29823, "wall": 43714.0} {"step": 19893, "train_loss": 3.302370309829712, "lr": 0.00014332297995558451, "tps": 29821, "wall": 43719.5} {"step": 19894, "train_loss": 3.3431360721588135, "lr": 0.00014330564755449672, "tps": 29819, "wall": 43725.0} {"step": 19895, "train_loss": 3.2572813034057617, "lr": 0.00014328831602220657, "tps": 29816, "wall": 43730.5} {"step": 19896, "train_loss": 3.249221086502075, "lr": 0.00014327098535891065, "tps": 29814, "wall": 43736.0} {"step": 19897, "train_loss": 3.1923000812530518, "lr": 0.00014325365556480514, "tps": 29812, "wall": 43741.6} {"step": 19898, "train_loss": 3.2444028854370117, "lr": 0.00014323632664008633, "tps": 29809, "wall": 43747.1} {"step": 19899, "train_loss": 3.287487268447876, "lr": 0.00014321899858495062, "tps": 29807, "wall": 43752.7} {"step": 19900, "train_loss": 3.290088653564453, "lr": 0.00014320167139959423, "tps": 29805, "wall": 43758.3} {"step": 19901, "train_loss": 3.2785916328430176, "lr": 0.0001431843450842134, "tps": 29803, "wall": 43763.8} {"step": 19902, "train_loss": 3.198111057281494, "lr": 0.00014316701963900457, "tps": 29800, "wall": 43769.3} {"step": 19903, "train_loss": 3.346087694168091, "lr": 0.00014314969506416385, "tps": 29798, "wall": 43774.9} {"step": 19904, "train_loss": 3.33782696723938, "lr": 0.0001431323713598875, "tps": 29796, "wall": 43780.5} {"step": 19905, "train_loss": 3.2175216674804688, "lr": 0.0001431150485263719, "tps": 29793, "wall": 43786.0} {"step": 19906, "train_loss": 3.2465200424194336, "lr": 0.00014309772656381312, "tps": 29791, "wall": 43791.6} {"step": 19907, "train_loss": 3.3185653686523438, "lr": 0.00014308040547240743, "tps": 29789, "wall": 43797.1} {"step": 19908, "train_loss": 3.2363967895507812, "lr": 0.00014306308525235113, "tps": 29787, "wall": 43802.7} {"step": 19909, "train_loss": 3.2917425632476807, "lr": 0.00014304576590384036, "tps": 29784, "wall": 43808.2} {"step": 19910, "train_loss": 3.26710844039917, "lr": 0.00014302844742707124, "tps": 29782, "wall": 43813.8} {"step": 19911, "train_loss": 3.3216607570648193, "lr": 0.00014301112982224008, "tps": 29780, "wall": 43819.3} {"step": 19912, "train_loss": 3.2884631156921387, "lr": 0.00014299381308954297, "tps": 29778, "wall": 43824.9} {"step": 19913, "train_loss": 3.2996826171875, "lr": 0.0001429764972291762, "tps": 29775, "wall": 43830.5} {"step": 19914, "train_loss": 3.207061767578125, "lr": 0.00014295918224133583, "tps": 29773, "wall": 43836.1} {"step": 19915, "train_loss": 3.345600128173828, "lr": 0.00014294186812621788, "tps": 29771, "wall": 43841.7} {"step": 19916, "train_loss": 3.2540154457092285, "lr": 0.00014292455488401875, "tps": 29768, "wall": 43847.2} {"step": 19917, "train_loss": 3.3245270252227783, "lr": 0.00014290724251493438, "tps": 29766, "wall": 43852.8} {"step": 19918, "train_loss": 3.3239283561706543, "lr": 0.00014288993101916093, "tps": 29764, "wall": 43858.3} {"step": 19919, "train_loss": 3.284410238265991, "lr": 0.00014287262039689455, "tps": 29762, "wall": 43863.8} {"step": 19920, "train_loss": 3.24381947517395, "lr": 0.00014285531064833133, "tps": 29759, "wall": 43869.3} {"step": 19921, "train_loss": 3.2294201850891113, "lr": 0.0001428380017736672, "tps": 29757, "wall": 43874.9} {"step": 19922, "train_loss": 3.337531089782715, "lr": 0.00014282069377309842, "tps": 29755, "wall": 43880.4} {"step": 19923, "train_loss": 3.343352794647217, "lr": 0.00014280338664682108, "tps": 29753, "wall": 43885.9} {"step": 19924, "train_loss": 3.270599365234375, "lr": 0.00014278608039503102, "tps": 29750, "wall": 43891.4} {"step": 19925, "train_loss": 3.2021422386169434, "lr": 0.00014276877501792452, "tps": 29748, "wall": 43897.0} {"step": 19926, "train_loss": 3.261202335357666, "lr": 0.00014275147051569746, "tps": 29746, "wall": 43902.5} {"step": 19927, "train_loss": 3.353459358215332, "lr": 0.0001427341668885459, "tps": 29743, "wall": 43908.1} {"step": 19928, "train_loss": 3.3323254585266113, "lr": 0.00014271686413666593, "tps": 29741, "wall": 43913.6} {"step": 19929, "train_loss": 3.269047737121582, "lr": 0.0001426995622602535, "tps": 29739, "wall": 43919.2} {"step": 19930, "train_loss": 3.307199716567993, "lr": 0.00014268226125950458, "tps": 29737, "wall": 43924.7} {"step": 19931, "train_loss": 3.3053038120269775, "lr": 0.00014266496113461523, "tps": 29734, "wall": 43930.3} {"step": 19932, "train_loss": 3.1686036586761475, "lr": 0.00014264766188578132, "tps": 29732, "wall": 43935.8} {"step": 19933, "train_loss": 3.257230758666992, "lr": 0.0001426303635131989, "tps": 29730, "wall": 43941.4} {"step": 19934, "train_loss": 3.270890712738037, "lr": 0.00014261306601706398, "tps": 29728, "wall": 43946.9} {"step": 19935, "train_loss": 3.149350643157959, "lr": 0.00014259576939757232, "tps": 29725, "wall": 43952.4} {"step": 19936, "train_loss": 3.1940970420837402, "lr": 0.00014257847365492008, "tps": 29723, "wall": 43957.9} {"step": 19937, "train_loss": 3.17905855178833, "lr": 0.00014256117878930303, "tps": 29721, "wall": 43963.4} {"step": 19938, "train_loss": 3.324240207672119, "lr": 0.00014254388480091712, "tps": 29719, "wall": 43969.0} {"step": 19939, "train_loss": 3.2929396629333496, "lr": 0.0001425265916899583, "tps": 29716, "wall": 43974.5} {"step": 19940, "train_loss": 3.3756625652313232, "lr": 0.00014250929945662248, "tps": 29714, "wall": 43980.1} {"step": 19941, "train_loss": 3.2739744186401367, "lr": 0.00014249200810110538, "tps": 29712, "wall": 43985.6} {"step": 19942, "train_loss": 3.251546621322632, "lr": 0.0001424747176236031, "tps": 29710, "wall": 43991.2} {"step": 19943, "train_loss": 3.198695182800293, "lr": 0.00014245742802431144, "tps": 29707, "wall": 43996.8} {"step": 19944, "train_loss": 3.2842001914978027, "lr": 0.00014244013930342616, "tps": 29705, "wall": 44002.3} {"step": 19945, "train_loss": 3.260110378265381, "lr": 0.0001424228514611432, "tps": 29703, "wall": 44007.9} {"step": 19946, "train_loss": 3.1725354194641113, "lr": 0.00014240556449765843, "tps": 29701, "wall": 44013.5} {"step": 19947, "train_loss": 3.2309823036193848, "lr": 0.0001423882784131675, "tps": 29698, "wall": 44019.0} {"step": 19948, "train_loss": 3.368346691131592, "lr": 0.00014237099320786646, "tps": 29696, "wall": 44024.5} {"step": 19949, "train_loss": 3.381565570831299, "lr": 0.00014235370888195095, "tps": 29694, "wall": 44030.1} {"step": 19950, "train_loss": 3.2248735427856445, "lr": 0.00014233642543561684, "tps": 29692, "wall": 44035.7} {"step": 19951, "train_loss": 3.3177709579467773, "lr": 0.00014231914286905997, "tps": 29689, "wall": 44041.2} {"step": 19952, "train_loss": 3.2740495204925537, "lr": 0.00014230186118247598, "tps": 29687, "wall": 44046.8} {"step": 19953, "train_loss": 3.285750150680542, "lr": 0.00014228458037606072, "tps": 29685, "wall": 44052.4} {"step": 19954, "train_loss": 3.302307605743408, "lr": 0.00014226730045000996, "tps": 29683, "wall": 44057.8} {"step": 19955, "train_loss": 3.3050973415374756, "lr": 0.00014225002140451934, "tps": 29680, "wall": 44063.4} {"step": 19956, "train_loss": 3.312669515609741, "lr": 0.0001422327432397848, "tps": 29678, "wall": 44068.9} {"step": 19957, "train_loss": 3.263598918914795, "lr": 0.00014221546595600195, "tps": 29676, "wall": 44074.6} {"step": 19958, "train_loss": 3.3467555046081543, "lr": 0.0001421981895533664, "tps": 29674, "wall": 44080.1} {"step": 19959, "train_loss": 3.244734287261963, "lr": 0.00014218091403207407, "tps": 29671, "wall": 44085.6} {"step": 19960, "train_loss": 3.265272617340088, "lr": 0.0001421636393923205, "tps": 29669, "wall": 44091.2} {"step": 19961, "train_loss": 3.3097970485687256, "lr": 0.00014214636563430143, "tps": 29667, "wall": 44096.7} {"step": 19962, "train_loss": 3.3154311180114746, "lr": 0.00014212909275821263, "tps": 29665, "wall": 44102.3} {"step": 19963, "train_loss": 3.2450027465820312, "lr": 0.0001421118207642496, "tps": 29662, "wall": 44107.8} {"step": 19964, "train_loss": 3.296041488647461, "lr": 0.00014209454965260804, "tps": 29660, "wall": 44113.4} {"step": 19965, "train_loss": 3.2005059719085693, "lr": 0.00014207727942348376, "tps": 29658, "wall": 44119.0} {"step": 19966, "train_loss": 3.36324143409729, "lr": 0.00014206001007707216, "tps": 29656, "wall": 44124.5} {"step": 19967, "train_loss": 3.270845413208008, "lr": 0.000142042741613569, "tps": 29653, "wall": 44130.0} {"step": 19968, "train_loss": 3.393800973892212, "lr": 0.00014202547403316995, "tps": 29651, "wall": 44135.7} {"step": 19969, "train_loss": 3.2787864208221436, "lr": 0.00014200820733607046, "tps": 29649, "wall": 44141.2} {"step": 19970, "train_loss": 3.159184455871582, "lr": 0.0001419909415224663, "tps": 29647, "wall": 44146.7} {"step": 19971, "train_loss": 3.264254570007324, "lr": 0.00014197367659255292, "tps": 29644, "wall": 44152.2} {"step": 19972, "train_loss": 3.2365152835845947, "lr": 0.00014195641254652593, "tps": 29642, "wall": 44157.8} {"step": 19973, "train_loss": 3.2483606338500977, "lr": 0.000141939149384581, "tps": 29640, "wall": 44163.3} {"step": 19974, "train_loss": 3.2292978763580322, "lr": 0.00014192188710691357, "tps": 29638, "wall": 44168.9} {"step": 19975, "train_loss": 3.31327748298645, "lr": 0.0001419046257137192, "tps": 29635, "wall": 44174.4} {"step": 19976, "train_loss": 3.2453649044036865, "lr": 0.00014188736520519358, "tps": 29633, "wall": 44180.0} {"step": 19977, "train_loss": 3.1757493019104004, "lr": 0.00014187010558153196, "tps": 29631, "wall": 44185.6} {"step": 19978, "train_loss": 3.3255765438079834, "lr": 0.0001418528468429301, "tps": 29629, "wall": 44191.1} {"step": 19979, "train_loss": 3.3169188499450684, "lr": 0.0001418355889895834, "tps": 29626, "wall": 44196.8} {"step": 19980, "train_loss": 3.2810566425323486, "lr": 0.00014181833202168731, "tps": 29624, "wall": 44202.3} {"step": 19981, "train_loss": 3.3436026573181152, "lr": 0.00014180107593943743, "tps": 29622, "wall": 44207.9} {"step": 19982, "train_loss": 3.268127918243408, "lr": 0.00014178382074302924, "tps": 29620, "wall": 44213.5} {"step": 19983, "train_loss": 3.2985379695892334, "lr": 0.00014176656643265809, "tps": 29617, "wall": 44219.0} {"step": 19984, "train_loss": 3.2963056564331055, "lr": 0.00014174931300851954, "tps": 29615, "wall": 44224.6} {"step": 19985, "train_loss": 3.2314324378967285, "lr": 0.00014173206047080902, "tps": 29613, "wall": 44230.1} {"step": 19986, "train_loss": 3.2048211097717285, "lr": 0.0001417148088197219, "tps": 29611, "wall": 44235.7} {"step": 19987, "train_loss": 3.3584225177764893, "lr": 0.00014169755805545372, "tps": 29608, "wall": 44241.3} {"step": 19988, "train_loss": 3.2557992935180664, "lr": 0.00014168030817819985, "tps": 29606, "wall": 44246.9} {"step": 19989, "train_loss": 3.3005142211914062, "lr": 0.00014166305918815559, "tps": 29604, "wall": 44252.6} {"step": 19990, "train_loss": 3.2802650928497314, "lr": 0.00014164581108551652, "tps": 29601, "wall": 44258.2} {"step": 19991, "train_loss": 3.191422462463379, "lr": 0.00014162856387047782, "tps": 29599, "wall": 44263.7} {"step": 19992, "train_loss": 3.236043930053711, "lr": 0.00014161131754323512, "tps": 29597, "wall": 44269.3} {"step": 19993, "train_loss": 3.363410234451294, "lr": 0.00014159407210398363, "tps": 29595, "wall": 44274.9} {"step": 19994, "train_loss": 3.375133514404297, "lr": 0.0001415768275529187, "tps": 29593, "wall": 44280.4} {"step": 19995, "train_loss": 3.2704381942749023, "lr": 0.00014155958389023573, "tps": 29590, "wall": 44286.0} {"step": 19996, "train_loss": 3.2369184494018555, "lr": 0.00014154234111613006, "tps": 29588, "wall": 44291.5} {"step": 19997, "train_loss": 3.265373945236206, "lr": 0.0001415250992307969, "tps": 29586, "wall": 44297.1} {"step": 19998, "train_loss": 3.3889734745025635, "lr": 0.0001415078582344318, "tps": 29584, "wall": 44302.6} {"step": 19999, "train_loss": 3.197114944458008, "lr": 0.00014149061812722988, "tps": 29581, "wall": 44308.2} {"step": 20000, "train_loss": 3.3037075996398926, "lr": 0.0001414733789093864, "tps": 29579, "wall": 44313.8, "val_loss_monitor": 3.3862345828736693, "val_loss_full": 3.40367541485075} {"step": 20001, "train_loss": 3.3058228492736816, "lr": 0.00014145614058109685, "tps": 29493, "wall": 44445.8} {"step": 20002, "train_loss": 3.2655065059661865, "lr": 0.00014143890314255634, "tps": 29490, "wall": 44451.5} {"step": 20003, "train_loss": 3.2758378982543945, "lr": 0.00014142166659396015, "tps": 29488, "wall": 44457.3} {"step": 20004, "train_loss": 3.3529319763183594, "lr": 0.0001414044309355036, "tps": 29486, "wall": 44463.0} {"step": 20005, "train_loss": 3.3357040882110596, "lr": 0.0001413871961673819, "tps": 29483, "wall": 44468.8} {"step": 20006, "train_loss": 3.2935454845428467, "lr": 0.0001413699622897903, "tps": 29481, "wall": 44474.5} {"step": 20007, "train_loss": 3.341674566268921, "lr": 0.00014135272930292407, "tps": 29479, "wall": 44480.3} {"step": 20008, "train_loss": 3.4271740913391113, "lr": 0.00014133549720697834, "tps": 29476, "wall": 44485.9} {"step": 20009, "train_loss": 3.1307713985443115, "lr": 0.0001413182660021483, "tps": 29474, "wall": 44491.7} {"step": 20010, "train_loss": 3.346717596054077, "lr": 0.00014130103568862928, "tps": 29472, "wall": 44497.5} {"step": 20011, "train_loss": 3.352989673614502, "lr": 0.0001412838062666163, "tps": 29469, "wall": 44503.2} {"step": 20012, "train_loss": 3.400977849960327, "lr": 0.0001412665777363047, "tps": 29467, "wall": 44508.9} {"step": 20013, "train_loss": 3.3578357696533203, "lr": 0.00014124935009788954, "tps": 29465, "wall": 44514.6} {"step": 20014, "train_loss": 3.317972183227539, "lr": 0.00014123212335156597, "tps": 29463, "wall": 44520.3} {"step": 20015, "train_loss": 3.3724255561828613, "lr": 0.00014121489749752922, "tps": 29460, "wall": 44525.9} {"step": 20016, "train_loss": 3.349518060684204, "lr": 0.00014119767253597436, "tps": 29458, "wall": 44531.6} {"step": 20017, "train_loss": 3.42094349861145, "lr": 0.0001411804484670965, "tps": 29456, "wall": 44537.2} {"step": 20018, "train_loss": 3.3200583457946777, "lr": 0.00014116322529109083, "tps": 29453, "wall": 44542.9} {"step": 20019, "train_loss": 3.364920139312744, "lr": 0.00014114600300815238, "tps": 29451, "wall": 44548.5} {"step": 20020, "train_loss": 3.290788173675537, "lr": 0.00014112878161847624, "tps": 29449, "wall": 44554.3} {"step": 20021, "train_loss": 3.3293967247009277, "lr": 0.0001411115611222576, "tps": 29447, "wall": 44559.9} {"step": 20022, "train_loss": 3.2264957427978516, "lr": 0.0001410943415196915, "tps": 29444, "wall": 44565.5} {"step": 20023, "train_loss": 3.3482041358947754, "lr": 0.0001410771228109728, "tps": 29442, "wall": 44571.1} {"step": 20024, "train_loss": 3.2978360652923584, "lr": 0.00014105990499629683, "tps": 29440, "wall": 44576.7} {"step": 20025, "train_loss": 3.3356151580810547, "lr": 0.00014104268807585855, "tps": 29438, "wall": 44582.3} {"step": 20026, "train_loss": 3.2453086376190186, "lr": 0.0001410254720498529, "tps": 29435, "wall": 44587.9} {"step": 20027, "train_loss": 3.3297653198242188, "lr": 0.00014100825691847505, "tps": 29433, "wall": 44593.5} {"step": 20028, "train_loss": 3.3308136463165283, "lr": 0.00014099104268191983, "tps": 29431, "wall": 44599.0} {"step": 20029, "train_loss": 3.36769962310791, "lr": 0.00014097382934038247, "tps": 29429, "wall": 44604.6} {"step": 20030, "train_loss": 3.312256097793579, "lr": 0.00014095661689405783, "tps": 29427, "wall": 44610.1} {"step": 20031, "train_loss": 3.379110813140869, "lr": 0.0001409394053431408, "tps": 29424, "wall": 44615.8} {"step": 20032, "train_loss": 3.299379825592041, "lr": 0.00014092219468782663, "tps": 29422, "wall": 44621.3} {"step": 20033, "train_loss": 3.3550736904144287, "lr": 0.00014090498492831004, "tps": 29420, "wall": 44626.8} {"step": 20034, "train_loss": 3.351701259613037, "lr": 0.00014088777606478597, "tps": 29418, "wall": 44632.4} {"step": 20035, "train_loss": 3.3715622425079346, "lr": 0.0001408705680974496, "tps": 29416, "wall": 44637.9} {"step": 20036, "train_loss": 3.2554705142974854, "lr": 0.00014085336102649567, "tps": 29414, "wall": 44643.4} {"step": 20037, "train_loss": 3.367703437805176, "lr": 0.00014083615485211906, "tps": 29411, "wall": 44648.9} {"step": 20038, "train_loss": 3.2588376998901367, "lr": 0.00014081894957451488, "tps": 29409, "wall": 44654.4} {"step": 20039, "train_loss": 3.3539907932281494, "lr": 0.0001408017451938779, "tps": 29407, "wall": 44659.9} {"step": 20040, "train_loss": 3.293870210647583, "lr": 0.00014078454171040296, "tps": 29405, "wall": 44665.5} {"step": 20041, "train_loss": 3.2916836738586426, "lr": 0.0001407673391242851, "tps": 29403, "wall": 44671.0} {"step": 20042, "train_loss": 3.3181040287017822, "lr": 0.0001407501374357191, "tps": 29401, "wall": 44676.6} {"step": 20043, "train_loss": 3.261171579360962, "lr": 0.00014073293664489976, "tps": 29398, "wall": 44682.1} {"step": 20044, "train_loss": 3.377406597137451, "lr": 0.00014071573675202207, "tps": 29396, "wall": 44687.6} {"step": 20045, "train_loss": 3.3384149074554443, "lr": 0.00014069853775728074, "tps": 29394, "wall": 44693.0} {"step": 20046, "train_loss": 3.291696071624756, "lr": 0.00014068133966087075, "tps": 29392, "wall": 44698.6} {"step": 20047, "train_loss": 3.3328373432159424, "lr": 0.00014066414246298684, "tps": 29390, "wall": 44704.1} {"step": 20048, "train_loss": 3.4276676177978516, "lr": 0.0001406469461638237, "tps": 29388, "wall": 44709.6} {"step": 20049, "train_loss": 3.3570876121520996, "lr": 0.00014062975076357636, "tps": 29385, "wall": 44715.1} {"step": 20050, "train_loss": 3.3029322624206543, "lr": 0.0001406125562624395, "tps": 29383, "wall": 44720.6} {"step": 20051, "train_loss": 3.373035430908203, "lr": 0.0001405953626606078, "tps": 29381, "wall": 44726.1} {"step": 20052, "train_loss": 3.27054500579834, "lr": 0.00014057816995827617, "tps": 29379, "wall": 44731.6} {"step": 20053, "train_loss": 3.244657039642334, "lr": 0.00014056097815563935, "tps": 29377, "wall": 44737.2} {"step": 20054, "train_loss": 3.315423011779785, "lr": 0.00014054378725289203, "tps": 29375, "wall": 44742.7} {"step": 20055, "train_loss": 3.3939080238342285, "lr": 0.00014052659725022907, "tps": 29373, "wall": 44748.1} {"step": 20056, "train_loss": 3.463609457015991, "lr": 0.0001405094081478451, "tps": 29370, "wall": 44753.6} {"step": 20057, "train_loss": 3.386187791824341, "lr": 0.00014049221994593474, "tps": 29368, "wall": 44759.2} {"step": 20058, "train_loss": 3.35085391998291, "lr": 0.0001404750326446929, "tps": 29366, "wall": 44764.7} {"step": 20059, "train_loss": 3.341536521911621, "lr": 0.0001404578462443142, "tps": 29364, "wall": 44770.1} {"step": 20060, "train_loss": 3.3022239208221436, "lr": 0.00014044066074499326, "tps": 29362, "wall": 44775.6} {"step": 20061, "train_loss": 3.2658190727233887, "lr": 0.00014042347614692487, "tps": 29360, "wall": 44781.1} {"step": 20062, "train_loss": 3.3581676483154297, "lr": 0.0001404062924503037, "tps": 29358, "wall": 44786.7} {"step": 20063, "train_loss": 3.2240564823150635, "lr": 0.00014038910965532422, "tps": 29355, "wall": 44792.2} {"step": 20064, "train_loss": 3.337970018386841, "lr": 0.00014037192776218134, "tps": 29353, "wall": 44797.7} {"step": 20065, "train_loss": 3.3308229446411133, "lr": 0.00014035474677106944, "tps": 29351, "wall": 44803.2} {"step": 20066, "train_loss": 3.308244466781616, "lr": 0.0001403375666821834, "tps": 29349, "wall": 44808.6} {"step": 20067, "train_loss": 3.4246623516082764, "lr": 0.00014032038749571765, "tps": 29347, "wall": 44814.1} {"step": 20068, "train_loss": 3.4376652240753174, "lr": 0.00014030320921186684, "tps": 29345, "wall": 44819.6} {"step": 20069, "train_loss": 3.2877755165100098, "lr": 0.00014028603183082567, "tps": 29343, "wall": 44825.1} {"step": 20070, "train_loss": 3.2404322624206543, "lr": 0.00014026885535278863, "tps": 29340, "wall": 44830.6} {"step": 20071, "train_loss": 3.404897689819336, "lr": 0.00014025167977795025, "tps": 29338, "wall": 44836.2} {"step": 20072, "train_loss": 3.246607542037964, "lr": 0.00014023450510650516, "tps": 29336, "wall": 44841.7} {"step": 20073, "train_loss": 3.314239978790283, "lr": 0.000140217331338648, "tps": 29334, "wall": 44847.3} {"step": 20074, "train_loss": 3.3544819355010986, "lr": 0.00014020015847457308, "tps": 29332, "wall": 44852.9} {"step": 20075, "train_loss": 3.288341522216797, "lr": 0.0001401829865144752, "tps": 29330, "wall": 44858.4} {"step": 20076, "train_loss": 3.288969039916992, "lr": 0.00014016581545854873, "tps": 29327, "wall": 44863.9} {"step": 20077, "train_loss": 3.3286242485046387, "lr": 0.0001401486453069882, "tps": 29325, "wall": 44869.5} {"step": 20078, "train_loss": 3.4730329513549805, "lr": 0.0001401314760599882, "tps": 29323, "wall": 44875.0} {"step": 20079, "train_loss": 3.331965923309326, "lr": 0.00014011430771774315, "tps": 29321, "wall": 44880.5} {"step": 20080, "train_loss": 3.2904272079467773, "lr": 0.00014009714028044744, "tps": 29319, "wall": 44886.1} {"step": 20081, "train_loss": 3.3390567302703857, "lr": 0.00014007997374829577, "tps": 29317, "wall": 44891.6} {"step": 20082, "train_loss": 3.373790740966797, "lr": 0.00014006280812148237, "tps": 29315, "wall": 44897.1} {"step": 20083, "train_loss": 3.331829309463501, "lr": 0.0001400456434002019, "tps": 29312, "wall": 44902.6} {"step": 20084, "train_loss": 3.362959384918213, "lr": 0.00014002847958464865, "tps": 29310, "wall": 44908.2} {"step": 20085, "train_loss": 3.303175926208496, "lr": 0.00014001131667501713, "tps": 29308, "wall": 44913.8} {"step": 20086, "train_loss": 3.2870006561279297, "lr": 0.00013999415467150176, "tps": 29306, "wall": 44919.3} {"step": 20087, "train_loss": 3.313413619995117, "lr": 0.00013997699357429694, "tps": 29304, "wall": 44924.8} {"step": 20088, "train_loss": 3.404628038406372, "lr": 0.000139959833383597, "tps": 29302, "wall": 44930.3} {"step": 20089, "train_loss": 3.3768715858459473, "lr": 0.00013994267409959648, "tps": 29299, "wall": 44935.8} {"step": 20090, "train_loss": 3.4455831050872803, "lr": 0.00013992551572248964, "tps": 29297, "wall": 44941.4} {"step": 20091, "train_loss": 3.2663230895996094, "lr": 0.00013990835825247085, "tps": 29295, "wall": 44946.9} {"step": 20092, "train_loss": 3.3894925117492676, "lr": 0.00013989120168973458, "tps": 29293, "wall": 44952.4} {"step": 20093, "train_loss": 3.3243894577026367, "lr": 0.0001398740460344751, "tps": 29291, "wall": 44958.0} {"step": 20094, "train_loss": 3.320538282394409, "lr": 0.0001398568912868867, "tps": 29289, "wall": 44963.5} {"step": 20095, "train_loss": 3.275911808013916, "lr": 0.00013983973744716385, "tps": 29287, "wall": 44969.0} {"step": 20096, "train_loss": 3.298269748687744, "lr": 0.00013982258451550076, "tps": 29284, "wall": 44974.6} {"step": 20097, "train_loss": 3.3308258056640625, "lr": 0.00013980543249209173, "tps": 29282, "wall": 44980.1} {"step": 20098, "train_loss": 3.3564624786376953, "lr": 0.00013978828137713116, "tps": 29280, "wall": 44985.7} {"step": 20099, "train_loss": 3.29769229888916, "lr": 0.00013977113117081318, "tps": 29278, "wall": 44991.2} {"step": 20100, "train_loss": 3.2876899242401123, "lr": 0.00013975398187333232, "tps": 29276, "wall": 44996.7} {"step": 20101, "train_loss": 3.332364082336426, "lr": 0.0001397368334848826, "tps": 29274, "wall": 45002.3} {"step": 20102, "train_loss": 3.304142475128174, "lr": 0.00013971968600565835, "tps": 29272, "wall": 45007.8} {"step": 20103, "train_loss": 3.392298698425293, "lr": 0.0001397025394358539, "tps": 29269, "wall": 45013.4} {"step": 20104, "train_loss": 3.281764030456543, "lr": 0.00013968539377566343, "tps": 29267, "wall": 45018.9} {"step": 20105, "train_loss": 3.353951930999756, "lr": 0.00013966824902528107, "tps": 29265, "wall": 45024.4} {"step": 20106, "train_loss": 3.3424177169799805, "lr": 0.00013965110518490123, "tps": 29263, "wall": 45030.0} {"step": 20107, "train_loss": 3.2808241844177246, "lr": 0.00013963396225471803, "tps": 29261, "wall": 45035.6} {"step": 20108, "train_loss": 3.3026089668273926, "lr": 0.00013961682023492554, "tps": 29259, "wall": 45041.1} {"step": 20109, "train_loss": 3.3925633430480957, "lr": 0.00013959967912571816, "tps": 29256, "wall": 45046.7} {"step": 20110, "train_loss": 3.3782122135162354, "lr": 0.00013958253892728997, "tps": 29254, "wall": 45052.2} {"step": 20111, "train_loss": 3.261183023452759, "lr": 0.00013956539963983503, "tps": 29252, "wall": 45057.8} {"step": 20112, "train_loss": 3.317941188812256, "lr": 0.0001395482612635477, "tps": 29250, "wall": 45063.3} {"step": 20113, "train_loss": 3.2527730464935303, "lr": 0.00013953112379862202, "tps": 29248, "wall": 45068.8} {"step": 20114, "train_loss": 3.3930931091308594, "lr": 0.000139513987245252, "tps": 29246, "wall": 45074.3} {"step": 20115, "train_loss": 3.340945243835449, "lr": 0.000139496851603632, "tps": 29244, "wall": 45079.9} {"step": 20116, "train_loss": 3.3434503078460693, "lr": 0.000139479716873956, "tps": 29242, "wall": 45085.4} {"step": 20117, "train_loss": 3.371919870376587, "lr": 0.00013946258305641806, "tps": 29239, "wall": 45090.9} {"step": 20118, "train_loss": 3.3343281745910645, "lr": 0.0001394454501512124, "tps": 29237, "wall": 45096.6} {"step": 20119, "train_loss": 3.3391880989074707, "lr": 0.000139428318158533, "tps": 29235, "wall": 45102.2} {"step": 20120, "train_loss": 3.2853686809539795, "lr": 0.00013941118707857402, "tps": 29233, "wall": 45107.7} {"step": 20121, "train_loss": 3.320456027984619, "lr": 0.00013939405691152946, "tps": 29231, "wall": 45113.3} {"step": 20122, "train_loss": 3.288262128829956, "lr": 0.00013937692765759332, "tps": 29229, "wall": 45118.8} {"step": 20123, "train_loss": 3.3067662715911865, "lr": 0.0001393597993169598, "tps": 29226, "wall": 45124.3} {"step": 20124, "train_loss": 3.294663667678833, "lr": 0.00013934267188982279, "tps": 29224, "wall": 45129.8} {"step": 20125, "train_loss": 3.322327136993408, "lr": 0.00013932554537637634, "tps": 29222, "wall": 45135.4} {"step": 20126, "train_loss": 3.4076626300811768, "lr": 0.0001393084197768145, "tps": 29220, "wall": 45140.9} {"step": 20127, "train_loss": 3.3402528762817383, "lr": 0.00013929129509133124, "tps": 29218, "wall": 45146.4} {"step": 20128, "train_loss": 3.290860652923584, "lr": 0.00013927417132012055, "tps": 29216, "wall": 45152.0} {"step": 20129, "train_loss": 3.2476649284362793, "lr": 0.0001392570484633764, "tps": 29214, "wall": 45157.6} {"step": 20130, "train_loss": 3.2826924324035645, "lr": 0.00013923992652129283, "tps": 29211, "wall": 45163.1} {"step": 20131, "train_loss": 3.3390510082244873, "lr": 0.0001392228054940637, "tps": 29209, "wall": 45168.7} {"step": 20132, "train_loss": 3.4119930267333984, "lr": 0.00013920568538188302, "tps": 29207, "wall": 45174.2} {"step": 20133, "train_loss": 3.328500986099243, "lr": 0.0001391885661849447, "tps": 29205, "wall": 45179.7} {"step": 20134, "train_loss": 3.267612934112549, "lr": 0.00013917144790344263, "tps": 29203, "wall": 45185.2} {"step": 20135, "train_loss": 3.286640167236328, "lr": 0.00013915433053757084, "tps": 29201, "wall": 45190.8} {"step": 20136, "train_loss": 3.356374740600586, "lr": 0.00013913721408752308, "tps": 29199, "wall": 45196.3} {"step": 20137, "train_loss": 3.343125581741333, "lr": 0.0001391200985534934, "tps": 29197, "wall": 45201.9} {"step": 20138, "train_loss": 3.333944320678711, "lr": 0.00013910298393567564, "tps": 29194, "wall": 45207.4} {"step": 20139, "train_loss": 3.348426342010498, "lr": 0.00013908587023426353, "tps": 29192, "wall": 45213.1} {"step": 20140, "train_loss": 3.2269344329833984, "lr": 0.0001390687574494512, "tps": 29190, "wall": 45218.6} {"step": 20141, "train_loss": 3.3520872592926025, "lr": 0.00013905164558143237, "tps": 29188, "wall": 45224.1} {"step": 20142, "train_loss": 3.2780299186706543, "lr": 0.00013903453463040075, "tps": 29186, "wall": 45229.6} {"step": 20143, "train_loss": 3.44787859916687, "lr": 0.0001390174245965504, "tps": 29184, "wall": 45235.2} {"step": 20144, "train_loss": 3.2239489555358887, "lr": 0.00013900031548007505, "tps": 29182, "wall": 45240.7} {"step": 20145, "train_loss": 3.392188549041748, "lr": 0.0001389832072811685, "tps": 29180, "wall": 45246.2} {"step": 20146, "train_loss": 3.366705894470215, "lr": 0.00013896610000002453, "tps": 29177, "wall": 45251.7} {"step": 20147, "train_loss": 3.3559043407440186, "lr": 0.00013894899363683694, "tps": 29175, "wall": 45257.3} {"step": 20148, "train_loss": 3.376677989959717, "lr": 0.00013893188819179958, "tps": 29173, "wall": 45262.8} {"step": 20149, "train_loss": 3.377859115600586, "lr": 0.00013891478366510622, "tps": 29171, "wall": 45268.4} {"step": 20150, "train_loss": 3.3543806076049805, "lr": 0.00013889768005695045, "tps": 29169, "wall": 45274.0} {"step": 20151, "train_loss": 3.234774112701416, "lr": 0.00013888057736752624, "tps": 29167, "wall": 45279.5} {"step": 20152, "train_loss": 3.3033366203308105, "lr": 0.00013886347559702723, "tps": 29165, "wall": 45285.0} {"step": 20153, "train_loss": 3.3366901874542236, "lr": 0.00013884637474564712, "tps": 29163, "wall": 45290.6} {"step": 20154, "train_loss": 3.386195659637451, "lr": 0.00013882927481357972, "tps": 29160, "wall": 45296.2} {"step": 20155, "train_loss": 3.328359603881836, "lr": 0.00013881217580101867, "tps": 29158, "wall": 45301.7} {"step": 20156, "train_loss": 3.3030338287353516, "lr": 0.00013879507770815763, "tps": 29156, "wall": 45307.2} {"step": 20157, "train_loss": 3.3140885829925537, "lr": 0.0001387779805351904, "tps": 29154, "wall": 45312.8} {"step": 20158, "train_loss": 3.4125514030456543, "lr": 0.00013876088428231063, "tps": 29152, "wall": 45318.3} {"step": 20159, "train_loss": 3.3222286701202393, "lr": 0.00013874378894971186, "tps": 29150, "wall": 45323.9} {"step": 20160, "train_loss": 3.3836288452148438, "lr": 0.0001387266945375879, "tps": 29148, "wall": 45329.4} {"step": 20161, "train_loss": 3.2905311584472656, "lr": 0.00013870960104613231, "tps": 29146, "wall": 45335.0} {"step": 20162, "train_loss": 3.336474895477295, "lr": 0.0001386925084755388, "tps": 29143, "wall": 45340.5} {"step": 20163, "train_loss": 3.3400940895080566, "lr": 0.00013867541682600096, "tps": 29141, "wall": 45346.0} {"step": 20164, "train_loss": 3.3711352348327637, "lr": 0.00013865832609771234, "tps": 29139, "wall": 45351.6} {"step": 20165, "train_loss": 3.3045382499694824, "lr": 0.00013864123629086668, "tps": 29137, "wall": 45357.1} {"step": 20166, "train_loss": 3.227773666381836, "lr": 0.00013862414740565746, "tps": 29135, "wall": 45362.6} {"step": 20167, "train_loss": 3.292757511138916, "lr": 0.00013860705944227823, "tps": 29133, "wall": 45368.1} {"step": 20168, "train_loss": 3.306582450866699, "lr": 0.00013858997240092275, "tps": 29131, "wall": 45373.7} {"step": 20169, "train_loss": 3.3369650840759277, "lr": 0.00013857288628178443, "tps": 29129, "wall": 45379.2} {"step": 20170, "train_loss": 3.30135440826416, "lr": 0.0001385558010850568, "tps": 29127, "wall": 45384.7} {"step": 20171, "train_loss": 3.307117462158203, "lr": 0.0001385387168109335, "tps": 29125, "wall": 45390.2} {"step": 20172, "train_loss": 3.3108232021331787, "lr": 0.0001385216334596081, "tps": 29122, "wall": 45395.9} {"step": 20173, "train_loss": 3.245558023452759, "lr": 0.0001385045510312739, "tps": 29120, "wall": 45401.4} {"step": 20174, "train_loss": 3.2893168926239014, "lr": 0.00013848746952612465, "tps": 29118, "wall": 45406.9} {"step": 20175, "train_loss": 3.1465132236480713, "lr": 0.00013847038894435377, "tps": 29116, "wall": 45412.4} {"step": 20176, "train_loss": 3.2206408977508545, "lr": 0.00013845330928615463, "tps": 29114, "wall": 45418.0} {"step": 20177, "train_loss": 3.338519811630249, "lr": 0.00013843623055172092, "tps": 29112, "wall": 45423.5} {"step": 20178, "train_loss": 3.285702705383301, "lr": 0.0001384191527412459, "tps": 29110, "wall": 45429.1} {"step": 20179, "train_loss": 3.3391356468200684, "lr": 0.00013840207585492323, "tps": 29108, "wall": 45434.6} {"step": 20180, "train_loss": 3.429234266281128, "lr": 0.00013838499989294627, "tps": 29106, "wall": 45440.1} {"step": 20181, "train_loss": 3.352144479751587, "lr": 0.00013836792485550837, "tps": 29103, "wall": 45445.7} {"step": 20182, "train_loss": 3.40034818649292, "lr": 0.00013835085074280308, "tps": 29101, "wall": 45451.2} {"step": 20183, "train_loss": 3.268477439880371, "lr": 0.00013833377755502376, "tps": 29099, "wall": 45456.8} {"step": 20184, "train_loss": 3.290254592895508, "lr": 0.00013831670529236377, "tps": 29097, "wall": 45462.3} {"step": 20185, "train_loss": 3.4652023315429688, "lr": 0.00013829963395501667, "tps": 29095, "wall": 45467.8} {"step": 20186, "train_loss": 3.3072338104248047, "lr": 0.00013828256354317568, "tps": 29093, "wall": 45473.4} {"step": 20187, "train_loss": 3.489145517349243, "lr": 0.00013826549405703418, "tps": 29091, "wall": 45478.9} {"step": 20188, "train_loss": 3.328278064727783, "lr": 0.00013824842549678564, "tps": 29089, "wall": 45484.5} {"step": 20189, "train_loss": 3.2609493732452393, "lr": 0.0001382313578626234, "tps": 29087, "wall": 45490.0} {"step": 20190, "train_loss": 3.279179096221924, "lr": 0.00013821429115474065, "tps": 29084, "wall": 45495.6} {"step": 20191, "train_loss": 3.20792555809021, "lr": 0.00013819722537333095, "tps": 29082, "wall": 45501.1} {"step": 20192, "train_loss": 3.4817686080932617, "lr": 0.00013818016051858747, "tps": 29080, "wall": 45506.6} {"step": 20193, "train_loss": 3.314286470413208, "lr": 0.00013816309659070352, "tps": 29078, "wall": 45512.2} {"step": 20194, "train_loss": 3.321930170059204, "lr": 0.00013814603358987246, "tps": 29076, "wall": 45517.8} {"step": 20195, "train_loss": 3.3205015659332275, "lr": 0.00013812897151628753, "tps": 29074, "wall": 45523.4} {"step": 20196, "train_loss": 3.394011974334717, "lr": 0.0001381119103701421, "tps": 29072, "wall": 45529.0} {"step": 20197, "train_loss": 3.3450207710266113, "lr": 0.00013809485015162936, "tps": 29070, "wall": 45534.5} {"step": 20198, "train_loss": 3.453300952911377, "lr": 0.00013807779086094256, "tps": 29068, "wall": 45540.0} {"step": 20199, "train_loss": 3.2901148796081543, "lr": 0.000138060732498275, "tps": 29066, "wall": 45545.5} {"step": 20200, "train_loss": 3.3503360748291016, "lr": 0.00013804367506381991, "tps": 29063, "wall": 45551.0} {"step": 20201, "train_loss": 3.3257062435150146, "lr": 0.00013802661855777046, "tps": 29061, "wall": 45556.6} {"step": 20202, "train_loss": 3.3902039527893066, "lr": 0.00013800956298031997, "tps": 29059, "wall": 45562.1} {"step": 20203, "train_loss": 3.393002986907959, "lr": 0.00013799250833166157, "tps": 29057, "wall": 45567.6} {"step": 20204, "train_loss": 3.3005971908569336, "lr": 0.0001379754546119884, "tps": 29055, "wall": 45573.3} {"step": 20205, "train_loss": 3.2603659629821777, "lr": 0.00013795840182149379, "tps": 29053, "wall": 45578.8} {"step": 20206, "train_loss": 3.3248820304870605, "lr": 0.00013794134996037086, "tps": 29051, "wall": 45584.3} {"step": 20207, "train_loss": 3.444502830505371, "lr": 0.0001379242990288127, "tps": 29049, "wall": 45589.8} {"step": 20208, "train_loss": 3.4057791233062744, "lr": 0.00013790724902701252, "tps": 29047, "wall": 45595.4} {"step": 20209, "train_loss": 3.2975821495056152, "lr": 0.00013789019995516353, "tps": 29045, "wall": 45601.0} {"step": 20210, "train_loss": 3.3675379753112793, "lr": 0.0001378731518134587, "tps": 29042, "wall": 45606.6} {"step": 20211, "train_loss": 3.3303937911987305, "lr": 0.00013785610460209134, "tps": 29040, "wall": 45612.1} {"step": 20212, "train_loss": 3.268861770629883, "lr": 0.00013783905832125443, "tps": 29038, "wall": 45617.7} {"step": 20213, "train_loss": 3.3401060104370117, "lr": 0.0001378220129711411, "tps": 29036, "wall": 45623.2} {"step": 20214, "train_loss": 3.2976598739624023, "lr": 0.00013780496855194448, "tps": 29034, "wall": 45628.8} {"step": 20215, "train_loss": 3.2497081756591797, "lr": 0.00013778792506385755, "tps": 29032, "wall": 45634.5} {"step": 20216, "train_loss": 3.26303768157959, "lr": 0.00013777088250707353, "tps": 29030, "wall": 45640.0} {"step": 20217, "train_loss": 3.3909239768981934, "lr": 0.00013775384088178543, "tps": 29028, "wall": 45645.5} {"step": 20218, "train_loss": 3.2602219581604004, "lr": 0.00013773680018818615, "tps": 29026, "wall": 45651.0} {"step": 20219, "train_loss": 3.4238548278808594, "lr": 0.00013771976042646896, "tps": 29024, "wall": 45656.6} {"step": 20220, "train_loss": 3.2242727279663086, "lr": 0.00013770272159682674, "tps": 29021, "wall": 45662.2} {"step": 20221, "train_loss": 3.300002098083496, "lr": 0.00013768568369945254, "tps": 29019, "wall": 45667.7} {"step": 20222, "train_loss": 3.3227193355560303, "lr": 0.00013766864673453937, "tps": 29017, "wall": 45673.3} {"step": 20223, "train_loss": 3.4310221672058105, "lr": 0.00013765161070228022, "tps": 29015, "wall": 45678.8} {"step": 20224, "train_loss": 3.247096061706543, "lr": 0.00013763457560286808, "tps": 29013, "wall": 45684.3} {"step": 20225, "train_loss": 3.4035050868988037, "lr": 0.00013761754143649593, "tps": 29011, "wall": 45689.9} {"step": 20226, "train_loss": 3.456683874130249, "lr": 0.00013760050820335677, "tps": 29009, "wall": 45695.5} {"step": 20227, "train_loss": 3.332874298095703, "lr": 0.0001375834759036434, "tps": 29007, "wall": 45701.0} {"step": 20228, "train_loss": 3.3220977783203125, "lr": 0.00013756644453754893, "tps": 29005, "wall": 45706.6} {"step": 20229, "train_loss": 3.363345146179199, "lr": 0.00013754941410526632, "tps": 29003, "wall": 45712.1} {"step": 20230, "train_loss": 3.310333490371704, "lr": 0.00013753238460698826, "tps": 29001, "wall": 45717.6} {"step": 20231, "train_loss": 3.2871077060699463, "lr": 0.00013751535604290788, "tps": 28998, "wall": 45723.2} {"step": 20232, "train_loss": 3.403101682662964, "lr": 0.00013749832841321798, "tps": 28996, "wall": 45728.7} {"step": 20233, "train_loss": 3.3229775428771973, "lr": 0.00013748130171811152, "tps": 28994, "wall": 45734.3} {"step": 20234, "train_loss": 3.2905964851379395, "lr": 0.00013746427595778135, "tps": 28992, "wall": 45739.8} {"step": 20235, "train_loss": 3.3533999919891357, "lr": 0.00013744725113242024, "tps": 28990, "wall": 45745.4} {"step": 20236, "train_loss": 3.4098269939422607, "lr": 0.00013743022724222126, "tps": 28988, "wall": 45750.9} {"step": 20237, "train_loss": 3.407040596008301, "lr": 0.00013741320428737707, "tps": 28986, "wall": 45756.6} {"step": 20238, "train_loss": 3.269449472427368, "lr": 0.00013739618226808054, "tps": 28984, "wall": 45762.1} {"step": 20239, "train_loss": 3.282449245452881, "lr": 0.00013737916118452455, "tps": 28982, "wall": 45767.6} {"step": 20240, "train_loss": 3.2826061248779297, "lr": 0.00013736214103690191, "tps": 28980, "wall": 45773.3} {"step": 20241, "train_loss": 3.3399386405944824, "lr": 0.00013734512182540538, "tps": 28978, "wall": 45778.8} {"step": 20242, "train_loss": 3.3147988319396973, "lr": 0.0001373281035502278, "tps": 28975, "wall": 45784.3} {"step": 20243, "train_loss": 3.2832188606262207, "lr": 0.000137311086211562, "tps": 28973, "wall": 45789.9} {"step": 20244, "train_loss": 3.31520414352417, "lr": 0.00013729406980960053, "tps": 28971, "wall": 45795.4} {"step": 20245, "train_loss": 3.357032060623169, "lr": 0.00013727705434453643, "tps": 28969, "wall": 45800.9} {"step": 20246, "train_loss": 3.272834062576294, "lr": 0.00013726003981656234, "tps": 28967, "wall": 45806.5} {"step": 20247, "train_loss": 3.349013090133667, "lr": 0.0001372430262258709, "tps": 28965, "wall": 45812.1} {"step": 20248, "train_loss": 3.4748921394348145, "lr": 0.00013722601357265502, "tps": 28963, "wall": 45817.7} {"step": 20249, "train_loss": 3.206502914428711, "lr": 0.00013720900185710728, "tps": 28961, "wall": 45823.2} {"step": 20250, "train_loss": 3.2963037490844727, "lr": 0.00013719199107942048, "tps": 28959, "wall": 45828.8} {"step": 20251, "train_loss": 3.4078750610351562, "lr": 0.00013717498123978734, "tps": 28957, "wall": 45834.3} {"step": 20252, "train_loss": 3.251826763153076, "lr": 0.00013715797233840036, "tps": 28955, "wall": 45839.8} {"step": 20253, "train_loss": 3.3666772842407227, "lr": 0.00013714096437545247, "tps": 28953, "wall": 45845.4} {"step": 20254, "train_loss": 3.277228355407715, "lr": 0.0001371239573511362, "tps": 28951, "wall": 45851.0} {"step": 20255, "train_loss": 3.326216697692871, "lr": 0.00013710695126564418, "tps": 28948, "wall": 45856.5} {"step": 20256, "train_loss": 3.2866029739379883, "lr": 0.0001370899461191691, "tps": 28946, "wall": 45862.0} {"step": 20257, "train_loss": 3.385364532470703, "lr": 0.00013707294191190366, "tps": 28944, "wall": 45867.6} {"step": 20258, "train_loss": 3.3191709518432617, "lr": 0.0001370559386440403, "tps": 28942, "wall": 45873.2} {"step": 20259, "train_loss": 3.4339232444763184, "lr": 0.00013703893631577188, "tps": 28940, "wall": 45878.8} {"step": 20260, "train_loss": 3.290860414505005, "lr": 0.00013702193492729086, "tps": 28938, "wall": 45884.4} {"step": 20261, "train_loss": 3.2495107650756836, "lr": 0.00013700493447878976, "tps": 28936, "wall": 45889.9} {"step": 20262, "train_loss": 3.4004507064819336, "lr": 0.00013698793497046133, "tps": 28934, "wall": 45895.5} {"step": 20263, "train_loss": 3.3253707885742188, "lr": 0.0001369709364024981, "tps": 28932, "wall": 45901.0} {"step": 20264, "train_loss": 3.3646998405456543, "lr": 0.00013695393877509245, "tps": 28930, "wall": 45906.6} {"step": 20265, "train_loss": 3.291822671890259, "lr": 0.00013693694208843723, "tps": 28928, "wall": 45912.2} {"step": 20266, "train_loss": 3.298630714416504, "lr": 0.00013691994634272475, "tps": 28926, "wall": 45917.8} {"step": 20267, "train_loss": 3.3976082801818848, "lr": 0.0001369029515381476, "tps": 28923, "wall": 45923.3} {"step": 20268, "train_loss": 3.3783206939697266, "lr": 0.00013688595767489834, "tps": 28921, "wall": 45928.9} {"step": 20269, "train_loss": 3.27435302734375, "lr": 0.0001368689647531694, "tps": 28919, "wall": 45934.5} {"step": 20270, "train_loss": 3.3339269161224365, "lr": 0.00013685197277315335, "tps": 28917, "wall": 45940.1} {"step": 20271, "train_loss": 3.3280744552612305, "lr": 0.00013683498173504272, "tps": 28915, "wall": 45945.6} {"step": 20272, "train_loss": 3.2211766242980957, "lr": 0.0001368179916390298, "tps": 28913, "wall": 45951.2} {"step": 20273, "train_loss": 3.2950029373168945, "lr": 0.00013680100248530724, "tps": 28911, "wall": 45956.7} {"step": 20274, "train_loss": 3.361605644226074, "lr": 0.00013678401427406745, "tps": 28909, "wall": 45962.2} {"step": 20275, "train_loss": 3.3558526039123535, "lr": 0.00013676702700550277, "tps": 28907, "wall": 45967.8} {"step": 20276, "train_loss": 3.3463521003723145, "lr": 0.00013675004067980576, "tps": 28905, "wall": 45973.4} {"step": 20277, "train_loss": 3.432651996612549, "lr": 0.00013673305529716886, "tps": 28903, "wall": 45978.9} {"step": 20278, "train_loss": 3.286526679992676, "lr": 0.00013671607085778426, "tps": 28901, "wall": 45984.4} {"step": 20279, "train_loss": 3.3265490531921387, "lr": 0.0001366990873618446, "tps": 28899, "wall": 45990.0} {"step": 20280, "train_loss": 3.3437206745147705, "lr": 0.00013668210480954223, "tps": 28897, "wall": 45995.6} {"step": 20281, "train_loss": 3.2006940841674805, "lr": 0.0001366651232010694, "tps": 28894, "wall": 46001.2} {"step": 20282, "train_loss": 3.2844398021698, "lr": 0.0001366481425366186, "tps": 28892, "wall": 46006.7} {"step": 20283, "train_loss": 3.2953720092773438, "lr": 0.0001366311628163822, "tps": 28890, "wall": 46012.2} {"step": 20284, "train_loss": 3.406496047973633, "lr": 0.00013661418404055237, "tps": 28888, "wall": 46017.8} {"step": 20285, "train_loss": 3.320963144302368, "lr": 0.0001365972062093217, "tps": 28886, "wall": 46023.3} {"step": 20286, "train_loss": 3.2927889823913574, "lr": 0.00013658022932288227, "tps": 28884, "wall": 46028.9} {"step": 20287, "train_loss": 3.1319642066955566, "lr": 0.0001365632533814266, "tps": 28882, "wall": 46034.4} {"step": 20288, "train_loss": 3.3485329151153564, "lr": 0.00013654627838514692, "tps": 28880, "wall": 46040.0} {"step": 20289, "train_loss": 3.3767409324645996, "lr": 0.00013652930433423545, "tps": 28878, "wall": 46045.5} {"step": 20290, "train_loss": 3.346217632293701, "lr": 0.00013651233122888458, "tps": 28876, "wall": 46051.1} {"step": 20291, "train_loss": 3.284923791885376, "lr": 0.00013649535906928658, "tps": 28874, "wall": 46056.7} {"step": 20292, "train_loss": 3.4200284481048584, "lr": 0.00013647838785563359, "tps": 28872, "wall": 46062.3} {"step": 20293, "train_loss": 3.298473358154297, "lr": 0.000136461417588118, "tps": 28870, "wall": 46067.9} {"step": 20294, "train_loss": 3.303316593170166, "lr": 0.00013644444826693195, "tps": 28868, "wall": 46073.4} {"step": 20295, "train_loss": 3.2814111709594727, "lr": 0.0001364274798922677, "tps": 28866, "wall": 46079.0} {"step": 20296, "train_loss": 3.2576563358306885, "lr": 0.00013641051246431754, "tps": 28863, "wall": 46084.5} {"step": 20297, "train_loss": 3.3796799182891846, "lr": 0.00013639354598327357, "tps": 28861, "wall": 46090.1} {"step": 20298, "train_loss": 3.3440253734588623, "lr": 0.00013637658044932802, "tps": 28859, "wall": 46095.6} {"step": 20299, "train_loss": 3.2803399562835693, "lr": 0.00013635961586267313, "tps": 28857, "wall": 46101.2} {"step": 20300, "train_loss": 3.363971710205078, "lr": 0.00013634265222350105, "tps": 28855, "wall": 46106.7} {"step": 20301, "train_loss": 3.386082649230957, "lr": 0.00013632568953200383, "tps": 28853, "wall": 46112.3} {"step": 20302, "train_loss": 3.204596996307373, "lr": 0.00013630872778837383, "tps": 28851, "wall": 46117.9} {"step": 20303, "train_loss": 3.354766368865967, "lr": 0.0001362917669928031, "tps": 28849, "wall": 46123.5} {"step": 20304, "train_loss": 3.2922616004943848, "lr": 0.00013627480714548367, "tps": 28847, "wall": 46129.0} {"step": 20305, "train_loss": 3.2042312622070312, "lr": 0.00013625784824660784, "tps": 28845, "wall": 46134.6} {"step": 20306, "train_loss": 3.384298324584961, "lr": 0.00013624089029636756, "tps": 28843, "wall": 46140.1} {"step": 20307, "train_loss": 3.3659279346466064, "lr": 0.00013622393329495503, "tps": 28841, "wall": 46145.7} {"step": 20308, "train_loss": 3.3408541679382324, "lr": 0.00013620697724256236, "tps": 28839, "wall": 46151.3} {"step": 20309, "train_loss": 3.26658034324646, "lr": 0.0001361900221393815, "tps": 28837, "wall": 46156.8} {"step": 20310, "train_loss": 3.3243613243103027, "lr": 0.0001361730679856047, "tps": 28835, "wall": 46162.4} {"step": 20311, "train_loss": 3.356283664703369, "lr": 0.00013615611478142388, "tps": 28833, "wall": 46167.9} {"step": 20312, "train_loss": 3.2319066524505615, "lr": 0.0001361391625270311, "tps": 28831, "wall": 46173.5} {"step": 20313, "train_loss": 3.417454242706299, "lr": 0.00013612221122261855, "tps": 28829, "wall": 46179.1} {"step": 20314, "train_loss": 3.2989439964294434, "lr": 0.00013610526086837798, "tps": 28827, "wall": 46184.6} {"step": 20315, "train_loss": 3.2747693061828613, "lr": 0.00013608831146450165, "tps": 28824, "wall": 46190.1} {"step": 20316, "train_loss": 3.312009334564209, "lr": 0.00013607136301118145, "tps": 28822, "wall": 46195.7} {"step": 20317, "train_loss": 3.3318979740142822, "lr": 0.0001360544155086093, "tps": 28820, "wall": 46201.2} {"step": 20318, "train_loss": 3.1888656616210938, "lr": 0.00013603746895697735, "tps": 28818, "wall": 46206.8} {"step": 20319, "train_loss": 3.334367275238037, "lr": 0.00013602052335647753, "tps": 28816, "wall": 46212.3} {"step": 20320, "train_loss": 3.3234763145446777, "lr": 0.00013600357870730164, "tps": 28814, "wall": 46217.9} {"step": 20321, "train_loss": 3.230215072631836, "lr": 0.00013598663500964184, "tps": 28812, "wall": 46223.5} {"step": 20322, "train_loss": 3.3032591342926025, "lr": 0.00013596969226368997, "tps": 28810, "wall": 46229.0} {"step": 20323, "train_loss": 3.270003318786621, "lr": 0.000135952750469638, "tps": 28808, "wall": 46234.6} {"step": 20324, "train_loss": 3.330860137939453, "lr": 0.00013593580962767779, "tps": 28806, "wall": 46240.1} {"step": 20325, "train_loss": 3.3712029457092285, "lr": 0.0001359188697380013, "tps": 28804, "wall": 46245.7} {"step": 20326, "train_loss": 3.3152072429656982, "lr": 0.00013590193080080033, "tps": 28802, "wall": 46251.2} {"step": 20327, "train_loss": 3.175875186920166, "lr": 0.00013588499281626693, "tps": 28800, "wall": 46256.8} {"step": 20328, "train_loss": 3.2668662071228027, "lr": 0.00013586805578459277, "tps": 28798, "wall": 46262.3} {"step": 20329, "train_loss": 3.3511853218078613, "lr": 0.00013585111970596992, "tps": 28796, "wall": 46267.9} {"step": 20330, "train_loss": 3.1341938972473145, "lr": 0.00013583418458059017, "tps": 28794, "wall": 46273.4} {"step": 20331, "train_loss": 3.2716734409332275, "lr": 0.00013581725040864523, "tps": 28792, "wall": 46279.0} {"step": 20332, "train_loss": 3.3460588455200195, "lr": 0.00013580031719032708, "tps": 28790, "wall": 46284.6} {"step": 20333, "train_loss": 3.2492241859436035, "lr": 0.00013578338492582748, "tps": 28788, "wall": 46290.1} {"step": 20334, "train_loss": 3.365009307861328, "lr": 0.00013576645361533825, "tps": 28786, "wall": 46295.8} {"step": 20335, "train_loss": 3.3142786026000977, "lr": 0.00013574952325905122, "tps": 28784, "wall": 46301.3} {"step": 20336, "train_loss": 3.312119960784912, "lr": 0.00013573259385715812, "tps": 28782, "wall": 46306.8} {"step": 20337, "train_loss": 3.2229859828948975, "lr": 0.00013571566540985074, "tps": 28779, "wall": 46312.4} {"step": 20338, "train_loss": 3.333730936050415, "lr": 0.0001356987379173209, "tps": 28777, "wall": 46318.0} {"step": 20339, "train_loss": 3.3446359634399414, "lr": 0.00013568181137976035, "tps": 28775, "wall": 46323.6} {"step": 20340, "train_loss": 3.28125, "lr": 0.00013566488579736067, "tps": 28773, "wall": 46329.1} {"step": 20341, "train_loss": 3.370429277420044, "lr": 0.00013564796117031386, "tps": 28771, "wall": 46334.7} {"step": 20342, "train_loss": 3.2993407249450684, "lr": 0.0001356310374988115, "tps": 28769, "wall": 46340.2} {"step": 20343, "train_loss": 3.2744879722595215, "lr": 0.0001356141147830452, "tps": 28767, "wall": 46345.8} {"step": 20344, "train_loss": 3.2586772441864014, "lr": 0.00013559719302320687, "tps": 28765, "wall": 46351.3} {"step": 20345, "train_loss": 3.449591875076294, "lr": 0.0001355802722194881, "tps": 28763, "wall": 46357.0} {"step": 20346, "train_loss": 3.328317165374756, "lr": 0.00013556335237208052, "tps": 28761, "wall": 46362.5} {"step": 20347, "train_loss": 3.227177858352661, "lr": 0.0001355464334811759, "tps": 28759, "wall": 46368.1} {"step": 20348, "train_loss": 3.349640130996704, "lr": 0.0001355295155469658, "tps": 28757, "wall": 46373.6} {"step": 20349, "train_loss": 3.2682766914367676, "lr": 0.00013551259856964194, "tps": 28755, "wall": 46379.2} {"step": 20350, "train_loss": 3.349781036376953, "lr": 0.000135495682549396, "tps": 28753, "wall": 46384.7} {"step": 20351, "train_loss": 3.2951111793518066, "lr": 0.00013547876748641944, "tps": 28751, "wall": 46390.3} {"step": 20352, "train_loss": 3.215104818344116, "lr": 0.00013546185338090405, "tps": 28749, "wall": 46395.9} {"step": 20353, "train_loss": 3.1948466300964355, "lr": 0.00013544494023304135, "tps": 28747, "wall": 46401.4} {"step": 20354, "train_loss": 3.3390159606933594, "lr": 0.00013542802804302286, "tps": 28745, "wall": 46407.0} {"step": 20355, "train_loss": 3.232569932937622, "lr": 0.00013541111681104035, "tps": 28743, "wall": 46412.6} {"step": 20356, "train_loss": 3.3012664318084717, "lr": 0.00013539420653728524, "tps": 28741, "wall": 46418.2} {"step": 20357, "train_loss": 3.2674734592437744, "lr": 0.00013537729722194912, "tps": 28739, "wall": 46423.8} {"step": 20358, "train_loss": 3.221738815307617, "lr": 0.00013536038886522358, "tps": 28737, "wall": 46429.3} {"step": 20359, "train_loss": 3.3684468269348145, "lr": 0.00013534348146730015, "tps": 28735, "wall": 46434.8} {"step": 20360, "train_loss": 3.422250270843506, "lr": 0.00013532657502837028, "tps": 28733, "wall": 46440.4} {"step": 20361, "train_loss": 3.351032257080078, "lr": 0.0001353096695486256, "tps": 28731, "wall": 46446.0} {"step": 20362, "train_loss": 3.3245270252227783, "lr": 0.00013529276502825756, "tps": 28729, "wall": 46451.5} {"step": 20363, "train_loss": 3.3116049766540527, "lr": 0.0001352758614674576, "tps": 28727, "wall": 46457.1} {"step": 20364, "train_loss": 3.426892042160034, "lr": 0.00013525895886641736, "tps": 28725, "wall": 46462.7} {"step": 20365, "train_loss": 3.286008358001709, "lr": 0.00013524205722532812, "tps": 28722, "wall": 46468.3} {"step": 20366, "train_loss": 3.3737478256225586, "lr": 0.00013522515654438154, "tps": 28720, "wall": 46473.9} {"step": 20367, "train_loss": 3.307877540588379, "lr": 0.00013520825682376893, "tps": 28718, "wall": 46479.5} {"step": 20368, "train_loss": 3.3591995239257812, "lr": 0.0001351913580636817, "tps": 28716, "wall": 46485.0} {"step": 20369, "train_loss": 3.3255066871643066, "lr": 0.00013517446026431148, "tps": 28714, "wall": 46490.6} {"step": 20370, "train_loss": 3.31095027923584, "lr": 0.00013515756342584952, "tps": 28712, "wall": 46496.2} {"step": 20371, "train_loss": 3.2971067428588867, "lr": 0.0001351406675484872, "tps": 28710, "wall": 46501.7} {"step": 20372, "train_loss": 3.24045991897583, "lr": 0.0001351237726324161, "tps": 28708, "wall": 46507.2} {"step": 20373, "train_loss": 3.316494941711426, "lr": 0.00013510687867782743, "tps": 28706, "wall": 46512.8} {"step": 20374, "train_loss": 3.30141544342041, "lr": 0.00013508998568491262, "tps": 28704, "wall": 46518.4} {"step": 20375, "train_loss": 3.291825294494629, "lr": 0.00013507309365386308, "tps": 28702, "wall": 46524.0} {"step": 20376, "train_loss": 3.262106418609619, "lr": 0.00013505620258487015, "tps": 28700, "wall": 46529.5} {"step": 20377, "train_loss": 3.2170968055725098, "lr": 0.00013503931247812507, "tps": 28698, "wall": 46535.2} {"step": 20378, "train_loss": 3.262803554534912, "lr": 0.00013502242333381933, "tps": 28696, "wall": 46540.7} {"step": 20379, "train_loss": 3.342442274093628, "lr": 0.00013500553515214417, "tps": 28694, "wall": 46546.3} {"step": 20380, "train_loss": 3.326307535171509, "lr": 0.00013498864793329087, "tps": 28692, "wall": 46551.8} {"step": 20381, "train_loss": 3.3784830570220947, "lr": 0.0001349717616774508, "tps": 28690, "wall": 46557.4} {"step": 20382, "train_loss": 3.2730517387390137, "lr": 0.00013495487638481515, "tps": 28688, "wall": 46563.0} {"step": 20383, "train_loss": 3.3835887908935547, "lr": 0.00013493799205557534, "tps": 28686, "wall": 46568.5} {"step": 20384, "train_loss": 3.4624180793762207, "lr": 0.00013492110868992255, "tps": 28684, "wall": 46574.1} {"step": 20385, "train_loss": 3.2275867462158203, "lr": 0.00013490422628804796, "tps": 28682, "wall": 46579.7} {"step": 20386, "train_loss": 3.29841947555542, "lr": 0.00013488734485014297, "tps": 28680, "wall": 46585.2} {"step": 20387, "train_loss": 3.369089365005493, "lr": 0.00013487046437639876, "tps": 28678, "wall": 46590.8} {"step": 20388, "train_loss": 3.372037410736084, "lr": 0.00013485358486700646, "tps": 28676, "wall": 46596.5} {"step": 20389, "train_loss": 3.370941400527954, "lr": 0.00013483670632215744, "tps": 28674, "wall": 46602.0} {"step": 20390, "train_loss": 3.322786808013916, "lr": 0.0001348198287420428, "tps": 28672, "wall": 46607.6} {"step": 20391, "train_loss": 3.4202728271484375, "lr": 0.00013480295212685368, "tps": 28670, "wall": 46613.1} {"step": 20392, "train_loss": 3.362794876098633, "lr": 0.0001347860764767814, "tps": 28668, "wall": 46618.7} {"step": 20393, "train_loss": 3.3686299324035645, "lr": 0.00013476920179201707, "tps": 28666, "wall": 46624.2} {"step": 20394, "train_loss": 3.3782639503479004, "lr": 0.00013475232807275175, "tps": 28664, "wall": 46629.8} {"step": 20395, "train_loss": 3.326158285140991, "lr": 0.00013473545531917668, "tps": 28662, "wall": 46635.4} {"step": 20396, "train_loss": 3.3793423175811768, "lr": 0.00013471858353148307, "tps": 28660, "wall": 46640.9} {"step": 20397, "train_loss": 3.241534471511841, "lr": 0.00013470171270986184, "tps": 28658, "wall": 46646.5} {"step": 20398, "train_loss": 3.321023464202881, "lr": 0.00013468484285450436, "tps": 28656, "wall": 46652.1} {"step": 20399, "train_loss": 3.327239513397217, "lr": 0.00013466797396560155, "tps": 28654, "wall": 46657.7} {"step": 20400, "train_loss": 3.278765916824341, "lr": 0.00013465110604334444, "tps": 28652, "wall": 46663.3} {"step": 20401, "train_loss": 3.3454108238220215, "lr": 0.00013463423908792433, "tps": 28650, "wall": 46668.8} {"step": 20402, "train_loss": 3.3345937728881836, "lr": 0.0001346173730995321, "tps": 28648, "wall": 46674.4} {"step": 20403, "train_loss": 3.3853020668029785, "lr": 0.00013460050807835897, "tps": 28646, "wall": 46679.9} {"step": 20404, "train_loss": 3.288356065750122, "lr": 0.0001345836440245959, "tps": 28644, "wall": 46685.5} {"step": 20405, "train_loss": 3.3348536491394043, "lr": 0.00013456678093843385, "tps": 28642, "wall": 46691.0} {"step": 20406, "train_loss": 3.312831401824951, "lr": 0.00013454991882006403, "tps": 28640, "wall": 46696.6} {"step": 20407, "train_loss": 3.309062957763672, "lr": 0.00013453305766967732, "tps": 28638, "wall": 46702.1} {"step": 20408, "train_loss": 3.2681968212127686, "lr": 0.0001345161974874647, "tps": 28636, "wall": 46707.7} {"step": 20409, "train_loss": 3.370323657989502, "lr": 0.00013449933827361726, "tps": 28633, "wall": 46713.4} {"step": 20410, "train_loss": 3.3332948684692383, "lr": 0.00013448248002832599, "tps": 28631, "wall": 46719.0} {"step": 20411, "train_loss": 3.21295166015625, "lr": 0.00013446562275178168, "tps": 28629, "wall": 46724.6} {"step": 20412, "train_loss": 3.269956111907959, "lr": 0.00013444876644417555, "tps": 28627, "wall": 46730.1} {"step": 20413, "train_loss": 3.4412412643432617, "lr": 0.0001344319111056984, "tps": 28625, "wall": 46735.7} {"step": 20414, "train_loss": 3.361802339553833, "lr": 0.00013441505673654112, "tps": 28623, "wall": 46741.2} {"step": 20415, "train_loss": 3.3036959171295166, "lr": 0.00013439820333689478, "tps": 28621, "wall": 46746.8} {"step": 20416, "train_loss": 3.3236782550811768, "lr": 0.00013438135090695018, "tps": 28619, "wall": 46752.4} {"step": 20417, "train_loss": 3.1637144088745117, "lr": 0.00013436449944689827, "tps": 28617, "wall": 46758.0} {"step": 20418, "train_loss": 3.306124687194824, "lr": 0.00013434764895692996, "tps": 28615, "wall": 46763.6} {"step": 20419, "train_loss": 3.274268627166748, "lr": 0.00013433079943723608, "tps": 28613, "wall": 46769.2} {"step": 20420, "train_loss": 3.3188846111297607, "lr": 0.0001343139508880076, "tps": 28611, "wall": 46774.8} {"step": 20421, "train_loss": 3.24945330619812, "lr": 0.0001342971033094353, "tps": 28609, "wall": 46780.4} {"step": 20422, "train_loss": 3.2602643966674805, "lr": 0.00013428025670171004, "tps": 28607, "wall": 46786.0} {"step": 20423, "train_loss": 3.3190507888793945, "lr": 0.00013426341106502268, "tps": 28605, "wall": 46791.5} {"step": 20424, "train_loss": 3.3868489265441895, "lr": 0.00013424656639956405, "tps": 28603, "wall": 46797.1} {"step": 20425, "train_loss": 3.3175394535064697, "lr": 0.00013422972270552488, "tps": 28601, "wall": 46802.6} {"step": 20426, "train_loss": 3.3593053817749023, "lr": 0.00013421287998309614, "tps": 28599, "wall": 46808.2} {"step": 20427, "train_loss": 3.504974126815796, "lr": 0.00013419603823246854, "tps": 28597, "wall": 46813.8} {"step": 20428, "train_loss": 3.1695005893707275, "lr": 0.00013417919745383275, "tps": 28595, "wall": 46819.3} {"step": 20429, "train_loss": 3.3740673065185547, "lr": 0.00013416235764737976, "tps": 28593, "wall": 46824.9} {"step": 20430, "train_loss": 3.3850016593933105, "lr": 0.00013414551881330025, "tps": 28591, "wall": 46830.4} {"step": 20431, "train_loss": 3.3733816146850586, "lr": 0.00013412868095178483, "tps": 28589, "wall": 46836.1} {"step": 20432, "train_loss": 3.321769952774048, "lr": 0.00013411184406302443, "tps": 28587, "wall": 46841.6} {"step": 20433, "train_loss": 3.2996132373809814, "lr": 0.00013409500814720972, "tps": 28585, "wall": 46847.2} {"step": 20434, "train_loss": 3.2599925994873047, "lr": 0.00013407817320453135, "tps": 28583, "wall": 46852.8} {"step": 20435, "train_loss": 3.2075817584991455, "lr": 0.00013406133923518014, "tps": 28581, "wall": 46858.4} {"step": 20436, "train_loss": 3.2918965816497803, "lr": 0.00013404450623934663, "tps": 28579, "wall": 46864.0} {"step": 20437, "train_loss": 3.293423652648926, "lr": 0.00013402767421722173, "tps": 28577, "wall": 46869.5} {"step": 20438, "train_loss": 3.3216562271118164, "lr": 0.00013401084316899597, "tps": 28575, "wall": 46875.2} {"step": 20439, "train_loss": 3.3457190990448, "lr": 0.00013399401309485996, "tps": 28573, "wall": 46880.7} {"step": 20440, "train_loss": 3.220280647277832, "lr": 0.00013397718399500445, "tps": 28571, "wall": 46886.3} {"step": 20441, "train_loss": 3.3534789085388184, "lr": 0.0001339603558696201, "tps": 28569, "wall": 46891.9} {"step": 20442, "train_loss": 3.2057976722717285, "lr": 0.0001339435287188974, "tps": 28567, "wall": 46897.5} {"step": 20443, "train_loss": 3.330508232116699, "lr": 0.00013392670254302715, "tps": 28565, "wall": 46903.1} {"step": 20444, "train_loss": 3.271911859512329, "lr": 0.00013390987734219985, "tps": 28563, "wall": 46908.6} {"step": 20445, "train_loss": 3.3280892372131348, "lr": 0.00013389305311660606, "tps": 28561, "wall": 46914.2} {"step": 20446, "train_loss": 3.224539041519165, "lr": 0.00013387622986643646, "tps": 28559, "wall": 46919.7} {"step": 20447, "train_loss": 3.2512753009796143, "lr": 0.0001338594075918816, "tps": 28557, "wall": 46925.3} {"step": 20448, "train_loss": 3.3961572647094727, "lr": 0.000133842586293132, "tps": 28555, "wall": 46930.9} {"step": 20449, "train_loss": 3.3277173042297363, "lr": 0.00013382576597037834, "tps": 28553, "wall": 46936.4} {"step": 20450, "train_loss": 3.3401031494140625, "lr": 0.000133808946623811, "tps": 28551, "wall": 46941.9} {"step": 20451, "train_loss": 3.2855379581451416, "lr": 0.00013379212825362054, "tps": 28549, "wall": 46947.5} {"step": 20452, "train_loss": 3.2796263694763184, "lr": 0.00013377531085999756, "tps": 28547, "wall": 46953.2} {"step": 20453, "train_loss": 3.259295701980591, "lr": 0.0001337584944431325, "tps": 28545, "wall": 46958.8} {"step": 20454, "train_loss": 3.231624126434326, "lr": 0.00013374167900321584, "tps": 28543, "wall": 46964.3} {"step": 20455, "train_loss": 3.2877914905548096, "lr": 0.00013372486454043818, "tps": 28541, "wall": 46969.9} {"step": 20456, "train_loss": 3.2670528888702393, "lr": 0.0001337080510549898, "tps": 28539, "wall": 46975.4} {"step": 20457, "train_loss": 3.2596237659454346, "lr": 0.00013369123854706144, "tps": 28537, "wall": 46981.0} {"step": 20458, "train_loss": 3.2749054431915283, "lr": 0.00013367442701684337, "tps": 28535, "wall": 46986.5} {"step": 20459, "train_loss": 3.327181100845337, "lr": 0.000133657616464526, "tps": 28533, "wall": 46992.1} {"step": 20460, "train_loss": 3.312591552734375, "lr": 0.00013364080689029988, "tps": 28531, "wall": 46997.6} {"step": 20461, "train_loss": 3.3600258827209473, "lr": 0.00013362399829435536, "tps": 28529, "wall": 47003.2} {"step": 20462, "train_loss": 3.301508665084839, "lr": 0.0001336071906768828, "tps": 28527, "wall": 47008.8} {"step": 20463, "train_loss": 3.410764455795288, "lr": 0.00013359038403807275, "tps": 28525, "wall": 47014.4} {"step": 20464, "train_loss": 3.286811590194702, "lr": 0.00013357357837811545, "tps": 28523, "wall": 47020.0} {"step": 20465, "train_loss": 3.2988698482513428, "lr": 0.0001335567736972013, "tps": 28521, "wall": 47025.6} {"step": 20466, "train_loss": 3.1664817333221436, "lr": 0.00013353996999552076, "tps": 28519, "wall": 47031.2} {"step": 20467, "train_loss": 3.301408290863037, "lr": 0.00013352316727326412, "tps": 28517, "wall": 47036.9} {"step": 20468, "train_loss": 3.1956615447998047, "lr": 0.00013350636553062165, "tps": 28515, "wall": 47042.4} {"step": 20469, "train_loss": 3.4014124870300293, "lr": 0.0001334895647677838, "tps": 28513, "wall": 47048.0} {"step": 20470, "train_loss": 3.1134583950042725, "lr": 0.00013347276498494086, "tps": 28511, "wall": 47053.6} {"step": 20471, "train_loss": 3.322051525115967, "lr": 0.000133455966182283, "tps": 28509, "wall": 47059.2} {"step": 20472, "train_loss": 3.259439468383789, "lr": 0.00013343916836000078, "tps": 28507, "wall": 47064.8} {"step": 20473, "train_loss": 3.3070311546325684, "lr": 0.00013342237151828422, "tps": 28505, "wall": 47070.4} {"step": 20474, "train_loss": 3.3422422409057617, "lr": 0.0001334055756573238, "tps": 28503, "wall": 47076.0} {"step": 20475, "train_loss": 3.3197059631347656, "lr": 0.0001333887807773097, "tps": 28501, "wall": 47081.6} {"step": 20476, "train_loss": 3.3828835487365723, "lr": 0.00013337198687843219, "tps": 28499, "wall": 47087.2} {"step": 20477, "train_loss": 3.391529083251953, "lr": 0.00013335519396088147, "tps": 28497, "wall": 47092.8} {"step": 20478, "train_loss": 3.3632936477661133, "lr": 0.0001333384020248478, "tps": 28495, "wall": 47098.3} {"step": 20479, "train_loss": 3.194356679916382, "lr": 0.00013332161107052138, "tps": 28494, "wall": 47103.9} {"step": 20480, "train_loss": 3.3632752895355225, "lr": 0.0001333048210980925, "tps": 28492, "wall": 47109.4} {"step": 20481, "train_loss": 3.2832794189453125, "lr": 0.0001332880321077513, "tps": 28490, "wall": 47114.9} {"step": 20482, "train_loss": 3.262653350830078, "lr": 0.00013327124409968794, "tps": 28488, "wall": 47120.5} {"step": 20483, "train_loss": 3.378002643585205, "lr": 0.00013325445707409265, "tps": 28486, "wall": 47126.0} {"step": 20484, "train_loss": 3.330177068710327, "lr": 0.00013323767103115544, "tps": 28484, "wall": 47131.6} {"step": 20485, "train_loss": 3.276674270629883, "lr": 0.00013322088597106667, "tps": 28482, "wall": 47137.3} {"step": 20486, "train_loss": 3.342360496520996, "lr": 0.00013320410189401644, "tps": 28480, "wall": 47142.8} {"step": 20487, "train_loss": 3.2572503089904785, "lr": 0.00013318731880019474, "tps": 28478, "wall": 47148.4} {"step": 20488, "train_loss": 3.221634864807129, "lr": 0.00013317053668979187, "tps": 28476, "wall": 47154.0} {"step": 20489, "train_loss": 3.391854763031006, "lr": 0.00013315375556299786, "tps": 28474, "wall": 47159.6} {"step": 20490, "train_loss": 3.2644202709198, "lr": 0.00013313697542000275, "tps": 28472, "wall": 47165.1} {"step": 20491, "train_loss": 3.1723320484161377, "lr": 0.0001331201962609967, "tps": 28470, "wall": 47170.7} {"step": 20492, "train_loss": 3.3645987510681152, "lr": 0.0001331034180861698, "tps": 28468, "wall": 47176.2} {"step": 20493, "train_loss": 3.218519926071167, "lr": 0.00013308664089571202, "tps": 28466, "wall": 47181.8} {"step": 20494, "train_loss": 3.2164063453674316, "lr": 0.00013306986468981352, "tps": 28464, "wall": 47187.3} {"step": 20495, "train_loss": 3.312084913253784, "lr": 0.0001330530894686643, "tps": 28462, "wall": 47192.9} {"step": 20496, "train_loss": 3.2951955795288086, "lr": 0.00013303631523245435, "tps": 28460, "wall": 47198.5} {"step": 20497, "train_loss": 3.3042073249816895, "lr": 0.00013301954198137374, "tps": 28458, "wall": 47204.1} {"step": 20498, "train_loss": 3.263533115386963, "lr": 0.00013300276971561244, "tps": 28456, "wall": 47209.6} {"step": 20499, "train_loss": 3.299506902694702, "lr": 0.00013298599843536053, "tps": 28454, "wall": 47215.2} {"step": 20500, "train_loss": 3.3758139610290527, "lr": 0.00013296922814080793, "tps": 28452, "wall": 47220.7} {"step": 20501, "train_loss": 3.2913174629211426, "lr": 0.00013295245883214454, "tps": 28450, "wall": 47226.4} {"step": 20502, "train_loss": 3.324770450592041, "lr": 0.0001329356905095605, "tps": 28448, "wall": 47232.0} {"step": 20503, "train_loss": 3.2646968364715576, "lr": 0.00013291892317324563, "tps": 28446, "wall": 47237.5} {"step": 20504, "train_loss": 3.2500524520874023, "lr": 0.0001329021568233899, "tps": 28444, "wall": 47243.0} {"step": 20505, "train_loss": 3.2964985370635986, "lr": 0.00013288539146018326, "tps": 28442, "wall": 47248.5} {"step": 20506, "train_loss": 3.3120102882385254, "lr": 0.00013286862708381564, "tps": 28440, "wall": 47254.1} {"step": 20507, "train_loss": 3.323629856109619, "lr": 0.00013285186369447688, "tps": 28438, "wall": 47259.6} {"step": 20508, "train_loss": 3.2953813076019287, "lr": 0.000132835101292357, "tps": 28436, "wall": 47265.1} {"step": 20509, "train_loss": 3.313751220703125, "lr": 0.00013281833987764576, "tps": 28435, "wall": 47270.7} {"step": 20510, "train_loss": 3.249181032180786, "lr": 0.000132801579450533, "tps": 28433, "wall": 47276.2} {"step": 20511, "train_loss": 3.2903823852539062, "lr": 0.0001327848200112088, "tps": 28431, "wall": 47281.7} {"step": 20512, "train_loss": 3.404179096221924, "lr": 0.00013276806155986285, "tps": 28429, "wall": 47287.3} {"step": 20513, "train_loss": 3.2455055713653564, "lr": 0.00013275130409668492, "tps": 28427, "wall": 47292.9} {"step": 20514, "train_loss": 3.3885607719421387, "lr": 0.00013273454762186506, "tps": 28425, "wall": 47298.4} {"step": 20515, "train_loss": 3.2582147121429443, "lr": 0.00013271779213559287, "tps": 28423, "wall": 47303.9} {"step": 20516, "train_loss": 3.1700985431671143, "lr": 0.00013270103763805832, "tps": 28421, "wall": 47309.4} {"step": 20517, "train_loss": 3.2287323474884033, "lr": 0.0001326842841294511, "tps": 28419, "wall": 47315.0} {"step": 20518, "train_loss": 3.416269302368164, "lr": 0.00013266753160996104, "tps": 28417, "wall": 47320.5} {"step": 20519, "train_loss": 3.242572784423828, "lr": 0.00013265078007977793, "tps": 28415, "wall": 47326.0} {"step": 20520, "train_loss": 3.2722012996673584, "lr": 0.0001326340295390915, "tps": 28413, "wall": 47331.5} {"step": 20521, "train_loss": 3.325446605682373, "lr": 0.00013261727998809146, "tps": 28411, "wall": 47337.0} {"step": 20522, "train_loss": 3.2144856452941895, "lr": 0.00013260053142696767, "tps": 28409, "wall": 47342.5} {"step": 20523, "train_loss": 3.2530040740966797, "lr": 0.00013258378385590976, "tps": 28407, "wall": 47348.0} {"step": 20524, "train_loss": 3.2760066986083984, "lr": 0.00013256703727510745, "tps": 28406, "wall": 47353.5} {"step": 20525, "train_loss": 3.263657331466675, "lr": 0.00013255029168475051, "tps": 28404, "wall": 47359.1} {"step": 20526, "train_loss": 3.3127071857452393, "lr": 0.00013253354708502862, "tps": 28402, "wall": 47364.6} {"step": 20527, "train_loss": 3.3941781520843506, "lr": 0.00013251680347613136, "tps": 28400, "wall": 47370.1} {"step": 20528, "train_loss": 3.315755844116211, "lr": 0.00013250006085824856, "tps": 28398, "wall": 47375.7} {"step": 20529, "train_loss": 3.2503485679626465, "lr": 0.0001324833192315698, "tps": 28396, "wall": 47381.3} {"step": 20530, "train_loss": 3.3553643226623535, "lr": 0.00013246657859628463, "tps": 28394, "wall": 47386.8} {"step": 20531, "train_loss": 3.2736454010009766, "lr": 0.00013244983895258292, "tps": 28392, "wall": 47392.3} {"step": 20532, "train_loss": 3.2777092456817627, "lr": 0.00013243310030065412, "tps": 28390, "wall": 47397.8} {"step": 20533, "train_loss": 3.3764398097991943, "lr": 0.00013241636264068785, "tps": 28388, "wall": 47403.4} {"step": 20534, "train_loss": 3.2482080459594727, "lr": 0.00013239962597287383, "tps": 28386, "wall": 47408.9} {"step": 20535, "train_loss": 3.280400514602661, "lr": 0.00013238289029740154, "tps": 28384, "wall": 47414.5} {"step": 20536, "train_loss": 3.3193421363830566, "lr": 0.00013236615561446063, "tps": 28382, "wall": 47420.0} {"step": 20537, "train_loss": 3.3445615768432617, "lr": 0.00013234942192424072, "tps": 28380, "wall": 47425.5} {"step": 20538, "train_loss": 3.330263376235962, "lr": 0.00013233268922693115, "tps": 28378, "wall": 47431.0} {"step": 20539, "train_loss": 3.30009388923645, "lr": 0.00013231595752272174, "tps": 28376, "wall": 47436.7} {"step": 20540, "train_loss": 3.306670665740967, "lr": 0.00013229922681180193, "tps": 28375, "wall": 47442.2} {"step": 20541, "train_loss": 3.3797607421875, "lr": 0.0001322824970943611, "tps": 28373, "wall": 47447.8} {"step": 20542, "train_loss": 3.3054184913635254, "lr": 0.00013226576837058898, "tps": 28371, "wall": 47453.3} {"step": 20543, "train_loss": 3.2080187797546387, "lr": 0.00013224904064067493, "tps": 28369, "wall": 47458.8} {"step": 20544, "train_loss": 3.2936646938323975, "lr": 0.0001322323139048085, "tps": 28367, "wall": 47464.4} {"step": 20545, "train_loss": 3.2146401405334473, "lr": 0.0001322155881631792, "tps": 28365, "wall": 47469.9} {"step": 20546, "train_loss": 3.3088631629943848, "lr": 0.0001321988634159765, "tps": 28363, "wall": 47475.4} {"step": 20547, "train_loss": 3.2645740509033203, "lr": 0.00013218213966338972, "tps": 28361, "wall": 47481.0} {"step": 20548, "train_loss": 3.343996047973633, "lr": 0.00013216541690560848, "tps": 28359, "wall": 47486.5} {"step": 20549, "train_loss": 3.3238091468811035, "lr": 0.00013214869514282217, "tps": 28357, "wall": 47492.0} {"step": 20550, "train_loss": 3.2546334266662598, "lr": 0.00013213197437522012, "tps": 28355, "wall": 47497.7} {"step": 20551, "train_loss": 3.3796005249023438, "lr": 0.00013211525460299188, "tps": 28353, "wall": 47503.1} {"step": 20552, "train_loss": 3.362598419189453, "lr": 0.00013209853582632673, "tps": 28351, "wall": 47508.7} {"step": 20553, "train_loss": 3.335094451904297, "lr": 0.0001320818180454142, "tps": 28349, "wall": 47514.3} {"step": 20554, "train_loss": 3.335923433303833, "lr": 0.00013206510126044353, "tps": 28348, "wall": 47519.8} {"step": 20555, "train_loss": 3.4543895721435547, "lr": 0.00013204838547160413, "tps": 28346, "wall": 47525.4} {"step": 20556, "train_loss": 3.2121126651763916, "lr": 0.0001320316706790855, "tps": 28344, "wall": 47530.8} {"step": 20557, "train_loss": 3.336059093475342, "lr": 0.00013201495688307678, "tps": 28342, "wall": 47536.4} {"step": 20558, "train_loss": 3.248223304748535, "lr": 0.00013199824408376736, "tps": 28340, "wall": 47541.9} {"step": 20559, "train_loss": 3.30580735206604, "lr": 0.00013198153228134664, "tps": 28338, "wall": 47547.4} {"step": 20560, "train_loss": 3.370743751525879, "lr": 0.00013196482147600385, "tps": 28336, "wall": 47553.0} {"step": 20561, "train_loss": 3.335348129272461, "lr": 0.00013194811166792833, "tps": 28334, "wall": 47558.6} {"step": 20562, "train_loss": 3.233675718307495, "lr": 0.0001319314028573094, "tps": 28332, "wall": 47564.1} {"step": 20563, "train_loss": 3.29968523979187, "lr": 0.0001319146950443363, "tps": 28330, "wall": 47569.6} {"step": 20564, "train_loss": 3.2038497924804688, "lr": 0.00013189798822919822, "tps": 28328, "wall": 47575.1} {"step": 20565, "train_loss": 3.2628798484802246, "lr": 0.0001318812824120846, "tps": 28326, "wall": 47580.7} {"step": 20566, "train_loss": 3.39833664894104, "lr": 0.00013186457759318455, "tps": 28325, "wall": 47586.2} {"step": 20567, "train_loss": 3.221996545791626, "lr": 0.00013184787377268727, "tps": 28323, "wall": 47591.8} {"step": 20568, "train_loss": 3.435678243637085, "lr": 0.00013183117095078215, "tps": 28321, "wall": 47597.3} {"step": 20569, "train_loss": 3.3334426879882812, "lr": 0.00013181446912765817, "tps": 28319, "wall": 47602.8} {"step": 20570, "train_loss": 3.360826253890991, "lr": 0.00013179776830350476, "tps": 28317, "wall": 47608.4} {"step": 20571, "train_loss": 3.3131253719329834, "lr": 0.000131781068478511, "tps": 28315, "wall": 47614.0} {"step": 20572, "train_loss": 3.2906861305236816, "lr": 0.00013176436965286597, "tps": 28313, "wall": 47619.5} {"step": 20573, "train_loss": 3.3414711952209473, "lr": 0.00013174767182675906, "tps": 28311, "wall": 47625.0} {"step": 20574, "train_loss": 3.3812389373779297, "lr": 0.00013173097500037922, "tps": 28309, "wall": 47630.6} {"step": 20575, "train_loss": 3.357193946838379, "lr": 0.00013171427917391565, "tps": 28307, "wall": 47636.1} {"step": 20576, "train_loss": 3.3442788124084473, "lr": 0.00013169758434755755, "tps": 28305, "wall": 47641.7} {"step": 20577, "train_loss": 3.279798746109009, "lr": 0.00013168089052149402, "tps": 28303, "wall": 47647.2} {"step": 20578, "train_loss": 3.338444948196411, "lr": 0.00013166419769591406, "tps": 28301, "wall": 47652.9} {"step": 20579, "train_loss": 3.267580032348633, "lr": 0.0001316475058710069, "tps": 28299, "wall": 47658.4} {"step": 20580, "train_loss": 3.213197708129883, "lr": 0.0001316308150469616, "tps": 28298, "wall": 47664.0} {"step": 20581, "train_loss": 3.379798412322998, "lr": 0.0001316141252239671, "tps": 28296, "wall": 47669.6} {"step": 20582, "train_loss": 3.3001880645751953, "lr": 0.0001315974364022127, "tps": 28294, "wall": 47675.2} {"step": 20583, "train_loss": 3.276430130004883, "lr": 0.0001315807485818873, "tps": 28292, "wall": 47680.8} {"step": 20584, "train_loss": 3.1817469596862793, "lr": 0.00013156406176317986, "tps": 28290, "wall": 47686.3} {"step": 20585, "train_loss": 3.372504234313965, "lr": 0.00013154737594627962, "tps": 28288, "wall": 47691.9} {"step": 20586, "train_loss": 3.3218913078308105, "lr": 0.00013153069113137545, "tps": 28286, "wall": 47697.4} {"step": 20587, "train_loss": 3.261200189590454, "lr": 0.00013151400731865634, "tps": 28284, "wall": 47702.9} {"step": 20588, "train_loss": 3.2452564239501953, "lr": 0.00013149732450831145, "tps": 28282, "wall": 47708.4} {"step": 20589, "train_loss": 3.424406051635742, "lr": 0.00013148064270052955, "tps": 28280, "wall": 47714.0} {"step": 20590, "train_loss": 3.181832790374756, "lr": 0.00013146396189549981, "tps": 28278, "wall": 47719.6} {"step": 20591, "train_loss": 3.2282958030700684, "lr": 0.00013144728209341108, "tps": 28276, "wall": 47725.1} {"step": 20592, "train_loss": 3.2760298252105713, "lr": 0.00013143060329445224, "tps": 28274, "wall": 47730.6} {"step": 20593, "train_loss": 3.2959234714508057, "lr": 0.00013141392549881242, "tps": 28273, "wall": 47736.3} {"step": 20594, "train_loss": 3.253248453140259, "lr": 0.00013139724870668047, "tps": 28271, "wall": 47741.8} {"step": 20595, "train_loss": 3.159651279449463, "lr": 0.00013138057291824516, "tps": 28269, "wall": 47747.3} {"step": 20596, "train_loss": 3.306304931640625, "lr": 0.0001313638981336956, "tps": 28267, "wall": 47752.9} {"step": 20597, "train_loss": 3.2598047256469727, "lr": 0.0001313472243532206, "tps": 28265, "wall": 47758.4} {"step": 20598, "train_loss": 3.2987148761749268, "lr": 0.00013133055157700895, "tps": 28263, "wall": 47764.0} {"step": 20599, "train_loss": 3.311281681060791, "lr": 0.0001313138798052497, "tps": 28261, "wall": 47769.5} {"step": 20600, "train_loss": 3.3219313621520996, "lr": 0.00013129720903813164, "tps": 28259, "wall": 47775.0} {"step": 20601, "train_loss": 3.250558614730835, "lr": 0.00013128053927584347, "tps": 28257, "wall": 47780.6} {"step": 20602, "train_loss": 3.3361775875091553, "lr": 0.00013126387051857428, "tps": 28255, "wall": 47786.1} {"step": 20603, "train_loss": 3.2652385234832764, "lr": 0.00013124720276651273, "tps": 28253, "wall": 47791.6} {"step": 20604, "train_loss": 3.285369873046875, "lr": 0.0001312305360198476, "tps": 28252, "wall": 47797.2} {"step": 20605, "train_loss": 3.318199634552002, "lr": 0.0001312138702787678, "tps": 28250, "wall": 47802.8} {"step": 20606, "train_loss": 3.2590560913085938, "lr": 0.00013119720554346208, "tps": 28248, "wall": 47808.3} {"step": 20607, "train_loss": 3.2955050468444824, "lr": 0.00013118054181411926, "tps": 28246, "wall": 47813.8} {"step": 20608, "train_loss": 3.3227624893188477, "lr": 0.00013116387909092804, "tps": 28244, "wall": 47819.4} {"step": 20609, "train_loss": 3.3529391288757324, "lr": 0.00013114721737407715, "tps": 28242, "wall": 47824.9} {"step": 20610, "train_loss": 3.392805576324463, "lr": 0.00013113055666375546, "tps": 28240, "wall": 47830.5} {"step": 20611, "train_loss": 3.3285913467407227, "lr": 0.00013111389696015164, "tps": 28238, "wall": 47836.0} {"step": 20612, "train_loss": 3.278754472732544, "lr": 0.00013109723826345432, "tps": 28236, "wall": 47841.5} {"step": 20613, "train_loss": 3.3677265644073486, "lr": 0.00013108058057385237, "tps": 28234, "wall": 47847.0} {"step": 20614, "train_loss": 3.1929931640625, "lr": 0.00013106392389153443, "tps": 28233, "wall": 47852.6} {"step": 20615, "train_loss": 3.3190853595733643, "lr": 0.0001310472682166891, "tps": 28231, "wall": 47858.2} {"step": 20616, "train_loss": 3.349198818206787, "lr": 0.0001310306135495052, "tps": 28229, "wall": 47863.8} {"step": 20617, "train_loss": 3.241833448410034, "lr": 0.00013101395989017126, "tps": 28227, "wall": 47869.4} {"step": 20618, "train_loss": 3.3593862056732178, "lr": 0.00013099730723887602, "tps": 28225, "wall": 47874.9} {"step": 20619, "train_loss": 3.236733913421631, "lr": 0.00013098065559580813, "tps": 28223, "wall": 47880.5} {"step": 20620, "train_loss": 3.30191969871521, "lr": 0.00013096400496115618, "tps": 28221, "wall": 47886.0} {"step": 20621, "train_loss": 3.4053444862365723, "lr": 0.00013094735533510871, "tps": 28219, "wall": 47891.5} {"step": 20622, "train_loss": 3.1594455242156982, "lr": 0.0001309307067178545, "tps": 28217, "wall": 47897.1} {"step": 20623, "train_loss": 3.169985771179199, "lr": 0.00013091405910958202, "tps": 28215, "wall": 47902.6} {"step": 20624, "train_loss": 3.2330896854400635, "lr": 0.00013089741251047995, "tps": 28213, "wall": 47908.2} {"step": 20625, "train_loss": 3.2766079902648926, "lr": 0.00013088076692073682, "tps": 28212, "wall": 47913.8} {"step": 20626, "train_loss": 3.401479959487915, "lr": 0.00013086412234054109, "tps": 28210, "wall": 47919.3} {"step": 20627, "train_loss": 3.27768874168396, "lr": 0.0001308474787700815, "tps": 28208, "wall": 47924.8} {"step": 20628, "train_loss": 3.3184404373168945, "lr": 0.00013083083620954645, "tps": 28206, "wall": 47930.3} {"step": 20629, "train_loss": 3.3224329948425293, "lr": 0.0001308141946591245, "tps": 28204, "wall": 47935.9} {"step": 20630, "train_loss": 3.3433375358581543, "lr": 0.0001307975541190042, "tps": 28202, "wall": 47941.5} {"step": 20631, "train_loss": 3.2386064529418945, "lr": 0.0001307809145893741, "tps": 28200, "wall": 47947.0} {"step": 20632, "train_loss": 3.299224376678467, "lr": 0.0001307642760704225, "tps": 28198, "wall": 47952.6} {"step": 20633, "train_loss": 3.4519104957580566, "lr": 0.00013074763856233806, "tps": 28196, "wall": 47958.1} {"step": 20634, "train_loss": 3.280910015106201, "lr": 0.00013073100206530925, "tps": 28195, "wall": 47963.6} {"step": 20635, "train_loss": 3.314964771270752, "lr": 0.0001307143665795244, "tps": 28193, "wall": 47969.2} {"step": 20636, "train_loss": 3.3311097621917725, "lr": 0.00013069773210517207, "tps": 28191, "wall": 47974.8} {"step": 20637, "train_loss": 3.3540239334106445, "lr": 0.00013068109864244068, "tps": 28189, "wall": 47980.3} {"step": 20638, "train_loss": 3.400689125061035, "lr": 0.00013066446619151858, "tps": 28187, "wall": 47985.9} {"step": 20639, "train_loss": 3.304342746734619, "lr": 0.0001306478347525943, "tps": 28185, "wall": 47991.4} {"step": 20640, "train_loss": 3.2754311561584473, "lr": 0.00013063120432585618, "tps": 28183, "wall": 47997.0} {"step": 20641, "train_loss": 3.331568717956543, "lr": 0.00013061457491149252, "tps": 28181, "wall": 48002.5} {"step": 20642, "train_loss": 3.198286294937134, "lr": 0.0001305979465096919, "tps": 28179, "wall": 48008.1} {"step": 20643, "train_loss": 3.3736181259155273, "lr": 0.00013058131912064248, "tps": 28177, "wall": 48013.6} {"step": 20644, "train_loss": 3.3930845260620117, "lr": 0.0001305646927445328, "tps": 28176, "wall": 48019.2} {"step": 20645, "train_loss": 3.3340888023376465, "lr": 0.00013054806738155113, "tps": 28174, "wall": 48024.7} {"step": 20646, "train_loss": 3.4284377098083496, "lr": 0.0001305314430318857, "tps": 28172, "wall": 48030.3} {"step": 20647, "train_loss": 3.304638147354126, "lr": 0.000130514819695725, "tps": 28170, "wall": 48035.9} {"step": 20648, "train_loss": 3.3869926929473877, "lr": 0.00013049819737325725, "tps": 28168, "wall": 48041.5} {"step": 20649, "train_loss": 3.3081111907958984, "lr": 0.00013048157606467074, "tps": 28166, "wall": 48047.0} {"step": 20650, "train_loss": 3.3184285163879395, "lr": 0.00013046495577015386, "tps": 28164, "wall": 48052.5} {"step": 20651, "train_loss": 3.4364538192749023, "lr": 0.0001304483364898947, "tps": 28162, "wall": 48058.1} {"step": 20652, "train_loss": 3.3916189670562744, "lr": 0.0001304317182240817, "tps": 28160, "wall": 48063.6} {"step": 20653, "train_loss": 3.2766659259796143, "lr": 0.00013041510097290302, "tps": 28159, "wall": 48069.2} {"step": 20654, "train_loss": 3.348560094833374, "lr": 0.00013039848473654688, "tps": 28157, "wall": 48074.7} {"step": 20655, "train_loss": 3.350153923034668, "lr": 0.0001303818695152016, "tps": 28155, "wall": 48080.3} {"step": 20656, "train_loss": 3.194091320037842, "lr": 0.00013036525530905535, "tps": 28153, "wall": 48085.9} {"step": 20657, "train_loss": 3.357536792755127, "lr": 0.00013034864211829627, "tps": 28151, "wall": 48091.4} {"step": 20658, "train_loss": 3.2770023345947266, "lr": 0.0001303320299431127, "tps": 28149, "wall": 48097.0} {"step": 20659, "train_loss": 3.256882429122925, "lr": 0.00013031541878369274, "tps": 28147, "wall": 48102.5} {"step": 20660, "train_loss": 3.3536672592163086, "lr": 0.0001302988086402245, "tps": 28145, "wall": 48108.0} {"step": 20661, "train_loss": 3.311239242553711, "lr": 0.0001302821995128963, "tps": 28143, "wall": 48113.6} {"step": 20662, "train_loss": 3.228799819946289, "lr": 0.00013026559140189616, "tps": 28142, "wall": 48119.1} {"step": 20663, "train_loss": 3.3881285190582275, "lr": 0.0001302489843074122, "tps": 28140, "wall": 48124.7} {"step": 20664, "train_loss": 3.278515577316284, "lr": 0.00013023237822963268, "tps": 28138, "wall": 48130.2} {"step": 20665, "train_loss": 3.373138904571533, "lr": 0.00013021577316874562, "tps": 28136, "wall": 48135.7} {"step": 20666, "train_loss": 3.173597812652588, "lr": 0.00013019916912493907, "tps": 28134, "wall": 48141.2} {"step": 20667, "train_loss": 3.282242774963379, "lr": 0.0001301825660984013, "tps": 28132, "wall": 48146.8} {"step": 20668, "train_loss": 3.301095485687256, "lr": 0.00013016596408932016, "tps": 28130, "wall": 48152.4} {"step": 20669, "train_loss": 3.2877144813537598, "lr": 0.00013014936309788393, "tps": 28128, "wall": 48158.0} {"step": 20670, "train_loss": 3.208954334259033, "lr": 0.00013013276312428057, "tps": 28126, "wall": 48163.5} {"step": 20671, "train_loss": 3.3144984245300293, "lr": 0.00013011616416869806, "tps": 28125, "wall": 48169.1} {"step": 20672, "train_loss": 3.23171067237854, "lr": 0.00013009956623132455, "tps": 28123, "wall": 48174.7} {"step": 20673, "train_loss": 3.3370416164398193, "lr": 0.00013008296931234806, "tps": 28121, "wall": 48180.2} {"step": 20674, "train_loss": 3.2661356925964355, "lr": 0.0001300663734119565, "tps": 28119, "wall": 48185.8} {"step": 20675, "train_loss": 3.194849967956543, "lr": 0.00013004977853033796, "tps": 28117, "wall": 48191.3} {"step": 20676, "train_loss": 3.2960474491119385, "lr": 0.00013003318466768042, "tps": 28115, "wall": 48196.9} {"step": 20677, "train_loss": 3.338554859161377, "lr": 0.00013001659182417175, "tps": 28113, "wall": 48202.5} {"step": 20678, "train_loss": 3.2324912548065186, "lr": 0.00013000000000000004, "tps": 28111, "wall": 48208.0} {"step": 20679, "train_loss": 3.4322006702423096, "lr": 0.0001299834091953532, "tps": 28109, "wall": 48213.6} {"step": 20680, "train_loss": 3.2164039611816406, "lr": 0.00012996681941041915, "tps": 28108, "wall": 48219.2} {"step": 20681, "train_loss": 3.4228923320770264, "lr": 0.00012995023064538586, "tps": 28106, "wall": 48224.7} {"step": 20682, "train_loss": 3.290764808654785, "lr": 0.0001299336429004413, "tps": 28104, "wall": 48230.3} {"step": 20683, "train_loss": 3.304027795791626, "lr": 0.00012991705617577316, "tps": 28102, "wall": 48235.8} {"step": 20684, "train_loss": 3.3216392993927, "lr": 0.00012990047047156957, "tps": 28100, "wall": 48241.4} {"step": 20685, "train_loss": 3.277866840362549, "lr": 0.00012988388578801828, "tps": 28098, "wall": 48246.9} {"step": 20686, "train_loss": 3.270045042037964, "lr": 0.00012986730212530726, "tps": 28096, "wall": 48252.5} {"step": 20687, "train_loss": 3.3152313232421875, "lr": 0.0001298507194836243, "tps": 28095, "wall": 48258.0} {"step": 20688, "train_loss": 3.3507866859436035, "lr": 0.00012983413786315723, "tps": 28093, "wall": 48263.6} {"step": 20689, "train_loss": 3.1927194595336914, "lr": 0.00012981755726409398, "tps": 28091, "wall": 48269.1} {"step": 20690, "train_loss": 3.3134710788726807, "lr": 0.0001298009776866223, "tps": 28089, "wall": 48274.7} {"step": 20691, "train_loss": 3.3198814392089844, "lr": 0.00012978439913093, "tps": 28087, "wall": 48280.3} {"step": 20692, "train_loss": 3.250581741333008, "lr": 0.00012976782159720494, "tps": 28085, "wall": 48285.8} {"step": 20693, "train_loss": 3.215165853500366, "lr": 0.0001297512450856349, "tps": 28083, "wall": 48291.4} {"step": 20694, "train_loss": 3.2833495140075684, "lr": 0.00012973466959640754, "tps": 28081, "wall": 48296.9} {"step": 20695, "train_loss": 3.2770304679870605, "lr": 0.00012971809512971082, "tps": 28079, "wall": 48302.5} {"step": 20696, "train_loss": 3.427330255508423, "lr": 0.00012970152168573237, "tps": 28078, "wall": 48308.0} {"step": 20697, "train_loss": 3.3240456581115723, "lr": 0.00012968494926465996, "tps": 28076, "wall": 48313.6} {"step": 20698, "train_loss": 3.280416965484619, "lr": 0.00012966837786668132, "tps": 28074, "wall": 48319.1} {"step": 20699, "train_loss": 3.2873873710632324, "lr": 0.00012965180749198424, "tps": 28072, "wall": 48324.7} {"step": 20700, "train_loss": 3.364649772644043, "lr": 0.0001296352381407563, "tps": 28070, "wall": 48330.2} {"step": 20701, "train_loss": 3.290548801422119, "lr": 0.00012961866981318532, "tps": 28068, "wall": 48335.9} {"step": 20702, "train_loss": 3.2363319396972656, "lr": 0.00012960210250945889, "tps": 28066, "wall": 48341.4} {"step": 20703, "train_loss": 3.241340160369873, "lr": 0.0001295855362297648, "tps": 28064, "wall": 48347.0} {"step": 20704, "train_loss": 3.2839345932006836, "lr": 0.00012956897097429063, "tps": 28063, "wall": 48352.5} {"step": 20705, "train_loss": 3.2072806358337402, "lr": 0.00012955240674322396, "tps": 28061, "wall": 48358.0} {"step": 20706, "train_loss": 3.330271005630493, "lr": 0.00012953584353675264, "tps": 28059, "wall": 48363.6} {"step": 20707, "train_loss": 3.2919154167175293, "lr": 0.00012951928135506414, "tps": 28057, "wall": 48369.1} {"step": 20708, "train_loss": 3.401411294937134, "lr": 0.00012950272019834606, "tps": 28055, "wall": 48374.7} {"step": 20709, "train_loss": 3.295457363128662, "lr": 0.00012948616006678613, "tps": 28053, "wall": 48380.3} {"step": 20710, "train_loss": 3.409318447113037, "lr": 0.0001294696009605719, "tps": 28051, "wall": 48385.8} {"step": 20711, "train_loss": 3.349426507949829, "lr": 0.00012945304287989082, "tps": 28050, "wall": 48391.3} {"step": 20712, "train_loss": 3.3209335803985596, "lr": 0.00012943648582493066, "tps": 28048, "wall": 48397.0} {"step": 20713, "train_loss": 3.3572580814361572, "lr": 0.00012941992979587888, "tps": 28046, "wall": 48402.6} {"step": 20714, "train_loss": 3.35860538482666, "lr": 0.00012940337479292296, "tps": 28044, "wall": 48408.1} {"step": 20715, "train_loss": 3.362717628479004, "lr": 0.0001293868208162506, "tps": 28042, "wall": 48413.7} {"step": 20716, "train_loss": 3.329507350921631, "lr": 0.0001293702678660492, "tps": 28040, "wall": 48419.2} {"step": 20717, "train_loss": 3.191032886505127, "lr": 0.00012935371594250628, "tps": 28038, "wall": 48424.8} {"step": 20718, "train_loss": 3.384793281555176, "lr": 0.00012933716504580942, "tps": 28037, "wall": 48430.3} {"step": 20719, "train_loss": 3.230895519256592, "lr": 0.00012932061517614604, "tps": 28035, "wall": 48435.9} {"step": 20720, "train_loss": 3.282235622406006, "lr": 0.00012930406633370362, "tps": 28033, "wall": 48441.4} {"step": 20721, "train_loss": 3.325296401977539, "lr": 0.00012928751851866966, "tps": 28031, "wall": 48447.0} {"step": 20722, "train_loss": 3.299104690551758, "lr": 0.00012927097173123157, "tps": 28029, "wall": 48452.6} {"step": 20723, "train_loss": 3.304816246032715, "lr": 0.0001292544259715769, "tps": 28027, "wall": 48458.1} {"step": 20724, "train_loss": 3.322662353515625, "lr": 0.00012923788123989294, "tps": 28025, "wall": 48463.7} {"step": 20725, "train_loss": 3.2638158798217773, "lr": 0.0001292213375363671, "tps": 28023, "wall": 48469.2} {"step": 20726, "train_loss": 3.2341113090515137, "lr": 0.00012920479486118702, "tps": 28022, "wall": 48474.7} {"step": 20727, "train_loss": 3.2556867599487305, "lr": 0.00012918825321453985, "tps": 28020, "wall": 48480.3} {"step": 20728, "train_loss": 3.3341357707977295, "lr": 0.00012917171259661304, "tps": 28018, "wall": 48485.8} {"step": 20729, "train_loss": 3.3382930755615234, "lr": 0.00012915517300759403, "tps": 28016, "wall": 48491.4} {"step": 20730, "train_loss": 3.3195853233337402, "lr": 0.00012913863444767012, "tps": 28014, "wall": 48496.9} {"step": 20731, "train_loss": 3.283658742904663, "lr": 0.00012912209691702862, "tps": 28012, "wall": 48502.4} {"step": 20732, "train_loss": 3.3295369148254395, "lr": 0.000129105560415857, "tps": 28011, "wall": 48507.9} {"step": 20733, "train_loss": 3.2928967475891113, "lr": 0.00012908902494434253, "tps": 28009, "wall": 48513.6} {"step": 20734, "train_loss": 3.2827303409576416, "lr": 0.00012907249050267237, "tps": 28007, "wall": 48519.1} {"step": 20735, "train_loss": 3.2988476753234863, "lr": 0.00012905595709103407, "tps": 28005, "wall": 48524.7} {"step": 20736, "train_loss": 3.4056601524353027, "lr": 0.00012903942470961482, "tps": 28003, "wall": 48530.3} {"step": 20737, "train_loss": 3.310290575027466, "lr": 0.0001290228933586018, "tps": 28001, "wall": 48535.8} {"step": 20738, "train_loss": 3.2781596183776855, "lr": 0.00012900636303818242, "tps": 27999, "wall": 48541.4} {"step": 20739, "train_loss": 3.35728120803833, "lr": 0.00012898983374854382, "tps": 27997, "wall": 48546.9} {"step": 20740, "train_loss": 3.283148765563965, "lr": 0.00012897330548987342, "tps": 27996, "wall": 48552.5} {"step": 20741, "train_loss": 3.357104778289795, "lr": 0.0001289567782623583, "tps": 27994, "wall": 48558.1} {"step": 20742, "train_loss": 3.2905001640319824, "lr": 0.00012894025206618563, "tps": 27992, "wall": 48563.6} {"step": 20743, "train_loss": 3.2511749267578125, "lr": 0.0001289237269015428, "tps": 27990, "wall": 48569.2} {"step": 20744, "train_loss": 3.318573236465454, "lr": 0.0001289072027686169, "tps": 27988, "wall": 48574.9} {"step": 20745, "train_loss": 3.2929489612579346, "lr": 0.00012889067966759512, "tps": 27986, "wall": 48580.4} {"step": 20746, "train_loss": 3.3323593139648438, "lr": 0.00012887415759866468, "tps": 27984, "wall": 48585.9} {"step": 20747, "train_loss": 3.1179909706115723, "lr": 0.00012885763656201275, "tps": 27983, "wall": 48591.5} {"step": 20748, "train_loss": 3.3305671215057373, "lr": 0.0001288411165578263, "tps": 27981, "wall": 48597.0} {"step": 20749, "train_loss": 3.4341025352478027, "lr": 0.00012882459758629274, "tps": 27979, "wall": 48602.6} {"step": 20750, "train_loss": 3.2442779541015625, "lr": 0.00012880807964759907, "tps": 27977, "wall": 48608.1} {"step": 20751, "train_loss": 3.327101230621338, "lr": 0.00012879156274193232, "tps": 27975, "wall": 48613.7} {"step": 20752, "train_loss": 3.243594169616699, "lr": 0.00012877504686947976, "tps": 27973, "wall": 48619.2} {"step": 20753, "train_loss": 3.234978199005127, "lr": 0.00012875853203042842, "tps": 27972, "wall": 48624.8} {"step": 20754, "train_loss": 3.31850528717041, "lr": 0.0001287420182249653, "tps": 27970, "wall": 48630.4} {"step": 20755, "train_loss": 3.270747661590576, "lr": 0.00012872550545327757, "tps": 27968, "wall": 48636.0} {"step": 20756, "train_loss": 3.2729296684265137, "lr": 0.00012870899371555217, "tps": 27966, "wall": 48641.5} {"step": 20757, "train_loss": 3.3436529636383057, "lr": 0.00012869248301197633, "tps": 27964, "wall": 48647.0} {"step": 20758, "train_loss": 3.3638195991516113, "lr": 0.000128675973342737, "tps": 27962, "wall": 48652.6} {"step": 20759, "train_loss": 3.259068012237549, "lr": 0.00012865946470802108, "tps": 27960, "wall": 48658.1} {"step": 20760, "train_loss": 3.376441478729248, "lr": 0.00012864295710801575, "tps": 27959, "wall": 48663.7} {"step": 20761, "train_loss": 3.36474871635437, "lr": 0.00012862645054290795, "tps": 27957, "wall": 48669.2} {"step": 20762, "train_loss": 3.3025734424591064, "lr": 0.0001286099450128846, "tps": 27955, "wall": 48674.8} {"step": 20763, "train_loss": 3.3098089694976807, "lr": 0.00012859344051813283, "tps": 27953, "wall": 48680.3} {"step": 20764, "train_loss": 3.4267172813415527, "lr": 0.0001285769370588395, "tps": 27951, "wall": 48685.9} {"step": 20765, "train_loss": 3.3960726261138916, "lr": 0.0001285604346351915, "tps": 27949, "wall": 48691.4} {"step": 20766, "train_loss": 3.3336453437805176, "lr": 0.00012854393324737587, "tps": 27947, "wall": 48697.1} {"step": 20767, "train_loss": 3.303382158279419, "lr": 0.00012852743289557957, "tps": 27946, "wall": 48702.7} {"step": 20768, "train_loss": 3.397266387939453, "lr": 0.00012851093357998936, "tps": 27944, "wall": 48708.2} {"step": 20769, "train_loss": 3.279484987258911, "lr": 0.0001284944353007923, "tps": 27942, "wall": 48713.8} {"step": 20770, "train_loss": 3.307687759399414, "lr": 0.00012847793805817527, "tps": 27940, "wall": 48719.4} {"step": 20771, "train_loss": 3.359858274459839, "lr": 0.000128461441852325, "tps": 27938, "wall": 48724.9} {"step": 20772, "train_loss": 3.288086414337158, "lr": 0.00012844494668342855, "tps": 27936, "wall": 48730.4} {"step": 20773, "train_loss": 3.4498579502105713, "lr": 0.00012842845255167272, "tps": 27935, "wall": 48736.0} {"step": 20774, "train_loss": 3.328671455383301, "lr": 0.00012841195945724422, "tps": 27933, "wall": 48741.5} {"step": 20775, "train_loss": 3.3698372840881348, "lr": 0.00012839546740033012, "tps": 27931, "wall": 48747.1} {"step": 20776, "train_loss": 3.25177264213562, "lr": 0.000128378976381117, "tps": 27929, "wall": 48752.7} {"step": 20777, "train_loss": 3.3976454734802246, "lr": 0.0001283624863997919, "tps": 27927, "wall": 48758.3} {"step": 20778, "train_loss": 3.376995086669922, "lr": 0.00012834599745654147, "tps": 27925, "wall": 48763.9} {"step": 20779, "train_loss": 3.1791861057281494, "lr": 0.0001283295095515525, "tps": 27924, "wall": 48769.4} {"step": 20780, "train_loss": 3.3439064025878906, "lr": 0.0001283130226850119, "tps": 27922, "wall": 48775.0} {"step": 20781, "train_loss": 3.392730712890625, "lr": 0.0001282965368571063, "tps": 27920, "wall": 48780.5} {"step": 20782, "train_loss": 3.2536122798919678, "lr": 0.00012828005206802243, "tps": 27918, "wall": 48786.1} {"step": 20783, "train_loss": 3.2905404567718506, "lr": 0.00012826356831794716, "tps": 27916, "wall": 48791.7} {"step": 20784, "train_loss": 3.3497726917266846, "lr": 0.00012824708560706718, "tps": 27914, "wall": 48797.2} {"step": 20785, "train_loss": 3.3477401733398438, "lr": 0.00012823060393556905, "tps": 27912, "wall": 48802.8} {"step": 20786, "train_loss": 3.3727469444274902, "lr": 0.0001282141233036397, "tps": 27911, "wall": 48808.3} {"step": 20787, "train_loss": 3.251427173614502, "lr": 0.00012819764371146576, "tps": 27909, "wall": 48814.0} {"step": 20788, "train_loss": 3.275867223739624, "lr": 0.00012818116515923378, "tps": 27907, "wall": 48819.6} {"step": 20789, "train_loss": 3.295724868774414, "lr": 0.00012816468764713062, "tps": 27905, "wall": 48825.1} {"step": 20790, "train_loss": 3.317685604095459, "lr": 0.0001281482111753428, "tps": 27903, "wall": 48830.6} {"step": 20791, "train_loss": 3.26108980178833, "lr": 0.00012813173574405696, "tps": 27901, "wall": 48836.2} {"step": 20792, "train_loss": 3.22418212890625, "lr": 0.00012811526135345989, "tps": 27900, "wall": 48841.7} {"step": 20793, "train_loss": 3.261983871459961, "lr": 0.00012809878800373802, "tps": 27898, "wall": 48847.2} {"step": 20794, "train_loss": 3.3806312084198, "lr": 0.0001280823156950781, "tps": 27896, "wall": 48852.8} {"step": 20795, "train_loss": 3.3005151748657227, "lr": 0.00012806584442766672, "tps": 27894, "wall": 48858.4} {"step": 20796, "train_loss": 3.3178210258483887, "lr": 0.00012804937420169034, "tps": 27892, "wall": 48863.9} {"step": 20797, "train_loss": 3.3379669189453125, "lr": 0.00012803290501733566, "tps": 27890, "wall": 48869.5} {"step": 20798, "train_loss": 3.2957029342651367, "lr": 0.00012801643687478925, "tps": 27889, "wall": 48875.1} {"step": 20799, "train_loss": 3.366438388824463, "lr": 0.00012799996977423756, "tps": 27887, "wall": 48880.7} {"step": 20800, "train_loss": 3.334977388381958, "lr": 0.00012798350371586722, "tps": 27885, "wall": 48886.2} {"step": 20801, "train_loss": 3.3503265380859375, "lr": 0.00012796703869986475, "tps": 27883, "wall": 48891.8} {"step": 20802, "train_loss": 3.253600835800171, "lr": 0.00012795057472641657, "tps": 27881, "wall": 48897.4} {"step": 20803, "train_loss": 3.261215925216675, "lr": 0.0001279341117957093, "tps": 27879, "wall": 48902.9} {"step": 20804, "train_loss": 3.323699951171875, "lr": 0.00012791764990792944, "tps": 27878, "wall": 48908.5} {"step": 20805, "train_loss": 3.235811710357666, "lr": 0.00012790118906326334, "tps": 27876, "wall": 48914.1} {"step": 20806, "train_loss": 3.2379050254821777, "lr": 0.0001278847292618976, "tps": 27874, "wall": 48919.6} {"step": 20807, "train_loss": 3.227578639984131, "lr": 0.00012786827050401866, "tps": 27872, "wall": 48925.2} {"step": 20808, "train_loss": 3.2274138927459717, "lr": 0.00012785181278981286, "tps": 27870, "wall": 48930.7} {"step": 20809, "train_loss": 3.3371381759643555, "lr": 0.00012783535611946679, "tps": 27868, "wall": 48936.3} {"step": 20810, "train_loss": 3.208540916442871, "lr": 0.0001278189004931667, "tps": 27867, "wall": 48941.9} {"step": 20811, "train_loss": 3.346893310546875, "lr": 0.00012780244591109914, "tps": 27865, "wall": 48947.5} {"step": 20812, "train_loss": 3.347882032394409, "lr": 0.0001277859923734505, "tps": 27863, "wall": 48953.1} {"step": 20813, "train_loss": 3.276796817779541, "lr": 0.00012776953988040702, "tps": 27861, "wall": 48958.7} {"step": 20814, "train_loss": 3.262256383895874, "lr": 0.0001277530884321553, "tps": 27859, "wall": 48964.3} {"step": 20815, "train_loss": 3.269101619720459, "lr": 0.00012773663802888153, "tps": 27857, "wall": 48969.8} {"step": 20816, "train_loss": 3.4009201526641846, "lr": 0.00012772018867077212, "tps": 27856, "wall": 48975.3} {"step": 20817, "train_loss": 3.3735554218292236, "lr": 0.00012770374035801343, "tps": 27854, "wall": 48980.9} {"step": 20818, "train_loss": 3.2690320014953613, "lr": 0.00012768729309079176, "tps": 27852, "wall": 48986.5} {"step": 20819, "train_loss": 3.3003642559051514, "lr": 0.00012767084686929342, "tps": 27850, "wall": 48992.0} {"step": 20820, "train_loss": 3.3669958114624023, "lr": 0.00012765440169370472, "tps": 27848, "wall": 48997.6} {"step": 20821, "train_loss": 3.2884302139282227, "lr": 0.00012763795756421192, "tps": 27846, "wall": 49003.2} {"step": 20822, "train_loss": 3.2362797260284424, "lr": 0.00012762151448100136, "tps": 27845, "wall": 49008.8} {"step": 20823, "train_loss": 3.2451584339141846, "lr": 0.0001276050724442593, "tps": 27843, "wall": 49014.3} {"step": 20824, "train_loss": 3.366111993789673, "lr": 0.00012758863145417192, "tps": 27841, "wall": 49019.9} {"step": 20825, "train_loss": 3.255378246307373, "lr": 0.00012757219151092558, "tps": 27839, "wall": 49025.4} {"step": 20826, "train_loss": 3.188307285308838, "lr": 0.00012755575261470646, "tps": 27837, "wall": 49031.0} {"step": 20827, "train_loss": 3.2561147212982178, "lr": 0.0001275393147657007, "tps": 27836, "wall": 49036.5} {"step": 20828, "train_loss": 3.3659067153930664, "lr": 0.00012752287796409468, "tps": 27834, "wall": 49042.1} {"step": 20829, "train_loss": 3.225496768951416, "lr": 0.00012750644221007446, "tps": 27832, "wall": 49047.6} {"step": 20830, "train_loss": 3.1789488792419434, "lr": 0.00012749000750382622, "tps": 27830, "wall": 49053.2} {"step": 20831, "train_loss": 3.2896807193756104, "lr": 0.00012747357384553624, "tps": 27828, "wall": 49058.7} {"step": 20832, "train_loss": 3.3769936561584473, "lr": 0.0001274571412353906, "tps": 27826, "wall": 49064.3} {"step": 20833, "train_loss": 3.4008846282958984, "lr": 0.00012744070967357545, "tps": 27825, "wall": 49069.9} {"step": 20834, "train_loss": 3.319591522216797, "lr": 0.00012742427916027699, "tps": 27823, "wall": 49075.4} {"step": 20835, "train_loss": 3.3217568397521973, "lr": 0.00012740784969568126, "tps": 27821, "wall": 49081.0} {"step": 20836, "train_loss": 3.2732396125793457, "lr": 0.00012739142127997445, "tps": 27819, "wall": 49086.5} {"step": 20837, "train_loss": 3.2805957794189453, "lr": 0.00012737499391334264, "tps": 27817, "wall": 49092.1} {"step": 20838, "train_loss": 3.274336814880371, "lr": 0.00012735856759597187, "tps": 27816, "wall": 49097.6} {"step": 20839, "train_loss": 3.315281867980957, "lr": 0.0001273421423280483, "tps": 27814, "wall": 49103.2} {"step": 20840, "train_loss": 3.290156364440918, "lr": 0.00012732571810975796, "tps": 27812, "wall": 49108.8} {"step": 20841, "train_loss": 3.2706100940704346, "lr": 0.00012730929494128682, "tps": 27810, "wall": 49114.5} {"step": 20842, "train_loss": 3.258126735687256, "lr": 0.00012729287282282109, "tps": 27808, "wall": 49120.2} {"step": 20843, "train_loss": 3.3189444541931152, "lr": 0.00012727645175454667, "tps": 27806, "wall": 49125.7} {"step": 20844, "train_loss": 3.3362278938293457, "lr": 0.0001272600317366496, "tps": 27805, "wall": 49131.3} {"step": 20845, "train_loss": 3.3815274238586426, "lr": 0.00012724361276931595, "tps": 27803, "wall": 49136.9} {"step": 20846, "train_loss": 3.280132532119751, "lr": 0.00012722719485273168, "tps": 27801, "wall": 49142.5} {"step": 20847, "train_loss": 3.361588954925537, "lr": 0.00012721077798708268, "tps": 27799, "wall": 49148.1} {"step": 20848, "train_loss": 3.305976629257202, "lr": 0.00012719436217255512, "tps": 27797, "wall": 49153.6} {"step": 20849, "train_loss": 3.2896342277526855, "lr": 0.00012717794740933481, "tps": 27795, "wall": 49159.2} {"step": 20850, "train_loss": 3.3623907566070557, "lr": 0.00012716153369760768, "tps": 27794, "wall": 49164.9} {"step": 20851, "train_loss": 3.355586528778076, "lr": 0.00012714512103755978, "tps": 27792, "wall": 49170.4} {"step": 20852, "train_loss": 3.2328193187713623, "lr": 0.0001271287094293769, "tps": 27790, "wall": 49176.1} {"step": 20853, "train_loss": 3.256606101989746, "lr": 0.0001271122988732451, "tps": 27788, "wall": 49181.6} {"step": 20854, "train_loss": 3.190728187561035, "lr": 0.00012709588936935022, "tps": 27786, "wall": 49187.2} {"step": 20855, "train_loss": 3.3508379459381104, "lr": 0.00012707948091787802, "tps": 27784, "wall": 49192.7} {"step": 20856, "train_loss": 3.326925277709961, "lr": 0.0001270630735190146, "tps": 27783, "wall": 49198.3} {"step": 20857, "train_loss": 3.3593056201934814, "lr": 0.00012704666717294568, "tps": 27781, "wall": 49203.8} {"step": 20858, "train_loss": 3.2403087615966797, "lr": 0.00012703026187985708, "tps": 27779, "wall": 49209.4} {"step": 20859, "train_loss": 3.41506290435791, "lr": 0.00012701385763993478, "tps": 27777, "wall": 49214.9} {"step": 20860, "train_loss": 3.3399085998535156, "lr": 0.00012699745445336454, "tps": 27775, "wall": 49220.5} {"step": 20861, "train_loss": 3.25148344039917, "lr": 0.00012698105232033206, "tps": 27774, "wall": 49226.1} {"step": 20862, "train_loss": 3.2117767333984375, "lr": 0.00012696465124102337, "tps": 27772, "wall": 49231.7} {"step": 20863, "train_loss": 3.3462154865264893, "lr": 0.00012694825121562411, "tps": 27770, "wall": 49237.3} {"step": 20864, "train_loss": 3.332975387573242, "lr": 0.00012693185224432003, "tps": 27768, "wall": 49243.0} {"step": 20865, "train_loss": 3.318737506866455, "lr": 0.00012691545432729702, "tps": 27766, "wall": 49248.6} {"step": 20866, "train_loss": 3.367788314819336, "lr": 0.0001268990574647408, "tps": 27764, "wall": 49254.2} {"step": 20867, "train_loss": 3.2793707847595215, "lr": 0.00012688266165683705, "tps": 27763, "wall": 49259.7} {"step": 20868, "train_loss": 3.1997828483581543, "lr": 0.00012686626690377157, "tps": 27761, "wall": 49265.3} {"step": 20869, "train_loss": 3.2763583660125732, "lr": 0.00012684987320573009, "tps": 27759, "wall": 49270.9} {"step": 20870, "train_loss": 3.3127760887145996, "lr": 0.00012683348056289817, "tps": 27757, "wall": 49276.5} {"step": 20871, "train_loss": 3.2624876499176025, "lr": 0.00012681708897546175, "tps": 27755, "wall": 49282.1} {"step": 20872, "train_loss": 3.301393747329712, "lr": 0.00012680069844360627, "tps": 27754, "wall": 49287.6} {"step": 20873, "train_loss": 3.364725112915039, "lr": 0.00012678430896751762, "tps": 27752, "wall": 49293.3} {"step": 20874, "train_loss": 3.2742388248443604, "lr": 0.00012676792054738134, "tps": 27750, "wall": 49298.8} {"step": 20875, "train_loss": 3.2923288345336914, "lr": 0.00012675153318338303, "tps": 27748, "wall": 49304.4} {"step": 20876, "train_loss": 3.3579816818237305, "lr": 0.00012673514687570848, "tps": 27746, "wall": 49310.0} {"step": 20877, "train_loss": 3.275790214538574, "lr": 0.00012671876162454325, "tps": 27744, "wall": 49315.6} {"step": 20878, "train_loss": 3.370515823364258, "lr": 0.00012670237743007284, "tps": 27743, "wall": 49321.2} {"step": 20879, "train_loss": 3.2045798301696777, "lr": 0.000126685994292483, "tps": 27741, "wall": 49326.7} {"step": 20880, "train_loss": 3.3460116386413574, "lr": 0.00012666961221195929, "tps": 27739, "wall": 49332.3} {"step": 20881, "train_loss": 3.2148215770721436, "lr": 0.00012665323118868718, "tps": 27737, "wall": 49337.9} {"step": 20882, "train_loss": 3.238558769226074, "lr": 0.00012663685122285242, "tps": 27735, "wall": 49343.5} {"step": 20883, "train_loss": 3.2511086463928223, "lr": 0.0001266204723146404, "tps": 27734, "wall": 49349.0} {"step": 20884, "train_loss": 3.244946241378784, "lr": 0.0001266040944642367, "tps": 27732, "wall": 49354.7} {"step": 20885, "train_loss": 3.302706241607666, "lr": 0.00012658771767182691, "tps": 27730, "wall": 49360.3} {"step": 20886, "train_loss": 3.230463981628418, "lr": 0.00012657134193759653, "tps": 27728, "wall": 49365.8} {"step": 20887, "train_loss": 3.330068588256836, "lr": 0.00012655496726173097, "tps": 27726, "wall": 49371.4} {"step": 20888, "train_loss": 3.318269729614258, "lr": 0.00012653859364441584, "tps": 27725, "wall": 49377.0} {"step": 20889, "train_loss": 3.2330820560455322, "lr": 0.00012652222108583655, "tps": 27723, "wall": 49382.6} {"step": 20890, "train_loss": 3.4312078952789307, "lr": 0.00012650584958617865, "tps": 27721, "wall": 49388.1} {"step": 20891, "train_loss": 3.246858835220337, "lr": 0.00012648947914562753, "tps": 27719, "wall": 49393.7} {"step": 20892, "train_loss": 3.3299057483673096, "lr": 0.0001264731097643686, "tps": 27717, "wall": 49399.3} {"step": 20893, "train_loss": 3.367069721221924, "lr": 0.00012645674144258742, "tps": 27716, "wall": 49404.8} {"step": 20894, "train_loss": 3.3516759872436523, "lr": 0.00012644037418046929, "tps": 27714, "wall": 49410.4} {"step": 20895, "train_loss": 3.3744101524353027, "lr": 0.00012642400797819962, "tps": 27712, "wall": 49416.0} {"step": 20896, "train_loss": 3.450634002685547, "lr": 0.00012640764283596391, "tps": 27710, "wall": 49421.6} {"step": 20897, "train_loss": 3.3054966926574707, "lr": 0.0001263912787539475, "tps": 27708, "wall": 49427.2} {"step": 20898, "train_loss": 3.354461193084717, "lr": 0.00012637491573233564, "tps": 27707, "wall": 49432.7} {"step": 20899, "train_loss": 3.290107488632202, "lr": 0.0001263585537713139, "tps": 27705, "wall": 49438.3} {"step": 20900, "train_loss": 3.2092199325561523, "lr": 0.00012634219287106755, "tps": 27703, "wall": 49443.9} {"step": 20901, "train_loss": 3.2563743591308594, "lr": 0.00012632583303178181, "tps": 27701, "wall": 49449.5} {"step": 20902, "train_loss": 3.3363022804260254, "lr": 0.0001263094742536422, "tps": 27699, "wall": 49455.1} {"step": 20903, "train_loss": 3.3590900897979736, "lr": 0.0001262931165368339, "tps": 27698, "wall": 49460.7} {"step": 20904, "train_loss": 3.4226818084716797, "lr": 0.0001262767598815422, "tps": 27696, "wall": 49466.2} {"step": 20905, "train_loss": 3.45394229888916, "lr": 0.00012626040428795245, "tps": 27694, "wall": 49471.8} {"step": 20906, "train_loss": 3.3175437450408936, "lr": 0.00012624404975624995, "tps": 27692, "wall": 49477.5} {"step": 20907, "train_loss": 3.3320140838623047, "lr": 0.00012622769628661988, "tps": 27690, "wall": 49483.0} {"step": 20908, "train_loss": 3.3512487411499023, "lr": 0.0001262113438792476, "tps": 27689, "wall": 49488.6} {"step": 20909, "train_loss": 3.2674312591552734, "lr": 0.00012619499253431818, "tps": 27687, "wall": 49494.1} {"step": 20910, "train_loss": 3.3110079765319824, "lr": 0.00012617864225201707, "tps": 27685, "wall": 49499.7} {"step": 20911, "train_loss": 3.3232998847961426, "lr": 0.00012616229303252937, "tps": 27683, "wall": 49505.3} {"step": 20912, "train_loss": 3.1585826873779297, "lr": 0.0001261459448760402, "tps": 27681, "wall": 49510.9} {"step": 20913, "train_loss": 3.297788143157959, "lr": 0.00012612959778273493, "tps": 27680, "wall": 49516.6} {"step": 20914, "train_loss": 3.3786702156066895, "lr": 0.00012611325175279867, "tps": 27678, "wall": 49522.1} {"step": 20915, "train_loss": 3.3148066997528076, "lr": 0.00012609690678641648, "tps": 27676, "wall": 49527.7} {"step": 20916, "train_loss": 3.3220348358154297, "lr": 0.00012608056288377368, "tps": 27674, "wall": 49533.4} {"step": 20917, "train_loss": 3.254545211791992, "lr": 0.00012606422004505534, "tps": 27672, "wall": 49538.9} {"step": 20918, "train_loss": 3.3667359352111816, "lr": 0.00012604787827044653, "tps": 27671, "wall": 49544.5} {"step": 20919, "train_loss": 3.2629308700561523, "lr": 0.00012603153756013256, "tps": 27669, "wall": 49550.1} {"step": 20920, "train_loss": 3.384843349456787, "lr": 0.00012601519791429836, "tps": 27667, "wall": 49555.6} {"step": 20921, "train_loss": 3.3394582271575928, "lr": 0.000125998859333129, "tps": 27665, "wall": 49561.2} {"step": 20922, "train_loss": 3.325448513031006, "lr": 0.00012598252181680977, "tps": 27663, "wall": 49566.8} {"step": 20923, "train_loss": 3.3410675525665283, "lr": 0.0001259661853655256, "tps": 27662, "wall": 49572.4} {"step": 20924, "train_loss": 3.3166441917419434, "lr": 0.00012594984997946147, "tps": 27660, "wall": 49578.0} {"step": 20925, "train_loss": 3.318913221359253, "lr": 0.0001259335156588026, "tps": 27658, "wall": 49583.6} {"step": 20926, "train_loss": 3.2508301734924316, "lr": 0.0001259171824037339, "tps": 27656, "wall": 49589.2} {"step": 20927, "train_loss": 3.267448902130127, "lr": 0.00012590085021444054, "tps": 27654, "wall": 49594.8} {"step": 20928, "train_loss": 3.3190178871154785, "lr": 0.0001258845190911074, "tps": 27653, "wall": 49600.4} {"step": 20929, "train_loss": 3.3113269805908203, "lr": 0.0001258681890339195, "tps": 27651, "wall": 49606.0} {"step": 20930, "train_loss": 3.226457357406616, "lr": 0.00012585186004306187, "tps": 27649, "wall": 49611.5} {"step": 20931, "train_loss": 3.18802809715271, "lr": 0.00012583553211871945, "tps": 27647, "wall": 49617.1} {"step": 20932, "train_loss": 3.1953208446502686, "lr": 0.0001258192052610772, "tps": 27645, "wall": 49622.7} {"step": 20933, "train_loss": 3.2836380004882812, "lr": 0.0001258028794703201, "tps": 27644, "wall": 49628.3} {"step": 20934, "train_loss": 3.2494568824768066, "lr": 0.00012578655474663312, "tps": 27642, "wall": 49633.9} {"step": 20935, "train_loss": 3.2819578647613525, "lr": 0.00012577023109020108, "tps": 27640, "wall": 49639.4} {"step": 20936, "train_loss": 3.287342071533203, "lr": 0.00012575390850120898, "tps": 27638, "wall": 49645.0} {"step": 20937, "train_loss": 3.1626131534576416, "lr": 0.00012573758697984175, "tps": 27637, "wall": 49650.5} {"step": 20938, "train_loss": 3.2800722122192383, "lr": 0.00012572126652628414, "tps": 27635, "wall": 49656.2} {"step": 20939, "train_loss": 3.1842198371887207, "lr": 0.00012570494714072124, "tps": 27633, "wall": 49661.8} {"step": 20940, "train_loss": 3.3476219177246094, "lr": 0.00012568862882333774, "tps": 27631, "wall": 49667.3} {"step": 20941, "train_loss": 3.204270124435425, "lr": 0.0001256723115743185, "tps": 27629, "wall": 49673.0} {"step": 20942, "train_loss": 3.3286471366882324, "lr": 0.00012565599539384853, "tps": 27628, "wall": 49678.5} {"step": 20943, "train_loss": 3.3440380096435547, "lr": 0.00012563968028211242, "tps": 27626, "wall": 49684.1} {"step": 20944, "train_loss": 3.234121084213257, "lr": 0.0001256233662392952, "tps": 27624, "wall": 49689.7} {"step": 20945, "train_loss": 3.244779348373413, "lr": 0.0001256070532655816, "tps": 27622, "wall": 49695.3} {"step": 20946, "train_loss": 3.30861234664917, "lr": 0.00012559074136115635, "tps": 27620, "wall": 49700.8} {"step": 20947, "train_loss": 3.3232662677764893, "lr": 0.00012557443052620436, "tps": 27619, "wall": 49706.4} {"step": 20948, "train_loss": 3.3086941242218018, "lr": 0.0001255581207609103, "tps": 27617, "wall": 49712.0} {"step": 20949, "train_loss": 3.3560400009155273, "lr": 0.00012554181206545891, "tps": 27615, "wall": 49717.7} {"step": 20950, "train_loss": 3.292729377746582, "lr": 0.00012552550444003505, "tps": 27613, "wall": 49723.3} {"step": 20951, "train_loss": 3.1426382064819336, "lr": 0.00012550919788482338, "tps": 27611, "wall": 49728.8} {"step": 20952, "train_loss": 3.2711448669433594, "lr": 0.0001254928924000086, "tps": 27610, "wall": 49734.4} {"step": 20953, "train_loss": 3.3267831802368164, "lr": 0.00012547658798577546, "tps": 27608, "wall": 49740.0} {"step": 20954, "train_loss": 3.227012872695923, "lr": 0.00012546028464230865, "tps": 27606, "wall": 49745.6} {"step": 20955, "train_loss": 3.2700273990631104, "lr": 0.0001254439823697928, "tps": 27604, "wall": 49751.1} {"step": 20956, "train_loss": 3.2744626998901367, "lr": 0.00012542768116841272, "tps": 27603, "wall": 49756.7} {"step": 20957, "train_loss": 3.4243505001068115, "lr": 0.00012541138103835294, "tps": 27601, "wall": 49762.3} {"step": 20958, "train_loss": 3.24589204788208, "lr": 0.00012539508197979813, "tps": 27599, "wall": 49767.9} {"step": 20959, "train_loss": 3.3489830493927, "lr": 0.000125378783992933, "tps": 27597, "wall": 49773.6} {"step": 20960, "train_loss": 3.3231112957000732, "lr": 0.0001253624870779421, "tps": 27595, "wall": 49779.1} {"step": 20961, "train_loss": 3.2518653869628906, "lr": 0.00012534619123501, "tps": 27594, "wall": 49784.7} {"step": 20962, "train_loss": 3.3641011714935303, "lr": 0.00012532989646432148, "tps": 27592, "wall": 49790.3} {"step": 20963, "train_loss": 3.336348056793213, "lr": 0.0001253136027660609, "tps": 27590, "wall": 49795.9} {"step": 20964, "train_loss": 3.2708945274353027, "lr": 0.00012529731014041304, "tps": 27588, "wall": 49801.5} {"step": 20965, "train_loss": 3.2521257400512695, "lr": 0.00012528101858756238, "tps": 27587, "wall": 49807.0} {"step": 20966, "train_loss": 3.310741901397705, "lr": 0.0001252647281076934, "tps": 27585, "wall": 49812.6} {"step": 20967, "train_loss": 3.2507219314575195, "lr": 0.00012524843870099074, "tps": 27583, "wall": 49818.2} {"step": 20968, "train_loss": 3.231812000274658, "lr": 0.00012523215036763894, "tps": 27581, "wall": 49823.9} {"step": 20969, "train_loss": 3.2274417877197266, "lr": 0.00012521586310782235, "tps": 27579, "wall": 49829.5} {"step": 20970, "train_loss": 3.2547671794891357, "lr": 0.0001251995769217257, "tps": 27578, "wall": 49835.1} {"step": 20971, "train_loss": 3.2860655784606934, "lr": 0.00012518329180953334, "tps": 27576, "wall": 49840.6} {"step": 20972, "train_loss": 3.358961582183838, "lr": 0.00012516700777142972, "tps": 27574, "wall": 49846.2} {"step": 20973, "train_loss": 3.288257360458374, "lr": 0.00012515072480759947, "tps": 27572, "wall": 49851.8} {"step": 20974, "train_loss": 3.218778133392334, "lr": 0.0001251344429182269, "tps": 27570, "wall": 49857.4} {"step": 20975, "train_loss": 3.3619136810302734, "lr": 0.00012511816210349641, "tps": 27569, "wall": 49863.0} {"step": 20976, "train_loss": 3.279036521911621, "lr": 0.00012510188236359264, "tps": 27567, "wall": 49868.5} {"step": 20977, "train_loss": 3.3383989334106445, "lr": 0.00012508560369869982, "tps": 27565, "wall": 49874.2} {"step": 20978, "train_loss": 3.2465624809265137, "lr": 0.00012506932610900238, "tps": 27563, "wall": 49879.8} {"step": 20979, "train_loss": 3.2729668617248535, "lr": 0.0001250530495946848, "tps": 27562, "wall": 49885.3} {"step": 20980, "train_loss": 3.2402267456054688, "lr": 0.0001250367741559314, "tps": 27560, "wall": 49890.9} {"step": 20981, "train_loss": 3.3443620204925537, "lr": 0.00012502049979292655, "tps": 27558, "wall": 49896.6} {"step": 20982, "train_loss": 3.2969226837158203, "lr": 0.00012500422650585464, "tps": 27556, "wall": 49902.2} {"step": 20983, "train_loss": 3.323331117630005, "lr": 0.00012498795429489995, "tps": 27554, "wall": 49907.8} {"step": 20984, "train_loss": 3.3190674781799316, "lr": 0.0001249716831602469, "tps": 27553, "wall": 49913.3} {"step": 20985, "train_loss": 3.308016300201416, "lr": 0.00012495541310207978, "tps": 27551, "wall": 49919.0} {"step": 20986, "train_loss": 3.3866236209869385, "lr": 0.00012493914412058275, "tps": 27549, "wall": 49924.5} {"step": 20987, "train_loss": 3.2122180461883545, "lr": 0.00012492287621594037, "tps": 27547, "wall": 49930.1} {"step": 20988, "train_loss": 3.2914185523986816, "lr": 0.00012490660938833682, "tps": 27546, "wall": 49935.7} {"step": 20989, "train_loss": 3.2599709033966064, "lr": 0.00012489034363795626, "tps": 27544, "wall": 49941.3} {"step": 20990, "train_loss": 3.3486099243164062, "lr": 0.00012487407896498312, "tps": 27542, "wall": 49946.9} {"step": 20991, "train_loss": 3.2608401775360107, "lr": 0.00012485781536960143, "tps": 27540, "wall": 49952.4} {"step": 20992, "train_loss": 3.3055968284606934, "lr": 0.00012484155285199565, "tps": 27539, "wall": 49958.1} {"step": 20993, "train_loss": 3.3079166412353516, "lr": 0.00012482529141234988, "tps": 27537, "wall": 49963.7} {"step": 20994, "train_loss": 3.251014232635498, "lr": 0.0001248090310508483, "tps": 27535, "wall": 49969.3} {"step": 20995, "train_loss": 3.302687168121338, "lr": 0.00012479277176767525, "tps": 27533, "wall": 49974.9} {"step": 20996, "train_loss": 3.4297842979431152, "lr": 0.00012477651356301484, "tps": 27531, "wall": 49980.5} {"step": 20997, "train_loss": 3.184732437133789, "lr": 0.00012476025643705114, "tps": 27530, "wall": 49986.0} {"step": 20998, "train_loss": 3.3077826499938965, "lr": 0.00012474400038996848, "tps": 27528, "wall": 49991.6} {"step": 20999, "train_loss": 3.194211483001709, "lr": 0.00012472774542195096, "tps": 27526, "wall": 49997.1} {"step": 21000, "train_loss": 3.315535545349121, "lr": 0.00012471149153318257, "tps": 27524, "wall": 50002.7, "val_loss_monitor": 3.365751841905295} {"step": 21001, "train_loss": 3.386967182159424, "lr": 0.0001246952387238477, "tps": 27503, "wall": 50044.6} {"step": 21002, "train_loss": 3.248457431793213, "lr": 0.00012467898699413028, "tps": 27501, "wall": 50050.2} {"step": 21003, "train_loss": 3.214597225189209, "lr": 0.00012466273634421438, "tps": 27499, "wall": 50055.8} {"step": 21004, "train_loss": 3.287109136581421, "lr": 0.00012464648677428425, "tps": 27497, "wall": 50061.4} {"step": 21005, "train_loss": 3.312579870223999, "lr": 0.0001246302382845238, "tps": 27496, "wall": 50067.1} {"step": 21006, "train_loss": 3.270007610321045, "lr": 0.00012461399087511724, "tps": 27494, "wall": 50072.8} {"step": 21007, "train_loss": 3.2461838722229004, "lr": 0.00012459774454624855, "tps": 27492, "wall": 50078.5} {"step": 21008, "train_loss": 3.1950795650482178, "lr": 0.0001245814992981017, "tps": 27490, "wall": 50084.1} {"step": 21009, "train_loss": 3.3086743354797363, "lr": 0.00012456525513086087, "tps": 27488, "wall": 50089.7} {"step": 21010, "train_loss": 3.2082412242889404, "lr": 0.00012454901204470996, "tps": 27487, "wall": 50095.4} {"step": 21011, "train_loss": 3.280073881149292, "lr": 0.00012453277003983296, "tps": 27485, "wall": 50101.0} {"step": 21012, "train_loss": 3.346400737762451, "lr": 0.00012451652911641398, "tps": 27483, "wall": 50106.7} {"step": 21013, "train_loss": 3.3575873374938965, "lr": 0.00012450028927463692, "tps": 27481, "wall": 50112.3} {"step": 21014, "train_loss": 3.32645320892334, "lr": 0.00012448405051468565, "tps": 27479, "wall": 50118.0} {"step": 21015, "train_loss": 3.3853964805603027, "lr": 0.00012446781283674432, "tps": 27478, "wall": 50123.6} {"step": 21016, "train_loss": 3.400472640991211, "lr": 0.0001244515762409968, "tps": 27476, "wall": 50129.3} {"step": 21017, "train_loss": 3.2713634967803955, "lr": 0.00012443534072762688, "tps": 27474, "wall": 50135.0} {"step": 21018, "train_loss": 3.2792224884033203, "lr": 0.00012441910629681867, "tps": 27472, "wall": 50140.7} {"step": 21019, "train_loss": 3.315351963043213, "lr": 0.000124402872948756, "tps": 27470, "wall": 50146.3} {"step": 21020, "train_loss": 3.281146764755249, "lr": 0.0001243866406836227, "tps": 27469, "wall": 50151.9} {"step": 21021, "train_loss": 3.3433828353881836, "lr": 0.00012437040950160277, "tps": 27467, "wall": 50157.6} {"step": 21022, "train_loss": 3.251753807067871, "lr": 0.00012435417940287992, "tps": 27465, "wall": 50163.2} {"step": 21023, "train_loss": 3.284292697906494, "lr": 0.00012433795038763822, "tps": 27463, "wall": 50168.9} {"step": 21024, "train_loss": 3.398453712463379, "lr": 0.00012432172245606136, "tps": 27462, "wall": 50174.5} {"step": 21025, "train_loss": 3.321485996246338, "lr": 0.0001243054956083331, "tps": 27460, "wall": 50180.2} {"step": 21026, "train_loss": 3.2912633419036865, "lr": 0.0001242892698446375, "tps": 27458, "wall": 50185.8} {"step": 21027, "train_loss": 3.2466623783111572, "lr": 0.00012427304516515817, "tps": 27456, "wall": 50191.4} {"step": 21028, "train_loss": 3.2509050369262695, "lr": 0.00012425682157007895, "tps": 27454, "wall": 50197.2} {"step": 21029, "train_loss": 3.337761402130127, "lr": 0.00012424059905958367, "tps": 27453, "wall": 50202.8} {"step": 21030, "train_loss": 3.3527755737304688, "lr": 0.00012422437763385608, "tps": 27451, "wall": 50208.4} {"step": 21031, "train_loss": 3.324955463409424, "lr": 0.00012420815729307985, "tps": 27449, "wall": 50214.0} {"step": 21032, "train_loss": 3.296184778213501, "lr": 0.00012419193803743885, "tps": 27447, "wall": 50219.7} {"step": 21033, "train_loss": 3.2475407123565674, "lr": 0.00012417571986711676, "tps": 27446, "wall": 50225.2} {"step": 21034, "train_loss": 3.227871894836426, "lr": 0.00012415950278229723, "tps": 27444, "wall": 50230.9} {"step": 21035, "train_loss": 3.2877516746520996, "lr": 0.00012414328678316415, "tps": 27442, "wall": 50236.5} {"step": 21036, "train_loss": 3.316765785217285, "lr": 0.00012412707186990103, "tps": 27440, "wall": 50242.2} {"step": 21037, "train_loss": 3.3217742443084717, "lr": 0.00012411085804269162, "tps": 27438, "wall": 50247.8} {"step": 21038, "train_loss": 3.3222968578338623, "lr": 0.00012409464530171963, "tps": 27437, "wall": 50253.5} {"step": 21039, "train_loss": 3.342794895172119, "lr": 0.00012407843364716862, "tps": 27435, "wall": 50259.0} {"step": 21040, "train_loss": 3.145806312561035, "lr": 0.00012406222307922236, "tps": 27433, "wall": 50264.6} {"step": 21041, "train_loss": 3.254514694213867, "lr": 0.00012404601359806446, "tps": 27431, "wall": 50270.2} {"step": 21042, "train_loss": 3.3628828525543213, "lr": 0.00012402980520387843, "tps": 27430, "wall": 50275.9} {"step": 21043, "train_loss": 3.3327534198760986, "lr": 0.00012401359789684805, "tps": 27428, "wall": 50281.5} {"step": 21044, "train_loss": 3.1347408294677734, "lr": 0.00012399739167715678, "tps": 27426, "wall": 50287.1} {"step": 21045, "train_loss": 3.332566499710083, "lr": 0.0001239811865449882, "tps": 27424, "wall": 50292.7} {"step": 21046, "train_loss": 3.2762115001678467, "lr": 0.000123964982500526, "tps": 27423, "wall": 50298.3} {"step": 21047, "train_loss": 3.4101619720458984, "lr": 0.0001239487795439537, "tps": 27421, "wall": 50303.9} {"step": 21048, "train_loss": 3.2404301166534424, "lr": 0.00012393257767545472, "tps": 27419, "wall": 50309.4} {"step": 21049, "train_loss": 3.3393349647521973, "lr": 0.00012391637689521278, "tps": 27417, "wall": 50315.1} {"step": 21050, "train_loss": 3.358623504638672, "lr": 0.00012390017720341132, "tps": 27416, "wall": 50320.7} {"step": 21051, "train_loss": 3.181363105773926, "lr": 0.00012388397860023379, "tps": 27414, "wall": 50326.3} {"step": 21052, "train_loss": 3.378176212310791, "lr": 0.00012386778108586382, "tps": 27412, "wall": 50331.8} {"step": 21053, "train_loss": 3.2324376106262207, "lr": 0.0001238515846604848, "tps": 27410, "wall": 50337.4} {"step": 21054, "train_loss": 3.3021962642669678, "lr": 0.00012383538932428018, "tps": 27409, "wall": 50343.0} {"step": 21055, "train_loss": 3.292752265930176, "lr": 0.00012381919507743354, "tps": 27407, "wall": 50348.6} {"step": 21056, "train_loss": 3.4018068313598633, "lr": 0.00012380300192012825, "tps": 27405, "wall": 50354.2} {"step": 21057, "train_loss": 3.3356332778930664, "lr": 0.0001237868098525477, "tps": 27403, "wall": 50359.9} {"step": 21058, "train_loss": 3.2782673835754395, "lr": 0.00012377061887487546, "tps": 27402, "wall": 50365.4} {"step": 21059, "train_loss": 3.355924129486084, "lr": 0.00012375442898729478, "tps": 27400, "wall": 50371.1} {"step": 21060, "train_loss": 3.1782259941101074, "lr": 0.00012373824018998918, "tps": 27398, "wall": 50376.7} {"step": 21061, "train_loss": 3.356959342956543, "lr": 0.00012372205248314198, "tps": 27396, "wall": 50382.3} {"step": 21062, "train_loss": 3.273714542388916, "lr": 0.00012370586586693655, "tps": 27395, "wall": 50387.8} {"step": 21063, "train_loss": 3.1582388877868652, "lr": 0.00012368968034155638, "tps": 27393, "wall": 50393.4} {"step": 21064, "train_loss": 3.3691177368164062, "lr": 0.00012367349590718465, "tps": 27391, "wall": 50399.0} {"step": 21065, "train_loss": 3.2698004245758057, "lr": 0.00012365731256400476, "tps": 27389, "wall": 50404.6} {"step": 21066, "train_loss": 3.2650418281555176, "lr": 0.0001236411303122001, "tps": 27388, "wall": 50410.2} {"step": 21067, "train_loss": 3.3526835441589355, "lr": 0.00012362494915195389, "tps": 27386, "wall": 50415.8} {"step": 21068, "train_loss": 3.4536292552948, "lr": 0.00012360876908344945, "tps": 27384, "wall": 50421.4} {"step": 21069, "train_loss": 3.32877779006958, "lr": 0.00012359259010687014, "tps": 27383, "wall": 50427.0} {"step": 21070, "train_loss": 3.2904562950134277, "lr": 0.0001235764122223992, "tps": 27381, "wall": 50432.6} {"step": 21071, "train_loss": 3.3304126262664795, "lr": 0.00012356023543021974, "tps": 27379, "wall": 50438.2} {"step": 21072, "train_loss": 3.359886646270752, "lr": 0.0001235440597305153, "tps": 27377, "wall": 50443.8} {"step": 21073, "train_loss": 3.339907169342041, "lr": 0.00012352788512346894, "tps": 27376, "wall": 50449.4} {"step": 21074, "train_loss": 3.3190252780914307, "lr": 0.00012351171160926384, "tps": 27374, "wall": 50455.0} {"step": 21075, "train_loss": 3.3293118476867676, "lr": 0.0001234955391880834, "tps": 27372, "wall": 50460.6} {"step": 21076, "train_loss": 3.290313720703125, "lr": 0.00012347936786011058, "tps": 27370, "wall": 50466.2} {"step": 21077, "train_loss": 3.232786178588867, "lr": 0.0001234631976255288, "tps": 27369, "wall": 50471.8} {"step": 21078, "train_loss": 3.286997079849243, "lr": 0.00012344702848452116, "tps": 27367, "wall": 50477.4} {"step": 21079, "train_loss": 3.2852091789245605, "lr": 0.00012343086043727072, "tps": 27365, "wall": 50483.0} {"step": 21080, "train_loss": 3.31821870803833, "lr": 0.0001234146934839608, "tps": 27363, "wall": 50488.6} {"step": 21081, "train_loss": 3.1408309936523438, "lr": 0.00012339852762477445, "tps": 27362, "wall": 50494.2} {"step": 21082, "train_loss": 3.3093392848968506, "lr": 0.0001233823628598947, "tps": 27360, "wall": 50499.8} {"step": 21083, "train_loss": 3.309018135070801, "lr": 0.0001233661991895049, "tps": 27358, "wall": 50505.4} {"step": 21084, "train_loss": 3.3432071208953857, "lr": 0.00012335003661378797, "tps": 27356, "wall": 50511.0} {"step": 21085, "train_loss": 3.2064218521118164, "lr": 0.000123333875132927, "tps": 27355, "wall": 50516.6} {"step": 21086, "train_loss": 3.1803293228149414, "lr": 0.00012331771474710524, "tps": 27353, "wall": 50522.3} {"step": 21087, "train_loss": 3.316340684890747, "lr": 0.00012330155545650556, "tps": 27351, "wall": 50527.9} {"step": 21088, "train_loss": 3.3229482173919678, "lr": 0.00012328539726131108, "tps": 27349, "wall": 50533.5} {"step": 21089, "train_loss": 3.165853500366211, "lr": 0.00012326924016170486, "tps": 27348, "wall": 50539.1} {"step": 21090, "train_loss": 3.3667330741882324, "lr": 0.00012325308415786997, "tps": 27346, "wall": 50544.7} {"step": 21091, "train_loss": 3.2992873191833496, "lr": 0.0001232369292499893, "tps": 27344, "wall": 50550.4} {"step": 21092, "train_loss": 3.2773654460906982, "lr": 0.000123220775438246, "tps": 27342, "wall": 50556.1} {"step": 21093, "train_loss": 3.2371432781219482, "lr": 0.00012320462272282293, "tps": 27341, "wall": 50561.7} {"step": 21094, "train_loss": 3.3204870223999023, "lr": 0.00012318847110390316, "tps": 27339, "wall": 50567.3} {"step": 21095, "train_loss": 3.3239824771881104, "lr": 0.00012317232058166967, "tps": 27337, "wall": 50572.9} {"step": 21096, "train_loss": 3.2502522468566895, "lr": 0.0001231561711563053, "tps": 27335, "wall": 50578.5} {"step": 21097, "train_loss": 3.2705841064453125, "lr": 0.0001231400228279931, "tps": 27334, "wall": 50584.1} {"step": 21098, "train_loss": 3.2756147384643555, "lr": 0.000123123875596916, "tps": 27332, "wall": 50589.7} {"step": 21099, "train_loss": 3.3181509971618652, "lr": 0.00012310772946325677, "tps": 27330, "wall": 50595.3} {"step": 21100, "train_loss": 3.2803049087524414, "lr": 0.0001230915844271985, "tps": 27329, "wall": 50600.9} {"step": 21101, "train_loss": 3.302751302719116, "lr": 0.000123075440488924, "tps": 27327, "wall": 50606.5} {"step": 21102, "train_loss": 3.3366870880126953, "lr": 0.00012305929764861614, "tps": 27325, "wall": 50612.2} {"step": 21103, "train_loss": 3.290933132171631, "lr": 0.0001230431559064578, "tps": 27323, "wall": 50617.9} {"step": 21104, "train_loss": 3.2725472450256348, "lr": 0.0001230270152626319, "tps": 27322, "wall": 50623.4} {"step": 21105, "train_loss": 3.314836025238037, "lr": 0.0001230108757173211, "tps": 27320, "wall": 50629.1} {"step": 21106, "train_loss": 3.357402801513672, "lr": 0.0001229947372707084, "tps": 27318, "wall": 50634.7} {"step": 21107, "train_loss": 3.268656015396118, "lr": 0.00012297859992297663, "tps": 27316, "wall": 50640.3} {"step": 21108, "train_loss": 3.2179903984069824, "lr": 0.00012296246367430843, "tps": 27315, "wall": 50645.9} {"step": 21109, "train_loss": 3.357407569885254, "lr": 0.0001229463285248867, "tps": 27313, "wall": 50651.5} {"step": 21110, "train_loss": 3.390888214111328, "lr": 0.0001229301944748943, "tps": 27311, "wall": 50657.2} {"step": 21111, "train_loss": 3.342041015625, "lr": 0.0001229140615245138, "tps": 27309, "wall": 50662.7} {"step": 21112, "train_loss": 3.337661027908325, "lr": 0.00012289792967392813, "tps": 27308, "wall": 50668.3} {"step": 21113, "train_loss": 3.3302650451660156, "lr": 0.0001228817989233199, "tps": 27306, "wall": 50674.0} {"step": 21114, "train_loss": 3.3406412601470947, "lr": 0.00012286566927287198, "tps": 27304, "wall": 50679.6} {"step": 21115, "train_loss": 3.2059953212738037, "lr": 0.000122849540722767, "tps": 27302, "wall": 50685.3} {"step": 21116, "train_loss": 3.3203206062316895, "lr": 0.00012283341327318765, "tps": 27301, "wall": 50690.9} {"step": 21117, "train_loss": 3.3198599815368652, "lr": 0.00012281728692431666, "tps": 27299, "wall": 50696.5} {"step": 21118, "train_loss": 3.2410993576049805, "lr": 0.00012280116167633673, "tps": 27297, "wall": 50702.1} {"step": 21119, "train_loss": 3.2432069778442383, "lr": 0.00012278503752943042, "tps": 27296, "wall": 50707.7} {"step": 21120, "train_loss": 3.333847999572754, "lr": 0.00012276891448378057, "tps": 27294, "wall": 50713.3} {"step": 21121, "train_loss": 3.298837184906006, "lr": 0.00012275279253956968, "tps": 27292, "wall": 50718.9} {"step": 21122, "train_loss": 3.351348400115967, "lr": 0.00012273667169698034, "tps": 27290, "wall": 50724.5} {"step": 21123, "train_loss": 3.284606456756592, "lr": 0.00012272055195619537, "tps": 27289, "wall": 50730.1} {"step": 21124, "train_loss": 3.278137683868408, "lr": 0.0001227044333173972, "tps": 27287, "wall": 50735.9} {"step": 21125, "train_loss": 3.351414442062378, "lr": 0.0001226883157807684, "tps": 27285, "wall": 50741.4} {"step": 21126, "train_loss": 3.3362174034118652, "lr": 0.00012267219934649173, "tps": 27283, "wall": 50747.0} {"step": 21127, "train_loss": 3.2621614933013916, "lr": 0.00012265608401474962, "tps": 27282, "wall": 50752.6} {"step": 21128, "train_loss": 3.2777259349823, "lr": 0.00012263996978572461, "tps": 27280, "wall": 50758.2} {"step": 21129, "train_loss": 3.347264051437378, "lr": 0.00012262385665959933, "tps": 27278, "wall": 50763.9} {"step": 21130, "train_loss": 3.3103950023651123, "lr": 0.0001226077446365562, "tps": 27277, "wall": 50769.4} {"step": 21131, "train_loss": 3.171680450439453, "lr": 0.0001225916337167779, "tps": 27275, "wall": 50775.1} {"step": 21132, "train_loss": 3.3364334106445312, "lr": 0.00012257552390044683, "tps": 27273, "wall": 50780.6} {"step": 21133, "train_loss": 3.3028788566589355, "lr": 0.00012255941518774546, "tps": 27271, "wall": 50786.2} {"step": 21134, "train_loss": 3.196950674057007, "lr": 0.00012254330757885631, "tps": 27270, "wall": 50791.8} {"step": 21135, "train_loss": 3.3157541751861572, "lr": 0.00012252720107396188, "tps": 27268, "wall": 50797.5} {"step": 21136, "train_loss": 3.3349599838256836, "lr": 0.00012251109567324453, "tps": 27266, "wall": 50803.1} {"step": 21137, "train_loss": 3.3296141624450684, "lr": 0.00012249499137688682, "tps": 27264, "wall": 50808.7} {"step": 21138, "train_loss": 3.3521389961242676, "lr": 0.00012247888818507115, "tps": 27263, "wall": 50814.4} {"step": 21139, "train_loss": 3.270203113555908, "lr": 0.0001224627860979798, "tps": 27261, "wall": 50820.0} {"step": 21140, "train_loss": 3.3297111988067627, "lr": 0.00012244668511579538, "tps": 27259, "wall": 50825.6} {"step": 21141, "train_loss": 3.263418197631836, "lr": 0.00012243058523870017, "tps": 27258, "wall": 50831.2} {"step": 21142, "train_loss": 3.259408950805664, "lr": 0.0001224144864668765, "tps": 27256, "wall": 50836.8} {"step": 21143, "train_loss": 3.260531187057495, "lr": 0.00012239838880050692, "tps": 27254, "wall": 50842.4} {"step": 21144, "train_loss": 3.3162426948547363, "lr": 0.00012238229223977362, "tps": 27252, "wall": 50848.0} {"step": 21145, "train_loss": 3.3049750328063965, "lr": 0.00012236619678485894, "tps": 27251, "wall": 50853.7} {"step": 21146, "train_loss": 3.295926809310913, "lr": 0.00012235010243594533, "tps": 27249, "wall": 50859.3} {"step": 21147, "train_loss": 3.2604122161865234, "lr": 0.000122334009193215, "tps": 27247, "wall": 50864.9} {"step": 21148, "train_loss": 3.221895933151245, "lr": 0.00012231791705685034, "tps": 27246, "wall": 50870.6} {"step": 21149, "train_loss": 3.3986637592315674, "lr": 0.00012230182602703362, "tps": 27244, "wall": 50876.2} {"step": 21150, "train_loss": 3.390782594680786, "lr": 0.000122285736103947, "tps": 27242, "wall": 50881.8} {"step": 21151, "train_loss": 3.3298661708831787, "lr": 0.00012226964728777296, "tps": 27240, "wall": 50887.4} {"step": 21152, "train_loss": 3.299572229385376, "lr": 0.00012225355957869359, "tps": 27239, "wall": 50893.0} {"step": 21153, "train_loss": 3.321579933166504, "lr": 0.00012223747297689116, "tps": 27237, "wall": 50898.6} {"step": 21154, "train_loss": 3.2969071865081787, "lr": 0.00012222138748254797, "tps": 27235, "wall": 50904.2} {"step": 21155, "train_loss": 3.3057875633239746, "lr": 0.00012220530309584618, "tps": 27234, "wall": 50909.8} {"step": 21156, "train_loss": 3.3876922130584717, "lr": 0.00012218921981696805, "tps": 27232, "wall": 50915.5} {"step": 21157, "train_loss": 3.3283557891845703, "lr": 0.00012217313764609572, "tps": 27230, "wall": 50921.2} {"step": 21158, "train_loss": 3.3349523544311523, "lr": 0.00012215705658341129, "tps": 27228, "wall": 50926.8} {"step": 21159, "train_loss": 3.3497660160064697, "lr": 0.00012214097662909709, "tps": 27227, "wall": 50932.4} {"step": 21160, "train_loss": 3.34609317779541, "lr": 0.0001221248977833352, "tps": 27225, "wall": 50938.1} {"step": 21161, "train_loss": 3.356255531311035, "lr": 0.0001221088200463077, "tps": 27223, "wall": 50943.7} {"step": 21162, "train_loss": 3.3651723861694336, "lr": 0.00012209274341819684, "tps": 27221, "wall": 50949.3} {"step": 21163, "train_loss": 3.2839956283569336, "lr": 0.0001220766678991847, "tps": 27220, "wall": 50954.9} {"step": 21164, "train_loss": 3.448301076889038, "lr": 0.0001220605934894533, "tps": 27218, "wall": 50960.5} {"step": 21165, "train_loss": 3.1948671340942383, "lr": 0.00012204452018918482, "tps": 27216, "wall": 50966.2} {"step": 21166, "train_loss": 3.3123841285705566, "lr": 0.00012202844799856135, "tps": 27215, "wall": 50971.8} {"step": 21167, "train_loss": 3.1935296058654785, "lr": 0.00012201237691776483, "tps": 27213, "wall": 50977.5} {"step": 21168, "train_loss": 3.3828907012939453, "lr": 0.00012199630694697748, "tps": 27211, "wall": 50983.1} {"step": 21169, "train_loss": 3.2272260189056396, "lr": 0.00012198023808638128, "tps": 27209, "wall": 50988.8} {"step": 21170, "train_loss": 3.2603254318237305, "lr": 0.00012196417033615817, "tps": 27208, "wall": 50994.4} {"step": 21171, "train_loss": 3.344548225402832, "lr": 0.00012194810369649032, "tps": 27206, "wall": 51000.0} {"step": 21172, "train_loss": 3.411644458770752, "lr": 0.00012193203816755958, "tps": 27204, "wall": 51005.6} {"step": 21173, "train_loss": 3.196624755859375, "lr": 0.00012191597374954806, "tps": 27203, "wall": 51011.2} {"step": 21174, "train_loss": 3.1838645935058594, "lr": 0.00012189991044263774, "tps": 27201, "wall": 51016.8} {"step": 21175, "train_loss": 3.3300654888153076, "lr": 0.00012188384824701047, "tps": 27199, "wall": 51022.4} {"step": 21176, "train_loss": 3.251556158065796, "lr": 0.00012186778716284832, "tps": 27197, "wall": 51028.1} {"step": 21177, "train_loss": 3.2894692420959473, "lr": 0.00012185172719033317, "tps": 27196, "wall": 51033.8} {"step": 21178, "train_loss": 3.3412790298461914, "lr": 0.00012183566832964694, "tps": 27194, "wall": 51039.4} {"step": 21179, "train_loss": 3.4049324989318848, "lr": 0.0001218196105809716, "tps": 27192, "wall": 51045.1} {"step": 21180, "train_loss": 3.280022621154785, "lr": 0.00012180355394448906, "tps": 27190, "wall": 51050.7} {"step": 21181, "train_loss": 3.35330867767334, "lr": 0.00012178749842038106, "tps": 27189, "wall": 51056.3} {"step": 21182, "train_loss": 3.3182942867279053, "lr": 0.0001217714440088297, "tps": 27187, "wall": 51061.9} {"step": 21183, "train_loss": 3.249124526977539, "lr": 0.00012175539071001671, "tps": 27185, "wall": 51067.5} {"step": 21184, "train_loss": 3.2629401683807373, "lr": 0.00012173933852412394, "tps": 27184, "wall": 51073.1} {"step": 21185, "train_loss": 3.196727752685547, "lr": 0.00012172328745133328, "tps": 27182, "wall": 51078.8} {"step": 21186, "train_loss": 3.3988876342773438, "lr": 0.00012170723749182653, "tps": 27180, "wall": 51084.4} {"step": 21187, "train_loss": 3.3208489418029785, "lr": 0.00012169118864578549, "tps": 27179, "wall": 51090.0} {"step": 21188, "train_loss": 3.2639353275299072, "lr": 0.00012167514091339203, "tps": 27177, "wall": 51095.7} {"step": 21189, "train_loss": 3.2695822715759277, "lr": 0.0001216590942948279, "tps": 27175, "wall": 51101.3} {"step": 21190, "train_loss": 3.2497000694274902, "lr": 0.0001216430487902748, "tps": 27173, "wall": 51106.9} {"step": 21191, "train_loss": 3.2042689323425293, "lr": 0.00012162700439991459, "tps": 27172, "wall": 51112.5} {"step": 21192, "train_loss": 3.1951282024383545, "lr": 0.00012161096112392898, "tps": 27170, "wall": 51118.2} {"step": 21193, "train_loss": 3.3239946365356445, "lr": 0.00012159491896249977, "tps": 27168, "wall": 51123.9} {"step": 21194, "train_loss": 3.289874792098999, "lr": 0.00012157887791580866, "tps": 27167, "wall": 51129.5} {"step": 21195, "train_loss": 3.2143590450286865, "lr": 0.00012156283798403728, "tps": 27165, "wall": 51135.1} {"step": 21196, "train_loss": 3.2211499214172363, "lr": 0.00012154679916736745, "tps": 27163, "wall": 51140.7} {"step": 21197, "train_loss": 3.195862054824829, "lr": 0.00012153076146598079, "tps": 27161, "wall": 51146.3} {"step": 21198, "train_loss": 3.254706382751465, "lr": 0.00012151472488005895, "tps": 27160, "wall": 51152.0} {"step": 21199, "train_loss": 3.302605152130127, "lr": 0.00012149868940978369, "tps": 27158, "wall": 51157.7} {"step": 21200, "train_loss": 3.391529083251953, "lr": 0.0001214826550553366, "tps": 27156, "wall": 51163.3} {"step": 21201, "train_loss": 3.3096463680267334, "lr": 0.00012146662181689927, "tps": 27155, "wall": 51168.9} {"step": 21202, "train_loss": 3.3202342987060547, "lr": 0.00012145058969465344, "tps": 27153, "wall": 51174.5} {"step": 21203, "train_loss": 3.2787277698516846, "lr": 0.00012143455868878064, "tps": 27151, "wall": 51180.1} {"step": 21204, "train_loss": 3.18145489692688, "lr": 0.00012141852879946248, "tps": 27149, "wall": 51185.7} {"step": 21205, "train_loss": 3.2482378482818604, "lr": 0.00012140250002688058, "tps": 27148, "wall": 51191.4} {"step": 21206, "train_loss": 3.4043354988098145, "lr": 0.0001213864723712165, "tps": 27146, "wall": 51197.0} {"step": 21207, "train_loss": 3.3695101737976074, "lr": 0.00012137044583265172, "tps": 27144, "wall": 51202.7} {"step": 21208, "train_loss": 3.2691874504089355, "lr": 0.00012135442041136795, "tps": 27143, "wall": 51208.3} {"step": 21209, "train_loss": 3.303598165512085, "lr": 0.00012133839610754658, "tps": 27141, "wall": 51213.9} {"step": 21210, "train_loss": 3.1766021251678467, "lr": 0.00012132237292136926, "tps": 27139, "wall": 51219.5} {"step": 21211, "train_loss": 3.2921571731567383, "lr": 0.00012130635085301742, "tps": 27138, "wall": 51225.1} {"step": 21212, "train_loss": 3.3398680686950684, "lr": 0.00012129032990267253, "tps": 27136, "wall": 51230.8} {"step": 21213, "train_loss": 3.299114942550659, "lr": 0.00012127431007051617, "tps": 27134, "wall": 51236.4} {"step": 21214, "train_loss": 3.302705764770508, "lr": 0.0001212582913567298, "tps": 27132, "wall": 51242.1} {"step": 21215, "train_loss": 3.2904648780822754, "lr": 0.00012124227376149474, "tps": 27131, "wall": 51247.7} {"step": 21216, "train_loss": 3.3035974502563477, "lr": 0.00012122625728499264, "tps": 27129, "wall": 51253.4} {"step": 21217, "train_loss": 3.302748203277588, "lr": 0.00012121024192740483, "tps": 27127, "wall": 51259.0} {"step": 21218, "train_loss": 3.3350677490234375, "lr": 0.00012119422768891269, "tps": 27126, "wall": 51264.7} {"step": 21219, "train_loss": 3.237851858139038, "lr": 0.00012117821456969771, "tps": 27124, "wall": 51270.3} {"step": 21220, "train_loss": 3.2348849773406982, "lr": 0.0001211622025699413, "tps": 27122, "wall": 51276.0} {"step": 21221, "train_loss": 3.2666118144989014, "lr": 0.00012114619168982473, "tps": 27120, "wall": 51281.6} {"step": 21222, "train_loss": 3.3427982330322266, "lr": 0.00012113018192952953, "tps": 27119, "wall": 51287.2} {"step": 21223, "train_loss": 3.255563735961914, "lr": 0.00012111417328923696, "tps": 27117, "wall": 51292.8} {"step": 21224, "train_loss": 3.2974178791046143, "lr": 0.00012109816576912831, "tps": 27115, "wall": 51298.5} {"step": 21225, "train_loss": 3.3523292541503906, "lr": 0.00012108215936938507, "tps": 27114, "wall": 51304.1} {"step": 21226, "train_loss": 3.2756142616271973, "lr": 0.00012106615409018843, "tps": 27112, "wall": 51309.7} {"step": 21227, "train_loss": 3.2344675064086914, "lr": 0.00012105014993171979, "tps": 27110, "wall": 51315.4} {"step": 21228, "train_loss": 3.4141011238098145, "lr": 0.00012103414689416039, "tps": 27109, "wall": 51321.1} {"step": 21229, "train_loss": 3.2632410526275635, "lr": 0.00012101814497769149, "tps": 27107, "wall": 51326.7} {"step": 21230, "train_loss": 3.3828744888305664, "lr": 0.0001210021441824945, "tps": 27105, "wall": 51332.3} {"step": 21231, "train_loss": 3.36922025680542, "lr": 0.0001209861445087505, "tps": 27103, "wall": 51338.1} {"step": 21232, "train_loss": 3.2283778190612793, "lr": 0.00012097014595664078, "tps": 27102, "wall": 51343.8} {"step": 21233, "train_loss": 3.254915714263916, "lr": 0.00012095414852634668, "tps": 27100, "wall": 51349.4} {"step": 21234, "train_loss": 3.336564064025879, "lr": 0.00012093815221804932, "tps": 27098, "wall": 51355.1} {"step": 21235, "train_loss": 3.2983572483062744, "lr": 0.00012092215703192988, "tps": 27097, "wall": 51360.7} {"step": 21236, "train_loss": 3.2935006618499756, "lr": 0.00012090616296816968, "tps": 27095, "wall": 51366.4} {"step": 21237, "train_loss": 3.283592700958252, "lr": 0.0001208901700269498, "tps": 27093, "wall": 51372.1} {"step": 21238, "train_loss": 3.4033315181732178, "lr": 0.0001208741782084514, "tps": 27091, "wall": 51377.7} {"step": 21239, "train_loss": 3.3134312629699707, "lr": 0.00012085818751285571, "tps": 27090, "wall": 51383.3} {"step": 21240, "train_loss": 3.183093547821045, "lr": 0.00012084219794034386, "tps": 27088, "wall": 51389.0} {"step": 21241, "train_loss": 3.218780040740967, "lr": 0.00012082620949109689, "tps": 27086, "wall": 51394.7} {"step": 21242, "train_loss": 3.296954393386841, "lr": 0.00012081022216529602, "tps": 27085, "wall": 51400.4} {"step": 21243, "train_loss": 3.3898513317108154, "lr": 0.00012079423596312234, "tps": 27083, "wall": 51406.1} {"step": 21244, "train_loss": 3.243360757827759, "lr": 0.00012077825088475685, "tps": 27081, "wall": 51411.8} {"step": 21245, "train_loss": 3.4612715244293213, "lr": 0.00012076226693038077, "tps": 27079, "wall": 51417.5} {"step": 21246, "train_loss": 3.3815016746520996, "lr": 0.00012074628410017505, "tps": 27078, "wall": 51423.2} {"step": 21247, "train_loss": 3.1831471920013428, "lr": 0.00012073030239432084, "tps": 27076, "wall": 51428.9} {"step": 21248, "train_loss": 3.161924123764038, "lr": 0.00012071432181299914, "tps": 27074, "wall": 51434.6} {"step": 21249, "train_loss": 3.374181032180786, "lr": 0.0001206983423563909, "tps": 27072, "wall": 51440.3} {"step": 21250, "train_loss": 3.3195431232452393, "lr": 0.00012068236402467727, "tps": 27071, "wall": 51446.0} {"step": 21251, "train_loss": 3.244384765625, "lr": 0.00012066638681803922, "tps": 27069, "wall": 51451.6} {"step": 21252, "train_loss": 3.3292338848114014, "lr": 0.00012065041073665764, "tps": 27067, "wall": 51457.6} {"step": 21253, "train_loss": 3.314756393432617, "lr": 0.00012063443578071365, "tps": 27065, "wall": 51463.3} {"step": 21254, "train_loss": 3.3257627487182617, "lr": 0.0001206184619503881, "tps": 27064, "wall": 51469.0} {"step": 21255, "train_loss": 3.3394715785980225, "lr": 0.000120602489245862, "tps": 27062, "wall": 51474.7} {"step": 21256, "train_loss": 3.3740601539611816, "lr": 0.0001205865176673163, "tps": 27060, "wall": 51480.3} {"step": 21257, "train_loss": 3.3934764862060547, "lr": 0.0001205705472149319, "tps": 27059, "wall": 51486.0} {"step": 21258, "train_loss": 3.2797906398773193, "lr": 0.00012055457788888968, "tps": 27057, "wall": 51491.7} {"step": 21259, "train_loss": 3.326763391494751, "lr": 0.00012053860968937064, "tps": 27055, "wall": 51497.4} {"step": 21260, "train_loss": 3.344557046890259, "lr": 0.00012052264261655559, "tps": 27053, "wall": 51503.1} {"step": 21261, "train_loss": 3.269716739654541, "lr": 0.00012050667667062536, "tps": 27052, "wall": 51508.8} {"step": 21262, "train_loss": 3.341154098510742, "lr": 0.00012049071185176098, "tps": 27050, "wall": 51514.7} {"step": 21263, "train_loss": 3.2902169227600098, "lr": 0.0001204747481601431, "tps": 27048, "wall": 51520.3} {"step": 21264, "train_loss": 3.2343015670776367, "lr": 0.00012045878559595276, "tps": 27046, "wall": 51526.0} {"step": 21265, "train_loss": 3.303783655166626, "lr": 0.00012044282415937064, "tps": 27045, "wall": 51531.8} {"step": 21266, "train_loss": 3.3583664894104004, "lr": 0.00012042686385057758, "tps": 27043, "wall": 51537.5} {"step": 21267, "train_loss": 3.286829948425293, "lr": 0.0001204109046697544, "tps": 27041, "wall": 51543.2} {"step": 21268, "train_loss": 3.2190794944763184, "lr": 0.00012039494661708191, "tps": 27040, "wall": 51548.9} {"step": 21269, "train_loss": 3.212655544281006, "lr": 0.0001203789896927408, "tps": 27038, "wall": 51554.6} {"step": 21270, "train_loss": 3.275930643081665, "lr": 0.00012036303389691193, "tps": 27036, "wall": 51560.2} {"step": 21271, "train_loss": 3.323018789291382, "lr": 0.00012034707922977601, "tps": 27034, "wall": 51565.9} {"step": 21272, "train_loss": 3.3858730792999268, "lr": 0.00012033112569151366, "tps": 27033, "wall": 51571.7} {"step": 21273, "train_loss": 3.373920440673828, "lr": 0.00012031517328230584, "tps": 27031, "wall": 51577.5} {"step": 21274, "train_loss": 3.246206521987915, "lr": 0.0001202992220023331, "tps": 27029, "wall": 51583.1} {"step": 21275, "train_loss": 3.2865233421325684, "lr": 0.00012028327185177608, "tps": 27028, "wall": 51588.9} {"step": 21276, "train_loss": 3.2709553241729736, "lr": 0.00012026732283081565, "tps": 27026, "wall": 51594.6} {"step": 21277, "train_loss": 3.3449654579162598, "lr": 0.00012025137493963239, "tps": 27024, "wall": 51600.3} {"step": 21278, "train_loss": 3.376823902130127, "lr": 0.00012023542817840688, "tps": 27022, "wall": 51606.0} {"step": 21279, "train_loss": 3.337801456451416, "lr": 0.00012021948254731987, "tps": 27021, "wall": 51611.8} {"step": 21280, "train_loss": 3.342507839202881, "lr": 0.00012020353804655193, "tps": 27019, "wall": 51617.5} {"step": 21281, "train_loss": 3.303420066833496, "lr": 0.00012018759467628373, "tps": 27017, "wall": 51623.2} {"step": 21282, "train_loss": 3.184934616088867, "lr": 0.00012017165243669591, "tps": 27015, "wall": 51628.9} {"step": 21283, "train_loss": 3.3458595275878906, "lr": 0.00012015571132796894, "tps": 27014, "wall": 51634.7} {"step": 21284, "train_loss": 3.229841947555542, "lr": 0.00012013977135028351, "tps": 27012, "wall": 51640.4} {"step": 21285, "train_loss": 3.29854679107666, "lr": 0.00012012383250382015, "tps": 27010, "wall": 51646.1} {"step": 21286, "train_loss": 3.3064162731170654, "lr": 0.00012010789478875937, "tps": 27009, "wall": 51651.8} {"step": 21287, "train_loss": 3.3816094398498535, "lr": 0.00012009195820528183, "tps": 27007, "wall": 51657.5} {"step": 21288, "train_loss": 3.237823724746704, "lr": 0.000120076022753568, "tps": 27005, "wall": 51663.3} {"step": 21289, "train_loss": 3.270991802215576, "lr": 0.0001200600884337983, "tps": 27003, "wall": 51669.0} {"step": 21290, "train_loss": 3.22445011138916, "lr": 0.0001200441552461534, "tps": 27002, "wall": 51674.7} {"step": 21291, "train_loss": 3.3560149669647217, "lr": 0.00012002822319081373, "tps": 27000, "wall": 51680.4} {"step": 21292, "train_loss": 3.296949863433838, "lr": 0.00012001229226795967, "tps": 26998, "wall": 51686.2} {"step": 21293, "train_loss": 3.270174980163574, "lr": 0.00011999636247777186, "tps": 26996, "wall": 51691.9} {"step": 21294, "train_loss": 3.3215508460998535, "lr": 0.00011998043382043066, "tps": 26995, "wall": 51697.7} {"step": 21295, "train_loss": 3.330425262451172, "lr": 0.00011996450629611645, "tps": 26993, "wall": 51703.4} {"step": 21296, "train_loss": 3.3279786109924316, "lr": 0.00011994857990500978, "tps": 26991, "wall": 51709.0} {"step": 21297, "train_loss": 3.266206979751587, "lr": 0.00011993265464729102, "tps": 26990, "wall": 51714.7} {"step": 21298, "train_loss": 3.2251381874084473, "lr": 0.0001199167305231405, "tps": 26988, "wall": 51720.4} {"step": 21299, "train_loss": 3.312044620513916, "lr": 0.00011990080753273872, "tps": 26986, "wall": 51726.2} {"step": 21300, "train_loss": 3.3500401973724365, "lr": 0.00011988488567626595, "tps": 26984, "wall": 51731.8} {"step": 21301, "train_loss": 3.2928109169006348, "lr": 0.0001198689649539027, "tps": 26983, "wall": 51737.5} {"step": 21302, "train_loss": 3.2752068042755127, "lr": 0.00011985304536582918, "tps": 26981, "wall": 51743.2} {"step": 21303, "train_loss": 3.2778286933898926, "lr": 0.00011983712691222575, "tps": 26979, "wall": 51748.9} {"step": 21304, "train_loss": 3.299140453338623, "lr": 0.00011982120959327281, "tps": 26978, "wall": 51754.7} {"step": 21305, "train_loss": 3.2957346439361572, "lr": 0.00011980529340915065, "tps": 26976, "wall": 51760.4} {"step": 21306, "train_loss": 3.3748250007629395, "lr": 0.0001197893783600395, "tps": 26974, "wall": 51766.1} {"step": 21307, "train_loss": 3.359771490097046, "lr": 0.0001197734644461197, "tps": 26972, "wall": 51771.8} {"step": 21308, "train_loss": 3.321727752685547, "lr": 0.00011975755166757157, "tps": 26971, "wall": 51777.5} {"step": 21309, "train_loss": 3.2149171829223633, "lr": 0.00011974164002457521, "tps": 26969, "wall": 51783.2} {"step": 21310, "train_loss": 3.3159375190734863, "lr": 0.00011972572951731104, "tps": 26967, "wall": 51788.9} {"step": 21311, "train_loss": 3.3962035179138184, "lr": 0.00011970982014595929, "tps": 26966, "wall": 51794.6} {"step": 21312, "train_loss": 3.2935633659362793, "lr": 0.00011969391191070001, "tps": 26964, "wall": 51800.3} {"step": 21313, "train_loss": 3.3095803260803223, "lr": 0.00011967800481171361, "tps": 26962, "wall": 51806.0} {"step": 21314, "train_loss": 3.339339017868042, "lr": 0.00011966209884918016, "tps": 26961, "wall": 51811.6} {"step": 21315, "train_loss": 3.3158085346221924, "lr": 0.00011964619402327985, "tps": 26959, "wall": 51817.4} {"step": 21316, "train_loss": 3.2682557106018066, "lr": 0.00011963029033419296, "tps": 26957, "wall": 51823.1} {"step": 21317, "train_loss": 3.304006814956665, "lr": 0.00011961438778209948, "tps": 26955, "wall": 51828.8} {"step": 21318, "train_loss": 3.2644925117492676, "lr": 0.00011959848636717971, "tps": 26954, "wall": 51834.5} {"step": 21319, "train_loss": 3.258523941040039, "lr": 0.00011958258608961373, "tps": 26952, "wall": 51840.2} {"step": 21320, "train_loss": 3.341609239578247, "lr": 0.00011956668694958157, "tps": 26950, "wall": 51845.8} {"step": 21321, "train_loss": 3.187291383743286, "lr": 0.00011955078894726348, "tps": 26949, "wall": 51851.5} {"step": 21322, "train_loss": 3.2537758350372314, "lr": 0.0001195348920828395, "tps": 26947, "wall": 51857.3} {"step": 21323, "train_loss": 3.303088665008545, "lr": 0.00011951899635648964, "tps": 26945, "wall": 51863.0} {"step": 21324, "train_loss": 3.388056516647339, "lr": 0.00011950310176839407, "tps": 26944, "wall": 51868.7} {"step": 21325, "train_loss": 3.38704252243042, "lr": 0.00011948720831873283, "tps": 26942, "wall": 51874.6} {"step": 21326, "train_loss": 3.2895658016204834, "lr": 0.0001194713160076859, "tps": 26940, "wall": 51880.2} {"step": 21327, "train_loss": 3.3306853771209717, "lr": 0.00011945542483543335, "tps": 26938, "wall": 51885.9} {"step": 21328, "train_loss": 3.3286285400390625, "lr": 0.00011943953480215512, "tps": 26937, "wall": 51891.6} {"step": 21329, "train_loss": 3.372246265411377, "lr": 0.00011942364590803135, "tps": 26935, "wall": 51897.3} {"step": 21330, "train_loss": 3.3334803581237793, "lr": 0.00011940775815324195, "tps": 26933, "wall": 51903.0} {"step": 21331, "train_loss": 3.255162477493286, "lr": 0.00011939187153796685, "tps": 26932, "wall": 51908.7} {"step": 21332, "train_loss": 3.281242847442627, "lr": 0.00011937598606238614, "tps": 26930, "wall": 51914.3} {"step": 21333, "train_loss": 3.2804129123687744, "lr": 0.00011936010172667969, "tps": 26928, "wall": 51920.0} {"step": 21334, "train_loss": 3.312105894088745, "lr": 0.0001193442185310274, "tps": 26927, "wall": 51925.8} {"step": 21335, "train_loss": 3.363222122192383, "lr": 0.0001193283364756093, "tps": 26925, "wall": 51931.5} {"step": 21336, "train_loss": 3.202577590942383, "lr": 0.00011931245556060528, "tps": 26923, "wall": 51937.3} {"step": 21337, "train_loss": 3.2647173404693604, "lr": 0.00011929657578619514, "tps": 26921, "wall": 51943.0} {"step": 21338, "train_loss": 3.2551982402801514, "lr": 0.00011928069715255885, "tps": 26920, "wall": 51948.8} {"step": 21339, "train_loss": 3.3660776615142822, "lr": 0.00011926481965987632, "tps": 26918, "wall": 51954.4} {"step": 21340, "train_loss": 3.3401665687561035, "lr": 0.0001192489433083273, "tps": 26916, "wall": 51960.2} {"step": 21341, "train_loss": 3.3733763694763184, "lr": 0.00011923306809809176, "tps": 26915, "wall": 51965.9} {"step": 21342, "train_loss": 3.2945685386657715, "lr": 0.00011921719402934938, "tps": 26913, "wall": 51971.6} {"step": 21343, "train_loss": 3.2805728912353516, "lr": 0.0001192013211022802, "tps": 26911, "wall": 51977.3} {"step": 21344, "train_loss": 3.407918930053711, "lr": 0.00011918544931706385, "tps": 26910, "wall": 51983.0} {"step": 21345, "train_loss": 3.312033176422119, "lr": 0.00011916957867388015, "tps": 26908, "wall": 51988.8} {"step": 21346, "train_loss": 3.316122055053711, "lr": 0.000119153709172909, "tps": 26906, "wall": 51994.6} {"step": 21347, "train_loss": 3.3484439849853516, "lr": 0.00011913784081433003, "tps": 26904, "wall": 52000.3} {"step": 21348, "train_loss": 3.296203136444092, "lr": 0.00011912197359832304, "tps": 26903, "wall": 52006.0} {"step": 21349, "train_loss": 3.3311679363250732, "lr": 0.00011910610752506785, "tps": 26901, "wall": 52011.7} {"step": 21350, "train_loss": 3.2450406551361084, "lr": 0.00011909024259474412, "tps": 26899, "wall": 52017.5} {"step": 21351, "train_loss": 3.321536064147949, "lr": 0.00011907437880753152, "tps": 26898, "wall": 52023.2} {"step": 21352, "train_loss": 3.367769241333008, "lr": 0.00011905851616360988, "tps": 26896, "wall": 52028.9} {"step": 21353, "train_loss": 3.344388008117676, "lr": 0.00011904265466315885, "tps": 26894, "wall": 52034.6} {"step": 21354, "train_loss": 3.289966106414795, "lr": 0.00011902679430635799, "tps": 26893, "wall": 52040.3} {"step": 21355, "train_loss": 3.2170395851135254, "lr": 0.00011901093509338715, "tps": 26891, "wall": 52046.1} {"step": 21356, "train_loss": 3.17443585395813, "lr": 0.0001189950770244259, "tps": 26889, "wall": 52051.8} {"step": 21357, "train_loss": 3.2608418464660645, "lr": 0.00011897922009965381, "tps": 26887, "wall": 52057.6} {"step": 21358, "train_loss": 3.4794790744781494, "lr": 0.00011896336431925066, "tps": 26886, "wall": 52063.3} {"step": 21359, "train_loss": 3.336550712585449, "lr": 0.0001189475096833959, "tps": 26884, "wall": 52069.0} {"step": 21360, "train_loss": 3.3050448894500732, "lr": 0.00011893165619226931, "tps": 26882, "wall": 52074.7} {"step": 21361, "train_loss": 3.3314380645751953, "lr": 0.00011891580384605036, "tps": 26881, "wall": 52080.5} {"step": 21362, "train_loss": 3.3050994873046875, "lr": 0.0001188999526449186, "tps": 26879, "wall": 52086.2} {"step": 21363, "train_loss": 3.278881072998047, "lr": 0.00011888410258905369, "tps": 26877, "wall": 52091.9} {"step": 21364, "train_loss": 3.3453335762023926, "lr": 0.00011886825367863516, "tps": 26876, "wall": 52097.6} {"step": 21365, "train_loss": 3.2342939376831055, "lr": 0.00011885240591384246, "tps": 26874, "wall": 52103.3} {"step": 21366, "train_loss": 3.3150854110717773, "lr": 0.00011883655929485525, "tps": 26872, "wall": 52109.0} {"step": 21367, "train_loss": 3.340308666229248, "lr": 0.00011882071382185294, "tps": 26870, "wall": 52114.8} {"step": 21368, "train_loss": 3.2707643508911133, "lr": 0.00011880486949501502, "tps": 26869, "wall": 52120.5} {"step": 21369, "train_loss": 3.259244441986084, "lr": 0.00011878902631452104, "tps": 26867, "wall": 52126.2} {"step": 21370, "train_loss": 3.2545595169067383, "lr": 0.00011877318428055049, "tps": 26865, "wall": 52131.9} {"step": 21371, "train_loss": 3.2425918579101562, "lr": 0.00011875734339328268, "tps": 26864, "wall": 52137.7} {"step": 21372, "train_loss": 3.2805533409118652, "lr": 0.00011874150365289724, "tps": 26862, "wall": 52143.4} {"step": 21373, "train_loss": 3.2967066764831543, "lr": 0.00011872566505957355, "tps": 26860, "wall": 52149.2} {"step": 21374, "train_loss": 3.3571887016296387, "lr": 0.00011870982761349091, "tps": 26859, "wall": 52154.9} {"step": 21375, "train_loss": 3.3172216415405273, "lr": 0.0001186939913148289, "tps": 26857, "wall": 52160.6} {"step": 21376, "train_loss": 3.2311923503875732, "lr": 0.00011867815616376683, "tps": 26855, "wall": 52166.4} {"step": 21377, "train_loss": 3.479619026184082, "lr": 0.00011866232216048402, "tps": 26854, "wall": 52172.0} {"step": 21378, "train_loss": 3.3419885635375977, "lr": 0.00011864648930516, "tps": 26852, "wall": 52177.8} {"step": 21379, "train_loss": 3.233302593231201, "lr": 0.00011863065759797394, "tps": 26850, "wall": 52183.5} {"step": 21380, "train_loss": 3.3646740913391113, "lr": 0.00011861482703910533, "tps": 26848, "wall": 52189.1} {"step": 21381, "train_loss": 3.3037168979644775, "lr": 0.00011859899762873348, "tps": 26847, "wall": 52194.8} {"step": 21382, "train_loss": 3.2763943672180176, "lr": 0.00011858316936703759, "tps": 26845, "wall": 52200.5} {"step": 21383, "train_loss": 3.2588937282562256, "lr": 0.00011856734225419707, "tps": 26844, "wall": 52206.1} {"step": 21384, "train_loss": 3.317504644393921, "lr": 0.00011855151629039123, "tps": 26842, "wall": 52211.8} {"step": 21385, "train_loss": 3.3440582752227783, "lr": 0.00011853569147579924, "tps": 26840, "wall": 52217.5} {"step": 21386, "train_loss": 3.335911273956299, "lr": 0.00011851986781060047, "tps": 26838, "wall": 52223.2} {"step": 21387, "train_loss": 3.2243869304656982, "lr": 0.00011850404529497417, "tps": 26837, "wall": 52228.9} {"step": 21388, "train_loss": 3.3658103942871094, "lr": 0.00011848822392909942, "tps": 26835, "wall": 52234.6} {"step": 21389, "train_loss": 3.295182704925537, "lr": 0.00011847240371315562, "tps": 26833, "wall": 52240.3} {"step": 21390, "train_loss": 3.2294793128967285, "lr": 0.00011845658464732196, "tps": 26832, "wall": 52246.0} {"step": 21391, "train_loss": 3.3597850799560547, "lr": 0.00011844076673177753, "tps": 26830, "wall": 52251.6} {"step": 21392, "train_loss": 3.2458319664001465, "lr": 0.00011842494996670163, "tps": 26829, "wall": 52257.3} {"step": 21393, "train_loss": 3.2563600540161133, "lr": 0.00011840913435227343, "tps": 26827, "wall": 52262.9} {"step": 21394, "train_loss": 3.3341941833496094, "lr": 0.00011839331988867198, "tps": 26825, "wall": 52268.6} {"step": 21395, "train_loss": 3.1724300384521484, "lr": 0.00011837750657607653, "tps": 26824, "wall": 52274.3} {"step": 21396, "train_loss": 3.3201634883880615, "lr": 0.00011836169441466611, "tps": 26822, "wall": 52280.0} {"step": 21397, "train_loss": 3.324984073638916, "lr": 0.00011834588340462002, "tps": 26820, "wall": 52285.7} {"step": 21398, "train_loss": 3.2734994888305664, "lr": 0.00011833007354611725, "tps": 26819, "wall": 52291.4} {"step": 21399, "train_loss": 3.244771957397461, "lr": 0.00011831426483933685, "tps": 26817, "wall": 52297.1} {"step": 21400, "train_loss": 3.352252960205078, "lr": 0.000118298457284458, "tps": 26815, "wall": 52302.8} {"step": 21401, "train_loss": 3.2812089920043945, "lr": 0.00011828265088165976, "tps": 26814, "wall": 52308.5} {"step": 21402, "train_loss": 3.2296953201293945, "lr": 0.00011826684563112107, "tps": 26812, "wall": 52314.1} {"step": 21403, "train_loss": 3.2015559673309326, "lr": 0.00011825104153302114, "tps": 26810, "wall": 52319.8} {"step": 21404, "train_loss": 3.3230128288269043, "lr": 0.0001182352385875389, "tps": 26809, "wall": 52325.5} {"step": 21405, "train_loss": 3.2849931716918945, "lr": 0.0001182194367948533, "tps": 26807, "wall": 52331.1} {"step": 21406, "train_loss": 3.3609840869903564, "lr": 0.00011820363615514352, "tps": 26805, "wall": 52336.8} {"step": 21407, "train_loss": 3.3218445777893066, "lr": 0.00011818783666858841, "tps": 26804, "wall": 52342.5} {"step": 21408, "train_loss": 3.1231143474578857, "lr": 0.00011817203833536699, "tps": 26802, "wall": 52348.1} {"step": 21409, "train_loss": 3.2059485912323, "lr": 0.00011815624115565827, "tps": 26800, "wall": 52353.9} {"step": 21410, "train_loss": 3.331000804901123, "lr": 0.00011814044512964116, "tps": 26799, "wall": 52359.5} {"step": 21411, "train_loss": 3.2128565311431885, "lr": 0.0001181246502574945, "tps": 26797, "wall": 52365.2} {"step": 21412, "train_loss": 3.3299689292907715, "lr": 0.00011810885653939742, "tps": 26795, "wall": 52370.9} {"step": 21413, "train_loss": 3.281463861465454, "lr": 0.00011809306397552866, "tps": 26794, "wall": 52376.6} {"step": 21414, "train_loss": 3.226717710494995, "lr": 0.00011807727256606722, "tps": 26792, "wall": 52382.2} {"step": 21415, "train_loss": 3.2620291709899902, "lr": 0.00011806148231119198, "tps": 26790, "wall": 52387.9} {"step": 21416, "train_loss": 3.281245470046997, "lr": 0.0001180456932110817, "tps": 26789, "wall": 52393.6} {"step": 21417, "train_loss": 3.405040740966797, "lr": 0.0001180299052659154, "tps": 26787, "wall": 52399.3} {"step": 21418, "train_loss": 3.3309741020202637, "lr": 0.00011801411847587185, "tps": 26785, "wall": 52404.9} {"step": 21419, "train_loss": 3.319300889968872, "lr": 0.00011799833284112982, "tps": 26784, "wall": 52410.6} {"step": 21420, "train_loss": 3.3770852088928223, "lr": 0.00011798254836186827, "tps": 26782, "wall": 52416.4} {"step": 21421, "train_loss": 3.2418313026428223, "lr": 0.0001179667650382659, "tps": 26780, "wall": 52422.1} {"step": 21422, "train_loss": 3.2650413513183594, "lr": 0.00011795098287050148, "tps": 26779, "wall": 52427.8} {"step": 21423, "train_loss": 3.3166561126708984, "lr": 0.00011793520185875389, "tps": 26777, "wall": 52433.4} {"step": 21424, "train_loss": 3.2571544647216797, "lr": 0.00011791942200320187, "tps": 26775, "wall": 52439.2} {"step": 21425, "train_loss": 3.237978458404541, "lr": 0.00011790364330402413, "tps": 26774, "wall": 52444.8} {"step": 21426, "train_loss": 3.315615177154541, "lr": 0.00011788786576139949, "tps": 26772, "wall": 52450.6} {"step": 21427, "train_loss": 3.323051929473877, "lr": 0.00011787208937550663, "tps": 26770, "wall": 52456.2} {"step": 21428, "train_loss": 3.2857046127319336, "lr": 0.00011785631414652419, "tps": 26769, "wall": 52461.9} {"step": 21429, "train_loss": 3.307392120361328, "lr": 0.00011784054007463101, "tps": 26767, "wall": 52467.5} {"step": 21430, "train_loss": 3.2279977798461914, "lr": 0.00011782476716000572, "tps": 26766, "wall": 52473.4} {"step": 21431, "train_loss": 3.2344071865081787, "lr": 0.00011780899540282693, "tps": 26764, "wall": 52479.1} {"step": 21432, "train_loss": 3.279804229736328, "lr": 0.00011779322480327346, "tps": 26762, "wall": 52484.8} {"step": 21433, "train_loss": 3.320742607116699, "lr": 0.00011777745536152376, "tps": 26761, "wall": 52490.5} {"step": 21434, "train_loss": 3.266979217529297, "lr": 0.00011776168707775668, "tps": 26759, "wall": 52496.2} {"step": 21435, "train_loss": 3.284515142440796, "lr": 0.00011774591995215072, "tps": 26757, "wall": 52501.8} {"step": 21436, "train_loss": 3.2593069076538086, "lr": 0.00011773015398488445, "tps": 26756, "wall": 52507.6} {"step": 21437, "train_loss": 3.2817564010620117, "lr": 0.0001177143891761366, "tps": 26754, "wall": 52513.3} {"step": 21438, "train_loss": 3.2543013095855713, "lr": 0.00011769862552608568, "tps": 26752, "wall": 52518.9} {"step": 21439, "train_loss": 3.2954986095428467, "lr": 0.00011768286303491018, "tps": 26751, "wall": 52524.6} {"step": 21440, "train_loss": 3.343132972717285, "lr": 0.00011766710170278883, "tps": 26749, "wall": 52530.3} {"step": 21441, "train_loss": 3.3896660804748535, "lr": 0.0001176513415299001, "tps": 26747, "wall": 52536.1} {"step": 21442, "train_loss": 3.313918113708496, "lr": 0.00011763558251642242, "tps": 26746, "wall": 52541.7} {"step": 21443, "train_loss": 3.2848925590515137, "lr": 0.00011761982466253445, "tps": 26744, "wall": 52547.4} {"step": 21444, "train_loss": 3.22676944732666, "lr": 0.00011760406796841468, "tps": 26742, "wall": 52553.1} {"step": 21445, "train_loss": 3.3953404426574707, "lr": 0.00011758831243424148, "tps": 26741, "wall": 52558.8} {"step": 21446, "train_loss": 3.2916293144226074, "lr": 0.0001175725580601935, "tps": 26739, "wall": 52564.5} {"step": 21447, "train_loss": 3.277451276779175, "lr": 0.00011755680484644911, "tps": 26737, "wall": 52570.2} {"step": 21448, "train_loss": 3.1954245567321777, "lr": 0.00011754105279318672, "tps": 26736, "wall": 52575.9} {"step": 21449, "train_loss": 3.2065422534942627, "lr": 0.0001175253019005849, "tps": 26734, "wall": 52581.6} {"step": 21450, "train_loss": 3.2800300121307373, "lr": 0.00011750955216882191, "tps": 26732, "wall": 52587.3} {"step": 21451, "train_loss": 3.270732879638672, "lr": 0.00011749380359807634, "tps": 26731, "wall": 52593.1} {"step": 21452, "train_loss": 3.3144609928131104, "lr": 0.00011747805618852652, "tps": 26729, "wall": 52598.8} {"step": 21453, "train_loss": 3.3425564765930176, "lr": 0.00011746230994035075, "tps": 26727, "wall": 52604.5} {"step": 21454, "train_loss": 3.169508934020996, "lr": 0.00011744656485372754, "tps": 26726, "wall": 52610.2} {"step": 21455, "train_loss": 3.334376335144043, "lr": 0.0001174308209288352, "tps": 26724, "wall": 52615.8} {"step": 21456, "train_loss": 3.2990663051605225, "lr": 0.00011741507816585198, "tps": 26723, "wall": 52621.5} {"step": 21457, "train_loss": 3.325728178024292, "lr": 0.00011739933656495638, "tps": 26721, "wall": 52627.2} {"step": 21458, "train_loss": 3.2477502822875977, "lr": 0.00011738359612632668, "tps": 26719, "wall": 52632.8} {"step": 21459, "train_loss": 3.3870246410369873, "lr": 0.00011736785685014107, "tps": 26718, "wall": 52638.5} {"step": 21460, "train_loss": 3.288356304168701, "lr": 0.00011735211873657798, "tps": 26716, "wall": 52644.2} {"step": 21461, "train_loss": 3.287994623184204, "lr": 0.00011733638178581565, "tps": 26714, "wall": 52649.9} {"step": 21462, "train_loss": 3.4229066371917725, "lr": 0.00011732064599803227, "tps": 26713, "wall": 52655.7} {"step": 21463, "train_loss": 3.2432754039764404, "lr": 0.00011730491137340624, "tps": 26711, "wall": 52661.4} {"step": 21464, "train_loss": 3.2614121437072754, "lr": 0.00011728917791211575, "tps": 26709, "wall": 52667.1} {"step": 21465, "train_loss": 3.3892805576324463, "lr": 0.0001172734456143389, "tps": 26708, "wall": 52672.8} {"step": 21466, "train_loss": 3.2820682525634766, "lr": 0.00011725771448025411, "tps": 26706, "wall": 52678.6} {"step": 21467, "train_loss": 3.3159446716308594, "lr": 0.00011724198451003942, "tps": 26704, "wall": 52684.3} {"step": 21468, "train_loss": 3.2629477977752686, "lr": 0.00011722625570387316, "tps": 26703, "wall": 52690.0} {"step": 21469, "train_loss": 3.3080925941467285, "lr": 0.00011721052806193342, "tps": 26701, "wall": 52695.7} {"step": 21470, "train_loss": 3.3273048400878906, "lr": 0.00011719480158439833, "tps": 26699, "wall": 52701.4} {"step": 21471, "train_loss": 3.1257922649383545, "lr": 0.00011717907627144615, "tps": 26698, "wall": 52707.1} {"step": 21472, "train_loss": 3.3445653915405273, "lr": 0.00011716335212325495, "tps": 26696, "wall": 52712.8} {"step": 21473, "train_loss": 3.252845525741577, "lr": 0.00011714762914000278, "tps": 26694, "wall": 52718.6} {"step": 21474, "train_loss": 3.286585569381714, "lr": 0.00011713190732186792, "tps": 26693, "wall": 52724.3} {"step": 21475, "train_loss": 3.2415809631347656, "lr": 0.00011711618666902837, "tps": 26691, "wall": 52730.0} {"step": 21476, "train_loss": 3.3348724842071533, "lr": 0.00011710046718166217, "tps": 26689, "wall": 52735.7} {"step": 21477, "train_loss": 3.069121837615967, "lr": 0.00011708474885994749, "tps": 26688, "wall": 52741.4} {"step": 21478, "train_loss": 3.4793975353240967, "lr": 0.00011706903170406236, "tps": 26686, "wall": 52747.1} {"step": 21479, "train_loss": 3.3085498809814453, "lr": 0.00011705331571418474, "tps": 26685, "wall": 52752.7} {"step": 21480, "train_loss": 3.315824508666992, "lr": 0.00011703760089049278, "tps": 26683, "wall": 52758.4} {"step": 21481, "train_loss": 3.359870433807373, "lr": 0.00011702188723316445, "tps": 26681, "wall": 52764.1} {"step": 21482, "train_loss": 3.23148775100708, "lr": 0.00011700617474237771, "tps": 26680, "wall": 52769.8} {"step": 21483, "train_loss": 3.309246778488159, "lr": 0.00011699046341831063, "tps": 26678, "wall": 52775.6} {"step": 21484, "train_loss": 3.250105381011963, "lr": 0.00011697475326114116, "tps": 26676, "wall": 52781.2} {"step": 21485, "train_loss": 3.2359776496887207, "lr": 0.00011695904427104723, "tps": 26675, "wall": 52787.0} {"step": 21486, "train_loss": 3.3461389541625977, "lr": 0.00011694333644820683, "tps": 26673, "wall": 52792.6} {"step": 21487, "train_loss": 3.3630876541137695, "lr": 0.00011692762979279786, "tps": 26671, "wall": 52798.4} {"step": 21488, "train_loss": 3.287641763687134, "lr": 0.00011691192430499834, "tps": 26670, "wall": 52804.0} {"step": 21489, "train_loss": 3.2528560161590576, "lr": 0.0001168962199849861, "tps": 26668, "wall": 52809.7} {"step": 21490, "train_loss": 3.2416906356811523, "lr": 0.00011688051683293899, "tps": 26667, "wall": 52815.4} {"step": 21491, "train_loss": 3.256059408187866, "lr": 0.00011686481484903505, "tps": 26665, "wall": 52821.1} {"step": 21492, "train_loss": 3.404716730117798, "lr": 0.00011684911403345207, "tps": 26663, "wall": 52826.8} {"step": 21493, "train_loss": 3.2675116062164307, "lr": 0.00011683341438636781, "tps": 26662, "wall": 52832.5} {"step": 21494, "train_loss": 3.3081912994384766, "lr": 0.00011681771590796039, "tps": 26660, "wall": 52838.3} {"step": 21495, "train_loss": 3.2244861125946045, "lr": 0.00011680201859840729, "tps": 26658, "wall": 52844.0} {"step": 21496, "train_loss": 3.352529764175415, "lr": 0.0001167863224578866, "tps": 26657, "wall": 52849.7} {"step": 21497, "train_loss": 3.2925705909729004, "lr": 0.00011677062748657604, "tps": 26655, "wall": 52855.4} {"step": 21498, "train_loss": 3.226472854614258, "lr": 0.00011675493368465332, "tps": 26653, "wall": 52861.1} {"step": 21499, "train_loss": 3.336960792541504, "lr": 0.00011673924105229632, "tps": 26652, "wall": 52866.8} {"step": 21500, "train_loss": 3.250991106033325, "lr": 0.00011672354958968283, "tps": 26650, "wall": 52872.5} {"step": 21501, "train_loss": 3.2885451316833496, "lr": 0.00011670785929699049, "tps": 26648, "wall": 52878.4} {"step": 21502, "train_loss": 3.204967498779297, "lr": 0.00011669217017439717, "tps": 26647, "wall": 52884.1} {"step": 21503, "train_loss": 3.2798500061035156, "lr": 0.00011667648222208052, "tps": 26645, "wall": 52889.8} {"step": 21504, "train_loss": 3.282743453979492, "lr": 0.00011666079544021822, "tps": 26644, "wall": 52895.6} {"step": 21505, "train_loss": 3.3050284385681152, "lr": 0.00011664510982898806, "tps": 26642, "wall": 52901.3} {"step": 21506, "train_loss": 3.226327419281006, "lr": 0.00011662942538856771, "tps": 26640, "wall": 52907.0} {"step": 21507, "train_loss": 3.2823917865753174, "lr": 0.00011661374211913476, "tps": 26639, "wall": 52912.8} {"step": 21508, "train_loss": 3.2029800415039062, "lr": 0.00011659806002086699, "tps": 26637, "wall": 52918.4} {"step": 21509, "train_loss": 3.353389263153076, "lr": 0.00011658237909394194, "tps": 26635, "wall": 52924.1} {"step": 21510, "train_loss": 3.2038798332214355, "lr": 0.00011656669933853734, "tps": 26634, "wall": 52929.8} {"step": 21511, "train_loss": 3.3156983852386475, "lr": 0.00011655102075483077, "tps": 26632, "wall": 52935.5} {"step": 21512, "train_loss": 3.33426833152771, "lr": 0.00011653534334299976, "tps": 26630, "wall": 52941.3} {"step": 21513, "train_loss": 3.347423553466797, "lr": 0.00011651966710322207, "tps": 26629, "wall": 52947.0} {"step": 21514, "train_loss": 3.3296737670898438, "lr": 0.00011650399203567517, "tps": 26627, "wall": 52952.7} {"step": 21515, "train_loss": 3.3004889488220215, "lr": 0.00011648831814053658, "tps": 26626, "wall": 52958.5} {"step": 21516, "train_loss": 3.2353920936584473, "lr": 0.000116472645417984, "tps": 26624, "wall": 52964.2} {"step": 21517, "train_loss": 3.3494372367858887, "lr": 0.00011645697386819488, "tps": 26622, "wall": 52969.9} {"step": 21518, "train_loss": 3.2884483337402344, "lr": 0.0001164413034913467, "tps": 26621, "wall": 52975.7} {"step": 21519, "train_loss": 3.2700977325439453, "lr": 0.0001164256342876171, "tps": 26619, "wall": 52981.3} {"step": 21520, "train_loss": 3.2889089584350586, "lr": 0.0001164099662571835, "tps": 26617, "wall": 52987.0} {"step": 21521, "train_loss": 3.332441568374634, "lr": 0.00011639429940022337, "tps": 26616, "wall": 52992.7} {"step": 21522, "train_loss": 3.308725118637085, "lr": 0.00011637863371691429, "tps": 26614, "wall": 52998.4} {"step": 21523, "train_loss": 3.228626251220703, "lr": 0.00011636296920743364, "tps": 26612, "wall": 53004.2} {"step": 21524, "train_loss": 3.353513479232788, "lr": 0.00011634730587195881, "tps": 26611, "wall": 53009.9} {"step": 21525, "train_loss": 3.4184579849243164, "lr": 0.00011633164371066738, "tps": 26609, "wall": 53015.7} {"step": 21526, "train_loss": 3.2729811668395996, "lr": 0.0001163159827237367, "tps": 26608, "wall": 53021.4} {"step": 21527, "train_loss": 3.283057689666748, "lr": 0.00011630032291134409, "tps": 26606, "wall": 53027.0} {"step": 21528, "train_loss": 3.3250327110290527, "lr": 0.00011628466427366713, "tps": 26604, "wall": 53032.7} {"step": 21529, "train_loss": 3.1997275352478027, "lr": 0.00011626900681088304, "tps": 26603, "wall": 53038.4} {"step": 21530, "train_loss": 3.2800517082214355, "lr": 0.00011625335052316927, "tps": 26601, "wall": 53044.1} {"step": 21531, "train_loss": 3.361793041229248, "lr": 0.00011623769541070322, "tps": 26599, "wall": 53049.9} {"step": 21532, "train_loss": 3.277033805847168, "lr": 0.00011622204147366207, "tps": 26598, "wall": 53055.5} {"step": 21533, "train_loss": 3.2439117431640625, "lr": 0.00011620638871222333, "tps": 26596, "wall": 53061.3} {"step": 21534, "train_loss": 3.294867515563965, "lr": 0.00011619073712656421, "tps": 26595, "wall": 53066.9} {"step": 21535, "train_loss": 3.3203513622283936, "lr": 0.00011617508671686197, "tps": 26593, "wall": 53072.6} {"step": 21536, "train_loss": 3.3815600872039795, "lr": 0.00011615943748329405, "tps": 26591, "wall": 53078.4} {"step": 21537, "train_loss": 3.361758232116699, "lr": 0.00011614378942603763, "tps": 26590, "wall": 53084.0} {"step": 21538, "train_loss": 3.3222475051879883, "lr": 0.00011612814254526991, "tps": 26588, "wall": 53089.7} {"step": 21539, "train_loss": 3.2794623374938965, "lr": 0.0001161124968411683, "tps": 26586, "wall": 53095.4} {"step": 21540, "train_loss": 3.3101489543914795, "lr": 0.00011609685231390994, "tps": 26585, "wall": 53101.0} {"step": 21541, "train_loss": 3.260917901992798, "lr": 0.00011608120896367198, "tps": 26583, "wall": 53106.8} {"step": 21542, "train_loss": 3.3493804931640625, "lr": 0.00011606556679063181, "tps": 26582, "wall": 53112.5} {"step": 21543, "train_loss": 3.3331079483032227, "lr": 0.00011604992579496647, "tps": 26580, "wall": 53118.1} {"step": 21544, "train_loss": 3.225956439971924, "lr": 0.00011603428597685315, "tps": 26578, "wall": 53123.8} {"step": 21545, "train_loss": 3.330355644226074, "lr": 0.00011601864733646912, "tps": 26577, "wall": 53129.5} {"step": 21546, "train_loss": 3.3370752334594727, "lr": 0.00011600300987399142, "tps": 26575, "wall": 53135.3} {"step": 21547, "train_loss": 3.404541492462158, "lr": 0.00011598737358959733, "tps": 26574, "wall": 53140.9} {"step": 21548, "train_loss": 3.2479419708251953, "lr": 0.00011597173848346385, "tps": 26572, "wall": 53146.6} {"step": 21549, "train_loss": 3.3350696563720703, "lr": 0.00011595610455576814, "tps": 26570, "wall": 53152.2} {"step": 21550, "train_loss": 3.230152130126953, "lr": 0.00011594047180668732, "tps": 26569, "wall": 53157.9} {"step": 21551, "train_loss": 3.301496982574463, "lr": 0.00011592484023639851, "tps": 26567, "wall": 53163.6} {"step": 21552, "train_loss": 3.2845704555511475, "lr": 0.00011590920984507864, "tps": 26566, "wall": 53169.2} {"step": 21553, "train_loss": 3.317140817642212, "lr": 0.00011589358063290494, "tps": 26564, "wall": 53174.9} {"step": 21554, "train_loss": 3.2948012351989746, "lr": 0.00011587795260005441, "tps": 26562, "wall": 53180.6} {"step": 21555, "train_loss": 3.2830331325531006, "lr": 0.00011586232574670402, "tps": 26561, "wall": 53186.3} {"step": 21556, "train_loss": 3.359494686126709, "lr": 0.00011584670007303087, "tps": 26559, "wall": 53191.9} {"step": 21557, "train_loss": 3.3299574851989746, "lr": 0.00011583107557921194, "tps": 26558, "wall": 53197.7} {"step": 21558, "train_loss": 3.2382450103759766, "lr": 0.00011581545226542414, "tps": 26556, "wall": 53203.4} {"step": 21559, "train_loss": 3.331599712371826, "lr": 0.00011579983013184463, "tps": 26554, "wall": 53209.0} {"step": 21560, "train_loss": 3.37522292137146, "lr": 0.00011578420917865025, "tps": 26553, "wall": 53214.7} {"step": 21561, "train_loss": 3.2237417697906494, "lr": 0.00011576858940601796, "tps": 26551, "wall": 53220.3} {"step": 21562, "train_loss": 3.2276618480682373, "lr": 0.00011575297081412477, "tps": 26550, "wall": 53226.0} {"step": 21563, "train_loss": 3.326071262359619, "lr": 0.00011573735340314757, "tps": 26548, "wall": 53231.6} {"step": 21564, "train_loss": 3.390820264816284, "lr": 0.00011572173717326317, "tps": 26546, "wall": 53237.3} {"step": 21565, "train_loss": 3.418987989425659, "lr": 0.00011570612212464868, "tps": 26545, "wall": 53242.9} {"step": 21566, "train_loss": 3.3411142826080322, "lr": 0.0001156905082574808, "tps": 26543, "wall": 53248.6} {"step": 21567, "train_loss": 3.230131149291992, "lr": 0.00011567489557193659, "tps": 26542, "wall": 53254.3} {"step": 21568, "train_loss": 3.3518145084381104, "lr": 0.00011565928406819275, "tps": 26540, "wall": 53260.0} {"step": 21569, "train_loss": 3.293714761734009, "lr": 0.00011564367374642615, "tps": 26538, "wall": 53265.7} {"step": 21570, "train_loss": 3.261335849761963, "lr": 0.00011562806460681373, "tps": 26537, "wall": 53271.3} {"step": 21571, "train_loss": 3.287454605102539, "lr": 0.00011561245664953222, "tps": 26535, "wall": 53276.9} {"step": 21572, "train_loss": 3.3096227645874023, "lr": 0.00011559684987475839, "tps": 26534, "wall": 53282.6} {"step": 21573, "train_loss": 3.402329683303833, "lr": 0.00011558124428266917, "tps": 26532, "wall": 53288.3} {"step": 21574, "train_loss": 3.343960762023926, "lr": 0.00011556563987344127, "tps": 26530, "wall": 53293.9} {"step": 21575, "train_loss": 3.3567800521850586, "lr": 0.00011555003664725137, "tps": 26529, "wall": 53299.5} {"step": 21576, "train_loss": 3.3328752517700195, "lr": 0.00011553443460427635, "tps": 26527, "wall": 53305.1} {"step": 21577, "train_loss": 3.24161958694458, "lr": 0.00011551883374469294, "tps": 26526, "wall": 53310.7} {"step": 21578, "train_loss": 3.2323408126831055, "lr": 0.00011550323406867774, "tps": 26524, "wall": 53316.5} {"step": 21579, "train_loss": 3.3137526512145996, "lr": 0.00011548763557640763, "tps": 26523, "wall": 53322.1} {"step": 21580, "train_loss": 3.282017707824707, "lr": 0.00011547203826805926, "tps": 26521, "wall": 53327.7} {"step": 21581, "train_loss": 3.2086071968078613, "lr": 0.00011545644214380922, "tps": 26519, "wall": 53333.4} {"step": 21582, "train_loss": 3.184116840362549, "lr": 0.00011544084720383433, "tps": 26518, "wall": 53339.0} {"step": 21583, "train_loss": 3.438634157180786, "lr": 0.00011542525344831113, "tps": 26516, "wall": 53344.6} {"step": 21584, "train_loss": 3.3167452812194824, "lr": 0.00011540966087741634, "tps": 26515, "wall": 53350.3} {"step": 21585, "train_loss": 3.188938617706299, "lr": 0.00011539406949132658, "tps": 26513, "wall": 53355.9} {"step": 21586, "train_loss": 3.203197479248047, "lr": 0.00011537847929021839, "tps": 26512, "wall": 53361.5} {"step": 21587, "train_loss": 3.264159917831421, "lr": 0.00011536289027426852, "tps": 26510, "wall": 53367.2} {"step": 21588, "train_loss": 3.213923454284668, "lr": 0.0001153473024436535, "tps": 26508, "wall": 53372.8} {"step": 21589, "train_loss": 3.24953031539917, "lr": 0.00011533171579854982, "tps": 26507, "wall": 53378.5} {"step": 21590, "train_loss": 3.2627954483032227, "lr": 0.00011531613033913423, "tps": 26505, "wall": 53384.1} {"step": 21591, "train_loss": 3.2694389820098877, "lr": 0.00011530054606558312, "tps": 26504, "wall": 53389.7} {"step": 21592, "train_loss": 3.2275848388671875, "lr": 0.00011528496297807306, "tps": 26502, "wall": 53395.3} {"step": 21593, "train_loss": 3.2764909267425537, "lr": 0.00011526938107678064, "tps": 26501, "wall": 53400.9} {"step": 21594, "train_loss": 3.3433194160461426, "lr": 0.00011525380036188238, "tps": 26499, "wall": 53406.5} {"step": 21595, "train_loss": 3.2107059955596924, "lr": 0.00011523822083355465, "tps": 26498, "wall": 53412.2} {"step": 21596, "train_loss": 3.210421562194824, "lr": 0.0001152226424919741, "tps": 26496, "wall": 53417.8} {"step": 21597, "train_loss": 3.3324131965637207, "lr": 0.00011520706533731708, "tps": 26494, "wall": 53423.4} {"step": 21598, "train_loss": 3.2454934120178223, "lr": 0.00011519148936976008, "tps": 26493, "wall": 53429.1} {"step": 21599, "train_loss": 3.333772897720337, "lr": 0.00011517591458947958, "tps": 26491, "wall": 53434.8} {"step": 21600, "train_loss": 3.321821689605713, "lr": 0.00011516034099665196, "tps": 26490, "wall": 53440.4} {"step": 21601, "train_loss": 3.357944965362549, "lr": 0.00011514476859145371, "tps": 26488, "wall": 53446.1} {"step": 21602, "train_loss": 3.2760961055755615, "lr": 0.0001151291973740612, "tps": 26486, "wall": 53451.7} {"step": 21603, "train_loss": 3.4003992080688477, "lr": 0.00011511362734465079, "tps": 26485, "wall": 53457.3} {"step": 21604, "train_loss": 3.2990407943725586, "lr": 0.0001150980585033989, "tps": 26483, "wall": 53462.9} {"step": 21605, "train_loss": 3.2840280532836914, "lr": 0.00011508249085048189, "tps": 26482, "wall": 53468.5} {"step": 21606, "train_loss": 3.3086471557617188, "lr": 0.00011506692438607602, "tps": 26480, "wall": 53474.1} {"step": 21607, "train_loss": 3.2147960662841797, "lr": 0.00011505135911035778, "tps": 26479, "wall": 53479.8} {"step": 21608, "train_loss": 3.407071590423584, "lr": 0.00011503579502350344, "tps": 26477, "wall": 53485.4} {"step": 21609, "train_loss": 3.27158784866333, "lr": 0.00011502023212568921, "tps": 26476, "wall": 53491.0} {"step": 21610, "train_loss": 3.321150064468384, "lr": 0.00011500467041709155, "tps": 26474, "wall": 53496.7} {"step": 21611, "train_loss": 3.36663818359375, "lr": 0.00011498910989788667, "tps": 26472, "wall": 53502.3} {"step": 21612, "train_loss": 3.371345281600952, "lr": 0.00011497355056825077, "tps": 26471, "wall": 53507.9} {"step": 21613, "train_loss": 3.3020591735839844, "lr": 0.00011495799242836019, "tps": 26469, "wall": 53513.5} {"step": 21614, "train_loss": 3.16463041305542, "lr": 0.00011494243547839118, "tps": 26468, "wall": 53519.1} {"step": 21615, "train_loss": 3.2691140174865723, "lr": 0.0001149268797185199, "tps": 26466, "wall": 53524.7} {"step": 21616, "train_loss": 3.392643451690674, "lr": 0.00011491132514892266, "tps": 26465, "wall": 53530.4} {"step": 21617, "train_loss": 3.2184033393859863, "lr": 0.00011489577176977561, "tps": 26463, "wall": 53536.0} {"step": 21618, "train_loss": 3.403491497039795, "lr": 0.0001148802195812549, "tps": 26462, "wall": 53541.6} {"step": 21619, "train_loss": 3.327164649963379, "lr": 0.00011486466858353679, "tps": 26460, "wall": 53547.2} {"step": 21620, "train_loss": 3.2522740364074707, "lr": 0.00011484911877679736, "tps": 26458, "wall": 53552.8} {"step": 21621, "train_loss": 3.3300111293792725, "lr": 0.00011483357016121283, "tps": 26457, "wall": 53558.5} {"step": 21622, "train_loss": 3.3639049530029297, "lr": 0.00011481802273695934, "tps": 26455, "wall": 53564.1} {"step": 21623, "train_loss": 3.255640745162964, "lr": 0.0001148024765042129, "tps": 26454, "wall": 53569.7} {"step": 21624, "train_loss": 3.226813793182373, "lr": 0.00011478693146314974, "tps": 26452, "wall": 53575.3} {"step": 21625, "train_loss": 3.3634135723114014, "lr": 0.00011477138761394597, "tps": 26451, "wall": 53580.9} {"step": 21626, "train_loss": 3.26716685295105, "lr": 0.00011475584495677751, "tps": 26449, "wall": 53586.5} {"step": 21627, "train_loss": 3.316234588623047, "lr": 0.00011474030349182059, "tps": 26448, "wall": 53592.1} {"step": 21628, "train_loss": 3.378699779510498, "lr": 0.00011472476321925121, "tps": 26446, "wall": 53597.8} {"step": 21629, "train_loss": 3.2188057899475098, "lr": 0.00011470922413924536, "tps": 26445, "wall": 53603.4} {"step": 21630, "train_loss": 3.40860652923584, "lr": 0.00011469368625197919, "tps": 26443, "wall": 53609.0} {"step": 21631, "train_loss": 3.3518640995025635, "lr": 0.00011467814955762859, "tps": 26441, "wall": 53614.7} {"step": 21632, "train_loss": 3.247004985809326, "lr": 0.00011466261405636958, "tps": 26440, "wall": 53620.3} {"step": 21633, "train_loss": 3.195570230484009, "lr": 0.00011464707974837823, "tps": 26438, "wall": 53625.9} {"step": 21634, "train_loss": 3.2686378955841064, "lr": 0.00011463154663383049, "tps": 26437, "wall": 53631.5} {"step": 21635, "train_loss": 3.2400174140930176, "lr": 0.0001146160147129022, "tps": 26435, "wall": 53637.1} {"step": 21636, "train_loss": 3.256844997406006, "lr": 0.00011460048398576945, "tps": 26434, "wall": 53642.7} {"step": 21637, "train_loss": 3.2329602241516113, "lr": 0.00011458495445260807, "tps": 26432, "wall": 53648.3} {"step": 21638, "train_loss": 3.325883150100708, "lr": 0.0001145694261135941, "tps": 26431, "wall": 53653.9} {"step": 21639, "train_loss": 3.408127784729004, "lr": 0.00011455389896890336, "tps": 26429, "wall": 53659.5} {"step": 21640, "train_loss": 3.2746753692626953, "lr": 0.00011453837301871168, "tps": 26428, "wall": 53665.1} {"step": 21641, "train_loss": 3.389354705810547, "lr": 0.00011452284826319513, "tps": 26426, "wall": 53670.7} {"step": 21642, "train_loss": 3.484189748764038, "lr": 0.00011450732470252941, "tps": 26424, "wall": 53676.4} {"step": 21643, "train_loss": 3.3203814029693604, "lr": 0.00011449180233689038, "tps": 26423, "wall": 53682.1} {"step": 21644, "train_loss": 3.1155691146850586, "lr": 0.00011447628116645399, "tps": 26421, "wall": 53687.7} {"step": 21645, "train_loss": 3.347933769226074, "lr": 0.00011446076119139596, "tps": 26420, "wall": 53693.3} {"step": 21646, "train_loss": 3.2783384323120117, "lr": 0.00011444524241189212, "tps": 26418, "wall": 53698.9} {"step": 21647, "train_loss": 3.2573089599609375, "lr": 0.00011442972482811831, "tps": 26417, "wall": 53704.5} {"step": 21648, "train_loss": 3.358283042907715, "lr": 0.00011441420844025032, "tps": 26415, "wall": 53710.1} {"step": 21649, "train_loss": 3.2356622219085693, "lr": 0.00011439869324846384, "tps": 26414, "wall": 53715.8} {"step": 21650, "train_loss": 3.2909016609191895, "lr": 0.00011438317925293469, "tps": 26412, "wall": 53721.4} {"step": 21651, "train_loss": 3.354512929916382, "lr": 0.00011436766645383863, "tps": 26411, "wall": 53727.0} {"step": 21652, "train_loss": 3.2461843490600586, "lr": 0.00011435215485135127, "tps": 26409, "wall": 53732.6} {"step": 21653, "train_loss": 3.4093258380889893, "lr": 0.00011433664444564851, "tps": 26407, "wall": 53738.3} {"step": 21654, "train_loss": 3.303927421569824, "lr": 0.00011432113523690588, "tps": 26406, "wall": 53743.9} {"step": 21655, "train_loss": 3.269531488418579, "lr": 0.00011430562722529923, "tps": 26404, "wall": 53749.6} {"step": 21656, "train_loss": 3.27720046043396, "lr": 0.0001142901204110041, "tps": 26403, "wall": 53755.2} {"step": 21657, "train_loss": 3.3505959510803223, "lr": 0.00011427461479419621, "tps": 26401, "wall": 53760.7} {"step": 21658, "train_loss": 3.3470802307128906, "lr": 0.00011425911037505121, "tps": 26400, "wall": 53766.4} {"step": 21659, "train_loss": 3.2707576751708984, "lr": 0.00011424360715374476, "tps": 26398, "wall": 53771.9} {"step": 21660, "train_loss": 3.2637577056884766, "lr": 0.00011422810513045239, "tps": 26397, "wall": 53777.5} {"step": 21661, "train_loss": 3.3047683238983154, "lr": 0.00011421260430534979, "tps": 26395, "wall": 53783.2} {"step": 21662, "train_loss": 3.357025384902954, "lr": 0.00011419710467861257, "tps": 26394, "wall": 53788.8} {"step": 21663, "train_loss": 3.3078248500823975, "lr": 0.00011418160625041628, "tps": 26392, "wall": 53794.5} {"step": 21664, "train_loss": 3.4163475036621094, "lr": 0.00011416610902093643, "tps": 26390, "wall": 53800.1} {"step": 21665, "train_loss": 3.278057098388672, "lr": 0.00011415061299034862, "tps": 26389, "wall": 53805.7} {"step": 21666, "train_loss": 3.2412796020507812, "lr": 0.00011413511815882843, "tps": 26387, "wall": 53811.3} {"step": 21667, "train_loss": 3.264906883239746, "lr": 0.00011411962452655132, "tps": 26386, "wall": 53816.9} {"step": 21668, "train_loss": 3.2854461669921875, "lr": 0.0001141041320936928, "tps": 26384, "wall": 53822.5} {"step": 21669, "train_loss": 3.274787187576294, "lr": 0.00011408864086042845, "tps": 26383, "wall": 53828.1} {"step": 21670, "train_loss": 3.3755273818969727, "lr": 0.00011407315082693371, "tps": 26381, "wall": 53833.8} {"step": 21671, "train_loss": 3.2811567783355713, "lr": 0.00011405766199338399, "tps": 26380, "wall": 53839.4} {"step": 21672, "train_loss": 3.3934149742126465, "lr": 0.00011404217435995486, "tps": 26378, "wall": 53845.0} {"step": 21673, "train_loss": 3.2815990447998047, "lr": 0.00011402668792682174, "tps": 26377, "wall": 53850.6} {"step": 21674, "train_loss": 3.3366425037384033, "lr": 0.00011401120269415991, "tps": 26375, "wall": 53856.3} {"step": 21675, "train_loss": 3.246199369430542, "lr": 0.00011399571866214502, "tps": 26374, "wall": 53861.9} {"step": 21676, "train_loss": 3.4011881351470947, "lr": 0.00011398023583095236, "tps": 26372, "wall": 53867.4} {"step": 21677, "train_loss": 3.298898220062256, "lr": 0.00011396475420075723, "tps": 26371, "wall": 53873.0} {"step": 21678, "train_loss": 3.2873682975769043, "lr": 0.00011394927377173518, "tps": 26369, "wall": 53878.6} {"step": 21679, "train_loss": 3.254422903060913, "lr": 0.00011393379454406145, "tps": 26368, "wall": 53884.2} {"step": 21680, "train_loss": 3.3223605155944824, "lr": 0.00011391831651791149, "tps": 26366, "wall": 53889.8} {"step": 21681, "train_loss": 3.3129355907440186, "lr": 0.00011390283969346058, "tps": 26364, "wall": 53895.4} {"step": 21682, "train_loss": 3.319673538208008, "lr": 0.00011388736407088396, "tps": 26363, "wall": 53901.0} {"step": 21683, "train_loss": 3.302173137664795, "lr": 0.0001138718896503571, "tps": 26361, "wall": 53906.6} {"step": 21684, "train_loss": 3.358553171157837, "lr": 0.00011385641643205522, "tps": 26360, "wall": 53912.2} {"step": 21685, "train_loss": 3.396930694580078, "lr": 0.00011384094441615351, "tps": 26358, "wall": 53917.8} {"step": 21686, "train_loss": 3.2398314476013184, "lr": 0.00011382547360282742, "tps": 26357, "wall": 53923.4} {"step": 21687, "train_loss": 3.3171629905700684, "lr": 0.0001138100039922521, "tps": 26355, "wall": 53929.1} {"step": 21688, "train_loss": 3.3269200325012207, "lr": 0.00011379453558460271, "tps": 26354, "wall": 53934.7} {"step": 21689, "train_loss": 3.3163766860961914, "lr": 0.00011377906838005465, "tps": 26352, "wall": 53940.3} {"step": 21690, "train_loss": 3.3588337898254395, "lr": 0.00011376360237878305, "tps": 26351, "wall": 53945.9} {"step": 21691, "train_loss": 3.349595069885254, "lr": 0.00011374813758096306, "tps": 26349, "wall": 53951.5} {"step": 21692, "train_loss": 3.33402681350708, "lr": 0.00011373267398676996, "tps": 26348, "wall": 53957.1} {"step": 21693, "train_loss": 3.282120704650879, "lr": 0.00011371721159637887, "tps": 26346, "wall": 53962.7} {"step": 21694, "train_loss": 3.2763428688049316, "lr": 0.00011370175040996491, "tps": 26345, "wall": 53968.3} {"step": 21695, "train_loss": 3.2977118492126465, "lr": 0.00011368629042770334, "tps": 26343, "wall": 53974.0} {"step": 21696, "train_loss": 3.2872116565704346, "lr": 0.00011367083164976913, "tps": 26342, "wall": 53979.5} {"step": 21697, "train_loss": 3.233339786529541, "lr": 0.0001136553740763376, "tps": 26340, "wall": 53985.1} {"step": 21698, "train_loss": 3.261842727661133, "lr": 0.00011363991770758371, "tps": 26339, "wall": 53990.6} {"step": 21699, "train_loss": 3.361189126968384, "lr": 0.00011362446254368255, "tps": 26337, "wall": 53996.2} {"step": 21700, "train_loss": 3.306457281112671, "lr": 0.00011360900858480926, "tps": 26336, "wall": 54001.9} {"step": 21701, "train_loss": 3.2851576805114746, "lr": 0.00011359355583113891, "tps": 26334, "wall": 54007.5} {"step": 21702, "train_loss": 3.4541678428649902, "lr": 0.00011357810428284641, "tps": 26333, "wall": 54013.1} {"step": 21703, "train_loss": 3.2780933380126953, "lr": 0.00011356265394010703, "tps": 26331, "wall": 54018.7} {"step": 21704, "train_loss": 3.244302272796631, "lr": 0.00011354720480309561, "tps": 26329, "wall": 54024.3} {"step": 21705, "train_loss": 3.3606691360473633, "lr": 0.00011353175687198718, "tps": 26328, "wall": 54029.9} {"step": 21706, "train_loss": 3.327491521835327, "lr": 0.00011351631014695681, "tps": 26326, "wall": 54035.6} {"step": 21707, "train_loss": 3.231062889099121, "lr": 0.00011350086462817943, "tps": 26325, "wall": 54041.2} {"step": 21708, "train_loss": 3.3038206100463867, "lr": 0.00011348542031582998, "tps": 26323, "wall": 54046.9} {"step": 21709, "train_loss": 3.278383731842041, "lr": 0.00011346997721008352, "tps": 26322, "wall": 54052.5} {"step": 21710, "train_loss": 3.33736252784729, "lr": 0.0001134545353111149, "tps": 26320, "wall": 54058.1} {"step": 21711, "train_loss": 3.3779096603393555, "lr": 0.00011343909461909902, "tps": 26319, "wall": 54063.7} {"step": 21712, "train_loss": 3.3887441158294678, "lr": 0.00011342365513421089, "tps": 26317, "wall": 54069.4} {"step": 21713, "train_loss": 3.354722499847412, "lr": 0.00011340821685662537, "tps": 26316, "wall": 54075.0} {"step": 21714, "train_loss": 3.2343132495880127, "lr": 0.00011339277978651727, "tps": 26314, "wall": 54080.6} {"step": 21715, "train_loss": 3.393777370452881, "lr": 0.0001133773439240616, "tps": 26313, "wall": 54086.2} {"step": 21716, "train_loss": 3.1556060314178467, "lr": 0.00011336190926943309, "tps": 26311, "wall": 54091.9} {"step": 21717, "train_loss": 3.305629253387451, "lr": 0.00011334647582280666, "tps": 26310, "wall": 54097.5} {"step": 21718, "train_loss": 3.2092905044555664, "lr": 0.00011333104358435718, "tps": 26308, "wall": 54103.1} {"step": 21719, "train_loss": 3.274775981903076, "lr": 0.00011331561255425929, "tps": 26307, "wall": 54108.7} {"step": 21720, "train_loss": 3.2406177520751953, "lr": 0.000113300182732688, "tps": 26305, "wall": 54114.3} {"step": 21721, "train_loss": 3.2613372802734375, "lr": 0.00011328475411981803, "tps": 26304, "wall": 54120.0} {"step": 21722, "train_loss": 3.2919063568115234, "lr": 0.00011326932671582406, "tps": 26302, "wall": 54125.6} {"step": 21723, "train_loss": 3.375544309616089, "lr": 0.00011325390052088099, "tps": 26300, "wall": 54131.2} {"step": 21724, "train_loss": 3.321561336517334, "lr": 0.00011323847553516351, "tps": 26299, "wall": 54136.8} {"step": 21725, "train_loss": 3.3797364234924316, "lr": 0.00011322305175884631, "tps": 26297, "wall": 54142.4} {"step": 21726, "train_loss": 3.244049072265625, "lr": 0.00011320762919210417, "tps": 26296, "wall": 54148.0} {"step": 21727, "train_loss": 3.328831434249878, "lr": 0.00011319220783511184, "tps": 26294, "wall": 54153.6} {"step": 21728, "train_loss": 3.3427016735076904, "lr": 0.00011317678768804388, "tps": 26293, "wall": 54159.3} {"step": 21729, "train_loss": 3.151669502258301, "lr": 0.00011316136875107511, "tps": 26291, "wall": 54164.9} {"step": 21730, "train_loss": 3.251384973526001, "lr": 0.00011314595102438013, "tps": 26290, "wall": 54170.5} {"step": 21731, "train_loss": 3.3330602645874023, "lr": 0.00011313053450813351, "tps": 26288, "wall": 54176.1} {"step": 21732, "train_loss": 3.3603365421295166, "lr": 0.00011311511920251008, "tps": 26287, "wall": 54181.7} {"step": 21733, "train_loss": 3.2440013885498047, "lr": 0.00011309970510768429, "tps": 26285, "wall": 54187.3} {"step": 21734, "train_loss": 3.3847553730010986, "lr": 0.00011308429222383088, "tps": 26284, "wall": 54192.9} {"step": 21735, "train_loss": 3.1461615562438965, "lr": 0.00011306888055112436, "tps": 26282, "wall": 54198.5} {"step": 21736, "train_loss": 3.2647762298583984, "lr": 0.00011305347008973934, "tps": 26281, "wall": 54204.1} {"step": 21737, "train_loss": 3.2755658626556396, "lr": 0.00011303806083985042, "tps": 26279, "wall": 54209.7} {"step": 21738, "train_loss": 3.294706106185913, "lr": 0.00011302265280163213, "tps": 26278, "wall": 54215.4} {"step": 21739, "train_loss": 3.304185390472412, "lr": 0.000113007245975259, "tps": 26276, "wall": 54221.0} {"step": 21740, "train_loss": 3.311288356781006, "lr": 0.0001129918403609056, "tps": 26275, "wall": 54226.6} {"step": 21741, "train_loss": 3.344322681427002, "lr": 0.00011297643595874645, "tps": 26273, "wall": 54232.2} {"step": 21742, "train_loss": 3.304621458053589, "lr": 0.00011296103276895592, "tps": 26272, "wall": 54237.8} {"step": 21743, "train_loss": 3.2516427040100098, "lr": 0.0001129456307917087, "tps": 26270, "wall": 54243.4} {"step": 21744, "train_loss": 3.1569488048553467, "lr": 0.00011293023002717915, "tps": 26269, "wall": 54249.1} {"step": 21745, "train_loss": 3.314784288406372, "lr": 0.00011291483047554167, "tps": 26267, "wall": 54254.7} {"step": 21746, "train_loss": 3.380950450897217, "lr": 0.00011289943213697085, "tps": 26266, "wall": 54260.3} {"step": 21747, "train_loss": 3.265439987182617, "lr": 0.00011288403501164109, "tps": 26264, "wall": 54265.9} {"step": 21748, "train_loss": 3.2798452377319336, "lr": 0.00011286863909972666, "tps": 26263, "wall": 54271.5} {"step": 21749, "train_loss": 3.2451186180114746, "lr": 0.00011285324440140219, "tps": 26261, "wall": 54277.2} {"step": 21750, "train_loss": 3.3404102325439453, "lr": 0.00011283785091684189, "tps": 26260, "wall": 54282.8} {"step": 21751, "train_loss": 3.4320600032806396, "lr": 0.00011282245864622027, "tps": 26258, "wall": 54288.4} {"step": 21752, "train_loss": 3.365978956222534, "lr": 0.00011280706758971167, "tps": 26257, "wall": 54294.0} {"step": 21753, "train_loss": 3.3401761054992676, "lr": 0.00011279167774749029, "tps": 26255, "wall": 54299.6} {"step": 21754, "train_loss": 3.3509480953216553, "lr": 0.00011277628911973069, "tps": 26254, "wall": 54305.2} {"step": 21755, "train_loss": 3.409029006958008, "lr": 0.00011276090170660704, "tps": 26252, "wall": 54310.8} {"step": 21756, "train_loss": 3.2210521697998047, "lr": 0.00011274551550829366, "tps": 26251, "wall": 54316.4} {"step": 21757, "train_loss": 3.2913050651550293, "lr": 0.00011273013052496497, "tps": 26249, "wall": 54322.0} {"step": 21758, "train_loss": 3.1497228145599365, "lr": 0.00011271474675679515, "tps": 26248, "wall": 54327.6} {"step": 21759, "train_loss": 3.329537868499756, "lr": 0.00011269936420395839, "tps": 26246, "wall": 54333.2} {"step": 21760, "train_loss": 3.2402493953704834, "lr": 0.00011268398286662911, "tps": 26245, "wall": 54338.8} {"step": 21761, "train_loss": 3.2253899574279785, "lr": 0.0001126686027449815, "tps": 26243, "wall": 54344.4} {"step": 21762, "train_loss": 3.330317735671997, "lr": 0.0001126532238391897, "tps": 26242, "wall": 54350.0} {"step": 21763, "train_loss": 3.309741973876953, "lr": 0.00011263784614942804, "tps": 26240, "wall": 54355.6} {"step": 21764, "train_loss": 3.3392481803894043, "lr": 0.00011262246967587067, "tps": 26239, "wall": 54361.2} {"step": 21765, "train_loss": 3.3929524421691895, "lr": 0.00011260709441869171, "tps": 26237, "wall": 54366.8} {"step": 21766, "train_loss": 3.439138889312744, "lr": 0.00011259172037806547, "tps": 26236, "wall": 54372.4} {"step": 21767, "train_loss": 3.3825109004974365, "lr": 0.00011257634755416599, "tps": 26234, "wall": 54377.9} {"step": 21768, "train_loss": 3.224318742752075, "lr": 0.00011256097594716743, "tps": 26233, "wall": 54383.5} {"step": 21769, "train_loss": 3.3479340076446533, "lr": 0.00011254560555724403, "tps": 26231, "wall": 54389.1} {"step": 21770, "train_loss": 3.2957730293273926, "lr": 0.00011253023638456972, "tps": 26230, "wall": 54394.8} {"step": 21771, "train_loss": 3.26237154006958, "lr": 0.00011251486842931877, "tps": 26228, "wall": 54400.4} {"step": 21772, "train_loss": 3.3680105209350586, "lr": 0.00011249950169166523, "tps": 26227, "wall": 54406.0} {"step": 21773, "train_loss": 3.3348166942596436, "lr": 0.00011248413617178307, "tps": 26225, "wall": 54411.6} {"step": 21774, "train_loss": 3.2660574913024902, "lr": 0.0001124687718698465, "tps": 26224, "wall": 54417.2} {"step": 21775, "train_loss": 3.228046417236328, "lr": 0.00011245340878602948, "tps": 26222, "wall": 54422.7} {"step": 21776, "train_loss": 3.2979063987731934, "lr": 0.00011243804692050601, "tps": 26221, "wall": 54428.3} {"step": 21777, "train_loss": 3.220885753631592, "lr": 0.00011242268627345027, "tps": 26219, "wall": 54433.9} {"step": 21778, "train_loss": 3.2813825607299805, "lr": 0.00011240732684503613, "tps": 26218, "wall": 54439.5} {"step": 21779, "train_loss": 3.3036186695098877, "lr": 0.00011239196863543755, "tps": 26216, "wall": 54445.1} {"step": 21780, "train_loss": 3.3108394145965576, "lr": 0.0001123766116448286, "tps": 26215, "wall": 54450.7} {"step": 21781, "train_loss": 3.2215137481689453, "lr": 0.00011236125587338326, "tps": 26213, "wall": 54456.4} {"step": 21782, "train_loss": 3.368359327316284, "lr": 0.00011234590132127536, "tps": 26212, "wall": 54462.0} {"step": 21783, "train_loss": 3.243818759918213, "lr": 0.00011233054798867897, "tps": 26210, "wall": 54467.7} {"step": 21784, "train_loss": 3.1571199893951416, "lr": 0.00011231519587576796, "tps": 26209, "wall": 54473.2} {"step": 21785, "train_loss": 3.3610172271728516, "lr": 0.00011229984498271618, "tps": 26207, "wall": 54478.8} {"step": 21786, "train_loss": 3.284167528152466, "lr": 0.00011228449530969762, "tps": 26206, "wall": 54484.4} {"step": 21787, "train_loss": 3.300877094268799, "lr": 0.00011226914685688607, "tps": 26204, "wall": 54490.0} {"step": 21788, "train_loss": 3.350236415863037, "lr": 0.00011225379962445557, "tps": 26203, "wall": 54495.6} {"step": 21789, "train_loss": 3.3339552879333496, "lr": 0.00011223845361257978, "tps": 26201, "wall": 54501.1} {"step": 21790, "train_loss": 3.2907278537750244, "lr": 0.00011222310882143259, "tps": 26200, "wall": 54506.8} {"step": 21791, "train_loss": 3.2777106761932373, "lr": 0.00011220776525118793, "tps": 26198, "wall": 54512.3} {"step": 21792, "train_loss": 3.2991063594818115, "lr": 0.00011219242290201953, "tps": 26197, "wall": 54518.0} {"step": 21793, "train_loss": 3.2364659309387207, "lr": 0.00011217708177410112, "tps": 26195, "wall": 54523.7} {"step": 21794, "train_loss": 3.3189315795898438, "lr": 0.00011216174186760664, "tps": 26194, "wall": 54529.3} {"step": 21795, "train_loss": 3.2315053939819336, "lr": 0.00011214640318270977, "tps": 26192, "wall": 54534.8} {"step": 21796, "train_loss": 3.3831982612609863, "lr": 0.00011213106571958421, "tps": 26191, "wall": 54540.4} {"step": 21797, "train_loss": 3.2140538692474365, "lr": 0.00011211572947840385, "tps": 26189, "wall": 54546.1} {"step": 21798, "train_loss": 3.2750539779663086, "lr": 0.00011210039445934235, "tps": 26188, "wall": 54551.6} {"step": 21799, "train_loss": 3.1932430267333984, "lr": 0.00011208506066257332, "tps": 26186, "wall": 54557.2} {"step": 21800, "train_loss": 3.3558731079101562, "lr": 0.00011206972808827068, "tps": 26185, "wall": 54562.8} {"step": 21801, "train_loss": 3.1995110511779785, "lr": 0.00011205439673660793, "tps": 26183, "wall": 54568.4} {"step": 21802, "train_loss": 3.256527900695801, "lr": 0.00011203906660775881, "tps": 26182, "wall": 54574.1} {"step": 21803, "train_loss": 3.244328022003174, "lr": 0.00011202373770189703, "tps": 26180, "wall": 54579.7} {"step": 21804, "train_loss": 3.2795443534851074, "lr": 0.00011200841001919617, "tps": 26179, "wall": 54585.2} {"step": 21805, "train_loss": 3.269188404083252, "lr": 0.00011199308355982983, "tps": 26178, "wall": 54590.8} {"step": 21806, "train_loss": 3.300664186477661, "lr": 0.00011197775832397175, "tps": 26176, "wall": 54596.3} {"step": 21807, "train_loss": 3.3025407791137695, "lr": 0.0001119624343117954, "tps": 26175, "wall": 54601.9} {"step": 21808, "train_loss": 3.3170878887176514, "lr": 0.0001119471115234745, "tps": 26173, "wall": 54607.6} {"step": 21809, "train_loss": 3.352811098098755, "lr": 0.00011193178995918259, "tps": 26172, "wall": 54613.2} {"step": 21810, "train_loss": 3.236973762512207, "lr": 0.00011191646961909313, "tps": 26170, "wall": 54618.8} {"step": 21811, "train_loss": 3.3555617332458496, "lr": 0.00011190115050337979, "tps": 26169, "wall": 54624.4} {"step": 21812, "train_loss": 3.3455913066864014, "lr": 0.00011188583261221607, "tps": 26167, "wall": 54630.0} {"step": 21813, "train_loss": 3.2922096252441406, "lr": 0.00011187051594577547, "tps": 26166, "wall": 54635.6} {"step": 21814, "train_loss": 3.36560320854187, "lr": 0.00011185520050423152, "tps": 26164, "wall": 54641.2} {"step": 21815, "train_loss": 3.2978410720825195, "lr": 0.00011183988628775777, "tps": 26163, "wall": 54646.8} {"step": 21816, "train_loss": 3.3473520278930664, "lr": 0.00011182457329652754, "tps": 26161, "wall": 54652.4} {"step": 21817, "train_loss": 3.3555524349212646, "lr": 0.00011180926153071447, "tps": 26160, "wall": 54657.9} {"step": 21818, "train_loss": 3.3358147144317627, "lr": 0.00011179395099049195, "tps": 26158, "wall": 54663.5} {"step": 21819, "train_loss": 3.2909951210021973, "lr": 0.00011177864167603331, "tps": 26157, "wall": 54669.1} {"step": 21820, "train_loss": 3.273949146270752, "lr": 0.00011176333358751217, "tps": 26155, "wall": 54674.7} {"step": 21821, "train_loss": 3.310603618621826, "lr": 0.00011174802672510179, "tps": 26154, "wall": 54680.4} {"step": 21822, "train_loss": 3.333423376083374, "lr": 0.0001117327210889756, "tps": 26152, "wall": 54685.9} {"step": 21823, "train_loss": 3.2329659461975098, "lr": 0.00011171741667930704, "tps": 26151, "wall": 54691.5} {"step": 21824, "train_loss": 3.2968757152557373, "lr": 0.0001117021134962694, "tps": 26149, "wall": 54697.2} {"step": 21825, "train_loss": 3.3006129264831543, "lr": 0.00011168681154003615, "tps": 26148, "wall": 54702.7} {"step": 21826, "train_loss": 3.2926268577575684, "lr": 0.00011167151081078054, "tps": 26146, "wall": 54708.3} {"step": 21827, "train_loss": 3.290205240249634, "lr": 0.00011165621130867586, "tps": 26145, "wall": 54713.9} {"step": 21828, "train_loss": 3.235956907272339, "lr": 0.00011164091303389554, "tps": 26143, "wall": 54719.5} {"step": 21829, "train_loss": 3.1661715507507324, "lr": 0.00011162561598661281, "tps": 26142, "wall": 54725.2} {"step": 21830, "train_loss": 3.278904438018799, "lr": 0.0001116103201670009, "tps": 26140, "wall": 54730.8} {"step": 21831, "train_loss": 3.2143092155456543, "lr": 0.00011159502557523329, "tps": 26139, "wall": 54736.4} {"step": 21832, "train_loss": 3.270451784133911, "lr": 0.00011157973221148297, "tps": 26138, "wall": 54742.0} {"step": 21833, "train_loss": 3.3899521827697754, "lr": 0.00011156444007592335, "tps": 26136, "wall": 54747.6} {"step": 21834, "train_loss": 3.2135353088378906, "lr": 0.00011154914916872765, "tps": 26135, "wall": 54753.2} {"step": 21835, "train_loss": 3.293590545654297, "lr": 0.00011153385949006896, "tps": 26133, "wall": 54758.9} {"step": 21836, "train_loss": 3.3139116764068604, "lr": 0.00011151857104012066, "tps": 26132, "wall": 54764.5} {"step": 21837, "train_loss": 3.2909321784973145, "lr": 0.00011150328381905586, "tps": 26130, "wall": 54770.0} {"step": 21838, "train_loss": 3.1848976612091064, "lr": 0.00011148799782704766, "tps": 26129, "wall": 54775.6} {"step": 21839, "train_loss": 3.277691125869751, "lr": 0.00011147271306426934, "tps": 26127, "wall": 54781.2} {"step": 21840, "train_loss": 3.3773272037506104, "lr": 0.00011145742953089402, "tps": 26126, "wall": 54786.8} {"step": 21841, "train_loss": 3.305558919906616, "lr": 0.00011144214722709474, "tps": 26124, "wall": 54792.4} {"step": 21842, "train_loss": 3.2593131065368652, "lr": 0.00011142686615304477, "tps": 26123, "wall": 54798.0} {"step": 21843, "train_loss": 3.3395392894744873, "lr": 0.00011141158630891709, "tps": 26121, "wall": 54803.6} {"step": 21844, "train_loss": 3.36262845993042, "lr": 0.0001113963076948848, "tps": 26120, "wall": 54809.1} {"step": 21845, "train_loss": 3.35587739944458, "lr": 0.00011138103031112108, "tps": 26118, "wall": 54814.8} {"step": 21846, "train_loss": 3.293217658996582, "lr": 0.0001113657541577989, "tps": 26117, "wall": 54820.5} {"step": 21847, "train_loss": 3.2062039375305176, "lr": 0.0001113504792350913, "tps": 26115, "wall": 54826.1} {"step": 21848, "train_loss": 3.329888343811035, "lr": 0.00011133520554317138, "tps": 26114, "wall": 54831.7} {"step": 21849, "train_loss": 3.3848960399627686, "lr": 0.00011131993308221212, "tps": 26112, "wall": 54837.4} {"step": 21850, "train_loss": 3.325547218322754, "lr": 0.00011130466185238655, "tps": 26111, "wall": 54842.9} {"step": 21851, "train_loss": 3.2483768463134766, "lr": 0.00011128939185386767, "tps": 26109, "wall": 54848.5} {"step": 21852, "train_loss": 3.2518997192382812, "lr": 0.00011127412308682836, "tps": 26108, "wall": 54854.2} {"step": 21853, "train_loss": 3.3083975315093994, "lr": 0.00011125885555144173, "tps": 26106, "wall": 54859.8} {"step": 21854, "train_loss": 3.2878458499908447, "lr": 0.00011124358924788069, "tps": 26105, "wall": 54865.4} {"step": 21855, "train_loss": 3.1775755882263184, "lr": 0.0001112283241763181, "tps": 26104, "wall": 54871.0} {"step": 21856, "train_loss": 3.2843375205993652, "lr": 0.00011121306033692698, "tps": 26102, "wall": 54876.8} {"step": 21857, "train_loss": 3.3504559993743896, "lr": 0.0001111977977298802, "tps": 26101, "wall": 54882.3} {"step": 21858, "train_loss": 3.394101619720459, "lr": 0.00011118253635535059, "tps": 26099, "wall": 54887.9} {"step": 21859, "train_loss": 3.277388572692871, "lr": 0.00011116727621351116, "tps": 26098, "wall": 54893.5} {"step": 21860, "train_loss": 3.233908176422119, "lr": 0.0001111520173045347, "tps": 26096, "wall": 54899.1} {"step": 21861, "train_loss": 3.3346030712127686, "lr": 0.00011113675962859402, "tps": 26095, "wall": 54904.7} {"step": 21862, "train_loss": 3.3390133380889893, "lr": 0.00011112150318586211, "tps": 26093, "wall": 54910.3} {"step": 21863, "train_loss": 3.3302745819091797, "lr": 0.00011110624797651168, "tps": 26092, "wall": 54915.9} {"step": 21864, "train_loss": 3.3269801139831543, "lr": 0.00011109099400071547, "tps": 26090, "wall": 54921.6} {"step": 21865, "train_loss": 3.301992177963257, "lr": 0.00011107574125864645, "tps": 26089, "wall": 54927.2} {"step": 21866, "train_loss": 3.290013313293457, "lr": 0.00011106048975047731, "tps": 26087, "wall": 54932.7} {"step": 21867, "train_loss": 3.3375418186187744, "lr": 0.00011104523947638086, "tps": 26086, "wall": 54938.4} {"step": 21868, "train_loss": 3.184113025665283, "lr": 0.00011102999043652984, "tps": 26084, "wall": 54943.9} {"step": 21869, "train_loss": 3.347142219543457, "lr": 0.00011101474263109691, "tps": 26083, "wall": 54949.5} {"step": 21870, "train_loss": 3.349313735961914, "lr": 0.00011099949606025495, "tps": 26081, "wall": 54955.1} {"step": 21871, "train_loss": 3.3613524436950684, "lr": 0.00011098425072417658, "tps": 26080, "wall": 54960.7} {"step": 21872, "train_loss": 3.216629981994629, "lr": 0.00011096900662303444, "tps": 26079, "wall": 54966.3} {"step": 21873, "train_loss": 3.264007568359375, "lr": 0.00011095376375700139, "tps": 26077, "wall": 54971.9} {"step": 21874, "train_loss": 3.273951530456543, "lr": 0.00011093852212625, "tps": 26076, "wall": 54977.5} {"step": 21875, "train_loss": 3.315373182296753, "lr": 0.00011092328173095285, "tps": 26074, "wall": 54983.1} {"step": 21876, "train_loss": 3.3786802291870117, "lr": 0.00011090804257128274, "tps": 26073, "wall": 54988.7} {"step": 21877, "train_loss": 3.281099796295166, "lr": 0.00011089280464741221, "tps": 26071, "wall": 54994.4} {"step": 21878, "train_loss": 3.411449670791626, "lr": 0.00011087756795951383, "tps": 26070, "wall": 55000.0} {"step": 21879, "train_loss": 3.263050079345703, "lr": 0.00011086233250776032, "tps": 26068, "wall": 55005.5} {"step": 21880, "train_loss": 3.269085645675659, "lr": 0.00011084709829232425, "tps": 26067, "wall": 55011.1} {"step": 21881, "train_loss": 3.255679130554199, "lr": 0.00011083186531337806, "tps": 26065, "wall": 55016.7} {"step": 21882, "train_loss": 3.2726521492004395, "lr": 0.00011081663357109446, "tps": 26064, "wall": 55022.3} {"step": 21883, "train_loss": 3.273571491241455, "lr": 0.00011080140306564591, "tps": 26062, "wall": 55027.8} {"step": 21884, "train_loss": 3.341212272644043, "lr": 0.00011078617379720504, "tps": 26061, "wall": 55033.4} {"step": 21885, "train_loss": 3.292020797729492, "lr": 0.00011077094576594426, "tps": 26060, "wall": 55039.0} {"step": 21886, "train_loss": 3.270923376083374, "lr": 0.00011075571897203609, "tps": 26058, "wall": 55044.6} {"step": 21887, "train_loss": 3.255101442337036, "lr": 0.00011074049341565312, "tps": 26057, "wall": 55050.2} {"step": 21888, "train_loss": 3.444520950317383, "lr": 0.0001107252690969677, "tps": 26055, "wall": 55055.9} {"step": 21889, "train_loss": 3.3331642150878906, "lr": 0.00011071004601615232, "tps": 26054, "wall": 55061.4} {"step": 21890, "train_loss": 3.1977007389068604, "lr": 0.00011069482417337948, "tps": 26052, "wall": 55067.0} {"step": 21891, "train_loss": 3.2859888076782227, "lr": 0.0001106796035688216, "tps": 26051, "wall": 55072.6} {"step": 21892, "train_loss": 3.2758901119232178, "lr": 0.00011066438420265104, "tps": 26049, "wall": 55078.1} {"step": 21893, "train_loss": 3.277039051055908, "lr": 0.00011064916607504031, "tps": 26048, "wall": 55083.7} {"step": 21894, "train_loss": 3.3168697357177734, "lr": 0.00011063394918616174, "tps": 26047, "wall": 55089.3} {"step": 21895, "train_loss": 3.2270913124084473, "lr": 0.00011061873353618763, "tps": 26045, "wall": 55094.8} {"step": 21896, "train_loss": 3.4048092365264893, "lr": 0.0001106035191252905, "tps": 26044, "wall": 55100.4} {"step": 21897, "train_loss": 3.380380630493164, "lr": 0.00011058830595364261, "tps": 26042, "wall": 55106.0} {"step": 21898, "train_loss": 3.305722713470459, "lr": 0.00011057309402141626, "tps": 26041, "wall": 55111.6} {"step": 21899, "train_loss": 3.246479034423828, "lr": 0.00011055788332878389, "tps": 26039, "wall": 55117.3} {"step": 21900, "train_loss": 3.2679145336151123, "lr": 0.00011054267387591774, "tps": 26038, "wall": 55122.9} {"step": 21901, "train_loss": 3.4560837745666504, "lr": 0.00011052746566299004, "tps": 26036, "wall": 55128.4} {"step": 21902, "train_loss": 3.3057427406311035, "lr": 0.00011051225869017317, "tps": 26035, "wall": 55134.0} {"step": 21903, "train_loss": 3.2383971214294434, "lr": 0.00011049705295763933, "tps": 26033, "wall": 55139.6} {"step": 21904, "train_loss": 3.313838005065918, "lr": 0.0001104818484655608, "tps": 26032, "wall": 55145.1} {"step": 21905, "train_loss": 3.3626346588134766, "lr": 0.00011046664521410988, "tps": 26031, "wall": 55150.7} {"step": 21906, "train_loss": 3.2916245460510254, "lr": 0.00011045144320345864, "tps": 26029, "wall": 55156.2} {"step": 21907, "train_loss": 3.2379086017608643, "lr": 0.00011043624243377943, "tps": 26028, "wall": 55161.8} {"step": 21908, "train_loss": 3.3695321083068848, "lr": 0.0001104210429052444, "tps": 26026, "wall": 55167.3} {"step": 21909, "train_loss": 3.282994270324707, "lr": 0.00011040584461802565, "tps": 26025, "wall": 55172.9} {"step": 21910, "train_loss": 3.3359875679016113, "lr": 0.00011039064757229552, "tps": 26023, "wall": 55178.5} {"step": 21911, "train_loss": 3.2844457626342773, "lr": 0.00011037545176822606, "tps": 26022, "wall": 55184.1} {"step": 21912, "train_loss": 3.340651273727417, "lr": 0.0001103602572059893, "tps": 26020, "wall": 55189.7} {"step": 21913, "train_loss": 3.25655460357666, "lr": 0.00011034506388575758, "tps": 26019, "wall": 55195.3} {"step": 21914, "train_loss": 3.324411392211914, "lr": 0.00011032987180770291, "tps": 26018, "wall": 55200.9} {"step": 21915, "train_loss": 3.2625255584716797, "lr": 0.00011031468097199731, "tps": 26016, "wall": 55206.5} {"step": 21916, "train_loss": 3.2719101905822754, "lr": 0.00011029949137881299, "tps": 26015, "wall": 55212.1} {"step": 21917, "train_loss": 3.2958226203918457, "lr": 0.000110284303028322, "tps": 26013, "wall": 55217.7} {"step": 21918, "train_loss": 3.3538665771484375, "lr": 0.00011026911592069627, "tps": 26012, "wall": 55223.2} {"step": 21919, "train_loss": 3.323838233947754, "lr": 0.00011025393005610802, "tps": 26010, "wall": 55228.8} {"step": 21920, "train_loss": 3.3822412490844727, "lr": 0.00011023874543472912, "tps": 26009, "wall": 55234.5} {"step": 21921, "train_loss": 3.199985980987549, "lr": 0.00011022356205673167, "tps": 26007, "wall": 55240.0} {"step": 21922, "train_loss": 3.351574182510376, "lr": 0.0001102083799222877, "tps": 26006, "wall": 55245.6} {"step": 21923, "train_loss": 3.2869386672973633, "lr": 0.00011019319903156904, "tps": 26005, "wall": 55251.1} {"step": 21924, "train_loss": 3.32072377204895, "lr": 0.00011017801938474785, "tps": 26003, "wall": 55256.7} {"step": 21925, "train_loss": 3.200136184692383, "lr": 0.00011016284098199599, "tps": 26002, "wall": 55262.3} {"step": 21926, "train_loss": 3.330815315246582, "lr": 0.00011014766382348533, "tps": 26000, "wall": 55267.9} {"step": 21927, "train_loss": 3.405400514602661, "lr": 0.00011013248790938795, "tps": 25999, "wall": 55273.4} {"step": 21928, "train_loss": 3.262235641479492, "lr": 0.0001101173132398757, "tps": 25997, "wall": 55279.1} {"step": 21929, "train_loss": 3.237333297729492, "lr": 0.0001101021398151204, "tps": 25996, "wall": 55284.9} {"step": 21930, "train_loss": 3.355808734893799, "lr": 0.00011008696763529409, "tps": 25994, "wall": 55290.6} {"step": 21931, "train_loss": 3.25449275970459, "lr": 0.00011007179670056852, "tps": 25993, "wall": 55296.4} {"step": 21932, "train_loss": 3.2214770317077637, "lr": 0.00011005662701111555, "tps": 25991, "wall": 55302.1} {"step": 21933, "train_loss": 3.3081531524658203, "lr": 0.0001100414585671071, "tps": 25990, "wall": 55307.8} {"step": 21934, "train_loss": 3.1808297634124756, "lr": 0.00011002629136871498, "tps": 25988, "wall": 55313.6} {"step": 21935, "train_loss": 3.2730870246887207, "lr": 0.00011001112541611091, "tps": 25987, "wall": 55319.2} {"step": 21936, "train_loss": 3.366313934326172, "lr": 0.00010999596070946683, "tps": 25985, "wall": 55324.8} {"step": 21937, "train_loss": 3.284231662750244, "lr": 0.00010998079724895435, "tps": 25984, "wall": 55330.4} {"step": 21938, "train_loss": 3.222445487976074, "lr": 0.00010996563503474549, "tps": 25982, "wall": 55336.0} {"step": 21939, "train_loss": 3.2293195724487305, "lr": 0.0001099504740670118, "tps": 25981, "wall": 55341.6} {"step": 21940, "train_loss": 3.4036498069763184, "lr": 0.00010993531434592506, "tps": 25980, "wall": 55347.2} {"step": 21941, "train_loss": 3.386336088180542, "lr": 0.0001099201558716571, "tps": 25978, "wall": 55352.8} {"step": 21942, "train_loss": 3.257701873779297, "lr": 0.00010990499864437955, "tps": 25977, "wall": 55358.5} {"step": 21943, "train_loss": 3.270575523376465, "lr": 0.0001098898426642641, "tps": 25975, "wall": 55364.0} {"step": 21944, "train_loss": 3.345397472381592, "lr": 0.00010987468793148252, "tps": 25974, "wall": 55369.6} {"step": 21945, "train_loss": 3.3351175785064697, "lr": 0.0001098595344462064, "tps": 25972, "wall": 55375.2} {"step": 21946, "train_loss": 3.2208786010742188, "lr": 0.00010984438220860742, "tps": 25971, "wall": 55380.8} {"step": 21947, "train_loss": 3.2850399017333984, "lr": 0.00010982923121885726, "tps": 25970, "wall": 55386.4} {"step": 21948, "train_loss": 3.295984983444214, "lr": 0.00010981408147712755, "tps": 25968, "wall": 55391.9} {"step": 21949, "train_loss": 3.162686347961426, "lr": 0.00010979893298358983, "tps": 25967, "wall": 55397.5} {"step": 21950, "train_loss": 3.243459701538086, "lr": 0.00010978378573841581, "tps": 25965, "wall": 55403.1} {"step": 21951, "train_loss": 3.3486886024475098, "lr": 0.00010976863974177702, "tps": 25964, "wall": 55408.6} {"step": 21952, "train_loss": 3.402921676635742, "lr": 0.000109753494993845, "tps": 25962, "wall": 55414.3} {"step": 21953, "train_loss": 3.2496697902679443, "lr": 0.00010973835149479139, "tps": 25961, "wall": 55419.9} {"step": 21954, "train_loss": 3.280750274658203, "lr": 0.00010972320924478772, "tps": 25959, "wall": 55425.4} {"step": 21955, "train_loss": 3.2635207176208496, "lr": 0.00010970806824400543, "tps": 25958, "wall": 55431.0} {"step": 21956, "train_loss": 3.332026958465576, "lr": 0.00010969292849261616, "tps": 25957, "wall": 55436.6} {"step": 21957, "train_loss": 3.4997549057006836, "lr": 0.00010967778999079133, "tps": 25955, "wall": 55442.2} {"step": 21958, "train_loss": 3.251408100128174, "lr": 0.00010966265273870251, "tps": 25954, "wall": 55447.8} {"step": 21959, "train_loss": 3.346442222595215, "lr": 0.00010964751673652111, "tps": 25952, "wall": 55453.4} {"step": 21960, "train_loss": 3.3959317207336426, "lr": 0.00010963238198441858, "tps": 25951, "wall": 55459.0} {"step": 21961, "train_loss": 3.256828784942627, "lr": 0.00010961724848256645, "tps": 25949, "wall": 55464.6} {"step": 21962, "train_loss": 3.234792947769165, "lr": 0.00010960211623113612, "tps": 25948, "wall": 55470.2} {"step": 21963, "train_loss": 3.370826244354248, "lr": 0.00010958698523029889, "tps": 25947, "wall": 55475.9} {"step": 21964, "train_loss": 3.3052594661712646, "lr": 0.00010957185548022634, "tps": 25945, "wall": 55481.5} {"step": 21965, "train_loss": 3.326375961303711, "lr": 0.00010955672698108977, "tps": 25944, "wall": 55487.0} {"step": 21966, "train_loss": 3.287606716156006, "lr": 0.00010954159973306052, "tps": 25942, "wall": 55492.6} {"step": 21967, "train_loss": 3.3288521766662598, "lr": 0.0001095264737363101, "tps": 25941, "wall": 55498.2} {"step": 21968, "train_loss": 3.273712635040283, "lr": 0.00010951134899100972, "tps": 25939, "wall": 55503.8} {"step": 21969, "train_loss": 3.308420181274414, "lr": 0.00010949622549733071, "tps": 25938, "wall": 55509.3} {"step": 21970, "train_loss": 3.329493761062622, "lr": 0.00010948110325544452, "tps": 25937, "wall": 55514.9} {"step": 21971, "train_loss": 3.2807655334472656, "lr": 0.00010946598226552233, "tps": 25935, "wall": 55520.5} {"step": 21972, "train_loss": 3.2145988941192627, "lr": 0.00010945086252773542, "tps": 25934, "wall": 55526.1} {"step": 21973, "train_loss": 3.3144469261169434, "lr": 0.0001094357440422552, "tps": 25932, "wall": 55531.7} {"step": 21974, "train_loss": 3.2667176723480225, "lr": 0.00010942062680925278, "tps": 25931, "wall": 55537.4} {"step": 21975, "train_loss": 3.320866107940674, "lr": 0.00010940551082889957, "tps": 25929, "wall": 55542.9} {"step": 21976, "train_loss": 3.2283496856689453, "lr": 0.00010939039610136665, "tps": 25928, "wall": 55548.5} {"step": 21977, "train_loss": 3.338974952697754, "lr": 0.0001093752826268253, "tps": 25927, "wall": 55554.1} {"step": 21978, "train_loss": 3.34956955909729, "lr": 0.00010936017040544679, "tps": 25925, "wall": 55559.6} {"step": 21979, "train_loss": 3.1709396839141846, "lr": 0.00010934505943740223, "tps": 25924, "wall": 55565.2} {"step": 21980, "train_loss": 3.246368885040283, "lr": 0.0001093299497228628, "tps": 25922, "wall": 55570.8} {"step": 21981, "train_loss": 3.2263023853302, "lr": 0.00010931484126199971, "tps": 25921, "wall": 55576.3} {"step": 21982, "train_loss": 3.2292797565460205, "lr": 0.00010929973405498413, "tps": 25919, "wall": 55581.9} {"step": 21983, "train_loss": 3.2316384315490723, "lr": 0.00010928462810198705, "tps": 25918, "wall": 55587.5} {"step": 21984, "train_loss": 3.3470005989074707, "lr": 0.00010926952340317975, "tps": 25917, "wall": 55593.1} {"step": 21985, "train_loss": 3.290677070617676, "lr": 0.00010925441995873331, "tps": 25915, "wall": 55598.8} {"step": 21986, "train_loss": 3.281466007232666, "lr": 0.00010923931776881871, "tps": 25914, "wall": 55604.3} {"step": 21987, "train_loss": 3.3225109577178955, "lr": 0.00010922421683360719, "tps": 25912, "wall": 55609.9} {"step": 21988, "train_loss": 3.2902042865753174, "lr": 0.00010920911715326974, "tps": 25911, "wall": 55615.4} {"step": 21989, "train_loss": 3.3008131980895996, "lr": 0.00010919401872797732, "tps": 25909, "wall": 55621.0} {"step": 21990, "train_loss": 3.3397021293640137, "lr": 0.00010917892155790111, "tps": 25908, "wall": 55626.6} {"step": 21991, "train_loss": 3.26035475730896, "lr": 0.00010916382564321201, "tps": 25907, "wall": 55632.1} {"step": 21992, "train_loss": 3.3056812286376953, "lr": 0.00010914873098408116, "tps": 25905, "wall": 55637.7} {"step": 21993, "train_loss": 3.261265516281128, "lr": 0.0001091336375806795, "tps": 25904, "wall": 55643.3} {"step": 21994, "train_loss": 3.2935574054718018, "lr": 0.00010911854543317788, "tps": 25902, "wall": 55648.9} {"step": 21995, "train_loss": 3.2908058166503906, "lr": 0.00010910345454174749, "tps": 25901, "wall": 55654.5} {"step": 21996, "train_loss": 3.297149419784546, "lr": 0.00010908836490655914, "tps": 25899, "wall": 55660.1} {"step": 21997, "train_loss": 3.4478187561035156, "lr": 0.00010907327652778372, "tps": 25898, "wall": 55665.7} {"step": 21998, "train_loss": 3.31648588180542, "lr": 0.00010905818940559231, "tps": 25897, "wall": 55671.3} {"step": 21999, "train_loss": 3.3051328659057617, "lr": 0.0001090431035401557, "tps": 25895, "wall": 55676.9} {"step": 22000, "train_loss": 3.2985143661499023, "lr": 0.00010902801893164487, "tps": 25894, "wall": 55682.5, "val_loss_monitor": 3.352472211589833} {"step": 22001, "train_loss": 3.261770486831665, "lr": 0.0001090129355802306, "tps": 25876, "wall": 55724.3} {"step": 22002, "train_loss": 3.316161632537842, "lr": 0.00010899785348608378, "tps": 25874, "wall": 55729.9} {"step": 22003, "train_loss": 3.2852532863616943, "lr": 0.00010898277264937531, "tps": 25873, "wall": 55735.5} {"step": 22004, "train_loss": 3.3012163639068604, "lr": 0.00010896769307027602, "tps": 25871, "wall": 55741.1} {"step": 22005, "train_loss": 3.208733320236206, "lr": 0.00010895261474895661, "tps": 25870, "wall": 55746.7} {"step": 22006, "train_loss": 3.2134687900543213, "lr": 0.00010893753768558807, "tps": 25868, "wall": 55752.4} {"step": 22007, "train_loss": 3.413799524307251, "lr": 0.0001089224618803411, "tps": 25867, "wall": 55758.1} {"step": 22008, "train_loss": 3.386536121368408, "lr": 0.00010890738733338644, "tps": 25865, "wall": 55763.7} {"step": 22009, "train_loss": 3.2707061767578125, "lr": 0.00010889231404489497, "tps": 25864, "wall": 55769.4} {"step": 22010, "train_loss": 3.2755861282348633, "lr": 0.00010887724201503737, "tps": 25863, "wall": 55775.1} {"step": 22011, "train_loss": 3.2418887615203857, "lr": 0.00010886217124398434, "tps": 25861, "wall": 55780.7} {"step": 22012, "train_loss": 3.2832999229431152, "lr": 0.00010884710173190668, "tps": 25860, "wall": 55786.4} {"step": 22013, "train_loss": 3.2739617824554443, "lr": 0.0001088320334789751, "tps": 25858, "wall": 55792.1} {"step": 22014, "train_loss": 3.3916938304901123, "lr": 0.00010881696648536018, "tps": 25857, "wall": 55797.7} {"step": 22015, "train_loss": 3.292776584625244, "lr": 0.00010880190075123273, "tps": 25855, "wall": 55803.3} {"step": 22016, "train_loss": 3.3282551765441895, "lr": 0.00010878683627676332, "tps": 25854, "wall": 55808.9} {"step": 22017, "train_loss": 3.2244348526000977, "lr": 0.00010877177306212269, "tps": 25852, "wall": 55814.6} {"step": 22018, "train_loss": 3.294318675994873, "lr": 0.00010875671110748145, "tps": 25851, "wall": 55820.2} {"step": 22019, "train_loss": 3.231400489807129, "lr": 0.00010874165041301015, "tps": 25850, "wall": 55825.8} {"step": 22020, "train_loss": 3.3388900756835938, "lr": 0.0001087265909788795, "tps": 25848, "wall": 55831.4} {"step": 22021, "train_loss": 3.271120071411133, "lr": 0.00010871153280526, "tps": 25847, "wall": 55837.1} {"step": 22022, "train_loss": 3.355311870574951, "lr": 0.00010869647589232228, "tps": 25845, "wall": 55842.8} {"step": 22023, "train_loss": 3.2448434829711914, "lr": 0.00010868142024023695, "tps": 25844, "wall": 55848.4} {"step": 22024, "train_loss": 3.2974581718444824, "lr": 0.00010866636584917452, "tps": 25842, "wall": 55854.0} {"step": 22025, "train_loss": 3.277510166168213, "lr": 0.00010865131271930545, "tps": 25841, "wall": 55859.6} {"step": 22026, "train_loss": 3.239722728729248, "lr": 0.00010863626085080039, "tps": 25840, "wall": 55865.2} {"step": 22027, "train_loss": 3.244016170501709, "lr": 0.00010862121024382978, "tps": 25838, "wall": 55870.9} {"step": 22028, "train_loss": 3.313537836074829, "lr": 0.00010860616089856411, "tps": 25837, "wall": 55876.5} {"step": 22029, "train_loss": 3.232515811920166, "lr": 0.00010859111281517389, "tps": 25835, "wall": 55882.1} {"step": 22030, "train_loss": 3.2574989795684814, "lr": 0.0001085760659938296, "tps": 25834, "wall": 55887.8} {"step": 22031, "train_loss": 3.3310537338256836, "lr": 0.00010856102043470157, "tps": 25832, "wall": 55893.5} {"step": 22032, "train_loss": 3.3320159912109375, "lr": 0.0001085459761379604, "tps": 25831, "wall": 55899.1} {"step": 22033, "train_loss": 3.353959321975708, "lr": 0.00010853093310377645, "tps": 25830, "wall": 55904.7} {"step": 22034, "train_loss": 3.3350133895874023, "lr": 0.00010851589133232007, "tps": 25828, "wall": 55910.4} {"step": 22035, "train_loss": 3.223235607147217, "lr": 0.00010850085082376175, "tps": 25827, "wall": 55915.9} {"step": 22036, "train_loss": 3.3394436836242676, "lr": 0.00010848581157827178, "tps": 25825, "wall": 55921.5} {"step": 22037, "train_loss": 3.18983793258667, "lr": 0.0001084707735960206, "tps": 25824, "wall": 55927.2} {"step": 22038, "train_loss": 3.2240185737609863, "lr": 0.00010845573687717854, "tps": 25822, "wall": 55932.8} {"step": 22039, "train_loss": 3.3034679889678955, "lr": 0.0001084407014219159, "tps": 25821, "wall": 55938.4} {"step": 22040, "train_loss": 3.2690799236297607, "lr": 0.00010842566723040306, "tps": 25820, "wall": 55944.0} {"step": 22041, "train_loss": 3.25526762008667, "lr": 0.00010841063430281028, "tps": 25818, "wall": 55949.6} {"step": 22042, "train_loss": 3.3512468338012695, "lr": 0.00010839560263930786, "tps": 25817, "wall": 55955.3} {"step": 22043, "train_loss": 3.3119473457336426, "lr": 0.0001083805722400661, "tps": 25815, "wall": 55960.8} {"step": 22044, "train_loss": 3.1154017448425293, "lr": 0.00010836554310525529, "tps": 25814, "wall": 55966.4} {"step": 22045, "train_loss": 3.301865577697754, "lr": 0.0001083505152350456, "tps": 25813, "wall": 55972.0} {"step": 22046, "train_loss": 3.2598953247070312, "lr": 0.00010833548862960734, "tps": 25811, "wall": 55977.6} {"step": 22047, "train_loss": 3.2793874740600586, "lr": 0.00010832046328911072, "tps": 25810, "wall": 55983.2} {"step": 22048, "train_loss": 3.312936544418335, "lr": 0.00010830543921372584, "tps": 25808, "wall": 55988.8} {"step": 22049, "train_loss": 3.3567893505096436, "lr": 0.0001082904164036231, "tps": 25807, "wall": 55994.4} {"step": 22050, "train_loss": 3.2819554805755615, "lr": 0.00010827539485897253, "tps": 25806, "wall": 55999.9} {"step": 22051, "train_loss": 3.4311037063598633, "lr": 0.00010826037457994429, "tps": 25804, "wall": 56005.5} {"step": 22052, "train_loss": 3.360621929168701, "lr": 0.00010824535556670865, "tps": 25803, "wall": 56011.0} {"step": 22053, "train_loss": 3.2484939098358154, "lr": 0.00010823033781943559, "tps": 25801, "wall": 56016.7} {"step": 22054, "train_loss": 3.2805092334747314, "lr": 0.00010821532133829535, "tps": 25800, "wall": 56022.3} {"step": 22055, "train_loss": 3.274700880050659, "lr": 0.00010820030612345802, "tps": 25798, "wall": 56027.9} {"step": 22056, "train_loss": 3.261486053466797, "lr": 0.00010818529217509362, "tps": 25797, "wall": 56033.5} {"step": 22057, "train_loss": 3.31211519241333, "lr": 0.00010817027949337231, "tps": 25796, "wall": 56039.0} {"step": 22058, "train_loss": 3.2245898246765137, "lr": 0.00010815526807846414, "tps": 25794, "wall": 56044.6} {"step": 22059, "train_loss": 3.2318243980407715, "lr": 0.00010814025793053906, "tps": 25793, "wall": 56050.2} {"step": 22060, "train_loss": 3.3090827465057373, "lr": 0.00010812524904976729, "tps": 25792, "wall": 56055.7} {"step": 22061, "train_loss": 3.327146053314209, "lr": 0.00010811024143631874, "tps": 25790, "wall": 56061.3} {"step": 22062, "train_loss": 3.325889825820923, "lr": 0.00010809523509036333, "tps": 25789, "wall": 56066.9} {"step": 22063, "train_loss": 3.3332810401916504, "lr": 0.00010808023001207123, "tps": 25787, "wall": 56072.5} {"step": 22064, "train_loss": 3.2488136291503906, "lr": 0.00010806522620161236, "tps": 25786, "wall": 56078.1} {"step": 22065, "train_loss": 3.396484851837158, "lr": 0.00010805022365915661, "tps": 25784, "wall": 56083.7} {"step": 22066, "train_loss": 3.395205020904541, "lr": 0.000108035222384874, "tps": 25783, "wall": 56089.3} {"step": 22067, "train_loss": 3.3032760620117188, "lr": 0.00010802022237893448, "tps": 25782, "wall": 56094.9} {"step": 22068, "train_loss": 3.2416765689849854, "lr": 0.00010800522364150787, "tps": 25780, "wall": 56100.5} {"step": 22069, "train_loss": 3.2256557941436768, "lr": 0.00010799022617276422, "tps": 25779, "wall": 56106.0} {"step": 22070, "train_loss": 3.3015739917755127, "lr": 0.00010797522997287326, "tps": 25778, "wall": 56111.5} {"step": 22071, "train_loss": 3.3193633556365967, "lr": 0.00010796023504200503, "tps": 25776, "wall": 56117.1} {"step": 22072, "train_loss": 3.2113609313964844, "lr": 0.00010794524138032934, "tps": 25775, "wall": 56122.7} {"step": 22073, "train_loss": 3.2472174167633057, "lr": 0.00010793024898801592, "tps": 25773, "wall": 56128.2} {"step": 22074, "train_loss": 3.2702929973602295, "lr": 0.00010791525786523478, "tps": 25772, "wall": 56133.8} {"step": 22075, "train_loss": 3.3676278591156006, "lr": 0.00010790026801215565, "tps": 25771, "wall": 56139.4} {"step": 22076, "train_loss": 3.422020435333252, "lr": 0.00010788527942894831, "tps": 25769, "wall": 56144.9} {"step": 22077, "train_loss": 3.1973788738250732, "lr": 0.00010787029211578264, "tps": 25768, "wall": 56150.5} {"step": 22078, "train_loss": 3.3138504028320312, "lr": 0.00010785530607282837, "tps": 25766, "wall": 56156.1} {"step": 22079, "train_loss": 3.380358934402466, "lr": 0.00010784032130025518, "tps": 25765, "wall": 56161.6} {"step": 22080, "train_loss": 3.4180517196655273, "lr": 0.00010782533779823298, "tps": 25764, "wall": 56167.2} {"step": 22081, "train_loss": 3.312897205352783, "lr": 0.00010781035556693142, "tps": 25762, "wall": 56172.7} {"step": 22082, "train_loss": 3.3953957557678223, "lr": 0.00010779537460652015, "tps": 25761, "wall": 56178.3} {"step": 22083, "train_loss": 3.2767462730407715, "lr": 0.00010778039491716905, "tps": 25760, "wall": 56183.9} {"step": 22084, "train_loss": 3.33327317237854, "lr": 0.00010776541649904766, "tps": 25758, "wall": 56189.5} {"step": 22085, "train_loss": 3.2704555988311768, "lr": 0.00010775043935232566, "tps": 25757, "wall": 56195.2} {"step": 22086, "train_loss": 3.2904887199401855, "lr": 0.00010773546347717278, "tps": 25755, "wall": 56200.7} {"step": 22087, "train_loss": 3.2589802742004395, "lr": 0.00010772048887375867, "tps": 25754, "wall": 56206.3} {"step": 22088, "train_loss": 3.191646099090576, "lr": 0.0001077055155422529, "tps": 25753, "wall": 56211.8} {"step": 22089, "train_loss": 3.2189157009124756, "lr": 0.00010769054348282517, "tps": 25751, "wall": 56217.4} {"step": 22090, "train_loss": 3.2260079383850098, "lr": 0.00010767557269564499, "tps": 25750, "wall": 56223.0} {"step": 22091, "train_loss": 3.218303680419922, "lr": 0.00010766060318088203, "tps": 25748, "wall": 56228.6} {"step": 22092, "train_loss": 3.2627525329589844, "lr": 0.00010764563493870585, "tps": 25747, "wall": 56234.1} {"step": 22093, "train_loss": 3.3634133338928223, "lr": 0.00010763066796928592, "tps": 25746, "wall": 56239.7} {"step": 22094, "train_loss": 3.304100751876831, "lr": 0.00010761570227279194, "tps": 25744, "wall": 56245.2} {"step": 22095, "train_loss": 3.303191661834717, "lr": 0.00010760073784939337, "tps": 25743, "wall": 56250.8} {"step": 22096, "train_loss": 3.2820332050323486, "lr": 0.00010758577469925964, "tps": 25741, "wall": 56256.4} {"step": 22097, "train_loss": 3.229748249053955, "lr": 0.00010757081282256043, "tps": 25740, "wall": 56262.0} {"step": 22098, "train_loss": 3.292271137237549, "lr": 0.00010755585221946512, "tps": 25739, "wall": 56267.6} {"step": 22099, "train_loss": 3.277686834335327, "lr": 0.00010754089289014313, "tps": 25737, "wall": 56273.1} {"step": 22100, "train_loss": 3.371061325073242, "lr": 0.00010752593483476403, "tps": 25736, "wall": 56278.7} {"step": 22101, "train_loss": 3.240725517272949, "lr": 0.00010751097805349726, "tps": 25735, "wall": 56284.3} {"step": 22102, "train_loss": 3.3516602516174316, "lr": 0.00010749602254651214, "tps": 25733, "wall": 56289.9} {"step": 22103, "train_loss": 3.2475709915161133, "lr": 0.00010748106831397822, "tps": 25732, "wall": 56296.0} {"step": 22104, "train_loss": 3.236112117767334, "lr": 0.00010746611535606486, "tps": 25730, "wall": 56302.0} {"step": 22105, "train_loss": 3.375908613204956, "lr": 0.00010745116367294137, "tps": 25729, "wall": 56307.6} {"step": 22106, "train_loss": 3.373332977294922, "lr": 0.00010743621326477722, "tps": 25727, "wall": 56313.3} {"step": 22107, "train_loss": 3.295923948287964, "lr": 0.00010742126413174172, "tps": 25726, "wall": 56318.9} {"step": 22108, "train_loss": 3.2869114875793457, "lr": 0.00010740631627400425, "tps": 25724, "wall": 56324.5} {"step": 22109, "train_loss": 3.3534069061279297, "lr": 0.00010739136969173415, "tps": 25723, "wall": 56330.0} {"step": 22110, "train_loss": 3.232318639755249, "lr": 0.00010737642438510063, "tps": 25722, "wall": 56335.6} {"step": 22111, "train_loss": 3.307647228240967, "lr": 0.00010736148035427314, "tps": 25720, "wall": 56341.2} {"step": 22112, "train_loss": 3.1692216396331787, "lr": 0.00010734653759942088, "tps": 25719, "wall": 56346.8} {"step": 22113, "train_loss": 3.228482723236084, "lr": 0.00010733159612071309, "tps": 25717, "wall": 56352.3} {"step": 22114, "train_loss": 3.2728962898254395, "lr": 0.00010731665591831912, "tps": 25716, "wall": 56357.9} {"step": 22115, "train_loss": 3.258565902709961, "lr": 0.00010730171699240816, "tps": 25715, "wall": 56363.5} {"step": 22116, "train_loss": 3.344489812850952, "lr": 0.00010728677934314944, "tps": 25713, "wall": 56369.1} {"step": 22117, "train_loss": 3.4447643756866455, "lr": 0.00010727184297071218, "tps": 25712, "wall": 56374.8} {"step": 22118, "train_loss": 3.2512922286987305, "lr": 0.00010725690787526561, "tps": 25710, "wall": 56380.4} {"step": 22119, "train_loss": 3.245168685913086, "lr": 0.00010724197405697882, "tps": 25709, "wall": 56386.0} {"step": 22120, "train_loss": 3.363342046737671, "lr": 0.0001072270415160211, "tps": 25708, "wall": 56391.5} {"step": 22121, "train_loss": 3.364872932434082, "lr": 0.00010721211025256157, "tps": 25706, "wall": 56397.1} {"step": 22122, "train_loss": 3.401576519012451, "lr": 0.00010719718026676928, "tps": 25705, "wall": 56402.7} {"step": 22123, "train_loss": 3.334956169128418, "lr": 0.0001071822515588135, "tps": 25703, "wall": 56408.3} {"step": 22124, "train_loss": 3.3894858360290527, "lr": 0.00010716732412886323, "tps": 25702, "wall": 56413.9} {"step": 22125, "train_loss": 3.2358713150024414, "lr": 0.00010715239797708767, "tps": 25701, "wall": 56419.4} {"step": 22126, "train_loss": 3.226254940032959, "lr": 0.00010713747310365585, "tps": 25699, "wall": 56425.0} {"step": 22127, "train_loss": 3.2627170085906982, "lr": 0.00010712254950873677, "tps": 25698, "wall": 56430.7} {"step": 22128, "train_loss": 3.363016366958618, "lr": 0.00010710762719249963, "tps": 25697, "wall": 56436.3} {"step": 22129, "train_loss": 3.3572614192962646, "lr": 0.0001070927061551134, "tps": 25695, "wall": 56441.9} {"step": 22130, "train_loss": 3.4596686363220215, "lr": 0.00010707778639674704, "tps": 25694, "wall": 56447.5} {"step": 22131, "train_loss": 3.344959020614624, "lr": 0.00010706286791756968, "tps": 25692, "wall": 56453.0} {"step": 22132, "train_loss": 3.176809072494507, "lr": 0.00010704795071775025, "tps": 25691, "wall": 56458.6} {"step": 22133, "train_loss": 3.308588981628418, "lr": 0.0001070330347974577, "tps": 25690, "wall": 56464.2} {"step": 22134, "train_loss": 3.2269017696380615, "lr": 0.0001070181201568611, "tps": 25688, "wall": 56469.8} {"step": 22135, "train_loss": 3.3008415699005127, "lr": 0.00010700320679612934, "tps": 25687, "wall": 56475.4} {"step": 22136, "train_loss": 3.2184925079345703, "lr": 0.0001069882947154313, "tps": 25686, "wall": 56480.9} {"step": 22137, "train_loss": 3.3859190940856934, "lr": 0.00010697338391493605, "tps": 25684, "wall": 56486.6} {"step": 22138, "train_loss": 3.2999684810638428, "lr": 0.00010695847439481243, "tps": 25683, "wall": 56492.2} {"step": 22139, "train_loss": 3.353336811065674, "lr": 0.00010694356615522925, "tps": 25681, "wall": 56497.8} {"step": 22140, "train_loss": 3.2121200561523438, "lr": 0.00010692865919635555, "tps": 25680, "wall": 56503.4} {"step": 22141, "train_loss": 3.2960433959960938, "lr": 0.0001069137535183601, "tps": 25679, "wall": 56509.0} {"step": 22142, "train_loss": 3.26353120803833, "lr": 0.00010689884912141168, "tps": 25677, "wall": 56514.6} {"step": 22143, "train_loss": 3.1830780506134033, "lr": 0.00010688394600567932, "tps": 25676, "wall": 56520.2} {"step": 22144, "train_loss": 3.360572338104248, "lr": 0.00010686904417133168, "tps": 25674, "wall": 56525.8} {"step": 22145, "train_loss": 3.275304079055786, "lr": 0.00010685414361853765, "tps": 25673, "wall": 56531.3} {"step": 22146, "train_loss": 3.313957452774048, "lr": 0.00010683924434746602, "tps": 25672, "wall": 56536.9} {"step": 22147, "train_loss": 3.191774368286133, "lr": 0.00010682434635828548, "tps": 25670, "wall": 56542.5} {"step": 22148, "train_loss": 3.3481321334838867, "lr": 0.00010680944965116495, "tps": 25669, "wall": 56548.1} {"step": 22149, "train_loss": 3.2224626541137695, "lr": 0.00010679455422627309, "tps": 25668, "wall": 56553.8} {"step": 22150, "train_loss": 3.307878017425537, "lr": 0.00010677966008377857, "tps": 25666, "wall": 56559.3} {"step": 22151, "train_loss": 3.257746696472168, "lr": 0.00010676476722385027, "tps": 25665, "wall": 56564.9} {"step": 22152, "train_loss": 3.402446746826172, "lr": 0.00010674987564665679, "tps": 25663, "wall": 56570.5} {"step": 22153, "train_loss": 3.361400604248047, "lr": 0.00010673498535236681, "tps": 25662, "wall": 56576.1} {"step": 22154, "train_loss": 3.218503475189209, "lr": 0.00010672009634114908, "tps": 25661, "wall": 56581.7} {"step": 22155, "train_loss": 3.3180630207061768, "lr": 0.00010670520861317223, "tps": 25659, "wall": 56587.3} {"step": 22156, "train_loss": 3.3955864906311035, "lr": 0.00010669032216860486, "tps": 25658, "wall": 56592.9} {"step": 22157, "train_loss": 3.2346959114074707, "lr": 0.00010667543700761573, "tps": 25656, "wall": 56598.5} {"step": 22158, "train_loss": 3.268306016921997, "lr": 0.00010666055313037333, "tps": 25655, "wall": 56604.1} {"step": 22159, "train_loss": 3.339244842529297, "lr": 0.00010664567053704626, "tps": 25654, "wall": 56609.7} {"step": 22160, "train_loss": 3.4049313068389893, "lr": 0.00010663078922780326, "tps": 25652, "wall": 56615.3} {"step": 22161, "train_loss": 3.293417453765869, "lr": 0.00010661590920281275, "tps": 25651, "wall": 56620.9} {"step": 22162, "train_loss": 3.212519884109497, "lr": 0.0001066010304622434, "tps": 25650, "wall": 56626.5} {"step": 22163, "train_loss": 3.431889057159424, "lr": 0.00010658615300626372, "tps": 25648, "wall": 56632.0} {"step": 22164, "train_loss": 3.232227325439453, "lr": 0.00010657127683504216, "tps": 25647, "wall": 56637.6} {"step": 22165, "train_loss": 3.269554853439331, "lr": 0.00010655640194874739, "tps": 25645, "wall": 56643.2} {"step": 22166, "train_loss": 3.2228968143463135, "lr": 0.00010654152834754781, "tps": 25644, "wall": 56648.8} {"step": 22167, "train_loss": 3.339768171310425, "lr": 0.00010652665603161189, "tps": 25643, "wall": 56654.4} {"step": 22168, "train_loss": 3.3723456859588623, "lr": 0.00010651178500110828, "tps": 25641, "wall": 56660.0} {"step": 22169, "train_loss": 3.2486608028411865, "lr": 0.00010649691525620518, "tps": 25640, "wall": 56665.6} {"step": 22170, "train_loss": 3.253622055053711, "lr": 0.00010648204679707124, "tps": 25639, "wall": 56671.1} {"step": 22171, "train_loss": 3.378648281097412, "lr": 0.0001064671796238748, "tps": 25637, "wall": 56676.8} {"step": 22172, "train_loss": 3.281205177307129, "lr": 0.00010645231373678421, "tps": 25636, "wall": 56682.4} {"step": 22173, "train_loss": 3.307429075241089, "lr": 0.00010643744913596805, "tps": 25635, "wall": 56687.9} {"step": 22174, "train_loss": 3.2415754795074463, "lr": 0.0001064225858215946, "tps": 25633, "wall": 56693.5} {"step": 22175, "train_loss": 3.2341294288635254, "lr": 0.00010640772379383215, "tps": 25632, "wall": 56699.1} {"step": 22176, "train_loss": 3.331301689147949, "lr": 0.00010639286305284926, "tps": 25630, "wall": 56704.7} {"step": 22177, "train_loss": 3.3572888374328613, "lr": 0.00010637800359881414, "tps": 25629, "wall": 56710.3} {"step": 22178, "train_loss": 3.3099868297576904, "lr": 0.00010636314543189505, "tps": 25628, "wall": 56715.9} {"step": 22179, "train_loss": 3.2831692695617676, "lr": 0.00010634828855226051, "tps": 25626, "wall": 56721.4} {"step": 22180, "train_loss": 3.280484676361084, "lr": 0.00010633343296007869, "tps": 25625, "wall": 56727.0} {"step": 22181, "train_loss": 3.2051706314086914, "lr": 0.00010631857865551782, "tps": 25624, "wall": 56732.5} {"step": 22182, "train_loss": 3.2527222633361816, "lr": 0.00010630372563874629, "tps": 25622, "wall": 56738.2} {"step": 22183, "train_loss": 3.249501943588257, "lr": 0.00010628887390993232, "tps": 25621, "wall": 56743.7} {"step": 22184, "train_loss": 3.2121949195861816, "lr": 0.00010627402346924409, "tps": 25620, "wall": 56749.3} {"step": 22185, "train_loss": 3.371063232421875, "lr": 0.00010625917431684994, "tps": 25618, "wall": 56754.8} {"step": 22186, "train_loss": 3.3480961322784424, "lr": 0.00010624432645291793, "tps": 25617, "wall": 56760.3} {"step": 22187, "train_loss": 3.225834846496582, "lr": 0.00010622947987761642, "tps": 25615, "wall": 56765.9} {"step": 22188, "train_loss": 3.3212852478027344, "lr": 0.0001062146345911135, "tps": 25614, "wall": 56771.5} {"step": 22189, "train_loss": 3.4128987789154053, "lr": 0.0001061997905935773, "tps": 25613, "wall": 56777.0} {"step": 22190, "train_loss": 3.250723361968994, "lr": 0.0001061849478851761, "tps": 25611, "wall": 56782.5} {"step": 22191, "train_loss": 3.179311513900757, "lr": 0.00010617010646607797, "tps": 25610, "wall": 56788.1} {"step": 22192, "train_loss": 3.263434648513794, "lr": 0.00010615526633645097, "tps": 25609, "wall": 56793.8} {"step": 22193, "train_loss": 3.345409631729126, "lr": 0.00010614042749646333, "tps": 25607, "wall": 56799.4} {"step": 22194, "train_loss": 3.297426700592041, "lr": 0.00010612558994628307, "tps": 25606, "wall": 56805.0} {"step": 22195, "train_loss": 3.2224678993225098, "lr": 0.00010611075368607824, "tps": 25605, "wall": 56810.5} {"step": 22196, "train_loss": 3.4072978496551514, "lr": 0.000106095918716017, "tps": 25603, "wall": 56816.0} {"step": 22197, "train_loss": 3.3229854106903076, "lr": 0.00010608108503626739, "tps": 25602, "wall": 56821.6} {"step": 22198, "train_loss": 3.3044443130493164, "lr": 0.00010606625264699733, "tps": 25601, "wall": 56827.1} {"step": 22199, "train_loss": 3.216510772705078, "lr": 0.000106051421548375, "tps": 25599, "wall": 56832.7} {"step": 22200, "train_loss": 3.252185344696045, "lr": 0.0001060365917405683, "tps": 25598, "wall": 56838.2} {"step": 22201, "train_loss": 3.2731921672821045, "lr": 0.00010602176322374522, "tps": 25597, "wall": 56843.7} {"step": 22202, "train_loss": 3.317969799041748, "lr": 0.00010600693599807381, "tps": 25595, "wall": 56849.3} {"step": 22203, "train_loss": 3.3083178997039795, "lr": 0.00010599211006372196, "tps": 25594, "wall": 56855.0} {"step": 22204, "train_loss": 3.323702096939087, "lr": 0.0001059772854208577, "tps": 25592, "wall": 56860.5} {"step": 22205, "train_loss": 3.268124580383301, "lr": 0.00010596246206964893, "tps": 25591, "wall": 56866.1} {"step": 22206, "train_loss": 3.2463183403015137, "lr": 0.00010594764001026349, "tps": 25590, "wall": 56871.7} {"step": 22207, "train_loss": 3.2394373416900635, "lr": 0.00010593281924286941, "tps": 25588, "wall": 56877.2} {"step": 22208, "train_loss": 3.243642807006836, "lr": 0.00010591799976763455, "tps": 25587, "wall": 56882.8} {"step": 22209, "train_loss": 3.3832249641418457, "lr": 0.00010590318158472667, "tps": 25586, "wall": 56888.3} {"step": 22210, "train_loss": 3.2983815670013428, "lr": 0.0001058883646943138, "tps": 25584, "wall": 56893.9} {"step": 22211, "train_loss": 3.3163504600524902, "lr": 0.0001058735490965637, "tps": 25583, "wall": 56899.5} {"step": 22212, "train_loss": 3.1754093170166016, "lr": 0.00010585873479164417, "tps": 25582, "wall": 56905.1} {"step": 22213, "train_loss": 3.3501343727111816, "lr": 0.00010584392177972309, "tps": 25580, "wall": 56910.6} {"step": 22214, "train_loss": 3.1736161708831787, "lr": 0.00010582911006096825, "tps": 25579, "wall": 56916.3} {"step": 22215, "train_loss": 3.3354153633117676, "lr": 0.00010581429963554736, "tps": 25578, "wall": 56921.8} {"step": 22216, "train_loss": 3.3403007984161377, "lr": 0.00010579949050362836, "tps": 25576, "wall": 56927.4} {"step": 22217, "train_loss": 3.2872352600097656, "lr": 0.00010578468266537889, "tps": 25575, "wall": 56933.0} {"step": 22218, "train_loss": 3.3299922943115234, "lr": 0.00010576987612096662, "tps": 25573, "wall": 56938.5} {"step": 22219, "train_loss": 3.277647018432617, "lr": 0.0001057550708705595, "tps": 25572, "wall": 56944.1} {"step": 22220, "train_loss": 3.224262237548828, "lr": 0.00010574026691432507, "tps": 25571, "wall": 56949.6} {"step": 22221, "train_loss": 3.241734027862549, "lr": 0.00010572546425243102, "tps": 25569, "wall": 56955.2} {"step": 22222, "train_loss": 3.3117613792419434, "lr": 0.00010571066288504517, "tps": 25568, "wall": 56960.7} {"step": 22223, "train_loss": 3.260756015777588, "lr": 0.00010569586281233503, "tps": 25567, "wall": 56966.3} {"step": 22224, "train_loss": 3.264188051223755, "lr": 0.00010568106403446845, "tps": 25565, "wall": 56971.9} {"step": 22225, "train_loss": 3.32761287689209, "lr": 0.00010566626655161291, "tps": 25564, "wall": 56977.5} {"step": 22226, "train_loss": 3.196227550506592, "lr": 0.00010565147036393606, "tps": 25563, "wall": 56983.1} {"step": 22227, "train_loss": 3.2323496341705322, "lr": 0.00010563667547160556, "tps": 25561, "wall": 56988.6} {"step": 22228, "train_loss": 3.1673734188079834, "lr": 0.00010562188187478902, "tps": 25560, "wall": 56994.2} {"step": 22229, "train_loss": 3.260430097579956, "lr": 0.00010560708957365392, "tps": 25559, "wall": 56999.8} {"step": 22230, "train_loss": 3.3025288581848145, "lr": 0.00010559229856836795, "tps": 25557, "wall": 57005.3} {"step": 22231, "train_loss": 3.36082124710083, "lr": 0.00010557750885909863, "tps": 25556, "wall": 57010.8} {"step": 22232, "train_loss": 3.3848655223846436, "lr": 0.00010556272044601341, "tps": 25555, "wall": 57016.4} {"step": 22233, "train_loss": 3.3539786338806152, "lr": 0.00010554793332927995, "tps": 25553, "wall": 57021.9} {"step": 22234, "train_loss": 3.3075673580169678, "lr": 0.00010553314750906569, "tps": 25552, "wall": 57027.5} {"step": 22235, "train_loss": 3.2110323905944824, "lr": 0.00010551836298553807, "tps": 25551, "wall": 57033.0} {"step": 22236, "train_loss": 3.3885293006896973, "lr": 0.00010550357975886466, "tps": 25549, "wall": 57038.7} {"step": 22237, "train_loss": 3.3428821563720703, "lr": 0.00010548879782921291, "tps": 25548, "wall": 57044.2} {"step": 22238, "train_loss": 3.2864019870758057, "lr": 0.00010547401719675021, "tps": 25547, "wall": 57049.8} {"step": 22239, "train_loss": 3.1823225021362305, "lr": 0.00010545923786164409, "tps": 25545, "wall": 57055.4} {"step": 22240, "train_loss": 3.253052234649658, "lr": 0.00010544445982406186, "tps": 25544, "wall": 57060.9} {"step": 22241, "train_loss": 3.3807053565979004, "lr": 0.00010542968308417105, "tps": 25543, "wall": 57066.5} {"step": 22242, "train_loss": 3.195413589477539, "lr": 0.00010541490764213896, "tps": 25541, "wall": 57072.1} {"step": 22243, "train_loss": 3.2749249935150146, "lr": 0.00010540013349813299, "tps": 25540, "wall": 57077.6} {"step": 22244, "train_loss": 3.3533620834350586, "lr": 0.00010538536065232052, "tps": 25539, "wall": 57083.1} {"step": 22245, "train_loss": 3.275435209274292, "lr": 0.00010537058910486889, "tps": 25537, "wall": 57088.7} {"step": 22246, "train_loss": 3.200279951095581, "lr": 0.00010535581885594537, "tps": 25536, "wall": 57094.4} {"step": 22247, "train_loss": 3.292673110961914, "lr": 0.00010534104990571738, "tps": 25534, "wall": 57099.9} {"step": 22248, "train_loss": 3.223083972930908, "lr": 0.00010532628225435224, "tps": 25533, "wall": 57105.5} {"step": 22249, "train_loss": 3.447784423828125, "lr": 0.00010531151590201707, "tps": 25532, "wall": 57111.0} {"step": 22250, "train_loss": 3.373555898666382, "lr": 0.00010529675084887932, "tps": 25530, "wall": 57116.6} {"step": 22251, "train_loss": 3.3239760398864746, "lr": 0.0001052819870951062, "tps": 25529, "wall": 57122.1} {"step": 22252, "train_loss": 3.299849033355713, "lr": 0.00010526722464086485, "tps": 25528, "wall": 57127.7} {"step": 22253, "train_loss": 3.2293758392333984, "lr": 0.00010525246348632265, "tps": 25526, "wall": 57133.3} {"step": 22254, "train_loss": 3.3911585807800293, "lr": 0.00010523770363164676, "tps": 25525, "wall": 57138.9} {"step": 22255, "train_loss": 3.333616256713867, "lr": 0.00010522294507700432, "tps": 25524, "wall": 57144.4} {"step": 22256, "train_loss": 3.3057141304016113, "lr": 0.00010520818782256261, "tps": 25522, "wall": 57150.0} {"step": 22257, "train_loss": 3.357548236846924, "lr": 0.00010519343186848872, "tps": 25521, "wall": 57155.6} {"step": 22258, "train_loss": 3.200349807739258, "lr": 0.00010517867721494989, "tps": 25520, "wall": 57161.2} {"step": 22259, "train_loss": 3.3702259063720703, "lr": 0.00010516392386211322, "tps": 25518, "wall": 57166.7} {"step": 22260, "train_loss": 3.3102078437805176, "lr": 0.00010514917181014576, "tps": 25517, "wall": 57172.3} {"step": 22261, "train_loss": 3.3351521492004395, "lr": 0.00010513442105921476, "tps": 25516, "wall": 57177.9} {"step": 22262, "train_loss": 3.2963192462921143, "lr": 0.00010511967160948726, "tps": 25514, "wall": 57183.5} {"step": 22263, "train_loss": 3.23795747756958, "lr": 0.00010510492346113028, "tps": 25513, "wall": 57189.0} {"step": 22264, "train_loss": 3.3616373538970947, "lr": 0.000105090176614311, "tps": 25512, "wall": 57194.5} {"step": 22265, "train_loss": 3.235340118408203, "lr": 0.00010507543106919642, "tps": 25510, "wall": 57200.1} {"step": 22266, "train_loss": 3.292158842086792, "lr": 0.00010506068682595347, "tps": 25509, "wall": 57205.7} {"step": 22267, "train_loss": 3.258881092071533, "lr": 0.0001050459438847494, "tps": 25508, "wall": 57211.2} {"step": 22268, "train_loss": 3.1993374824523926, "lr": 0.00010503120224575108, "tps": 25506, "wall": 57216.9} {"step": 22269, "train_loss": 3.3078861236572266, "lr": 0.00010501646190912544, "tps": 25505, "wall": 57222.5} {"step": 22270, "train_loss": 3.2534821033477783, "lr": 0.0001050017228750396, "tps": 25504, "wall": 57228.0} {"step": 22271, "train_loss": 3.275132894515991, "lr": 0.0001049869851436605, "tps": 25502, "wall": 57233.6} {"step": 22272, "train_loss": 3.3241987228393555, "lr": 0.00010497224871515494, "tps": 25501, "wall": 57239.1} {"step": 22273, "train_loss": 3.317990303039551, "lr": 0.00010495751358969008, "tps": 25500, "wall": 57244.7} {"step": 22274, "train_loss": 3.2822396755218506, "lr": 0.0001049427797674327, "tps": 25498, "wall": 57250.2} {"step": 22275, "train_loss": 3.2903854846954346, "lr": 0.00010492804724854967, "tps": 25497, "wall": 57255.8} {"step": 22276, "train_loss": 3.314113140106201, "lr": 0.00010491331603320804, "tps": 25496, "wall": 57261.3} {"step": 22277, "train_loss": 3.268657684326172, "lr": 0.0001048985861215745, "tps": 25494, "wall": 57266.9} {"step": 22278, "train_loss": 3.4022984504699707, "lr": 0.00010488385751381609, "tps": 25493, "wall": 57272.4} {"step": 22279, "train_loss": 3.3158090114593506, "lr": 0.00010486913021009954, "tps": 25492, "wall": 57278.1} {"step": 22280, "train_loss": 3.1991851329803467, "lr": 0.00010485440421059167, "tps": 25490, "wall": 57283.6} {"step": 22281, "train_loss": 3.268303632736206, "lr": 0.00010483967951545941, "tps": 25489, "wall": 57289.2} {"step": 22282, "train_loss": 3.1810386180877686, "lr": 0.00010482495612486946, "tps": 25488, "wall": 57294.8} {"step": 22283, "train_loss": 3.2818145751953125, "lr": 0.0001048102340389886, "tps": 25486, "wall": 57300.3} {"step": 22284, "train_loss": 3.3618459701538086, "lr": 0.0001047955132579837, "tps": 25485, "wall": 57305.9} {"step": 22285, "train_loss": 3.1747336387634277, "lr": 0.00010478079378202146, "tps": 25484, "wall": 57311.5} {"step": 22286, "train_loss": 3.308901309967041, "lr": 0.00010476607561126854, "tps": 25482, "wall": 57317.0} {"step": 22287, "train_loss": 3.3350658416748047, "lr": 0.00010475135874589181, "tps": 25481, "wall": 57322.6} {"step": 22288, "train_loss": 3.2328786849975586, "lr": 0.00010473664318605796, "tps": 25480, "wall": 57328.2} {"step": 22289, "train_loss": 3.3015384674072266, "lr": 0.00010472192893193357, "tps": 25478, "wall": 57333.8} {"step": 22290, "train_loss": 3.3275563716888428, "lr": 0.00010470721598368544, "tps": 25477, "wall": 57339.4} {"step": 22291, "train_loss": 3.2863378524780273, "lr": 0.00010469250434148023, "tps": 25476, "wall": 57344.9} {"step": 22292, "train_loss": 3.1825151443481445, "lr": 0.00010467779400548452, "tps": 25474, "wall": 57350.5} {"step": 22293, "train_loss": 3.2479772567749023, "lr": 0.00010466308497586503, "tps": 25473, "wall": 57356.0} {"step": 22294, "train_loss": 3.1874351501464844, "lr": 0.00010464837725278833, "tps": 25472, "wall": 57361.6} {"step": 22295, "train_loss": 3.2767560482025146, "lr": 0.00010463367083642108, "tps": 25470, "wall": 57367.1} {"step": 22296, "train_loss": 3.254110813140869, "lr": 0.00010461896572692987, "tps": 25469, "wall": 57372.7} {"step": 22297, "train_loss": 3.3647620677948, "lr": 0.00010460426192448119, "tps": 25468, "wall": 57378.2} {"step": 22298, "train_loss": 3.343090057373047, "lr": 0.00010458955942924171, "tps": 25466, "wall": 57383.8} {"step": 22299, "train_loss": 3.289011001586914, "lr": 0.00010457485824137795, "tps": 25465, "wall": 57389.4} {"step": 22300, "train_loss": 3.2226340770721436, "lr": 0.00010456015836105643, "tps": 25464, "wall": 57395.0} {"step": 22301, "train_loss": 3.2559750080108643, "lr": 0.0001045454597884437, "tps": 25462, "wall": 57400.6} {"step": 22302, "train_loss": 3.329648494720459, "lr": 0.00010453076252370624, "tps": 25461, "wall": 57406.1} {"step": 22303, "train_loss": 3.407331943511963, "lr": 0.00010451606656701049, "tps": 25460, "wall": 57411.7} {"step": 22304, "train_loss": 3.3530168533325195, "lr": 0.0001045013719185231, "tps": 25458, "wall": 57417.2} {"step": 22305, "train_loss": 3.300586700439453, "lr": 0.00010448667857841037, "tps": 25457, "wall": 57422.8} {"step": 22306, "train_loss": 3.2241578102111816, "lr": 0.00010447198654683874, "tps": 25456, "wall": 57428.4} {"step": 22307, "train_loss": 3.297281265258789, "lr": 0.00010445729582397477, "tps": 25454, "wall": 57433.9} {"step": 22308, "train_loss": 3.19985032081604, "lr": 0.00010444260640998478, "tps": 25453, "wall": 57439.5} {"step": 22309, "train_loss": 3.2695443630218506, "lr": 0.00010442791830503513, "tps": 25452, "wall": 57445.1} {"step": 22310, "train_loss": 3.2675468921661377, "lr": 0.00010441323150929235, "tps": 25450, "wall": 57450.7} {"step": 22311, "train_loss": 3.1811773777008057, "lr": 0.00010439854602292269, "tps": 25449, "wall": 57456.3} {"step": 22312, "train_loss": 3.2900333404541016, "lr": 0.00010438386184609259, "tps": 25448, "wall": 57461.9} {"step": 22313, "train_loss": 3.3912301063537598, "lr": 0.00010436917897896837, "tps": 25446, "wall": 57467.5} {"step": 22314, "train_loss": 3.347982883453369, "lr": 0.00010435449742171628, "tps": 25445, "wall": 57473.0} {"step": 22315, "train_loss": 3.402531623840332, "lr": 0.00010433981717450278, "tps": 25444, "wall": 57478.6} {"step": 22316, "train_loss": 3.325432300567627, "lr": 0.00010432513823749409, "tps": 25442, "wall": 57484.2} {"step": 22317, "train_loss": 3.3069467544555664, "lr": 0.00010431046061085639, "tps": 25441, "wall": 57489.7} {"step": 22318, "train_loss": 3.1635971069335938, "lr": 0.00010429578429475615, "tps": 25440, "wall": 57495.3} {"step": 22319, "train_loss": 3.1936450004577637, "lr": 0.0001042811092893595, "tps": 25438, "wall": 57500.9} {"step": 22320, "train_loss": 3.2548766136169434, "lr": 0.00010426643559483265, "tps": 25437, "wall": 57506.4} {"step": 22321, "train_loss": 3.312549591064453, "lr": 0.00010425176321134196, "tps": 25436, "wall": 57512.0} {"step": 22322, "train_loss": 3.3064792156219482, "lr": 0.00010423709213905353, "tps": 25434, "wall": 57517.7} {"step": 22323, "train_loss": 3.20076584815979, "lr": 0.00010422242237813353, "tps": 25433, "wall": 57523.2} {"step": 22324, "train_loss": 3.3101744651794434, "lr": 0.00010420775392874826, "tps": 25432, "wall": 57528.8} {"step": 22325, "train_loss": 3.244152069091797, "lr": 0.00010419308679106383, "tps": 25430, "wall": 57534.5} {"step": 22326, "train_loss": 3.227844715118408, "lr": 0.00010417842096524628, "tps": 25429, "wall": 57540.0} {"step": 22327, "train_loss": 3.1962482929229736, "lr": 0.00010416375645146192, "tps": 25428, "wall": 57545.6} {"step": 22328, "train_loss": 3.2671895027160645, "lr": 0.00010414909324987681, "tps": 25426, "wall": 57551.2} {"step": 22329, "train_loss": 3.2113635540008545, "lr": 0.00010413443136065697, "tps": 25425, "wall": 57556.8} {"step": 22330, "train_loss": 3.2723512649536133, "lr": 0.00010411977078396862, "tps": 25424, "wall": 57562.5} {"step": 22331, "train_loss": 3.3449878692626953, "lr": 0.00010410511151997772, "tps": 25422, "wall": 57568.1} {"step": 22332, "train_loss": 3.2689239978790283, "lr": 0.00010409045356885043, "tps": 25421, "wall": 57573.7} {"step": 22333, "train_loss": 3.433408737182617, "lr": 0.00010407579693075278, "tps": 25420, "wall": 57579.4} {"step": 22334, "train_loss": 3.298537254333496, "lr": 0.0001040611416058507, "tps": 25418, "wall": 57585.0} {"step": 22335, "train_loss": 3.3185923099517822, "lr": 0.00010404648759431033, "tps": 25417, "wall": 57590.5} {"step": 22336, "train_loss": 3.2780303955078125, "lr": 0.00010403183489629763, "tps": 25416, "wall": 57596.1} {"step": 22337, "train_loss": 3.168691635131836, "lr": 0.00010401718351197858, "tps": 25414, "wall": 57601.7} {"step": 22338, "train_loss": 3.1739330291748047, "lr": 0.00010400253344151913, "tps": 25413, "wall": 57607.3} {"step": 22339, "train_loss": 3.2706799507141113, "lr": 0.00010398788468508522, "tps": 25412, "wall": 57612.9} {"step": 22340, "train_loss": 3.18983793258667, "lr": 0.00010397323724284289, "tps": 25410, "wall": 57618.5} {"step": 22341, "train_loss": 3.232083797454834, "lr": 0.000103958591114958, "tps": 25409, "wall": 57624.0} {"step": 22342, "train_loss": 3.262962818145752, "lr": 0.00010394394630159641, "tps": 25408, "wall": 57629.6} {"step": 22343, "train_loss": 3.1774959564208984, "lr": 0.0001039293028029241, "tps": 25406, "wall": 57635.2} {"step": 22344, "train_loss": 3.1793508529663086, "lr": 0.00010391466061910695, "tps": 25405, "wall": 57640.8} {"step": 22345, "train_loss": 3.2906570434570312, "lr": 0.00010390001975031078, "tps": 25404, "wall": 57646.4} {"step": 22346, "train_loss": 3.268467664718628, "lr": 0.00010388538019670149, "tps": 25402, "wall": 57652.0} {"step": 22347, "train_loss": 3.4336867332458496, "lr": 0.00010387074195844491, "tps": 25401, "wall": 57657.5} {"step": 22348, "train_loss": 3.4364070892333984, "lr": 0.00010385610503570678, "tps": 25400, "wall": 57663.1} {"step": 22349, "train_loss": 3.2613816261291504, "lr": 0.00010384146942865302, "tps": 25399, "wall": 57668.6} {"step": 22350, "train_loss": 3.3064804077148438, "lr": 0.0001038268351374494, "tps": 25397, "wall": 57674.3} {"step": 22351, "train_loss": 3.3177475929260254, "lr": 0.0001038122021622616, "tps": 25396, "wall": 57679.8} {"step": 22352, "train_loss": 3.2778801918029785, "lr": 0.00010379757050325554, "tps": 25395, "wall": 57685.4} {"step": 22353, "train_loss": 3.278245687484741, "lr": 0.00010378294016059684, "tps": 25393, "wall": 57691.0} {"step": 22354, "train_loss": 3.275503396987915, "lr": 0.00010376831113445132, "tps": 25392, "wall": 57696.6} {"step": 22355, "train_loss": 3.266897439956665, "lr": 0.00010375368342498464, "tps": 25391, "wall": 57702.2} {"step": 22356, "train_loss": 3.2931389808654785, "lr": 0.00010373905703236248, "tps": 25389, "wall": 57707.8} {"step": 22357, "train_loss": 3.261723756790161, "lr": 0.00010372443195675061, "tps": 25388, "wall": 57713.4} {"step": 22358, "train_loss": 3.164912462234497, "lr": 0.0001037098081983147, "tps": 25387, "wall": 57718.9} {"step": 22359, "train_loss": 3.3395490646362305, "lr": 0.0001036951857572203, "tps": 25385, "wall": 57724.5} {"step": 22360, "train_loss": 3.225123405456543, "lr": 0.00010368056463363318, "tps": 25384, "wall": 57730.1} {"step": 22361, "train_loss": 3.2424447536468506, "lr": 0.00010366594482771894, "tps": 25383, "wall": 57735.7} {"step": 22362, "train_loss": 3.2555861473083496, "lr": 0.00010365132633964312, "tps": 25381, "wall": 57741.2} {"step": 22363, "train_loss": 3.241969108581543, "lr": 0.0001036367091695714, "tps": 25380, "wall": 57746.7} {"step": 22364, "train_loss": 3.2314035892486572, "lr": 0.00010362209331766934, "tps": 25379, "wall": 57752.3} {"step": 22365, "train_loss": 3.2991294860839844, "lr": 0.00010360747878410242, "tps": 25377, "wall": 57757.9} {"step": 22366, "train_loss": 3.236133098602295, "lr": 0.00010359286556903636, "tps": 25376, "wall": 57763.5} {"step": 22367, "train_loss": 3.360603094100952, "lr": 0.00010357825367263662, "tps": 25375, "wall": 57769.0} {"step": 22368, "train_loss": 3.2415900230407715, "lr": 0.00010356364309506868, "tps": 25374, "wall": 57774.6} {"step": 22369, "train_loss": 3.278965473175049, "lr": 0.00010354903383649812, "tps": 25372, "wall": 57780.2} {"step": 22370, "train_loss": 3.2584376335144043, "lr": 0.00010353442589709041, "tps": 25371, "wall": 57785.8} {"step": 22371, "train_loss": 3.2667477130889893, "lr": 0.00010351981927701095, "tps": 25370, "wall": 57791.3} {"step": 22372, "train_loss": 3.308021068572998, "lr": 0.00010350521397642538, "tps": 25368, "wall": 57796.9} {"step": 22373, "train_loss": 3.3264379501342773, "lr": 0.00010349060999549895, "tps": 25367, "wall": 57802.5} {"step": 22374, "train_loss": 3.3315136432647705, "lr": 0.00010347600733439726, "tps": 25366, "wall": 57808.1} {"step": 22375, "train_loss": 3.295748710632324, "lr": 0.0001034614059932857, "tps": 25364, "wall": 57813.7} {"step": 22376, "train_loss": 3.2829179763793945, "lr": 0.00010344680597232952, "tps": 25363, "wall": 57819.3} {"step": 22377, "train_loss": 3.257262706756592, "lr": 0.00010343220727169431, "tps": 25362, "wall": 57824.9} {"step": 22378, "train_loss": 3.2828259468078613, "lr": 0.00010341760989154539, "tps": 25360, "wall": 57830.4} {"step": 22379, "train_loss": 3.3190600872039795, "lr": 0.000103403013832048, "tps": 25359, "wall": 57835.9} {"step": 22380, "train_loss": 3.2371411323547363, "lr": 0.00010338841909336766, "tps": 25358, "wall": 57841.5} {"step": 22381, "train_loss": 3.2728524208068848, "lr": 0.0001033738256756696, "tps": 25356, "wall": 57847.1} {"step": 22382, "train_loss": 3.2578768730163574, "lr": 0.0001033592335791191, "tps": 25355, "wall": 57852.7} {"step": 22383, "train_loss": 3.18833065032959, "lr": 0.00010334464280388154, "tps": 25354, "wall": 57858.2} {"step": 22384, "train_loss": 3.252525806427002, "lr": 0.0001033300533501222, "tps": 25353, "wall": 57863.8} {"step": 22385, "train_loss": 3.257390022277832, "lr": 0.0001033154652180063, "tps": 25351, "wall": 57869.4} {"step": 22386, "train_loss": 3.3011038303375244, "lr": 0.00010330087840769913, "tps": 25350, "wall": 57875.1} {"step": 22387, "train_loss": 3.1797478199005127, "lr": 0.00010328629291936595, "tps": 25349, "wall": 57880.8} {"step": 22388, "train_loss": 3.284146785736084, "lr": 0.0001032717087531719, "tps": 25347, "wall": 57886.3} {"step": 22389, "train_loss": 3.3633780479431152, "lr": 0.0001032571259092823, "tps": 25346, "wall": 57891.9} {"step": 22390, "train_loss": 3.356532335281372, "lr": 0.00010324254438786223, "tps": 25345, "wall": 57897.4} {"step": 22391, "train_loss": 3.2960638999938965, "lr": 0.00010322796418907702, "tps": 25343, "wall": 57903.0} {"step": 22392, "train_loss": 3.409177780151367, "lr": 0.0001032133853130917, "tps": 25342, "wall": 57908.6} {"step": 22393, "train_loss": 3.3090970516204834, "lr": 0.00010319880776007145, "tps": 25341, "wall": 57914.2} {"step": 22394, "train_loss": 3.350619316101074, "lr": 0.00010318423153018147, "tps": 25339, "wall": 57919.7} {"step": 22395, "train_loss": 3.1792969703674316, "lr": 0.00010316965662358684, "tps": 25338, "wall": 57925.3} {"step": 22396, "train_loss": 3.3580029010772705, "lr": 0.00010315508304045258, "tps": 25337, "wall": 57930.9} {"step": 22397, "train_loss": 3.277799129486084, "lr": 0.00010314051078094395, "tps": 25335, "wall": 57936.5} {"step": 22398, "train_loss": 3.2514798641204834, "lr": 0.00010312593984522592, "tps": 25334, "wall": 57942.1} {"step": 22399, "train_loss": 3.192852020263672, "lr": 0.00010311137023346354, "tps": 25333, "wall": 57947.6} {"step": 22400, "train_loss": 3.31650972366333, "lr": 0.00010309680194582187, "tps": 25332, "wall": 57953.2} {"step": 22401, "train_loss": 3.3961048126220703, "lr": 0.00010308223498246601, "tps": 25330, "wall": 57958.8} {"step": 22402, "train_loss": 3.3287792205810547, "lr": 0.00010306766934356085, "tps": 25329, "wall": 57964.3} {"step": 22403, "train_loss": 3.1906914710998535, "lr": 0.00010305310502927153, "tps": 25328, "wall": 57969.8} {"step": 22404, "train_loss": 3.303028106689453, "lr": 0.00010303854203976291, "tps": 25326, "wall": 57975.4} {"step": 22405, "train_loss": 3.2981209754943848, "lr": 0.0001030239803752, "tps": 25325, "wall": 57981.0} {"step": 22406, "train_loss": 3.2596309185028076, "lr": 0.0001030094200357478, "tps": 25324, "wall": 57986.5} {"step": 22407, "train_loss": 3.1753625869750977, "lr": 0.00010299486102157116, "tps": 25322, "wall": 57992.1} {"step": 22408, "train_loss": 3.274015426635742, "lr": 0.00010298030333283515, "tps": 25321, "wall": 57997.7} {"step": 22409, "train_loss": 3.2714297771453857, "lr": 0.0001029657469697046, "tps": 25320, "wall": 58003.3} {"step": 22410, "train_loss": 3.28511381149292, "lr": 0.00010295119193234431, "tps": 25319, "wall": 58008.8} {"step": 22411, "train_loss": 3.351050853729248, "lr": 0.00010293663822091933, "tps": 25317, "wall": 58014.4} {"step": 22412, "train_loss": 3.2647719383239746, "lr": 0.00010292208583559441, "tps": 25316, "wall": 58019.9} {"step": 22413, "train_loss": 3.195890426635742, "lr": 0.00010290753477653441, "tps": 25315, "wall": 58025.5} {"step": 22414, "train_loss": 3.3002891540527344, "lr": 0.00010289298504390425, "tps": 25313, "wall": 58031.1} {"step": 22415, "train_loss": 3.3589255809783936, "lr": 0.00010287843663786867, "tps": 25312, "wall": 58036.7} {"step": 22416, "train_loss": 3.3414440155029297, "lr": 0.00010286388955859246, "tps": 25311, "wall": 58042.3} {"step": 22417, "train_loss": 3.2534587383270264, "lr": 0.0001028493438062405, "tps": 25309, "wall": 58047.8} {"step": 22418, "train_loss": 3.2009358406066895, "lr": 0.00010283479938097748, "tps": 25308, "wall": 58053.4} {"step": 22419, "train_loss": 3.313206195831299, "lr": 0.00010282025628296819, "tps": 25307, "wall": 58059.0} {"step": 22420, "train_loss": 3.2470650672912598, "lr": 0.0001028057145123774, "tps": 25306, "wall": 58064.6} {"step": 22421, "train_loss": 3.363029956817627, "lr": 0.0001027911740693698, "tps": 25304, "wall": 58070.1} {"step": 22422, "train_loss": 3.3370485305786133, "lr": 0.00010277663495411008, "tps": 25303, "wall": 58075.7} {"step": 22423, "train_loss": 3.255863666534424, "lr": 0.00010276209716676304, "tps": 25302, "wall": 58081.2} {"step": 22424, "train_loss": 3.2219648361206055, "lr": 0.00010274756070749332, "tps": 25300, "wall": 58086.8} {"step": 22425, "train_loss": 3.231980800628662, "lr": 0.00010273302557646549, "tps": 25299, "wall": 58092.3} {"step": 22426, "train_loss": 3.295253276824951, "lr": 0.00010271849177384436, "tps": 25298, "wall": 58097.9} {"step": 22427, "train_loss": 3.2449746131896973, "lr": 0.00010270395929979446, "tps": 25296, "wall": 58103.5} {"step": 22428, "train_loss": 3.309788703918457, "lr": 0.00010268942815448048, "tps": 25295, "wall": 58109.1} {"step": 22429, "train_loss": 3.3921308517456055, "lr": 0.00010267489833806702, "tps": 25294, "wall": 58114.7} {"step": 22430, "train_loss": 3.3093600273132324, "lr": 0.00010266036985071861, "tps": 25293, "wall": 58120.3} {"step": 22431, "train_loss": 3.3032240867614746, "lr": 0.00010264584269259991, "tps": 25291, "wall": 58125.8} {"step": 22432, "train_loss": 3.2703211307525635, "lr": 0.00010263131686387548, "tps": 25290, "wall": 58131.4} {"step": 22433, "train_loss": 3.271186351776123, "lr": 0.0001026167923647098, "tps": 25289, "wall": 58136.9} {"step": 22434, "train_loss": 3.163762092590332, "lr": 0.00010260226919526748, "tps": 25287, "wall": 58142.5} {"step": 22435, "train_loss": 3.1900999546051025, "lr": 0.000102587747355713, "tps": 25286, "wall": 58148.1} {"step": 22436, "train_loss": 3.3259692192077637, "lr": 0.0001025732268462108, "tps": 25285, "wall": 58153.6} {"step": 22437, "train_loss": 3.2791967391967773, "lr": 0.00010255870766692552, "tps": 25283, "wall": 58159.2} {"step": 22438, "train_loss": 3.296693801879883, "lr": 0.00010254418981802154, "tps": 25282, "wall": 58164.8} {"step": 22439, "train_loss": 3.263123035430908, "lr": 0.00010252967329966328, "tps": 25281, "wall": 58170.4} {"step": 22440, "train_loss": 3.2259650230407715, "lr": 0.0001025151581120153, "tps": 25280, "wall": 58176.0} {"step": 22441, "train_loss": 3.3107070922851562, "lr": 0.00010250064425524195, "tps": 25278, "wall": 58181.6} {"step": 22442, "train_loss": 3.341630220413208, "lr": 0.0001024861317295076, "tps": 25277, "wall": 58187.2} {"step": 22443, "train_loss": 3.185910701751709, "lr": 0.00010247162053497681, "tps": 25276, "wall": 58192.8} {"step": 22444, "train_loss": 3.332066774368286, "lr": 0.00010245711067181377, "tps": 25274, "wall": 58198.3} {"step": 22445, "train_loss": 3.2994120121002197, "lr": 0.00010244260214018298, "tps": 25273, "wall": 58203.9} {"step": 22446, "train_loss": 3.2977843284606934, "lr": 0.00010242809494024878, "tps": 25272, "wall": 58209.4} {"step": 22447, "train_loss": 3.254007339477539, "lr": 0.0001024135890721754, "tps": 25271, "wall": 58215.0} {"step": 22448, "train_loss": 3.324370861053467, "lr": 0.0001023990845361273, "tps": 25269, "wall": 58220.5} {"step": 22449, "train_loss": 3.291463851928711, "lr": 0.00010238458133226876, "tps": 25268, "wall": 58226.1} {"step": 22450, "train_loss": 3.3000545501708984, "lr": 0.00010237007946076396, "tps": 25267, "wall": 58231.7} {"step": 22451, "train_loss": 3.2549381256103516, "lr": 0.00010235557892177734, "tps": 25265, "wall": 58237.3} {"step": 22452, "train_loss": 3.353895902633667, "lr": 0.00010234107971547309, "tps": 25264, "wall": 58242.9} {"step": 22453, "train_loss": 3.3013439178466797, "lr": 0.00010232658184201537, "tps": 25263, "wall": 58248.5} {"step": 22454, "train_loss": 3.247016191482544, "lr": 0.00010231208530156858, "tps": 25261, "wall": 58254.1} {"step": 22455, "train_loss": 3.2548694610595703, "lr": 0.00010229759009429684, "tps": 25260, "wall": 58259.6} {"step": 22456, "train_loss": 3.2856268882751465, "lr": 0.00010228309622036431, "tps": 25259, "wall": 58265.2} {"step": 22457, "train_loss": 3.2614288330078125, "lr": 0.00010226860367993531, "tps": 25258, "wall": 58270.8} {"step": 22458, "train_loss": 3.4118807315826416, "lr": 0.00010225411247317391, "tps": 25256, "wall": 58276.4} {"step": 22459, "train_loss": 3.2467474937438965, "lr": 0.00010223962260024426, "tps": 25255, "wall": 58281.9} {"step": 22460, "train_loss": 3.278952121734619, "lr": 0.0001022251340613106, "tps": 25254, "wall": 58287.4} {"step": 22461, "train_loss": 3.309467315673828, "lr": 0.00010221064685653699, "tps": 25252, "wall": 58293.1} {"step": 22462, "train_loss": 3.215305805206299, "lr": 0.00010219616098608744, "tps": 25251, "wall": 58298.7} {"step": 22463, "train_loss": 3.3469138145446777, "lr": 0.00010218167645012626, "tps": 25250, "wall": 58304.2} {"step": 22464, "train_loss": 3.3722856044769287, "lr": 0.00010216719324881734, "tps": 25249, "wall": 58309.8} {"step": 22465, "train_loss": 3.259514570236206, "lr": 0.00010215271138232492, "tps": 25247, "wall": 58315.4} {"step": 22466, "train_loss": 3.3374135494232178, "lr": 0.00010213823085081293, "tps": 25246, "wall": 58321.0} {"step": 22467, "train_loss": 3.115788221359253, "lr": 0.00010212375165444536, "tps": 25245, "wall": 58326.5} {"step": 22468, "train_loss": 3.293834686279297, "lr": 0.00010210927379338642, "tps": 25243, "wall": 58332.1} {"step": 22469, "train_loss": 3.3328933715820312, "lr": 0.00010209479726779996, "tps": 25242, "wall": 58337.7} {"step": 22470, "train_loss": 3.271951198577881, "lr": 0.00010208032207784998, "tps": 25241, "wall": 58343.2} {"step": 22471, "train_loss": 3.3065240383148193, "lr": 0.00010206584822370055, "tps": 25240, "wall": 58348.8} {"step": 22472, "train_loss": 3.2886271476745605, "lr": 0.00010205137570551557, "tps": 25238, "wall": 58354.5} {"step": 22473, "train_loss": 3.505559206008911, "lr": 0.00010203690452345891, "tps": 25237, "wall": 58360.0} {"step": 22474, "train_loss": 3.2168521881103516, "lr": 0.00010202243467769466, "tps": 25236, "wall": 58365.6} {"step": 22475, "train_loss": 3.3190548419952393, "lr": 0.00010200796616838664, "tps": 25234, "wall": 58371.1} {"step": 22476, "train_loss": 3.2124886512756348, "lr": 0.0001019934989956987, "tps": 25233, "wall": 58376.7} {"step": 22477, "train_loss": 3.237456798553467, "lr": 0.00010197903315979485, "tps": 25232, "wall": 58382.2} {"step": 22478, "train_loss": 3.329159736633301, "lr": 0.0001019645686608389, "tps": 25231, "wall": 58387.8} {"step": 22479, "train_loss": 3.231205940246582, "lr": 0.00010195010549899464, "tps": 25229, "wall": 58393.4} {"step": 22480, "train_loss": 3.217900037765503, "lr": 0.00010193564367442601, "tps": 25228, "wall": 58399.0} {"step": 22481, "train_loss": 3.2747902870178223, "lr": 0.00010192118318729678, "tps": 25227, "wall": 58404.6} {"step": 22482, "train_loss": 3.2851955890655518, "lr": 0.00010190672403777082, "tps": 25225, "wall": 58410.2} {"step": 22483, "train_loss": 3.2930166721343994, "lr": 0.00010189226622601186, "tps": 25224, "wall": 58415.8} {"step": 22484, "train_loss": 3.2481768131256104, "lr": 0.00010187780975218365, "tps": 25223, "wall": 58421.4} {"step": 22485, "train_loss": 3.2699732780456543, "lr": 0.00010186335461645007, "tps": 25221, "wall": 58427.0} {"step": 22486, "train_loss": 3.2781708240509033, "lr": 0.00010184890081897478, "tps": 25220, "wall": 58432.6} {"step": 22487, "train_loss": 3.28409481048584, "lr": 0.00010183444835992148, "tps": 25219, "wall": 58438.1} {"step": 22488, "train_loss": 3.262716293334961, "lr": 0.00010181999723945401, "tps": 25218, "wall": 58443.7} {"step": 22489, "train_loss": 3.281961679458618, "lr": 0.00010180554745773601, "tps": 25216, "wall": 58449.4} {"step": 22490, "train_loss": 3.2341768741607666, "lr": 0.00010179109901493106, "tps": 25215, "wall": 58454.9} {"step": 22491, "train_loss": 3.403373956680298, "lr": 0.00010177665191120302, "tps": 25214, "wall": 58460.5} {"step": 22492, "train_loss": 3.3179378509521484, "lr": 0.00010176220614671548, "tps": 25212, "wall": 58466.0} {"step": 22493, "train_loss": 3.387556791305542, "lr": 0.00010174776172163203, "tps": 25211, "wall": 58471.6} {"step": 22494, "train_loss": 3.3532228469848633, "lr": 0.00010173331863611632, "tps": 25210, "wall": 58477.3} {"step": 22495, "train_loss": 3.3252596855163574, "lr": 0.00010171887689033201, "tps": 25209, "wall": 58482.8} {"step": 22496, "train_loss": 3.2569785118103027, "lr": 0.00010170443648444264, "tps": 25207, "wall": 58488.4} {"step": 22497, "train_loss": 3.2724368572235107, "lr": 0.00010168999741861185, "tps": 25206, "wall": 58494.0} {"step": 22498, "train_loss": 3.242117404937744, "lr": 0.00010167555969300309, "tps": 25205, "wall": 58499.6} {"step": 22499, "train_loss": 3.2773852348327637, "lr": 0.00010166112330778003, "tps": 25203, "wall": 58505.1} {"step": 22500, "train_loss": 3.3445472717285156, "lr": 0.00010164668826310621, "tps": 25202, "wall": 58510.7} {"step": 22501, "train_loss": 3.318727493286133, "lr": 0.00010163225455914505, "tps": 25201, "wall": 58516.4} {"step": 22502, "train_loss": 3.296182155609131, "lr": 0.00010161782219606014, "tps": 25200, "wall": 58522.0} {"step": 22503, "train_loss": 3.292689800262451, "lr": 0.00010160339117401496, "tps": 25198, "wall": 58527.6} {"step": 22504, "train_loss": 3.2404372692108154, "lr": 0.00010158896149317291, "tps": 25197, "wall": 58533.2} {"step": 22505, "train_loss": 3.2038140296936035, "lr": 0.00010157453315369756, "tps": 25196, "wall": 58538.8} {"step": 22506, "train_loss": 3.3038225173950195, "lr": 0.00010156010615575233, "tps": 25194, "wall": 58544.4} {"step": 22507, "train_loss": 3.2504920959472656, "lr": 0.00010154568049950061, "tps": 25193, "wall": 58550.0} {"step": 22508, "train_loss": 3.3891608715057373, "lr": 0.00010153125618510584, "tps": 25192, "wall": 58555.6} {"step": 22509, "train_loss": 3.2492361068725586, "lr": 0.00010151683321273134, "tps": 25191, "wall": 58561.2} {"step": 22510, "train_loss": 3.261821746826172, "lr": 0.00010150241158254061, "tps": 25189, "wall": 58566.7} {"step": 22511, "train_loss": 3.3427734375, "lr": 0.00010148799129469699, "tps": 25188, "wall": 58572.4} {"step": 22512, "train_loss": 3.350416660308838, "lr": 0.00010147357234936374, "tps": 25187, "wall": 58577.9} {"step": 22513, "train_loss": 3.1934497356414795, "lr": 0.00010145915474670437, "tps": 25185, "wall": 58583.5} {"step": 22514, "train_loss": 3.3539369106292725, "lr": 0.00010144473848688209, "tps": 25184, "wall": 58589.1} {"step": 22515, "train_loss": 3.270066738128662, "lr": 0.00010143032357006017, "tps": 25183, "wall": 58594.8} {"step": 22516, "train_loss": 3.1808042526245117, "lr": 0.00010141590999640198, "tps": 25182, "wall": 58600.3} {"step": 22517, "train_loss": 3.227555274963379, "lr": 0.00010140149776607082, "tps": 25180, "wall": 58605.8} {"step": 22518, "train_loss": 3.315304756164551, "lr": 0.00010138708687922984, "tps": 25179, "wall": 58611.4} {"step": 22519, "train_loss": 3.2358460426330566, "lr": 0.00010137267733604242, "tps": 25178, "wall": 58617.0} {"step": 22520, "train_loss": 3.335998296737671, "lr": 0.00010135826913667173, "tps": 25176, "wall": 58622.5} {"step": 22521, "train_loss": 3.333946704864502, "lr": 0.0001013438622812809, "tps": 25175, "wall": 58628.1} {"step": 22522, "train_loss": 3.3064124584198, "lr": 0.00010132945677003327, "tps": 25174, "wall": 58633.7} {"step": 22523, "train_loss": 3.326813220977783, "lr": 0.00010131505260309198, "tps": 25173, "wall": 58639.3} {"step": 22524, "train_loss": 3.2109787464141846, "lr": 0.00010130064978062019, "tps": 25171, "wall": 58644.8} {"step": 22525, "train_loss": 3.25404691696167, "lr": 0.00010128624830278108, "tps": 25170, "wall": 58650.4} {"step": 22526, "train_loss": 3.3605313301086426, "lr": 0.00010127184816973773, "tps": 25169, "wall": 58656.0} {"step": 22527, "train_loss": 3.328864097595215, "lr": 0.00010125744938165333, "tps": 25167, "wall": 58661.6} {"step": 22528, "train_loss": 3.2284317016601562, "lr": 0.00010124305193869101, "tps": 25166, "wall": 58667.2} {"step": 22529, "train_loss": 3.3216261863708496, "lr": 0.00010122865584101373, "tps": 25165, "wall": 58672.8} {"step": 22530, "train_loss": 3.438051700592041, "lr": 0.00010121426108878473, "tps": 25164, "wall": 58678.4} {"step": 22531, "train_loss": 3.2765541076660156, "lr": 0.00010119986768216705, "tps": 25162, "wall": 58683.9} {"step": 22532, "train_loss": 3.3019304275512695, "lr": 0.00010118547562132356, "tps": 25161, "wall": 58689.5} {"step": 22533, "train_loss": 3.2715747356414795, "lr": 0.00010117108490641753, "tps": 25160, "wall": 58695.1} {"step": 22534, "train_loss": 3.2953219413757324, "lr": 0.00010115669553761189, "tps": 25159, "wall": 58700.6} {"step": 22535, "train_loss": 3.2457494735717773, "lr": 0.00010114230751506956, "tps": 25157, "wall": 58706.2} {"step": 22536, "train_loss": 3.293356418609619, "lr": 0.00010112792083895364, "tps": 25156, "wall": 58711.7} {"step": 22537, "train_loss": 3.2542924880981445, "lr": 0.00010111353550942708, "tps": 25155, "wall": 58717.4} {"step": 22538, "train_loss": 3.3990511894226074, "lr": 0.00010109915152665277, "tps": 25153, "wall": 58722.9} {"step": 22539, "train_loss": 3.394028425216675, "lr": 0.00010108476889079375, "tps": 25152, "wall": 58728.5} {"step": 22540, "train_loss": 3.30133318901062, "lr": 0.00010107038760201286, "tps": 25151, "wall": 58734.1} {"step": 22541, "train_loss": 3.2677175998687744, "lr": 0.00010105600766047309, "tps": 25150, "wall": 58739.6} {"step": 22542, "train_loss": 3.2387895584106445, "lr": 0.00010104162906633732, "tps": 25148, "wall": 58745.2} {"step": 22543, "train_loss": 3.200834274291992, "lr": 0.00010102725181976836, "tps": 25147, "wall": 58750.7} {"step": 22544, "train_loss": 3.171304941177368, "lr": 0.00010101287592092916, "tps": 25146, "wall": 58756.3} {"step": 22545, "train_loss": 3.3810625076293945, "lr": 0.00010099850136998254, "tps": 25145, "wall": 58761.8} {"step": 22546, "train_loss": 3.2837071418762207, "lr": 0.00010098412816709129, "tps": 25143, "wall": 58767.4} {"step": 22547, "train_loss": 3.3339908123016357, "lr": 0.00010096975631241832, "tps": 25142, "wall": 58772.9} {"step": 22548, "train_loss": 3.3016517162323, "lr": 0.0001009553858061264, "tps": 25141, "wall": 58778.6} {"step": 22549, "train_loss": 3.2369906902313232, "lr": 0.00010094101664837827, "tps": 25140, "wall": 58784.1} {"step": 22550, "train_loss": 3.263573169708252, "lr": 0.00010092664883933678, "tps": 25138, "wall": 58789.7} {"step": 22551, "train_loss": 3.2813761234283447, "lr": 0.00010091228237916466, "tps": 25137, "wall": 58795.3} {"step": 22552, "train_loss": 3.4094655513763428, "lr": 0.00010089791726802458, "tps": 25136, "wall": 58800.8} {"step": 22553, "train_loss": 3.200808525085449, "lr": 0.00010088355350607939, "tps": 25135, "wall": 58806.4} {"step": 22554, "train_loss": 3.254945755004883, "lr": 0.00010086919109349175, "tps": 25133, "wall": 58812.0} {"step": 22555, "train_loss": 3.3036181926727295, "lr": 0.00010085483003042431, "tps": 25132, "wall": 58817.6} {"step": 22556, "train_loss": 3.285813808441162, "lr": 0.00010084047031703985, "tps": 25131, "wall": 58823.1} {"step": 22557, "train_loss": 3.3258414268493652, "lr": 0.00010082611195350102, "tps": 25129, "wall": 58828.7} {"step": 22558, "train_loss": 3.2828736305236816, "lr": 0.00010081175493997035, "tps": 25128, "wall": 58834.4} {"step": 22559, "train_loss": 3.268754482269287, "lr": 0.00010079739927661065, "tps": 25127, "wall": 58839.9} {"step": 22560, "train_loss": 3.137558937072754, "lr": 0.0001007830449635844, "tps": 25126, "wall": 58845.5} {"step": 22561, "train_loss": 3.2397689819335938, "lr": 0.0001007686920010543, "tps": 25124, "wall": 58851.1} {"step": 22562, "train_loss": 3.251082420349121, "lr": 0.00010075434038918292, "tps": 25123, "wall": 58856.6} {"step": 22563, "train_loss": 3.3286190032958984, "lr": 0.00010073999012813277, "tps": 25122, "wall": 58862.2} {"step": 22564, "train_loss": 3.2867233753204346, "lr": 0.00010072564121806649, "tps": 25121, "wall": 58867.7} {"step": 22565, "train_loss": 3.2426860332489014, "lr": 0.00010071129365914665, "tps": 25119, "wall": 58873.4} {"step": 22566, "train_loss": 3.355821371078491, "lr": 0.00010069694745153562, "tps": 25118, "wall": 58878.9} {"step": 22567, "train_loss": 3.3493056297302246, "lr": 0.00010068260259539613, "tps": 25117, "wall": 58884.5} {"step": 22568, "train_loss": 3.3096964359283447, "lr": 0.00010066825909089055, "tps": 25115, "wall": 58890.1} {"step": 22569, "train_loss": 3.3666045665740967, "lr": 0.00010065391693818131, "tps": 25114, "wall": 58895.7} {"step": 22570, "train_loss": 3.250941038131714, "lr": 0.00010063957613743104, "tps": 25113, "wall": 58901.3} {"step": 22571, "train_loss": 3.3466551303863525, "lr": 0.00010062523668880212, "tps": 25112, "wall": 58906.8} {"step": 22572, "train_loss": 3.4174916744232178, "lr": 0.00010061089859245689, "tps": 25110, "wall": 58912.4} {"step": 22573, "train_loss": 3.3980116844177246, "lr": 0.00010059656184855792, "tps": 25109, "wall": 58918.0} {"step": 22574, "train_loss": 3.3565049171447754, "lr": 0.00010058222645726756, "tps": 25108, "wall": 58923.6} {"step": 22575, "train_loss": 3.3054699897766113, "lr": 0.00010056789241874815, "tps": 25107, "wall": 58929.2} {"step": 22576, "train_loss": 3.2180705070495605, "lr": 0.00010055355973316219, "tps": 25105, "wall": 58934.7} {"step": 22577, "train_loss": 3.273322105407715, "lr": 0.00010053922840067186, "tps": 25104, "wall": 58940.3} {"step": 22578, "train_loss": 3.325317144393921, "lr": 0.0001005248984214397, "tps": 25103, "wall": 58945.8} {"step": 22579, "train_loss": 3.3228037357330322, "lr": 0.00010051056979562798, "tps": 25102, "wall": 58951.4} {"step": 22580, "train_loss": 3.3405561447143555, "lr": 0.00010049624252339889, "tps": 25100, "wall": 58957.0} {"step": 22581, "train_loss": 3.209296941757202, "lr": 0.00010048191660491491, "tps": 25099, "wall": 58962.6} {"step": 22582, "train_loss": 3.3288893699645996, "lr": 0.00010046759204033826, "tps": 25098, "wall": 58968.2} {"step": 22583, "train_loss": 3.1709046363830566, "lr": 0.00010045326882983109, "tps": 25097, "wall": 58973.8} {"step": 22584, "train_loss": 3.279278039932251, "lr": 0.00010043894697355582, "tps": 25095, "wall": 58979.3} {"step": 22585, "train_loss": 3.294739246368408, "lr": 0.00010042462647167468, "tps": 25094, "wall": 58984.9} {"step": 22586, "train_loss": 3.3589367866516113, "lr": 0.00010041030732434973, "tps": 25093, "wall": 58990.5} {"step": 22587, "train_loss": 3.315500497817993, "lr": 0.00010039598953174336, "tps": 25091, "wall": 58996.1} {"step": 22588, "train_loss": 3.26760196685791, "lr": 0.00010038167309401771, "tps": 25090, "wall": 59001.6} {"step": 22589, "train_loss": 3.2625319957733154, "lr": 0.00010036735801133488, "tps": 25089, "wall": 59007.2} {"step": 22590, "train_loss": 3.2759041786193848, "lr": 0.00010035304428385712, "tps": 25088, "wall": 59012.8} {"step": 22591, "train_loss": 3.3099095821380615, "lr": 0.00010033873191174658, "tps": 25086, "wall": 59018.5} {"step": 22592, "train_loss": 3.2826669216156006, "lr": 0.00010032442089516529, "tps": 25085, "wall": 59024.1} {"step": 22593, "train_loss": 3.2385802268981934, "lr": 0.00010031011123427547, "tps": 25084, "wall": 59029.7} {"step": 22594, "train_loss": 3.228874683380127, "lr": 0.00010029580292923914, "tps": 25083, "wall": 59035.3} {"step": 22595, "train_loss": 3.2818543910980225, "lr": 0.0001002814959802185, "tps": 25081, "wall": 59040.8} {"step": 22596, "train_loss": 3.2185778617858887, "lr": 0.00010026719038737554, "tps": 25080, "wall": 59046.4} {"step": 22597, "train_loss": 3.3033714294433594, "lr": 0.00010025288615087227, "tps": 25079, "wall": 59052.0} {"step": 22598, "train_loss": 3.2815511226654053, "lr": 0.00010023858327087084, "tps": 25078, "wall": 59057.5} {"step": 22599, "train_loss": 3.2656314373016357, "lr": 0.00010022428174753322, "tps": 25076, "wall": 59063.1} {"step": 22600, "train_loss": 3.301302433013916, "lr": 0.00010020998158102135, "tps": 25075, "wall": 59068.6} {"step": 22601, "train_loss": 3.3922362327575684, "lr": 0.00010019568277149735, "tps": 25074, "wall": 59074.3} {"step": 22602, "train_loss": 3.3051204681396484, "lr": 0.00010018138531912316, "tps": 25073, "wall": 59079.9} {"step": 22603, "train_loss": 3.225116491317749, "lr": 0.00010016708922406061, "tps": 25071, "wall": 59085.4} {"step": 22604, "train_loss": 3.223193407058716, "lr": 0.00010015279448647188, "tps": 25070, "wall": 59091.0} {"step": 22605, "train_loss": 3.1971373558044434, "lr": 0.00010013850110651873, "tps": 25069, "wall": 59096.6} {"step": 22606, "train_loss": 3.283787727355957, "lr": 0.00010012420908436308, "tps": 25068, "wall": 59102.1} {"step": 22607, "train_loss": 3.197963237762451, "lr": 0.00010010991842016693, "tps": 25066, "wall": 59107.7} {"step": 22608, "train_loss": 3.205747127532959, "lr": 0.00010009562911409212, "tps": 25065, "wall": 59113.2} {"step": 22609, "train_loss": 3.1993887424468994, "lr": 0.00010008134116630042, "tps": 25064, "wall": 59118.8} {"step": 22610, "train_loss": 3.240316390991211, "lr": 0.00010006705457695387, "tps": 25063, "wall": 59124.3} {"step": 22611, "train_loss": 3.215766429901123, "lr": 0.00010005276934621419, "tps": 25061, "wall": 59129.9} {"step": 22612, "train_loss": 3.2663800716400146, "lr": 0.0001000384854742432, "tps": 25060, "wall": 59135.5} {"step": 22613, "train_loss": 3.3694236278533936, "lr": 0.00010002420296120277, "tps": 25059, "wall": 59141.1} {"step": 22614, "train_loss": 3.3212203979492188, "lr": 0.00010000992180725459, "tps": 25057, "wall": 59146.7} {"step": 22615, "train_loss": 3.1757442951202393, "lr": 9.99956420125606e-05, "tps": 25056, "wall": 59152.3} {"step": 22616, "train_loss": 3.3428773880004883, "lr": 9.998136357728243e-05, "tps": 25055, "wall": 59157.9} {"step": 22617, "train_loss": 3.237314224243164, "lr": 9.996708650158184e-05, "tps": 25054, "wall": 59163.5} {"step": 22618, "train_loss": 3.3228683471679688, "lr": 9.995281078562064e-05, "tps": 25052, "wall": 59169.0} {"step": 22619, "train_loss": 3.292482376098633, "lr": 9.993853642956048e-05, "tps": 25051, "wall": 59174.6} {"step": 22620, "train_loss": 3.3057217597961426, "lr": 9.992426343356302e-05, "tps": 25050, "wall": 59180.2} {"step": 22621, "train_loss": 3.2710275650024414, "lr": 9.990999179779008e-05, "tps": 25049, "wall": 59185.7} {"step": 22622, "train_loss": 3.2515177726745605, "lr": 9.989572152240323e-05, "tps": 25047, "wall": 59191.3} {"step": 22623, "train_loss": 3.3256494998931885, "lr": 9.988145260756409e-05, "tps": 25046, "wall": 59197.0} {"step": 22624, "train_loss": 3.335690975189209, "lr": 9.986718505343439e-05, "tps": 25045, "wall": 59202.6} {"step": 22625, "train_loss": 3.321348190307617, "lr": 9.985291886017575e-05, "tps": 25044, "wall": 59208.2} {"step": 22626, "train_loss": 3.2001821994781494, "lr": 9.983865402794968e-05, "tps": 25042, "wall": 59213.8} {"step": 22627, "train_loss": 3.204134941101074, "lr": 9.982439055691789e-05, "tps": 25041, "wall": 59219.3} {"step": 22628, "train_loss": 3.1614463329315186, "lr": 9.981012844724189e-05, "tps": 25040, "wall": 59224.9} {"step": 22629, "train_loss": 3.372058868408203, "lr": 9.979586769908321e-05, "tps": 25039, "wall": 59230.4} {"step": 22630, "train_loss": 3.276925563812256, "lr": 9.978160831260351e-05, "tps": 25037, "wall": 59236.0} {"step": 22631, "train_loss": 3.2961974143981934, "lr": 9.97673502879642e-05, "tps": 25036, "wall": 59241.5} {"step": 22632, "train_loss": 3.3052148818969727, "lr": 9.975309362532691e-05, "tps": 25035, "wall": 59247.1} {"step": 22633, "train_loss": 3.1943535804748535, "lr": 9.973883832485306e-05, "tps": 25034, "wall": 59252.7} {"step": 22634, "train_loss": 3.333765745162964, "lr": 9.972458438670412e-05, "tps": 25032, "wall": 59258.3} {"step": 22635, "train_loss": 3.2047297954559326, "lr": 9.971033181104163e-05, "tps": 25031, "wall": 59263.9} {"step": 22636, "train_loss": 3.2401671409606934, "lr": 9.969608059802702e-05, "tps": 25030, "wall": 59269.5} {"step": 22637, "train_loss": 3.394908905029297, "lr": 9.968183074782166e-05, "tps": 25029, "wall": 59275.1} {"step": 22638, "train_loss": 3.2426986694335938, "lr": 9.966758226058708e-05, "tps": 25027, "wall": 59280.7} {"step": 22639, "train_loss": 3.2014825344085693, "lr": 9.965333513648465e-05, "tps": 25026, "wall": 59286.2} {"step": 22640, "train_loss": 3.3373374938964844, "lr": 9.963908937567568e-05, "tps": 25025, "wall": 59291.8} {"step": 22641, "train_loss": 3.334247589111328, "lr": 9.962484497832171e-05, "tps": 25024, "wall": 59297.4} {"step": 22642, "train_loss": 3.2157130241394043, "lr": 9.961060194458398e-05, "tps": 25022, "wall": 59303.0} {"step": 22643, "train_loss": 3.2506816387176514, "lr": 9.95963602746238e-05, "tps": 25021, "wall": 59308.6} {"step": 22644, "train_loss": 3.218576669692993, "lr": 9.958211996860262e-05, "tps": 25020, "wall": 59314.3} {"step": 22645, "train_loss": 3.3286218643188477, "lr": 9.956788102668173e-05, "tps": 25019, "wall": 59319.8} {"step": 22646, "train_loss": 3.3307130336761475, "lr": 9.955364344902231e-05, "tps": 25017, "wall": 59325.4} {"step": 22647, "train_loss": 3.3291773796081543, "lr": 9.953940723578578e-05, "tps": 25016, "wall": 59330.9} {"step": 22648, "train_loss": 3.25972318649292, "lr": 9.952517238713334e-05, "tps": 25015, "wall": 59336.5} {"step": 22649, "train_loss": 3.304621696472168, "lr": 9.951093890322631e-05, "tps": 25014, "wall": 59342.0} {"step": 22650, "train_loss": 3.194063186645508, "lr": 9.949670678422588e-05, "tps": 25012, "wall": 59347.6} {"step": 22651, "train_loss": 3.3211588859558105, "lr": 9.948247603029322e-05, "tps": 25011, "wall": 59353.3} {"step": 22652, "train_loss": 3.306999683380127, "lr": 9.946824664158963e-05, "tps": 25010, "wall": 59358.8} {"step": 22653, "train_loss": 3.403326988220215, "lr": 9.94540186182763e-05, "tps": 25009, "wall": 59364.4} {"step": 22654, "train_loss": 3.3229665756225586, "lr": 9.943979196051428e-05, "tps": 25007, "wall": 59370.0} {"step": 22655, "train_loss": 3.2688934803009033, "lr": 9.94255666684649e-05, "tps": 25006, "wall": 59375.7} {"step": 22656, "train_loss": 3.2896199226379395, "lr": 9.941134274228921e-05, "tps": 25005, "wall": 59381.3} {"step": 22657, "train_loss": 3.1801395416259766, "lr": 9.939712018214827e-05, "tps": 25004, "wall": 59386.8} {"step": 22658, "train_loss": 3.233933925628662, "lr": 9.938289898820338e-05, "tps": 25002, "wall": 59392.4} {"step": 22659, "train_loss": 3.3041939735412598, "lr": 9.936867916061552e-05, "tps": 25001, "wall": 59398.0} {"step": 22660, "train_loss": 3.312744617462158, "lr": 9.935446069954572e-05, "tps": 25000, "wall": 59403.6} {"step": 22661, "train_loss": 3.2924935817718506, "lr": 9.934024360515518e-05, "tps": 24999, "wall": 59409.2} {"step": 22662, "train_loss": 3.254443645477295, "lr": 9.932602787760488e-05, "tps": 24997, "wall": 59414.8} {"step": 22663, "train_loss": 3.1684141159057617, "lr": 9.931181351705582e-05, "tps": 24996, "wall": 59420.4} {"step": 22664, "train_loss": 3.2648744583129883, "lr": 9.929760052366912e-05, "tps": 24995, "wall": 59425.9} {"step": 22665, "train_loss": 3.236825704574585, "lr": 9.928338889760573e-05, "tps": 24994, "wall": 59431.5} {"step": 22666, "train_loss": 3.255131721496582, "lr": 9.926917863902657e-05, "tps": 24992, "wall": 59437.1} {"step": 22667, "train_loss": 3.3123488426208496, "lr": 9.925496974809278e-05, "tps": 24991, "wall": 59442.7} {"step": 22668, "train_loss": 3.262295722961426, "lr": 9.924076222496513e-05, "tps": 24990, "wall": 59448.3} {"step": 22669, "train_loss": 3.3648815155029297, "lr": 9.922655606980475e-05, "tps": 24989, "wall": 59453.9} {"step": 22670, "train_loss": 3.2538204193115234, "lr": 9.921235128277244e-05, "tps": 24987, "wall": 59459.5} {"step": 22671, "train_loss": 3.277139902114868, "lr": 9.919814786402912e-05, "tps": 24986, "wall": 59465.1} {"step": 22672, "train_loss": 3.2122483253479004, "lr": 9.918394581373575e-05, "tps": 24985, "wall": 59470.6} {"step": 22673, "train_loss": 3.3236494064331055, "lr": 9.916974513205319e-05, "tps": 24984, "wall": 59476.2} {"step": 22674, "train_loss": 3.3658535480499268, "lr": 9.91555458191423e-05, "tps": 24982, "wall": 59481.8} {"step": 22675, "train_loss": 3.2311296463012695, "lr": 9.914134787516392e-05, "tps": 24981, "wall": 59487.4} {"step": 22676, "train_loss": 3.301915168762207, "lr": 9.912715130027883e-05, "tps": 24980, "wall": 59493.0} {"step": 22677, "train_loss": 3.3084046840667725, "lr": 9.911295609464797e-05, "tps": 24979, "wall": 59498.6} {"step": 22678, "train_loss": 3.3157925605773926, "lr": 9.909876225843208e-05, "tps": 24977, "wall": 59504.2} {"step": 22679, "train_loss": 3.262057304382324, "lr": 9.90845697917919e-05, "tps": 24976, "wall": 59509.8} {"step": 22680, "train_loss": 3.2283191680908203, "lr": 9.907037869488831e-05, "tps": 24975, "wall": 59515.5} {"step": 22681, "train_loss": 3.2412304878234863, "lr": 9.905618896788199e-05, "tps": 24974, "wall": 59521.1} {"step": 22682, "train_loss": 3.277452230453491, "lr": 9.904200061093369e-05, "tps": 24972, "wall": 59526.7} {"step": 22683, "train_loss": 3.3805370330810547, "lr": 9.902781362420417e-05, "tps": 24971, "wall": 59532.3} {"step": 22684, "train_loss": 3.266911029815674, "lr": 9.901362800785414e-05, "tps": 24970, "wall": 59537.9} {"step": 22685, "train_loss": 3.2668848037719727, "lr": 9.89994437620442e-05, "tps": 24969, "wall": 59543.5} {"step": 22686, "train_loss": 3.295393705368042, "lr": 9.89852608869352e-05, "tps": 24967, "wall": 59549.1} {"step": 22687, "train_loss": 3.1884613037109375, "lr": 9.897107938268769e-05, "tps": 24966, "wall": 59554.8} {"step": 22688, "train_loss": 3.263749361038208, "lr": 9.895689924946228e-05, "tps": 24965, "wall": 59560.4} {"step": 22689, "train_loss": 3.3566737174987793, "lr": 9.894272048741973e-05, "tps": 24964, "wall": 59566.0} {"step": 22690, "train_loss": 3.2763805389404297, "lr": 9.892854309672059e-05, "tps": 24962, "wall": 59571.6} {"step": 22691, "train_loss": 3.3110499382019043, "lr": 9.89143670775254e-05, "tps": 24961, "wall": 59577.1} {"step": 22692, "train_loss": 3.2688534259796143, "lr": 9.890019242999486e-05, "tps": 24960, "wall": 59582.8} {"step": 22693, "train_loss": 3.3293819427490234, "lr": 9.888601915428944e-05, "tps": 24959, "wall": 59588.3} {"step": 22694, "train_loss": 3.373535633087158, "lr": 9.887184725056981e-05, "tps": 24957, "wall": 59593.9} {"step": 22695, "train_loss": 3.290832042694092, "lr": 9.885767671899646e-05, "tps": 24956, "wall": 59599.5} {"step": 22696, "train_loss": 3.337357759475708, "lr": 9.884350755972983e-05, "tps": 24955, "wall": 59605.0} {"step": 22697, "train_loss": 3.26265549659729, "lr": 9.882933977293057e-05, "tps": 24954, "wall": 59610.7} {"step": 22698, "train_loss": 3.197338581085205, "lr": 9.881517335875909e-05, "tps": 24952, "wall": 59616.5} {"step": 22699, "train_loss": 3.221543788909912, "lr": 9.880100831737582e-05, "tps": 24951, "wall": 59622.0} {"step": 22700, "train_loss": 3.205631732940674, "lr": 9.878684464894136e-05, "tps": 24950, "wall": 59627.6} {"step": 22701, "train_loss": 3.31681489944458, "lr": 9.877268235361607e-05, "tps": 24949, "wall": 59633.2} {"step": 22702, "train_loss": 3.3147971630096436, "lr": 9.875852143156034e-05, "tps": 24947, "wall": 59638.8} {"step": 22703, "train_loss": 3.256417751312256, "lr": 9.87443618829347e-05, "tps": 24946, "wall": 59644.3} {"step": 22704, "train_loss": 3.2381601333618164, "lr": 9.873020370789948e-05, "tps": 24945, "wall": 59649.9} {"step": 22705, "train_loss": 3.360386371612549, "lr": 9.871604690661501e-05, "tps": 24944, "wall": 59655.5} {"step": 22706, "train_loss": 3.308751106262207, "lr": 9.870189147924177e-05, "tps": 24942, "wall": 59661.1} {"step": 22707, "train_loss": 3.310299873352051, "lr": 9.86877374259401e-05, "tps": 24941, "wall": 59666.7} {"step": 22708, "train_loss": 3.3625974655151367, "lr": 9.867358474687022e-05, "tps": 24940, "wall": 59672.3} {"step": 22709, "train_loss": 3.26920485496521, "lr": 9.865943344219261e-05, "tps": 24939, "wall": 59677.9} {"step": 22710, "train_loss": 3.352421522140503, "lr": 9.864528351206743e-05, "tps": 24938, "wall": 59683.5} {"step": 22711, "train_loss": 3.2496509552001953, "lr": 9.863113495665512e-05, "tps": 24936, "wall": 59689.1} {"step": 22712, "train_loss": 3.3025994300842285, "lr": 9.861698777611587e-05, "tps": 24935, "wall": 59694.7} {"step": 22713, "train_loss": 3.2131729125976562, "lr": 9.860284197060987e-05, "tps": 24934, "wall": 59700.3} {"step": 22714, "train_loss": 3.18509840965271, "lr": 9.858869754029752e-05, "tps": 24933, "wall": 59706.0} {"step": 22715, "train_loss": 3.334550619125366, "lr": 9.857455448533896e-05, "tps": 24931, "wall": 59711.6} {"step": 22716, "train_loss": 3.313594341278076, "lr": 9.856041280589439e-05, "tps": 24930, "wall": 59717.2} {"step": 22717, "train_loss": 3.355351209640503, "lr": 9.854627250212407e-05, "tps": 24929, "wall": 59722.8} {"step": 22718, "train_loss": 3.2602953910827637, "lr": 9.853213357418814e-05, "tps": 24928, "wall": 59728.4} {"step": 22719, "train_loss": 3.331606864929199, "lr": 9.851799602224671e-05, "tps": 24926, "wall": 59734.1} {"step": 22720, "train_loss": 3.3101131916046143, "lr": 9.850385984646008e-05, "tps": 24925, "wall": 59739.7} {"step": 22721, "train_loss": 3.302474021911621, "lr": 9.848972504698828e-05, "tps": 24924, "wall": 59745.3} {"step": 22722, "train_loss": 3.2547950744628906, "lr": 9.84755916239914e-05, "tps": 24923, "wall": 59750.9} {"step": 22723, "train_loss": 3.2447099685668945, "lr": 9.846145957762962e-05, "tps": 24921, "wall": 59756.5} {"step": 22724, "train_loss": 3.302445411682129, "lr": 9.844732890806302e-05, "tps": 24920, "wall": 59762.1} {"step": 22725, "train_loss": 3.2877230644226074, "lr": 9.843319961545161e-05, "tps": 24919, "wall": 59767.7} {"step": 22726, "train_loss": 3.2676658630371094, "lr": 9.841907169995552e-05, "tps": 24918, "wall": 59773.3} {"step": 22727, "train_loss": 3.3442249298095703, "lr": 9.840494516173473e-05, "tps": 24916, "wall": 59778.9} {"step": 22728, "train_loss": 3.2899928092956543, "lr": 9.839082000094934e-05, "tps": 24915, "wall": 59784.5} {"step": 22729, "train_loss": 3.3109607696533203, "lr": 9.837669621775936e-05, "tps": 24914, "wall": 59790.1} {"step": 22730, "train_loss": 3.301868200302124, "lr": 9.836257381232463e-05, "tps": 24913, "wall": 59795.7} {"step": 22731, "train_loss": 3.2566494941711426, "lr": 9.834845278480534e-05, "tps": 24911, "wall": 59801.3} {"step": 22732, "train_loss": 3.3352363109588623, "lr": 9.833433313536135e-05, "tps": 24910, "wall": 59806.9} {"step": 22733, "train_loss": 3.310546398162842, "lr": 9.832021486415255e-05, "tps": 24909, "wall": 59812.5} {"step": 22734, "train_loss": 3.200962781906128, "lr": 9.830609797133901e-05, "tps": 24908, "wall": 59818.1} {"step": 22735, "train_loss": 3.26198148727417, "lr": 9.829198245708056e-05, "tps": 24906, "wall": 59823.7} {"step": 22736, "train_loss": 3.16682767868042, "lr": 9.827786832153706e-05, "tps": 24905, "wall": 59829.2} {"step": 22737, "train_loss": 3.2633447647094727, "lr": 9.826375556486851e-05, "tps": 24904, "wall": 59834.9} {"step": 22738, "train_loss": 3.310689926147461, "lr": 9.824964418723475e-05, "tps": 24903, "wall": 59840.4} {"step": 22739, "train_loss": 3.2298200130462646, "lr": 9.823553418879552e-05, "tps": 24902, "wall": 59846.0} {"step": 22740, "train_loss": 3.194056749343872, "lr": 9.822142556971083e-05, "tps": 24900, "wall": 59851.7} {"step": 22741, "train_loss": 3.3503036499023438, "lr": 9.820731833014038e-05, "tps": 24899, "wall": 59857.3} {"step": 22742, "train_loss": 3.272493839263916, "lr": 9.8193212470244e-05, "tps": 24898, "wall": 59862.9} {"step": 22743, "train_loss": 3.3103511333465576, "lr": 9.817910799018153e-05, "tps": 24897, "wall": 59868.5} {"step": 22744, "train_loss": 3.3810105323791504, "lr": 9.816500489011272e-05, "tps": 24895, "wall": 59874.1} {"step": 22745, "train_loss": 3.302095413208008, "lr": 9.815090317019727e-05, "tps": 24894, "wall": 59879.7} {"step": 22746, "train_loss": 3.3830461502075195, "lr": 9.813680283059505e-05, "tps": 24893, "wall": 59885.4} {"step": 22747, "train_loss": 3.276503324508667, "lr": 9.812270387146566e-05, "tps": 24892, "wall": 59891.0} {"step": 22748, "train_loss": 3.318030834197998, "lr": 9.810860629296892e-05, "tps": 24890, "wall": 59896.6} {"step": 22749, "train_loss": 3.3175768852233887, "lr": 9.809451009526449e-05, "tps": 24889, "wall": 59902.3} {"step": 22750, "train_loss": 3.3273987770080566, "lr": 9.808041527851199e-05, "tps": 24888, "wall": 59907.9} {"step": 22751, "train_loss": 3.2556135654449463, "lr": 9.80663218428712e-05, "tps": 24887, "wall": 59913.5} {"step": 22752, "train_loss": 3.3034520149230957, "lr": 9.805222978850169e-05, "tps": 24885, "wall": 59919.2} {"step": 22753, "train_loss": 3.2389495372772217, "lr": 9.803813911556306e-05, "tps": 24884, "wall": 59924.8} {"step": 22754, "train_loss": 3.2577309608459473, "lr": 9.802404982421508e-05, "tps": 24883, "wall": 59930.4} {"step": 22755, "train_loss": 3.261756420135498, "lr": 9.800996191461724e-05, "tps": 24882, "wall": 59936.0} {"step": 22756, "train_loss": 3.3124313354492188, "lr": 9.79958753869291e-05, "tps": 24880, "wall": 59941.7} {"step": 22757, "train_loss": 3.2994697093963623, "lr": 9.798179024131032e-05, "tps": 24879, "wall": 59947.3} {"step": 22758, "train_loss": 3.310685157775879, "lr": 9.796770647792045e-05, "tps": 24878, "wall": 59952.9} {"step": 22759, "train_loss": 3.179457664489746, "lr": 9.795362409691894e-05, "tps": 24877, "wall": 59958.5} {"step": 22760, "train_loss": 3.1927223205566406, "lr": 9.793954309846542e-05, "tps": 24875, "wall": 59964.1} {"step": 22761, "train_loss": 3.324728012084961, "lr": 9.792546348271938e-05, "tps": 24874, "wall": 59969.7} {"step": 22762, "train_loss": 3.33438777923584, "lr": 9.791138524984023e-05, "tps": 24873, "wall": 59975.4} {"step": 22763, "train_loss": 3.314939022064209, "lr": 9.789730839998756e-05, "tps": 24872, "wall": 59981.0} {"step": 22764, "train_loss": 3.2109391689300537, "lr": 9.788323293332074e-05, "tps": 24870, "wall": 59986.6} {"step": 22765, "train_loss": 3.2898366451263428, "lr": 9.786915884999932e-05, "tps": 24869, "wall": 59992.3} {"step": 22766, "train_loss": 3.246565341949463, "lr": 9.785508615018268e-05, "tps": 24868, "wall": 59997.8} {"step": 22767, "train_loss": 3.2491769790649414, "lr": 9.784101483403016e-05, "tps": 24867, "wall": 60003.5} {"step": 22768, "train_loss": 3.331664562225342, "lr": 9.78269449017013e-05, "tps": 24866, "wall": 60009.1} {"step": 22769, "train_loss": 3.266498565673828, "lr": 9.781287635335541e-05, "tps": 24864, "wall": 60014.7} {"step": 22770, "train_loss": 3.2895073890686035, "lr": 9.77988091891518e-05, "tps": 24863, "wall": 60020.3} {"step": 22771, "train_loss": 3.3822507858276367, "lr": 9.778474340925e-05, "tps": 24862, "wall": 60025.9} {"step": 22772, "train_loss": 3.2429494857788086, "lr": 9.777067901380918e-05, "tps": 24861, "wall": 60031.5} {"step": 22773, "train_loss": 3.307032585144043, "lr": 9.775661600298868e-05, "tps": 24859, "wall": 60037.3} {"step": 22774, "train_loss": 3.343043804168701, "lr": 9.77425543769479e-05, "tps": 24858, "wall": 60042.9} {"step": 22775, "train_loss": 3.286804676055908, "lr": 9.77284941358461e-05, "tps": 24857, "wall": 60048.5} {"step": 22776, "train_loss": 3.261946201324463, "lr": 9.771443527984245e-05, "tps": 24856, "wall": 60054.2} {"step": 22777, "train_loss": 3.317509651184082, "lr": 9.770037780909636e-05, "tps": 24854, "wall": 60059.8} {"step": 22778, "train_loss": 3.325272798538208, "lr": 9.768632172376701e-05, "tps": 24853, "wall": 60065.5} {"step": 22779, "train_loss": 3.3505356311798096, "lr": 9.767226702401357e-05, "tps": 24852, "wall": 60071.1} {"step": 22780, "train_loss": 3.2323691844940186, "lr": 9.765821370999536e-05, "tps": 24851, "wall": 60076.7} {"step": 22781, "train_loss": 3.2134246826171875, "lr": 9.764416178187147e-05, "tps": 24849, "wall": 60082.4} {"step": 22782, "train_loss": 3.207592010498047, "lr": 9.76301112398012e-05, "tps": 24848, "wall": 60088.0} {"step": 22783, "train_loss": 3.225891351699829, "lr": 9.761606208394363e-05, "tps": 24847, "wall": 60093.7} {"step": 22784, "train_loss": 3.282170534133911, "lr": 9.76020143144579e-05, "tps": 24846, "wall": 60099.3} {"step": 22785, "train_loss": 3.227781295776367, "lr": 9.75879679315032e-05, "tps": 24844, "wall": 60104.9} {"step": 22786, "train_loss": 3.377918243408203, "lr": 9.757392293523863e-05, "tps": 24843, "wall": 60110.5} {"step": 22787, "train_loss": 3.3170971870422363, "lr": 9.755987932582322e-05, "tps": 24842, "wall": 60116.1} {"step": 22788, "train_loss": 3.2752935886383057, "lr": 9.754583710341621e-05, "tps": 24841, "wall": 60121.7} {"step": 22789, "train_loss": 3.242389678955078, "lr": 9.753179626817654e-05, "tps": 24840, "wall": 60127.3} {"step": 22790, "train_loss": 3.2751941680908203, "lr": 9.751775682026327e-05, "tps": 24838, "wall": 60133.0} {"step": 22791, "train_loss": 3.369699478149414, "lr": 9.750371875983554e-05, "tps": 24837, "wall": 60138.6} {"step": 22792, "train_loss": 3.1735029220581055, "lr": 9.748968208705231e-05, "tps": 24836, "wall": 60144.2} {"step": 22793, "train_loss": 3.281951904296875, "lr": 9.747564680207251e-05, "tps": 24835, "wall": 60149.9} {"step": 22794, "train_loss": 3.2144010066986084, "lr": 9.74616129050553e-05, "tps": 24833, "wall": 60155.7} {"step": 22795, "train_loss": 3.2872071266174316, "lr": 9.744758039615955e-05, "tps": 24832, "wall": 60161.3} {"step": 22796, "train_loss": 3.322744369506836, "lr": 9.743354927554418e-05, "tps": 24831, "wall": 60166.8} {"step": 22797, "train_loss": 3.2992095947265625, "lr": 9.741951954336827e-05, "tps": 24830, "wall": 60172.5} {"step": 22798, "train_loss": 3.204902172088623, "lr": 9.740549119979066e-05, "tps": 24828, "wall": 60178.1} {"step": 22799, "train_loss": 3.337749481201172, "lr": 9.739146424497023e-05, "tps": 24827, "wall": 60183.7} {"step": 22800, "train_loss": 3.3090341091156006, "lr": 9.737743867906597e-05, "tps": 24826, "wall": 60189.3} {"step": 22801, "train_loss": 3.4473137855529785, "lr": 9.736341450223666e-05, "tps": 24825, "wall": 60195.0} {"step": 22802, "train_loss": 3.2954869270324707, "lr": 9.73493917146413e-05, "tps": 24823, "wall": 60200.6} {"step": 22803, "train_loss": 3.2634077072143555, "lr": 9.733537031643866e-05, "tps": 24822, "wall": 60206.2} {"step": 22804, "train_loss": 3.1795477867126465, "lr": 9.732135030778751e-05, "tps": 24821, "wall": 60211.8} {"step": 22805, "train_loss": 3.2804291248321533, "lr": 9.730733168884681e-05, "tps": 24820, "wall": 60217.5} {"step": 22806, "train_loss": 3.2195181846618652, "lr": 9.729331445977528e-05, "tps": 24819, "wall": 60223.2} {"step": 22807, "train_loss": 3.2194135189056396, "lr": 9.72792986207317e-05, "tps": 24817, "wall": 60228.8} {"step": 22808, "train_loss": 3.1796398162841797, "lr": 9.726528417187487e-05, "tps": 24816, "wall": 60234.4} {"step": 22809, "train_loss": 3.37368106842041, "lr": 9.725127111336359e-05, "tps": 24815, "wall": 60240.0} {"step": 22810, "train_loss": 3.3010990619659424, "lr": 9.723725944535645e-05, "tps": 24814, "wall": 60245.6} {"step": 22811, "train_loss": 3.253744602203369, "lr": 9.722324916801238e-05, "tps": 24812, "wall": 60251.3} {"step": 22812, "train_loss": 3.3397138118743896, "lr": 9.720924028148996e-05, "tps": 24811, "wall": 60256.9} {"step": 22813, "train_loss": 3.348126173019409, "lr": 9.719523278594785e-05, "tps": 24810, "wall": 60262.6} {"step": 22814, "train_loss": 3.23565673828125, "lr": 9.718122668154485e-05, "tps": 24809, "wall": 60268.2} {"step": 22815, "train_loss": 3.2610042095184326, "lr": 9.716722196843955e-05, "tps": 24807, "wall": 60273.8} {"step": 22816, "train_loss": 3.3380517959594727, "lr": 9.715321864679057e-05, "tps": 24806, "wall": 60279.5} {"step": 22817, "train_loss": 3.218050003051758, "lr": 9.71392167167566e-05, "tps": 24805, "wall": 60285.1} {"step": 22818, "train_loss": 3.255391836166382, "lr": 9.71252161784962e-05, "tps": 24804, "wall": 60290.8} {"step": 22819, "train_loss": 3.2209320068359375, "lr": 9.711121703216803e-05, "tps": 24803, "wall": 60296.3} {"step": 22820, "train_loss": 3.245204448699951, "lr": 9.709721927793065e-05, "tps": 24801, "wall": 60301.9} {"step": 22821, "train_loss": 3.3339388370513916, "lr": 9.708322291594257e-05, "tps": 24800, "wall": 60307.6} {"step": 22822, "train_loss": 3.1824727058410645, "lr": 9.706922794636244e-05, "tps": 24799, "wall": 60313.2} {"step": 22823, "train_loss": 3.311574935913086, "lr": 9.705523436934876e-05, "tps": 24798, "wall": 60318.8} {"step": 22824, "train_loss": 3.1664209365844727, "lr": 9.704124218505997e-05, "tps": 24796, "wall": 60324.5} {"step": 22825, "train_loss": 3.3387341499328613, "lr": 9.702725139365469e-05, "tps": 24795, "wall": 60330.1} {"step": 22826, "train_loss": 3.2757413387298584, "lr": 9.701326199529138e-05, "tps": 24794, "wall": 60335.8} {"step": 22827, "train_loss": 3.2812294960021973, "lr": 9.699927399012841e-05, "tps": 24793, "wall": 60341.4} {"step": 22828, "train_loss": 3.3559439182281494, "lr": 9.698528737832439e-05, "tps": 24791, "wall": 60347.0} {"step": 22829, "train_loss": 3.4264631271362305, "lr": 9.697130216003769e-05, "tps": 24790, "wall": 60352.6} {"step": 22830, "train_loss": 3.2501001358032227, "lr": 9.695731833542666e-05, "tps": 24789, "wall": 60358.2} {"step": 22831, "train_loss": 3.3215372562408447, "lr": 9.694333590464986e-05, "tps": 24788, "wall": 60363.9} {"step": 22832, "train_loss": 3.2079055309295654, "lr": 9.692935486786562e-05, "tps": 24787, "wall": 60369.5} {"step": 22833, "train_loss": 3.3117804527282715, "lr": 9.691537522523222e-05, "tps": 24785, "wall": 60375.1} {"step": 22834, "train_loss": 3.3614745140075684, "lr": 9.690139697690819e-05, "tps": 24784, "wall": 60380.7} {"step": 22835, "train_loss": 3.3641984462738037, "lr": 9.688742012305171e-05, "tps": 24783, "wall": 60386.3} {"step": 22836, "train_loss": 3.244325876235962, "lr": 9.687344466382127e-05, "tps": 24782, "wall": 60391.9} {"step": 22837, "train_loss": 3.172825574874878, "lr": 9.685947059937512e-05, "tps": 24780, "wall": 60397.7} {"step": 22838, "train_loss": 3.2548468112945557, "lr": 9.684549792987146e-05, "tps": 24779, "wall": 60403.3} {"step": 22839, "train_loss": 3.167202949523926, "lr": 9.683152665546876e-05, "tps": 24778, "wall": 60408.9} {"step": 22840, "train_loss": 3.1921024322509766, "lr": 9.681755677632515e-05, "tps": 24777, "wall": 60414.5} {"step": 22841, "train_loss": 3.2747626304626465, "lr": 9.68035882925989e-05, "tps": 24776, "wall": 60420.1} {"step": 22842, "train_loss": 3.3746273517608643, "lr": 9.67896212044483e-05, "tps": 24774, "wall": 60425.7} {"step": 22843, "train_loss": 3.2400307655334473, "lr": 9.677565551203154e-05, "tps": 24773, "wall": 60431.3} {"step": 22844, "train_loss": 3.2894296646118164, "lr": 9.67616912155068e-05, "tps": 24772, "wall": 60436.9} {"step": 22845, "train_loss": 3.2809088230133057, "lr": 9.674772831503232e-05, "tps": 24771, "wall": 60442.5} {"step": 22846, "train_loss": 3.2221198081970215, "lr": 9.673376681076618e-05, "tps": 24770, "wall": 60448.1} {"step": 22847, "train_loss": 3.2100107669830322, "lr": 9.671980670286665e-05, "tps": 24768, "wall": 60453.8} {"step": 22848, "train_loss": 3.2664620876312256, "lr": 9.670584799149182e-05, "tps": 24767, "wall": 60459.4} {"step": 22849, "train_loss": 3.2823333740234375, "lr": 9.669189067679976e-05, "tps": 24766, "wall": 60465.0} {"step": 22850, "train_loss": 3.1786060333251953, "lr": 9.66779347589487e-05, "tps": 24765, "wall": 60470.7} {"step": 22851, "train_loss": 3.2547311782836914, "lr": 9.666398023809666e-05, "tps": 24763, "wall": 60476.3} {"step": 22852, "train_loss": 3.278823137283325, "lr": 9.665002711440163e-05, "tps": 24762, "wall": 60481.9} {"step": 22853, "train_loss": 3.238478660583496, "lr": 9.663607538802186e-05, "tps": 24761, "wall": 60487.5} {"step": 22854, "train_loss": 3.1956980228424072, "lr": 9.662212505911531e-05, "tps": 24760, "wall": 60493.1} {"step": 22855, "train_loss": 3.2960190773010254, "lr": 9.660817612783993e-05, "tps": 24759, "wall": 60498.7} {"step": 22856, "train_loss": 3.343742847442627, "lr": 9.659422859435387e-05, "tps": 24757, "wall": 60504.2} {"step": 22857, "train_loss": 3.37026309967041, "lr": 9.658028245881506e-05, "tps": 24756, "wall": 60509.8} {"step": 22858, "train_loss": 3.282813549041748, "lr": 9.656633772138142e-05, "tps": 24755, "wall": 60515.5} {"step": 22859, "train_loss": 3.2372231483459473, "lr": 9.655239438221106e-05, "tps": 24754, "wall": 60521.0} {"step": 22860, "train_loss": 3.2094039916992188, "lr": 9.653845244146177e-05, "tps": 24753, "wall": 60526.6} {"step": 22861, "train_loss": 3.255086898803711, "lr": 9.652451189929166e-05, "tps": 24751, "wall": 60532.2} {"step": 22862, "train_loss": 3.2896533012390137, "lr": 9.651057275585852e-05, "tps": 24750, "wall": 60537.8} {"step": 22863, "train_loss": 3.206223964691162, "lr": 9.649663501132027e-05, "tps": 24749, "wall": 60543.3} {"step": 22864, "train_loss": 3.267495632171631, "lr": 9.648269866583488e-05, "tps": 24748, "wall": 60548.9} {"step": 22865, "train_loss": 3.2132301330566406, "lr": 9.646876371956015e-05, "tps": 24747, "wall": 60554.5} {"step": 22866, "train_loss": 3.1779556274414062, "lr": 9.645483017265388e-05, "tps": 24745, "wall": 60560.0} {"step": 22867, "train_loss": 3.338009834289551, "lr": 9.644089802527403e-05, "tps": 24744, "wall": 60565.6} {"step": 22868, "train_loss": 3.2932894229888916, "lr": 9.642696727757839e-05, "tps": 24743, "wall": 60571.2} {"step": 22869, "train_loss": 3.3134818077087402, "lr": 9.641303792972471e-05, "tps": 24742, "wall": 60576.9} {"step": 22870, "train_loss": 3.310209274291992, "lr": 9.639910998187084e-05, "tps": 24741, "wall": 60582.5} {"step": 22871, "train_loss": 3.2390763759613037, "lr": 9.638518343417457e-05, "tps": 24739, "wall": 60588.1} {"step": 22872, "train_loss": 3.3207342624664307, "lr": 9.637125828679353e-05, "tps": 24738, "wall": 60593.7} {"step": 22873, "train_loss": 3.286184072494507, "lr": 9.635733453988567e-05, "tps": 24737, "wall": 60599.2} {"step": 22874, "train_loss": 3.2141494750976562, "lr": 9.634341219360859e-05, "tps": 24736, "wall": 60604.8} {"step": 22875, "train_loss": 3.2556328773498535, "lr": 9.632949124811997e-05, "tps": 24735, "wall": 60610.4} {"step": 22876, "train_loss": 3.3155434131622314, "lr": 9.631557170357763e-05, "tps": 24733, "wall": 60616.0} {"step": 22877, "train_loss": 3.221649169921875, "lr": 9.630165356013917e-05, "tps": 24732, "wall": 60621.5} {"step": 22878, "train_loss": 3.2215654850006104, "lr": 9.628773681796222e-05, "tps": 24731, "wall": 60627.1} {"step": 22879, "train_loss": 3.1360485553741455, "lr": 9.627382147720454e-05, "tps": 24730, "wall": 60632.7} {"step": 22880, "train_loss": 3.2391369342803955, "lr": 9.625990753802364e-05, "tps": 24729, "wall": 60638.3} {"step": 22881, "train_loss": 3.297485828399658, "lr": 9.624599500057728e-05, "tps": 24727, "wall": 60643.9} {"step": 22882, "train_loss": 3.255833625793457, "lr": 9.623208386502295e-05, "tps": 24726, "wall": 60649.5} {"step": 22883, "train_loss": 3.073174476623535, "lr": 9.621817413151825e-05, "tps": 24725, "wall": 60655.1} {"step": 22884, "train_loss": 3.339369297027588, "lr": 9.620426580022078e-05, "tps": 24724, "wall": 60660.7} {"step": 22885, "train_loss": 3.247436046600342, "lr": 9.619035887128813e-05, "tps": 24723, "wall": 60666.3} {"step": 22886, "train_loss": 3.228365898132324, "lr": 9.61764533448777e-05, "tps": 24721, "wall": 60671.9} {"step": 22887, "train_loss": 3.2396678924560547, "lr": 9.616254922114719e-05, "tps": 24720, "wall": 60677.5} {"step": 22888, "train_loss": 3.138420820236206, "lr": 9.614864650025401e-05, "tps": 24719, "wall": 60683.0} {"step": 22889, "train_loss": 3.2931525707244873, "lr": 9.613474518235561e-05, "tps": 24718, "wall": 60688.6} {"step": 22890, "train_loss": 3.2271203994750977, "lr": 9.612084526760956e-05, "tps": 24717, "wall": 60694.3} {"step": 22891, "train_loss": 3.3039326667785645, "lr": 9.610694675617329e-05, "tps": 24715, "wall": 60699.8} {"step": 22892, "train_loss": 3.295987606048584, "lr": 9.609304964820417e-05, "tps": 24714, "wall": 60705.5} {"step": 22893, "train_loss": 3.2324399948120117, "lr": 9.607915394385975e-05, "tps": 24713, "wall": 60711.1} {"step": 22894, "train_loss": 3.317619800567627, "lr": 9.606525964329738e-05, "tps": 24712, "wall": 60716.7} {"step": 22895, "train_loss": 3.262831926345825, "lr": 9.605136674667438e-05, "tps": 24711, "wall": 60722.2} {"step": 22896, "train_loss": 3.335730791091919, "lr": 9.603747525414827e-05, "tps": 24709, "wall": 60727.8} {"step": 22897, "train_loss": 3.2384517192840576, "lr": 9.602358516587627e-05, "tps": 24708, "wall": 60733.5} {"step": 22898, "train_loss": 3.2604153156280518, "lr": 9.600969648201588e-05, "tps": 24707, "wall": 60739.1} {"step": 22899, "train_loss": 3.2187728881835938, "lr": 9.599580920272436e-05, "tps": 24706, "wall": 60744.6} {"step": 22900, "train_loss": 3.431408643722534, "lr": 9.598192332815897e-05, "tps": 24705, "wall": 60750.2} {"step": 22901, "train_loss": 3.2095165252685547, "lr": 9.596803885847712e-05, "tps": 24703, "wall": 60755.9} {"step": 22902, "train_loss": 3.3112471103668213, "lr": 9.595415579383603e-05, "tps": 24702, "wall": 60761.5} {"step": 22903, "train_loss": 3.1878108978271484, "lr": 9.59402741343929e-05, "tps": 24701, "wall": 60767.1} {"step": 22904, "train_loss": 3.1916754245758057, "lr": 9.592639388030512e-05, "tps": 24700, "wall": 60772.7} {"step": 22905, "train_loss": 3.3373069763183594, "lr": 9.591251503172986e-05, "tps": 24699, "wall": 60778.3} {"step": 22906, "train_loss": 3.279572010040283, "lr": 9.58986375888243e-05, "tps": 24697, "wall": 60783.9} {"step": 22907, "train_loss": 3.2132723331451416, "lr": 9.588476155174574e-05, "tps": 24696, "wall": 60789.5} {"step": 22908, "train_loss": 3.184803009033203, "lr": 9.587088692065132e-05, "tps": 24695, "wall": 60795.2} {"step": 22909, "train_loss": 3.2668960094451904, "lr": 9.585701369569813e-05, "tps": 24694, "wall": 60800.8} {"step": 22910, "train_loss": 3.257058620452881, "lr": 9.584314187704348e-05, "tps": 24693, "wall": 60806.4} {"step": 22911, "train_loss": 3.2588374614715576, "lr": 9.582927146484443e-05, "tps": 24691, "wall": 60812.0} {"step": 22912, "train_loss": 3.341017961502075, "lr": 9.581540245925805e-05, "tps": 24690, "wall": 60817.7} {"step": 22913, "train_loss": 3.2912697792053223, "lr": 9.580153486044158e-05, "tps": 24689, "wall": 60823.3} {"step": 22914, "train_loss": 3.2679104804992676, "lr": 9.578766866855198e-05, "tps": 24688, "wall": 60828.9} {"step": 22915, "train_loss": 3.221379041671753, "lr": 9.577380388374643e-05, "tps": 24687, "wall": 60834.5} {"step": 22916, "train_loss": 3.328221559524536, "lr": 9.575994050618197e-05, "tps": 24685, "wall": 60840.1} {"step": 22917, "train_loss": 3.3197944164276123, "lr": 9.574607853601556e-05, "tps": 24684, "wall": 60845.7} {"step": 22918, "train_loss": 3.277115821838379, "lr": 9.573221797340437e-05, "tps": 24683, "wall": 60851.3} {"step": 22919, "train_loss": 3.2977311611175537, "lr": 9.571835881850531e-05, "tps": 24682, "wall": 60856.9} {"step": 22920, "train_loss": 3.2886064052581787, "lr": 9.570450107147534e-05, "tps": 24681, "wall": 60862.5} {"step": 22921, "train_loss": 3.242309093475342, "lr": 9.56906447324716e-05, "tps": 24679, "wall": 60868.1} {"step": 22922, "train_loss": 3.2122106552124023, "lr": 9.567678980165093e-05, "tps": 24678, "wall": 60873.8} {"step": 22923, "train_loss": 3.1860389709472656, "lr": 9.566293627917026e-05, "tps": 24677, "wall": 60879.4} {"step": 22924, "train_loss": 3.275576591491699, "lr": 9.564908416518665e-05, "tps": 24676, "wall": 60885.0} {"step": 22925, "train_loss": 3.237337112426758, "lr": 9.563523345985692e-05, "tps": 24675, "wall": 60890.7} {"step": 22926, "train_loss": 3.245079278945923, "lr": 9.562138416333795e-05, "tps": 24673, "wall": 60896.2} {"step": 22927, "train_loss": 3.3011159896850586, "lr": 9.560753627578674e-05, "tps": 24672, "wall": 60901.8} {"step": 22928, "train_loss": 3.2802371978759766, "lr": 9.559368979736005e-05, "tps": 24671, "wall": 60907.3} {"step": 22929, "train_loss": 3.296297311782837, "lr": 9.557984472821475e-05, "tps": 24670, "wall": 60912.9} {"step": 22930, "train_loss": 3.2586886882781982, "lr": 9.556600106850772e-05, "tps": 24669, "wall": 60918.4} {"step": 22931, "train_loss": 3.2974648475646973, "lr": 9.555215881839581e-05, "tps": 24667, "wall": 60924.1} {"step": 22932, "train_loss": 3.276674747467041, "lr": 9.553831797803569e-05, "tps": 24666, "wall": 60929.7} {"step": 22933, "train_loss": 3.178908348083496, "lr": 9.552447854758428e-05, "tps": 24665, "wall": 60935.4} {"step": 22934, "train_loss": 3.2947068214416504, "lr": 9.551064052719828e-05, "tps": 24664, "wall": 60941.0} {"step": 22935, "train_loss": 3.280867099761963, "lr": 9.549680391703453e-05, "tps": 24663, "wall": 60946.6} {"step": 22936, "train_loss": 3.4078218936920166, "lr": 9.54829687172497e-05, "tps": 24661, "wall": 60952.2} {"step": 22937, "train_loss": 3.2888896465301514, "lr": 9.546913492800053e-05, "tps": 24660, "wall": 60957.9} {"step": 22938, "train_loss": 3.309225082397461, "lr": 9.545530254944376e-05, "tps": 24659, "wall": 60963.5} {"step": 22939, "train_loss": 3.2748732566833496, "lr": 9.544147158173605e-05, "tps": 24658, "wall": 60969.1} {"step": 22940, "train_loss": 3.244504690170288, "lr": 9.542764202503404e-05, "tps": 24657, "wall": 60974.7} {"step": 22941, "train_loss": 3.2876315116882324, "lr": 9.541381387949452e-05, "tps": 24655, "wall": 60980.3} {"step": 22942, "train_loss": 3.3524394035339355, "lr": 9.539998714527402e-05, "tps": 24654, "wall": 60985.9} {"step": 22943, "train_loss": 3.3372435569763184, "lr": 9.538616182252918e-05, "tps": 24653, "wall": 60991.5} {"step": 22944, "train_loss": 3.2537388801574707, "lr": 9.537233791141667e-05, "tps": 24652, "wall": 60997.2} {"step": 22945, "train_loss": 3.1922473907470703, "lr": 9.535851541209308e-05, "tps": 24651, "wall": 61002.8} {"step": 22946, "train_loss": 3.262643575668335, "lr": 9.534469432471491e-05, "tps": 24649, "wall": 61008.4} {"step": 22947, "train_loss": 3.2989020347595215, "lr": 9.533087464943885e-05, "tps": 24648, "wall": 61014.0} {"step": 22948, "train_loss": 3.1667964458465576, "lr": 9.531705638642137e-05, "tps": 24647, "wall": 61019.7} {"step": 22949, "train_loss": 3.250173568725586, "lr": 9.530323953581896e-05, "tps": 24646, "wall": 61025.3} {"step": 22950, "train_loss": 3.250047206878662, "lr": 9.528942409778828e-05, "tps": 24645, "wall": 61030.9} {"step": 22951, "train_loss": 3.2109789848327637, "lr": 9.527561007248566e-05, "tps": 24643, "wall": 61036.5} {"step": 22952, "train_loss": 3.2520220279693604, "lr": 9.526179746006777e-05, "tps": 24642, "wall": 61042.1} {"step": 22953, "train_loss": 3.240267038345337, "lr": 9.524798626069097e-05, "tps": 24641, "wall": 61047.7} {"step": 22954, "train_loss": 3.277818202972412, "lr": 9.523417647451167e-05, "tps": 24640, "wall": 61053.3} {"step": 22955, "train_loss": 3.2384517192840576, "lr": 9.522036810168643e-05, "tps": 24639, "wall": 61059.1} {"step": 22956, "train_loss": 3.270724296569824, "lr": 9.52065611423716e-05, "tps": 24637, "wall": 61064.7} {"step": 22957, "train_loss": 3.4768776893615723, "lr": 9.519275559672356e-05, "tps": 24636, "wall": 61070.3} {"step": 22958, "train_loss": 3.2814698219299316, "lr": 9.517895146489877e-05, "tps": 24635, "wall": 61075.9} {"step": 22959, "train_loss": 3.2654032707214355, "lr": 9.516514874705359e-05, "tps": 24634, "wall": 61081.6} {"step": 22960, "train_loss": 3.323087692260742, "lr": 9.51513474433443e-05, "tps": 24633, "wall": 61087.2} {"step": 22961, "train_loss": 3.217243194580078, "lr": 9.513754755392735e-05, "tps": 24631, "wall": 61092.8} {"step": 22962, "train_loss": 3.2697181701660156, "lr": 9.512374907895902e-05, "tps": 24630, "wall": 61098.5} {"step": 22963, "train_loss": 3.302885055541992, "lr": 9.510995201859555e-05, "tps": 24629, "wall": 61104.1} {"step": 22964, "train_loss": 3.270533800125122, "lr": 9.509615637299336e-05, "tps": 24628, "wall": 61109.7} {"step": 22965, "train_loss": 3.2571053504943848, "lr": 9.508236214230866e-05, "tps": 24627, "wall": 61115.5} {"step": 22966, "train_loss": 3.163719654083252, "lr": 9.506856932669769e-05, "tps": 24625, "wall": 61121.1} {"step": 22967, "train_loss": 3.28379487991333, "lr": 9.505477792631678e-05, "tps": 24624, "wall": 61126.7} {"step": 22968, "train_loss": 3.2367446422576904, "lr": 9.504098794132202e-05, "tps": 24623, "wall": 61132.3} {"step": 22969, "train_loss": 3.221644401550293, "lr": 9.502719937186979e-05, "tps": 24622, "wall": 61138.0} {"step": 22970, "train_loss": 3.298323154449463, "lr": 9.501341221811619e-05, "tps": 24621, "wall": 61143.6} {"step": 22971, "train_loss": 3.2104134559631348, "lr": 9.499962648021737e-05, "tps": 24619, "wall": 61149.3} {"step": 22972, "train_loss": 3.268489360809326, "lr": 9.498584215832959e-05, "tps": 24618, "wall": 61154.9} {"step": 22973, "train_loss": 3.2589001655578613, "lr": 9.497205925260898e-05, "tps": 24617, "wall": 61160.6} {"step": 22974, "train_loss": 3.3696179389953613, "lr": 9.495827776321154e-05, "tps": 24616, "wall": 61166.1} {"step": 22975, "train_loss": 3.323479652404785, "lr": 9.49444976902936e-05, "tps": 24615, "wall": 61171.8} {"step": 22976, "train_loss": 3.329211473464966, "lr": 9.493071903401115e-05, "tps": 24613, "wall": 61177.5} {"step": 22977, "train_loss": 3.2851715087890625, "lr": 9.49169417945202e-05, "tps": 24612, "wall": 61183.0} {"step": 22978, "train_loss": 3.465254306793213, "lr": 9.490316597197696e-05, "tps": 24611, "wall": 61188.7} {"step": 22979, "train_loss": 3.327822208404541, "lr": 9.488939156653745e-05, "tps": 24610, "wall": 61194.4} {"step": 22980, "train_loss": 3.2391164302825928, "lr": 9.487561857835759e-05, "tps": 24609, "wall": 61199.9} {"step": 22981, "train_loss": 3.4083025455474854, "lr": 9.486184700759356e-05, "tps": 24608, "wall": 61205.5} {"step": 22982, "train_loss": 3.2969281673431396, "lr": 9.484807685440133e-05, "tps": 24606, "wall": 61211.0} {"step": 22983, "train_loss": 3.3025336265563965, "lr": 9.483430811893676e-05, "tps": 24605, "wall": 61216.6} {"step": 22984, "train_loss": 3.202622175216675, "lr": 9.4820540801356e-05, "tps": 24604, "wall": 61222.2} {"step": 22985, "train_loss": 3.2431209087371826, "lr": 9.48067749018149e-05, "tps": 24603, "wall": 61227.8} {"step": 22986, "train_loss": 3.286177635192871, "lr": 9.479301042046939e-05, "tps": 24602, "wall": 61233.4} {"step": 22987, "train_loss": 3.2595109939575195, "lr": 9.477924735747547e-05, "tps": 24600, "wall": 61239.1} {"step": 22988, "train_loss": 3.2613818645477295, "lr": 9.476548571298897e-05, "tps": 24599, "wall": 61244.8} {"step": 22989, "train_loss": 3.2138659954071045, "lr": 9.475172548716587e-05, "tps": 24598, "wall": 61250.4} {"step": 22990, "train_loss": 3.2688052654266357, "lr": 9.473796668016201e-05, "tps": 24597, "wall": 61256.0} {"step": 22991, "train_loss": 3.223365545272827, "lr": 9.472420929213317e-05, "tps": 24596, "wall": 61261.6} {"step": 22992, "train_loss": 3.323168992996216, "lr": 9.471045332323532e-05, "tps": 24595, "wall": 61267.2} {"step": 22993, "train_loss": 3.2197275161743164, "lr": 9.469669877362425e-05, "tps": 24593, "wall": 61272.9} {"step": 22994, "train_loss": 3.3077991008758545, "lr": 9.468294564345568e-05, "tps": 24592, "wall": 61278.5} {"step": 22995, "train_loss": 3.262009620666504, "lr": 9.466919393288556e-05, "tps": 24591, "wall": 61284.1} {"step": 22996, "train_loss": 3.311962842941284, "lr": 9.465544364206958e-05, "tps": 24590, "wall": 61289.7} {"step": 22997, "train_loss": 3.2405669689178467, "lr": 9.464169477116346e-05, "tps": 24589, "wall": 61295.5} {"step": 22998, "train_loss": 3.2238357067108154, "lr": 9.462794732032306e-05, "tps": 24587, "wall": 61301.1} {"step": 22999, "train_loss": 3.167792797088623, "lr": 9.461420128970405e-05, "tps": 24586, "wall": 61306.8} {"step": 23000, "train_loss": 3.2433457374572754, "lr": 9.46004566794621e-05, "tps": 24585, "wall": 61312.4, "val_loss_monitor": 3.340290016381255} {"step": 23001, "train_loss": 3.238455295562744, "lr": 9.458671348975302e-05, "tps": 24569, "wall": 61354.5} {"step": 23002, "train_loss": 3.209489345550537, "lr": 9.45729717207324e-05, "tps": 24568, "wall": 61360.2} {"step": 23003, "train_loss": 3.2271575927734375, "lr": 9.455923137255593e-05, "tps": 24567, "wall": 61365.8} {"step": 23004, "train_loss": 3.350466012954712, "lr": 9.45454924453793e-05, "tps": 24566, "wall": 61371.5} {"step": 23005, "train_loss": 3.3658957481384277, "lr": 9.453175493935809e-05, "tps": 24564, "wall": 61377.2} {"step": 23006, "train_loss": 3.2641377449035645, "lr": 9.451801885464799e-05, "tps": 24563, "wall": 61382.9} {"step": 23007, "train_loss": 3.229515552520752, "lr": 9.450428419140457e-05, "tps": 24562, "wall": 61388.5} {"step": 23008, "train_loss": 3.277724266052246, "lr": 9.449055094978334e-05, "tps": 24561, "wall": 61394.2} {"step": 23009, "train_loss": 3.237036943435669, "lr": 9.447681912993999e-05, "tps": 24560, "wall": 61399.9} {"step": 23010, "train_loss": 3.2248120307922363, "lr": 9.446308873203003e-05, "tps": 24558, "wall": 61405.6} {"step": 23011, "train_loss": 3.158775806427002, "lr": 9.444935975620894e-05, "tps": 24557, "wall": 61411.2} {"step": 23012, "train_loss": 3.098329544067383, "lr": 9.443563220263242e-05, "tps": 24556, "wall": 61417.0} {"step": 23013, "train_loss": 3.292900562286377, "lr": 9.442190607145571e-05, "tps": 24555, "wall": 61422.7} {"step": 23014, "train_loss": 3.340649366378784, "lr": 9.440818136283451e-05, "tps": 24553, "wall": 61428.4} {"step": 23015, "train_loss": 3.271500587463379, "lr": 9.439445807692423e-05, "tps": 24552, "wall": 61434.1} {"step": 23016, "train_loss": 3.267425537109375, "lr": 9.438073621388027e-05, "tps": 24551, "wall": 61439.8} {"step": 23017, "train_loss": 3.248905658721924, "lr": 9.436701577385816e-05, "tps": 24550, "wall": 61445.5} {"step": 23018, "train_loss": 3.2091081142425537, "lr": 9.435329675701331e-05, "tps": 24549, "wall": 61451.2} {"step": 23019, "train_loss": 3.265427589416504, "lr": 9.433957916350109e-05, "tps": 24547, "wall": 61456.8} {"step": 23020, "train_loss": 3.2577433586120605, "lr": 9.432586299347691e-05, "tps": 24546, "wall": 61462.5} {"step": 23021, "train_loss": 3.384190797805786, "lr": 9.431214824709617e-05, "tps": 24545, "wall": 61468.2} {"step": 23022, "train_loss": 3.2981832027435303, "lr": 9.429843492451418e-05, "tps": 24544, "wall": 61473.9} {"step": 23023, "train_loss": 3.2081193923950195, "lr": 9.428472302588636e-05, "tps": 24543, "wall": 61479.7} {"step": 23024, "train_loss": 3.3313703536987305, "lr": 9.4271012551368e-05, "tps": 24541, "wall": 61485.4} {"step": 23025, "train_loss": 3.206066608428955, "lr": 9.425730350111435e-05, "tps": 24540, "wall": 61491.1} {"step": 23026, "train_loss": 3.279325485229492, "lr": 9.424359587528084e-05, "tps": 24539, "wall": 61496.7} {"step": 23027, "train_loss": 3.271573781967163, "lr": 9.422988967402268e-05, "tps": 24538, "wall": 61502.4} {"step": 23028, "train_loss": 3.348160743713379, "lr": 9.421618489749507e-05, "tps": 24537, "wall": 61508.0} {"step": 23029, "train_loss": 3.2998197078704834, "lr": 9.420248154585337e-05, "tps": 24535, "wall": 61513.7} {"step": 23030, "train_loss": 3.324758768081665, "lr": 9.418877961925271e-05, "tps": 24534, "wall": 61519.3} {"step": 23031, "train_loss": 3.328010082244873, "lr": 9.417507911784845e-05, "tps": 24533, "wall": 61524.9} {"step": 23032, "train_loss": 3.3388795852661133, "lr": 9.416138004179565e-05, "tps": 24532, "wall": 61530.6} {"step": 23033, "train_loss": 3.3317666053771973, "lr": 9.414768239124951e-05, "tps": 24531, "wall": 61536.4} {"step": 23034, "train_loss": 3.369661331176758, "lr": 9.41339861663653e-05, "tps": 24529, "wall": 61542.0} {"step": 23035, "train_loss": 3.2258360385894775, "lr": 9.41202913672981e-05, "tps": 24528, "wall": 61547.6} {"step": 23036, "train_loss": 3.322554111480713, "lr": 9.410659799420298e-05, "tps": 24527, "wall": 61553.3} {"step": 23037, "train_loss": 3.209537982940674, "lr": 9.40929060472352e-05, "tps": 24526, "wall": 61558.9} {"step": 23038, "train_loss": 3.259092092514038, "lr": 9.407921552654978e-05, "tps": 24525, "wall": 61564.5} {"step": 23039, "train_loss": 3.201536178588867, "lr": 9.406552643230175e-05, "tps": 24524, "wall": 61570.1} {"step": 23040, "train_loss": 3.385599374771118, "lr": 9.405183876464633e-05, "tps": 24522, "wall": 61575.7} {"step": 23041, "train_loss": 3.2183175086975098, "lr": 9.403815252373848e-05, "tps": 24521, "wall": 61581.3} {"step": 23042, "train_loss": 3.2611241340637207, "lr": 9.402446770973323e-05, "tps": 24520, "wall": 61586.9} {"step": 23043, "train_loss": 3.2929930686950684, "lr": 9.401078432278564e-05, "tps": 24519, "wall": 61592.5} {"step": 23044, "train_loss": 3.298379421234131, "lr": 9.399710236305071e-05, "tps": 24518, "wall": 61598.1} {"step": 23045, "train_loss": 3.361067295074463, "lr": 9.398342183068338e-05, "tps": 24517, "wall": 61603.8} {"step": 23046, "train_loss": 3.2767176628112793, "lr": 9.396974272583871e-05, "tps": 24515, "wall": 61609.4} {"step": 23047, "train_loss": 3.3614485263824463, "lr": 9.395606504867153e-05, "tps": 24514, "wall": 61615.0} {"step": 23048, "train_loss": 3.368950843811035, "lr": 9.394238879933697e-05, "tps": 24513, "wall": 61620.5} {"step": 23049, "train_loss": 3.216801166534424, "lr": 9.392871397798981e-05, "tps": 24512, "wall": 61626.1} {"step": 23050, "train_loss": 3.297441244125366, "lr": 9.391504058478497e-05, "tps": 24511, "wall": 61631.7} {"step": 23051, "train_loss": 3.2897744178771973, "lr": 9.39013686198774e-05, "tps": 24510, "wall": 61637.3} {"step": 23052, "train_loss": 3.2617690563201904, "lr": 9.388769808342198e-05, "tps": 24508, "wall": 61642.9} {"step": 23053, "train_loss": 3.2569520473480225, "lr": 9.387402897557346e-05, "tps": 24507, "wall": 61648.5} {"step": 23054, "train_loss": 3.2748050689697266, "lr": 9.386036129648683e-05, "tps": 24506, "wall": 61654.2} {"step": 23055, "train_loss": 3.278404474258423, "lr": 9.384669504631684e-05, "tps": 24505, "wall": 61659.7} {"step": 23056, "train_loss": 3.2461183071136475, "lr": 9.383303022521826e-05, "tps": 24504, "wall": 61665.3} {"step": 23057, "train_loss": 3.15854549407959, "lr": 9.381936683334601e-05, "tps": 24503, "wall": 61671.0} {"step": 23058, "train_loss": 3.3522539138793945, "lr": 9.38057048708548e-05, "tps": 24501, "wall": 61676.6} {"step": 23059, "train_loss": 3.2377448081970215, "lr": 9.379204433789932e-05, "tps": 24500, "wall": 61682.1} {"step": 23060, "train_loss": 3.244907855987549, "lr": 9.377838523463446e-05, "tps": 24499, "wall": 61687.8} {"step": 23061, "train_loss": 3.3856096267700195, "lr": 9.376472756121487e-05, "tps": 24498, "wall": 61693.3} {"step": 23062, "train_loss": 3.2756903171539307, "lr": 9.375107131779522e-05, "tps": 24497, "wall": 61698.9} {"step": 23063, "train_loss": 3.3539795875549316, "lr": 9.373741650453031e-05, "tps": 24496, "wall": 61704.5} {"step": 23064, "train_loss": 3.3112969398498535, "lr": 9.372376312157473e-05, "tps": 24494, "wall": 61710.1} {"step": 23065, "train_loss": 3.1850624084472656, "lr": 9.371011116908325e-05, "tps": 24493, "wall": 61715.8} {"step": 23066, "train_loss": 3.207359790802002, "lr": 9.369646064721049e-05, "tps": 24492, "wall": 61721.3} {"step": 23067, "train_loss": 3.3115973472595215, "lr": 9.368281155611094e-05, "tps": 24491, "wall": 61726.9} {"step": 23068, "train_loss": 3.2410268783569336, "lr": 9.366916389593942e-05, "tps": 24490, "wall": 61732.5} {"step": 23069, "train_loss": 3.3122479915618896, "lr": 9.365551766685045e-05, "tps": 24489, "wall": 61738.1} {"step": 23070, "train_loss": 3.250445604324341, "lr": 9.364187286899856e-05, "tps": 24488, "wall": 61743.7} {"step": 23071, "train_loss": 3.2173473834991455, "lr": 9.362822950253844e-05, "tps": 24486, "wall": 61749.2} {"step": 23072, "train_loss": 3.445891857147217, "lr": 9.361458756762455e-05, "tps": 24485, "wall": 61754.8} {"step": 23073, "train_loss": 3.245697259902954, "lr": 9.360094706441139e-05, "tps": 24484, "wall": 61760.5} {"step": 23074, "train_loss": 3.1832239627838135, "lr": 9.358730799305361e-05, "tps": 24483, "wall": 61766.0} {"step": 23075, "train_loss": 3.3174831867218018, "lr": 9.357367035370562e-05, "tps": 24482, "wall": 61771.6} {"step": 23076, "train_loss": 3.184175968170166, "lr": 9.35600341465219e-05, "tps": 24481, "wall": 61777.2} {"step": 23077, "train_loss": 3.2840843200683594, "lr": 9.3546399371657e-05, "tps": 24479, "wall": 61782.8} {"step": 23078, "train_loss": 3.147120714187622, "lr": 9.353276602926533e-05, "tps": 24478, "wall": 61788.4} {"step": 23079, "train_loss": 3.213953733444214, "lr": 9.351913411950127e-05, "tps": 24477, "wall": 61793.9} {"step": 23080, "train_loss": 3.1897380352020264, "lr": 9.350550364251937e-05, "tps": 24476, "wall": 61799.6} {"step": 23081, "train_loss": 3.296675205230713, "lr": 9.349187459847394e-05, "tps": 24475, "wall": 61805.1} {"step": 23082, "train_loss": 3.239640712738037, "lr": 9.347824698751937e-05, "tps": 24474, "wall": 61810.7} {"step": 23083, "train_loss": 3.2836689949035645, "lr": 9.34646208098101e-05, "tps": 24473, "wall": 61816.4} {"step": 23084, "train_loss": 3.236884832382202, "lr": 9.34509960655004e-05, "tps": 24471, "wall": 61822.0} {"step": 23085, "train_loss": 3.2525808811187744, "lr": 9.343737275474473e-05, "tps": 24470, "wall": 61827.6} {"step": 23086, "train_loss": 3.347621440887451, "lr": 9.342375087769736e-05, "tps": 24469, "wall": 61833.2} {"step": 23087, "train_loss": 3.351378917694092, "lr": 9.34101304345125e-05, "tps": 24468, "wall": 61838.9} {"step": 23088, "train_loss": 3.2918291091918945, "lr": 9.339651142534459e-05, "tps": 24467, "wall": 61844.5} {"step": 23089, "train_loss": 3.4122867584228516, "lr": 9.338289385034786e-05, "tps": 24466, "wall": 61850.1} {"step": 23090, "train_loss": 3.257999897003174, "lr": 9.33692777096765e-05, "tps": 24464, "wall": 61855.8} {"step": 23091, "train_loss": 3.4136576652526855, "lr": 9.335566300348488e-05, "tps": 24463, "wall": 61861.3} {"step": 23092, "train_loss": 3.35626220703125, "lr": 9.334204973192714e-05, "tps": 24462, "wall": 61866.9} {"step": 23093, "train_loss": 3.204185962677002, "lr": 9.332843789515746e-05, "tps": 24461, "wall": 61872.5} {"step": 23094, "train_loss": 3.3439576625823975, "lr": 9.331482749333016e-05, "tps": 24460, "wall": 61878.1} {"step": 23095, "train_loss": 3.2436490058898926, "lr": 9.330121852659933e-05, "tps": 24459, "wall": 61883.8} {"step": 23096, "train_loss": 3.3227314949035645, "lr": 9.32876109951191e-05, "tps": 24457, "wall": 61889.4} {"step": 23097, "train_loss": 3.2278342247009277, "lr": 9.327400489904374e-05, "tps": 24456, "wall": 61895.1} {"step": 23098, "train_loss": 3.2953805923461914, "lr": 9.32604002385273e-05, "tps": 24455, "wall": 61900.6} {"step": 23099, "train_loss": 3.384524345397949, "lr": 9.324679701372383e-05, "tps": 24454, "wall": 61906.3} {"step": 23100, "train_loss": 3.2920126914978027, "lr": 9.323319522478756e-05, "tps": 24453, "wall": 61911.9} {"step": 23101, "train_loss": 3.2006289958953857, "lr": 9.321959487187247e-05, "tps": 24452, "wall": 61917.5} {"step": 23102, "train_loss": 3.2506260871887207, "lr": 9.320599595513271e-05, "tps": 24450, "wall": 61923.1} {"step": 23103, "train_loss": 3.338348388671875, "lr": 9.319239847472229e-05, "tps": 24449, "wall": 61928.7} {"step": 23104, "train_loss": 3.402838706970215, "lr": 9.31788024307952e-05, "tps": 24448, "wall": 61934.3} {"step": 23105, "train_loss": 3.2183661460876465, "lr": 9.316520782350555e-05, "tps": 24447, "wall": 61939.9} {"step": 23106, "train_loss": 3.1718521118164062, "lr": 9.315161465300727e-05, "tps": 24446, "wall": 61945.5} {"step": 23107, "train_loss": 3.3712401390075684, "lr": 9.313802291945431e-05, "tps": 24445, "wall": 61951.1} {"step": 23108, "train_loss": 3.3421120643615723, "lr": 9.312443262300078e-05, "tps": 24444, "wall": 61956.8} {"step": 23109, "train_loss": 3.2088465690612793, "lr": 9.31108437638005e-05, "tps": 24442, "wall": 61962.4} {"step": 23110, "train_loss": 3.2413971424102783, "lr": 9.30972563420074e-05, "tps": 24441, "wall": 61968.1} {"step": 23111, "train_loss": 3.3015313148498535, "lr": 9.30836703577755e-05, "tps": 24440, "wall": 61973.7} {"step": 23112, "train_loss": 3.4123318195343018, "lr": 9.307008581125865e-05, "tps": 24439, "wall": 61979.3} {"step": 23113, "train_loss": 3.3030357360839844, "lr": 9.305650270261068e-05, "tps": 24438, "wall": 61984.9} {"step": 23114, "train_loss": 3.4135029315948486, "lr": 9.304292103198558e-05, "tps": 24437, "wall": 61990.5} {"step": 23115, "train_loss": 3.350227117538452, "lr": 9.302934079953713e-05, "tps": 24435, "wall": 61996.1} {"step": 23116, "train_loss": 3.2935631275177, "lr": 9.301576200541912e-05, "tps": 24434, "wall": 62001.7} {"step": 23117, "train_loss": 3.321335792541504, "lr": 9.30021846497855e-05, "tps": 24433, "wall": 62007.3} {"step": 23118, "train_loss": 3.3494153022766113, "lr": 9.298860873278998e-05, "tps": 24432, "wall": 62012.9} {"step": 23119, "train_loss": 3.232419013977051, "lr": 9.297503425458632e-05, "tps": 24431, "wall": 62018.6} {"step": 23120, "train_loss": 3.3131539821624756, "lr": 9.29614612153284e-05, "tps": 24430, "wall": 62024.2} {"step": 23121, "train_loss": 3.2644548416137695, "lr": 9.294788961516986e-05, "tps": 24428, "wall": 62029.8} {"step": 23122, "train_loss": 3.290605068206787, "lr": 9.293431945426457e-05, "tps": 24427, "wall": 62035.4} {"step": 23123, "train_loss": 3.2773690223693848, "lr": 9.292075073276617e-05, "tps": 24426, "wall": 62041.0} {"step": 23124, "train_loss": 3.2617290019989014, "lr": 9.290718345082834e-05, "tps": 24425, "wall": 62046.6} {"step": 23125, "train_loss": 3.272930145263672, "lr": 9.289361760860485e-05, "tps": 24424, "wall": 62052.3} {"step": 23126, "train_loss": 3.25814151763916, "lr": 9.288005320624936e-05, "tps": 24423, "wall": 62057.9} {"step": 23127, "train_loss": 3.219066619873047, "lr": 9.286649024391542e-05, "tps": 24422, "wall": 62063.5} {"step": 23128, "train_loss": 3.312213897705078, "lr": 9.285292872175683e-05, "tps": 24420, "wall": 62069.2} {"step": 23129, "train_loss": 3.31019926071167, "lr": 9.283936863992712e-05, "tps": 24419, "wall": 62074.9} {"step": 23130, "train_loss": 3.2385647296905518, "lr": 9.282580999857991e-05, "tps": 24418, "wall": 62080.5} {"step": 23131, "train_loss": 3.30375337600708, "lr": 9.281225279786883e-05, "tps": 24417, "wall": 62086.1} {"step": 23132, "train_loss": 3.276980400085449, "lr": 9.279869703794741e-05, "tps": 24416, "wall": 62091.7} {"step": 23133, "train_loss": 3.244407892227173, "lr": 9.278514271896921e-05, "tps": 24415, "wall": 62097.3} {"step": 23134, "train_loss": 3.2431771755218506, "lr": 9.277158984108785e-05, "tps": 24413, "wall": 62102.9} {"step": 23135, "train_loss": 3.2751097679138184, "lr": 9.275803840445679e-05, "tps": 24412, "wall": 62108.5} {"step": 23136, "train_loss": 3.2760491371154785, "lr": 9.27444884092295e-05, "tps": 24411, "wall": 62114.1} {"step": 23137, "train_loss": 3.2623603343963623, "lr": 9.273093985555959e-05, "tps": 24410, "wall": 62119.7} {"step": 23138, "train_loss": 3.260610342025757, "lr": 9.271739274360043e-05, "tps": 24409, "wall": 62125.4} {"step": 23139, "train_loss": 3.313211441040039, "lr": 9.270384707350557e-05, "tps": 24408, "wall": 62131.0} {"step": 23140, "train_loss": 3.2626805305480957, "lr": 9.269030284542842e-05, "tps": 24406, "wall": 62136.7} {"step": 23141, "train_loss": 3.398864507675171, "lr": 9.267676005952236e-05, "tps": 24405, "wall": 62142.3} {"step": 23142, "train_loss": 3.234042167663574, "lr": 9.266321871594091e-05, "tps": 24404, "wall": 62147.9} {"step": 23143, "train_loss": 3.254405975341797, "lr": 9.264967881483738e-05, "tps": 24403, "wall": 62153.5} {"step": 23144, "train_loss": 3.242910385131836, "lr": 9.263614035636515e-05, "tps": 24402, "wall": 62159.1} {"step": 23145, "train_loss": 3.361873149871826, "lr": 9.262260334067767e-05, "tps": 24401, "wall": 62164.7} {"step": 23146, "train_loss": 3.3006296157836914, "lr": 9.26090677679282e-05, "tps": 24400, "wall": 62170.4} {"step": 23147, "train_loss": 3.2678916454315186, "lr": 9.259553363827008e-05, "tps": 24398, "wall": 62176.0} {"step": 23148, "train_loss": 3.2054710388183594, "lr": 9.258200095185669e-05, "tps": 24397, "wall": 62181.6} {"step": 23149, "train_loss": 3.290661573410034, "lr": 9.256846970884129e-05, "tps": 24396, "wall": 62187.2} {"step": 23150, "train_loss": 3.3130342960357666, "lr": 9.255493990937708e-05, "tps": 24395, "wall": 62192.8} {"step": 23151, "train_loss": 3.290363311767578, "lr": 9.254141155361747e-05, "tps": 24394, "wall": 62198.6} {"step": 23152, "train_loss": 3.2608728408813477, "lr": 9.252788464171565e-05, "tps": 24393, "wall": 62204.2} {"step": 23153, "train_loss": 3.323920965194702, "lr": 9.251435917382481e-05, "tps": 24391, "wall": 62209.9} {"step": 23154, "train_loss": 3.2948484420776367, "lr": 9.250083515009826e-05, "tps": 24390, "wall": 62215.5} {"step": 23155, "train_loss": 3.217360734939575, "lr": 9.248731257068907e-05, "tps": 24389, "wall": 62221.1} {"step": 23156, "train_loss": 3.257538318634033, "lr": 9.247379143575057e-05, "tps": 24388, "wall": 62226.7} {"step": 23157, "train_loss": 3.324432611465454, "lr": 9.246027174543588e-05, "tps": 24387, "wall": 62232.3} {"step": 23158, "train_loss": 3.3385002613067627, "lr": 9.244675349989804e-05, "tps": 24386, "wall": 62237.9} {"step": 23159, "train_loss": 3.276090621948242, "lr": 9.243323669929035e-05, "tps": 24385, "wall": 62243.5} {"step": 23160, "train_loss": 3.222604274749756, "lr": 9.241972134376586e-05, "tps": 24383, "wall": 62249.1} {"step": 23161, "train_loss": 3.2615346908569336, "lr": 9.24062074334776e-05, "tps": 24382, "wall": 62254.8} {"step": 23162, "train_loss": 3.2227296829223633, "lr": 9.239269496857877e-05, "tps": 24381, "wall": 62260.5} {"step": 23163, "train_loss": 3.228529453277588, "lr": 9.237918394922242e-05, "tps": 24380, "wall": 62266.1} {"step": 23164, "train_loss": 3.1698598861694336, "lr": 9.236567437556151e-05, "tps": 24379, "wall": 62271.6} {"step": 23165, "train_loss": 3.2736358642578125, "lr": 9.23521662477492e-05, "tps": 24378, "wall": 62277.3} {"step": 23166, "train_loss": 3.303314447402954, "lr": 9.233865956593847e-05, "tps": 24377, "wall": 62282.9} {"step": 23167, "train_loss": 3.247035264968872, "lr": 9.232515433028225e-05, "tps": 24375, "wall": 62288.4} {"step": 23168, "train_loss": 3.336005926132202, "lr": 9.231165054093363e-05, "tps": 24374, "wall": 62294.1} {"step": 23169, "train_loss": 3.2091095447540283, "lr": 9.229814819804555e-05, "tps": 24373, "wall": 62299.7} {"step": 23170, "train_loss": 3.372143030166626, "lr": 9.228464730177089e-05, "tps": 24372, "wall": 62305.4} {"step": 23171, "train_loss": 3.386626720428467, "lr": 9.227114785226273e-05, "tps": 24371, "wall": 62311.0} {"step": 23172, "train_loss": 3.276986598968506, "lr": 9.225764984967392e-05, "tps": 24370, "wall": 62316.7} {"step": 23173, "train_loss": 3.285871982574463, "lr": 9.224415329415728e-05, "tps": 24368, "wall": 62322.3} {"step": 23174, "train_loss": 3.3210060596466064, "lr": 9.223065818586587e-05, "tps": 24367, "wall": 62327.9} {"step": 23175, "train_loss": 3.3246030807495117, "lr": 9.221716452495239e-05, "tps": 24366, "wall": 62333.6} {"step": 23176, "train_loss": 3.270254611968994, "lr": 9.220367231156987e-05, "tps": 24365, "wall": 62339.2} {"step": 23177, "train_loss": 3.180537700653076, "lr": 9.219018154587105e-05, "tps": 24364, "wall": 62344.9} {"step": 23178, "train_loss": 3.328854560852051, "lr": 9.217669222800871e-05, "tps": 24363, "wall": 62350.5} {"step": 23179, "train_loss": 3.29500150680542, "lr": 9.216320435813577e-05, "tps": 24362, "wall": 62356.2} {"step": 23180, "train_loss": 3.1750235557556152, "lr": 9.214971793640496e-05, "tps": 24360, "wall": 62361.8} {"step": 23181, "train_loss": 3.223132610321045, "lr": 9.213623296296907e-05, "tps": 24359, "wall": 62367.4} {"step": 23182, "train_loss": 3.184403657913208, "lr": 9.212274943798085e-05, "tps": 24358, "wall": 62373.0} {"step": 23183, "train_loss": 3.329293727874756, "lr": 9.210926736159298e-05, "tps": 24357, "wall": 62378.8} {"step": 23184, "train_loss": 3.2408151626586914, "lr": 9.209578673395833e-05, "tps": 24356, "wall": 62384.4} {"step": 23185, "train_loss": 3.2247776985168457, "lr": 9.208230755522951e-05, "tps": 24355, "wall": 62390.0} {"step": 23186, "train_loss": 3.2537622451782227, "lr": 9.206882982555915e-05, "tps": 24354, "wall": 62395.6} {"step": 23187, "train_loss": 3.340552568435669, "lr": 9.20553535451001e-05, "tps": 24352, "wall": 62401.2} {"step": 23188, "train_loss": 3.2762272357940674, "lr": 9.204187871400492e-05, "tps": 24351, "wall": 62406.9} {"step": 23189, "train_loss": 3.3321032524108887, "lr": 9.202840533242619e-05, "tps": 24350, "wall": 62412.5} {"step": 23190, "train_loss": 3.204155921936035, "lr": 9.201493340051667e-05, "tps": 24349, "wall": 62418.1} {"step": 23191, "train_loss": 3.2323849201202393, "lr": 9.20014629184289e-05, "tps": 24348, "wall": 62423.7} {"step": 23192, "train_loss": 3.3101794719696045, "lr": 9.198799388631542e-05, "tps": 24347, "wall": 62429.3} {"step": 23193, "train_loss": 3.1488776206970215, "lr": 9.197452630432896e-05, "tps": 24345, "wall": 62435.1} {"step": 23194, "train_loss": 3.1899917125701904, "lr": 9.196106017262197e-05, "tps": 24344, "wall": 62440.7} {"step": 23195, "train_loss": 3.2972259521484375, "lr": 9.194759549134697e-05, "tps": 24343, "wall": 62446.3} {"step": 23196, "train_loss": 3.1655936241149902, "lr": 9.193413226065657e-05, "tps": 24342, "wall": 62452.0} {"step": 23197, "train_loss": 3.3569083213806152, "lr": 9.192067048070323e-05, "tps": 24341, "wall": 62457.6} {"step": 23198, "train_loss": 3.1925888061523438, "lr": 9.190721015163948e-05, "tps": 24340, "wall": 62463.2} {"step": 23199, "train_loss": 3.180253028869629, "lr": 9.18937512736178e-05, "tps": 24339, "wall": 62468.8} {"step": 23200, "train_loss": 3.2481465339660645, "lr": 9.18802938467906e-05, "tps": 24337, "wall": 62474.4} {"step": 23201, "train_loss": 3.2154126167297363, "lr": 9.18668378713104e-05, "tps": 24336, "wall": 62480.0} {"step": 23202, "train_loss": 3.292344093322754, "lr": 9.185338334732958e-05, "tps": 24335, "wall": 62485.6} {"step": 23203, "train_loss": 3.2758331298828125, "lr": 9.183993027500052e-05, "tps": 24334, "wall": 62491.3} {"step": 23204, "train_loss": 3.268185615539551, "lr": 9.182647865447573e-05, "tps": 24333, "wall": 62497.0} {"step": 23205, "train_loss": 3.325451612472534, "lr": 9.181302848590752e-05, "tps": 24332, "wall": 62502.6} {"step": 23206, "train_loss": 3.2551047801971436, "lr": 9.17995797694482e-05, "tps": 24331, "wall": 62508.2} {"step": 23207, "train_loss": 3.2242250442504883, "lr": 9.178613250525021e-05, "tps": 24329, "wall": 62513.8} {"step": 23208, "train_loss": 3.2454681396484375, "lr": 9.177268669346589e-05, "tps": 24328, "wall": 62519.4} {"step": 23209, "train_loss": 3.3301913738250732, "lr": 9.175924233424741e-05, "tps": 24327, "wall": 62525.1} {"step": 23210, "train_loss": 3.2250142097473145, "lr": 9.174579942774725e-05, "tps": 24326, "wall": 62530.7} {"step": 23211, "train_loss": 3.295341968536377, "lr": 9.173235797411762e-05, "tps": 24325, "wall": 62536.3} {"step": 23212, "train_loss": 3.1880810260772705, "lr": 9.17189179735107e-05, "tps": 24324, "wall": 62541.9} {"step": 23213, "train_loss": 3.2987823486328125, "lr": 9.170547942607889e-05, "tps": 24323, "wall": 62547.6} {"step": 23214, "train_loss": 3.3592031002044678, "lr": 9.169204233197435e-05, "tps": 24321, "wall": 62553.2} {"step": 23215, "train_loss": 3.2577338218688965, "lr": 9.167860669134923e-05, "tps": 24320, "wall": 62558.9} {"step": 23216, "train_loss": 3.249814987182617, "lr": 9.166517250435586e-05, "tps": 24319, "wall": 62564.5} {"step": 23217, "train_loss": 3.2579503059387207, "lr": 9.165173977114631e-05, "tps": 24318, "wall": 62570.2} {"step": 23218, "train_loss": 3.239086151123047, "lr": 9.163830849187284e-05, "tps": 24317, "wall": 62575.8} {"step": 23219, "train_loss": 3.2189412117004395, "lr": 9.162487866668755e-05, "tps": 24316, "wall": 62581.4} {"step": 23220, "train_loss": 3.258486270904541, "lr": 9.161145029574255e-05, "tps": 24315, "wall": 62587.0} {"step": 23221, "train_loss": 3.3288145065307617, "lr": 9.159802337919001e-05, "tps": 24313, "wall": 62592.6} {"step": 23222, "train_loss": 3.301126003265381, "lr": 9.158459791718203e-05, "tps": 24312, "wall": 62598.3} {"step": 23223, "train_loss": 3.303410530090332, "lr": 9.15711739098706e-05, "tps": 24311, "wall": 62603.9} {"step": 23224, "train_loss": 3.296107769012451, "lr": 9.155775135740791e-05, "tps": 24310, "wall": 62609.5} {"step": 23225, "train_loss": 3.308114528656006, "lr": 9.154433025994598e-05, "tps": 24309, "wall": 62615.2} {"step": 23226, "train_loss": 3.273439407348633, "lr": 9.153091061763676e-05, "tps": 24308, "wall": 62620.8} {"step": 23227, "train_loss": 3.2566394805908203, "lr": 9.151749243063242e-05, "tps": 24307, "wall": 62626.4} {"step": 23228, "train_loss": 3.2775020599365234, "lr": 9.150407569908483e-05, "tps": 24306, "wall": 62632.0} {"step": 23229, "train_loss": 3.264580488204956, "lr": 9.149066042314599e-05, "tps": 24304, "wall": 62637.6} {"step": 23230, "train_loss": 3.3071987628936768, "lr": 9.147724660296796e-05, "tps": 24303, "wall": 62643.2} {"step": 23231, "train_loss": 3.2587697505950928, "lr": 9.146383423870262e-05, "tps": 24302, "wall": 62648.8} {"step": 23232, "train_loss": 3.285137176513672, "lr": 9.145042333050187e-05, "tps": 24301, "wall": 62654.5} {"step": 23233, "train_loss": 3.4010534286499023, "lr": 9.143701387851773e-05, "tps": 24300, "wall": 62660.1} {"step": 23234, "train_loss": 3.2800393104553223, "lr": 9.1423605882902e-05, "tps": 24299, "wall": 62665.7} {"step": 23235, "train_loss": 3.253112316131592, "lr": 9.14101993438067e-05, "tps": 24298, "wall": 62671.3} {"step": 23236, "train_loss": 3.226181745529175, "lr": 9.13967942613836e-05, "tps": 24296, "wall": 62677.0} {"step": 23237, "train_loss": 3.241888999938965, "lr": 9.138339063578449e-05, "tps": 24295, "wall": 62682.6} {"step": 23238, "train_loss": 3.2310900688171387, "lr": 9.136998846716137e-05, "tps": 24294, "wall": 62688.2} {"step": 23239, "train_loss": 3.3104255199432373, "lr": 9.135658775566598e-05, "tps": 24293, "wall": 62693.8} {"step": 23240, "train_loss": 3.3934831619262695, "lr": 9.134318850145005e-05, "tps": 24292, "wall": 62699.4} {"step": 23241, "train_loss": 3.295243501663208, "lr": 9.132979070466553e-05, "tps": 24291, "wall": 62705.1} {"step": 23242, "train_loss": 3.1888046264648438, "lr": 9.131639436546406e-05, "tps": 24290, "wall": 62710.7} {"step": 23243, "train_loss": 3.2716803550720215, "lr": 9.130299948399741e-05, "tps": 24289, "wall": 62716.4} {"step": 23244, "train_loss": 3.398653268814087, "lr": 9.12896060604174e-05, "tps": 24287, "wall": 62722.0} {"step": 23245, "train_loss": 3.2536072731018066, "lr": 9.127621409487568e-05, "tps": 24286, "wall": 62727.6} {"step": 23246, "train_loss": 3.2922582626342773, "lr": 9.126282358752393e-05, "tps": 24285, "wall": 62733.2} {"step": 23247, "train_loss": 3.388126850128174, "lr": 9.124943453851392e-05, "tps": 24284, "wall": 62739.0} {"step": 23248, "train_loss": 3.308323860168457, "lr": 9.12360469479973e-05, "tps": 24283, "wall": 62744.7} {"step": 23249, "train_loss": 3.318913459777832, "lr": 9.122266081612563e-05, "tps": 24282, "wall": 62750.3} {"step": 23250, "train_loss": 3.098914623260498, "lr": 9.120927614305069e-05, "tps": 24281, "wall": 62755.9} {"step": 23251, "train_loss": 3.1847612857818604, "lr": 9.119589292892397e-05, "tps": 24279, "wall": 62761.6} {"step": 23252, "train_loss": 3.3341314792633057, "lr": 9.11825111738972e-05, "tps": 24278, "wall": 62767.2} {"step": 23253, "train_loss": 3.325540065765381, "lr": 9.116913087812193e-05, "tps": 24277, "wall": 62772.8} {"step": 23254, "train_loss": 3.3254153728485107, "lr": 9.115575204174965e-05, "tps": 24276, "wall": 62778.5} {"step": 23255, "train_loss": 3.3709185123443604, "lr": 9.114237466493204e-05, "tps": 24275, "wall": 62784.1} {"step": 23256, "train_loss": 3.269881248474121, "lr": 9.112899874782057e-05, "tps": 24274, "wall": 62789.7} {"step": 23257, "train_loss": 3.3027191162109375, "lr": 9.111562429056672e-05, "tps": 24273, "wall": 62795.5} {"step": 23258, "train_loss": 3.249574661254883, "lr": 9.110225129332213e-05, "tps": 24271, "wall": 62801.1} {"step": 23259, "train_loss": 3.29557466506958, "lr": 9.108887975623819e-05, "tps": 24270, "wall": 62806.8} {"step": 23260, "train_loss": 3.174699068069458, "lr": 9.107550967946635e-05, "tps": 24269, "wall": 62812.5} {"step": 23261, "train_loss": 3.2414326667785645, "lr": 9.106214106315815e-05, "tps": 24268, "wall": 62818.1} {"step": 23262, "train_loss": 3.3033199310302734, "lr": 9.104877390746501e-05, "tps": 24267, "wall": 62823.7} {"step": 23263, "train_loss": 3.259660482406616, "lr": 9.103540821253826e-05, "tps": 24266, "wall": 62829.3} {"step": 23264, "train_loss": 3.291171073913574, "lr": 9.102204397852945e-05, "tps": 24265, "wall": 62835.0} {"step": 23265, "train_loss": 3.253787040710449, "lr": 9.10086812055899e-05, "tps": 24263, "wall": 62840.7} {"step": 23266, "train_loss": 3.201969861984253, "lr": 9.099531989387092e-05, "tps": 24262, "wall": 62846.3} {"step": 23267, "train_loss": 3.2118282318115234, "lr": 9.098196004352402e-05, "tps": 24261, "wall": 62852.0} {"step": 23268, "train_loss": 3.331749439239502, "lr": 9.096860165470044e-05, "tps": 24260, "wall": 62857.7} {"step": 23269, "train_loss": 3.3035426139831543, "lr": 9.095524472755146e-05, "tps": 24259, "wall": 62863.4} {"step": 23270, "train_loss": 3.2334790229797363, "lr": 9.094188926222852e-05, "tps": 24258, "wall": 62869.0} {"step": 23271, "train_loss": 3.2727701663970947, "lr": 9.092853525888277e-05, "tps": 24257, "wall": 62874.7} {"step": 23272, "train_loss": 3.3445844650268555, "lr": 9.091518271766563e-05, "tps": 24255, "wall": 62880.3} {"step": 23273, "train_loss": 3.2728986740112305, "lr": 9.090183163872826e-05, "tps": 24254, "wall": 62885.9} {"step": 23274, "train_loss": 3.266650676727295, "lr": 9.088848202222189e-05, "tps": 24253, "wall": 62891.6} {"step": 23275, "train_loss": 3.25795841217041, "lr": 9.087513386829781e-05, "tps": 24252, "wall": 62897.2} {"step": 23276, "train_loss": 3.267035722732544, "lr": 9.086178717710724e-05, "tps": 24251, "wall": 62902.9} {"step": 23277, "train_loss": 3.259485960006714, "lr": 9.084844194880123e-05, "tps": 24250, "wall": 62908.6} {"step": 23278, "train_loss": 3.2415788173675537, "lr": 9.083509818353114e-05, "tps": 24249, "wall": 62914.2} {"step": 23279, "train_loss": 3.2915687561035156, "lr": 9.082175588144804e-05, "tps": 24247, "wall": 62919.9} {"step": 23280, "train_loss": 3.240403175354004, "lr": 9.080841504270301e-05, "tps": 24246, "wall": 62925.6} {"step": 23281, "train_loss": 3.2653675079345703, "lr": 9.079507566744731e-05, "tps": 24245, "wall": 62931.3} {"step": 23282, "train_loss": 3.228240489959717, "lr": 9.078173775583198e-05, "tps": 24244, "wall": 62936.9} {"step": 23283, "train_loss": 3.3145291805267334, "lr": 9.076840130800806e-05, "tps": 24243, "wall": 62942.6} {"step": 23284, "train_loss": 3.272428035736084, "lr": 9.075506632412675e-05, "tps": 24242, "wall": 62948.2} {"step": 23285, "train_loss": 3.304222345352173, "lr": 9.074173280433902e-05, "tps": 24241, "wall": 62954.0} {"step": 23286, "train_loss": 3.190680503845215, "lr": 9.07284007487959e-05, "tps": 24239, "wall": 62959.6} {"step": 23287, "train_loss": 3.3362016677856445, "lr": 9.071507015764849e-05, "tps": 24238, "wall": 62965.3} {"step": 23288, "train_loss": 3.1594481468200684, "lr": 9.070174103104772e-05, "tps": 24237, "wall": 62970.9} {"step": 23289, "train_loss": 3.2678287029266357, "lr": 9.068841336914463e-05, "tps": 24236, "wall": 62976.7} {"step": 23290, "train_loss": 3.3710877895355225, "lr": 9.067508717209025e-05, "tps": 24235, "wall": 62982.3} {"step": 23291, "train_loss": 3.260012149810791, "lr": 9.066176244003539e-05, "tps": 24234, "wall": 62987.9} {"step": 23292, "train_loss": 3.2796826362609863, "lr": 9.064843917313113e-05, "tps": 24233, "wall": 62993.6} {"step": 23293, "train_loss": 3.346815586090088, "lr": 9.063511737152836e-05, "tps": 24231, "wall": 62999.3} {"step": 23294, "train_loss": 3.2491068840026855, "lr": 9.062179703537794e-05, "tps": 24230, "wall": 63004.9} {"step": 23295, "train_loss": 3.280221462249756, "lr": 9.060847816483085e-05, "tps": 24229, "wall": 63010.5} {"step": 23296, "train_loss": 3.197007656097412, "lr": 9.059516076003791e-05, "tps": 24228, "wall": 63016.2} {"step": 23297, "train_loss": 3.222379207611084, "lr": 9.058184482114995e-05, "tps": 24227, "wall": 63021.8} {"step": 23298, "train_loss": 3.2719593048095703, "lr": 9.056853034831788e-05, "tps": 24226, "wall": 63027.5} {"step": 23299, "train_loss": 3.180288791656494, "lr": 9.055521734169254e-05, "tps": 24225, "wall": 63033.1} {"step": 23300, "train_loss": 3.319756031036377, "lr": 9.054190580142462e-05, "tps": 24224, "wall": 63038.9} {"step": 23301, "train_loss": 3.180492877960205, "lr": 9.052859572766503e-05, "tps": 24222, "wall": 63044.5} {"step": 23302, "train_loss": 3.2585549354553223, "lr": 9.051528712056456e-05, "tps": 24221, "wall": 63050.2} {"step": 23303, "train_loss": 3.247445583343506, "lr": 9.050197998027382e-05, "tps": 24220, "wall": 63055.8} {"step": 23304, "train_loss": 3.234057903289795, "lr": 9.048867430694373e-05, "tps": 24219, "wall": 63061.5} {"step": 23305, "train_loss": 3.358243465423584, "lr": 9.047537010072489e-05, "tps": 24218, "wall": 63067.1} {"step": 23306, "train_loss": 3.3410565853118896, "lr": 9.046206736176812e-05, "tps": 24217, "wall": 63072.8} {"step": 23307, "train_loss": 3.2859158515930176, "lr": 9.044876609022407e-05, "tps": 24216, "wall": 63078.4} {"step": 23308, "train_loss": 3.2727127075195312, "lr": 9.043546628624334e-05, "tps": 24214, "wall": 63084.0} {"step": 23309, "train_loss": 3.267080783843994, "lr": 9.042216794997672e-05, "tps": 24213, "wall": 63089.7} {"step": 23310, "train_loss": 3.356069564819336, "lr": 9.040887108157477e-05, "tps": 24212, "wall": 63095.4} {"step": 23311, "train_loss": 3.1960277557373047, "lr": 9.039557568118812e-05, "tps": 24211, "wall": 63101.0} {"step": 23312, "train_loss": 3.3344664573669434, "lr": 9.038228174896744e-05, "tps": 24210, "wall": 63106.7} {"step": 23313, "train_loss": 3.204202175140381, "lr": 9.036898928506328e-05, "tps": 24209, "wall": 63112.3} {"step": 23314, "train_loss": 3.3278589248657227, "lr": 9.035569828962615e-05, "tps": 24208, "wall": 63117.9} {"step": 23315, "train_loss": 3.312983751296997, "lr": 9.034240876280675e-05, "tps": 24207, "wall": 63123.6} {"step": 23316, "train_loss": 3.23880672454834, "lr": 9.032912070475555e-05, "tps": 24205, "wall": 63129.2} {"step": 23317, "train_loss": 3.230520248413086, "lr": 9.031583411562307e-05, "tps": 24204, "wall": 63134.8} {"step": 23318, "train_loss": 3.334850311279297, "lr": 9.030254899555987e-05, "tps": 24203, "wall": 63140.5} {"step": 23319, "train_loss": 3.238194227218628, "lr": 9.02892653447164e-05, "tps": 24202, "wall": 63146.2} {"step": 23320, "train_loss": 3.144144296646118, "lr": 9.027598316324312e-05, "tps": 24201, "wall": 63151.9} {"step": 23321, "train_loss": 3.1845712661743164, "lr": 9.026270245129055e-05, "tps": 24200, "wall": 63157.6} {"step": 23322, "train_loss": 3.178243398666382, "lr": 9.024942320900909e-05, "tps": 24199, "wall": 63163.2} {"step": 23323, "train_loss": 3.3387794494628906, "lr": 9.023614543654915e-05, "tps": 24197, "wall": 63168.9} {"step": 23324, "train_loss": 3.1949031352996826, "lr": 9.022286913406125e-05, "tps": 24196, "wall": 63174.6} {"step": 23325, "train_loss": 3.189126491546631, "lr": 9.020959430169563e-05, "tps": 24195, "wall": 63180.2} {"step": 23326, "train_loss": 3.287810802459717, "lr": 9.01963209396028e-05, "tps": 24194, "wall": 63185.8} {"step": 23327, "train_loss": 3.163146734237671, "lr": 9.018304904793309e-05, "tps": 24193, "wall": 63191.4} {"step": 23328, "train_loss": 3.196706771850586, "lr": 9.016977862683675e-05, "tps": 24192, "wall": 63197.0} {"step": 23329, "train_loss": 3.2106125354766846, "lr": 9.015650967646422e-05, "tps": 24191, "wall": 63202.7} {"step": 23330, "train_loss": 3.341928005218506, "lr": 9.014324219696582e-05, "tps": 24190, "wall": 63208.3} {"step": 23331, "train_loss": 3.2430238723754883, "lr": 9.01299761884917e-05, "tps": 24189, "wall": 63214.0} {"step": 23332, "train_loss": 3.2334141731262207, "lr": 9.011671165119231e-05, "tps": 24187, "wall": 63219.7} {"step": 23333, "train_loss": 3.291224241256714, "lr": 9.010344858521784e-05, "tps": 24186, "wall": 63225.3} {"step": 23334, "train_loss": 3.3079047203063965, "lr": 9.009018699071847e-05, "tps": 24185, "wall": 63231.0} {"step": 23335, "train_loss": 3.3294005393981934, "lr": 9.007692686784454e-05, "tps": 24184, "wall": 63236.6} {"step": 23336, "train_loss": 3.292008876800537, "lr": 9.006366821674623e-05, "tps": 24183, "wall": 63242.3} {"step": 23337, "train_loss": 3.2210536003112793, "lr": 9.005041103757364e-05, "tps": 24182, "wall": 63247.9} {"step": 23338, "train_loss": 3.369040012359619, "lr": 9.003715533047707e-05, "tps": 24181, "wall": 63253.6} {"step": 23339, "train_loss": 3.239917516708374, "lr": 9.002390109560668e-05, "tps": 24180, "wall": 63259.2} {"step": 23340, "train_loss": 3.2928812503814697, "lr": 9.001064833311247e-05, "tps": 24178, "wall": 63264.8} {"step": 23341, "train_loss": 3.263091802597046, "lr": 8.999739704314474e-05, "tps": 24177, "wall": 63270.4} {"step": 23342, "train_loss": 3.407426357269287, "lr": 8.998414722585347e-05, "tps": 24176, "wall": 63276.2} {"step": 23343, "train_loss": 3.2679290771484375, "lr": 8.997089888138887e-05, "tps": 24175, "wall": 63281.8} {"step": 23344, "train_loss": 3.2171247005462646, "lr": 8.995765200990096e-05, "tps": 24174, "wall": 63287.4} {"step": 23345, "train_loss": 3.2843246459960938, "lr": 8.994440661153976e-05, "tps": 24173, "wall": 63293.0} {"step": 23346, "train_loss": 3.27313232421875, "lr": 8.99311626864554e-05, "tps": 24172, "wall": 63298.8} {"step": 23347, "train_loss": 3.3292393684387207, "lr": 8.991792023479787e-05, "tps": 24171, "wall": 63304.4} {"step": 23348, "train_loss": 3.1350879669189453, "lr": 8.990467925671713e-05, "tps": 24169, "wall": 63310.1} {"step": 23349, "train_loss": 3.3012261390686035, "lr": 8.989143975236332e-05, "tps": 24168, "wall": 63315.7} {"step": 23350, "train_loss": 3.382315158843994, "lr": 8.987820172188622e-05, "tps": 24167, "wall": 63321.3} {"step": 23351, "train_loss": 3.2583987712860107, "lr": 8.986496516543593e-05, "tps": 24166, "wall": 63327.0} {"step": 23352, "train_loss": 3.260795831680298, "lr": 8.985173008316237e-05, "tps": 24165, "wall": 63332.6} {"step": 23353, "train_loss": 3.2393317222595215, "lr": 8.983849647521538e-05, "tps": 24164, "wall": 63338.4} {"step": 23354, "train_loss": 3.3425493240356445, "lr": 8.982526434174501e-05, "tps": 24163, "wall": 63344.1} {"step": 23355, "train_loss": 3.2971956729888916, "lr": 8.98120336829011e-05, "tps": 24162, "wall": 63349.7} {"step": 23356, "train_loss": 3.272778272628784, "lr": 8.979880449883345e-05, "tps": 24160, "wall": 63355.4} {"step": 23357, "train_loss": 3.2050108909606934, "lr": 8.978557678969205e-05, "tps": 24159, "wall": 63361.0} {"step": 23358, "train_loss": 3.1994969844818115, "lr": 8.977235055562666e-05, "tps": 24158, "wall": 63366.7} {"step": 23359, "train_loss": 3.287217617034912, "lr": 8.975912579678707e-05, "tps": 24157, "wall": 63372.3} {"step": 23360, "train_loss": 3.227518320083618, "lr": 8.974590251332323e-05, "tps": 24156, "wall": 63377.9} {"step": 23361, "train_loss": 3.3229379653930664, "lr": 8.973268070538483e-05, "tps": 24155, "wall": 63383.6} {"step": 23362, "train_loss": 3.3198609352111816, "lr": 8.971946037312164e-05, "tps": 24154, "wall": 63389.2} {"step": 23363, "train_loss": 3.3202757835388184, "lr": 8.970624151668348e-05, "tps": 24153, "wall": 63395.0} {"step": 23364, "train_loss": 3.430946111679077, "lr": 8.969302413622008e-05, "tps": 24151, "wall": 63400.6} {"step": 23365, "train_loss": 3.2471632957458496, "lr": 8.967980823188109e-05, "tps": 24150, "wall": 63406.3} {"step": 23366, "train_loss": 3.311450481414795, "lr": 8.966659380381634e-05, "tps": 24149, "wall": 63411.9} {"step": 23367, "train_loss": 3.3325483798980713, "lr": 8.96533808521754e-05, "tps": 24148, "wall": 63417.5} {"step": 23368, "train_loss": 3.2445554733276367, "lr": 8.964016937710811e-05, "tps": 24147, "wall": 63423.2} {"step": 23369, "train_loss": 3.3338122367858887, "lr": 8.9626959378764e-05, "tps": 24146, "wall": 63428.8} {"step": 23370, "train_loss": 3.2402846813201904, "lr": 8.961375085729267e-05, "tps": 24145, "wall": 63434.5} {"step": 23371, "train_loss": 3.2731752395629883, "lr": 8.960054381284393e-05, "tps": 24144, "wall": 63440.1} {"step": 23372, "train_loss": 3.26464581489563, "lr": 8.958733824556726e-05, "tps": 24143, "wall": 63445.7} {"step": 23373, "train_loss": 3.299567461013794, "lr": 8.957413415561222e-05, "tps": 24141, "wall": 63451.4} {"step": 23374, "train_loss": 3.2164249420166016, "lr": 8.95609315431285e-05, "tps": 24140, "wall": 63457.2} {"step": 23375, "train_loss": 3.3207778930664062, "lr": 8.954773040826558e-05, "tps": 24139, "wall": 63462.8} {"step": 23376, "train_loss": 3.241936206817627, "lr": 8.953453075117302e-05, "tps": 24138, "wall": 63468.5} {"step": 23377, "train_loss": 3.252371311187744, "lr": 8.952133257200039e-05, "tps": 24137, "wall": 63474.1} {"step": 23378, "train_loss": 3.3452296257019043, "lr": 8.950813587089716e-05, "tps": 24136, "wall": 63479.8} {"step": 23379, "train_loss": 3.2314937114715576, "lr": 8.949494064801276e-05, "tps": 24135, "wall": 63485.4} {"step": 23380, "train_loss": 3.3244588375091553, "lr": 8.94817469034968e-05, "tps": 24134, "wall": 63491.1} {"step": 23381, "train_loss": 3.236379623413086, "lr": 8.946855463749867e-05, "tps": 24132, "wall": 63496.7} {"step": 23382, "train_loss": 3.2457401752471924, "lr": 8.945536385016777e-05, "tps": 24131, "wall": 63502.3} {"step": 23383, "train_loss": 3.291638135910034, "lr": 8.94421745416536e-05, "tps": 24130, "wall": 63507.9} {"step": 23384, "train_loss": 3.2539894580841064, "lr": 8.942898671210551e-05, "tps": 24129, "wall": 63513.6} {"step": 23385, "train_loss": 3.2187719345092773, "lr": 8.941580036167296e-05, "tps": 24128, "wall": 63519.3} {"step": 23386, "train_loss": 3.2618000507354736, "lr": 8.94026154905053e-05, "tps": 24127, "wall": 63525.0} {"step": 23387, "train_loss": 3.2831292152404785, "lr": 8.938943209875182e-05, "tps": 24126, "wall": 63530.6} {"step": 23388, "train_loss": 3.2452123165130615, "lr": 8.937625018656197e-05, "tps": 24125, "wall": 63536.3} {"step": 23389, "train_loss": 3.1953516006469727, "lr": 8.936306975408501e-05, "tps": 24124, "wall": 63541.9} {"step": 23390, "train_loss": 3.2496886253356934, "lr": 8.934989080147025e-05, "tps": 24122, "wall": 63547.6} {"step": 23391, "train_loss": 3.279738426208496, "lr": 8.933671332886704e-05, "tps": 24121, "wall": 63553.2} {"step": 23392, "train_loss": 3.254488229751587, "lr": 8.932353733642458e-05, "tps": 24120, "wall": 63558.9} {"step": 23393, "train_loss": 3.193389892578125, "lr": 8.931036282429212e-05, "tps": 24119, "wall": 63564.5} {"step": 23394, "train_loss": 3.1659669876098633, "lr": 8.929718979261898e-05, "tps": 24118, "wall": 63570.1} {"step": 23395, "train_loss": 3.334129810333252, "lr": 8.928401824155437e-05, "tps": 24117, "wall": 63575.8} {"step": 23396, "train_loss": 3.2742106914520264, "lr": 8.92708481712474e-05, "tps": 24116, "wall": 63581.4} {"step": 23397, "train_loss": 3.4347493648529053, "lr": 8.925767958184738e-05, "tps": 24115, "wall": 63587.1} {"step": 23398, "train_loss": 3.2377986907958984, "lr": 8.924451247350347e-05, "tps": 24114, "wall": 63592.7} {"step": 23399, "train_loss": 3.3920342922210693, "lr": 8.923134684636474e-05, "tps": 24112, "wall": 63598.3} {"step": 23400, "train_loss": 3.204498767852783, "lr": 8.92181827005804e-05, "tps": 24111, "wall": 63604.0} {"step": 23401, "train_loss": 3.291977882385254, "lr": 8.920502003629963e-05, "tps": 24110, "wall": 63609.7} {"step": 23402, "train_loss": 3.278954267501831, "lr": 8.919185885367133e-05, "tps": 24109, "wall": 63615.3} {"step": 23403, "train_loss": 3.334731101989746, "lr": 8.917869915284485e-05, "tps": 24108, "wall": 63620.9} {"step": 23404, "train_loss": 3.314453125, "lr": 8.916554093396908e-05, "tps": 24107, "wall": 63626.6} {"step": 23405, "train_loss": 3.1949501037597656, "lr": 8.915238419719316e-05, "tps": 24106, "wall": 63632.3} {"step": 23406, "train_loss": 3.396146774291992, "lr": 8.913922894266614e-05, "tps": 24105, "wall": 63638.1} {"step": 23407, "train_loss": 3.378174304962158, "lr": 8.912607517053695e-05, "tps": 24103, "wall": 63643.7} {"step": 23408, "train_loss": 3.3262131214141846, "lr": 8.911292288095472e-05, "tps": 24102, "wall": 63649.3} {"step": 23409, "train_loss": 3.324695110321045, "lr": 8.909977207406838e-05, "tps": 24101, "wall": 63654.9} {"step": 23410, "train_loss": 3.254737138748169, "lr": 8.908662275002683e-05, "tps": 24100, "wall": 63660.6} {"step": 23411, "train_loss": 3.3696160316467285, "lr": 8.907347490897917e-05, "tps": 24099, "wall": 63666.2} {"step": 23412, "train_loss": 3.329157829284668, "lr": 8.906032855107426e-05, "tps": 24098, "wall": 63671.8} {"step": 23413, "train_loss": 3.2814137935638428, "lr": 8.904718367646102e-05, "tps": 24097, "wall": 63677.5} {"step": 23414, "train_loss": 3.184264898300171, "lr": 8.903404028528839e-05, "tps": 24096, "wall": 63683.1} {"step": 23415, "train_loss": 3.3109450340270996, "lr": 8.902089837770523e-05, "tps": 24095, "wall": 63688.7} {"step": 23416, "train_loss": 3.2787535190582275, "lr": 8.900775795386038e-05, "tps": 24094, "wall": 63694.5} {"step": 23417, "train_loss": 3.307826042175293, "lr": 8.899461901390277e-05, "tps": 24092, "wall": 63700.2} {"step": 23418, "train_loss": 3.2599732875823975, "lr": 8.89814815579812e-05, "tps": 24091, "wall": 63705.8} {"step": 23419, "train_loss": 3.2787346839904785, "lr": 8.896834558624447e-05, "tps": 24090, "wall": 63711.5} {"step": 23420, "train_loss": 3.348217010498047, "lr": 8.895521109884144e-05, "tps": 24089, "wall": 63717.1} {"step": 23421, "train_loss": 3.3510732650756836, "lr": 8.894207809592082e-05, "tps": 24088, "wall": 63722.7} {"step": 23422, "train_loss": 3.337893486022949, "lr": 8.89289465776315e-05, "tps": 24087, "wall": 63728.4} {"step": 23423, "train_loss": 3.269526481628418, "lr": 8.891581654412214e-05, "tps": 24086, "wall": 63734.0} {"step": 23424, "train_loss": 3.355520725250244, "lr": 8.890268799554145e-05, "tps": 24085, "wall": 63739.7} {"step": 23425, "train_loss": 3.140453815460205, "lr": 8.888956093203827e-05, "tps": 24084, "wall": 63745.3} {"step": 23426, "train_loss": 3.194838047027588, "lr": 8.887643535376123e-05, "tps": 24082, "wall": 63751.0} {"step": 23427, "train_loss": 3.200532913208008, "lr": 8.886331126085896e-05, "tps": 24081, "wall": 63756.7} {"step": 23428, "train_loss": 3.232170581817627, "lr": 8.885018865348027e-05, "tps": 24080, "wall": 63762.3} {"step": 23429, "train_loss": 3.363348960876465, "lr": 8.883706753177371e-05, "tps": 24079, "wall": 63768.0} {"step": 23430, "train_loss": 3.2445056438446045, "lr": 8.882394789588792e-05, "tps": 24078, "wall": 63773.6} {"step": 23431, "train_loss": 3.2110755443573, "lr": 8.88108297459716e-05, "tps": 24077, "wall": 63779.3} {"step": 23432, "train_loss": 3.2884230613708496, "lr": 8.879771308217328e-05, "tps": 24076, "wall": 63784.9} {"step": 23433, "train_loss": 3.2475104331970215, "lr": 8.878459790464148e-05, "tps": 24075, "wall": 63790.6} {"step": 23434, "train_loss": 3.2446417808532715, "lr": 8.877148421352497e-05, "tps": 24074, "wall": 63796.3} {"step": 23435, "train_loss": 3.2560343742370605, "lr": 8.875837200897215e-05, "tps": 24072, "wall": 63802.0} {"step": 23436, "train_loss": 3.266700267791748, "lr": 8.874526129113156e-05, "tps": 24071, "wall": 63807.6} {"step": 23437, "train_loss": 3.2905328273773193, "lr": 8.873215206015179e-05, "tps": 24070, "wall": 63813.3} {"step": 23438, "train_loss": 3.178856372833252, "lr": 8.871904431618123e-05, "tps": 24069, "wall": 63819.1} {"step": 23439, "train_loss": 3.175480842590332, "lr": 8.870593805936852e-05, "tps": 24068, "wall": 63824.7} {"step": 23440, "train_loss": 3.2765610218048096, "lr": 8.869283328986204e-05, "tps": 24067, "wall": 63830.4} {"step": 23441, "train_loss": 3.151552677154541, "lr": 8.867973000781019e-05, "tps": 24066, "wall": 63836.1} {"step": 23442, "train_loss": 3.256106376647949, "lr": 8.866662821336152e-05, "tps": 24065, "wall": 63841.8} {"step": 23443, "train_loss": 3.318311929702759, "lr": 8.865352790666438e-05, "tps": 24063, "wall": 63847.5} {"step": 23444, "train_loss": 3.250209331512451, "lr": 8.864042908786714e-05, "tps": 24062, "wall": 63853.3} {"step": 23445, "train_loss": 3.2406625747680664, "lr": 8.862733175711828e-05, "tps": 24061, "wall": 63858.9} {"step": 23446, "train_loss": 3.2857820987701416, "lr": 8.86142359145661e-05, "tps": 24060, "wall": 63864.6} {"step": 23447, "train_loss": 3.1801772117614746, "lr": 8.860114156035892e-05, "tps": 24059, "wall": 63870.3} {"step": 23448, "train_loss": 3.3224048614501953, "lr": 8.858804869464519e-05, "tps": 24058, "wall": 63876.0} {"step": 23449, "train_loss": 3.2902421951293945, "lr": 8.857495731757311e-05, "tps": 24057, "wall": 63881.8} {"step": 23450, "train_loss": 3.1933531761169434, "lr": 8.856186742929102e-05, "tps": 24056, "wall": 63887.4} {"step": 23451, "train_loss": 3.2835350036621094, "lr": 8.854877902994722e-05, "tps": 24055, "wall": 63893.1} {"step": 23452, "train_loss": 3.2844743728637695, "lr": 8.853569211968999e-05, "tps": 24053, "wall": 63898.7} {"step": 23453, "train_loss": 3.261183500289917, "lr": 8.852260669866746e-05, "tps": 24052, "wall": 63904.4} {"step": 23454, "train_loss": 3.153209686279297, "lr": 8.850952276702805e-05, "tps": 24051, "wall": 63910.1} {"step": 23455, "train_loss": 3.235283136367798, "lr": 8.849644032491986e-05, "tps": 24050, "wall": 63915.8} {"step": 23456, "train_loss": 3.260373115539551, "lr": 8.848335937249105e-05, "tps": 24049, "wall": 63921.5} {"step": 23457, "train_loss": 3.397054672241211, "lr": 8.847027990988992e-05, "tps": 24048, "wall": 63927.1} {"step": 23458, "train_loss": 3.2408976554870605, "lr": 8.845720193726453e-05, "tps": 24047, "wall": 63932.8} {"step": 23459, "train_loss": 3.35750675201416, "lr": 8.844412545476311e-05, "tps": 24046, "wall": 63938.6} {"step": 23460, "train_loss": 3.1622188091278076, "lr": 8.843105046253375e-05, "tps": 24045, "wall": 63944.2} {"step": 23461, "train_loss": 3.2299013137817383, "lr": 8.841797696072454e-05, "tps": 24043, "wall": 63949.9} {"step": 23462, "train_loss": 3.314006805419922, "lr": 8.840490494948365e-05, "tps": 24042, "wall": 63955.6} {"step": 23463, "train_loss": 3.196463108062744, "lr": 8.83918344289591e-05, "tps": 24041, "wall": 63961.2} {"step": 23464, "train_loss": 3.3589508533477783, "lr": 8.837876539929894e-05, "tps": 24040, "wall": 63966.9} {"step": 23465, "train_loss": 3.294562816619873, "lr": 8.836569786065128e-05, "tps": 24039, "wall": 63972.6} {"step": 23466, "train_loss": 3.246680736541748, "lr": 8.835263181316411e-05, "tps": 24038, "wall": 63978.3} {"step": 23467, "train_loss": 3.2542340755462646, "lr": 8.833956725698543e-05, "tps": 24037, "wall": 63984.0} {"step": 23468, "train_loss": 3.2023842334747314, "lr": 8.832650419226327e-05, "tps": 24036, "wall": 63989.7} {"step": 23469, "train_loss": 3.336008310317993, "lr": 8.831344261914562e-05, "tps": 24034, "wall": 63995.5} {"step": 23470, "train_loss": 3.2161641120910645, "lr": 8.830038253778033e-05, "tps": 24033, "wall": 64001.2} {"step": 23471, "train_loss": 3.1906638145446777, "lr": 8.828732394831554e-05, "tps": 24032, "wall": 64006.9} {"step": 23472, "train_loss": 3.208465099334717, "lr": 8.827426685089902e-05, "tps": 24031, "wall": 64012.6} {"step": 23473, "train_loss": 3.314061164855957, "lr": 8.826121124567869e-05, "tps": 24030, "wall": 64018.2} {"step": 23474, "train_loss": 3.316645860671997, "lr": 8.824815713280255e-05, "tps": 24029, "wall": 64023.9} {"step": 23475, "train_loss": 3.2489311695098877, "lr": 8.823510451241837e-05, "tps": 24028, "wall": 64029.7} {"step": 23476, "train_loss": 3.1775999069213867, "lr": 8.822205338467408e-05, "tps": 24027, "wall": 64035.3} {"step": 23477, "train_loss": 3.1913602352142334, "lr": 8.82090037497175e-05, "tps": 24026, "wall": 64041.0} {"step": 23478, "train_loss": 3.2230396270751953, "lr": 8.819595560769643e-05, "tps": 24024, "wall": 64046.7} {"step": 23479, "train_loss": 3.2998063564300537, "lr": 8.818290895875874e-05, "tps": 24023, "wall": 64052.4} {"step": 23480, "train_loss": 3.3194756507873535, "lr": 8.816986380305216e-05, "tps": 24022, "wall": 64058.1} {"step": 23481, "train_loss": 3.324012041091919, "lr": 8.81568201407245e-05, "tps": 24021, "wall": 64063.8} {"step": 23482, "train_loss": 3.318159580230713, "lr": 8.814377797192354e-05, "tps": 24020, "wall": 64069.6} {"step": 23483, "train_loss": 3.314143180847168, "lr": 8.813073729679698e-05, "tps": 24019, "wall": 64075.4} {"step": 23484, "train_loss": 3.369992971420288, "lr": 8.811769811549254e-05, "tps": 24018, "wall": 64081.0} {"step": 23485, "train_loss": 3.2733898162841797, "lr": 8.810466042815798e-05, "tps": 24017, "wall": 64086.7} {"step": 23486, "train_loss": 3.1825621128082275, "lr": 8.809162423494097e-05, "tps": 24016, "wall": 64092.4} {"step": 23487, "train_loss": 3.2264153957366943, "lr": 8.807858953598914e-05, "tps": 24014, "wall": 64098.1} {"step": 23488, "train_loss": 3.2044460773468018, "lr": 8.806555633145022e-05, "tps": 24013, "wall": 64103.8} {"step": 23489, "train_loss": 3.301736354827881, "lr": 8.80525246214718e-05, "tps": 24012, "wall": 64109.5} {"step": 23490, "train_loss": 3.1817734241485596, "lr": 8.803949440620147e-05, "tps": 24011, "wall": 64115.3} {"step": 23491, "train_loss": 3.2979440689086914, "lr": 8.802646568578696e-05, "tps": 24010, "wall": 64121.0} {"step": 23492, "train_loss": 3.3131184577941895, "lr": 8.801343846037573e-05, "tps": 24009, "wall": 64126.8} {"step": 23493, "train_loss": 3.221151828765869, "lr": 8.800041273011545e-05, "tps": 24008, "wall": 64132.5} {"step": 23494, "train_loss": 3.270918369293213, "lr": 8.798738849515367e-05, "tps": 24006, "wall": 64138.3} {"step": 23495, "train_loss": 3.2598042488098145, "lr": 8.79743657556378e-05, "tps": 24005, "wall": 64144.0} {"step": 23496, "train_loss": 3.3222832679748535, "lr": 8.796134451171554e-05, "tps": 24004, "wall": 64149.7} {"step": 23497, "train_loss": 3.16232967376709, "lr": 8.794832476353427e-05, "tps": 24003, "wall": 64155.5} {"step": 23498, "train_loss": 3.280304193496704, "lr": 8.793530651124151e-05, "tps": 24002, "wall": 64161.2} {"step": 23499, "train_loss": 3.236359119415283, "lr": 8.792228975498478e-05, "tps": 24001, "wall": 64166.9} {"step": 23500, "train_loss": 3.310546875, "lr": 8.79092744949115e-05, "tps": 24000, "wall": 64172.9} {"step": 23501, "train_loss": 3.3076491355895996, "lr": 8.789626073116905e-05, "tps": 23998, "wall": 64179.0} {"step": 23502, "train_loss": 3.3241209983825684, "lr": 8.788324846390497e-05, "tps": 23997, "wall": 64184.7} {"step": 23503, "train_loss": 3.2837517261505127, "lr": 8.787023769326657e-05, "tps": 23996, "wall": 64190.5} {"step": 23504, "train_loss": 3.3679423332214355, "lr": 8.785722841940123e-05, "tps": 23995, "wall": 64196.5} {"step": 23505, "train_loss": 3.2734994888305664, "lr": 8.784422064245642e-05, "tps": 23994, "wall": 64202.3} {"step": 23506, "train_loss": 3.155986785888672, "lr": 8.783121436257941e-05, "tps": 23993, "wall": 64208.0} {"step": 23507, "train_loss": 3.2575840950012207, "lr": 8.781820957991751e-05, "tps": 23992, "wall": 64213.7} {"step": 23508, "train_loss": 3.253971576690674, "lr": 8.780520629461812e-05, "tps": 23990, "wall": 64219.5} {"step": 23509, "train_loss": 3.3137965202331543, "lr": 8.779220450682852e-05, "tps": 23989, "wall": 64225.4} {"step": 23510, "train_loss": 3.1611523628234863, "lr": 8.777920421669592e-05, "tps": 23988, "wall": 64231.4} {"step": 23511, "train_loss": 3.1743056774139404, "lr": 8.776620542436772e-05, "tps": 23987, "wall": 64237.6} {"step": 23512, "train_loss": 3.2413816452026367, "lr": 8.775320812999101e-05, "tps": 23986, "wall": 64243.4} {"step": 23513, "train_loss": 3.2032599449157715, "lr": 8.774021233371322e-05, "tps": 23984, "wall": 64249.3} {"step": 23514, "train_loss": 3.312873363494873, "lr": 8.77272180356814e-05, "tps": 23983, "wall": 64255.1} {"step": 23515, "train_loss": 3.25858736038208, "lr": 8.771422523604278e-05, "tps": 23982, "wall": 64260.9} {"step": 23516, "train_loss": 3.394881248474121, "lr": 8.770123393494462e-05, "tps": 23981, "wall": 64266.7} {"step": 23517, "train_loss": 3.264770030975342, "lr": 8.768824413253406e-05, "tps": 23980, "wall": 64272.4} {"step": 23518, "train_loss": 3.3394830226898193, "lr": 8.767525582895823e-05, "tps": 23979, "wall": 64278.1} {"step": 23519, "train_loss": 3.2058303356170654, "lr": 8.766226902436423e-05, "tps": 23978, "wall": 64283.8} {"step": 23520, "train_loss": 3.264103412628174, "lr": 8.764928371889918e-05, "tps": 23977, "wall": 64289.6} {"step": 23521, "train_loss": 3.341587543487549, "lr": 8.763629991271023e-05, "tps": 23975, "wall": 64295.4} {"step": 23522, "train_loss": 3.3040714263916016, "lr": 8.762331760594447e-05, "tps": 23974, "wall": 64301.1} {"step": 23523, "train_loss": 3.2639622688293457, "lr": 8.761033679874885e-05, "tps": 23973, "wall": 64306.9} {"step": 23524, "train_loss": 3.2924013137817383, "lr": 8.759735749127056e-05, "tps": 23972, "wall": 64312.5} {"step": 23525, "train_loss": 3.2216827869415283, "lr": 8.758437968365657e-05, "tps": 23971, "wall": 64318.2} {"step": 23526, "train_loss": 3.2784388065338135, "lr": 8.757140337605382e-05, "tps": 23970, "wall": 64323.9} {"step": 23527, "train_loss": 3.203169584274292, "lr": 8.755842856860945e-05, "tps": 23969, "wall": 64329.5} {"step": 23528, "train_loss": 3.2503609657287598, "lr": 8.754545526147036e-05, "tps": 23968, "wall": 64335.2} {"step": 23529, "train_loss": 3.136399030685425, "lr": 8.753248345478345e-05, "tps": 23967, "wall": 64340.9} {"step": 23530, "train_loss": 3.290736198425293, "lr": 8.751951314869582e-05, "tps": 23965, "wall": 64346.6} {"step": 23531, "train_loss": 3.313114643096924, "lr": 8.750654434335429e-05, "tps": 23964, "wall": 64352.2} {"step": 23532, "train_loss": 3.231090784072876, "lr": 8.749357703890575e-05, "tps": 23963, "wall": 64358.0} {"step": 23533, "train_loss": 3.300473690032959, "lr": 8.748061123549718e-05, "tps": 23962, "wall": 64363.7} {"step": 23534, "train_loss": 3.2878994941711426, "lr": 8.746764693327543e-05, "tps": 23961, "wall": 64369.5} {"step": 23535, "train_loss": 3.1897149085998535, "lr": 8.745468413238728e-05, "tps": 23960, "wall": 64375.1} {"step": 23536, "train_loss": 3.2756214141845703, "lr": 8.744172283297969e-05, "tps": 23959, "wall": 64380.8} {"step": 23537, "train_loss": 3.2695205211639404, "lr": 8.742876303519937e-05, "tps": 23958, "wall": 64386.5} {"step": 23538, "train_loss": 3.2129108905792236, "lr": 8.741580473919327e-05, "tps": 23957, "wall": 64392.1} {"step": 23539, "train_loss": 3.3039674758911133, "lr": 8.740284794510812e-05, "tps": 23956, "wall": 64397.8} {"step": 23540, "train_loss": 3.2953338623046875, "lr": 8.738989265309059e-05, "tps": 23954, "wall": 64403.4} {"step": 23541, "train_loss": 3.1812117099761963, "lr": 8.73769388632876e-05, "tps": 23953, "wall": 64409.1} {"step": 23542, "train_loss": 3.270223379135132, "lr": 8.736398657584584e-05, "tps": 23952, "wall": 64414.8} {"step": 23543, "train_loss": 3.288351058959961, "lr": 8.735103579091193e-05, "tps": 23951, "wall": 64420.5} {"step": 23544, "train_loss": 3.2467100620269775, "lr": 8.733808650863273e-05, "tps": 23950, "wall": 64426.1} {"step": 23545, "train_loss": 3.197896957397461, "lr": 8.732513872915488e-05, "tps": 23949, "wall": 64431.7} {"step": 23546, "train_loss": 3.3252599239349365, "lr": 8.731219245262497e-05, "tps": 23948, "wall": 64437.4} {"step": 23547, "train_loss": 3.2811481952667236, "lr": 8.729924767918976e-05, "tps": 23947, "wall": 64443.1} {"step": 23548, "train_loss": 3.2892799377441406, "lr": 8.728630440899587e-05, "tps": 23946, "wall": 64448.8} {"step": 23549, "train_loss": 3.2413251399993896, "lr": 8.727336264218985e-05, "tps": 23945, "wall": 64454.4} {"step": 23550, "train_loss": 3.3132529258728027, "lr": 8.726042237891841e-05, "tps": 23944, "wall": 64460.1} {"step": 23551, "train_loss": 3.183623790740967, "lr": 8.724748361932807e-05, "tps": 23943, "wall": 64465.8} {"step": 23552, "train_loss": 3.323587417602539, "lr": 8.723454636356538e-05, "tps": 23941, "wall": 64471.4} {"step": 23553, "train_loss": 3.372187376022339, "lr": 8.722161061177697e-05, "tps": 23940, "wall": 64477.2} {"step": 23554, "train_loss": 3.3108320236206055, "lr": 8.72086763641093e-05, "tps": 23939, "wall": 64482.8} {"step": 23555, "train_loss": 3.3126416206359863, "lr": 8.719574362070899e-05, "tps": 23938, "wall": 64488.5} {"step": 23556, "train_loss": 3.278956890106201, "lr": 8.718281238172245e-05, "tps": 23937, "wall": 64494.2} {"step": 23557, "train_loss": 3.2153992652893066, "lr": 8.716988264729616e-05, "tps": 23936, "wall": 64499.9} {"step": 23558, "train_loss": 3.2313263416290283, "lr": 8.71569544175767e-05, "tps": 23935, "wall": 64505.5} {"step": 23559, "train_loss": 3.410062551498413, "lr": 8.714402769271042e-05, "tps": 23934, "wall": 64511.2} {"step": 23560, "train_loss": 3.236494779586792, "lr": 8.713110247284373e-05, "tps": 23933, "wall": 64516.9} {"step": 23561, "train_loss": 3.3106179237365723, "lr": 8.711817875812316e-05, "tps": 23932, "wall": 64522.5} {"step": 23562, "train_loss": 3.2886838912963867, "lr": 8.710525654869504e-05, "tps": 23931, "wall": 64528.1} {"step": 23563, "train_loss": 3.25663423538208, "lr": 8.709233584470574e-05, "tps": 23929, "wall": 64533.8} {"step": 23564, "train_loss": 3.2266311645507812, "lr": 8.707941664630166e-05, "tps": 23928, "wall": 64539.5} {"step": 23565, "train_loss": 3.366842269897461, "lr": 8.706649895362917e-05, "tps": 23927, "wall": 64545.2} {"step": 23566, "train_loss": 3.292872905731201, "lr": 8.70535827668345e-05, "tps": 23926, "wall": 64550.8} {"step": 23567, "train_loss": 3.2373719215393066, "lr": 8.70406680860641e-05, "tps": 23925, "wall": 64556.4} {"step": 23568, "train_loss": 3.17818021774292, "lr": 8.70277549114642e-05, "tps": 23924, "wall": 64562.1} {"step": 23569, "train_loss": 3.1888818740844727, "lr": 8.701484324318103e-05, "tps": 23923, "wall": 64567.7} {"step": 23570, "train_loss": 3.3922488689422607, "lr": 8.700193308136097e-05, "tps": 23922, "wall": 64573.4} {"step": 23571, "train_loss": 3.3684234619140625, "lr": 8.698902442615015e-05, "tps": 23921, "wall": 64579.0} {"step": 23572, "train_loss": 3.34152889251709, "lr": 8.697611727769492e-05, "tps": 23920, "wall": 64584.7} {"step": 23573, "train_loss": 3.1266679763793945, "lr": 8.696321163614143e-05, "tps": 23919, "wall": 64590.3} {"step": 23574, "train_loss": 3.2939794063568115, "lr": 8.695030750163581e-05, "tps": 23918, "wall": 64596.1} {"step": 23575, "train_loss": 3.252426862716675, "lr": 8.693740487432439e-05, "tps": 23916, "wall": 64601.7} {"step": 23576, "train_loss": 3.236726760864258, "lr": 8.69245037543532e-05, "tps": 23915, "wall": 64607.4} {"step": 23577, "train_loss": 3.3091816902160645, "lr": 8.691160414186839e-05, "tps": 23914, "wall": 64613.0} {"step": 23578, "train_loss": 3.2273292541503906, "lr": 8.689870603701617e-05, "tps": 23913, "wall": 64618.7} {"step": 23579, "train_loss": 3.262967109680176, "lr": 8.688580943994265e-05, "tps": 23912, "wall": 64624.3} {"step": 23580, "train_loss": 3.2345099449157715, "lr": 8.68729143507938e-05, "tps": 23911, "wall": 64630.0} {"step": 23581, "train_loss": 3.392803907394409, "lr": 8.686002076971584e-05, "tps": 23910, "wall": 64635.7} {"step": 23582, "train_loss": 3.245913505554199, "lr": 8.684712869685476e-05, "tps": 23909, "wall": 64641.4} {"step": 23583, "train_loss": 3.324955940246582, "lr": 8.683423813235656e-05, "tps": 23908, "wall": 64647.1} {"step": 23584, "train_loss": 3.2396931648254395, "lr": 8.682134907636738e-05, "tps": 23907, "wall": 64652.7} {"step": 23585, "train_loss": 3.2807371616363525, "lr": 8.680846152903314e-05, "tps": 23906, "wall": 64658.5} {"step": 23586, "train_loss": 3.294358253479004, "lr": 8.679557549049982e-05, "tps": 23905, "wall": 64664.1} {"step": 23587, "train_loss": 3.3074851036071777, "lr": 8.678269096091347e-05, "tps": 23903, "wall": 64669.8} {"step": 23588, "train_loss": 3.307328701019287, "lr": 8.676980794042e-05, "tps": 23902, "wall": 64675.4} {"step": 23589, "train_loss": 3.344255208969116, "lr": 8.675692642916531e-05, "tps": 23901, "wall": 64681.0} {"step": 23590, "train_loss": 3.329707622528076, "lr": 8.674404642729541e-05, "tps": 23900, "wall": 64686.7} {"step": 23591, "train_loss": 3.222384214401245, "lr": 8.673116793495612e-05, "tps": 23899, "wall": 64692.3} {"step": 23592, "train_loss": 3.2592411041259766, "lr": 8.67182909522934e-05, "tps": 23898, "wall": 64697.9} {"step": 23593, "train_loss": 3.2677361965179443, "lr": 8.670541547945312e-05, "tps": 23897, "wall": 64703.6} {"step": 23594, "train_loss": 3.250107526779175, "lr": 8.669254151658104e-05, "tps": 23896, "wall": 64709.3} {"step": 23595, "train_loss": 3.358398914337158, "lr": 8.667966906382312e-05, "tps": 23895, "wall": 64715.0} {"step": 23596, "train_loss": 3.343153715133667, "lr": 8.666679812132509e-05, "tps": 23894, "wall": 64720.6} {"step": 23597, "train_loss": 3.25100040435791, "lr": 8.665392868923276e-05, "tps": 23893, "wall": 64726.3} {"step": 23598, "train_loss": 3.2726364135742188, "lr": 8.664106076769198e-05, "tps": 23892, "wall": 64732.0} {"step": 23599, "train_loss": 3.303292751312256, "lr": 8.66281943568485e-05, "tps": 23891, "wall": 64737.6} {"step": 23600, "train_loss": 3.278904914855957, "lr": 8.661532945684798e-05, "tps": 23889, "wall": 64743.3} {"step": 23601, "train_loss": 3.159665584564209, "lr": 8.660246606783627e-05, "tps": 23888, "wall": 64749.1} {"step": 23602, "train_loss": 3.2632977962493896, "lr": 8.658960418995907e-05, "tps": 23887, "wall": 64754.7} {"step": 23603, "train_loss": 3.273038387298584, "lr": 8.657674382336196e-05, "tps": 23886, "wall": 64760.4} {"step": 23604, "train_loss": 3.322331428527832, "lr": 8.656388496819079e-05, "tps": 23885, "wall": 64766.0} {"step": 23605, "train_loss": 3.2547497749328613, "lr": 8.655102762459112e-05, "tps": 23884, "wall": 64771.7} {"step": 23606, "train_loss": 3.3013815879821777, "lr": 8.653817179270862e-05, "tps": 23883, "wall": 64777.5} {"step": 23607, "train_loss": 3.205197811126709, "lr": 8.652531747268897e-05, "tps": 23882, "wall": 64783.2} {"step": 23608, "train_loss": 3.2811334133148193, "lr": 8.651246466467768e-05, "tps": 23881, "wall": 64788.8} {"step": 23609, "train_loss": 3.339432716369629, "lr": 8.649961336882047e-05, "tps": 23880, "wall": 64794.4} {"step": 23610, "train_loss": 3.1672282218933105, "lr": 8.648676358526286e-05, "tps": 23879, "wall": 64800.1} {"step": 23611, "train_loss": 3.2663402557373047, "lr": 8.647391531415037e-05, "tps": 23878, "wall": 64805.8} {"step": 23612, "train_loss": 3.388425350189209, "lr": 8.646106855562863e-05, "tps": 23876, "wall": 64811.4} {"step": 23613, "train_loss": 3.2015838623046875, "lr": 8.644822330984315e-05, "tps": 23875, "wall": 64817.1} {"step": 23614, "train_loss": 3.3109593391418457, "lr": 8.643537957693936e-05, "tps": 23874, "wall": 64822.8} {"step": 23615, "train_loss": 3.2639408111572266, "lr": 8.642253735706285e-05, "tps": 23873, "wall": 64828.4} {"step": 23616, "train_loss": 3.1955840587615967, "lr": 8.640969665035908e-05, "tps": 23872, "wall": 64834.0} {"step": 23617, "train_loss": 3.265263557434082, "lr": 8.639685745697344e-05, "tps": 23871, "wall": 64839.8} {"step": 23618, "train_loss": 3.2087795734405518, "lr": 8.638401977705149e-05, "tps": 23870, "wall": 64845.4} {"step": 23619, "train_loss": 3.288290500640869, "lr": 8.637118361073857e-05, "tps": 23869, "wall": 64851.0} {"step": 23620, "train_loss": 3.1676485538482666, "lr": 8.635834895818006e-05, "tps": 23868, "wall": 64856.7} {"step": 23621, "train_loss": 3.274815797805786, "lr": 8.634551581952148e-05, "tps": 23867, "wall": 64862.4} {"step": 23622, "train_loss": 3.2580161094665527, "lr": 8.633268419490811e-05, "tps": 23866, "wall": 64868.1} {"step": 23623, "train_loss": 3.2637643814086914, "lr": 8.631985408448526e-05, "tps": 23865, "wall": 64873.7} {"step": 23624, "train_loss": 3.3601503372192383, "lr": 8.63070254883984e-05, "tps": 23864, "wall": 64879.4} {"step": 23625, "train_loss": 3.2510271072387695, "lr": 8.629419840679274e-05, "tps": 23863, "wall": 64885.0} {"step": 23626, "train_loss": 3.2363178730010986, "lr": 8.628137283981369e-05, "tps": 23861, "wall": 64890.7} {"step": 23627, "train_loss": 3.1695573329925537, "lr": 8.626854878760648e-05, "tps": 23860, "wall": 64896.5} {"step": 23628, "train_loss": 3.2567365169525146, "lr": 8.625572625031632e-05, "tps": 23859, "wall": 64902.1} {"step": 23629, "train_loss": 3.3611412048339844, "lr": 8.62429052280886e-05, "tps": 23858, "wall": 64907.8} {"step": 23630, "train_loss": 3.1169519424438477, "lr": 8.623008572106846e-05, "tps": 23857, "wall": 64913.4} {"step": 23631, "train_loss": 3.2975549697875977, "lr": 8.621726772940111e-05, "tps": 23856, "wall": 64919.1} {"step": 23632, "train_loss": 3.33805513381958, "lr": 8.620445125323185e-05, "tps": 23855, "wall": 64924.7} {"step": 23633, "train_loss": 3.301579475402832, "lr": 8.619163629270578e-05, "tps": 23854, "wall": 64930.4} {"step": 23634, "train_loss": 3.234877109527588, "lr": 8.617882284796805e-05, "tps": 23853, "wall": 64936.1} {"step": 23635, "train_loss": 3.24070405960083, "lr": 8.61660109191639e-05, "tps": 23852, "wall": 64941.7} {"step": 23636, "train_loss": 3.199230670928955, "lr": 8.615320050643845e-05, "tps": 23851, "wall": 64947.4} {"step": 23637, "train_loss": 3.40687894821167, "lr": 8.61403916099367e-05, "tps": 23850, "wall": 64953.0} {"step": 23638, "train_loss": 3.329014778137207, "lr": 8.612758422980391e-05, "tps": 23849, "wall": 64958.8} {"step": 23639, "train_loss": 3.1963722705841064, "lr": 8.611477836618507e-05, "tps": 23847, "wall": 64964.5} {"step": 23640, "train_loss": 3.312180995941162, "lr": 8.610197401922521e-05, "tps": 23846, "wall": 64970.2} {"step": 23641, "train_loss": 3.3065900802612305, "lr": 8.608917118906951e-05, "tps": 23845, "wall": 64975.8} {"step": 23642, "train_loss": 3.3402538299560547, "lr": 8.60763698758629e-05, "tps": 23844, "wall": 64981.5} {"step": 23643, "train_loss": 3.201063632965088, "lr": 8.606357007975037e-05, "tps": 23843, "wall": 64987.2} {"step": 23644, "train_loss": 3.360959768295288, "lr": 8.605077180087701e-05, "tps": 23842, "wall": 64992.8} {"step": 23645, "train_loss": 3.2664237022399902, "lr": 8.60379750393877e-05, "tps": 23841, "wall": 64998.5} {"step": 23646, "train_loss": 3.368760824203491, "lr": 8.602517979542753e-05, "tps": 23840, "wall": 65004.2} {"step": 23647, "train_loss": 3.265781879425049, "lr": 8.601238606914135e-05, "tps": 23839, "wall": 65009.8} {"step": 23648, "train_loss": 3.2718939781188965, "lr": 8.599959386067407e-05, "tps": 23838, "wall": 65015.6} {"step": 23649, "train_loss": 3.230762243270874, "lr": 8.598680317017071e-05, "tps": 23837, "wall": 65021.3} {"step": 23650, "train_loss": 3.1989870071411133, "lr": 8.597401399777604e-05, "tps": 23836, "wall": 65026.9} {"step": 23651, "train_loss": 3.3139867782592773, "lr": 8.596122634363498e-05, "tps": 23835, "wall": 65032.5} {"step": 23652, "train_loss": 3.238007068634033, "lr": 8.594844020789243e-05, "tps": 23834, "wall": 65038.2} {"step": 23653, "train_loss": 3.2343978881835938, "lr": 8.593565559069323e-05, "tps": 23832, "wall": 65043.9} {"step": 23654, "train_loss": 3.2519679069519043, "lr": 8.592287249218212e-05, "tps": 23831, "wall": 65049.6} {"step": 23655, "train_loss": 3.30271577835083, "lr": 8.591009091250397e-05, "tps": 23830, "wall": 65055.2} {"step": 23656, "train_loss": 3.247253894805908, "lr": 8.589731085180362e-05, "tps": 23829, "wall": 65060.9} {"step": 23657, "train_loss": 3.16485595703125, "lr": 8.58845323102257e-05, "tps": 23828, "wall": 65066.5} {"step": 23658, "train_loss": 3.223886013031006, "lr": 8.587175528791513e-05, "tps": 23827, "wall": 65072.2} {"step": 23659, "train_loss": 3.2698822021484375, "lr": 8.585897978501656e-05, "tps": 23826, "wall": 65078.0} {"step": 23660, "train_loss": 3.233712673187256, "lr": 8.584620580167466e-05, "tps": 23825, "wall": 65083.6} {"step": 23661, "train_loss": 3.218235969543457, "lr": 8.583343333803428e-05, "tps": 23824, "wall": 65089.3} {"step": 23662, "train_loss": 3.2610573768615723, "lr": 8.582066239423996e-05, "tps": 23823, "wall": 65095.0} {"step": 23663, "train_loss": 3.335174560546875, "lr": 8.580789297043647e-05, "tps": 23822, "wall": 65100.6} {"step": 23664, "train_loss": 3.343693256378174, "lr": 8.579512506676844e-05, "tps": 23821, "wall": 65106.3} {"step": 23665, "train_loss": 3.325690746307373, "lr": 8.578235868338045e-05, "tps": 23820, "wall": 65111.9} {"step": 23666, "train_loss": 3.239384174346924, "lr": 8.576959382041721e-05, "tps": 23819, "wall": 65117.6} {"step": 23667, "train_loss": 3.3085570335388184, "lr": 8.575683047802325e-05, "tps": 23817, "wall": 65123.3} {"step": 23668, "train_loss": 3.236194610595703, "lr": 8.574406865634315e-05, "tps": 23816, "wall": 65128.9} {"step": 23669, "train_loss": 3.2780911922454834, "lr": 8.573130835552156e-05, "tps": 23815, "wall": 65134.6} {"step": 23670, "train_loss": 3.2552428245544434, "lr": 8.571854957570296e-05, "tps": 23814, "wall": 65140.4} {"step": 23671, "train_loss": 3.3141589164733887, "lr": 8.570579231703186e-05, "tps": 23813, "wall": 65146.0} {"step": 23672, "train_loss": 3.188225269317627, "lr": 8.569303657965283e-05, "tps": 23812, "wall": 65151.7} {"step": 23673, "train_loss": 3.202601671218872, "lr": 8.568028236371035e-05, "tps": 23811, "wall": 65157.4} {"step": 23674, "train_loss": 3.285459280014038, "lr": 8.566752966934887e-05, "tps": 23810, "wall": 65163.0} {"step": 23675, "train_loss": 3.3136935234069824, "lr": 8.565477849671293e-05, "tps": 23809, "wall": 65168.6} {"step": 23676, "train_loss": 3.3769001960754395, "lr": 8.564202884594692e-05, "tps": 23808, "wall": 65174.3} {"step": 23677, "train_loss": 3.270599603652954, "lr": 8.562928071719522e-05, "tps": 23807, "wall": 65179.9} {"step": 23678, "train_loss": 3.188563346862793, "lr": 8.561653411060237e-05, "tps": 23806, "wall": 65185.6} {"step": 23679, "train_loss": 3.271601915359497, "lr": 8.56037890263126e-05, "tps": 23805, "wall": 65191.2} {"step": 23680, "train_loss": 3.2177960872650146, "lr": 8.559104546447047e-05, "tps": 23804, "wall": 65197.0} {"step": 23681, "train_loss": 3.2850334644317627, "lr": 8.557830342522022e-05, "tps": 23803, "wall": 65202.7} {"step": 23682, "train_loss": 3.3027491569519043, "lr": 8.55655629087062e-05, "tps": 23801, "wall": 65208.3} {"step": 23683, "train_loss": 3.2154879570007324, "lr": 8.55528239150728e-05, "tps": 23800, "wall": 65213.9} {"step": 23684, "train_loss": 3.2286078929901123, "lr": 8.554008644446426e-05, "tps": 23799, "wall": 65219.6} {"step": 23685, "train_loss": 3.186558246612549, "lr": 8.552735049702485e-05, "tps": 23798, "wall": 65225.3} {"step": 23686, "train_loss": 3.194467067718506, "lr": 8.551461607289899e-05, "tps": 23797, "wall": 65230.9} {"step": 23687, "train_loss": 3.1595616340637207, "lr": 8.550188317223076e-05, "tps": 23796, "wall": 65236.5} {"step": 23688, "train_loss": 3.3209943771362305, "lr": 8.548915179516449e-05, "tps": 23795, "wall": 65242.2} {"step": 23689, "train_loss": 3.232964515686035, "lr": 8.547642194184443e-05, "tps": 23794, "wall": 65247.8} {"step": 23690, "train_loss": 3.2910454273223877, "lr": 8.546369361241462e-05, "tps": 23793, "wall": 65253.5} {"step": 23691, "train_loss": 3.251187801361084, "lr": 8.545096680701947e-05, "tps": 23792, "wall": 65259.2} {"step": 23692, "train_loss": 3.2528367042541504, "lr": 8.543824152580304e-05, "tps": 23791, "wall": 65264.8} {"step": 23693, "train_loss": 3.2186362743377686, "lr": 8.542551776890944e-05, "tps": 23790, "wall": 65270.5} {"step": 23694, "train_loss": 3.299156427383423, "lr": 8.54127955364829e-05, "tps": 23789, "wall": 65276.2} {"step": 23695, "train_loss": 3.309399127960205, "lr": 8.54000748286675e-05, "tps": 23788, "wall": 65281.8} {"step": 23696, "train_loss": 3.3918609619140625, "lr": 8.538735564560724e-05, "tps": 23787, "wall": 65287.5} {"step": 23697, "train_loss": 3.294821262359619, "lr": 8.53746379874464e-05, "tps": 23786, "wall": 65293.2} {"step": 23698, "train_loss": 3.298757314682007, "lr": 8.536192185432894e-05, "tps": 23785, "wall": 65298.8} {"step": 23699, "train_loss": 3.2548933029174805, "lr": 8.534920724639883e-05, "tps": 23784, "wall": 65304.4} {"step": 23700, "train_loss": 3.2963123321533203, "lr": 8.533649416380028e-05, "tps": 23782, "wall": 65310.1} {"step": 23701, "train_loss": 3.246089220046997, "lr": 8.53237826066772e-05, "tps": 23781, "wall": 65315.8} {"step": 23702, "train_loss": 3.292384147644043, "lr": 8.53110725751735e-05, "tps": 23780, "wall": 65321.4} {"step": 23703, "train_loss": 3.174238920211792, "lr": 8.529836406943334e-05, "tps": 23779, "wall": 65327.1} {"step": 23704, "train_loss": 3.1878740787506104, "lr": 8.528565708960054e-05, "tps": 23778, "wall": 65332.8} {"step": 23705, "train_loss": 3.358978271484375, "lr": 8.527295163581917e-05, "tps": 23777, "wall": 65338.4} {"step": 23706, "train_loss": 3.2097489833831787, "lr": 8.52602477082331e-05, "tps": 23776, "wall": 65344.0} {"step": 23707, "train_loss": 3.324949264526367, "lr": 8.524754530698615e-05, "tps": 23775, "wall": 65349.7} {"step": 23708, "train_loss": 3.341689109802246, "lr": 8.523484443222237e-05, "tps": 23774, "wall": 65355.4} {"step": 23709, "train_loss": 3.183518409729004, "lr": 8.522214508408555e-05, "tps": 23773, "wall": 65361.0} {"step": 23710, "train_loss": 3.2691848278045654, "lr": 8.520944726271951e-05, "tps": 23772, "wall": 65366.7} {"step": 23711, "train_loss": 3.3014187812805176, "lr": 8.51967509682682e-05, "tps": 23771, "wall": 65372.3} {"step": 23712, "train_loss": 3.287827253341675, "lr": 8.51840562008754e-05, "tps": 23770, "wall": 65378.1} {"step": 23713, "train_loss": 3.4024085998535156, "lr": 8.517136296068487e-05, "tps": 23769, "wall": 65383.7} {"step": 23714, "train_loss": 3.185101270675659, "lr": 8.515867124784043e-05, "tps": 23768, "wall": 65389.4} {"step": 23715, "train_loss": 3.1638717651367188, "lr": 8.514598106248587e-05, "tps": 23767, "wall": 65395.0} {"step": 23716, "train_loss": 3.218065023422241, "lr": 8.513329240476492e-05, "tps": 23766, "wall": 65400.7} {"step": 23717, "train_loss": 3.207955837249756, "lr": 8.512060527482135e-05, "tps": 23765, "wall": 65406.4} {"step": 23718, "train_loss": 3.294914722442627, "lr": 8.510791967279889e-05, "tps": 23763, "wall": 65412.0} {"step": 23719, "train_loss": 3.255138635635376, "lr": 8.509523559884113e-05, "tps": 23762, "wall": 65417.6} {"step": 23720, "train_loss": 3.175161600112915, "lr": 8.508255305309191e-05, "tps": 23761, "wall": 65423.3} {"step": 23721, "train_loss": 3.2013449668884277, "lr": 8.50698720356948e-05, "tps": 23760, "wall": 65429.0} {"step": 23722, "train_loss": 3.3194825649261475, "lr": 8.505719254679345e-05, "tps": 23759, "wall": 65434.7} {"step": 23723, "train_loss": 3.3483831882476807, "lr": 8.504451458653157e-05, "tps": 23758, "wall": 65440.4} {"step": 23724, "train_loss": 3.2095947265625, "lr": 8.503183815505269e-05, "tps": 23757, "wall": 65446.0} {"step": 23725, "train_loss": 3.1949210166931152, "lr": 8.501916325250049e-05, "tps": 23756, "wall": 65451.7} {"step": 23726, "train_loss": 3.3296773433685303, "lr": 8.500648987901851e-05, "tps": 23755, "wall": 65457.3} {"step": 23727, "train_loss": 3.2457737922668457, "lr": 8.499381803475027e-05, "tps": 23754, "wall": 65462.9} {"step": 23728, "train_loss": 3.2793283462524414, "lr": 8.49811477198394e-05, "tps": 23753, "wall": 65468.6} {"step": 23729, "train_loss": 3.2372453212738037, "lr": 8.49684789344294e-05, "tps": 23752, "wall": 65474.2} {"step": 23730, "train_loss": 3.261869430541992, "lr": 8.495581167866374e-05, "tps": 23751, "wall": 65479.8} {"step": 23731, "train_loss": 3.3583569526672363, "lr": 8.4943145952686e-05, "tps": 23750, "wall": 65485.5} {"step": 23732, "train_loss": 3.301154613494873, "lr": 8.493048175663959e-05, "tps": 23749, "wall": 65491.1} {"step": 23733, "train_loss": 3.3088574409484863, "lr": 8.491781909066793e-05, "tps": 23748, "wall": 65496.9} {"step": 23734, "train_loss": 3.2607204914093018, "lr": 8.490515795491461e-05, "tps": 23747, "wall": 65502.5} {"step": 23735, "train_loss": 3.244542121887207, "lr": 8.489249834952296e-05, "tps": 23746, "wall": 65508.1} {"step": 23736, "train_loss": 3.3037490844726562, "lr": 8.487984027463633e-05, "tps": 23745, "wall": 65513.8} {"step": 23737, "train_loss": 3.190035820007324, "lr": 8.486718373039823e-05, "tps": 23743, "wall": 65519.5} {"step": 23738, "train_loss": 3.307300329208374, "lr": 8.485452871695199e-05, "tps": 23742, "wall": 65525.1} {"step": 23739, "train_loss": 3.1618354320526123, "lr": 8.484187523444092e-05, "tps": 23741, "wall": 65530.8} {"step": 23740, "train_loss": 3.238816022872925, "lr": 8.482922328300843e-05, "tps": 23740, "wall": 65536.5} {"step": 23741, "train_loss": 3.422452688217163, "lr": 8.481657286279779e-05, "tps": 23739, "wall": 65542.1} {"step": 23742, "train_loss": 3.2100167274475098, "lr": 8.480392397395234e-05, "tps": 23738, "wall": 65547.8} {"step": 23743, "train_loss": 3.3398513793945312, "lr": 8.479127661661536e-05, "tps": 23737, "wall": 65553.4} {"step": 23744, "train_loss": 3.1554758548736572, "lr": 8.477863079093008e-05, "tps": 23736, "wall": 65559.1} {"step": 23745, "train_loss": 3.2206053733825684, "lr": 8.476598649703984e-05, "tps": 23735, "wall": 65564.8} {"step": 23746, "train_loss": 3.247964382171631, "lr": 8.47533437350878e-05, "tps": 23734, "wall": 65570.5} {"step": 23747, "train_loss": 3.4029269218444824, "lr": 8.474070250521716e-05, "tps": 23733, "wall": 65576.1} {"step": 23748, "train_loss": 3.2204325199127197, "lr": 8.47280628075712e-05, "tps": 23732, "wall": 65581.7} {"step": 23749, "train_loss": 3.136110305786133, "lr": 8.47154246422931e-05, "tps": 23731, "wall": 65587.4} {"step": 23750, "train_loss": 3.256246566772461, "lr": 8.470278800952591e-05, "tps": 23730, "wall": 65593.1} {"step": 23751, "train_loss": 3.268313407897949, "lr": 8.469015290941289e-05, "tps": 23729, "wall": 65598.8} {"step": 23752, "train_loss": 3.228048324584961, "lr": 8.467751934209716e-05, "tps": 23728, "wall": 65604.4} {"step": 23753, "train_loss": 3.205352783203125, "lr": 8.466488730772176e-05, "tps": 23727, "wall": 65610.1} {"step": 23754, "train_loss": 3.2574939727783203, "lr": 8.465225680642988e-05, "tps": 23726, "wall": 65615.8} {"step": 23755, "train_loss": 3.2731752395629883, "lr": 8.463962783836456e-05, "tps": 23725, "wall": 65621.4} {"step": 23756, "train_loss": 3.339384078979492, "lr": 8.46270004036688e-05, "tps": 23724, "wall": 65627.1} {"step": 23757, "train_loss": 3.18896746635437, "lr": 8.461437450248577e-05, "tps": 23722, "wall": 65632.8} {"step": 23758, "train_loss": 3.2543282508850098, "lr": 8.460175013495838e-05, "tps": 23721, "wall": 65638.5} {"step": 23759, "train_loss": 3.316636085510254, "lr": 8.458912730122974e-05, "tps": 23720, "wall": 65644.1} {"step": 23760, "train_loss": 3.2434611320495605, "lr": 8.457650600144278e-05, "tps": 23719, "wall": 65649.8} {"step": 23761, "train_loss": 3.377671241760254, "lr": 8.456388623574043e-05, "tps": 23718, "wall": 65655.4} {"step": 23762, "train_loss": 3.369760274887085, "lr": 8.455126800426576e-05, "tps": 23717, "wall": 65661.1} {"step": 23763, "train_loss": 3.213602066040039, "lr": 8.453865130716166e-05, "tps": 23716, "wall": 65666.7} {"step": 23764, "train_loss": 3.2025399208068848, "lr": 8.4526036144571e-05, "tps": 23715, "wall": 65672.4} {"step": 23765, "train_loss": 3.3554437160491943, "lr": 8.451342251663676e-05, "tps": 23714, "wall": 65678.1} {"step": 23766, "train_loss": 3.2877302169799805, "lr": 8.450081042350182e-05, "tps": 23713, "wall": 65683.8} {"step": 23767, "train_loss": 3.21362042427063, "lr": 8.448819986530898e-05, "tps": 23712, "wall": 65689.5} {"step": 23768, "train_loss": 3.3207926750183105, "lr": 8.44755908422012e-05, "tps": 23711, "wall": 65695.1} {"step": 23769, "train_loss": 3.1733317375183105, "lr": 8.446298335432124e-05, "tps": 23710, "wall": 65700.7} {"step": 23770, "train_loss": 3.275698184967041, "lr": 8.445037740181188e-05, "tps": 23709, "wall": 65706.4} {"step": 23771, "train_loss": 3.258441925048828, "lr": 8.443777298481605e-05, "tps": 23708, "wall": 65711.9} {"step": 23772, "train_loss": 3.3056623935699463, "lr": 8.442517010347646e-05, "tps": 23707, "wall": 65717.6} {"step": 23773, "train_loss": 3.2524595260620117, "lr": 8.441256875793581e-05, "tps": 23706, "wall": 65723.3} {"step": 23774, "train_loss": 3.293552875518799, "lr": 8.439996894833697e-05, "tps": 23705, "wall": 65729.0} {"step": 23775, "train_loss": 3.3382151126861572, "lr": 8.438737067482265e-05, "tps": 23704, "wall": 65734.7} {"step": 23776, "train_loss": 3.3217995166778564, "lr": 8.437477393753544e-05, "tps": 23703, "wall": 65740.4} {"step": 23777, "train_loss": 3.3469929695129395, "lr": 8.436217873661819e-05, "tps": 23702, "wall": 65746.0} {"step": 23778, "train_loss": 3.183016300201416, "lr": 8.434958507221347e-05, "tps": 23700, "wall": 65751.7} {"step": 23779, "train_loss": 3.2582502365112305, "lr": 8.433699294446404e-05, "tps": 23699, "wall": 65757.4} {"step": 23780, "train_loss": 3.326779365539551, "lr": 8.432440235351251e-05, "tps": 23698, "wall": 65763.0} {"step": 23781, "train_loss": 3.4007177352905273, "lr": 8.431181329950142e-05, "tps": 23697, "wall": 65768.7} {"step": 23782, "train_loss": 3.232386589050293, "lr": 8.429922578257349e-05, "tps": 23696, "wall": 65774.3} {"step": 23783, "train_loss": 3.4122824668884277, "lr": 8.428663980287129e-05, "tps": 23695, "wall": 65780.0} {"step": 23784, "train_loss": 3.257976770401001, "lr": 8.427405536053732e-05, "tps": 23694, "wall": 65785.6} {"step": 23785, "train_loss": 3.302706718444824, "lr": 8.426147245571423e-05, "tps": 23693, "wall": 65791.3} {"step": 23786, "train_loss": 3.3123085498809814, "lr": 8.424889108854454e-05, "tps": 23692, "wall": 65797.0} {"step": 23787, "train_loss": 3.1198954582214355, "lr": 8.423631125917071e-05, "tps": 23691, "wall": 65802.7} {"step": 23788, "train_loss": 3.265834093093872, "lr": 8.422373296773533e-05, "tps": 23690, "wall": 65808.4} {"step": 23789, "train_loss": 3.309640645980835, "lr": 8.421115621438086e-05, "tps": 23689, "wall": 65814.0} {"step": 23790, "train_loss": 3.283174514770508, "lr": 8.41985809992497e-05, "tps": 23688, "wall": 65819.7} {"step": 23791, "train_loss": 3.187769889831543, "lr": 8.418600732248441e-05, "tps": 23687, "wall": 65825.3} {"step": 23792, "train_loss": 3.301356792449951, "lr": 8.417343518422738e-05, "tps": 23686, "wall": 65831.0} {"step": 23793, "train_loss": 3.2783474922180176, "lr": 8.416086458462099e-05, "tps": 23685, "wall": 65836.7} {"step": 23794, "train_loss": 3.239499092102051, "lr": 8.414829552380769e-05, "tps": 23684, "wall": 65842.4} {"step": 23795, "train_loss": 3.261859655380249, "lr": 8.413572800192981e-05, "tps": 23683, "wall": 65848.0} {"step": 23796, "train_loss": 3.3289220333099365, "lr": 8.412316201912981e-05, "tps": 23682, "wall": 65853.7} {"step": 23797, "train_loss": 3.2023749351501465, "lr": 8.411059757554998e-05, "tps": 23681, "wall": 65859.4} {"step": 23798, "train_loss": 3.2387492656707764, "lr": 8.40980346713326e-05, "tps": 23680, "wall": 65865.1} {"step": 23799, "train_loss": 3.298426866531372, "lr": 8.408547330662009e-05, "tps": 23679, "wall": 65870.8} {"step": 23800, "train_loss": 3.287691116333008, "lr": 8.40729134815547e-05, "tps": 23677, "wall": 65876.5} {"step": 23801, "train_loss": 3.2662899494171143, "lr": 8.406035519627864e-05, "tps": 23676, "wall": 65882.1} {"step": 23802, "train_loss": 3.230937957763672, "lr": 8.404779845093427e-05, "tps": 23675, "wall": 65887.8} {"step": 23803, "train_loss": 3.291149139404297, "lr": 8.403524324566378e-05, "tps": 23674, "wall": 65893.5} {"step": 23804, "train_loss": 3.322887897491455, "lr": 8.402268958060941e-05, "tps": 23673, "wall": 65899.1} {"step": 23805, "train_loss": 3.341266632080078, "lr": 8.40101374559134e-05, "tps": 23672, "wall": 65904.8} {"step": 23806, "train_loss": 3.248086452484131, "lr": 8.399758687171789e-05, "tps": 23671, "wall": 65910.5} {"step": 23807, "train_loss": 3.3243520259857178, "lr": 8.398503782816503e-05, "tps": 23670, "wall": 65916.2} {"step": 23808, "train_loss": 3.3204476833343506, "lr": 8.397249032539707e-05, "tps": 23669, "wall": 65922.0} {"step": 23809, "train_loss": 3.275089979171753, "lr": 8.395994436355612e-05, "tps": 23668, "wall": 65927.6} {"step": 23810, "train_loss": 3.3034815788269043, "lr": 8.39473999427842e-05, "tps": 23667, "wall": 65933.3} {"step": 23811, "train_loss": 3.234729290008545, "lr": 8.393485706322357e-05, "tps": 23666, "wall": 65938.9} {"step": 23812, "train_loss": 3.2891154289245605, "lr": 8.392231572501616e-05, "tps": 23665, "wall": 65944.6} {"step": 23813, "train_loss": 3.3294715881347656, "lr": 8.39097759283042e-05, "tps": 23664, "wall": 65950.2} {"step": 23814, "train_loss": 3.2874152660369873, "lr": 8.389723767322963e-05, "tps": 23663, "wall": 65955.9} {"step": 23815, "train_loss": 3.1839919090270996, "lr": 8.388470095993448e-05, "tps": 23662, "wall": 65961.5} {"step": 23816, "train_loss": 3.2665891647338867, "lr": 8.387216578856087e-05, "tps": 23661, "wall": 65967.2} {"step": 23817, "train_loss": 3.2864482402801514, "lr": 8.385963215925071e-05, "tps": 23660, "wall": 65972.9} {"step": 23818, "train_loss": 3.2676568031311035, "lr": 8.384710007214596e-05, "tps": 23659, "wall": 65978.6} {"step": 23819, "train_loss": 3.262533664703369, "lr": 8.383456952738865e-05, "tps": 23658, "wall": 65984.2} {"step": 23820, "train_loss": 3.2516300678253174, "lr": 8.382204052512075e-05, "tps": 23657, "wall": 65989.9} {"step": 23821, "train_loss": 3.195286989212036, "lr": 8.380951306548406e-05, "tps": 23656, "wall": 65995.6} {"step": 23822, "train_loss": 3.3204660415649414, "lr": 8.379698714862063e-05, "tps": 23655, "wall": 66001.3} {"step": 23823, "train_loss": 3.1903533935546875, "lr": 8.378446277467228e-05, "tps": 23654, "wall": 66007.0} {"step": 23824, "train_loss": 3.230320453643799, "lr": 8.377193994378087e-05, "tps": 23652, "wall": 66012.6} {"step": 23825, "train_loss": 3.3089044094085693, "lr": 8.375941865608836e-05, "tps": 23651, "wall": 66018.3} {"step": 23826, "train_loss": 3.3715407848358154, "lr": 8.37468989117365e-05, "tps": 23650, "wall": 66024.0} {"step": 23827, "train_loss": 3.257323741912842, "lr": 8.373438071086712e-05, "tps": 23649, "wall": 66029.7} {"step": 23828, "train_loss": 3.2510173320770264, "lr": 8.372186405362207e-05, "tps": 23648, "wall": 66035.4} {"step": 23829, "train_loss": 3.200737953186035, "lr": 8.370934894014315e-05, "tps": 23647, "wall": 66041.1} {"step": 23830, "train_loss": 3.3354241847991943, "lr": 8.3696835370572e-05, "tps": 23646, "wall": 66046.7} {"step": 23831, "train_loss": 3.2116312980651855, "lr": 8.368432334505056e-05, "tps": 23645, "wall": 66052.4} {"step": 23832, "train_loss": 3.185654878616333, "lr": 8.36718128637204e-05, "tps": 23644, "wall": 66058.1} {"step": 23833, "train_loss": 3.331329822540283, "lr": 8.365930392672341e-05, "tps": 23643, "wall": 66063.8} {"step": 23834, "train_loss": 3.460986614227295, "lr": 8.364679653420116e-05, "tps": 23642, "wall": 66069.5} {"step": 23835, "train_loss": 3.2903199195861816, "lr": 8.363429068629535e-05, "tps": 23641, "wall": 66075.1} {"step": 23836, "train_loss": 3.1540091037750244, "lr": 8.36217863831477e-05, "tps": 23640, "wall": 66080.8} {"step": 23837, "train_loss": 3.3891396522521973, "lr": 8.360928362489988e-05, "tps": 23639, "wall": 66086.5} {"step": 23838, "train_loss": 3.3247921466827393, "lr": 8.359678241169338e-05, "tps": 23638, "wall": 66092.1} {"step": 23839, "train_loss": 3.239774227142334, "lr": 8.358428274366997e-05, "tps": 23637, "wall": 66097.9} {"step": 23840, "train_loss": 3.2626500129699707, "lr": 8.357178462097117e-05, "tps": 23636, "wall": 66103.6} {"step": 23841, "train_loss": 3.298128128051758, "lr": 8.355928804373854e-05, "tps": 23635, "wall": 66109.3} {"step": 23842, "train_loss": 3.2309186458587646, "lr": 8.354679301211373e-05, "tps": 23634, "wall": 66114.9} {"step": 23843, "train_loss": 3.266502857208252, "lr": 8.353429952623823e-05, "tps": 23633, "wall": 66120.6} {"step": 23844, "train_loss": 3.2770581245422363, "lr": 8.35218075862535e-05, "tps": 23632, "wall": 66126.3} {"step": 23845, "train_loss": 3.314626455307007, "lr": 8.35093171923012e-05, "tps": 23631, "wall": 66131.9} {"step": 23846, "train_loss": 3.1789491176605225, "lr": 8.349682834452271e-05, "tps": 23630, "wall": 66137.6} {"step": 23847, "train_loss": 3.259640693664551, "lr": 8.34843410430595e-05, "tps": 23629, "wall": 66143.2} {"step": 23848, "train_loss": 3.271986722946167, "lr": 8.34718552880531e-05, "tps": 23628, "wall": 66148.8} {"step": 23849, "train_loss": 3.2287652492523193, "lr": 8.345937107964485e-05, "tps": 23626, "wall": 66154.6} {"step": 23850, "train_loss": 3.2153351306915283, "lr": 8.34468884179763e-05, "tps": 23625, "wall": 66160.3} {"step": 23851, "train_loss": 3.1916184425354004, "lr": 8.343440730318878e-05, "tps": 23624, "wall": 66166.0} {"step": 23852, "train_loss": 3.3467936515808105, "lr": 8.342192773542361e-05, "tps": 23623, "wall": 66171.6} {"step": 23853, "train_loss": 3.3495290279388428, "lr": 8.340944971482232e-05, "tps": 23622, "wall": 66177.3} {"step": 23854, "train_loss": 3.2728219032287598, "lr": 8.339697324152616e-05, "tps": 23621, "wall": 66183.0} {"step": 23855, "train_loss": 3.2598330974578857, "lr": 8.338449831567647e-05, "tps": 23620, "wall": 66188.6} {"step": 23856, "train_loss": 3.316204786300659, "lr": 8.337202493741456e-05, "tps": 23619, "wall": 66194.3} {"step": 23857, "train_loss": 3.3811416625976562, "lr": 8.335955310688173e-05, "tps": 23618, "wall": 66200.0} {"step": 23858, "train_loss": 3.2407493591308594, "lr": 8.334708282421928e-05, "tps": 23617, "wall": 66205.6} {"step": 23859, "train_loss": 3.2932233810424805, "lr": 8.33346140895685e-05, "tps": 23616, "wall": 66211.2} {"step": 23860, "train_loss": 3.2671804428100586, "lr": 8.332214690307056e-05, "tps": 23615, "wall": 66217.0} {"step": 23861, "train_loss": 3.169921875, "lr": 8.330968126486678e-05, "tps": 23614, "wall": 66222.7} {"step": 23862, "train_loss": 3.459275722503662, "lr": 8.329721717509831e-05, "tps": 23613, "wall": 66228.3} {"step": 23863, "train_loss": 3.258452892303467, "lr": 8.32847546339063e-05, "tps": 23612, "wall": 66233.9} {"step": 23864, "train_loss": 3.16141414642334, "lr": 8.327229364143208e-05, "tps": 23611, "wall": 66239.6} {"step": 23865, "train_loss": 3.264531135559082, "lr": 8.325983419781668e-05, "tps": 23610, "wall": 66245.3} {"step": 23866, "train_loss": 3.1992921829223633, "lr": 8.32473763032012e-05, "tps": 23609, "wall": 66250.9} {"step": 23867, "train_loss": 3.241274118423462, "lr": 8.323491995772694e-05, "tps": 23608, "wall": 66256.6} {"step": 23868, "train_loss": 3.1496989727020264, "lr": 8.322246516153488e-05, "tps": 23607, "wall": 66262.3} {"step": 23869, "train_loss": 3.3572463989257812, "lr": 8.32100119147661e-05, "tps": 23606, "wall": 66267.9} {"step": 23870, "train_loss": 3.27150821685791, "lr": 8.319756021756175e-05, "tps": 23605, "wall": 66273.5} {"step": 23871, "train_loss": 3.24222993850708, "lr": 8.318511007006283e-05, "tps": 23604, "wall": 66279.2} {"step": 23872, "train_loss": 3.2837867736816406, "lr": 8.317266147241034e-05, "tps": 23603, "wall": 66284.9} {"step": 23873, "train_loss": 3.2498676776885986, "lr": 8.316021442474537e-05, "tps": 23602, "wall": 66290.5} {"step": 23874, "train_loss": 3.286682605743408, "lr": 8.314776892720887e-05, "tps": 23601, "wall": 66296.2} {"step": 23875, "train_loss": 3.2478861808776855, "lr": 8.313532497994192e-05, "tps": 23600, "wall": 66301.8} {"step": 23876, "train_loss": 3.19073748588562, "lr": 8.312288258308537e-05, "tps": 23599, "wall": 66307.4} {"step": 23877, "train_loss": 3.287579298019409, "lr": 8.311044173678019e-05, "tps": 23598, "wall": 66313.1} {"step": 23878, "train_loss": 3.2259559631347656, "lr": 8.309800244116737e-05, "tps": 23597, "wall": 66318.8} {"step": 23879, "train_loss": 3.280689001083374, "lr": 8.308556469638778e-05, "tps": 23596, "wall": 66324.5} {"step": 23880, "train_loss": 3.3528690338134766, "lr": 8.307312850258227e-05, "tps": 23595, "wall": 66330.1} {"step": 23881, "train_loss": 3.1730873584747314, "lr": 8.306069385989182e-05, "tps": 23594, "wall": 66335.9} {"step": 23882, "train_loss": 3.2488515377044678, "lr": 8.304826076845724e-05, "tps": 23592, "wall": 66341.6} {"step": 23883, "train_loss": 3.4200356006622314, "lr": 8.303582922841931e-05, "tps": 23591, "wall": 66347.2} {"step": 23884, "train_loss": 3.2980117797851562, "lr": 8.302339923991899e-05, "tps": 23590, "wall": 66352.9} {"step": 23885, "train_loss": 3.3002638816833496, "lr": 8.301097080309702e-05, "tps": 23589, "wall": 66358.6} {"step": 23886, "train_loss": 3.287931442260742, "lr": 8.299854391809408e-05, "tps": 23588, "wall": 66364.2} {"step": 23887, "train_loss": 3.2769739627838135, "lr": 8.298611858505114e-05, "tps": 23587, "wall": 66369.9} {"step": 23888, "train_loss": 3.2847790718078613, "lr": 8.297369480410885e-05, "tps": 23586, "wall": 66375.5} {"step": 23889, "train_loss": 3.1998696327209473, "lr": 8.296127257540792e-05, "tps": 23585, "wall": 66381.2} {"step": 23890, "train_loss": 3.253485918045044, "lr": 8.294885189908915e-05, "tps": 23584, "wall": 66386.9} {"step": 23891, "train_loss": 3.306375741958618, "lr": 8.293643277529313e-05, "tps": 23583, "wall": 66392.6} {"step": 23892, "train_loss": 3.227238416671753, "lr": 8.29240152041607e-05, "tps": 23582, "wall": 66398.3} {"step": 23893, "train_loss": 3.2530221939086914, "lr": 8.291159918583243e-05, "tps": 23581, "wall": 66404.0} {"step": 23894, "train_loss": 3.1830198764801025, "lr": 8.28991847204489e-05, "tps": 23580, "wall": 66409.6} {"step": 23895, "train_loss": 3.293290138244629, "lr": 8.288677180815092e-05, "tps": 23579, "wall": 66415.3} {"step": 23896, "train_loss": 3.342468023300171, "lr": 8.287436044907897e-05, "tps": 23578, "wall": 66421.0} {"step": 23897, "train_loss": 3.1975483894348145, "lr": 8.286195064337366e-05, "tps": 23577, "wall": 66426.6} {"step": 23898, "train_loss": 3.272228240966797, "lr": 8.284954239117561e-05, "tps": 23576, "wall": 66432.3} {"step": 23899, "train_loss": 3.2169432640075684, "lr": 8.28371356926254e-05, "tps": 23575, "wall": 66437.9} {"step": 23900, "train_loss": 3.256957530975342, "lr": 8.282473054786346e-05, "tps": 23574, "wall": 66443.6} {"step": 23901, "train_loss": 3.2544431686401367, "lr": 8.281232695703045e-05, "tps": 23573, "wall": 66449.3} {"step": 23902, "train_loss": 3.3089659214019775, "lr": 8.279992492026682e-05, "tps": 23572, "wall": 66455.0} {"step": 23903, "train_loss": 3.4197072982788086, "lr": 8.278752443771303e-05, "tps": 23571, "wall": 66460.6} {"step": 23904, "train_loss": 3.270808458328247, "lr": 8.277512550950964e-05, "tps": 23570, "wall": 66466.3} {"step": 23905, "train_loss": 3.248368263244629, "lr": 8.276272813579702e-05, "tps": 23569, "wall": 66471.9} {"step": 23906, "train_loss": 3.234952449798584, "lr": 8.27503323167156e-05, "tps": 23568, "wall": 66477.6} {"step": 23907, "train_loss": 3.299942970275879, "lr": 8.273793805240591e-05, "tps": 23567, "wall": 66483.3} {"step": 23908, "train_loss": 3.1645708084106445, "lr": 8.272554534300821e-05, "tps": 23566, "wall": 66488.9} {"step": 23909, "train_loss": 3.262439727783203, "lr": 8.271315418866304e-05, "tps": 23565, "wall": 66494.6} {"step": 23910, "train_loss": 3.301140785217285, "lr": 8.270076458951066e-05, "tps": 23564, "wall": 66500.2} {"step": 23911, "train_loss": 3.2668869495391846, "lr": 8.268837654569139e-05, "tps": 23563, "wall": 66505.9} {"step": 23912, "train_loss": 3.1846230030059814, "lr": 8.26759900573457e-05, "tps": 23562, "wall": 66511.5} {"step": 23913, "train_loss": 3.1709961891174316, "lr": 8.266360512461378e-05, "tps": 23561, "wall": 66517.3} {"step": 23914, "train_loss": 3.2491917610168457, "lr": 8.265122174763595e-05, "tps": 23560, "wall": 66522.9} {"step": 23915, "train_loss": 3.3217334747314453, "lr": 8.263883992655258e-05, "tps": 23559, "wall": 66528.6} {"step": 23916, "train_loss": 3.2832834720611572, "lr": 8.262645966150382e-05, "tps": 23558, "wall": 66534.2} {"step": 23917, "train_loss": 3.3015873432159424, "lr": 8.261408095262993e-05, "tps": 23557, "wall": 66540.0} {"step": 23918, "train_loss": 3.2454895973205566, "lr": 8.260170380007119e-05, "tps": 23556, "wall": 66545.8} {"step": 23919, "train_loss": 3.2221438884735107, "lr": 8.258932820396783e-05, "tps": 23555, "wall": 66551.4} {"step": 23920, "train_loss": 3.1926982402801514, "lr": 8.257695416445989e-05, "tps": 23554, "wall": 66557.1} {"step": 23921, "train_loss": 3.2545220851898193, "lr": 8.256458168168773e-05, "tps": 23552, "wall": 66562.8} {"step": 23922, "train_loss": 3.2275617122650146, "lr": 8.255221075579142e-05, "tps": 23551, "wall": 66568.4} {"step": 23923, "train_loss": 3.2056760787963867, "lr": 8.253984138691105e-05, "tps": 23550, "wall": 66574.1} {"step": 23924, "train_loss": 3.2612390518188477, "lr": 8.252747357518684e-05, "tps": 23549, "wall": 66579.8} {"step": 23925, "train_loss": 3.2103500366210938, "lr": 8.251510732075885e-05, "tps": 23548, "wall": 66585.5} {"step": 23926, "train_loss": 3.2425060272216797, "lr": 8.250274262376712e-05, "tps": 23547, "wall": 66591.1} {"step": 23927, "train_loss": 3.336472511291504, "lr": 8.249037948435178e-05, "tps": 23546, "wall": 66596.8} {"step": 23928, "train_loss": 3.296902656555176, "lr": 8.247801790265286e-05, "tps": 23545, "wall": 66602.5} {"step": 23929, "train_loss": 3.2695279121398926, "lr": 8.246565787881039e-05, "tps": 23544, "wall": 66608.2} {"step": 23930, "train_loss": 3.3393845558166504, "lr": 8.245329941296442e-05, "tps": 23543, "wall": 66613.8} {"step": 23931, "train_loss": 3.290109634399414, "lr": 8.244094250525488e-05, "tps": 23542, "wall": 66619.6} {"step": 23932, "train_loss": 3.2363643646240234, "lr": 8.242858715582178e-05, "tps": 23541, "wall": 66625.2} {"step": 23933, "train_loss": 3.3184003829956055, "lr": 8.241623336480513e-05, "tps": 23540, "wall": 66630.9} {"step": 23934, "train_loss": 3.323235034942627, "lr": 8.240388113234476e-05, "tps": 23539, "wall": 66636.6} {"step": 23935, "train_loss": 3.1373794078826904, "lr": 8.239153045858075e-05, "tps": 23538, "wall": 66642.3} {"step": 23936, "train_loss": 3.2493486404418945, "lr": 8.23791813436529e-05, "tps": 23537, "wall": 66647.9} {"step": 23937, "train_loss": 3.2707066535949707, "lr": 8.236683378770108e-05, "tps": 23536, "wall": 66653.6} {"step": 23938, "train_loss": 3.244783878326416, "lr": 8.235448779086528e-05, "tps": 23535, "wall": 66659.2} {"step": 23939, "train_loss": 3.2259268760681152, "lr": 8.234214335328529e-05, "tps": 23534, "wall": 66664.8} {"step": 23940, "train_loss": 3.396179437637329, "lr": 8.232980047510088e-05, "tps": 23533, "wall": 66670.5} {"step": 23941, "train_loss": 3.280940532684326, "lr": 8.231745915645197e-05, "tps": 23532, "wall": 66676.2} {"step": 23942, "train_loss": 3.258338451385498, "lr": 8.230511939747836e-05, "tps": 23531, "wall": 66681.8} {"step": 23943, "train_loss": 3.170017957687378, "lr": 8.229278119831974e-05, "tps": 23530, "wall": 66687.5} {"step": 23944, "train_loss": 3.2588155269622803, "lr": 8.2280444559116e-05, "tps": 23529, "wall": 66693.1} {"step": 23945, "train_loss": 3.306884765625, "lr": 8.226810948000681e-05, "tps": 23528, "wall": 66698.9} {"step": 23946, "train_loss": 3.176016092300415, "lr": 8.225577596113197e-05, "tps": 23527, "wall": 66704.5} {"step": 23947, "train_loss": 3.17313289642334, "lr": 8.224344400263113e-05, "tps": 23526, "wall": 66710.2} {"step": 23948, "train_loss": 3.3145499229431152, "lr": 8.223111360464397e-05, "tps": 23525, "wall": 66715.9} {"step": 23949, "train_loss": 3.2283599376678467, "lr": 8.221878476731024e-05, "tps": 23524, "wall": 66721.6} {"step": 23950, "train_loss": 3.2808966636657715, "lr": 8.22064574907696e-05, "tps": 23523, "wall": 66727.3} {"step": 23951, "train_loss": 3.221442222595215, "lr": 8.21941317751616e-05, "tps": 23522, "wall": 66732.9} {"step": 23952, "train_loss": 3.2522506713867188, "lr": 8.218180762062597e-05, "tps": 23521, "wall": 66738.6} {"step": 23953, "train_loss": 3.290372610092163, "lr": 8.216948502730229e-05, "tps": 23520, "wall": 66744.2} {"step": 23954, "train_loss": 3.2756731510162354, "lr": 8.215716399533009e-05, "tps": 23519, "wall": 66749.9} {"step": 23955, "train_loss": 3.3253939151763916, "lr": 8.214484452484905e-05, "tps": 23518, "wall": 66755.6} {"step": 23956, "train_loss": 3.289414405822754, "lr": 8.213252661599864e-05, "tps": 23517, "wall": 66761.2} {"step": 23957, "train_loss": 3.2222251892089844, "lr": 8.212021026891843e-05, "tps": 23516, "wall": 66766.9} {"step": 23958, "train_loss": 3.294785976409912, "lr": 8.210789548374795e-05, "tps": 23515, "wall": 66772.5} {"step": 23959, "train_loss": 3.298738956451416, "lr": 8.20955822606267e-05, "tps": 23514, "wall": 66778.2} {"step": 23960, "train_loss": 3.2982301712036133, "lr": 8.20832705996941e-05, "tps": 23513, "wall": 66783.9} {"step": 23961, "train_loss": 3.3129448890686035, "lr": 8.207096050108972e-05, "tps": 23512, "wall": 66789.5} {"step": 23962, "train_loss": 3.1931471824645996, "lr": 8.205865196495291e-05, "tps": 23511, "wall": 66795.1} {"step": 23963, "train_loss": 3.3243942260742188, "lr": 8.204634499142321e-05, "tps": 23510, "wall": 66800.8} {"step": 23964, "train_loss": 3.294003963470459, "lr": 8.203403958063996e-05, "tps": 23509, "wall": 66806.4} {"step": 23965, "train_loss": 3.257479190826416, "lr": 8.202173573274254e-05, "tps": 23508, "wall": 66812.1} {"step": 23966, "train_loss": 3.3577866554260254, "lr": 8.200943344787042e-05, "tps": 23507, "wall": 66817.8} {"step": 23967, "train_loss": 3.28408145904541, "lr": 8.19971327261629e-05, "tps": 23506, "wall": 66823.5} {"step": 23968, "train_loss": 3.2771458625793457, "lr": 8.198483356775926e-05, "tps": 23505, "wall": 66829.1} {"step": 23969, "train_loss": 3.3024158477783203, "lr": 8.197253597279893e-05, "tps": 23504, "wall": 66834.8} {"step": 23970, "train_loss": 3.2404305934906006, "lr": 8.196023994142122e-05, "tps": 23503, "wall": 66840.4} {"step": 23971, "train_loss": 3.17972993850708, "lr": 8.194794547376531e-05, "tps": 23502, "wall": 66846.1} {"step": 23972, "train_loss": 3.2309322357177734, "lr": 8.19356525699706e-05, "tps": 23501, "wall": 66851.8} {"step": 23973, "train_loss": 3.2338504791259766, "lr": 8.192336123017626e-05, "tps": 23500, "wall": 66857.5} {"step": 23974, "train_loss": 3.288996934890747, "lr": 8.191107145452152e-05, "tps": 23499, "wall": 66863.2} {"step": 23975, "train_loss": 3.2076940536499023, "lr": 8.189878324314568e-05, "tps": 23498, "wall": 66868.8} {"step": 23976, "train_loss": 3.2745790481567383, "lr": 8.188649659618793e-05, "tps": 23497, "wall": 66874.5} {"step": 23977, "train_loss": 3.2827115058898926, "lr": 8.187421151378732e-05, "tps": 23496, "wall": 66880.2} {"step": 23978, "train_loss": 3.2082526683807373, "lr": 8.186192799608318e-05, "tps": 23495, "wall": 66885.9} {"step": 23979, "train_loss": 3.4029431343078613, "lr": 8.18496460432146e-05, "tps": 23494, "wall": 66891.6} {"step": 23980, "train_loss": 3.2413291931152344, "lr": 8.183736565532065e-05, "tps": 23493, "wall": 66897.2} {"step": 23981, "train_loss": 3.263004779815674, "lr": 8.182508683254056e-05, "tps": 23492, "wall": 66902.9} {"step": 23982, "train_loss": 3.2416481971740723, "lr": 8.181280957501329e-05, "tps": 23491, "wall": 66908.6} {"step": 23983, "train_loss": 3.253215789794922, "lr": 8.180053388287803e-05, "tps": 23489, "wall": 66914.2} {"step": 23984, "train_loss": 3.297384262084961, "lr": 8.178825975627382e-05, "tps": 23488, "wall": 66920.0} {"step": 23985, "train_loss": 3.234926223754883, "lr": 8.177598719533963e-05, "tps": 23487, "wall": 66925.6} {"step": 23986, "train_loss": 3.196944236755371, "lr": 8.176371620021458e-05, "tps": 23486, "wall": 66931.3} {"step": 23987, "train_loss": 3.24636173248291, "lr": 8.175144677103763e-05, "tps": 23485, "wall": 66937.0} {"step": 23988, "train_loss": 3.2502429485321045, "lr": 8.173917890794773e-05, "tps": 23484, "wall": 66942.7} {"step": 23989, "train_loss": 3.3802599906921387, "lr": 8.172691261108392e-05, "tps": 23483, "wall": 66948.4} {"step": 23990, "train_loss": 3.1656999588012695, "lr": 8.171464788058514e-05, "tps": 23482, "wall": 66954.0} {"step": 23991, "train_loss": 3.3013830184936523, "lr": 8.170238471659026e-05, "tps": 23481, "wall": 66959.7} {"step": 23992, "train_loss": 3.279099464416504, "lr": 8.169012311923829e-05, "tps": 23480, "wall": 66965.3} {"step": 23993, "train_loss": 3.309575080871582, "lr": 8.167786308866809e-05, "tps": 23479, "wall": 66971.0} {"step": 23994, "train_loss": 3.2815496921539307, "lr": 8.16656046250185e-05, "tps": 23478, "wall": 66976.7} {"step": 23995, "train_loss": 3.3469111919403076, "lr": 8.165334772842848e-05, "tps": 23477, "wall": 66982.4} {"step": 23996, "train_loss": 3.3245983123779297, "lr": 8.164109239903679e-05, "tps": 23476, "wall": 66988.1} {"step": 23997, "train_loss": 3.163106679916382, "lr": 8.162883863698226e-05, "tps": 23475, "wall": 66993.7} {"step": 23998, "train_loss": 3.254929304122925, "lr": 8.161658644240378e-05, "tps": 23474, "wall": 66999.5} {"step": 23999, "train_loss": 3.2117228507995605, "lr": 8.160433581544006e-05, "tps": 23473, "wall": 67005.2} {"step": 24000, "train_loss": 3.324214458465576, "lr": 8.159208675622994e-05, "tps": 23472, "wall": 67010.8, "val_loss_monitor": 3.3287320683654036} {"step": 24001, "train_loss": 3.289940357208252, "lr": 8.157983926491218e-05, "tps": 23458, "wall": 67053.1} {"step": 24002, "train_loss": 3.235342502593994, "lr": 8.15675933416254e-05, "tps": 23457, "wall": 67058.9} {"step": 24003, "train_loss": 3.2397494316101074, "lr": 8.155534898650848e-05, "tps": 23456, "wall": 67064.6} {"step": 24004, "train_loss": 3.277367115020752, "lr": 8.154310619970004e-05, "tps": 23455, "wall": 67070.3} {"step": 24005, "train_loss": 3.220179796218872, "lr": 8.153086498133873e-05, "tps": 23454, "wall": 67076.0} {"step": 24006, "train_loss": 3.255295515060425, "lr": 8.151862533156335e-05, "tps": 23453, "wall": 67081.7} {"step": 24007, "train_loss": 3.3080878257751465, "lr": 8.150638725051245e-05, "tps": 23452, "wall": 67087.4} {"step": 24008, "train_loss": 3.2787442207336426, "lr": 8.149415073832467e-05, "tps": 23451, "wall": 67093.1} {"step": 24009, "train_loss": 3.2781686782836914, "lr": 8.148191579513869e-05, "tps": 23450, "wall": 67098.9} {"step": 24010, "train_loss": 3.2360472679138184, "lr": 8.146968242109303e-05, "tps": 23449, "wall": 67104.6} {"step": 24011, "train_loss": 3.1192517280578613, "lr": 8.145745061632627e-05, "tps": 23448, "wall": 67110.4} {"step": 24012, "train_loss": 3.242481231689453, "lr": 8.144522038097703e-05, "tps": 23447, "wall": 67116.2} {"step": 24013, "train_loss": 3.2589244842529297, "lr": 8.143299171518387e-05, "tps": 23446, "wall": 67121.9} {"step": 24014, "train_loss": 3.225554943084717, "lr": 8.142076461908521e-05, "tps": 23445, "wall": 67127.7} {"step": 24015, "train_loss": 3.2079527378082275, "lr": 8.140853909281966e-05, "tps": 23444, "wall": 67133.4} {"step": 24016, "train_loss": 3.218529462814331, "lr": 8.139631513652568e-05, "tps": 23443, "wall": 67139.1} {"step": 24017, "train_loss": 3.300391674041748, "lr": 8.138409275034171e-05, "tps": 23442, "wall": 67144.9} {"step": 24018, "train_loss": 3.259176015853882, "lr": 8.137187193440627e-05, "tps": 23441, "wall": 67150.6} {"step": 24019, "train_loss": 3.3292391300201416, "lr": 8.135965268885773e-05, "tps": 23440, "wall": 67156.3} {"step": 24020, "train_loss": 3.3312017917633057, "lr": 8.13474350138346e-05, "tps": 23439, "wall": 67162.0} {"step": 24021, "train_loss": 3.2507715225219727, "lr": 8.13352189094752e-05, "tps": 23438, "wall": 67167.7} {"step": 24022, "train_loss": 3.2465500831604004, "lr": 8.132300437591789e-05, "tps": 23437, "wall": 67173.5} {"step": 24023, "train_loss": 3.3165183067321777, "lr": 8.131079141330116e-05, "tps": 23436, "wall": 67179.3} {"step": 24024, "train_loss": 3.3475470542907715, "lr": 8.129858002176329e-05, "tps": 23435, "wall": 67185.1} {"step": 24025, "train_loss": 3.2928295135498047, "lr": 8.12863702014426e-05, "tps": 23434, "wall": 67190.8} {"step": 24026, "train_loss": 3.303652763366699, "lr": 8.127416195247741e-05, "tps": 23433, "wall": 67196.5} {"step": 24027, "train_loss": 3.326198101043701, "lr": 8.126195527500597e-05, "tps": 23432, "wall": 67202.3} {"step": 24028, "train_loss": 3.2330026626586914, "lr": 8.124975016916666e-05, "tps": 23431, "wall": 67208.1} {"step": 24029, "train_loss": 3.220808982849121, "lr": 8.123754663509768e-05, "tps": 23430, "wall": 67213.8} {"step": 24030, "train_loss": 3.2457327842712402, "lr": 8.122534467293723e-05, "tps": 23429, "wall": 67219.5} {"step": 24031, "train_loss": 3.3247785568237305, "lr": 8.121314428282363e-05, "tps": 23428, "wall": 67225.2} {"step": 24032, "train_loss": 3.317906379699707, "lr": 8.120094546489505e-05, "tps": 23427, "wall": 67230.9} {"step": 24033, "train_loss": 3.2649240493774414, "lr": 8.118874821928961e-05, "tps": 23426, "wall": 67236.8} {"step": 24034, "train_loss": 3.336101531982422, "lr": 8.117655254614561e-05, "tps": 23425, "wall": 67242.5} {"step": 24035, "train_loss": 3.205711841583252, "lr": 8.116435844560109e-05, "tps": 23424, "wall": 67248.3} {"step": 24036, "train_loss": 3.1616251468658447, "lr": 8.115216591779422e-05, "tps": 23422, "wall": 67254.0} {"step": 24037, "train_loss": 3.2906365394592285, "lr": 8.113997496286317e-05, "tps": 23421, "wall": 67259.7} {"step": 24038, "train_loss": 3.1970252990722656, "lr": 8.112778558094597e-05, "tps": 23420, "wall": 67265.4} {"step": 24039, "train_loss": 3.3591549396514893, "lr": 8.11155977721807e-05, "tps": 23419, "wall": 67271.1} {"step": 24040, "train_loss": 3.250828266143799, "lr": 8.110341153670548e-05, "tps": 23418, "wall": 67276.8} {"step": 24041, "train_loss": 3.238476514816284, "lr": 8.10912268746583e-05, "tps": 23417, "wall": 67282.5} {"step": 24042, "train_loss": 3.2175097465515137, "lr": 8.107904378617725e-05, "tps": 23416, "wall": 67288.3} {"step": 24043, "train_loss": 3.1776812076568604, "lr": 8.106686227140033e-05, "tps": 23415, "wall": 67294.0} {"step": 24044, "train_loss": 3.22575044631958, "lr": 8.105468233046547e-05, "tps": 23414, "wall": 67299.8} {"step": 24045, "train_loss": 3.28255033493042, "lr": 8.10425039635107e-05, "tps": 23413, "wall": 67305.4} {"step": 24046, "train_loss": 3.4351415634155273, "lr": 8.103032717067399e-05, "tps": 23412, "wall": 67311.1} {"step": 24047, "train_loss": 3.2715682983398438, "lr": 8.101815195209319e-05, "tps": 23411, "wall": 67316.8} {"step": 24048, "train_loss": 3.2660655975341797, "lr": 8.100597830790633e-05, "tps": 23410, "wall": 67322.5} {"step": 24049, "train_loss": 3.246771812438965, "lr": 8.099380623825125e-05, "tps": 23409, "wall": 67328.2} {"step": 24050, "train_loss": 3.2891921997070312, "lr": 8.098163574326583e-05, "tps": 23408, "wall": 67333.9} {"step": 24051, "train_loss": 3.2866621017456055, "lr": 8.0969466823088e-05, "tps": 23407, "wall": 67339.7} {"step": 24052, "train_loss": 3.4024534225463867, "lr": 8.095729947785559e-05, "tps": 23406, "wall": 67345.3} {"step": 24053, "train_loss": 3.190871477127075, "lr": 8.094513370770636e-05, "tps": 23405, "wall": 67351.1} {"step": 24054, "train_loss": 3.2162890434265137, "lr": 8.09329695127782e-05, "tps": 23404, "wall": 67356.9} {"step": 24055, "train_loss": 3.223721742630005, "lr": 8.092080689320891e-05, "tps": 23403, "wall": 67362.6} {"step": 24056, "train_loss": 3.201841354370117, "lr": 8.090864584913618e-05, "tps": 23402, "wall": 67368.3} {"step": 24057, "train_loss": 3.257877826690674, "lr": 8.089648638069788e-05, "tps": 23401, "wall": 67374.0} {"step": 24058, "train_loss": 3.362884521484375, "lr": 8.088432848803172e-05, "tps": 23400, "wall": 67379.7} {"step": 24059, "train_loss": 3.201230525970459, "lr": 8.087217217127536e-05, "tps": 23399, "wall": 67385.3} {"step": 24060, "train_loss": 3.1926169395446777, "lr": 8.086001743056661e-05, "tps": 23398, "wall": 67391.1} {"step": 24061, "train_loss": 3.242337703704834, "lr": 8.084786426604307e-05, "tps": 23397, "wall": 67396.8} {"step": 24062, "train_loss": 3.2126219272613525, "lr": 8.083571267784248e-05, "tps": 23396, "wall": 67402.5} {"step": 24063, "train_loss": 3.315294027328491, "lr": 8.08235626661025e-05, "tps": 23395, "wall": 67408.2} {"step": 24064, "train_loss": 3.3213915824890137, "lr": 8.081141423096063e-05, "tps": 23394, "wall": 67413.9} {"step": 24065, "train_loss": 3.2516136169433594, "lr": 8.079926737255468e-05, "tps": 23393, "wall": 67419.7} {"step": 24066, "train_loss": 3.2552828788757324, "lr": 8.078712209102214e-05, "tps": 23392, "wall": 67425.4} {"step": 24067, "train_loss": 3.166280746459961, "lr": 8.077497838650058e-05, "tps": 23391, "wall": 67431.1} {"step": 24068, "train_loss": 3.2368874549865723, "lr": 8.076283625912764e-05, "tps": 23390, "wall": 67436.8} {"step": 24069, "train_loss": 3.263303279876709, "lr": 8.075069570904082e-05, "tps": 23389, "wall": 67442.5} {"step": 24070, "train_loss": 3.2128078937530518, "lr": 8.07385567363776e-05, "tps": 23388, "wall": 67448.2} {"step": 24071, "train_loss": 3.115724802017212, "lr": 8.072641934127558e-05, "tps": 23387, "wall": 67454.0} {"step": 24072, "train_loss": 3.255553722381592, "lr": 8.071428352387225e-05, "tps": 23386, "wall": 67459.7} {"step": 24073, "train_loss": 3.3033838272094727, "lr": 8.070214928430498e-05, "tps": 23385, "wall": 67465.4} {"step": 24074, "train_loss": 3.3049237728118896, "lr": 8.069001662271136e-05, "tps": 23384, "wall": 67471.1} {"step": 24075, "train_loss": 3.2254581451416016, "lr": 8.067788553922875e-05, "tps": 23383, "wall": 67476.9} {"step": 24076, "train_loss": 3.325253486633301, "lr": 8.066575603399455e-05, "tps": 23382, "wall": 67482.7} {"step": 24077, "train_loss": 3.329807758331299, "lr": 8.065362810714627e-05, "tps": 23381, "wall": 67488.4} {"step": 24078, "train_loss": 3.2810325622558594, "lr": 8.064150175882115e-05, "tps": 23380, "wall": 67494.1} {"step": 24079, "train_loss": 3.2127182483673096, "lr": 8.06293769891567e-05, "tps": 23379, "wall": 67499.8} {"step": 24080, "train_loss": 3.2311789989471436, "lr": 8.061725379829021e-05, "tps": 23378, "wall": 67505.6} {"step": 24081, "train_loss": 3.4002676010131836, "lr": 8.060513218635896e-05, "tps": 23377, "wall": 67511.4} {"step": 24082, "train_loss": 3.260240316390991, "lr": 8.059301215350035e-05, "tps": 23376, "wall": 67517.1} {"step": 24083, "train_loss": 3.147409439086914, "lr": 8.058089369985166e-05, "tps": 23375, "wall": 67522.9} {"step": 24084, "train_loss": 3.261077880859375, "lr": 8.05687768255501e-05, "tps": 23374, "wall": 67528.6} {"step": 24085, "train_loss": 3.3316221237182617, "lr": 8.055666153073303e-05, "tps": 23373, "wall": 67534.3} {"step": 24086, "train_loss": 3.2689743041992188, "lr": 8.05445478155376e-05, "tps": 23372, "wall": 67540.1} {"step": 24087, "train_loss": 3.258573293685913, "lr": 8.053243568010107e-05, "tps": 23371, "wall": 67545.8} {"step": 24088, "train_loss": 3.3779191970825195, "lr": 8.052032512456069e-05, "tps": 23370, "wall": 67551.5} {"step": 24089, "train_loss": 3.202681064605713, "lr": 8.050821614905362e-05, "tps": 23369, "wall": 67557.2} {"step": 24090, "train_loss": 3.2360165119171143, "lr": 8.049610875371697e-05, "tps": 23368, "wall": 67562.9} {"step": 24091, "train_loss": 3.2053632736206055, "lr": 8.048400293868799e-05, "tps": 23367, "wall": 67568.6} {"step": 24092, "train_loss": 3.199770212173462, "lr": 8.04718987041038e-05, "tps": 23366, "wall": 67574.3} {"step": 24093, "train_loss": 3.4488911628723145, "lr": 8.045979605010139e-05, "tps": 23365, "wall": 67580.0} {"step": 24094, "train_loss": 3.2421116828918457, "lr": 8.044769497681806e-05, "tps": 23364, "wall": 67585.7} {"step": 24095, "train_loss": 3.399301767349243, "lr": 8.04355954843907e-05, "tps": 23363, "wall": 67591.4} {"step": 24096, "train_loss": 3.3137314319610596, "lr": 8.042349757295654e-05, "tps": 23362, "wall": 67597.2} {"step": 24097, "train_loss": 3.205476760864258, "lr": 8.041140124265253e-05, "tps": 23361, "wall": 67602.9} {"step": 24098, "train_loss": 3.226691484451294, "lr": 8.039930649361568e-05, "tps": 23360, "wall": 67608.6} {"step": 24099, "train_loss": 3.2389535903930664, "lr": 8.03872133259831e-05, "tps": 23359, "wall": 67614.3} {"step": 24100, "train_loss": 3.17431902885437, "lr": 8.037512173989172e-05, "tps": 23358, "wall": 67620.0} {"step": 24101, "train_loss": 3.3643834590911865, "lr": 8.036303173547845e-05, "tps": 23357, "wall": 67625.7} {"step": 24102, "train_loss": 3.1733648777008057, "lr": 8.035094331288035e-05, "tps": 23356, "wall": 67631.4} {"step": 24103, "train_loss": 3.178090810775757, "lr": 8.033885647223434e-05, "tps": 23355, "wall": 67637.1} {"step": 24104, "train_loss": 3.203537940979004, "lr": 8.032677121367726e-05, "tps": 23354, "wall": 67642.8} {"step": 24105, "train_loss": 3.345224142074585, "lr": 8.031468753734612e-05, "tps": 23353, "wall": 67648.5} {"step": 24106, "train_loss": 3.1566224098205566, "lr": 8.030260544337778e-05, "tps": 23352, "wall": 67654.1} {"step": 24107, "train_loss": 3.255141496658325, "lr": 8.029052493190901e-05, "tps": 23351, "wall": 67659.9} {"step": 24108, "train_loss": 3.272721290588379, "lr": 8.027844600307678e-05, "tps": 23350, "wall": 67665.6} {"step": 24109, "train_loss": 3.1775503158569336, "lr": 8.026636865701788e-05, "tps": 23349, "wall": 67671.3} {"step": 24110, "train_loss": 3.3440184593200684, "lr": 8.025429289386908e-05, "tps": 23348, "wall": 67677.0} {"step": 24111, "train_loss": 3.2534220218658447, "lr": 8.024221871376723e-05, "tps": 23347, "wall": 67682.7} {"step": 24112, "train_loss": 3.2809572219848633, "lr": 8.02301461168491e-05, "tps": 23346, "wall": 67688.4} {"step": 24113, "train_loss": 3.272608995437622, "lr": 8.021807510325139e-05, "tps": 23345, "wall": 67694.1} {"step": 24114, "train_loss": 3.326417922973633, "lr": 8.020600567311094e-05, "tps": 23344, "wall": 67699.8} {"step": 24115, "train_loss": 3.2916486263275146, "lr": 8.019393782656435e-05, "tps": 23343, "wall": 67705.4} {"step": 24116, "train_loss": 3.249901294708252, "lr": 8.018187156374846e-05, "tps": 23342, "wall": 67711.1} {"step": 24117, "train_loss": 3.1845767498016357, "lr": 8.016980688479991e-05, "tps": 23341, "wall": 67716.9} {"step": 24118, "train_loss": 3.222169876098633, "lr": 8.015774378985528e-05, "tps": 23340, "wall": 67722.6} {"step": 24119, "train_loss": 3.335426092147827, "lr": 8.014568227905134e-05, "tps": 23339, "wall": 67728.4} {"step": 24120, "train_loss": 3.260505437850952, "lr": 8.013362235252469e-05, "tps": 23338, "wall": 67734.1} {"step": 24121, "train_loss": 3.230780601501465, "lr": 8.012156401041189e-05, "tps": 23337, "wall": 67739.8} {"step": 24122, "train_loss": 3.3006346225738525, "lr": 8.010950725284963e-05, "tps": 23336, "wall": 67745.4} {"step": 24123, "train_loss": 3.1720941066741943, "lr": 8.009745207997441e-05, "tps": 23335, "wall": 67751.1} {"step": 24124, "train_loss": 3.224480628967285, "lr": 8.00853984919228e-05, "tps": 23334, "wall": 67756.8} {"step": 24125, "train_loss": 3.3075413703918457, "lr": 8.00733464888314e-05, "tps": 23333, "wall": 67762.5} {"step": 24126, "train_loss": 3.284749984741211, "lr": 8.006129607083672e-05, "tps": 23332, "wall": 67768.2} {"step": 24127, "train_loss": 3.2473855018615723, "lr": 8.004924723807519e-05, "tps": 23331, "wall": 67773.9} {"step": 24128, "train_loss": 3.226874828338623, "lr": 8.00371999906834e-05, "tps": 23330, "wall": 67779.7} {"step": 24129, "train_loss": 3.2472448348999023, "lr": 8.00251543287978e-05, "tps": 23329, "wall": 67785.4} {"step": 24130, "train_loss": 3.2959136962890625, "lr": 8.001311025255473e-05, "tps": 23328, "wall": 67791.1} {"step": 24131, "train_loss": 3.2526369094848633, "lr": 8.000106776209081e-05, "tps": 23327, "wall": 67796.8} {"step": 24132, "train_loss": 3.2292816638946533, "lr": 7.998902685754231e-05, "tps": 23326, "wall": 67802.5} {"step": 24133, "train_loss": 3.32236647605896, "lr": 7.997698753904572e-05, "tps": 23325, "wall": 67808.2} {"step": 24134, "train_loss": 3.1460280418395996, "lr": 7.996494980673743e-05, "tps": 23324, "wall": 67813.9} {"step": 24135, "train_loss": 3.3701133728027344, "lr": 7.995291366075369e-05, "tps": 23323, "wall": 67819.6} {"step": 24136, "train_loss": 3.2561264038085938, "lr": 7.994087910123096e-05, "tps": 23322, "wall": 67825.3} {"step": 24137, "train_loss": 3.17185640335083, "lr": 7.992884612830553e-05, "tps": 23321, "wall": 67831.0} {"step": 24138, "train_loss": 3.2416114807128906, "lr": 7.991681474211367e-05, "tps": 23320, "wall": 67836.8} {"step": 24139, "train_loss": 3.3043200969696045, "lr": 7.990478494279177e-05, "tps": 23319, "wall": 67842.5} {"step": 24140, "train_loss": 3.1778435707092285, "lr": 7.989275673047604e-05, "tps": 23318, "wall": 67848.2} {"step": 24141, "train_loss": 3.180152177810669, "lr": 7.988073010530269e-05, "tps": 23317, "wall": 67853.9} {"step": 24142, "train_loss": 3.2240936756134033, "lr": 7.986870506740805e-05, "tps": 23316, "wall": 67859.6} {"step": 24143, "train_loss": 3.2523725032806396, "lr": 7.98566816169283e-05, "tps": 23315, "wall": 67865.3} {"step": 24144, "train_loss": 3.3488597869873047, "lr": 7.984465975399959e-05, "tps": 23314, "wall": 67870.9} {"step": 24145, "train_loss": 3.2589454650878906, "lr": 7.983263947875823e-05, "tps": 23313, "wall": 67876.6} {"step": 24146, "train_loss": 3.1685235500335693, "lr": 7.98206207913403e-05, "tps": 23312, "wall": 67882.3} {"step": 24147, "train_loss": 3.271334171295166, "lr": 7.980860369188189e-05, "tps": 23311, "wall": 67887.9} {"step": 24148, "train_loss": 3.32523775100708, "lr": 7.979658818051927e-05, "tps": 23310, "wall": 67893.6} {"step": 24149, "train_loss": 3.22711443901062, "lr": 7.978457425738843e-05, "tps": 23309, "wall": 67899.3} {"step": 24150, "train_loss": 3.3099424839019775, "lr": 7.977256192262559e-05, "tps": 23308, "wall": 67905.0} {"step": 24151, "train_loss": 3.1566176414489746, "lr": 7.976055117636674e-05, "tps": 23307, "wall": 67910.7} {"step": 24152, "train_loss": 3.353250026702881, "lr": 7.97485420187479e-05, "tps": 23306, "wall": 67916.3} {"step": 24153, "train_loss": 3.3733408451080322, "lr": 7.973653444990521e-05, "tps": 23305, "wall": 67921.9} {"step": 24154, "train_loss": 3.2499356269836426, "lr": 7.972452846997463e-05, "tps": 23304, "wall": 67927.6} {"step": 24155, "train_loss": 3.213921546936035, "lr": 7.971252407909216e-05, "tps": 23303, "wall": 67933.3} {"step": 24156, "train_loss": 3.2996301651000977, "lr": 7.970052127739385e-05, "tps": 23302, "wall": 67938.9} {"step": 24157, "train_loss": 3.2375283241271973, "lr": 7.968852006501564e-05, "tps": 23301, "wall": 67944.6} {"step": 24158, "train_loss": 3.249022960662842, "lr": 7.967652044209338e-05, "tps": 23300, "wall": 67950.2} {"step": 24159, "train_loss": 3.3264031410217285, "lr": 7.966452240876314e-05, "tps": 23299, "wall": 67956.0} {"step": 24160, "train_loss": 3.3309197425842285, "lr": 7.96525259651608e-05, "tps": 23298, "wall": 67961.6} {"step": 24161, "train_loss": 3.2947909832000732, "lr": 7.96405311114222e-05, "tps": 23297, "wall": 67967.2} {"step": 24162, "train_loss": 3.282447576522827, "lr": 7.962853784768326e-05, "tps": 23296, "wall": 67972.9} {"step": 24163, "train_loss": 3.2944841384887695, "lr": 7.96165461740799e-05, "tps": 23295, "wall": 67978.6} {"step": 24164, "train_loss": 3.328176975250244, "lr": 7.960455609074782e-05, "tps": 23294, "wall": 67984.2} {"step": 24165, "train_loss": 3.2755205631256104, "lr": 7.959256759782297e-05, "tps": 23293, "wall": 67989.9} {"step": 24166, "train_loss": 3.1975772380828857, "lr": 7.95805806954411e-05, "tps": 23292, "wall": 67995.5} {"step": 24167, "train_loss": 3.2338452339172363, "lr": 7.956859538373798e-05, "tps": 23291, "wall": 68001.2} {"step": 24168, "train_loss": 3.311521530151367, "lr": 7.955661166284946e-05, "tps": 23290, "wall": 68006.8} {"step": 24169, "train_loss": 3.289900064468384, "lr": 7.954462953291118e-05, "tps": 23289, "wall": 68012.5} {"step": 24170, "train_loss": 3.318427562713623, "lr": 7.953264899405898e-05, "tps": 23288, "wall": 68018.2} {"step": 24171, "train_loss": 3.284991979598999, "lr": 7.952067004642854e-05, "tps": 23287, "wall": 68023.9} {"step": 24172, "train_loss": 3.238673210144043, "lr": 7.950869269015549e-05, "tps": 23286, "wall": 68029.5} {"step": 24173, "train_loss": 3.255751132965088, "lr": 7.949671692537562e-05, "tps": 23285, "wall": 68035.2} {"step": 24174, "train_loss": 3.2728967666625977, "lr": 7.948474275222457e-05, "tps": 23285, "wall": 68040.9} {"step": 24175, "train_loss": 3.389099359512329, "lr": 7.94727701708379e-05, "tps": 23284, "wall": 68046.5} {"step": 24176, "train_loss": 3.325833797454834, "lr": 7.946079918135129e-05, "tps": 23283, "wall": 68052.1} {"step": 24177, "train_loss": 3.2699990272521973, "lr": 7.944882978390041e-05, "tps": 23282, "wall": 68057.8} {"step": 24178, "train_loss": 3.2410800457000732, "lr": 7.94368619786207e-05, "tps": 23281, "wall": 68063.4} {"step": 24179, "train_loss": 3.211883068084717, "lr": 7.942489576564789e-05, "tps": 23280, "wall": 68069.0} {"step": 24180, "train_loss": 3.2626137733459473, "lr": 7.941293114511745e-05, "tps": 23279, "wall": 68074.7} {"step": 24181, "train_loss": 3.1073296070098877, "lr": 7.94009681171649e-05, "tps": 23278, "wall": 68080.4} {"step": 24182, "train_loss": 3.3566677570343018, "lr": 7.938900668192585e-05, "tps": 23277, "wall": 68086.1} {"step": 24183, "train_loss": 3.1437363624572754, "lr": 7.937704683953573e-05, "tps": 23276, "wall": 68091.8} {"step": 24184, "train_loss": 3.2254717350006104, "lr": 7.936508859012997e-05, "tps": 23275, "wall": 68097.4} {"step": 24185, "train_loss": 3.200413703918457, "lr": 7.935313193384415e-05, "tps": 23274, "wall": 68103.1} {"step": 24186, "train_loss": 3.3165359497070312, "lr": 7.934117687081362e-05, "tps": 23273, "wall": 68108.7} {"step": 24187, "train_loss": 3.1297948360443115, "lr": 7.932922340117386e-05, "tps": 23272, "wall": 68114.3} {"step": 24188, "train_loss": 3.249520778656006, "lr": 7.931727152506032e-05, "tps": 23271, "wall": 68120.0} {"step": 24189, "train_loss": 3.2527546882629395, "lr": 7.930532124260825e-05, "tps": 23270, "wall": 68125.7} {"step": 24190, "train_loss": 3.2346272468566895, "lr": 7.929337255395317e-05, "tps": 23269, "wall": 68131.3} {"step": 24191, "train_loss": 3.2359304428100586, "lr": 7.92814254592304e-05, "tps": 23268, "wall": 68137.1} {"step": 24192, "train_loss": 3.2245588302612305, "lr": 7.926947995857523e-05, "tps": 23267, "wall": 68142.7} {"step": 24193, "train_loss": 3.1965999603271484, "lr": 7.925753605212302e-05, "tps": 23266, "wall": 68148.4} {"step": 24194, "train_loss": 3.260668992996216, "lr": 7.9245593740009e-05, "tps": 23265, "wall": 68154.1} {"step": 24195, "train_loss": 3.3471429347991943, "lr": 7.923365302236855e-05, "tps": 23264, "wall": 68159.8} {"step": 24196, "train_loss": 3.1941776275634766, "lr": 7.922171389933692e-05, "tps": 23263, "wall": 68165.4} {"step": 24197, "train_loss": 3.295135498046875, "lr": 7.920977637104924e-05, "tps": 23262, "wall": 68171.1} {"step": 24198, "train_loss": 3.161377429962158, "lr": 7.919784043764092e-05, "tps": 23261, "wall": 68176.7} {"step": 24199, "train_loss": 3.220780611038208, "lr": 7.918590609924707e-05, "tps": 23260, "wall": 68182.4} {"step": 24200, "train_loss": 3.2398927211761475, "lr": 7.917397335600284e-05, "tps": 23259, "wall": 68188.0} {"step": 24201, "train_loss": 3.222827196121216, "lr": 7.916204220804348e-05, "tps": 23258, "wall": 68193.7} {"step": 24202, "train_loss": 3.277285575866699, "lr": 7.915011265550419e-05, "tps": 23257, "wall": 68199.4} {"step": 24203, "train_loss": 3.194079875946045, "lr": 7.913818469851992e-05, "tps": 23256, "wall": 68205.1} {"step": 24204, "train_loss": 3.404292583465576, "lr": 7.9126258337226e-05, "tps": 23255, "wall": 68210.8} {"step": 24205, "train_loss": 3.2731103897094727, "lr": 7.911433357175746e-05, "tps": 23254, "wall": 68216.4} {"step": 24206, "train_loss": 3.3354153633117676, "lr": 7.910241040224931e-05, "tps": 23253, "wall": 68222.0} {"step": 24207, "train_loss": 3.272549867630005, "lr": 7.909048882883673e-05, "tps": 23252, "wall": 68227.6} {"step": 24208, "train_loss": 3.2464516162872314, "lr": 7.90785688516547e-05, "tps": 23252, "wall": 68233.3} {"step": 24209, "train_loss": 3.3356149196624756, "lr": 7.906665047083824e-05, "tps": 23251, "wall": 68238.9} {"step": 24210, "train_loss": 3.314944267272949, "lr": 7.905473368652242e-05, "tps": 23250, "wall": 68244.6} {"step": 24211, "train_loss": 3.21962308883667, "lr": 7.904281849884214e-05, "tps": 23249, "wall": 68250.2} {"step": 24212, "train_loss": 3.201617479324341, "lr": 7.903090490793252e-05, "tps": 23248, "wall": 68255.9} {"step": 24213, "train_loss": 3.2112274169921875, "lr": 7.90189929139284e-05, "tps": 23247, "wall": 68261.6} {"step": 24214, "train_loss": 3.279115676879883, "lr": 7.900708251696473e-05, "tps": 23246, "wall": 68267.2} {"step": 24215, "train_loss": 3.2125062942504883, "lr": 7.89951737171765e-05, "tps": 23245, "wall": 68272.9} {"step": 24216, "train_loss": 3.1809043884277344, "lr": 7.898326651469856e-05, "tps": 23244, "wall": 68278.6} {"step": 24217, "train_loss": 3.2714591026306152, "lr": 7.897136090966577e-05, "tps": 23243, "wall": 68284.3} {"step": 24218, "train_loss": 3.291280746459961, "lr": 7.895945690221309e-05, "tps": 23242, "wall": 68289.9} {"step": 24219, "train_loss": 3.2954955101013184, "lr": 7.894755449247529e-05, "tps": 23241, "wall": 68295.6} {"step": 24220, "train_loss": 3.196408748626709, "lr": 7.89356536805872e-05, "tps": 23240, "wall": 68301.2} {"step": 24221, "train_loss": 3.1980233192443848, "lr": 7.89237544666837e-05, "tps": 23239, "wall": 68306.9} {"step": 24222, "train_loss": 3.3118133544921875, "lr": 7.891185685089952e-05, "tps": 23238, "wall": 68312.5} {"step": 24223, "train_loss": 3.2284200191497803, "lr": 7.889996083336942e-05, "tps": 23237, "wall": 68318.3} {"step": 24224, "train_loss": 3.2469120025634766, "lr": 7.888806641422825e-05, "tps": 23236, "wall": 68323.9} {"step": 24225, "train_loss": 3.2594799995422363, "lr": 7.88761735936107e-05, "tps": 23235, "wall": 68329.5} {"step": 24226, "train_loss": 3.256321430206299, "lr": 7.886428237165145e-05, "tps": 23234, "wall": 68335.2} {"step": 24227, "train_loss": 3.3603739738464355, "lr": 7.885239274848527e-05, "tps": 23233, "wall": 68340.8} {"step": 24228, "train_loss": 3.34440016746521, "lr": 7.884050472424678e-05, "tps": 23232, "wall": 68346.5} {"step": 24229, "train_loss": 3.361884832382202, "lr": 7.882861829907074e-05, "tps": 23231, "wall": 68352.1} {"step": 24230, "train_loss": 3.2270894050598145, "lr": 7.881673347309175e-05, "tps": 23230, "wall": 68357.8} {"step": 24231, "train_loss": 3.3323111534118652, "lr": 7.880485024644439e-05, "tps": 23229, "wall": 68363.5} {"step": 24232, "train_loss": 3.3843250274658203, "lr": 7.879296861926337e-05, "tps": 23228, "wall": 68369.1} {"step": 24233, "train_loss": 3.325112819671631, "lr": 7.878108859168326e-05, "tps": 23227, "wall": 68374.8} {"step": 24234, "train_loss": 3.339827537536621, "lr": 7.876921016383855e-05, "tps": 23226, "wall": 68380.5} {"step": 24235, "train_loss": 3.1764869689941406, "lr": 7.875733333586392e-05, "tps": 23225, "wall": 68386.2} {"step": 24236, "train_loss": 3.2204713821411133, "lr": 7.874545810789388e-05, "tps": 23224, "wall": 68391.8} {"step": 24237, "train_loss": 3.2151811122894287, "lr": 7.873358448006285e-05, "tps": 23223, "wall": 68397.5} {"step": 24238, "train_loss": 3.242428779602051, "lr": 7.872171245250549e-05, "tps": 23223, "wall": 68403.1} {"step": 24239, "train_loss": 3.2318549156188965, "lr": 7.87098420253562e-05, "tps": 23222, "wall": 68408.8} {"step": 24240, "train_loss": 3.2273826599121094, "lr": 7.869797319874943e-05, "tps": 23221, "wall": 68414.5} {"step": 24241, "train_loss": 3.3214359283447266, "lr": 7.86861059728197e-05, "tps": 23220, "wall": 68420.1} {"step": 24242, "train_loss": 3.2792248725891113, "lr": 7.867424034770142e-05, "tps": 23219, "wall": 68425.7} {"step": 24243, "train_loss": 3.252396583557129, "lr": 7.866237632352891e-05, "tps": 23218, "wall": 68431.4} {"step": 24244, "train_loss": 3.2005295753479004, "lr": 7.865051390043672e-05, "tps": 23217, "wall": 68437.1} {"step": 24245, "train_loss": 3.3548545837402344, "lr": 7.863865307855917e-05, "tps": 23216, "wall": 68442.8} {"step": 24246, "train_loss": 3.1487512588500977, "lr": 7.862679385803053e-05, "tps": 23215, "wall": 68448.4} {"step": 24247, "train_loss": 3.364048480987549, "lr": 7.861493623898528e-05, "tps": 23214, "wall": 68454.0} {"step": 24248, "train_loss": 3.335282802581787, "lr": 7.860308022155762e-05, "tps": 23213, "wall": 68459.7} {"step": 24249, "train_loss": 3.3084323406219482, "lr": 7.859122580588199e-05, "tps": 23212, "wall": 68465.3} {"step": 24250, "train_loss": 3.327432870864868, "lr": 7.857937299209258e-05, "tps": 23211, "wall": 68471.0} {"step": 24251, "train_loss": 3.1922168731689453, "lr": 7.856752178032364e-05, "tps": 23210, "wall": 68476.6} {"step": 24252, "train_loss": 3.2693819999694824, "lr": 7.855567217070951e-05, "tps": 23209, "wall": 68482.3} {"step": 24253, "train_loss": 3.3069381713867188, "lr": 7.85438241633844e-05, "tps": 23208, "wall": 68487.9} {"step": 24254, "train_loss": 3.219226121902466, "lr": 7.853197775848241e-05, "tps": 23207, "wall": 68493.6} {"step": 24255, "train_loss": 3.180330276489258, "lr": 7.852013295613792e-05, "tps": 23206, "wall": 68499.3} {"step": 24256, "train_loss": 3.3173422813415527, "lr": 7.850828975648502e-05, "tps": 23205, "wall": 68505.0} {"step": 24257, "train_loss": 3.1974496841430664, "lr": 7.849644815965778e-05, "tps": 23204, "wall": 68510.7} {"step": 24258, "train_loss": 3.2200942039489746, "lr": 7.84846081657905e-05, "tps": 23203, "wall": 68516.3} {"step": 24259, "train_loss": 3.2408008575439453, "lr": 7.847276977501722e-05, "tps": 23202, "wall": 68522.0} {"step": 24260, "train_loss": 3.2592451572418213, "lr": 7.846093298747205e-05, "tps": 23201, "wall": 68527.6} {"step": 24261, "train_loss": 3.2727441787719727, "lr": 7.844909780328913e-05, "tps": 23200, "wall": 68533.2} {"step": 24262, "train_loss": 3.2116544246673584, "lr": 7.843726422260245e-05, "tps": 23199, "wall": 68538.9} {"step": 24263, "train_loss": 3.350538730621338, "lr": 7.842543224554609e-05, "tps": 23199, "wall": 68544.5} {"step": 24264, "train_loss": 3.236544370651245, "lr": 7.841360187225411e-05, "tps": 23198, "wall": 68550.1} {"step": 24265, "train_loss": 3.1307382583618164, "lr": 7.84017731028605e-05, "tps": 23197, "wall": 68555.9} {"step": 24266, "train_loss": 3.1832661628723145, "lr": 7.838994593749927e-05, "tps": 23196, "wall": 68561.5} {"step": 24267, "train_loss": 3.1561696529388428, "lr": 7.837812037630441e-05, "tps": 23195, "wall": 68567.2} {"step": 24268, "train_loss": 3.34151291847229, "lr": 7.83662964194098e-05, "tps": 23194, "wall": 68572.8} {"step": 24269, "train_loss": 3.2782723903656006, "lr": 7.835447406694953e-05, "tps": 23193, "wall": 68578.4} {"step": 24270, "train_loss": 3.2153048515319824, "lr": 7.834265331905744e-05, "tps": 23192, "wall": 68584.1} {"step": 24271, "train_loss": 3.230875015258789, "lr": 7.833083417586733e-05, "tps": 23191, "wall": 68589.7} {"step": 24272, "train_loss": 3.2576212882995605, "lr": 7.831901663751331e-05, "tps": 23190, "wall": 68595.4} {"step": 24273, "train_loss": 3.174654483795166, "lr": 7.83072007041291e-05, "tps": 23189, "wall": 68601.0} {"step": 24274, "train_loss": 3.2059152126312256, "lr": 7.829538637584855e-05, "tps": 23188, "wall": 68606.7} {"step": 24275, "train_loss": 3.216850519180298, "lr": 7.828357365280556e-05, "tps": 23187, "wall": 68612.4} {"step": 24276, "train_loss": 3.3309926986694336, "lr": 7.827176253513394e-05, "tps": 23186, "wall": 68618.1} {"step": 24277, "train_loss": 3.2912774085998535, "lr": 7.82599530229674e-05, "tps": 23185, "wall": 68623.7} {"step": 24278, "train_loss": 3.2153236865997314, "lr": 7.824814511643983e-05, "tps": 23184, "wall": 68629.4} {"step": 24279, "train_loss": 3.1747593879699707, "lr": 7.823633881568493e-05, "tps": 23183, "wall": 68635.0} {"step": 24280, "train_loss": 3.245851993560791, "lr": 7.822453412083642e-05, "tps": 23182, "wall": 68640.7} {"step": 24281, "train_loss": 3.2013912200927734, "lr": 7.821273103202809e-05, "tps": 23181, "wall": 68646.4} {"step": 24282, "train_loss": 3.190825939178467, "lr": 7.820092954939357e-05, "tps": 23180, "wall": 68652.0} {"step": 24283, "train_loss": 3.125765800476074, "lr": 7.818912967306666e-05, "tps": 23179, "wall": 68657.7} {"step": 24284, "train_loss": 3.414231061935425, "lr": 7.817733140318093e-05, "tps": 23178, "wall": 68663.3} {"step": 24285, "train_loss": 3.377542018890381, "lr": 7.816553473987004e-05, "tps": 23177, "wall": 68669.0} {"step": 24286, "train_loss": 3.199296474456787, "lr": 7.815373968326766e-05, "tps": 23177, "wall": 68674.6} {"step": 24287, "train_loss": 3.27323842048645, "lr": 7.814194623350742e-05, "tps": 23176, "wall": 68680.3} {"step": 24288, "train_loss": 3.1166226863861084, "lr": 7.813015439072285e-05, "tps": 23175, "wall": 68686.0} {"step": 24289, "train_loss": 3.3288450241088867, "lr": 7.811836415504759e-05, "tps": 23174, "wall": 68691.7} {"step": 24290, "train_loss": 3.280496597290039, "lr": 7.81065755266152e-05, "tps": 23173, "wall": 68697.3} {"step": 24291, "train_loss": 3.174379348754883, "lr": 7.809478850555912e-05, "tps": 23172, "wall": 68703.0} {"step": 24292, "train_loss": 3.286947011947632, "lr": 7.808300309201299e-05, "tps": 23171, "wall": 68708.7} {"step": 24293, "train_loss": 3.255650520324707, "lr": 7.807121928611033e-05, "tps": 23170, "wall": 68714.3} {"step": 24294, "train_loss": 3.1613686084747314, "lr": 7.80594370879845e-05, "tps": 23169, "wall": 68719.9} {"step": 24295, "train_loss": 3.280158519744873, "lr": 7.804765649776909e-05, "tps": 23168, "wall": 68725.6} {"step": 24296, "train_loss": 3.32700252532959, "lr": 7.80358775155975e-05, "tps": 23167, "wall": 68731.2} {"step": 24297, "train_loss": 3.2784926891326904, "lr": 7.802410014160315e-05, "tps": 23166, "wall": 68737.0} {"step": 24298, "train_loss": 3.2485480308532715, "lr": 7.80123243759195e-05, "tps": 23165, "wall": 68742.6} {"step": 24299, "train_loss": 3.2688374519348145, "lr": 7.800055021867993e-05, "tps": 23164, "wall": 68748.3} {"step": 24300, "train_loss": 3.2239131927490234, "lr": 7.798877767001775e-05, "tps": 23163, "wall": 68753.9} {"step": 24301, "train_loss": 3.1934218406677246, "lr": 7.797700673006644e-05, "tps": 23162, "wall": 68759.6} {"step": 24302, "train_loss": 3.196133613586426, "lr": 7.796523739895923e-05, "tps": 23161, "wall": 68765.3} {"step": 24303, "train_loss": 3.2820634841918945, "lr": 7.795346967682955e-05, "tps": 23160, "wall": 68771.0} {"step": 24304, "train_loss": 3.1776883602142334, "lr": 7.794170356381064e-05, "tps": 23159, "wall": 68776.6} {"step": 24305, "train_loss": 3.3149163722991943, "lr": 7.792993906003574e-05, "tps": 23158, "wall": 68782.3} {"step": 24306, "train_loss": 3.28208589553833, "lr": 7.791817616563825e-05, "tps": 23157, "wall": 68787.9} {"step": 24307, "train_loss": 3.2684216499328613, "lr": 7.790641488075132e-05, "tps": 23156, "wall": 68793.5} {"step": 24308, "train_loss": 3.1543703079223633, "lr": 7.789465520550819e-05, "tps": 23155, "wall": 68799.4} {"step": 24309, "train_loss": 3.3106658458709717, "lr": 7.788289714004212e-05, "tps": 23154, "wall": 68805.1} {"step": 24310, "train_loss": 3.1997737884521484, "lr": 7.787114068448629e-05, "tps": 23154, "wall": 68810.7} {"step": 24311, "train_loss": 3.1475651264190674, "lr": 7.78593858389738e-05, "tps": 23153, "wall": 68816.4} {"step": 24312, "train_loss": 3.3809115886688232, "lr": 7.784763260363795e-05, "tps": 23152, "wall": 68822.1} {"step": 24313, "train_loss": 3.2301459312438965, "lr": 7.783588097861176e-05, "tps": 23151, "wall": 68827.7} {"step": 24314, "train_loss": 3.319425582885742, "lr": 7.782413096402842e-05, "tps": 23150, "wall": 68833.4} {"step": 24315, "train_loss": 3.258321523666382, "lr": 7.781238256002101e-05, "tps": 23149, "wall": 68839.0} {"step": 24316, "train_loss": 3.348485231399536, "lr": 7.780063576672267e-05, "tps": 23148, "wall": 68844.7} {"step": 24317, "train_loss": 3.2485857009887695, "lr": 7.778889058426632e-05, "tps": 23147, "wall": 68850.3} {"step": 24318, "train_loss": 3.3961925506591797, "lr": 7.777714701278522e-05, "tps": 23146, "wall": 68856.1} {"step": 24319, "train_loss": 3.314330577850342, "lr": 7.776540505241221e-05, "tps": 23145, "wall": 68861.7} {"step": 24320, "train_loss": 3.2788753509521484, "lr": 7.775366470328043e-05, "tps": 23144, "wall": 68867.4} {"step": 24321, "train_loss": 3.266252040863037, "lr": 7.774192596552283e-05, "tps": 23143, "wall": 68873.1} {"step": 24322, "train_loss": 3.2831082344055176, "lr": 7.773018883927236e-05, "tps": 23142, "wall": 68878.7} {"step": 24323, "train_loss": 3.1788811683654785, "lr": 7.771845332466203e-05, "tps": 23141, "wall": 68884.4} {"step": 24324, "train_loss": 3.278289318084717, "lr": 7.770671942182477e-05, "tps": 23140, "wall": 68890.0} {"step": 24325, "train_loss": 3.260507822036743, "lr": 7.769498713089344e-05, "tps": 23139, "wall": 68895.7} {"step": 24326, "train_loss": 3.27359938621521, "lr": 7.768325645200107e-05, "tps": 23138, "wall": 68901.4} {"step": 24327, "train_loss": 3.363452911376953, "lr": 7.767152738528043e-05, "tps": 23137, "wall": 68907.0} {"step": 24328, "train_loss": 3.368274211883545, "lr": 7.765979993086441e-05, "tps": 23136, "wall": 68912.7} {"step": 24329, "train_loss": 3.2501220703125, "lr": 7.76480740888859e-05, "tps": 23135, "wall": 68918.4} {"step": 24330, "train_loss": 3.2636616230010986, "lr": 7.763634985947775e-05, "tps": 23134, "wall": 68924.0} {"step": 24331, "train_loss": 3.2574400901794434, "lr": 7.762462724277263e-05, "tps": 23134, "wall": 68929.7} {"step": 24332, "train_loss": 3.2965476512908936, "lr": 7.761290623890351e-05, "tps": 23133, "wall": 68935.4} {"step": 24333, "train_loss": 3.29728364944458, "lr": 7.760118684800308e-05, "tps": 23132, "wall": 68941.0} {"step": 24334, "train_loss": 3.4077131748199463, "lr": 7.758946907020408e-05, "tps": 23131, "wall": 68946.7} {"step": 24335, "train_loss": 3.3456058502197266, "lr": 7.757775290563932e-05, "tps": 23130, "wall": 68952.3} {"step": 24336, "train_loss": 3.349839687347412, "lr": 7.75660383544414e-05, "tps": 23129, "wall": 68958.0} {"step": 24337, "train_loss": 3.209582805633545, "lr": 7.75543254167432e-05, "tps": 23128, "wall": 68963.7} {"step": 24338, "train_loss": 3.238352060317993, "lr": 7.754261409267727e-05, "tps": 23127, "wall": 68969.4} {"step": 24339, "train_loss": 3.132467269897461, "lr": 7.753090438237629e-05, "tps": 23126, "wall": 68975.1} {"step": 24340, "train_loss": 3.2645926475524902, "lr": 7.751919628597298e-05, "tps": 23125, "wall": 68980.8} {"step": 24341, "train_loss": 3.2679648399353027, "lr": 7.75074898035999e-05, "tps": 23124, "wall": 68986.6} {"step": 24342, "train_loss": 3.325352191925049, "lr": 7.749578493538966e-05, "tps": 23123, "wall": 68992.2} {"step": 24343, "train_loss": 3.254202365875244, "lr": 7.748408168147492e-05, "tps": 23122, "wall": 68997.8} {"step": 24344, "train_loss": 3.277026653289795, "lr": 7.74723800419882e-05, "tps": 23121, "wall": 69003.4} {"step": 24345, "train_loss": 3.248073101043701, "lr": 7.746068001706204e-05, "tps": 23120, "wall": 69009.1} {"step": 24346, "train_loss": 3.2325501441955566, "lr": 7.744898160682903e-05, "tps": 23119, "wall": 69014.8} {"step": 24347, "train_loss": 3.302281379699707, "lr": 7.743728481142169e-05, "tps": 23118, "wall": 69020.4} {"step": 24348, "train_loss": 3.1900508403778076, "lr": 7.742558963097245e-05, "tps": 23117, "wall": 69026.0} {"step": 24349, "train_loss": 3.2564034461975098, "lr": 7.741389606561389e-05, "tps": 23116, "wall": 69031.7} {"step": 24350, "train_loss": 3.2766709327697754, "lr": 7.740220411547843e-05, "tps": 23115, "wall": 69037.4} {"step": 24351, "train_loss": 3.2735507488250732, "lr": 7.739051378069846e-05, "tps": 23115, "wall": 69043.1} {"step": 24352, "train_loss": 3.2293758392333984, "lr": 7.737882506140653e-05, "tps": 23114, "wall": 69048.8} {"step": 24353, "train_loss": 3.296154260635376, "lr": 7.736713795773498e-05, "tps": 23113, "wall": 69054.4} {"step": 24354, "train_loss": 3.2550196647644043, "lr": 7.735545246981614e-05, "tps": 23112, "wall": 69060.1} {"step": 24355, "train_loss": 3.33174991607666, "lr": 7.734376859778251e-05, "tps": 23111, "wall": 69065.8} {"step": 24356, "train_loss": 3.2615184783935547, "lr": 7.733208634176634e-05, "tps": 23110, "wall": 69071.4} {"step": 24357, "train_loss": 3.186750888824463, "lr": 7.732040570190007e-05, "tps": 23109, "wall": 69077.1} {"step": 24358, "train_loss": 3.2994933128356934, "lr": 7.730872667831596e-05, "tps": 23108, "wall": 69082.7} {"step": 24359, "train_loss": 3.275893449783325, "lr": 7.729704927114627e-05, "tps": 23107, "wall": 69088.4} {"step": 24360, "train_loss": 3.2674665451049805, "lr": 7.728537348052337e-05, "tps": 23106, "wall": 69094.1} {"step": 24361, "train_loss": 3.157848358154297, "lr": 7.727369930657946e-05, "tps": 23105, "wall": 69099.8} {"step": 24362, "train_loss": 3.216790199279785, "lr": 7.726202674944682e-05, "tps": 23104, "wall": 69105.5} {"step": 24363, "train_loss": 3.1795787811279297, "lr": 7.725035580925768e-05, "tps": 23103, "wall": 69111.1} {"step": 24364, "train_loss": 3.231388807296753, "lr": 7.723868648614416e-05, "tps": 23102, "wall": 69116.8} {"step": 24365, "train_loss": 3.314570188522339, "lr": 7.722701878023859e-05, "tps": 23101, "wall": 69122.6} {"step": 24366, "train_loss": 3.1963939666748047, "lr": 7.721535269167307e-05, "tps": 23100, "wall": 69128.2} {"step": 24367, "train_loss": 3.120779037475586, "lr": 7.720368822057969e-05, "tps": 23099, "wall": 69133.8} {"step": 24368, "train_loss": 3.2148990631103516, "lr": 7.719202536709074e-05, "tps": 23098, "wall": 69139.5} {"step": 24369, "train_loss": 3.2927045822143555, "lr": 7.718036413133822e-05, "tps": 23097, "wall": 69145.1} {"step": 24370, "train_loss": 3.2392702102661133, "lr": 7.716870451345424e-05, "tps": 23097, "wall": 69150.7} {"step": 24371, "train_loss": 3.2031447887420654, "lr": 7.715704651357092e-05, "tps": 23096, "wall": 69156.5} {"step": 24372, "train_loss": 3.2367286682128906, "lr": 7.714539013182034e-05, "tps": 23095, "wall": 69162.1} {"step": 24373, "train_loss": 3.3029041290283203, "lr": 7.713373536833443e-05, "tps": 23094, "wall": 69167.8} {"step": 24374, "train_loss": 3.27945613861084, "lr": 7.712208222324535e-05, "tps": 23093, "wall": 69173.4} {"step": 24375, "train_loss": 3.3009326457977295, "lr": 7.711043069668505e-05, "tps": 23092, "wall": 69179.1} {"step": 24376, "train_loss": 3.252354383468628, "lr": 7.709878078878549e-05, "tps": 23091, "wall": 69184.7} {"step": 24377, "train_loss": 3.20487904548645, "lr": 7.708713249967871e-05, "tps": 23090, "wall": 69190.3} {"step": 24378, "train_loss": 3.235100030899048, "lr": 7.707548582949662e-05, "tps": 23089, "wall": 69196.0} {"step": 24379, "train_loss": 3.3266539573669434, "lr": 7.706384077837112e-05, "tps": 23088, "wall": 69201.6} {"step": 24380, "train_loss": 3.2459402084350586, "lr": 7.70521973464342e-05, "tps": 23087, "wall": 69207.2} {"step": 24381, "train_loss": 3.1959123611450195, "lr": 7.704055553381769e-05, "tps": 23086, "wall": 69212.8} {"step": 24382, "train_loss": 3.2870869636535645, "lr": 7.702891534065353e-05, "tps": 23085, "wall": 69218.6} {"step": 24383, "train_loss": 3.2562758922576904, "lr": 7.701727676707356e-05, "tps": 23084, "wall": 69224.3} {"step": 24384, "train_loss": 3.227665424346924, "lr": 7.700563981320959e-05, "tps": 23083, "wall": 69230.0} {"step": 24385, "train_loss": 3.297719955444336, "lr": 7.699400447919347e-05, "tps": 23082, "wall": 69235.6} {"step": 24386, "train_loss": 3.1714441776275635, "lr": 7.698237076515704e-05, "tps": 23081, "wall": 69241.3} {"step": 24387, "train_loss": 3.219996929168701, "lr": 7.697073867123197e-05, "tps": 23081, "wall": 69246.9} {"step": 24388, "train_loss": 3.1429123878479004, "lr": 7.69591081975502e-05, "tps": 23080, "wall": 69252.6} {"step": 24389, "train_loss": 3.232510566711426, "lr": 7.694747934424337e-05, "tps": 23079, "wall": 69258.3} {"step": 24390, "train_loss": 3.2685956954956055, "lr": 7.693585211144317e-05, "tps": 23078, "wall": 69264.0} {"step": 24391, "train_loss": 3.179983139038086, "lr": 7.692422649928145e-05, "tps": 23077, "wall": 69269.7} {"step": 24392, "train_loss": 3.332146406173706, "lr": 7.691260250788982e-05, "tps": 23076, "wall": 69275.4} {"step": 24393, "train_loss": 3.1953001022338867, "lr": 7.690098013739992e-05, "tps": 23075, "wall": 69281.0} {"step": 24394, "train_loss": 3.319108009338379, "lr": 7.68893593879435e-05, "tps": 23074, "wall": 69286.7} {"step": 24395, "train_loss": 3.285867691040039, "lr": 7.687774025965219e-05, "tps": 23073, "wall": 69292.4} {"step": 24396, "train_loss": 3.268404483795166, "lr": 7.68661227526575e-05, "tps": 23072, "wall": 69298.0} {"step": 24397, "train_loss": 3.2559657096862793, "lr": 7.685450686709117e-05, "tps": 23071, "wall": 69303.6} {"step": 24398, "train_loss": 3.138500213623047, "lr": 7.684289260308469e-05, "tps": 23070, "wall": 69309.3} {"step": 24399, "train_loss": 3.333199977874756, "lr": 7.68312799607697e-05, "tps": 23069, "wall": 69314.9} {"step": 24400, "train_loss": 3.1898837089538574, "lr": 7.681966894027775e-05, "tps": 23068, "wall": 69320.6} {"step": 24401, "train_loss": 3.3556079864501953, "lr": 7.680805954174026e-05, "tps": 23067, "wall": 69326.3} {"step": 24402, "train_loss": 3.209420680999756, "lr": 7.679645176528886e-05, "tps": 23066, "wall": 69331.9} {"step": 24403, "train_loss": 3.3395698070526123, "lr": 7.678484561105502e-05, "tps": 23065, "wall": 69337.7} {"step": 24404, "train_loss": 3.308736562728882, "lr": 7.677324107917015e-05, "tps": 23065, "wall": 69343.3} {"step": 24405, "train_loss": 3.3058533668518066, "lr": 7.67616381697658e-05, "tps": 23064, "wall": 69349.0} {"step": 24406, "train_loss": 3.289414405822754, "lr": 7.675003688297336e-05, "tps": 23063, "wall": 69354.6} {"step": 24407, "train_loss": 3.1837759017944336, "lr": 7.673843721892417e-05, "tps": 23062, "wall": 69360.3} {"step": 24408, "train_loss": 3.204453945159912, "lr": 7.672683917774982e-05, "tps": 23061, "wall": 69365.9} {"step": 24409, "train_loss": 3.200859546661377, "lr": 7.671524275958155e-05, "tps": 23060, "wall": 69371.6} {"step": 24410, "train_loss": 3.1061339378356934, "lr": 7.670364796455072e-05, "tps": 23059, "wall": 69377.2} {"step": 24411, "train_loss": 3.2733287811279297, "lr": 7.669205479278876e-05, "tps": 23058, "wall": 69382.9} {"step": 24412, "train_loss": 3.2302639484405518, "lr": 7.668046324442697e-05, "tps": 23057, "wall": 69388.6} {"step": 24413, "train_loss": 3.267744541168213, "lr": 7.66688733195966e-05, "tps": 23056, "wall": 69394.2} {"step": 24414, "train_loss": 3.304499626159668, "lr": 7.665728501842903e-05, "tps": 23055, "wall": 69400.0} {"step": 24415, "train_loss": 3.212745428085327, "lr": 7.664569834105544e-05, "tps": 23054, "wall": 69405.6} {"step": 24416, "train_loss": 3.208160400390625, "lr": 7.663411328760717e-05, "tps": 23053, "wall": 69411.3} {"step": 24417, "train_loss": 3.252671241760254, "lr": 7.662252985821544e-05, "tps": 23052, "wall": 69417.0} {"step": 24418, "train_loss": 3.098104476928711, "lr": 7.661094805301137e-05, "tps": 23051, "wall": 69422.6} {"step": 24419, "train_loss": 3.2186996936798096, "lr": 7.659936787212633e-05, "tps": 23050, "wall": 69428.3} {"step": 24420, "train_loss": 3.271786689758301, "lr": 7.658778931569137e-05, "tps": 23050, "wall": 69433.9} {"step": 24421, "train_loss": 3.191284656524658, "lr": 7.657621238383767e-05, "tps": 23049, "wall": 69439.6} {"step": 24422, "train_loss": 3.315418243408203, "lr": 7.656463707669643e-05, "tps": 23048, "wall": 69445.3} {"step": 24423, "train_loss": 3.2786974906921387, "lr": 7.655306339439876e-05, "tps": 23047, "wall": 69451.0} {"step": 24424, "train_loss": 3.279376983642578, "lr": 7.654149133707566e-05, "tps": 23046, "wall": 69456.7} {"step": 24425, "train_loss": 3.191232681274414, "lr": 7.65299209048584e-05, "tps": 23045, "wall": 69462.4} {"step": 24426, "train_loss": 3.2059426307678223, "lr": 7.651835209787793e-05, "tps": 23044, "wall": 69468.1} {"step": 24427, "train_loss": 3.3340516090393066, "lr": 7.650678491626529e-05, "tps": 23043, "wall": 69473.7} {"step": 24428, "train_loss": 3.30556058883667, "lr": 7.649521936015158e-05, "tps": 23042, "wall": 69479.4} {"step": 24429, "train_loss": 3.26906681060791, "lr": 7.648365542966782e-05, "tps": 23041, "wall": 69485.0} {"step": 24430, "train_loss": 3.2303307056427, "lr": 7.647209312494491e-05, "tps": 23040, "wall": 69490.7} {"step": 24431, "train_loss": 3.2876577377319336, "lr": 7.646053244611396e-05, "tps": 23039, "wall": 69496.3} {"step": 24432, "train_loss": 3.286785125732422, "lr": 7.644897339330586e-05, "tps": 23038, "wall": 69501.9} {"step": 24433, "train_loss": 3.2187228202819824, "lr": 7.643741596665148e-05, "tps": 23037, "wall": 69507.6} {"step": 24434, "train_loss": 3.1324892044067383, "lr": 7.642586016628189e-05, "tps": 23036, "wall": 69513.2} {"step": 24435, "train_loss": 3.2909576892852783, "lr": 7.641430599232786e-05, "tps": 23035, "wall": 69519.0} {"step": 24436, "train_loss": 3.154383659362793, "lr": 7.64027534449204e-05, "tps": 23035, "wall": 69524.6} {"step": 24437, "train_loss": 3.292365312576294, "lr": 7.639120252419032e-05, "tps": 23034, "wall": 69530.3} {"step": 24438, "train_loss": 3.1518027782440186, "lr": 7.637965323026842e-05, "tps": 23033, "wall": 69535.9} {"step": 24439, "train_loss": 3.2456345558166504, "lr": 7.636810556328562e-05, "tps": 23032, "wall": 69541.6} {"step": 24440, "train_loss": 3.282658815383911, "lr": 7.635655952337269e-05, "tps": 23031, "wall": 69547.2} {"step": 24441, "train_loss": 3.1982309818267822, "lr": 7.634501511066039e-05, "tps": 23029, "wall": 69554.8} {"step": 24442, "train_loss": 3.271031618118286, "lr": 7.633347232527954e-05, "tps": 23028, "wall": 69561.2} {"step": 24443, "train_loss": 3.2060017585754395, "lr": 7.632193116736093e-05, "tps": 23027, "wall": 69567.1} {"step": 24444, "train_loss": 3.256770133972168, "lr": 7.63103916370352e-05, "tps": 23026, "wall": 69572.7} {"step": 24445, "train_loss": 3.2182483673095703, "lr": 7.629885373443316e-05, "tps": 23025, "wall": 69578.5} {"step": 24446, "train_loss": 3.121979236602783, "lr": 7.628731745968548e-05, "tps": 23024, "wall": 69584.2} {"step": 24447, "train_loss": 3.2769412994384766, "lr": 7.62757828129228e-05, "tps": 23023, "wall": 69590.0} {"step": 24448, "train_loss": 3.2451794147491455, "lr": 7.62642497942759e-05, "tps": 23022, "wall": 69596.1} {"step": 24449, "train_loss": 3.2856831550598145, "lr": 7.625271840387532e-05, "tps": 23021, "wall": 69601.8} {"step": 24450, "train_loss": 3.2841432094573975, "lr": 7.624118864185168e-05, "tps": 23020, "wall": 69607.6} {"step": 24451, "train_loss": 3.240211009979248, "lr": 7.62296605083357e-05, "tps": 23019, "wall": 69613.6} {"step": 24452, "train_loss": 3.265566825866699, "lr": 7.621813400345783e-05, "tps": 23018, "wall": 69619.5} {"step": 24453, "train_loss": 3.258350372314453, "lr": 7.620660912734878e-05, "tps": 23017, "wall": 69625.2} {"step": 24454, "train_loss": 3.2723495960235596, "lr": 7.619508588013904e-05, "tps": 23016, "wall": 69631.1} {"step": 24455, "train_loss": 3.2985219955444336, "lr": 7.618356426195907e-05, "tps": 23015, "wall": 69636.9} {"step": 24456, "train_loss": 3.156802177429199, "lr": 7.617204427293954e-05, "tps": 23014, "wall": 69642.6} {"step": 24457, "train_loss": 3.2676918506622314, "lr": 7.616052591321089e-05, "tps": 23013, "wall": 69648.8} {"step": 24458, "train_loss": 3.2001254558563232, "lr": 7.614900918290351e-05, "tps": 23012, "wall": 69654.6} {"step": 24459, "train_loss": 3.252556562423706, "lr": 7.613749408214799e-05, "tps": 23011, "wall": 69660.4} {"step": 24460, "train_loss": 3.2116072177886963, "lr": 7.612598061107472e-05, "tps": 23010, "wall": 69666.2} {"step": 24461, "train_loss": 3.2653191089630127, "lr": 7.611446876981407e-05, "tps": 23009, "wall": 69672.0} {"step": 24462, "train_loss": 3.24143123626709, "lr": 7.610295855849656e-05, "tps": 23008, "wall": 69677.8} {"step": 24463, "train_loss": 3.2674520015716553, "lr": 7.609144997725252e-05, "tps": 23007, "wall": 69683.5} {"step": 24464, "train_loss": 3.2520358562469482, "lr": 7.607994302621227e-05, "tps": 23006, "wall": 69689.4} {"step": 24465, "train_loss": 3.309535503387451, "lr": 7.606843770550627e-05, "tps": 23005, "wall": 69695.5} {"step": 24466, "train_loss": 3.2893097400665283, "lr": 7.605693401526477e-05, "tps": 23004, "wall": 69701.6} {"step": 24467, "train_loss": 3.2271981239318848, "lr": 7.604543195561808e-05, "tps": 23003, "wall": 69707.5} {"step": 24468, "train_loss": 3.288012742996216, "lr": 7.603393152669658e-05, "tps": 23002, "wall": 69713.4} {"step": 24469, "train_loss": 3.2747745513916016, "lr": 7.602243272863043e-05, "tps": 23001, "wall": 69719.2} {"step": 24470, "train_loss": 3.3579423427581787, "lr": 7.601093556155e-05, "tps": 23000, "wall": 69724.9} {"step": 24471, "train_loss": 3.159966468811035, "lr": 7.599944002558548e-05, "tps": 22999, "wall": 69730.5} {"step": 24472, "train_loss": 3.173353910446167, "lr": 7.598794612086704e-05, "tps": 22998, "wall": 69736.2} {"step": 24473, "train_loss": 3.241218328475952, "lr": 7.597645384752501e-05, "tps": 22998, "wall": 69741.9} {"step": 24474, "train_loss": 3.282318592071533, "lr": 7.596496320568946e-05, "tps": 22997, "wall": 69747.7} {"step": 24475, "train_loss": 3.142350673675537, "lr": 7.59534741954906e-05, "tps": 22996, "wall": 69753.5} {"step": 24476, "train_loss": 3.2852137088775635, "lr": 7.59419868170586e-05, "tps": 22995, "wall": 69759.4} {"step": 24477, "train_loss": 3.3016934394836426, "lr": 7.593050107052355e-05, "tps": 22994, "wall": 69765.3} {"step": 24478, "train_loss": 3.1619322299957275, "lr": 7.591901695601556e-05, "tps": 22993, "wall": 69771.1} {"step": 24479, "train_loss": 3.248579740524292, "lr": 7.590753447366478e-05, "tps": 22992, "wall": 69776.9} {"step": 24480, "train_loss": 3.21632981300354, "lr": 7.589605362360124e-05, "tps": 22991, "wall": 69782.8} {"step": 24481, "train_loss": 3.386197566986084, "lr": 7.588457440595495e-05, "tps": 22990, "wall": 69788.7} {"step": 24482, "train_loss": 3.374488115310669, "lr": 7.587309682085606e-05, "tps": 22989, "wall": 69794.5} {"step": 24483, "train_loss": 3.3343169689178467, "lr": 7.586162086843452e-05, "tps": 22988, "wall": 69800.4} {"step": 24484, "train_loss": 3.2943525314331055, "lr": 7.585014654882028e-05, "tps": 22987, "wall": 69806.3} {"step": 24485, "train_loss": 3.2644832134246826, "lr": 7.583867386214343e-05, "tps": 22986, "wall": 69812.0} {"step": 24486, "train_loss": 3.178266763687134, "lr": 7.582720280853387e-05, "tps": 22985, "wall": 69817.9} {"step": 24487, "train_loss": 3.3031163215637207, "lr": 7.581573338812152e-05, "tps": 22984, "wall": 69824.1} {"step": 24488, "train_loss": 3.4353749752044678, "lr": 7.58042656010364e-05, "tps": 22982, "wall": 69830.7} {"step": 24489, "train_loss": 3.284517526626587, "lr": 7.579279944740829e-05, "tps": 22981, "wall": 69837.5} {"step": 24490, "train_loss": 3.2192606925964355, "lr": 7.578133492736724e-05, "tps": 22980, "wall": 69843.3} {"step": 24491, "train_loss": 3.2949087619781494, "lr": 7.576987204104297e-05, "tps": 22979, "wall": 69849.2} {"step": 24492, "train_loss": 3.1564037799835205, "lr": 7.575841078856538e-05, "tps": 22978, "wall": 69855.4} {"step": 24493, "train_loss": 3.281010389328003, "lr": 7.574695117006436e-05, "tps": 22977, "wall": 69861.6} {"step": 24494, "train_loss": 3.2971301078796387, "lr": 7.573549318566968e-05, "tps": 22976, "wall": 69867.7} {"step": 24495, "train_loss": 3.3296031951904297, "lr": 7.572403683551109e-05, "tps": 22975, "wall": 69873.5} {"step": 24496, "train_loss": 3.3171448707580566, "lr": 7.571258211971846e-05, "tps": 22974, "wall": 69879.3} {"step": 24497, "train_loss": 3.21630597114563, "lr": 7.570112903842151e-05, "tps": 22973, "wall": 69885.1} {"step": 24498, "train_loss": 3.3153748512268066, "lr": 7.568967759174993e-05, "tps": 22972, "wall": 69890.9} {"step": 24499, "train_loss": 3.391386032104492, "lr": 7.567822777983352e-05, "tps": 22971, "wall": 69896.9} {"step": 24500, "train_loss": 3.2277650833129883, "lr": 7.566677960280198e-05, "tps": 22970, "wall": 69902.8} {"step": 24501, "train_loss": 3.3262345790863037, "lr": 7.565533306078492e-05, "tps": 22969, "wall": 69908.8} {"step": 24502, "train_loss": 3.270582675933838, "lr": 7.564388815391208e-05, "tps": 22968, "wall": 69914.7} {"step": 24503, "train_loss": 3.2209296226501465, "lr": 7.563244488231309e-05, "tps": 22967, "wall": 69920.6} {"step": 24504, "train_loss": 3.181222438812256, "lr": 7.562100324611755e-05, "tps": 22966, "wall": 69926.3} {"step": 24505, "train_loss": 3.0918869972229004, "lr": 7.560956324545515e-05, "tps": 22965, "wall": 69932.1} {"step": 24506, "train_loss": 3.290802001953125, "lr": 7.559812488045532e-05, "tps": 22964, "wall": 69938.0} {"step": 24507, "train_loss": 3.163959503173828, "lr": 7.558668815124784e-05, "tps": 22963, "wall": 69943.8} {"step": 24508, "train_loss": 3.224795341491699, "lr": 7.557525305796215e-05, "tps": 22962, "wall": 69949.8} {"step": 24509, "train_loss": 3.1965491771698, "lr": 7.556381960072778e-05, "tps": 22961, "wall": 69955.6} {"step": 24510, "train_loss": 3.28668212890625, "lr": 7.555238777967431e-05, "tps": 22960, "wall": 69961.4} {"step": 24511, "train_loss": 3.2373993396759033, "lr": 7.55409575949312e-05, "tps": 22959, "wall": 69967.3} {"step": 24512, "train_loss": 3.225980520248413, "lr": 7.552952904662789e-05, "tps": 22958, "wall": 69973.1} {"step": 24513, "train_loss": 3.2313523292541504, "lr": 7.551810213489396e-05, "tps": 22957, "wall": 69978.9} {"step": 24514, "train_loss": 3.103919744491577, "lr": 7.550667685985876e-05, "tps": 22956, "wall": 69984.6} {"step": 24515, "train_loss": 3.2175188064575195, "lr": 7.549525322165172e-05, "tps": 22955, "wall": 69990.4} {"step": 24516, "train_loss": 3.0989904403686523, "lr": 7.54838312204023e-05, "tps": 22954, "wall": 69996.3} {"step": 24517, "train_loss": 3.332700252532959, "lr": 7.547241085623984e-05, "tps": 22953, "wall": 70002.2} {"step": 24518, "train_loss": 3.3808577060699463, "lr": 7.546099212929372e-05, "tps": 22952, "wall": 70008.0} {"step": 24519, "train_loss": 3.3013644218444824, "lr": 7.544957503969333e-05, "tps": 22951, "wall": 70013.8} {"step": 24520, "train_loss": 3.284090042114258, "lr": 7.543815958756796e-05, "tps": 22950, "wall": 70019.5} {"step": 24521, "train_loss": 3.225386619567871, "lr": 7.542674577304692e-05, "tps": 22949, "wall": 70025.6} {"step": 24522, "train_loss": 3.4050445556640625, "lr": 7.541533359625954e-05, "tps": 22948, "wall": 70031.6} {"step": 24501, "train_loss": 3.185450315475464, "lr": 7.565533306078492e-05, "tps": 355791862, "wall": 4.5} {"step": 24502, "train_loss": 3.193821430206299, "lr": 7.564388815391208e-05, "tps": 189842011, "wall": 8.5} {"step": 24503, "train_loss": 3.1938741207122803, "lr": 7.563244488231309e-05, "tps": 128871558, "wall": 12.5} {"step": 24504, "train_loss": 3.2562623023986816, "lr": 7.562100324611755e-05, "tps": 96734715, "wall": 16.6} {"step": 24505, "train_loss": 3.1531827449798584, "lr": 7.560956324545515e-05, "tps": 77162361, "wall": 20.8} {"step": 24506, "train_loss": 3.166550636291504, "lr": 7.559812488045532e-05, "tps": 64001027, "wall": 25.1} {"step": 24507, "train_loss": 3.1804592609405518, "lr": 7.558668815124784e-05, "tps": 54477809, "wall": 29.5} {"step": 24508, "train_loss": 3.259772300720215, "lr": 7.557525305796215e-05, "tps": 47433760, "wall": 33.9} {"step": 24509, "train_loss": 3.24395751953125, "lr": 7.556381960072778e-05, "tps": 42002810, "wall": 38.2} {"step": 24510, "train_loss": 3.260739326477051, "lr": 7.555238777967431e-05, "tps": 37654818, "wall": 42.7} {"step": 24511, "train_loss": 3.1657657623291016, "lr": 7.55409575949312e-05, "tps": 34109540, "wall": 47.1} {"step": 24512, "train_loss": 3.245985507965088, "lr": 7.552952904662789e-05, "tps": 31169501, "wall": 51.5} {"step": 24513, "train_loss": 3.1175971031188965, "lr": 7.551810213489396e-05, "tps": 28682836, "wall": 56.0} {"step": 24514, "train_loss": 3.168748378753662, "lr": 7.550667685985876e-05, "tps": 26491083, "wall": 60.6} {"step": 24515, "train_loss": 3.335998058319092, "lr": 7.549525322165172e-05, "tps": 24564202, "wall": 65.4} {"step": 24516, "train_loss": 3.241814136505127, "lr": 7.54838312204023e-05, "tps": 22952689, "wall": 70.0} {"step": 24517, "train_loss": 3.1676993370056152, "lr": 7.547241085623984e-05, "tps": 21488759, "wall": 74.8} {"step": 24518, "train_loss": 3.264084577560425, "lr": 7.546099212929372e-05, "tps": 20239413, "wall": 79.4} {"step": 24519, "train_loss": 3.2396113872528076, "lr": 7.544957503969333e-05, "tps": 19091356, "wall": 84.2} {"step": 24520, "train_loss": 3.206808567047119, "lr": 7.543815958756796e-05, "tps": 18003181, "wall": 89.3} {"step": 24521, "train_loss": 3.3113043308258057, "lr": 7.542674577304692e-05, "tps": 17061982, "wall": 94.2} {"step": 24522, "train_loss": 3.278738260269165, "lr": 7.541533359625954e-05, "tps": 16212667, "wall": 99.1} {"step": 24523, "train_loss": 3.1991353034973145, "lr": 7.540392305733506e-05, "tps": 15442500, "wall": 104.1} {"step": 24524, "train_loss": 3.168069839477539, "lr": 7.539251415640281e-05, "tps": 14748053, "wall": 109.0} {"step": 24525, "train_loss": 3.1824588775634766, "lr": 7.538110689359196e-05, "tps": 14117282, "wall": 113.9} {"step": 24526, "train_loss": 3.081674337387085, "lr": 7.536970126903174e-05, "tps": 13533856, "wall": 118.8} {"step": 24527, "train_loss": 3.1918528079986572, "lr": 7.535829728285139e-05, "tps": 13006550, "wall": 123.6} {"step": 24528, "train_loss": 3.299881935119629, "lr": 7.534689493518007e-05, "tps": 12519977, "wall": 128.4} {"step": 24529, "train_loss": 3.2004425525665283, "lr": 7.53354942261469e-05, "tps": 12071150, "wall": 133.2} {"step": 24530, "train_loss": 3.227559804916382, "lr": 7.532409515588121e-05, "tps": 11650318, "wall": 138.0} {"step": 24531, "train_loss": 3.176530599594116, "lr": 7.531269772451189e-05, "tps": 11257701, "wall": 142.8} {"step": 24532, "train_loss": 3.2499332427978516, "lr": 7.530130193216815e-05, "tps": 10883620, "wall": 147.7} {"step": 24533, "train_loss": 3.235560894012451, "lr": 7.528990777897916e-05, "tps": 10524486, "wall": 152.8} {"step": 24534, "train_loss": 3.090761661529541, "lr": 7.527851526507386e-05, "tps": 10200161, "wall": 157.6} {"step": 24535, "train_loss": 3.2578301429748535, "lr": 7.52671243905814e-05, "tps": 9876439, "wall": 162.8} {"step": 24536, "train_loss": 3.2027487754821777, "lr": 7.525573515563079e-05, "tps": 9582247, "wall": 167.8} {"step": 24537, "train_loss": 3.257199287414551, "lr": 7.524434756035098e-05, "tps": 9301677, "wall": 172.9} {"step": 24538, "train_loss": 3.199057102203369, "lr": 7.52329616048711e-05, "tps": 9040632, "wall": 177.9} {"step": 24539, "train_loss": 3.1475672721862793, "lr": 7.522157728932007e-05, "tps": 8789117, "wall": 183.0} {"step": 24540, "train_loss": 3.1821048259735107, "lr": 7.521019461382677e-05, "tps": 8553355, "wall": 188.0} {"step": 24541, "train_loss": 3.1688075065612793, "lr": 7.519881357852028e-05, "tps": 8326303, "wall": 193.2} {"step": 24542, "train_loss": 3.2663044929504395, "lr": 7.518743418352946e-05, "tps": 8114749, "wall": 198.2} {"step": 24543, "train_loss": 3.0927538871765137, "lr": 7.517605642898318e-05, "tps": 7911611, "wall": 203.3} {"step": 24544, "train_loss": 3.282414674758911, "lr": 7.516468031501041e-05, "tps": 7714979, "wall": 208.5} {"step": 24545, "train_loss": 3.1230149269104004, "lr": 7.515330584173999e-05, "tps": 7531146, "wall": 213.6} {"step": 24546, "train_loss": 3.2888011932373047, "lr": 7.514193300930068e-05, "tps": 7354726, "wall": 218.7} {"step": 24547, "train_loss": 3.07327938079834, "lr": 7.513056181782145e-05, "tps": 7184593, "wall": 223.9} {"step": 24548, "train_loss": 3.2493951320648193, "lr": 7.511919226743103e-05, "tps": 7019138, "wall": 229.2} {"step": 24549, "train_loss": 3.3027281761169434, "lr": 7.510782435825823e-05, "tps": 6860084, "wall": 234.5} {"step": 24550, "train_loss": 3.2198574542999268, "lr": 7.509645809043188e-05, "tps": 6706985, "wall": 239.9} {"step": 24551, "train_loss": 3.1246211528778076, "lr": 7.508509346408064e-05, "tps": 6561323, "wall": 245.2} {"step": 24552, "train_loss": 3.2359933853149414, "lr": 7.507373047933334e-05, "tps": 6423094, "wall": 250.5} {"step": 24553, "train_loss": 3.262119770050049, "lr": 7.506236913631866e-05, "tps": 6290406, "wall": 255.8} {"step": 24554, "train_loss": 3.2162842750549316, "lr": 7.505100943516527e-05, "tps": 6163903, "wall": 261.1} {"step": 24555, "train_loss": 3.176410675048828, "lr": 7.503965137600191e-05, "tps": 6041715, "wall": 266.4} {"step": 24556, "train_loss": 3.1423044204711914, "lr": 7.502829495895724e-05, "tps": 5920294, "wall": 271.8} {"step": 24557, "train_loss": 3.241469383239746, "lr": 7.501694018415986e-05, "tps": 5805727, "wall": 277.2} {"step": 24558, "train_loss": 3.2344744205474854, "lr": 7.500558705173843e-05, "tps": 5698500, "wall": 282.4} {"step": 24559, "train_loss": 3.223851203918457, "lr": 7.499423556182158e-05, "tps": 5596276, "wall": 287.6} {"step": 24560, "train_loss": 3.334667205810547, "lr": 7.498288571453783e-05, "tps": 5497165, "wall": 292.8} {"step": 24561, "train_loss": 3.246901035308838, "lr": 7.497153751001581e-05, "tps": 5401985, "wall": 298.0} {"step": 24562, "train_loss": 3.207103729248047, "lr": 7.496019094838409e-05, "tps": 5308154, "wall": 303.3} {"step": 24563, "train_loss": 3.2715258598327637, "lr": 7.494884602977113e-05, "tps": 5216582, "wall": 308.6} {"step": 24564, "train_loss": 3.1992669105529785, "lr": 7.493750275430552e-05, "tps": 5129739, "wall": 313.8} {"step": 24565, "train_loss": 3.207638740539551, "lr": 7.492616112211567e-05, "tps": 5045153, "wall": 319.1} {"step": 24566, "train_loss": 3.2854385375976562, "lr": 7.491482113333018e-05, "tps": 4963675, "wall": 324.4} {"step": 24567, "train_loss": 3.324796438217163, "lr": 7.490348278807744e-05, "tps": 4884695, "wall": 329.6} {"step": 24568, "train_loss": 3.1878576278686523, "lr": 7.489214608648585e-05, "tps": 4808612, "wall": 334.8} {"step": 24569, "train_loss": 3.1052322387695312, "lr": 7.488081102868392e-05, "tps": 4734453, "wall": 340.1} {"step": 24570, "train_loss": 3.3228795528411865, "lr": 7.486947761480004e-05, "tps": 4662379, "wall": 345.4} {"step": 24571, "train_loss": 3.229489326477051, "lr": 7.485814584496248e-05, "tps": 4592393, "wall": 350.7} {"step": 24572, "train_loss": 3.205789089202881, "lr": 7.484681571929977e-05, "tps": 4525017, "wall": 355.9} {"step": 24573, "train_loss": 3.2455716133117676, "lr": 7.483548723794018e-05, "tps": 4458006, "wall": 361.3} {"step": 24574, "train_loss": 3.1606040000915527, "lr": 7.4824160401012e-05, "tps": 4394090, "wall": 366.5} {"step": 24575, "train_loss": 3.2269985675811768, "lr": 7.481283520864363e-05, "tps": 4331622, "wall": 371.8} {"step": 24576, "train_loss": 3.267958879470825, "lr": 7.480151166096332e-05, "tps": 4270665, "wall": 377.1} {"step": 24577, "train_loss": 3.231421709060669, "lr": 7.479018975809928e-05, "tps": 4211896, "wall": 382.4} {"step": 24578, "train_loss": 3.2310001850128174, "lr": 7.477886950017989e-05, "tps": 4154718, "wall": 387.7} {"step": 24579, "train_loss": 3.3317008018493652, "lr": 7.47675508873333e-05, "tps": 4099021, "wall": 393.0} {"step": 24580, "train_loss": 3.163679599761963, "lr": 7.475623391968772e-05, "tps": 4044680, "wall": 398.3} {"step": 24581, "train_loss": 3.24202036857605, "lr": 7.474491859737143e-05, "tps": 3990993, "wall": 403.7} {"step": 24582, "train_loss": 3.199754238128662, "lr": 7.473360492051256e-05, "tps": 3939165, "wall": 409.0} {"step": 24583, "train_loss": 3.1860620975494385, "lr": 7.472229288923922e-05, "tps": 3888318, "wall": 414.4} {"step": 24584, "train_loss": 3.221496343612671, "lr": 7.471098250367965e-05, "tps": 3837816, "wall": 419.8} {"step": 24585, "train_loss": 3.274878740310669, "lr": 7.46996737639619e-05, "tps": 3789445, "wall": 425.2} {"step": 24586, "train_loss": 3.221616506576538, "lr": 7.468836667021413e-05, "tps": 3741924, "wall": 430.6} {"step": 24587, "train_loss": 3.2093911170959473, "lr": 7.46770612225644e-05, "tps": 3695508, "wall": 436.0} {"step": 24588, "train_loss": 3.2255029678344727, "lr": 7.466575742114074e-05, "tps": 3649989, "wall": 441.5} {"step": 24589, "train_loss": 3.232426404953003, "lr": 7.465445526607131e-05, "tps": 3605504, "wall": 447.0} {"step": 24590, "train_loss": 3.202281951904297, "lr": 7.464315475748407e-05, "tps": 3562226, "wall": 452.4} {"step": 24591, "train_loss": 3.138087749481201, "lr": 7.463185589550696e-05, "tps": 3519691, "wall": 457.9} {"step": 24592, "train_loss": 3.2732431888580322, "lr": 7.462055868026813e-05, "tps": 3478268, "wall": 463.4} {"step": 24593, "train_loss": 3.243720531463623, "lr": 7.460926311189546e-05, "tps": 3437501, "wall": 468.9} {"step": 24594, "train_loss": 3.2568774223327637, "lr": 7.459796919051691e-05, "tps": 3397584, "wall": 474.4} {"step": 24595, "train_loss": 3.165942668914795, "lr": 7.458667691626044e-05, "tps": 3358106, "wall": 480.0} {"step": 24596, "train_loss": 3.21529483795166, "lr": 7.457538628925396e-05, "tps": 3320054, "wall": 485.5} {"step": 24597, "train_loss": 3.209843158721924, "lr": 7.456409730962535e-05, "tps": 3282689, "wall": 491.1} {"step": 24598, "train_loss": 3.2593960762023926, "lr": 7.455280997750254e-05, "tps": 3245876, "wall": 496.7} {"step": 24599, "train_loss": 3.287139415740967, "lr": 7.454152429301336e-05, "tps": 3210173, "wall": 502.2} {"step": 24600, "train_loss": 3.2098090648651123, "lr": 7.453024025628563e-05, "tps": 3175031, "wall": 507.8} {"step": 24601, "train_loss": 3.0939853191375732, "lr": 7.451895786744725e-05, "tps": 3140215, "wall": 513.4} {"step": 24602, "train_loss": 3.1409778594970703, "lr": 7.450767712662594e-05, "tps": 3106634, "wall": 519.0} {"step": 24603, "train_loss": 3.146536111831665, "lr": 7.449639803394958e-05, "tps": 3073805, "wall": 524.6} {"step": 24604, "train_loss": 3.125650405883789, "lr": 7.448512058954589e-05, "tps": 3041375, "wall": 530.2} {"step": 24605, "train_loss": 3.1742472648620605, "lr": 7.447384479354258e-05, "tps": 3009833, "wall": 535.8} {"step": 24606, "train_loss": 3.247964382171631, "lr": 7.44625706460675e-05, "tps": 2978345, "wall": 541.5} {"step": 24607, "train_loss": 3.1476283073425293, "lr": 7.445129814724827e-05, "tps": 2947907, "wall": 547.1} {"step": 24608, "train_loss": 3.285877227783203, "lr": 7.444002729721256e-05, "tps": 2917775, "wall": 552.7} {"step": 24609, "train_loss": 3.1754751205444336, "lr": 7.442875809608816e-05, "tps": 2888662, "wall": 558.3} {"step": 24610, "train_loss": 3.201909065246582, "lr": 7.441749054400266e-05, "tps": 2860081, "wall": 563.9} {"step": 24611, "train_loss": 3.178779125213623, "lr": 7.440622464108364e-05, "tps": 2831841, "wall": 569.6} {"step": 24612, "train_loss": 3.201484441757202, "lr": 7.439496038745886e-05, "tps": 2804391, "wall": 575.2} {"step": 24613, "train_loss": 3.2056379318237305, "lr": 7.438369778325581e-05, "tps": 2777353, "wall": 580.8} {"step": 24614, "train_loss": 3.177074432373047, "lr": 7.437243682860207e-05, "tps": 2750813, "wall": 586.4} {"step": 24615, "train_loss": 3.209016799926758, "lr": 7.436117752362532e-05, "tps": 2724871, "wall": 592.0} {"step": 24616, "train_loss": 3.2108922004699707, "lr": 7.434991986845299e-05, "tps": 2699279, "wall": 597.7} {"step": 24617, "train_loss": 3.2068405151367188, "lr": 7.433866386321262e-05, "tps": 2673817, "wall": 603.4} {"step": 24618, "train_loss": 3.141416072845459, "lr": 7.432740950803178e-05, "tps": 2649292, "wall": 609.0} {"step": 24619, "train_loss": 3.270657539367676, "lr": 7.431615680303795e-05, "tps": 2625236, "wall": 614.6} {"step": 24620, "train_loss": 3.27579927444458, "lr": 7.430490574835852e-05, "tps": 2601604, "wall": 620.2} {"step": 24621, "train_loss": 3.197000026702881, "lr": 7.429365634412105e-05, "tps": 2577970, "wall": 625.9} {"step": 24622, "train_loss": 3.2400879859924316, "lr": 7.428240859045287e-05, "tps": 2555417, "wall": 631.5} {"step": 24623, "train_loss": 3.2083683013916016, "lr": 7.42711624874815e-05, "tps": 2533069, "wall": 637.1} {"step": 24624, "train_loss": 3.1885032653808594, "lr": 7.425991803533427e-05, "tps": 2511109, "wall": 642.7} {"step": 24625, "train_loss": 3.204655647277832, "lr": 7.424867523413854e-05, "tps": 2489552, "wall": 648.3} {"step": 24626, "train_loss": 3.156902313232422, "lr": 7.423743408402175e-05, "tps": 2468327, "wall": 653.9} {"step": 24627, "train_loss": 3.2540817260742188, "lr": 7.422619458511117e-05, "tps": 2447144, "wall": 659.6} {"step": 24628, "train_loss": 3.2262089252471924, "lr": 7.421495673753413e-05, "tps": 2426748, "wall": 665.1} {"step": 24629, "train_loss": 3.190258741378784, "lr": 7.420372054141797e-05, "tps": 2406629, "wall": 670.7} {"step": 24630, "train_loss": 3.241919994354248, "lr": 7.419248599688997e-05, "tps": 2386762, "wall": 676.3} {"step": 24631, "train_loss": 3.196394920349121, "lr": 7.41812531040773e-05, "tps": 2367462, "wall": 681.9} {"step": 24632, "train_loss": 3.284879207611084, "lr": 7.417002186310737e-05, "tps": 2348305, "wall": 687.5} {"step": 24633, "train_loss": 3.104142665863037, "lr": 7.41587922741073e-05, "tps": 2329507, "wall": 693.0} {"step": 24634, "train_loss": 3.1190967559814453, "lr": 7.414756433720428e-05, "tps": 2311019, "wall": 698.6} {"step": 24635, "train_loss": 3.082883358001709, "lr": 7.413633805252558e-05, "tps": 2292927, "wall": 704.1} {"step": 24636, "train_loss": 3.342180013656616, "lr": 7.412511342019835e-05, "tps": 2275097, "wall": 709.7} {"step": 24637, "train_loss": 3.2396538257598877, "lr": 7.411389044034967e-05, "tps": 2257578, "wall": 715.2} {"step": 24638, "train_loss": 3.1213436126708984, "lr": 7.410266911310678e-05, "tps": 2239710, "wall": 721.0} {"step": 24639, "train_loss": 3.3255507946014404, "lr": 7.409144943859668e-05, "tps": 2222659, "wall": 726.5} {"step": 24640, "train_loss": 3.1131393909454346, "lr": 7.40802314169466e-05, "tps": 2205871, "wall": 732.1} {"step": 24641, "train_loss": 3.214545488357544, "lr": 7.406901504828357e-05, "tps": 2189346, "wall": 737.6} {"step": 24642, "train_loss": 3.192044973373413, "lr": 7.405780033273455e-05, "tps": 2173106, "wall": 743.2} {"step": 24643, "train_loss": 3.280402421951294, "lr": 7.404658727042674e-05, "tps": 2157097, "wall": 748.7} {"step": 24644, "train_loss": 3.32997989654541, "lr": 7.403537586148705e-05, "tps": 2141339, "wall": 754.3} {"step": 24645, "train_loss": 3.2258529663085938, "lr": 7.40241661060425e-05, "tps": 2125767, "wall": 759.8} {"step": 24646, "train_loss": 3.1388237476348877, "lr": 7.401295800422015e-05, "tps": 2110543, "wall": 765.3} {"step": 24647, "train_loss": 3.184955596923828, "lr": 7.400175155614688e-05, "tps": 2095474, "wall": 770.9} {"step": 24648, "train_loss": 3.219968795776367, "lr": 7.399054676194963e-05, "tps": 2080630, "wall": 776.4} {"step": 24649, "train_loss": 3.2312142848968506, "lr": 7.397934362175543e-05, "tps": 2065705, "wall": 782.0} {"step": 24650, "train_loss": 3.090564727783203, "lr": 7.396814213569112e-05, "tps": 2051209, "wall": 787.6} {"step": 24651, "train_loss": 3.182096004486084, "lr": 7.395694230388353e-05, "tps": 2036919, "wall": 793.2} {"step": 24652, "train_loss": 3.218327522277832, "lr": 7.394574412645965e-05, "tps": 2022804, "wall": 798.7} {"step": 24653, "train_loss": 3.2642264366149902, "lr": 7.393454760354628e-05, "tps": 2009011, "wall": 804.2} {"step": 24654, "train_loss": 3.219054937362671, "lr": 7.392335273527021e-05, "tps": 1995371, "wall": 809.8} {"step": 24655, "train_loss": 3.13952374458313, "lr": 7.391215952175837e-05, "tps": 1981863, "wall": 815.3} {"step": 24656, "train_loss": 3.2099311351776123, "lr": 7.390096796313744e-05, "tps": 1967658, "wall": 821.2} {"step": 24657, "train_loss": 3.1753015518188477, "lr": 7.388977805953428e-05, "tps": 1953139, "wall": 827.4} {"step": 24658, "train_loss": 3.261528968811035, "lr": 7.387858981107563e-05, "tps": 1938134, "wall": 833.8} {"step": 24659, "train_loss": 3.174105405807495, "lr": 7.386740321788816e-05, "tps": 1922208, "wall": 840.8} {"step": 24660, "train_loss": 3.2218031883239746, "lr": 7.38562182800987e-05, "tps": 1909082, "wall": 846.6} {"step": 24661, "train_loss": 3.3436543941497803, "lr": 7.38450349978339e-05, "tps": 1896249, "wall": 852.3} {"step": 24662, "train_loss": 3.1261463165283203, "lr": 7.383385337122042e-05, "tps": 1883399, "wall": 858.2} {"step": 24663, "train_loss": 3.221566677093506, "lr": 7.382267340038501e-05, "tps": 1871187, "wall": 863.8} {"step": 24664, "train_loss": 3.139713764190674, "lr": 7.381149508545424e-05, "tps": 1859150, "wall": 869.5} {"step": 24665, "train_loss": 3.188575506210327, "lr": 7.380031842655474e-05, "tps": 1847341, "wall": 875.0} {"step": 24666, "train_loss": 3.3351054191589355, "lr": 7.378914342381317e-05, "tps": 1835579, "wall": 880.7} {"step": 24667, "train_loss": 3.093672752380371, "lr": 7.37779700773561e-05, "tps": 1824169, "wall": 886.2} {"step": 24668, "train_loss": 3.0865635871887207, "lr": 7.376679838731005e-05, "tps": 1811907, "wall": 892.3} {"step": 24669, "train_loss": 3.138420820236206, "lr": 7.375562835380165e-05, "tps": 1800695, "wall": 897.9} {"step": 24670, "train_loss": 3.2288825511932373, "lr": 7.374445997695742e-05, "tps": 1789372, "wall": 903.6} {"step": 24671, "train_loss": 3.2398457527160645, "lr": 7.373329325690381e-05, "tps": 1778393, "wall": 909.2} {"step": 24672, "train_loss": 3.2751901149749756, "lr": 7.372212819376742e-05, "tps": 1765697, "wall": 915.8} {"step": 24673, "train_loss": 3.0962018966674805, "lr": 7.371096478767468e-05, "tps": 1754107, "wall": 921.9} {"step": 24674, "train_loss": 3.1953041553497314, "lr": 7.369980303875199e-05, "tps": 1742968, "wall": 927.8} {"step": 24675, "train_loss": 3.3291497230529785, "lr": 7.368864294712587e-05, "tps": 1732135, "wall": 933.6} {"step": 24501, "train_loss": 3.185450315475464, "lr": 7.565533306078492e-05, "tps": 354232844, "wall": 4.5} {"step": 24502, "train_loss": 3.193821430206299, "lr": 7.564388815391208e-05, "tps": 190148855, "wall": 8.4} {"step": 24503, "train_loss": 3.1938741207122803, "lr": 7.563244488231309e-05, "tps": 128773353, "wall": 12.5} {"step": 24504, "train_loss": 3.2562623023986816, "lr": 7.562100324611755e-05, "tps": 96108412, "wall": 16.7} {"step": 24505, "train_loss": 3.1531827449798584, "lr": 7.560956324545515e-05, "tps": 76589751, "wall": 21.0} {"step": 24506, "train_loss": 3.166550636291504, "lr": 7.559812488045532e-05, "tps": 63519517, "wall": 25.3} {"step": 24507, "train_loss": 3.1804592609405518, "lr": 7.558668815124784e-05, "tps": 54094404, "wall": 29.7} {"step": 24508, "train_loss": 3.259772300720215, "lr": 7.557525305796215e-05, "tps": 47144010, "wall": 34.1} {"step": 24509, "train_loss": 3.24395751953125, "lr": 7.556381960072778e-05, "tps": 41681613, "wall": 38.5} {"step": 24510, "train_loss": 3.260739326477051, "lr": 7.555238777967431e-05, "tps": 37375837, "wall": 43.0} {"step": 24511, "train_loss": 3.1657657623291016, "lr": 7.55409575949312e-05, "tps": 33802215, "wall": 47.5} {"step": 24512, "train_loss": 3.245985507965088, "lr": 7.552952904662789e-05, "tps": 30817524, "wall": 52.1} {"step": 24513, "train_loss": 3.1175971031188965, "lr": 7.551810213489396e-05, "tps": 28324038, "wall": 56.7} {"step": 24514, "train_loss": 3.168748378753662, "lr": 7.550667685985876e-05, "tps": 26209013, "wall": 61.3} {"step": 24515, "train_loss": 3.335998058319092, "lr": 7.549525322165172e-05, "tps": 24374926, "wall": 65.9} {"step": 24516, "train_loss": 3.241814136505127, "lr": 7.54838312204023e-05, "tps": 22773111, "wall": 70.6} {"step": 24517, "train_loss": 3.1676993370056152, "lr": 7.547241085623984e-05, "tps": 21353283, "wall": 75.2} {"step": 24518, "train_loss": 3.264084577560425, "lr": 7.546099212929372e-05, "tps": 20065353, "wall": 80.1} {"step": 24519, "train_loss": 3.2396113872528076, "lr": 7.544957503969333e-05, "tps": 18931374, "wall": 84.9} {"step": 24520, "train_loss": 3.206808567047119, "lr": 7.543815958756796e-05, "tps": 17903491, "wall": 89.8} {"step": 24521, "train_loss": 3.3113043308258057, "lr": 7.542674577304692e-05, "tps": 16978408, "wall": 94.7} {"step": 24522, "train_loss": 3.278738260269165, "lr": 7.541533359625954e-05, "tps": 16139176, "wall": 99.6} {"step": 24523, "train_loss": 3.1991353034973145, "lr": 7.540392305733506e-05, "tps": 15390378, "wall": 104.4} {"step": 24524, "train_loss": 3.168069839477539, "lr": 7.539251415640281e-05, "tps": 14711851, "wall": 109.3} {"step": 24525, "train_loss": 3.1824588775634766, "lr": 7.538110689359196e-05, "tps": 14092313, "wall": 114.1} {"step": 24526, "train_loss": 3.081674337387085, "lr": 7.536970126903174e-05, "tps": 13523321, "wall": 118.9} {"step": 24527, "train_loss": 3.1918528079986572, "lr": 7.535829728285139e-05, "tps": 12993825, "wall": 123.7} {"step": 24528, "train_loss": 3.299881935119629, "lr": 7.534689493518007e-05, "tps": 12507873, "wall": 128.5} {"step": 24529, "train_loss": 3.2004425525665283, "lr": 7.53354942261469e-05, "tps": 12054224, "wall": 133.4} {"step": 24530, "train_loss": 3.227559804916382, "lr": 7.532409515588121e-05, "tps": 11632394, "wall": 138.2} {"step": 24531, "train_loss": 3.176530599594116, "lr": 7.531269772451189e-05, "tps": 11238266, "wall": 143.1} {"step": 24532, "train_loss": 3.2499332427978516, "lr": 7.530130193216815e-05, "tps": 10867256, "wall": 147.9} {"step": 24533, "train_loss": 3.235560894012451, "lr": 7.528990777897916e-05, "tps": 10520053, "wall": 152.8} {"step": 24534, "train_loss": 3.090761661529541, "lr": 7.527851526507386e-05, "tps": 10190747, "wall": 157.8} {"step": 24535, "train_loss": 3.2578301429748535, "lr": 7.52671243905814e-05, "tps": 9884295, "wall": 162.7} {"step": 24536, "train_loss": 3.2027487754821777, "lr": 7.525573515563079e-05, "tps": 9595483, "wall": 167.6} {"step": 24537, "train_loss": 3.257199287414551, "lr": 7.524434756035098e-05, "tps": 9319975, "wall": 172.5} {"step": 24538, "train_loss": 3.199057102203369, "lr": 7.52329616048711e-05, "tps": 9059137, "wall": 177.5} {"step": 24539, "train_loss": 3.1475672721862793, "lr": 7.522157728932007e-05, "tps": 8811201, "wall": 182.5} {"step": 24540, "train_loss": 3.1821048259735107, "lr": 7.521019461382677e-05, "tps": 8575316, "wall": 187.6} {"step": 24541, "train_loss": 3.1688075065612793, "lr": 7.519881357852028e-05, "tps": 8350588, "wall": 192.6} {"step": 24542, "train_loss": 3.2663044929504395, "lr": 7.518743418352946e-05, "tps": 8139056, "wall": 197.6} {"step": 24543, "train_loss": 3.0927538871765137, "lr": 7.517605642898318e-05, "tps": 7936967, "wall": 202.7} {"step": 24544, "train_loss": 3.282414674758911, "lr": 7.516468031501041e-05, "tps": 7743952, "wall": 207.7} {"step": 24545, "train_loss": 3.1230149269104004, "lr": 7.515330584173999e-05, "tps": 7560868, "wall": 212.8} {"step": 24546, "train_loss": 3.2888011932373047, "lr": 7.514193300930068e-05, "tps": 7382392, "wall": 217.9} {"step": 24547, "train_loss": 3.07327938079834, "lr": 7.513056181782145e-05, "tps": 7213896, "wall": 223.0} {"step": 24548, "train_loss": 3.2493951320648193, "lr": 7.511919226743103e-05, "tps": 7039241, "wall": 228.6} {"step": 24549, "train_loss": 3.3027281761169434, "lr": 7.510782435825823e-05, "tps": 6871933, "wall": 234.1} {"step": 24550, "train_loss": 3.2198574542999268, "lr": 7.509645809043188e-05, "tps": 6716505, "wall": 239.6} {"step": 24551, "train_loss": 3.1246211528778076, "lr": 7.508509346408064e-05, "tps": 6570737, "wall": 244.9} {"step": 24552, "train_loss": 3.2359933853149414, "lr": 7.507373047933334e-05, "tps": 6430671, "wall": 250.2} {"step": 24553, "train_loss": 3.262119770050049, "lr": 7.506236913631866e-05, "tps": 6300065, "wall": 255.4} {"step": 24554, "train_loss": 3.2162842750549316, "lr": 7.505100943516527e-05, "tps": 6171980, "wall": 260.7} {"step": 24555, "train_loss": 3.176410675048828, "lr": 7.503965137600191e-05, "tps": 6050965, "wall": 266.0} {"step": 24556, "train_loss": 3.1423044204711914, "lr": 7.502829495895724e-05, "tps": 5933666, "wall": 271.2} {"step": 24557, "train_loss": 3.241469383239746, "lr": 7.501694018415986e-05, "tps": 5820507, "wall": 276.5} {"step": 24558, "train_loss": 3.2344744205474854, "lr": 7.500558705173843e-05, "tps": 5712581, "wall": 281.7} {"step": 24559, "train_loss": 3.223851203918457, "lr": 7.499423556182158e-05, "tps": 5607842, "wall": 287.0} {"step": 24560, "train_loss": 3.334667205810547, "lr": 7.498288571453783e-05, "tps": 5506148, "wall": 292.3} {"step": 24561, "train_loss": 3.246901035308838, "lr": 7.497153751001581e-05, "tps": 5408297, "wall": 297.6} {"step": 24562, "train_loss": 3.207103729248047, "lr": 7.496019094838409e-05, "tps": 5314320, "wall": 302.9} {"step": 24563, "train_loss": 3.2715258598327637, "lr": 7.494884602977113e-05, "tps": 5215375, "wall": 308.7} {"step": 24564, "train_loss": 3.1992669105529785, "lr": 7.493750275430552e-05, "tps": 5120184, "wall": 314.4} {"step": 24565, "train_loss": 3.207638740539551, "lr": 7.492616112211567e-05, "tps": 5037320, "wall": 319.6} {"step": 24566, "train_loss": 3.2854385375976562, "lr": 7.491482113333018e-05, "tps": 4955948, "wall": 324.9} {"step": 24567, "train_loss": 3.324796438217163, "lr": 7.490348278807744e-05, "tps": 4875894, "wall": 330.2} {"step": 24568, "train_loss": 3.1878576278686523, "lr": 7.489214608648585e-05, "tps": 4796047, "wall": 335.7} {"step": 24569, "train_loss": 3.1052322387695312, "lr": 7.488081102868392e-05, "tps": 4721543, "wall": 341.0} {"step": 24570, "train_loss": 3.3228795528411865, "lr": 7.486947761480004e-05, "tps": 4645912, "wall": 346.6} {"step": 24571, "train_loss": 3.229489326477051, "lr": 7.485814584496248e-05, "tps": 4573836, "wall": 352.1} {"step": 24572, "train_loss": 3.205789089202881, "lr": 7.484681571929977e-05, "tps": 4506354, "wall": 357.4} {"step": 24573, "train_loss": 3.2455716133117676, "lr": 7.483548723794018e-05, "tps": 4438658, "wall": 362.8} {"step": 24574, "train_loss": 3.1606040000915527, "lr": 7.4824160401012e-05, "tps": 4372016, "wall": 368.4} {"step": 24575, "train_loss": 3.2269985675811768, "lr": 7.481283520864363e-05, "tps": 4309769, "wall": 373.7} {"step": 24576, "train_loss": 3.267958879470825, "lr": 7.480151166096332e-05, "tps": 4242419, "wall": 379.7} {"step": 24577, "train_loss": 3.231421709060669, "lr": 7.479018975809928e-05, "tps": 4184232, "wall": 385.0} {"step": 24578, "train_loss": 3.2310001850128174, "lr": 7.477886950017989e-05, "tps": 4127888, "wall": 390.2} {"step": 24579, "train_loss": 3.3317008018493652, "lr": 7.47675508873333e-05, "tps": 4071474, "wall": 395.6} {"step": 24580, "train_loss": 3.163679599761963, "lr": 7.475623391968772e-05, "tps": 4016561, "wall": 401.1} {"step": 24581, "train_loss": 3.24202036857605, "lr": 7.474491859737143e-05, "tps": 3962547, "wall": 406.6} {"step": 24582, "train_loss": 3.199754238128662, "lr": 7.473360492051256e-05, "tps": 3909668, "wall": 412.1} {"step": 24583, "train_loss": 3.1860620975494385, "lr": 7.472229288923922e-05, "tps": 3858117, "wall": 417.6} {"step": 24584, "train_loss": 3.221496343612671, "lr": 7.471098250367965e-05, "tps": 3806752, "wall": 423.2} {"step": 24585, "train_loss": 3.274878740310669, "lr": 7.46996737639619e-05, "tps": 3756114, "wall": 429.0} {"step": 24586, "train_loss": 3.221616506576538, "lr": 7.468836667021413e-05, "tps": 3709048, "wall": 434.4} {"step": 24587, "train_loss": 3.2093911170959473, "lr": 7.46770612225644e-05, "tps": 3663365, "wall": 439.9} {"step": 24588, "train_loss": 3.2255029678344727, "lr": 7.466575742114074e-05, "tps": 3617996, "wall": 445.4} {"step": 24589, "train_loss": 3.232426404953003, "lr": 7.465445526607131e-05, "tps": 3574050, "wall": 450.9} {"step": 24590, "train_loss": 3.202281951904297, "lr": 7.464315475748407e-05, "tps": 3527273, "wall": 456.9} {"step": 24591, "train_loss": 3.138087749481201, "lr": 7.463185589550696e-05, "tps": 3484350, "wall": 462.5} {"step": 24592, "train_loss": 3.2732431888580322, "lr": 7.462055868026813e-05, "tps": 3442630, "wall": 468.2} {"step": 24593, "train_loss": 3.243720531463623, "lr": 7.460926311189546e-05, "tps": 3402595, "wall": 473.7} {"step": 24594, "train_loss": 3.2568774223327637, "lr": 7.459796919051691e-05, "tps": 3361028, "wall": 479.6} {"step": 24595, "train_loss": 3.165942668914795, "lr": 7.458667691626044e-05, "tps": 3320463, "wall": 485.5} {"step": 24596, "train_loss": 3.21529483795166, "lr": 7.457538628925396e-05, "tps": 3281161, "wall": 491.3} {"step": 24597, "train_loss": 3.209843158721924, "lr": 7.456409730962535e-05, "tps": 3243611, "wall": 497.0} {"step": 24598, "train_loss": 3.2593960762023926, "lr": 7.455280997750254e-05, "tps": 3207354, "wall": 502.6} {"step": 24599, "train_loss": 3.287139415740967, "lr": 7.454152429301336e-05, "tps": 3172230, "wall": 508.2} {"step": 24600, "train_loss": 3.2098090648651123, "lr": 7.453024025628563e-05, "tps": 3137770, "wall": 513.8} {"step": 24601, "train_loss": 3.0939853191375732, "lr": 7.451895786744725e-05, "tps": 3099550, "wall": 520.2} {"step": 24602, "train_loss": 3.1409778594970703, "lr": 7.450767712662594e-05, "tps": 3063966, "wall": 526.2} {"step": 24603, "train_loss": 3.146536111831665, "lr": 7.449639803394958e-05, "tps": 3030903, "wall": 532.0} {"step": 24604, "train_loss": 3.125650405883789, "lr": 7.448512058954589e-05, "tps": 2997408, "wall": 538.0} {"step": 24605, "train_loss": 3.1742472648620605, "lr": 7.447384479354258e-05, "tps": 2960872, "wall": 544.6} {"step": 24606, "train_loss": 3.247964382171631, "lr": 7.44625706460675e-05, "tps": 2926668, "wall": 551.0} {"step": 24607, "train_loss": 3.1476283073425293, "lr": 7.445129814724827e-05, "tps": 2895871, "wall": 556.9} {"step": 24608, "train_loss": 3.285877227783203, "lr": 7.444002729721256e-05, "tps": 2865116, "wall": 562.9} {"step": 24609, "train_loss": 3.1754751205444336, "lr": 7.442875809608816e-05, "tps": 2834914, "wall": 568.9} {"step": 24610, "train_loss": 3.201909065246582, "lr": 7.441749054400266e-05, "tps": 2805092, "wall": 575.0} {"step": 24611, "train_loss": 3.178779125213623, "lr": 7.440622464108364e-05, "tps": 2775384, "wall": 581.2} {"step": 24612, "train_loss": 3.201484441757202, "lr": 7.439496038745886e-05, "tps": 2747577, "wall": 587.1} {"step": 24613, "train_loss": 3.2056379318237305, "lr": 7.438369778325581e-05, "tps": 2719998, "wall": 593.1} {"step": 24614, "train_loss": 3.177074432373047, "lr": 7.437243682860207e-05, "tps": 2693109, "wall": 599.0} {"step": 24615, "train_loss": 3.209016799926758, "lr": 7.436117752362532e-05, "tps": 2666022, "wall": 605.1} {"step": 24616, "train_loss": 3.2108922004699707, "lr": 7.434991986845299e-05, "tps": 2639058, "wall": 611.3} {"step": 24617, "train_loss": 3.2068405151367188, "lr": 7.433866386321262e-05, "tps": 2613626, "wall": 617.3} {"step": 24618, "train_loss": 3.141416072845459, "lr": 7.432740950803178e-05, "tps": 2589416, "wall": 623.1} {"step": 24619, "train_loss": 3.270657539367676, "lr": 7.431615680303795e-05, "tps": 2565740, "wall": 628.9} {"step": 24620, "train_loss": 3.27579927444458, "lr": 7.430490574835852e-05, "tps": 2542723, "wall": 634.6} {"step": 24621, "train_loss": 3.197000026702881, "lr": 7.429365634412105e-05, "tps": 2519285, "wall": 640.5} {"step": 24622, "train_loss": 3.2400879859924316, "lr": 7.428240859045287e-05, "tps": 2497390, "wall": 646.2} {"step": 24623, "train_loss": 3.2083683013916016, "lr": 7.42711624874815e-05, "tps": 2476289, "wall": 651.7} {"step": 24624, "train_loss": 3.1885032653808594, "lr": 7.425991803533427e-05, "tps": 2455567, "wall": 657.2} {"step": 24625, "train_loss": 3.204655647277832, "lr": 7.424867523413854e-05, "tps": 2434402, "wall": 663.0} {"step": 24626, "train_loss": 3.156902313232422, "lr": 7.423743408402175e-05, "tps": 2413922, "wall": 668.6} {"step": 24627, "train_loss": 3.2540817260742188, "lr": 7.422619458511117e-05, "tps": 2394163, "wall": 674.1} {"step": 24628, "train_loss": 3.2262089252471924, "lr": 7.421495673753413e-05, "tps": 2375011, "wall": 679.6} {"step": 24629, "train_loss": 3.190258741378784, "lr": 7.420372054141797e-05, "tps": 2356529, "wall": 685.0} {"step": 24630, "train_loss": 3.241919994354248, "lr": 7.419248599688997e-05, "tps": 2338536, "wall": 690.3} {"step": 24631, "train_loss": 3.196394920349121, "lr": 7.41812531040773e-05, "tps": 2320388, "wall": 695.7} {"step": 24632, "train_loss": 3.284879207611084, "lr": 7.417002186310737e-05, "tps": 2302894, "wall": 701.0} {"step": 24633, "train_loss": 3.104142665863037, "lr": 7.41587922741073e-05, "tps": 2285984, "wall": 706.2} {"step": 24634, "train_loss": 3.1190967559814453, "lr": 7.414756433720428e-05, "tps": 2269469, "wall": 711.4} {"step": 24635, "train_loss": 3.082883358001709, "lr": 7.413633805252558e-05, "tps": 2253550, "wall": 716.4} {"step": 24636, "train_loss": 3.342180013656616, "lr": 7.412511342019835e-05, "tps": 2237949, "wall": 721.5} {"step": 24637, "train_loss": 3.2396538257598877, "lr": 7.411389044034967e-05, "tps": 2222670, "wall": 726.5} {"step": 24638, "train_loss": 3.1213436126708984, "lr": 7.410266911310678e-05, "tps": 2207674, "wall": 731.4} {"step": 24639, "train_loss": 3.3255507946014404, "lr": 7.409144943859668e-05, "tps": 2192972, "wall": 736.4} {"step": 24640, "train_loss": 3.1131393909454346, "lr": 7.40802314169466e-05, "tps": 2178569, "wall": 741.3} {"step": 24641, "train_loss": 3.214545488357544, "lr": 7.406901504828357e-05, "tps": 2164454, "wall": 746.1} {"step": 24642, "train_loss": 3.192044973373413, "lr": 7.405780033273455e-05, "tps": 2150574, "wall": 751.0} {"step": 24643, "train_loss": 3.280402421951294, "lr": 7.404658727042674e-05, "tps": 2136423, "wall": 756.0} {"step": 24644, "train_loss": 3.32997989654541, "lr": 7.403537586148705e-05, "tps": 2122735, "wall": 760.9} {"step": 24645, "train_loss": 3.2258529663085938, "lr": 7.40241661060425e-05, "tps": 2109320, "wall": 765.7} {"step": 24646, "train_loss": 3.1388237476348877, "lr": 7.401295800422015e-05, "tps": 2096355, "wall": 770.5} {"step": 24647, "train_loss": 3.184955596923828, "lr": 7.400175155614688e-05, "tps": 2083654, "wall": 775.2} {"step": 24648, "train_loss": 3.219968795776367, "lr": 7.399054676194963e-05, "tps": 2071643, "wall": 779.8} {"step": 24649, "train_loss": 3.2312142848968506, "lr": 7.397934362175543e-05, "tps": 2059832, "wall": 784.3} {"step": 24650, "train_loss": 3.090564727783203, "lr": 7.396814213569112e-05, "tps": 2048303, "wall": 788.7} {"step": 24651, "train_loss": 3.182096004486084, "lr": 7.395694230388353e-05, "tps": 2036910, "wall": 793.2} {"step": 24652, "train_loss": 3.218327522277832, "lr": 7.394574412645965e-05, "tps": 2025705, "wall": 797.6} {"step": 24653, "train_loss": 3.2642264366149902, "lr": 7.393454760354628e-05, "tps": 2014597, "wall": 802.0} {"step": 24654, "train_loss": 3.219054937362671, "lr": 7.392335273527021e-05, "tps": 2003618, "wall": 806.4} {"step": 24655, "train_loss": 3.13952374458313, "lr": 7.391215952175837e-05, "tps": 1992701, "wall": 810.9} {"step": 24656, "train_loss": 3.2099311351776123, "lr": 7.390096796313744e-05, "tps": 1981448, "wall": 815.5} {"step": 24657, "train_loss": 3.1753015518188477, "lr": 7.388977805953428e-05, "tps": 1970362, "wall": 820.1} {"step": 24658, "train_loss": 3.261528968811035, "lr": 7.387858981107563e-05, "tps": 1959344, "wall": 824.8} {"step": 24659, "train_loss": 3.174105405807495, "lr": 7.386740321788816e-05, "tps": 1948491, "wall": 829.4} {"step": 24660, "train_loss": 3.2218031883239746, "lr": 7.38562182800987e-05, "tps": 1937920, "wall": 834.0} {"step": 24661, "train_loss": 3.3436543941497803, "lr": 7.38450349978339e-05, "tps": 1927390, "wall": 838.6} {"step": 24662, "train_loss": 3.1261463165283203, "lr": 7.383385337122042e-05, "tps": 1916893, "wall": 843.2} {"step": 24663, "train_loss": 3.221566677093506, "lr": 7.382267340038501e-05, "tps": 1906636, "wall": 847.8} {"step": 24664, "train_loss": 3.139713764190674, "lr": 7.381149508545424e-05, "tps": 1896454, "wall": 852.4} {"step": 24665, "train_loss": 3.188575506210327, "lr": 7.380031842655474e-05, "tps": 1886331, "wall": 857.0} {"step": 24666, "train_loss": 3.3351054191589355, "lr": 7.378914342381317e-05, "tps": 1876376, "wall": 861.5} {"step": 24667, "train_loss": 3.093672752380371, "lr": 7.37779700773561e-05, "tps": 1866575, "wall": 866.1} {"step": 24668, "train_loss": 3.0865635871887207, "lr": 7.376679838731005e-05, "tps": 1856951, "wall": 870.6} {"step": 24669, "train_loss": 3.138420820236206, "lr": 7.375562835380165e-05, "tps": 1847023, "wall": 875.3} {"step": 24670, "train_loss": 3.2288825511932373, "lr": 7.374445997695742e-05, "tps": 1837503, "wall": 879.9} {"step": 24671, "train_loss": 3.2398457527160645, "lr": 7.373329325690381e-05, "tps": 1828135, "wall": 884.5} {"step": 24672, "train_loss": 3.2751901149749756, "lr": 7.372212819376742e-05, "tps": 1818851, "wall": 889.0} {"step": 24673, "train_loss": 3.0962018966674805, "lr": 7.371096478767468e-05, "tps": 1809770, "wall": 893.5} {"step": 24674, "train_loss": 3.1953041553497314, "lr": 7.369980303875199e-05, "tps": 1800772, "wall": 898.0} {"step": 24675, "train_loss": 3.3291497230529785, "lr": 7.368864294712587e-05, "tps": 1791631, "wall": 902.6} {"step": 24676, "train_loss": 3.187481164932251, "lr": 7.367748451292271e-05, "tps": 1782582, "wall": 907.2} {"step": 24677, "train_loss": 3.210082530975342, "lr": 7.366632773626893e-05, "tps": 1773576, "wall": 911.9} {"step": 24678, "train_loss": 3.1817572116851807, "lr": 7.365517261729094e-05, "tps": 1764692, "wall": 916.5} {"step": 24679, "train_loss": 3.1871755123138428, "lr": 7.364401915611501e-05, "tps": 1755991, "wall": 921.1} {"step": 24680, "train_loss": 3.1256213188171387, "lr": 7.36328673528676e-05, "tps": 1747367, "wall": 925.7} {"step": 24681, "train_loss": 3.2882466316223145, "lr": 7.362171720767497e-05, "tps": 1738785, "wall": 930.3} {"step": 24682, "train_loss": 3.153158664703369, "lr": 7.361056872066341e-05, "tps": 1730339, "wall": 934.9} {"step": 24683, "train_loss": 3.2654454708099365, "lr": 7.35994218919593e-05, "tps": 1721921, "wall": 939.5} {"step": 24684, "train_loss": 3.2181649208068848, "lr": 7.358827672168886e-05, "tps": 1713646, "wall": 944.0} {"step": 24685, "train_loss": 3.247981071472168, "lr": 7.357713320997828e-05, "tps": 1705449, "wall": 948.6} {"step": 24686, "train_loss": 3.2936627864837646, "lr": 7.356599135695392e-05, "tps": 1697243, "wall": 953.2} {"step": 24687, "train_loss": 3.2357587814331055, "lr": 7.355485116274193e-05, "tps": 1689119, "wall": 957.9} {"step": 24688, "train_loss": 3.260479211807251, "lr": 7.354371262746847e-05, "tps": 1681153, "wall": 962.4} {"step": 24689, "train_loss": 3.204713821411133, "lr": 7.353257575125978e-05, "tps": 1673220, "wall": 967.0} {"step": 24690, "train_loss": 3.0929605960845947, "lr": 7.352144053424201e-05, "tps": 1665422, "wall": 971.6} {"step": 24691, "train_loss": 3.3200628757476807, "lr": 7.351030697654124e-05, "tps": 1657734, "wall": 976.2} {"step": 24692, "train_loss": 3.1296820640563965, "lr": 7.349917507828368e-05, "tps": 1650155, "wall": 980.7} {"step": 24693, "train_loss": 3.0918800830841064, "lr": 7.348804483959533e-05, "tps": 1642503, "wall": 985.3} {"step": 24694, "train_loss": 3.1791162490844727, "lr": 7.34769162606024e-05, "tps": 1635055, "wall": 989.8} {"step": 24695, "train_loss": 3.198514223098755, "lr": 7.346578934143087e-05, "tps": 1627704, "wall": 994.3} {"step": 24696, "train_loss": 3.2521378993988037, "lr": 7.345466408220679e-05, "tps": 1620339, "wall": 998.9} {"step": 24697, "train_loss": 3.1118812561035156, "lr": 7.344354048305621e-05, "tps": 1613101, "wall": 1003.4} {"step": 24698, "train_loss": 3.1865599155426025, "lr": 7.343241854410517e-05, "tps": 1605923, "wall": 1007.9} {"step": 24699, "train_loss": 3.275318145751953, "lr": 7.342129826547962e-05, "tps": 1598820, "wall": 1012.5} {"step": 24700, "train_loss": 3.2571616172790527, "lr": 7.341017964730551e-05, "tps": 1591769, "wall": 1017.0} {"step": 24701, "train_loss": 3.2730355262756348, "lr": 7.339906268970878e-05, "tps": 1584794, "wall": 1021.5} {"step": 24702, "train_loss": 3.2271971702575684, "lr": 7.338794739281545e-05, "tps": 1577873, "wall": 1026.0} {"step": 24703, "train_loss": 3.2083983421325684, "lr": 7.337683375675137e-05, "tps": 1570982, "wall": 1030.6} {"step": 24704, "train_loss": 3.1263272762298584, "lr": 7.336572178164242e-05, "tps": 1564181, "wall": 1035.1} {"step": 24705, "train_loss": 3.1563456058502197, "lr": 7.335461146761453e-05, "tps": 1557457, "wall": 1039.6} {"step": 24706, "train_loss": 3.2242465019226074, "lr": 7.334350281479356e-05, "tps": 1550648, "wall": 1044.2} {"step": 24707, "train_loss": 3.179110288619995, "lr": 7.333239582330527e-05, "tps": 1543870, "wall": 1048.8} {"step": 24708, "train_loss": 3.1116294860839844, "lr": 7.332129049327556e-05, "tps": 1537170, "wall": 1053.4} {"step": 24709, "train_loss": 3.2113423347473145, "lr": 7.331018682483022e-05, "tps": 1530599, "wall": 1058.0} {"step": 24710, "train_loss": 3.1166017055511475, "lr": 7.329908481809498e-05, "tps": 1524073, "wall": 1062.6} {"step": 24711, "train_loss": 3.157332181930542, "lr": 7.328798447319569e-05, "tps": 1517654, "wall": 1067.1} {"step": 24712, "train_loss": 3.1401870250701904, "lr": 7.327688579025805e-05, "tps": 1511260, "wall": 1071.7} {"step": 24713, "train_loss": 3.208542823791504, "lr": 7.326578876940772e-05, "tps": 1504778, "wall": 1076.3} {"step": 24714, "train_loss": 3.2025952339172363, "lr": 7.325469341077053e-05, "tps": 1498483, "wall": 1080.9} {"step": 24715, "train_loss": 3.2712273597717285, "lr": 7.324359971447212e-05, "tps": 1492318, "wall": 1085.4} {"step": 24716, "train_loss": 3.220973253250122, "lr": 7.32325076806381e-05, "tps": 1486167, "wall": 1090.0} {"step": 24717, "train_loss": 3.1675543785095215, "lr": 7.322141730939423e-05, "tps": 1480084, "wall": 1094.5} {"step": 24718, "train_loss": 3.1617612838745117, "lr": 7.321032860086603e-05, "tps": 1474048, "wall": 1099.0} {"step": 24719, "train_loss": 3.1626553535461426, "lr": 7.319924155517918e-05, "tps": 1468068, "wall": 1103.5} {"step": 24720, "train_loss": 3.2636311054229736, "lr": 7.318815617245933e-05, "tps": 1462142, "wall": 1108.0} {"step": 24721, "train_loss": 3.2147374153137207, "lr": 7.31770724528319e-05, "tps": 1456256, "wall": 1112.6} {"step": 24722, "train_loss": 3.279780864715576, "lr": 7.316599039642258e-05, "tps": 1450281, "wall": 1117.2} {"step": 24723, "train_loss": 3.213609218597412, "lr": 7.315491000335687e-05, "tps": 1444478, "wall": 1121.7} {"step": 24724, "train_loss": 3.235246181488037, "lr": 7.314383127376025e-05, "tps": 1438625, "wall": 1126.3} {"step": 24725, "train_loss": 3.2876386642456055, "lr": 7.31327542077583e-05, "tps": 1432790, "wall": 1131.0} {"step": 24726, "train_loss": 3.1841187477111816, "lr": 7.312167880547645e-05, "tps": 1426954, "wall": 1135.6} {"step": 24727, "train_loss": 3.095607042312622, "lr": 7.311060506704016e-05, "tps": 1421150, "wall": 1140.3} {"step": 24728, "train_loss": 3.2295005321502686, "lr": 7.309953299257488e-05, "tps": 1415396, "wall": 1145.0} {"step": 24729, "train_loss": 3.2679479122161865, "lr": 7.308846258220604e-05, "tps": 1409705, "wall": 1149.7} {"step": 24730, "train_loss": 3.1229701042175293, "lr": 7.3077393836059e-05, "tps": 1404118, "wall": 1154.3} {"step": 24731, "train_loss": 3.1673049926757812, "lr": 7.306632675425924e-05, "tps": 1398571, "wall": 1158.9} {"step": 24732, "train_loss": 3.1245853900909424, "lr": 7.305526133693207e-05, "tps": 1393152, "wall": 1163.5} {"step": 24733, "train_loss": 3.1973695755004883, "lr": 7.304419758420284e-05, "tps": 1387763, "wall": 1168.0} {"step": 24734, "train_loss": 3.2826902866363525, "lr": 7.303313549619691e-05, "tps": 1382448, "wall": 1172.6} {"step": 24735, "train_loss": 3.1603214740753174, "lr": 7.302207507303952e-05, "tps": 1377087, "wall": 1177.2} {"step": 24736, "train_loss": 3.176093578338623, "lr": 7.301101631485608e-05, "tps": 1371815, "wall": 1181.8} {"step": 24737, "train_loss": 3.2362680435180664, "lr": 7.299995922177178e-05, "tps": 1366594, "wall": 1186.3} {"step": 24738, "train_loss": 3.2629318237304688, "lr": 7.298890379391183e-05, "tps": 1361397, "wall": 1190.9} {"step": 24739, "train_loss": 3.1664886474609375, "lr": 7.297785003140163e-05, "tps": 1356241, "wall": 1195.5} {"step": 24740, "train_loss": 3.240872859954834, "lr": 7.296679793436626e-05, "tps": 1351104, "wall": 1200.1} {"step": 24741, "train_loss": 3.156827211380005, "lr": 7.295574750293093e-05, "tps": 1346030, "wall": 1204.6} {"step": 24742, "train_loss": 3.197725772857666, "lr": 7.294469873722089e-05, "tps": 1340895, "wall": 1209.3} {"step": 24743, "train_loss": 3.2180638313293457, "lr": 7.293365163736126e-05, "tps": 1335766, "wall": 1214.0} {"step": 24744, "train_loss": 3.1814682483673096, "lr": 7.292260620347711e-05, "tps": 1330683, "wall": 1218.7} {"step": 24745, "train_loss": 3.240898609161377, "lr": 7.29115624356937e-05, "tps": 1325718, "wall": 1223.3} {"step": 24746, "train_loss": 3.202202796936035, "lr": 7.290052033413609e-05, "tps": 1320783, "wall": 1227.9} {"step": 24747, "train_loss": 3.2347359657287598, "lr": 7.288947989892926e-05, "tps": 1315914, "wall": 1232.5} {"step": 24748, "train_loss": 3.1451311111450195, "lr": 7.287844113019841e-05, "tps": 1310995, "wall": 1237.2} {"step": 24749, "train_loss": 3.2509751319885254, "lr": 7.286740402806855e-05, "tps": 1306187, "wall": 1241.8} {"step": 24750, "train_loss": 3.229499340057373, "lr": 7.285636859266465e-05, "tps": 1301412, "wall": 1246.4} {"step": 24751, "train_loss": 3.148139476776123, "lr": 7.284533482411182e-05, "tps": 1296692, "wall": 1251.0} {"step": 24752, "train_loss": 3.1165590286254883, "lr": 7.283430272253495e-05, "tps": 1292006, "wall": 1255.6} {"step": 24753, "train_loss": 3.1887176036834717, "lr": 7.28232722880591e-05, "tps": 1287333, "wall": 1260.2} {"step": 24754, "train_loss": 3.270979642868042, "lr": 7.281224352080917e-05, "tps": 1282718, "wall": 1264.8} {"step": 24755, "train_loss": 3.256019353866577, "lr": 7.280121642091009e-05, "tps": 1278144, "wall": 1269.3} {"step": 24756, "train_loss": 3.282592296600342, "lr": 7.279019098848681e-05, "tps": 1273585, "wall": 1273.9} {"step": 24757, "train_loss": 3.145899772644043, "lr": 7.277916722366424e-05, "tps": 1269093, "wall": 1278.5} {"step": 24758, "train_loss": 3.2227344512939453, "lr": 7.276814512656718e-05, "tps": 1264618, "wall": 1283.1} {"step": 24759, "train_loss": 3.2620534896850586, "lr": 7.275712469732057e-05, "tps": 1260196, "wall": 1287.6} {"step": 24760, "train_loss": 3.057191848754883, "lr": 7.274610593604922e-05, "tps": 1255785, "wall": 1292.2} {"step": 24761, "train_loss": 3.163567304611206, "lr": 7.273508884287788e-05, "tps": 1251355, "wall": 1296.8} {"step": 24762, "train_loss": 3.245208263397217, "lr": 7.272407341793149e-05, "tps": 1247019, "wall": 1301.4} {"step": 24763, "train_loss": 3.306959390640259, "lr": 7.271305966133478e-05, "tps": 1242718, "wall": 1306.0} {"step": 24764, "train_loss": 3.238319158554077, "lr": 7.270204757321241e-05, "tps": 1238430, "wall": 1310.5} {"step": 24765, "train_loss": 3.060866355895996, "lr": 7.26910371536893e-05, "tps": 1234173, "wall": 1315.1} {"step": 24766, "train_loss": 3.1197566986083984, "lr": 7.268002840289008e-05, "tps": 1229957, "wall": 1319.7} {"step": 24767, "train_loss": 3.1755285263061523, "lr": 7.266902132093942e-05, "tps": 1225754, "wall": 1324.2} {"step": 24768, "train_loss": 3.2542731761932373, "lr": 7.265801590796209e-05, "tps": 1221595, "wall": 1328.8} {"step": 24769, "train_loss": 3.185835123062134, "lr": 7.264701216408274e-05, "tps": 1217450, "wall": 1333.4} {"step": 24770, "train_loss": 3.234604597091675, "lr": 7.263601008942596e-05, "tps": 1213346, "wall": 1337.9} {"step": 24771, "train_loss": 3.1967482566833496, "lr": 7.262500968411647e-05, "tps": 1209277, "wall": 1342.5} {"step": 24772, "train_loss": 3.2289509773254395, "lr": 7.26140109482788e-05, "tps": 1205231, "wall": 1347.1} {"step": 24773, "train_loss": 3.162135362625122, "lr": 7.260301388203763e-05, "tps": 1201210, "wall": 1351.6} {"step": 24774, "train_loss": 3.319364070892334, "lr": 7.259201848551749e-05, "tps": 1197146, "wall": 1356.3} {"step": 24775, "train_loss": 3.1806468963623047, "lr": 7.258102475884291e-05, "tps": 1193164, "wall": 1360.9} {"step": 24776, "train_loss": 3.1991820335388184, "lr": 7.257003270213849e-05, "tps": 1189223, "wall": 1365.4} {"step": 24777, "train_loss": 3.2270448207855225, "lr": 7.255904231552872e-05, "tps": 1185274, "wall": 1370.0} {"step": 24778, "train_loss": 3.227660655975342, "lr": 7.254805359913805e-05, "tps": 1181370, "wall": 1374.6} {"step": 24779, "train_loss": 3.2387142181396484, "lr": 7.253706655309105e-05, "tps": 1177498, "wall": 1379.2} {"step": 24780, "train_loss": 3.276453971862793, "lr": 7.252608117751214e-05, "tps": 1173620, "wall": 1383.8} {"step": 24781, "train_loss": 3.168728828430176, "lr": 7.251509747252572e-05, "tps": 1169800, "wall": 1388.4} {"step": 24782, "train_loss": 3.1940653324127197, "lr": 7.25041154382563e-05, "tps": 1166006, "wall": 1392.9} {"step": 24783, "train_loss": 3.1540868282318115, "lr": 7.24931350748282e-05, "tps": 1162189, "wall": 1397.6} {"step": 24784, "train_loss": 3.2337934970855713, "lr": 7.248215638236585e-05, "tps": 1158165, "wall": 1402.5} {"step": 24785, "train_loss": 3.1923859119415283, "lr": 7.247117936099363e-05, "tps": 1154215, "wall": 1407.3} {"step": 24786, "train_loss": 3.2538723945617676, "lr": 7.246020401083589e-05, "tps": 1150326, "wall": 1412.2} {"step": 24787, "train_loss": 3.192284107208252, "lr": 7.24492303320169e-05, "tps": 1146438, "wall": 1417.0} {"step": 24788, "train_loss": 3.1964218616485596, "lr": 7.243825832466102e-05, "tps": 1142597, "wall": 1421.8} {"step": 24789, "train_loss": 3.136723518371582, "lr": 7.242728798889253e-05, "tps": 1138751, "wall": 1426.7} {"step": 24790, "train_loss": 3.2096946239471436, "lr": 7.241631932483573e-05, "tps": 1134920, "wall": 1431.6} {"step": 24791, "train_loss": 3.3099799156188965, "lr": 7.240535233261485e-05, "tps": 1131314, "wall": 1436.2} {"step": 24792, "train_loss": 3.179518222808838, "lr": 7.239438701235409e-05, "tps": 1127525, "wall": 1441.1} {"step": 24793, "train_loss": 3.2184505462646484, "lr": 7.238342336417771e-05, "tps": 1123805, "wall": 1445.9} {"step": 24794, "train_loss": 3.2198479175567627, "lr": 7.237246138820992e-05, "tps": 1120114, "wall": 1450.7} {"step": 24795, "train_loss": 3.184173107147217, "lr": 7.236150108457483e-05, "tps": 1116438, "wall": 1455.5} {"step": 24796, "train_loss": 3.202008008956909, "lr": 7.235054245339669e-05, "tps": 1112710, "wall": 1460.5} {"step": 24797, "train_loss": 3.227242946624756, "lr": 7.23395854947996e-05, "tps": 1108974, "wall": 1465.5} {"step": 24798, "train_loss": 3.2763047218322754, "lr": 7.23286302089076e-05, "tps": 1105362, "wall": 1470.3} {"step": 24799, "train_loss": 3.2940878868103027, "lr": 7.231767659584494e-05, "tps": 1101669, "wall": 1475.3} {"step": 24800, "train_loss": 3.108811616897583, "lr": 7.230672465573563e-05, "tps": 1098098, "wall": 1480.2} {"step": 24801, "train_loss": 3.274233102798462, "lr": 7.229577438870367e-05, "tps": 1094536, "wall": 1485.0} {"step": 24802, "train_loss": 3.202409267425537, "lr": 7.228482579487321e-05, "tps": 1091025, "wall": 1489.9} {"step": 24803, "train_loss": 3.1901299953460693, "lr": 7.227387887436825e-05, "tps": 1087547, "wall": 1494.7} {"step": 24804, "train_loss": 3.1571550369262695, "lr": 7.226293362731273e-05, "tps": 1084013, "wall": 1499.6} {"step": 24805, "train_loss": 3.1647467613220215, "lr": 7.225199005383074e-05, "tps": 1080605, "wall": 1504.4} {"step": 24806, "train_loss": 3.1582260131835938, "lr": 7.224104815404614e-05, "tps": 1077209, "wall": 1509.2} {"step": 24807, "train_loss": 3.163964033126831, "lr": 7.223010792808299e-05, "tps": 1073910, "wall": 1513.9} {"step": 24808, "train_loss": 3.190974712371826, "lr": 7.221916937606518e-05, "tps": 1070658, "wall": 1518.6} {"step": 24809, "train_loss": 3.1634457111358643, "lr": 7.220823249811657e-05, "tps": 1067403, "wall": 1523.3} {"step": 24810, "train_loss": 3.0906553268432617, "lr": 7.219729729436113e-05, "tps": 1064019, "wall": 1528.2} {"step": 24811, "train_loss": 3.215104818344116, "lr": 7.218636376492271e-05, "tps": 1060764, "wall": 1532.9} {"step": 24812, "train_loss": 3.2377023696899414, "lr": 7.217543190992514e-05, "tps": 1057594, "wall": 1537.6} {"step": 24813, "train_loss": 3.270608425140381, "lr": 7.216450172949227e-05, "tps": 1054424, "wall": 1542.3} {"step": 24814, "train_loss": 3.274721622467041, "lr": 7.215357322374797e-05, "tps": 1051267, "wall": 1547.0} {"step": 24815, "train_loss": 3.2341156005859375, "lr": 7.214264639281592e-05, "tps": 1048157, "wall": 1551.6} {"step": 24816, "train_loss": 3.1355299949645996, "lr": 7.213172123681999e-05, "tps": 1045061, "wall": 1556.3} {"step": 24817, "train_loss": 3.1868481636047363, "lr": 7.212079775588397e-05, "tps": 1041957, "wall": 1561.0} {"step": 24818, "train_loss": 3.152986526489258, "lr": 7.210987595013148e-05, "tps": 1038953, "wall": 1565.6} {"step": 24819, "train_loss": 3.186394214630127, "lr": 7.209895581968638e-05, "tps": 1035966, "wall": 1570.1} {"step": 24820, "train_loss": 3.1277287006378174, "lr": 7.208803736467229e-05, "tps": 1032959, "wall": 1574.8} {"step": 24821, "train_loss": 3.2660508155822754, "lr": 7.207712058521287e-05, "tps": 1030005, "wall": 1579.3} {"step": 24822, "train_loss": 3.2077670097351074, "lr": 7.20662054814319e-05, "tps": 1027064, "wall": 1583.9} {"step": 24823, "train_loss": 3.155423402786255, "lr": 7.205529205345294e-05, "tps": 1024115, "wall": 1588.6} {"step": 24824, "train_loss": 3.105280876159668, "lr": 7.204438030139957e-05, "tps": 1021149, "wall": 1593.2} {"step": 24825, "train_loss": 3.1748979091644287, "lr": 7.203347022539553e-05, "tps": 1018246, "wall": 1597.8} {"step": 24826, "train_loss": 3.2398691177368164, "lr": 7.202256182556431e-05, "tps": 1015363, "wall": 1602.4} {"step": 24827, "train_loss": 3.313699245452881, "lr": 7.201165510202953e-05, "tps": 1012477, "wall": 1607.1} {"step": 24828, "train_loss": 3.158224582672119, "lr": 7.200075005491476e-05, "tps": 1009621, "wall": 1611.7} {"step": 24829, "train_loss": 3.1419601440429688, "lr": 7.198984668434344e-05, "tps": 1006799, "wall": 1616.3} {"step": 24830, "train_loss": 3.1712028980255127, "lr": 7.197894499043919e-05, "tps": 1003977, "wall": 1620.9} {"step": 24831, "train_loss": 3.2782368659973145, "lr": 7.196804497332546e-05, "tps": 1001088, "wall": 1625.6} {"step": 24832, "train_loss": 3.1515979766845703, "lr": 7.195714663312569e-05, "tps": 998306, "wall": 1630.2} {"step": 24833, "train_loss": 3.170545816421509, "lr": 7.194624996996338e-05, "tps": 995520, "wall": 1634.8} {"step": 24834, "train_loss": 3.1364710330963135, "lr": 7.1935354983962e-05, "tps": 992617, "wall": 1639.7} {"step": 24835, "train_loss": 3.2967779636383057, "lr": 7.192446167524487e-05, "tps": 989858, "wall": 1644.3} {"step": 24836, "train_loss": 3.1899302005767822, "lr": 7.191357004393549e-05, "tps": 987130, "wall": 1648.9} {"step": 24837, "train_loss": 3.2468013763427734, "lr": 7.190268009015722e-05, "tps": 984415, "wall": 1653.6} {"step": 24838, "train_loss": 3.2349324226379395, "lr": 7.189179181403333e-05, "tps": 981670, "wall": 1658.2} {"step": 24839, "train_loss": 3.1656100749969482, "lr": 7.188090521568729e-05, "tps": 979010, "wall": 1662.8} {"step": 24840, "train_loss": 3.1574978828430176, "lr": 7.187002029524236e-05, "tps": 976337, "wall": 1667.4} {"step": 24841, "train_loss": 3.1831326484680176, "lr": 7.185913705282181e-05, "tps": 973677, "wall": 1672.1} {"step": 24842, "train_loss": 3.4516844749450684, "lr": 7.184825548854904e-05, "tps": 971024, "wall": 1676.7} {"step": 24843, "train_loss": 3.2043416500091553, "lr": 7.18373756025472e-05, "tps": 968417, "wall": 1681.3} {"step": 24844, "train_loss": 3.2065017223358154, "lr": 7.182649739493961e-05, "tps": 965831, "wall": 1685.8} {"step": 24845, "train_loss": 3.159101963043213, "lr": 7.181562086584947e-05, "tps": 963244, "wall": 1690.4} {"step": 24846, "train_loss": 3.200486183166504, "lr": 7.180474601539995e-05, "tps": 960650, "wall": 1695.1} {"step": 24847, "train_loss": 3.2537994384765625, "lr": 7.179387284371435e-05, "tps": 958016, "wall": 1699.8} {"step": 24848, "train_loss": 3.1548709869384766, "lr": 7.178300135091576e-05, "tps": 955425, "wall": 1704.5} {"step": 24849, "train_loss": 3.196462631225586, "lr": 7.177213153712729e-05, "tps": 952884, "wall": 1709.1} {"step": 24850, "train_loss": 3.136286735534668, "lr": 7.17612634024722e-05, "tps": 950362, "wall": 1713.7} {"step": 24851, "train_loss": 3.2715578079223633, "lr": 7.175039694707353e-05, "tps": 947812, "wall": 1718.4} {"step": 24852, "train_loss": 3.171609878540039, "lr": 7.173953217105435e-05, "tps": 945292, "wall": 1723.0} {"step": 24853, "train_loss": 3.2690606117248535, "lr": 7.172866907453779e-05, "tps": 942781, "wall": 1727.7} {"step": 24854, "train_loss": 3.238217353820801, "lr": 7.17178076576469e-05, "tps": 940111, "wall": 1732.7} {"step": 24855, "train_loss": 3.282026529312134, "lr": 7.170694792050467e-05, "tps": 937497, "wall": 1737.6} {"step": 24856, "train_loss": 3.133206367492676, "lr": 7.169608986323419e-05, "tps": 934909, "wall": 1742.4} {"step": 24857, "train_loss": 3.1933212280273438, "lr": 7.168523348595843e-05, "tps": 932350, "wall": 1747.3} {"step": 24858, "train_loss": 3.203010082244873, "lr": 7.167437878880034e-05, "tps": 929803, "wall": 1752.2} {"step": 24859, "train_loss": 3.183030128479004, "lr": 7.166352577188293e-05, "tps": 927238, "wall": 1757.1} {"step": 24860, "train_loss": 3.176881790161133, "lr": 7.165267443532912e-05, "tps": 924714, "wall": 1761.9} {"step": 24861, "train_loss": 3.1747608184814453, "lr": 7.164182477926184e-05, "tps": 922333, "wall": 1766.6} {"step": 24862, "train_loss": 3.2483291625976562, "lr": 7.163097680380401e-05, "tps": 919963, "wall": 1771.2} {"step": 24863, "train_loss": 3.123889923095703, "lr": 7.162013050907846e-05, "tps": 917565, "wall": 1775.9} {"step": 24864, "train_loss": 3.1522789001464844, "lr": 7.160928589520815e-05, "tps": 915262, "wall": 1780.4} {"step": 24865, "train_loss": 3.23217511177063, "lr": 7.159844296231586e-05, "tps": 912958, "wall": 1785.0} {"step": 24866, "train_loss": 3.138871431350708, "lr": 7.158760171052441e-05, "tps": 910673, "wall": 1789.5} {"step": 24867, "train_loss": 3.2998387813568115, "lr": 7.157676213995672e-05, "tps": 908412, "wall": 1794.1} {"step": 24868, "train_loss": 3.0337066650390625, "lr": 7.15659242507354e-05, "tps": 906121, "wall": 1798.7} {"step": 24869, "train_loss": 3.1366636753082275, "lr": 7.155508804298339e-05, "tps": 903856, "wall": 1803.3} {"step": 24870, "train_loss": 3.0686421394348145, "lr": 7.154425351682334e-05, "tps": 901587, "wall": 1807.9} {"step": 24871, "train_loss": 3.175468921661377, "lr": 7.153342067237798e-05, "tps": 899291, "wall": 1812.6} {"step": 24872, "train_loss": 3.0665059089660645, "lr": 7.152258950977011e-05, "tps": 897008, "wall": 1817.2} {"step": 24873, "train_loss": 3.2190542221069336, "lr": 7.151176002912241e-05, "tps": 894746, "wall": 1821.9} {"step": 24874, "train_loss": 3.0857291221618652, "lr": 7.150093223055745e-05, "tps": 892520, "wall": 1826.5} {"step": 24875, "train_loss": 3.1089563369750977, "lr": 7.1490106114198e-05, "tps": 890306, "wall": 1831.1} {"step": 24876, "train_loss": 3.2623839378356934, "lr": 7.147928168016668e-05, "tps": 888075, "wall": 1835.8} {"step": 24877, "train_loss": 3.2273612022399902, "lr": 7.146845892858605e-05, "tps": 885889, "wall": 1840.4} {"step": 24878, "train_loss": 3.2663044929504395, "lr": 7.14576378595788e-05, "tps": 883708, "wall": 1845.0} {"step": 24879, "train_loss": 3.2221035957336426, "lr": 7.144681847326744e-05, "tps": 881545, "wall": 1849.6} {"step": 24880, "train_loss": 3.291097640991211, "lr": 7.143600076977453e-05, "tps": 879401, "wall": 1854.2} {"step": 24881, "train_loss": 3.0930824279785156, "lr": 7.142518474922266e-05, "tps": 877260, "wall": 1858.8} {"step": 24882, "train_loss": 3.2005720138549805, "lr": 7.141437041173436e-05, "tps": 875134, "wall": 1863.4} {"step": 24883, "train_loss": 3.227388381958008, "lr": 7.140355775743206e-05, "tps": 873031, "wall": 1868.0} {"step": 24884, "train_loss": 3.230790615081787, "lr": 7.139274678643835e-05, "tps": 870938, "wall": 1872.5} {"step": 24885, "train_loss": 3.127694606781006, "lr": 7.138193749887558e-05, "tps": 868835, "wall": 1877.1} {"step": 24886, "train_loss": 3.202691078186035, "lr": 7.137112989486634e-05, "tps": 866733, "wall": 1881.8} {"step": 24887, "train_loss": 3.172161102294922, "lr": 7.136032397453296e-05, "tps": 864646, "wall": 1886.4} {"step": 24888, "train_loss": 3.1978628635406494, "lr": 7.134951973799782e-05, "tps": 862568, "wall": 1891.0} {"step": 24889, "train_loss": 3.1300251483917236, "lr": 7.133871718538341e-05, "tps": 860414, "wall": 1895.8} {"step": 24890, "train_loss": 3.2548580169677734, "lr": 7.132791631681206e-05, "tps": 858264, "wall": 1900.6} {"step": 24891, "train_loss": 3.2565500736236572, "lr": 7.131711713240608e-05, "tps": 856132, "wall": 1905.5} {"step": 24892, "train_loss": 3.230739116668701, "lr": 7.130631963228787e-05, "tps": 854017, "wall": 1910.3} {"step": 24893, "train_loss": 3.1389966011047363, "lr": 7.129552381657973e-05, "tps": 851918, "wall": 1915.0} {"step": 24894, "train_loss": 3.1918935775756836, "lr": 7.128472968540387e-05, "tps": 849815, "wall": 1919.9} {"step": 24895, "train_loss": 3.265993356704712, "lr": 7.127393723888272e-05, "tps": 847673, "wall": 1924.8} {"step": 24896, "train_loss": 3.171546459197998, "lr": 7.126314647713841e-05, "tps": 845648, "wall": 1929.5} {"step": 24897, "train_loss": 3.2333388328552246, "lr": 7.125235740029321e-05, "tps": 843677, "wall": 1934.1} {"step": 24898, "train_loss": 3.2166123390197754, "lr": 7.124157000846941e-05, "tps": 841716, "wall": 1938.6} {"step": 24899, "train_loss": 3.238189458847046, "lr": 7.123078430178912e-05, "tps": 839774, "wall": 1943.2} {"step": 24900, "train_loss": 3.1187524795532227, "lr": 7.122000028037452e-05, "tps": 837837, "wall": 1947.8} {"step": 24901, "train_loss": 3.1996583938598633, "lr": 7.120921794434785e-05, "tps": 835906, "wall": 1952.3} {"step": 24902, "train_loss": 3.204900026321411, "lr": 7.119843729383122e-05, "tps": 833971, "wall": 1957.0} {"step": 24903, "train_loss": 3.2486836910247803, "lr": 7.118765832894668e-05, "tps": 832051, "wall": 1961.5} {"step": 24904, "train_loss": 3.2829842567443848, "lr": 7.117688104981646e-05, "tps": 830155, "wall": 1966.1} {"step": 24905, "train_loss": 3.1874914169311523, "lr": 7.116610545656253e-05, "tps": 828258, "wall": 1970.7} {"step": 24906, "train_loss": 3.249786138534546, "lr": 7.115533154930704e-05, "tps": 826365, "wall": 1975.3} {"step": 24907, "train_loss": 3.149977207183838, "lr": 7.114455932817202e-05, "tps": 824482, "wall": 1979.9} {"step": 24908, "train_loss": 3.2469491958618164, "lr": 7.113378879327944e-05, "tps": 822600, "wall": 1984.5} {"step": 24909, "train_loss": 3.2542166709899902, "lr": 7.112301994475139e-05, "tps": 820669, "wall": 1989.2} {"step": 24910, "train_loss": 3.1802568435668945, "lr": 7.111225278270984e-05, "tps": 818807, "wall": 1993.8} {"step": 24911, "train_loss": 3.1788434982299805, "lr": 7.110148730727668e-05, "tps": 816954, "wall": 1998.4} {"step": 24912, "train_loss": 3.1023831367492676, "lr": 7.1090723518574e-05, "tps": 815112, "wall": 2003.0} {"step": 24913, "train_loss": 3.1610937118530273, "lr": 7.107996141672363e-05, "tps": 813273, "wall": 2007.6} {"step": 24914, "train_loss": 3.1803629398345947, "lr": 7.106920100184747e-05, "tps": 811347, "wall": 2012.5} {"step": 24915, "train_loss": 3.3051095008850098, "lr": 7.105844227406753e-05, "tps": 809435, "wall": 2017.3} {"step": 24916, "train_loss": 3.2416610717773438, "lr": 7.10476852335056e-05, "tps": 807568, "wall": 2022.1} {"step": 24917, "train_loss": 3.126884698867798, "lr": 7.10369298802835e-05, "tps": 805766, "wall": 2026.7} {"step": 24918, "train_loss": 3.1176021099090576, "lr": 7.102617621452316e-05, "tps": 803974, "wall": 2031.3} {"step": 24919, "train_loss": 3.229637861251831, "lr": 7.101542423634637e-05, "tps": 802196, "wall": 2035.9} {"step": 24920, "train_loss": 3.1481821537017822, "lr": 7.100467394587484e-05, "tps": 800412, "wall": 2040.5} {"step": 24921, "train_loss": 3.180246114730835, "lr": 7.099392534323051e-05, "tps": 798537, "wall": 2045.3} {"step": 24922, "train_loss": 3.211798906326294, "lr": 7.098317842853499e-05, "tps": 796648, "wall": 2050.3} {"step": 24923, "train_loss": 3.1916732788085938, "lr": 7.097243320191012e-05, "tps": 794803, "wall": 2055.1} {"step": 24924, "train_loss": 3.238586902618408, "lr": 7.09616896634776e-05, "tps": 792990, "wall": 2059.9} {"step": 24925, "train_loss": 3.0950870513916016, "lr": 7.095094781335909e-05, "tps": 791165, "wall": 2064.7} {"step": 24926, "train_loss": 3.200833559036255, "lr": 7.094020765167634e-05, "tps": 789325, "wall": 2069.6} {"step": 24927, "train_loss": 3.2980926036834717, "lr": 7.092946917855096e-05, "tps": 787530, "wall": 2074.4} {"step": 24928, "train_loss": 3.2544047832489014, "lr": 7.09187323941046e-05, "tps": 785803, "wall": 2079.1} {"step": 24929, "train_loss": 3.2423622608184814, "lr": 7.090799729845893e-05, "tps": 784102, "wall": 2083.7} {"step": 24930, "train_loss": 3.2424638271331787, "lr": 7.089726389173557e-05, "tps": 782416, "wall": 2088.2} {"step": 24931, "train_loss": 3.194634437561035, "lr": 7.088653217405599e-05, "tps": 780740, "wall": 2092.8} {"step": 24932, "train_loss": 3.173164129257202, "lr": 7.087580214554189e-05, "tps": 779056, "wall": 2097.4} {"step": 24933, "train_loss": 3.2379255294799805, "lr": 7.08650738063148e-05, "tps": 777385, "wall": 2102.0} {"step": 24934, "train_loss": 3.291997194290161, "lr": 7.085434715649615e-05, "tps": 775737, "wall": 2106.6} {"step": 24935, "train_loss": 3.2760181427001953, "lr": 7.084362219620757e-05, "tps": 774094, "wall": 2111.1} {"step": 24936, "train_loss": 3.2052555084228516, "lr": 7.08328989255705e-05, "tps": 772467, "wall": 2115.7} {"step": 24937, "train_loss": 3.26175594329834, "lr": 7.082217734470639e-05, "tps": 770852, "wall": 2120.2} {"step": 24938, "train_loss": 3.238722801208496, "lr": 7.081145745373677e-05, "tps": 769225, "wall": 2124.7} {"step": 24939, "train_loss": 3.1772565841674805, "lr": 7.080073925278297e-05, "tps": 767546, "wall": 2129.5} {"step": 24940, "train_loss": 3.1243202686309814, "lr": 7.079002274196653e-05, "tps": 765950, "wall": 2134.0} {"step": 24941, "train_loss": 3.227449655532837, "lr": 7.077930792140878e-05, "tps": 764343, "wall": 2138.6} {"step": 24942, "train_loss": 3.1129865646362305, "lr": 7.076859479123104e-05, "tps": 762740, "wall": 2143.1} {"step": 24943, "train_loss": 3.204252243041992, "lr": 7.07578833515548e-05, "tps": 761121, "wall": 2147.8} {"step": 24944, "train_loss": 3.2103004455566406, "lr": 7.074717360250134e-05, "tps": 759505, "wall": 2152.4} {"step": 24945, "train_loss": 3.158611297607422, "lr": 7.073646554419191e-05, "tps": 757929, "wall": 2157.0} {"step": 24946, "train_loss": 3.2082724571228027, "lr": 7.072575917674791e-05, "tps": 756335, "wall": 2161.6} {"step": 24947, "train_loss": 3.1993536949157715, "lr": 7.07150545002906e-05, "tps": 754768, "wall": 2166.2} {"step": 24948, "train_loss": 3.2751078605651855, "lr": 7.070435151494117e-05, "tps": 753183, "wall": 2170.9} {"step": 24949, "train_loss": 3.254756450653076, "lr": 7.069365022082097e-05, "tps": 751625, "wall": 2175.4} {"step": 24950, "train_loss": 3.169747829437256, "lr": 7.06829506180512e-05, "tps": 750052, "wall": 2180.1} {"step": 24951, "train_loss": 3.298973798751831, "lr": 7.067225270675297e-05, "tps": 748476, "wall": 2184.8} {"step": 24952, "train_loss": 3.2492244243621826, "lr": 7.06615564870476e-05, "tps": 746910, "wall": 2189.4} {"step": 24953, "train_loss": 3.221177577972412, "lr": 7.06508619590562e-05, "tps": 745368, "wall": 2194.1} {"step": 24954, "train_loss": 3.221524715423584, "lr": 7.064016912289986e-05, "tps": 743817, "wall": 2198.7} {"step": 24955, "train_loss": 3.3331379890441895, "lr": 7.062947797869984e-05, "tps": 742293, "wall": 2203.3} {"step": 24956, "train_loss": 3.217189073562622, "lr": 7.061878852657713e-05, "tps": 740775, "wall": 2207.9} {"step": 24957, "train_loss": 3.231973648071289, "lr": 7.060810076665283e-05, "tps": 739262, "wall": 2212.5} {"step": 24958, "train_loss": 3.1404032707214355, "lr": 7.05974146990481e-05, "tps": 737753, "wall": 2217.2} {"step": 24959, "train_loss": 3.1438441276550293, "lr": 7.058673032388389e-05, "tps": 736270, "wall": 2221.7} {"step": 24960, "train_loss": 3.137634754180908, "lr": 7.057604764128134e-05, "tps": 734790, "wall": 2226.3} {"step": 24961, "train_loss": 3.151707410812378, "lr": 7.05653666513614e-05, "tps": 733314, "wall": 2230.8} {"step": 24962, "train_loss": 3.1304078102111816, "lr": 7.055468735424502e-05, "tps": 731845, "wall": 2235.4} {"step": 24963, "train_loss": 3.16920804977417, "lr": 7.054400975005326e-05, "tps": 730388, "wall": 2240.0} {"step": 24964, "train_loss": 3.0956058502197266, "lr": 7.053333383890705e-05, "tps": 728923, "wall": 2244.6} {"step": 24965, "train_loss": 3.207771062850952, "lr": 7.05226596209273e-05, "tps": 727461, "wall": 2249.2} {"step": 24966, "train_loss": 3.214592695236206, "lr": 7.051198709623497e-05, "tps": 725998, "wall": 2253.8} {"step": 24967, "train_loss": 3.1599345207214355, "lr": 7.050131626495095e-05, "tps": 724523, "wall": 2258.5} {"step": 24968, "train_loss": 3.2395477294921875, "lr": 7.049064712719604e-05, "tps": 723071, "wall": 2263.1} {"step": 24969, "train_loss": 3.2143497467041016, "lr": 7.047997968309123e-05, "tps": 721623, "wall": 2267.7} {"step": 24970, "train_loss": 3.193390369415283, "lr": 7.04693139327573e-05, "tps": 720190, "wall": 2272.3} {"step": 24971, "train_loss": 3.1441049575805664, "lr": 7.045864987631503e-05, "tps": 718772, "wall": 2276.9} {"step": 24972, "train_loss": 3.2574403285980225, "lr": 7.044798751388529e-05, "tps": 717360, "wall": 2281.5} {"step": 24973, "train_loss": 3.183310031890869, "lr": 7.043732684558886e-05, "tps": 715955, "wall": 2286.0} {"step": 24974, "train_loss": 3.187309980392456, "lr": 7.042666787154642e-05, "tps": 714551, "wall": 2290.6} {"step": 24975, "train_loss": 3.16678786277771, "lr": 7.041601059187884e-05, "tps": 713156, "wall": 2295.2} {"step": 24976, "train_loss": 3.236499071121216, "lr": 7.040535500670673e-05, "tps": 711768, "wall": 2299.8} {"step": 24977, "train_loss": 3.235402822494507, "lr": 7.03947011161509e-05, "tps": 710368, "wall": 2304.4} {"step": 24978, "train_loss": 3.1513543128967285, "lr": 7.038404892033199e-05, "tps": 708982, "wall": 2309.0} {"step": 24979, "train_loss": 3.2329750061035156, "lr": 7.03733984193706e-05, "tps": 707587, "wall": 2313.6} {"step": 24980, "train_loss": 3.186243772506714, "lr": 7.036274961338752e-05, "tps": 706160, "wall": 2318.4} {"step": 24981, "train_loss": 3.1718592643737793, "lr": 7.035210250250329e-05, "tps": 704779, "wall": 2323.0} {"step": 24982, "train_loss": 3.124985694885254, "lr": 7.034145708683851e-05, "tps": 703432, "wall": 2327.6} {"step": 24983, "train_loss": 3.315580129623413, "lr": 7.033081336651384e-05, "tps": 702082, "wall": 2332.1} {"step": 24984, "train_loss": 3.185149669647217, "lr": 7.032017134164982e-05, "tps": 700741, "wall": 2336.7} {"step": 24985, "train_loss": 3.100069046020508, "lr": 7.030953101236695e-05, "tps": 699395, "wall": 2341.3} {"step": 24986, "train_loss": 3.1803057193756104, "lr": 7.029889237878584e-05, "tps": 698034, "wall": 2345.9} {"step": 24987, "train_loss": 3.2389683723449707, "lr": 7.028825544102698e-05, "tps": 696702, "wall": 2350.5} {"step": 24988, "train_loss": 3.2408690452575684, "lr": 7.027762019921083e-05, "tps": 695346, "wall": 2355.2} {"step": 24989, "train_loss": 3.2778470516204834, "lr": 7.026698665345792e-05, "tps": 693940, "wall": 2360.1} {"step": 24990, "train_loss": 3.1794514656066895, "lr": 7.02563548038887e-05, "tps": 692579, "wall": 2364.8} {"step": 24991, "train_loss": 3.2479910850524902, "lr": 7.024572465062355e-05, "tps": 691232, "wall": 2369.5} {"step": 24992, "train_loss": 3.1818790435791016, "lr": 7.023509619378298e-05, "tps": 689924, "wall": 2374.1} {"step": 24993, "train_loss": 3.189925193786621, "lr": 7.022446943348728e-05, "tps": 688619, "wall": 2378.7} {"step": 24994, "train_loss": 3.253302574157715, "lr": 7.021384436985697e-05, "tps": 687338, "wall": 2383.2} {"step": 24995, "train_loss": 3.1760873794555664, "lr": 7.020322100301232e-05, "tps": 686035, "wall": 2387.8} {"step": 24996, "train_loss": 3.219369411468506, "lr": 7.019259933307363e-05, "tps": 684731, "wall": 2392.5} {"step": 24997, "train_loss": 3.205409049987793, "lr": 7.018197936016133e-05, "tps": 683428, "wall": 2397.1} {"step": 24998, "train_loss": 3.143383502960205, "lr": 7.017136108439568e-05, "tps": 682145, "wall": 2401.7} {"step": 24999, "train_loss": 3.2185170650482178, "lr": 7.016074450589691e-05, "tps": 680869, "wall": 2406.3} {"step": 25000, "train_loss": 3.2065439224243164, "lr": 7.015012962478538e-05, "tps": 679603, "wall": 2410.9, "val_loss_monitor": 3.324721693626568, "val_loss_full": 3.3426666770592814} {"step": 25001, "train_loss": 3.271540641784668, "lr": 7.013951644118127e-05, "tps": 649209, "wall": 2523.9} {"step": 25002, "train_loss": 3.183959722518921, "lr": 7.012890495520478e-05, "tps": 648026, "wall": 2528.6} {"step": 25003, "train_loss": 3.08809757232666, "lr": 7.011829516697624e-05, "tps": 646846, "wall": 2533.3} {"step": 25004, "train_loss": 3.197537660598755, "lr": 7.010768707661572e-05, "tps": 645666, "wall": 2538.0} {"step": 25005, "train_loss": 3.2431626319885254, "lr": 7.009708068424342e-05, "tps": 644507, "wall": 2542.7} {"step": 25006, "train_loss": 3.1394174098968506, "lr": 7.008647598997953e-05, "tps": 643365, "wall": 2547.3} {"step": 25007, "train_loss": 3.1041324138641357, "lr": 7.007587299394415e-05, "tps": 642226, "wall": 2551.9} {"step": 25008, "train_loss": 3.0144665241241455, "lr": 7.006527169625734e-05, "tps": 641075, "wall": 2556.6} {"step": 25009, "train_loss": 3.2437007427215576, "lr": 7.00546720970393e-05, "tps": 639945, "wall": 2561.2} {"step": 25010, "train_loss": 3.221653938293457, "lr": 7.004407419641004e-05, "tps": 638817, "wall": 2565.9} {"step": 25011, "train_loss": 3.099876642227173, "lr": 7.003347799448958e-05, "tps": 637681, "wall": 2570.5} {"step": 25012, "train_loss": 3.1574392318725586, "lr": 7.002288349139806e-05, "tps": 636554, "wall": 2575.2} {"step": 25013, "train_loss": 3.3569531440734863, "lr": 7.001229068725535e-05, "tps": 635404, "wall": 2580.0} {"step": 25014, "train_loss": 3.1992578506469727, "lr": 7.000169958218157e-05, "tps": 634226, "wall": 2584.9} {"step": 25015, "train_loss": 3.2035369873046875, "lr": 6.999111017629668e-05, "tps": 633116, "wall": 2589.5} {"step": 25016, "train_loss": 3.3119258880615234, "lr": 6.998052246972053e-05, "tps": 632005, "wall": 2594.1} {"step": 25017, "train_loss": 3.201200485229492, "lr": 6.996993646257321e-05, "tps": 630903, "wall": 2598.8} {"step": 25018, "train_loss": 3.2227048873901367, "lr": 6.995935215497456e-05, "tps": 629817, "wall": 2603.4} {"step": 25019, "train_loss": 3.203657627105713, "lr": 6.994876954704443e-05, "tps": 628737, "wall": 2607.9} {"step": 25020, "train_loss": 3.142073154449463, "lr": 6.993818863890279e-05, "tps": 627657, "wall": 2612.5} {"step": 25021, "train_loss": 3.202502727508545, "lr": 6.99276094306695e-05, "tps": 626577, "wall": 2617.1} {"step": 25022, "train_loss": 3.1575400829315186, "lr": 6.991703192246431e-05, "tps": 625515, "wall": 2621.7} {"step": 25023, "train_loss": 3.2545223236083984, "lr": 6.990645611440713e-05, "tps": 624455, "wall": 2626.2} {"step": 25024, "train_loss": 3.212188720703125, "lr": 6.989588200661775e-05, "tps": 623400, "wall": 2630.8} {"step": 25025, "train_loss": 3.134885311126709, "lr": 6.98853095992159e-05, "tps": 622349, "wall": 2635.3} {"step": 25026, "train_loss": 3.117621421813965, "lr": 6.987473889232142e-05, "tps": 621304, "wall": 2639.9} {"step": 25027, "train_loss": 3.223362445831299, "lr": 6.986416988605403e-05, "tps": 620262, "wall": 2644.4} {"step": 25028, "train_loss": 3.099741220474243, "lr": 6.98536025805334e-05, "tps": 619225, "wall": 2649.0} {"step": 25029, "train_loss": 3.097355365753174, "lr": 6.984303697587931e-05, "tps": 618189, "wall": 2653.5} {"step": 25030, "train_loss": 3.231733798980713, "lr": 6.98324730722114e-05, "tps": 617158, "wall": 2658.0} {"step": 25031, "train_loss": 3.1691789627075195, "lr": 6.98219108696494e-05, "tps": 616129, "wall": 2662.6} {"step": 25032, "train_loss": 3.2054648399353027, "lr": 6.98113503683129e-05, "tps": 615104, "wall": 2667.1} {"step": 25033, "train_loss": 3.2583670616149902, "lr": 6.980079156832151e-05, "tps": 614085, "wall": 2671.7} {"step": 25034, "train_loss": 3.170362949371338, "lr": 6.979023446979492e-05, "tps": 613055, "wall": 2676.3} {"step": 25035, "train_loss": 3.241304636001587, "lr": 6.977967907285267e-05, "tps": 612047, "wall": 2680.8} {"step": 25036, "train_loss": 3.1987733840942383, "lr": 6.976912537761438e-05, "tps": 611038, "wall": 2685.3} {"step": 25037, "train_loss": 3.2543301582336426, "lr": 6.975857338419953e-05, "tps": 610033, "wall": 2689.8} {"step": 25038, "train_loss": 3.127523899078369, "lr": 6.974802309272768e-05, "tps": 609031, "wall": 2694.4} {"step": 25039, "train_loss": 3.2457003593444824, "lr": 6.973747450331838e-05, "tps": 608014, "wall": 2699.0} {"step": 25040, "train_loss": 3.2828245162963867, "lr": 6.972692761609108e-05, "tps": 607018, "wall": 2703.5} {"step": 25041, "train_loss": 3.1217684745788574, "lr": 6.971638243116522e-05, "tps": 606027, "wall": 2708.0} {"step": 25042, "train_loss": 3.14827299118042, "lr": 6.97058389486604e-05, "tps": 605038, "wall": 2712.6} {"step": 25043, "train_loss": 3.2480697631835938, "lr": 6.969529716869594e-05, "tps": 604050, "wall": 2717.1} {"step": 25044, "train_loss": 3.1673903465270996, "lr": 6.968475709139124e-05, "tps": 603067, "wall": 2721.7} {"step": 25045, "train_loss": 3.23048734664917, "lr": 6.96742187168658e-05, "tps": 602087, "wall": 2726.2} {"step": 25046, "train_loss": 3.2774384021759033, "lr": 6.966368204523894e-05, "tps": 601102, "wall": 2730.8} {"step": 25047, "train_loss": 3.2062344551086426, "lr": 6.965314707662997e-05, "tps": 600111, "wall": 2735.4} {"step": 25048, "train_loss": 3.1726183891296387, "lr": 6.964261381115834e-05, "tps": 599146, "wall": 2739.9} {"step": 25049, "train_loss": 3.095916986465454, "lr": 6.96320822489433e-05, "tps": 598175, "wall": 2744.5} {"step": 25050, "train_loss": 3.1379988193511963, "lr": 6.962155239010413e-05, "tps": 597206, "wall": 2749.0} {"step": 25051, "train_loss": 3.1541709899902344, "lr": 6.961102423476018e-05, "tps": 596245, "wall": 2753.6} {"step": 25052, "train_loss": 3.22591495513916, "lr": 6.960049778303071e-05, "tps": 595265, "wall": 2758.2} {"step": 25053, "train_loss": 3.18550705909729, "lr": 6.958997303503487e-05, "tps": 594291, "wall": 2762.9} {"step": 25054, "train_loss": 3.1435863971710205, "lr": 6.957944999089201e-05, "tps": 593317, "wall": 2767.5} {"step": 25055, "train_loss": 3.194512367248535, "lr": 6.956892865072122e-05, "tps": 592349, "wall": 2772.1} {"step": 25056, "train_loss": 3.2294750213623047, "lr": 6.955840901464182e-05, "tps": 591394, "wall": 2776.7} {"step": 25057, "train_loss": 3.102097511291504, "lr": 6.954789108277288e-05, "tps": 590445, "wall": 2781.3} {"step": 25058, "train_loss": 3.046973466873169, "lr": 6.953737485523352e-05, "tps": 589498, "wall": 2785.9} {"step": 25059, "train_loss": 3.204563856124878, "lr": 6.952686033214297e-05, "tps": 588555, "wall": 2790.4} {"step": 25060, "train_loss": 3.103830337524414, "lr": 6.951634751362029e-05, "tps": 587608, "wall": 2795.1} {"step": 25061, "train_loss": 3.207845449447632, "lr": 6.950583639978451e-05, "tps": 586667, "wall": 2799.7} {"step": 25062, "train_loss": 3.173957109451294, "lr": 6.949532699075481e-05, "tps": 585722, "wall": 2804.3} {"step": 25063, "train_loss": 3.13266921043396, "lr": 6.948481928665019e-05, "tps": 584779, "wall": 2808.9} {"step": 25064, "train_loss": 3.2405428886413574, "lr": 6.947431328758962e-05, "tps": 583852, "wall": 2813.5} {"step": 25065, "train_loss": 3.173891305923462, "lr": 6.946380899369224e-05, "tps": 582921, "wall": 2818.1} {"step": 25066, "train_loss": 3.086249828338623, "lr": 6.945330640507697e-05, "tps": 581996, "wall": 2822.7} {"step": 25067, "train_loss": 3.058445453643799, "lr": 6.944280552186273e-05, "tps": 581077, "wall": 2827.3} {"step": 25068, "train_loss": 3.2823922634124756, "lr": 6.94323063441686e-05, "tps": 580155, "wall": 2831.9} {"step": 25069, "train_loss": 3.1203932762145996, "lr": 6.942180887211341e-05, "tps": 579239, "wall": 2836.5} {"step": 25070, "train_loss": 3.2763214111328125, "lr": 6.941131310581611e-05, "tps": 578328, "wall": 2841.0} {"step": 25071, "train_loss": 3.0785999298095703, "lr": 6.940081904539564e-05, "tps": 577420, "wall": 2845.6} {"step": 25072, "train_loss": 3.1040782928466797, "lr": 6.939032669097077e-05, "tps": 576517, "wall": 2850.2} {"step": 25073, "train_loss": 3.0711495876312256, "lr": 6.937983604266049e-05, "tps": 575584, "wall": 2854.9} {"step": 25074, "train_loss": 3.275564193725586, "lr": 6.936934710058358e-05, "tps": 574676, "wall": 2859.5} {"step": 25075, "train_loss": 3.1974971294403076, "lr": 6.935885986485881e-05, "tps": 573718, "wall": 2864.4} {"step": 25076, "train_loss": 3.149136543273926, "lr": 6.934837433560506e-05, "tps": 572804, "wall": 2869.1} {"step": 25077, "train_loss": 3.2400217056274414, "lr": 6.933789051294109e-05, "tps": 571917, "wall": 2873.7} {"step": 25078, "train_loss": 3.0821149349212646, "lr": 6.932740839698558e-05, "tps": 571030, "wall": 2878.3} {"step": 25079, "train_loss": 3.197458505630493, "lr": 6.93169279878574e-05, "tps": 570142, "wall": 2882.9} {"step": 25080, "train_loss": 3.219099521636963, "lr": 6.930644928567521e-05, "tps": 569265, "wall": 2887.4} {"step": 25081, "train_loss": 3.2127842903137207, "lr": 6.929597229055767e-05, "tps": 568395, "wall": 2892.0} {"step": 25082, "train_loss": 3.3113174438476562, "lr": 6.928549700262354e-05, "tps": 567529, "wall": 2896.5} {"step": 25083, "train_loss": 3.1630148887634277, "lr": 6.927502342199148e-05, "tps": 566671, "wall": 2901.0} {"step": 25084, "train_loss": 3.290452480316162, "lr": 6.926455154878004e-05, "tps": 565813, "wall": 2905.5} {"step": 25085, "train_loss": 3.152782440185547, "lr": 6.925408138310799e-05, "tps": 564957, "wall": 2910.0} {"step": 25086, "train_loss": 3.151280403137207, "lr": 6.924361292509382e-05, "tps": 564104, "wall": 2914.5} {"step": 25087, "train_loss": 3.231294631958008, "lr": 6.923314617485612e-05, "tps": 563244, "wall": 2919.1} {"step": 25088, "train_loss": 3.0702412128448486, "lr": 6.922268113251357e-05, "tps": 562395, "wall": 2923.6} {"step": 25089, "train_loss": 3.164750814437866, "lr": 6.921221779818464e-05, "tps": 561549, "wall": 2928.1} {"step": 25090, "train_loss": 3.185661554336548, "lr": 6.920175617198781e-05, "tps": 560698, "wall": 2932.7} {"step": 25091, "train_loss": 3.0680246353149414, "lr": 6.919129625404169e-05, "tps": 559858, "wall": 2937.2} {"step": 25092, "train_loss": 3.2044427394866943, "lr": 6.918083804446467e-05, "tps": 559019, "wall": 2941.8} {"step": 25093, "train_loss": 3.1104366779327393, "lr": 6.917038154337533e-05, "tps": 558183, "wall": 2946.3} {"step": 25094, "train_loss": 3.2823257446289062, "lr": 6.915992675089207e-05, "tps": 557342, "wall": 2950.8} {"step": 25095, "train_loss": 3.206145763397217, "lr": 6.914947366713326e-05, "tps": 556510, "wall": 2955.4} {"step": 25096, "train_loss": 3.145796775817871, "lr": 6.913902229221745e-05, "tps": 555680, "wall": 2959.9} {"step": 25097, "train_loss": 3.109985828399658, "lr": 6.912857262626293e-05, "tps": 554851, "wall": 2964.4} {"step": 25098, "train_loss": 3.223667621612549, "lr": 6.911812466938808e-05, "tps": 554028, "wall": 2969.0} {"step": 25099, "train_loss": 3.271085739135742, "lr": 6.910767842171129e-05, "tps": 553206, "wall": 2973.5} {"step": 25100, "train_loss": 3.086747646331787, "lr": 6.909723388335088e-05, "tps": 552380, "wall": 2978.1} {"step": 25101, "train_loss": 3.2944092750549316, "lr": 6.908679105442515e-05, "tps": 551564, "wall": 2982.6} {"step": 25102, "train_loss": 3.2106285095214844, "lr": 6.907634993505245e-05, "tps": 550749, "wall": 2987.1} {"step": 25103, "train_loss": 3.251638412475586, "lr": 6.906591052535103e-05, "tps": 549929, "wall": 2991.7} {"step": 25104, "train_loss": 3.0911431312561035, "lr": 6.905547282543909e-05, "tps": 549119, "wall": 2996.2} {"step": 25105, "train_loss": 3.181718111038208, "lr": 6.904503683543496e-05, "tps": 548300, "wall": 3000.8} {"step": 25106, "train_loss": 3.190504312515259, "lr": 6.903460255545681e-05, "tps": 547495, "wall": 3005.3} {"step": 25107, "train_loss": 3.1836774349212646, "lr": 6.902416998562282e-05, "tps": 546686, "wall": 3009.9} {"step": 25108, "train_loss": 3.1316957473754883, "lr": 6.901373912605124e-05, "tps": 545854, "wall": 3014.6} {"step": 25109, "train_loss": 3.2783305644989014, "lr": 6.900330997686017e-05, "tps": 545052, "wall": 3019.2} {"step": 25110, "train_loss": 3.035125494003296, "lr": 6.899288253816778e-05, "tps": 544255, "wall": 3023.7} {"step": 25111, "train_loss": 3.145833969116211, "lr": 6.89824568100922e-05, "tps": 543451, "wall": 3028.3} {"step": 25112, "train_loss": 3.174140453338623, "lr": 6.89720327927515e-05, "tps": 542652, "wall": 3032.9} {"step": 25113, "train_loss": 3.197368621826172, "lr": 6.896161048626379e-05, "tps": 541780, "wall": 3037.9} {"step": 25114, "train_loss": 3.240060329437256, "lr": 6.895118989074715e-05, "tps": 540912, "wall": 3042.9} {"step": 25115, "train_loss": 3.149813652038574, "lr": 6.894077100631954e-05, "tps": 540105, "wall": 3047.6} {"step": 25116, "train_loss": 3.262727975845337, "lr": 6.89303538330991e-05, "tps": 539322, "wall": 3052.1} {"step": 25117, "train_loss": 3.2204251289367676, "lr": 6.891993837120379e-05, "tps": 538533, "wall": 3056.7} {"step": 25118, "train_loss": 3.1762685775756836, "lr": 6.890952462075156e-05, "tps": 537752, "wall": 3061.3} {"step": 25119, "train_loss": 3.1946263313293457, "lr": 6.889911258186041e-05, "tps": 536979, "wall": 3065.8} {"step": 25120, "train_loss": 3.1967227458953857, "lr": 6.888870225464832e-05, "tps": 536203, "wall": 3070.3} {"step": 25121, "train_loss": 3.2549548149108887, "lr": 6.887829363923315e-05, "tps": 535431, "wall": 3074.9} {"step": 25122, "train_loss": 3.1997079849243164, "lr": 6.886788673573287e-05, "tps": 534662, "wall": 3079.4} {"step": 25123, "train_loss": 3.152615785598755, "lr": 6.885748154426534e-05, "tps": 533893, "wall": 3084.0} {"step": 25124, "train_loss": 3.1415586471557617, "lr": 6.884707806494844e-05, "tps": 533128, "wall": 3088.5} {"step": 25125, "train_loss": 3.1513280868530273, "lr": 6.883667629790001e-05, "tps": 532339, "wall": 3093.2} {"step": 25126, "train_loss": 3.228128671646118, "lr": 6.882627624323785e-05, "tps": 531565, "wall": 3097.9} {"step": 25127, "train_loss": 3.0937600135803223, "lr": 6.881587790107986e-05, "tps": 530805, "wall": 3102.4} {"step": 25128, "train_loss": 3.265794277191162, "lr": 6.880548127154378e-05, "tps": 530047, "wall": 3107.0} {"step": 25129, "train_loss": 3.187520742416382, "lr": 6.879508635474738e-05, "tps": 529288, "wall": 3111.6} {"step": 25130, "train_loss": 3.2058701515197754, "lr": 6.878469315080842e-05, "tps": 528529, "wall": 3116.2} {"step": 25131, "train_loss": 3.2562217712402344, "lr": 6.877430165984465e-05, "tps": 527779, "wall": 3120.7} {"step": 25132, "train_loss": 3.1800129413604736, "lr": 6.876391188197374e-05, "tps": 527031, "wall": 3125.3} {"step": 25133, "train_loss": 3.154508113861084, "lr": 6.875352381731344e-05, "tps": 526284, "wall": 3129.8} {"step": 25134, "train_loss": 3.168421745300293, "lr": 6.874313746598142e-05, "tps": 525530, "wall": 3134.4} {"step": 25135, "train_loss": 3.186769723892212, "lr": 6.873275282809528e-05, "tps": 524776, "wall": 3139.1} {"step": 25136, "train_loss": 3.2730021476745605, "lr": 6.872236990377273e-05, "tps": 524038, "wall": 3143.6} {"step": 25137, "train_loss": 3.1815576553344727, "lr": 6.871198869313138e-05, "tps": 523299, "wall": 3148.2} {"step": 25138, "train_loss": 3.2247772216796875, "lr": 6.870160919628876e-05, "tps": 522555, "wall": 3152.8} {"step": 25139, "train_loss": 3.152005910873413, "lr": 6.869123141336251e-05, "tps": 521804, "wall": 3157.5} {"step": 25140, "train_loss": 3.3173880577087402, "lr": 6.868085534447019e-05, "tps": 521071, "wall": 3162.0} {"step": 25141, "train_loss": 3.1238043308258057, "lr": 6.86704809897293e-05, "tps": 520308, "wall": 3166.8} {"step": 25142, "train_loss": 3.052342414855957, "lr": 6.866010834925742e-05, "tps": 519545, "wall": 3171.6} {"step": 25143, "train_loss": 3.2149786949157715, "lr": 6.864973742317202e-05, "tps": 518793, "wall": 3176.3} {"step": 25144, "train_loss": 3.24544095993042, "lr": 6.863936821159054e-05, "tps": 518065, "wall": 3180.9} {"step": 25145, "train_loss": 3.165963888168335, "lr": 6.862900071463053e-05, "tps": 517337, "wall": 3185.5} {"step": 25146, "train_loss": 3.187943935394287, "lr": 6.861863493240934e-05, "tps": 516605, "wall": 3190.1} {"step": 25147, "train_loss": 3.135957717895508, "lr": 6.860827086504448e-05, "tps": 515863, "wall": 3194.8} {"step": 25148, "train_loss": 3.261007070541382, "lr": 6.859790851265335e-05, "tps": 515121, "wall": 3199.6} {"step": 25149, "train_loss": 3.216646671295166, "lr": 6.858754787535324e-05, "tps": 514385, "wall": 3204.3} {"step": 25150, "train_loss": 3.1245405673980713, "lr": 6.857718895326161e-05, "tps": 513635, "wall": 3209.1} {"step": 25151, "train_loss": 3.224522113800049, "lr": 6.856683174649577e-05, "tps": 512916, "wall": 3213.7} {"step": 25152, "train_loss": 3.191819190979004, "lr": 6.855647625517303e-05, "tps": 512186, "wall": 3218.4} {"step": 25153, "train_loss": 3.2163801193237305, "lr": 6.854612247941077e-05, "tps": 511463, "wall": 3223.1} {"step": 25154, "train_loss": 3.266040802001953, "lr": 6.853577041932622e-05, "tps": 510742, "wall": 3227.8} {"step": 25155, "train_loss": 3.239955186843872, "lr": 6.85254200750366e-05, "tps": 510026, "wall": 3232.4} {"step": 25156, "train_loss": 3.2463276386260986, "lr": 6.851507144665928e-05, "tps": 509320, "wall": 3237.0} {"step": 25157, "train_loss": 3.2319495677948, "lr": 6.85047245343114e-05, "tps": 508595, "wall": 3241.8} {"step": 25158, "train_loss": 3.1228420734405518, "lr": 6.849437933811017e-05, "tps": 507870, "wall": 3246.5} {"step": 25159, "train_loss": 3.208315372467041, "lr": 6.848403585817284e-05, "tps": 507158, "wall": 3251.2} {"step": 25160, "train_loss": 3.116023302078247, "lr": 6.847369409461657e-05, "tps": 506454, "wall": 3255.9} {"step": 25161, "train_loss": 3.1407690048217773, "lr": 6.846335404755844e-05, "tps": 505744, "wall": 3260.6} {"step": 25162, "train_loss": 3.190425157546997, "lr": 6.845301571711567e-05, "tps": 505041, "wall": 3265.2} {"step": 25163, "train_loss": 3.14408016204834, "lr": 6.844267910340527e-05, "tps": 504333, "wall": 3270.0} {"step": 25164, "train_loss": 3.180288791656494, "lr": 6.843234420654449e-05, "tps": 503589, "wall": 3274.9} {"step": 25165, "train_loss": 3.175241708755493, "lr": 6.842201102665029e-05, "tps": 502885, "wall": 3279.6} {"step": 25166, "train_loss": 3.1554651260375977, "lr": 6.841167956383971e-05, "tps": 502193, "wall": 3284.3} {"step": 25167, "train_loss": 3.228451728820801, "lr": 6.840134981822986e-05, "tps": 501490, "wall": 3289.0} {"step": 25168, "train_loss": 3.291807174682617, "lr": 6.839102178993772e-05, "tps": 500792, "wall": 3293.7} {"step": 25169, "train_loss": 3.1616406440734863, "lr": 6.838069547908026e-05, "tps": 500104, "wall": 3298.4} {"step": 25170, "train_loss": 3.1405715942382812, "lr": 6.837037088577451e-05, "tps": 499424, "wall": 3303.0} {"step": 25171, "train_loss": 3.2116029262542725, "lr": 6.836004801013741e-05, "tps": 498754, "wall": 3307.6} {"step": 25172, "train_loss": 3.173527240753174, "lr": 6.834972685228583e-05, "tps": 498076, "wall": 3312.2} {"step": 25173, "train_loss": 3.1444311141967773, "lr": 6.833940741233682e-05, "tps": 497408, "wall": 3316.8} {"step": 25174, "train_loss": 3.201225757598877, "lr": 6.832908969040719e-05, "tps": 496745, "wall": 3321.4} {"step": 25175, "train_loss": 3.179363250732422, "lr": 6.831877368661382e-05, "tps": 496085, "wall": 3325.9} {"step": 25176, "train_loss": 3.185044288635254, "lr": 6.830845940107359e-05, "tps": 495411, "wall": 3330.6} {"step": 25177, "train_loss": 3.1377010345458984, "lr": 6.829814683390337e-05, "tps": 494736, "wall": 3335.2} {"step": 25178, "train_loss": 3.146921157836914, "lr": 6.828783598521988e-05, "tps": 494062, "wall": 3339.9} {"step": 25179, "train_loss": 3.263169527053833, "lr": 6.827752685514006e-05, "tps": 493403, "wall": 3344.5} {"step": 25180, "train_loss": 3.1645078659057617, "lr": 6.826721944378056e-05, "tps": 492736, "wall": 3349.2} {"step": 25181, "train_loss": 3.2943201065063477, "lr": 6.825691375125827e-05, "tps": 492080, "wall": 3353.8} {"step": 25182, "train_loss": 3.2360775470733643, "lr": 6.824660977768985e-05, "tps": 491426, "wall": 3358.4} {"step": 25183, "train_loss": 3.123599052429199, "lr": 6.823630752319201e-05, "tps": 490766, "wall": 3363.0} {"step": 25184, "train_loss": 3.073082685470581, "lr": 6.822600698788154e-05, "tps": 490112, "wall": 3367.6} {"step": 25185, "train_loss": 3.2086033821105957, "lr": 6.821570817187506e-05, "tps": 489439, "wall": 3372.4} {"step": 25186, "train_loss": 3.2229561805725098, "lr": 6.820541107528922e-05, "tps": 488768, "wall": 3377.2} {"step": 25187, "train_loss": 3.257796287536621, "lr": 6.819511569824074e-05, "tps": 488099, "wall": 3381.9} {"step": 25188, "train_loss": 3.2223668098449707, "lr": 6.818482204084617e-05, "tps": 487443, "wall": 3386.6} {"step": 25189, "train_loss": 3.1416873931884766, "lr": 6.817453010322212e-05, "tps": 486797, "wall": 3391.2} {"step": 25190, "train_loss": 3.2185139656066895, "lr": 6.816423988548528e-05, "tps": 486151, "wall": 3395.9} {"step": 25191, "train_loss": 3.1022324562072754, "lr": 6.815395138775212e-05, "tps": 485522, "wall": 3400.4} {"step": 25192, "train_loss": 3.241297721862793, "lr": 6.814366461013917e-05, "tps": 484891, "wall": 3405.0} {"step": 25193, "train_loss": 3.173222303390503, "lr": 6.813337955276305e-05, "tps": 484258, "wall": 3409.6} {"step": 25194, "train_loss": 3.1969385147094727, "lr": 6.812309621574021e-05, "tps": 483633, "wall": 3414.1} {"step": 25195, "train_loss": 3.1705074310302734, "lr": 6.811281459918712e-05, "tps": 483008, "wall": 3418.7} {"step": 25196, "train_loss": 3.2444982528686523, "lr": 6.810253470322035e-05, "tps": 482384, "wall": 3423.2} {"step": 25197, "train_loss": 3.1637706756591797, "lr": 6.809225652795625e-05, "tps": 481762, "wall": 3427.8} {"step": 25198, "train_loss": 3.1067514419555664, "lr": 6.808198007351125e-05, "tps": 481141, "wall": 3432.3} {"step": 25199, "train_loss": 3.2112369537353516, "lr": 6.807170534000185e-05, "tps": 480523, "wall": 3436.9} {"step": 25200, "train_loss": 3.206699848175049, "lr": 6.806143232754434e-05, "tps": 479905, "wall": 3441.5} {"step": 25201, "train_loss": 3.2143774032592773, "lr": 6.80511610362552e-05, "tps": 479291, "wall": 3446.0} {"step": 25202, "train_loss": 3.2139439582824707, "lr": 6.80408914662507e-05, "tps": 478678, "wall": 3450.5} {"step": 25203, "train_loss": 3.2500357627868652, "lr": 6.803062361764718e-05, "tps": 478060, "wall": 3455.1} {"step": 25204, "train_loss": 3.157363176345825, "lr": 6.802035749056107e-05, "tps": 477449, "wall": 3459.7} {"step": 25205, "train_loss": 3.1711602210998535, "lr": 6.801009308510848e-05, "tps": 476840, "wall": 3464.3} {"step": 25206, "train_loss": 3.2793588638305664, "lr": 6.799983040140581e-05, "tps": 476234, "wall": 3468.8} {"step": 25207, "train_loss": 3.144467830657959, "lr": 6.798956943956929e-05, "tps": 475628, "wall": 3473.4} {"step": 25208, "train_loss": 3.2434942722320557, "lr": 6.797931019971512e-05, "tps": 475025, "wall": 3477.9} {"step": 25209, "train_loss": 3.0836472511291504, "lr": 6.796905268195958e-05, "tps": 474424, "wall": 3482.5} {"step": 25210, "train_loss": 3.233980655670166, "lr": 6.795879688641882e-05, "tps": 473814, "wall": 3487.1} {"step": 25211, "train_loss": 3.189929485321045, "lr": 6.794854281320902e-05, "tps": 473199, "wall": 3491.7} {"step": 25212, "train_loss": 3.210836887359619, "lr": 6.79382904624464e-05, "tps": 472596, "wall": 3496.3} {"step": 25213, "train_loss": 3.1367433071136475, "lr": 6.792803983424702e-05, "tps": 472000, "wall": 3500.9} {"step": 25214, "train_loss": 3.211300849914551, "lr": 6.7917790928727e-05, "tps": 471406, "wall": 3505.4} {"step": 25215, "train_loss": 3.2907092571258545, "lr": 6.790754374600254e-05, "tps": 470814, "wall": 3510.0} {"step": 25216, "train_loss": 3.2667510509490967, "lr": 6.789729828618963e-05, "tps": 470218, "wall": 3514.6} {"step": 25217, "train_loss": 3.145402431488037, "lr": 6.78870545494043e-05, "tps": 469623, "wall": 3519.2} {"step": 25218, "train_loss": 3.2204651832580566, "lr": 6.78768125357627e-05, "tps": 469036, "wall": 3523.7} {"step": 25219, "train_loss": 3.10837459564209, "lr": 6.78665722453808e-05, "tps": 468448, "wall": 3528.3} {"step": 25220, "train_loss": 3.188791513442993, "lr": 6.785633367837456e-05, "tps": 467862, "wall": 3532.8} {"step": 25221, "train_loss": 3.215202569961548, "lr": 6.784609683486005e-05, "tps": 467278, "wall": 3537.4} {"step": 25222, "train_loss": 3.2130300998687744, "lr": 6.783586171495313e-05, "tps": 466696, "wall": 3541.9} {"step": 25223, "train_loss": 3.153075933456421, "lr": 6.782562831876985e-05, "tps": 466116, "wall": 3546.5} {"step": 25224, "train_loss": 3.220749616622925, "lr": 6.781539664642607e-05, "tps": 465535, "wall": 3551.1} {"step": 25225, "train_loss": 3.1752216815948486, "lr": 6.78051666980377e-05, "tps": 464950, "wall": 3555.7} {"step": 25226, "train_loss": 3.2257192134857178, "lr": 6.779493847372065e-05, "tps": 464366, "wall": 3560.3} {"step": 25227, "train_loss": 3.223383665084839, "lr": 6.77847119735908e-05, "tps": 463772, "wall": 3565.0} {"step": 25228, "train_loss": 3.1769659519195557, "lr": 6.77744871977639e-05, "tps": 463199, "wall": 3569.5} {"step": 25229, "train_loss": 3.2260091304779053, "lr": 6.776426414635588e-05, "tps": 462627, "wall": 3574.1} {"step": 25230, "train_loss": 3.1867241859436035, "lr": 6.775404281948253e-05, "tps": 462023, "wall": 3578.9} {"step": 25231, "train_loss": 3.1262011528015137, "lr": 6.774382321725956e-05, "tps": 461417, "wall": 3583.8} {"step": 25232, "train_loss": 3.2043368816375732, "lr": 6.773360533980286e-05, "tps": 460829, "wall": 3588.5} {"step": 25233, "train_loss": 3.153928756713867, "lr": 6.772338918722809e-05, "tps": 460248, "wall": 3593.1} {"step": 25234, "train_loss": 3.2029168605804443, "lr": 6.7713174759651e-05, "tps": 459666, "wall": 3597.8} {"step": 25235, "train_loss": 3.1913318634033203, "lr": 6.770296205718732e-05, "tps": 459093, "wall": 3602.5} {"step": 25236, "train_loss": 3.247809886932373, "lr": 6.769275107995272e-05, "tps": 458524, "wall": 3607.1} {"step": 25237, "train_loss": 3.1915597915649414, "lr": 6.768254182806287e-05, "tps": 457956, "wall": 3611.7} {"step": 25238, "train_loss": 3.157846450805664, "lr": 6.767233430163344e-05, "tps": 457385, "wall": 3616.3} {"step": 25239, "train_loss": 3.198235034942627, "lr": 6.766212850078002e-05, "tps": 456790, "wall": 3621.2} {"step": 25240, "train_loss": 3.2290525436401367, "lr": 6.765192442561825e-05, "tps": 456227, "wall": 3625.8} {"step": 25241, "train_loss": 3.0657033920288086, "lr": 6.764172207626376e-05, "tps": 455665, "wall": 3630.4} {"step": 25242, "train_loss": 3.1770060062408447, "lr": 6.763152145283202e-05, "tps": 455096, "wall": 3635.1} {"step": 25243, "train_loss": 3.223752021789551, "lr": 6.762132255543872e-05, "tps": 454536, "wall": 3639.7} {"step": 25244, "train_loss": 3.1761574745178223, "lr": 6.76111253841993e-05, "tps": 453983, "wall": 3644.3} {"step": 25245, "train_loss": 3.2635374069213867, "lr": 6.760092993922926e-05, "tps": 453433, "wall": 3648.9} {"step": 25246, "train_loss": 3.097505569458008, "lr": 6.759073622064416e-05, "tps": 452886, "wall": 3653.4} {"step": 25247, "train_loss": 3.177006959915161, "lr": 6.758054422855948e-05, "tps": 452340, "wall": 3658.0} {"step": 25248, "train_loss": 3.3316969871520996, "lr": 6.757035396309057e-05, "tps": 451796, "wall": 3662.5} {"step": 25249, "train_loss": 3.180025577545166, "lr": 6.756016542435298e-05, "tps": 451253, "wall": 3667.1} {"step": 25250, "train_loss": 3.16571307182312, "lr": 6.754997861246209e-05, "tps": 450711, "wall": 3671.6} {"step": 25251, "train_loss": 3.2254810333251953, "lr": 6.753979352753325e-05, "tps": 450166, "wall": 3676.2} {"step": 25252, "train_loss": 3.091810941696167, "lr": 6.752961016968191e-05, "tps": 449614, "wall": 3680.9} {"step": 25253, "train_loss": 3.1332640647888184, "lr": 6.75194285390234e-05, "tps": 449071, "wall": 3685.5} {"step": 25254, "train_loss": 3.131962299346924, "lr": 6.750924863567301e-05, "tps": 448520, "wall": 3690.2} {"step": 25255, "train_loss": 3.0700135231018066, "lr": 6.749907045974614e-05, "tps": 447984, "wall": 3694.7} {"step": 25256, "train_loss": 3.2993571758270264, "lr": 6.748889401135806e-05, "tps": 447445, "wall": 3699.3} {"step": 25257, "train_loss": 3.166421890258789, "lr": 6.747871929062399e-05, "tps": 446911, "wall": 3703.9} {"step": 25258, "train_loss": 3.1608567237854004, "lr": 6.746854629765929e-05, "tps": 446376, "wall": 3708.5} {"step": 25259, "train_loss": 3.217820167541504, "lr": 6.745837503257908e-05, "tps": 445820, "wall": 3713.2} {"step": 25260, "train_loss": 3.1621527671813965, "lr": 6.744820549549873e-05, "tps": 445292, "wall": 3717.8} {"step": 25261, "train_loss": 3.1936655044555664, "lr": 6.743803768653334e-05, "tps": 444765, "wall": 3722.3} {"step": 25262, "train_loss": 3.2493410110473633, "lr": 6.742787160579806e-05, "tps": 444222, "wall": 3727.0} {"step": 25263, "train_loss": 3.245011329650879, "lr": 6.741770725340816e-05, "tps": 443680, "wall": 3731.7} {"step": 25264, "train_loss": 3.0767035484313965, "lr": 6.740754462947874e-05, "tps": 443154, "wall": 3736.3} {"step": 25265, "train_loss": 3.127152919769287, "lr": 6.739738373412486e-05, "tps": 442630, "wall": 3740.9} {"step": 25266, "train_loss": 3.207613945007324, "lr": 6.73872245674617e-05, "tps": 442101, "wall": 3745.5} {"step": 25267, "train_loss": 3.168013334274292, "lr": 6.737706712960433e-05, "tps": 441567, "wall": 3750.2} {"step": 25268, "train_loss": 3.1625750064849854, "lr": 6.736691142066776e-05, "tps": 441043, "wall": 3754.8} {"step": 25269, "train_loss": 3.213583469390869, "lr": 6.735675744076709e-05, "tps": 440516, "wall": 3759.4} {"step": 25270, "train_loss": 3.14265775680542, "lr": 6.734660519001736e-05, "tps": 439996, "wall": 3764.0} {"step": 25271, "train_loss": 3.182119369506836, "lr": 6.733645466853348e-05, "tps": 439463, "wall": 3768.7} {"step": 25272, "train_loss": 3.2220420837402344, "lr": 6.732630587643055e-05, "tps": 438939, "wall": 3773.4} {"step": 25273, "train_loss": 3.1816763877868652, "lr": 6.731615881382349e-05, "tps": 438415, "wall": 3778.1} {"step": 25274, "train_loss": 3.089674472808838, "lr": 6.730601348082721e-05, "tps": 437895, "wall": 3782.7} {"step": 25275, "train_loss": 3.218597173690796, "lr": 6.729586987755672e-05, "tps": 437369, "wall": 3787.4} {"step": 25276, "train_loss": 3.3005785942077637, "lr": 6.728572800412685e-05, "tps": 436843, "wall": 3792.1} {"step": 25277, "train_loss": 3.2297983169555664, "lr": 6.727558786065247e-05, "tps": 436332, "wall": 3796.7} {"step": 25278, "train_loss": 3.2624459266662598, "lr": 6.726544944724856e-05, "tps": 435813, "wall": 3801.4} {"step": 25279, "train_loss": 3.1142776012420654, "lr": 6.725531276402984e-05, "tps": 435300, "wall": 3806.0} {"step": 25280, "train_loss": 3.086472511291504, "lr": 6.724517781111126e-05, "tps": 434789, "wall": 3810.6} {"step": 25281, "train_loss": 3.1455252170562744, "lr": 6.723504458860756e-05, "tps": 434273, "wall": 3815.3} {"step": 25282, "train_loss": 3.2127020359039307, "lr": 6.722491309663348e-05, "tps": 433763, "wall": 3819.9} {"step": 25283, "train_loss": 3.121772289276123, "lr": 6.721478333530391e-05, "tps": 433258, "wall": 3824.5} {"step": 25284, "train_loss": 3.248931646347046, "lr": 6.720465530473355e-05, "tps": 432751, "wall": 3829.2} {"step": 25285, "train_loss": 3.1360485553741455, "lr": 6.719452900503706e-05, "tps": 432242, "wall": 3833.8} {"step": 25286, "train_loss": 3.3691866397857666, "lr": 6.718440443632926e-05, "tps": 431737, "wall": 3838.5} {"step": 25287, "train_loss": 3.1628544330596924, "lr": 6.717428159872478e-05, "tps": 431231, "wall": 3843.1} {"step": 25288, "train_loss": 3.2563576698303223, "lr": 6.716416049233831e-05, "tps": 430702, "wall": 3848.0} {"step": 25289, "train_loss": 3.223069429397583, "lr": 6.715404111728449e-05, "tps": 430206, "wall": 3852.6} {"step": 25290, "train_loss": 3.228813886642456, "lr": 6.7143923473678e-05, "tps": 429712, "wall": 3857.2} {"step": 25291, "train_loss": 3.239095449447632, "lr": 6.713380756163334e-05, "tps": 429218, "wall": 3861.8} {"step": 25292, "train_loss": 3.2245397567749023, "lr": 6.712369338126523e-05, "tps": 428720, "wall": 3866.4} {"step": 25293, "train_loss": 3.1741251945495605, "lr": 6.71135809326882e-05, "tps": 428226, "wall": 3871.0} {"step": 25294, "train_loss": 3.2079148292541504, "lr": 6.710347021601676e-05, "tps": 427726, "wall": 3875.7} {"step": 25295, "train_loss": 3.2348766326904297, "lr": 6.709336123136549e-05, "tps": 427235, "wall": 3880.3} {"step": 25296, "train_loss": 3.1267635822296143, "lr": 6.708325397884889e-05, "tps": 426746, "wall": 3884.9} {"step": 25297, "train_loss": 3.313619375228882, "lr": 6.707314845858149e-05, "tps": 426256, "wall": 3889.5} {"step": 25298, "train_loss": 3.1683549880981445, "lr": 6.706304467067774e-05, "tps": 425758, "wall": 3894.2} {"step": 25299, "train_loss": 3.2376022338867188, "lr": 6.705294261525204e-05, "tps": 425258, "wall": 3899.0} {"step": 25300, "train_loss": 3.102369785308838, "lr": 6.704284229241892e-05, "tps": 424760, "wall": 3903.7} {"step": 25301, "train_loss": 3.268576145172119, "lr": 6.703274370229277e-05, "tps": 424269, "wall": 3908.3} {"step": 25302, "train_loss": 3.192084789276123, "lr": 6.702264684498794e-05, "tps": 423779, "wall": 3913.0} {"step": 25303, "train_loss": 3.2413907051086426, "lr": 6.701255172061889e-05, "tps": 423303, "wall": 3917.6} {"step": 25304, "train_loss": 3.2504758834838867, "lr": 6.70024583292999e-05, "tps": 422829, "wall": 3922.1} {"step": 25305, "train_loss": 3.1754870414733887, "lr": 6.69923666711453e-05, "tps": 422353, "wall": 3926.7} {"step": 25306, "train_loss": 3.2213101387023926, "lr": 6.698227674626951e-05, "tps": 421879, "wall": 3931.3} {"step": 25307, "train_loss": 3.1407294273376465, "lr": 6.697218855478677e-05, "tps": 421393, "wall": 3936.0} {"step": 25308, "train_loss": 3.1771798133850098, "lr": 6.696210209681131e-05, "tps": 420924, "wall": 3940.5} {"step": 25309, "train_loss": 3.170097827911377, "lr": 6.695201737245747e-05, "tps": 420440, "wall": 3945.2} {"step": 25310, "train_loss": 3.2419216632843018, "lr": 6.694193438183945e-05, "tps": 419972, "wall": 3949.7} {"step": 25311, "train_loss": 3.158626079559326, "lr": 6.693185312507144e-05, "tps": 419504, "wall": 3954.3} {"step": 25312, "train_loss": 3.117888927459717, "lr": 6.692177360226774e-05, "tps": 419035, "wall": 3958.9} {"step": 25313, "train_loss": 3.0787510871887207, "lr": 6.691169581354241e-05, "tps": 418569, "wall": 3963.5} {"step": 25314, "train_loss": 3.1485891342163086, "lr": 6.690161975900971e-05, "tps": 418094, "wall": 3968.1} {"step": 25315, "train_loss": 3.2189507484436035, "lr": 6.689154543878376e-05, "tps": 417627, "wall": 3972.7} {"step": 25316, "train_loss": 3.1807456016540527, "lr": 6.688147285297863e-05, "tps": 417145, "wall": 3977.5} {"step": 25317, "train_loss": 3.1996891498565674, "lr": 6.687140200170847e-05, "tps": 416659, "wall": 3982.2} {"step": 25318, "train_loss": 3.192856788635254, "lr": 6.686133288508738e-05, "tps": 416198, "wall": 3986.8} {"step": 25319, "train_loss": 3.2479910850524902, "lr": 6.685126550322933e-05, "tps": 415713, "wall": 3991.6} {"step": 25320, "train_loss": 3.2001285552978516, "lr": 6.68411998562485e-05, "tps": 415237, "wall": 3996.4} {"step": 25321, "train_loss": 3.224325656890869, "lr": 6.68311359442588e-05, "tps": 414756, "wall": 4001.1} {"step": 25322, "train_loss": 3.2862210273742676, "lr": 6.682107376737429e-05, "tps": 414291, "wall": 4005.8} {"step": 25323, "train_loss": 3.23287034034729, "lr": 6.681101332570895e-05, "tps": 413826, "wall": 4010.5} {"step": 25324, "train_loss": 3.350736141204834, "lr": 6.680095461937676e-05, "tps": 413367, "wall": 4015.1} {"step": 25325, "train_loss": 3.2218263149261475, "lr": 6.679089764849159e-05, "tps": 412908, "wall": 4019.7} {"step": 25326, "train_loss": 3.1009669303894043, "lr": 6.678084241316744e-05, "tps": 412448, "wall": 4024.3} {"step": 25327, "train_loss": 3.1152243614196777, "lr": 6.677078891351824e-05, "tps": 411992, "wall": 4029.0} {"step": 25328, "train_loss": 3.224208116531372, "lr": 6.676073714965777e-05, "tps": 411524, "wall": 4033.7} {"step": 25329, "train_loss": 3.2927370071411133, "lr": 6.67506871217e-05, "tps": 411053, "wall": 4038.5} {"step": 25330, "train_loss": 3.2133822441101074, "lr": 6.674063882975873e-05, "tps": 410605, "wall": 4043.0} {"step": 25331, "train_loss": 3.2253737449645996, "lr": 6.673059227394776e-05, "tps": 410149, "wall": 4047.7} {"step": 25332, "train_loss": 3.1486542224884033, "lr": 6.6720547454381e-05, "tps": 409700, "wall": 4052.3} {"step": 25333, "train_loss": 3.176179885864258, "lr": 6.671050437117208e-05, "tps": 409249, "wall": 4056.9} {"step": 25334, "train_loss": 3.273714780807495, "lr": 6.670046302443494e-05, "tps": 408806, "wall": 4061.5} {"step": 25335, "train_loss": 3.177485466003418, "lr": 6.669042341428324e-05, "tps": 408365, "wall": 4066.0} {"step": 25336, "train_loss": 3.1924567222595215, "lr": 6.668038554083064e-05, "tps": 407921, "wall": 4070.6} {"step": 25337, "train_loss": 3.1479246616363525, "lr": 6.667034940419102e-05, "tps": 407476, "wall": 4075.2} {"step": 25338, "train_loss": 3.184598445892334, "lr": 6.666031500447793e-05, "tps": 407034, "wall": 4079.8} {"step": 25339, "train_loss": 3.328372001647949, "lr": 6.66502823418051e-05, "tps": 406578, "wall": 4084.5} {"step": 25340, "train_loss": 3.2286674976348877, "lr": 6.664025141628616e-05, "tps": 406117, "wall": 4089.3} {"step": 25341, "train_loss": 3.2361104488372803, "lr": 6.663022222803478e-05, "tps": 405663, "wall": 4094.1} {"step": 25342, "train_loss": 3.1064505577087402, "lr": 6.662019477716449e-05, "tps": 405227, "wall": 4098.6} {"step": 25343, "train_loss": 3.088484525680542, "lr": 6.661016906378896e-05, "tps": 404784, "wall": 4103.3} {"step": 25344, "train_loss": 3.1836259365081787, "lr": 6.660014508802175e-05, "tps": 404340, "wall": 4107.9} {"step": 25345, "train_loss": 3.115382194519043, "lr": 6.659012284997634e-05, "tps": 403901, "wall": 4112.6} {"step": 25346, "train_loss": 3.1335368156433105, "lr": 6.658010234976636e-05, "tps": 403449, "wall": 4117.3} {"step": 25347, "train_loss": 3.2310545444488525, "lr": 6.657008358750529e-05, "tps": 403020, "wall": 4121.9} {"step": 25348, "train_loss": 3.2313878536224365, "lr": 6.656006656330658e-05, "tps": 402583, "wall": 4126.5} {"step": 25349, "train_loss": 3.191098690032959, "lr": 6.655005127728375e-05, "tps": 402152, "wall": 4131.1} {"step": 25350, "train_loss": 3.224965810775757, "lr": 6.654003772955022e-05, "tps": 401717, "wall": 4135.8} {"step": 25351, "train_loss": 3.1288819313049316, "lr": 6.653002592021949e-05, "tps": 401278, "wall": 4140.4} {"step": 25352, "train_loss": 3.21087646484375, "lr": 6.65200158494049e-05, "tps": 400839, "wall": 4145.1} {"step": 25353, "train_loss": 3.253647804260254, "lr": 6.651000751721986e-05, "tps": 400402, "wall": 4149.8} {"step": 25354, "train_loss": 3.2911059856414795, "lr": 6.65000009237778e-05, "tps": 399972, "wall": 4154.4} {"step": 25355, "train_loss": 3.198782444000244, "lr": 6.648999606919203e-05, "tps": 399543, "wall": 4159.1} {"step": 25356, "train_loss": 3.1983046531677246, "lr": 6.647999295357583e-05, "tps": 399118, "wall": 4163.7} {"step": 25357, "train_loss": 3.304561138153076, "lr": 6.646999157704265e-05, "tps": 398694, "wall": 4168.3} {"step": 25358, "train_loss": 3.2339468002319336, "lr": 6.645999193970568e-05, "tps": 398272, "wall": 4172.8} {"step": 25359, "train_loss": 3.278860092163086, "lr": 6.644999404167818e-05, "tps": 397845, "wall": 4177.5} {"step": 25360, "train_loss": 3.2349014282226562, "lr": 6.643999788307353e-05, "tps": 397424, "wall": 4182.1} {"step": 25361, "train_loss": 3.1905038356781006, "lr": 6.643000346400488e-05, "tps": 397006, "wall": 4186.6} {"step": 25362, "train_loss": 3.13327693939209, "lr": 6.642001078458541e-05, "tps": 396588, "wall": 4191.2} {"step": 25363, "train_loss": 3.2022476196289062, "lr": 6.64100198449284e-05, "tps": 396173, "wall": 4195.8} {"step": 25364, "train_loss": 3.276017665863037, "lr": 6.640003064514701e-05, "tps": 395762, "wall": 4200.3} {"step": 25365, "train_loss": 3.1644232273101807, "lr": 6.639004318535435e-05, "tps": 395351, "wall": 4204.8} {"step": 25366, "train_loss": 3.2884039878845215, "lr": 6.638005746566359e-05, "tps": 394941, "wall": 4209.4} {"step": 25367, "train_loss": 3.149209499359131, "lr": 6.637007348618785e-05, "tps": 394532, "wall": 4213.9} {"step": 25368, "train_loss": 3.2056241035461426, "lr": 6.636009124704026e-05, "tps": 394122, "wall": 4218.4} {"step": 25369, "train_loss": 3.209735870361328, "lr": 6.635011074833386e-05, "tps": 393709, "wall": 4223.0} {"step": 25370, "train_loss": 3.1767947673797607, "lr": 6.634013199018169e-05, "tps": 393297, "wall": 4227.6} {"step": 25371, "train_loss": 3.191300630569458, "lr": 6.633015497269684e-05, "tps": 392885, "wall": 4232.2} {"step": 25372, "train_loss": 3.1808600425720215, "lr": 6.632017969599231e-05, "tps": 392471, "wall": 4236.9} {"step": 25373, "train_loss": 3.1530368328094482, "lr": 6.631020616018111e-05, "tps": 392063, "wall": 4241.4} {"step": 25374, "train_loss": 3.2633678913116455, "lr": 6.63002343653762e-05, "tps": 391654, "wall": 4246.0} {"step": 25375, "train_loss": 3.191183090209961, "lr": 6.629026431169053e-05, "tps": 391241, "wall": 4250.7} {"step": 25376, "train_loss": 3.2386293411254883, "lr": 6.628029599923708e-05, "tps": 390830, "wall": 4255.3} {"step": 25377, "train_loss": 3.166055202484131, "lr": 6.627032942812877e-05, "tps": 390419, "wall": 4260.0} {"step": 25378, "train_loss": 3.2040154933929443, "lr": 6.626036459847842e-05, "tps": 390012, "wall": 4264.6} {"step": 25379, "train_loss": 3.059678077697754, "lr": 6.625040151039904e-05, "tps": 389612, "wall": 4269.1} {"step": 25380, "train_loss": 3.1444716453552246, "lr": 6.624044016400342e-05, "tps": 389209, "wall": 4273.7} {"step": 25381, "train_loss": 3.217351198196411, "lr": 6.623048055940437e-05, "tps": 388807, "wall": 4278.3} {"step": 25382, "train_loss": 3.0693211555480957, "lr": 6.622052269671481e-05, "tps": 388407, "wall": 4282.9} {"step": 25383, "train_loss": 3.246521472930908, "lr": 6.621056657604748e-05, "tps": 388006, "wall": 4287.5} {"step": 25384, "train_loss": 3.1995177268981934, "lr": 6.62006121975151e-05, "tps": 387606, "wall": 4292.1} {"step": 25385, "train_loss": 3.211639881134033, "lr": 6.619065956123058e-05, "tps": 387201, "wall": 4296.7} {"step": 25386, "train_loss": 3.172755002975464, "lr": 6.618070866730659e-05, "tps": 386802, "wall": 4301.3} {"step": 25387, "train_loss": 3.232851505279541, "lr": 6.617075951585579e-05, "tps": 386407, "wall": 4305.9} {"step": 25388, "train_loss": 3.1280627250671387, "lr": 6.6160812106991e-05, "tps": 386013, "wall": 4310.5} {"step": 25389, "train_loss": 3.116187572479248, "lr": 6.615086644082488e-05, "tps": 385615, "wall": 4315.1} {"step": 25390, "train_loss": 3.189293146133423, "lr": 6.614092251747001e-05, "tps": 385219, "wall": 4319.7} {"step": 25391, "train_loss": 3.3724474906921387, "lr": 6.61309803370391e-05, "tps": 384821, "wall": 4324.3} {"step": 25392, "train_loss": 3.128938674926758, "lr": 6.612103989964477e-05, "tps": 384427, "wall": 4328.9} {"step": 25393, "train_loss": 3.1481575965881348, "lr": 6.611110120539966e-05, "tps": 384032, "wall": 4333.5} {"step": 25394, "train_loss": 3.2223362922668457, "lr": 6.61011642544163e-05, "tps": 383643, "wall": 4338.1} {"step": 25395, "train_loss": 3.1245980262756348, "lr": 6.609122904680727e-05, "tps": 383253, "wall": 4342.7} {"step": 25396, "train_loss": 3.2984910011291504, "lr": 6.608129558268514e-05, "tps": 382864, "wall": 4347.3} {"step": 25397, "train_loss": 3.317948818206787, "lr": 6.607136386216242e-05, "tps": 382473, "wall": 4351.9} {"step": 25398, "train_loss": 3.174849033355713, "lr": 6.606143388535157e-05, "tps": 382081, "wall": 4356.5} {"step": 25399, "train_loss": 3.2081549167633057, "lr": 6.605150565236519e-05, "tps": 381697, "wall": 4361.1} {"step": 25400, "train_loss": 3.222806930541992, "lr": 6.604157916331567e-05, "tps": 381309, "wall": 4365.7} {"step": 25401, "train_loss": 3.2274422645568848, "lr": 6.603165441831544e-05, "tps": 380925, "wall": 4370.3} {"step": 25402, "train_loss": 3.2654027938842773, "lr": 6.602173141747698e-05, "tps": 380541, "wall": 4374.8} {"step": 25403, "train_loss": 3.2161169052124023, "lr": 6.60118101609127e-05, "tps": 380157, "wall": 4379.4} {"step": 25404, "train_loss": 3.2437446117401123, "lr": 6.600189064873488e-05, "tps": 379774, "wall": 4384.0} {"step": 25405, "train_loss": 3.2144858837127686, "lr": 6.599197288105606e-05, "tps": 379390, "wall": 4388.6} {"step": 25406, "train_loss": 3.1639013290405273, "lr": 6.598205685798847e-05, "tps": 379007, "wall": 4393.2} {"step": 25407, "train_loss": 3.1538596153259277, "lr": 6.597214257964446e-05, "tps": 378627, "wall": 4397.8} {"step": 25408, "train_loss": 3.1607840061187744, "lr": 6.596223004613639e-05, "tps": 378249, "wall": 4402.4} {"step": 25409, "train_loss": 3.18847393989563, "lr": 6.595231925757645e-05, "tps": 377873, "wall": 4407.0} {"step": 25410, "train_loss": 3.1752681732177734, "lr": 6.594241021407702e-05, "tps": 377495, "wall": 4411.5} {"step": 25411, "train_loss": 3.1473937034606934, "lr": 6.593250291575031e-05, "tps": 377114, "wall": 4416.2} {"step": 25412, "train_loss": 3.1671905517578125, "lr": 6.592259736270849e-05, "tps": 376738, "wall": 4420.8} {"step": 25413, "train_loss": 3.226555109024048, "lr": 6.591269355506387e-05, "tps": 376365, "wall": 4425.3} {"step": 25414, "train_loss": 3.2345566749572754, "lr": 6.590279149292859e-05, "tps": 375994, "wall": 4429.8} {"step": 25415, "train_loss": 3.1613852977752686, "lr": 6.58928911764148e-05, "tps": 375623, "wall": 4434.4} {"step": 25416, "train_loss": 3.1872308254241943, "lr": 6.588299260563468e-05, "tps": 375238, "wall": 4439.1} {"step": 25417, "train_loss": 3.173910617828369, "lr": 6.58730957807004e-05, "tps": 374864, "wall": 4443.7} {"step": 25418, "train_loss": 3.257927179336548, "lr": 6.586320070172396e-05, "tps": 374492, "wall": 4448.3} {"step": 25419, "train_loss": 3.103586435317993, "lr": 6.585330736881757e-05, "tps": 374119, "wall": 4452.9} {"step": 25420, "train_loss": 3.16088604927063, "lr": 6.584341578209326e-05, "tps": 373745, "wall": 4457.6} {"step": 25421, "train_loss": 3.189136028289795, "lr": 6.583352594166301e-05, "tps": 373374, "wall": 4462.2} {"step": 25422, "train_loss": 3.138838291168213, "lr": 6.5823637847639e-05, "tps": 373004, "wall": 4466.8} {"step": 25423, "train_loss": 3.1589226722717285, "lr": 6.581375150013313e-05, "tps": 372621, "wall": 4471.5} {"step": 25424, "train_loss": 3.215787649154663, "lr": 6.58038668992574e-05, "tps": 372248, "wall": 4476.2} {"step": 25425, "train_loss": 3.2617506980895996, "lr": 6.579398404512384e-05, "tps": 371856, "wall": 4481.1} {"step": 25426, "train_loss": 3.1799044609069824, "lr": 6.578410293784436e-05, "tps": 371469, "wall": 4485.9} {"step": 25427, "train_loss": 3.259377956390381, "lr": 6.577422357753088e-05, "tps": 371088, "wall": 4490.7} {"step": 25428, "train_loss": 3.0954837799072266, "lr": 6.576434596429537e-05, "tps": 370703, "wall": 4495.6} {"step": 25429, "train_loss": 3.2040915489196777, "lr": 6.575447009824967e-05, "tps": 370322, "wall": 4500.4} {"step": 25430, "train_loss": 3.1997625827789307, "lr": 6.574459597950571e-05, "tps": 369935, "wall": 4505.2} {"step": 25431, "train_loss": 3.146383762359619, "lr": 6.57347236081753e-05, "tps": 369559, "wall": 4510.0} {"step": 25432, "train_loss": 3.1707520484924316, "lr": 6.572485298437025e-05, "tps": 369200, "wall": 4514.6} {"step": 25433, "train_loss": 3.2520322799682617, "lr": 6.571498410820247e-05, "tps": 368842, "wall": 4519.1} {"step": 25434, "train_loss": 3.156252861022949, "lr": 6.570511697978367e-05, "tps": 368483, "wall": 4523.7} {"step": 25435, "train_loss": 3.105823516845703, "lr": 6.569525159922563e-05, "tps": 368127, "wall": 4528.2} {"step": 25436, "train_loss": 3.2437667846679688, "lr": 6.568538796664017e-05, "tps": 367770, "wall": 4532.8} {"step": 25437, "train_loss": 3.2656021118164062, "lr": 6.567552608213896e-05, "tps": 367408, "wall": 4537.5} {"step": 25438, "train_loss": 3.120364189147949, "lr": 6.566566594583372e-05, "tps": 367048, "wall": 4542.1} {"step": 25439, "train_loss": 3.3520944118499756, "lr": 6.56558075578362e-05, "tps": 366690, "wall": 4546.7} {"step": 25440, "train_loss": 3.230151653289795, "lr": 6.564595091825805e-05, "tps": 366335, "wall": 4551.3} {"step": 25441, "train_loss": 3.1548633575439453, "lr": 6.563609602721086e-05, "tps": 365978, "wall": 4555.9} {"step": 25442, "train_loss": 3.1877474784851074, "lr": 6.562624288480637e-05, "tps": 365610, "wall": 4560.7} {"step": 25443, "train_loss": 3.1595849990844727, "lr": 6.561639149115617e-05, "tps": 365251, "wall": 4565.3} {"step": 25444, "train_loss": 3.2294185161590576, "lr": 6.560654184637179e-05, "tps": 364896, "wall": 4570.0} {"step": 25445, "train_loss": 3.248991012573242, "lr": 6.559669395056487e-05, "tps": 364543, "wall": 4574.6} {"step": 25446, "train_loss": 3.2294180393218994, "lr": 6.558684780384693e-05, "tps": 364194, "wall": 4579.1} {"step": 25447, "train_loss": 3.157687187194824, "lr": 6.557700340632959e-05, "tps": 363849, "wall": 4583.7} {"step": 25448, "train_loss": 3.320117235183716, "lr": 6.55671607581243e-05, "tps": 363503, "wall": 4588.2} {"step": 25449, "train_loss": 3.221193790435791, "lr": 6.555731985934255e-05, "tps": 363157, "wall": 4592.7} {"step": 25450, "train_loss": 3.2044479846954346, "lr": 6.554748071009584e-05, "tps": 362808, "wall": 4597.4} {"step": 25451, "train_loss": 3.234166383743286, "lr": 6.553764331049563e-05, "tps": 362463, "wall": 4601.9} {"step": 25452, "train_loss": 3.1418073177337646, "lr": 6.552780766065333e-05, "tps": 362120, "wall": 4606.4} {"step": 25453, "train_loss": 3.1991450786590576, "lr": 6.55179737606804e-05, "tps": 361778, "wall": 4611.0} {"step": 25454, "train_loss": 3.2222213745117188, "lr": 6.550814161068822e-05, "tps": 361437, "wall": 4615.5} {"step": 25455, "train_loss": 3.109808921813965, "lr": 6.549831121078815e-05, "tps": 361097, "wall": 4620.0} {"step": 25456, "train_loss": 3.104865074157715, "lr": 6.54884825610916e-05, "tps": 360757, "wall": 4624.6} {"step": 25457, "train_loss": 3.1272218227386475, "lr": 6.547865566170987e-05, "tps": 360416, "wall": 4629.1} {"step": 25458, "train_loss": 3.2628531455993652, "lr": 6.546883051275428e-05, "tps": 360075, "wall": 4633.7} {"step": 25459, "train_loss": 3.1088671684265137, "lr": 6.545900711433615e-05, "tps": 359737, "wall": 4638.2} {"step": 25460, "train_loss": 3.146576166152954, "lr": 6.544918546656675e-05, "tps": 359398, "wall": 4642.8} {"step": 25461, "train_loss": 3.0629940032958984, "lr": 6.54393655695573e-05, "tps": 359062, "wall": 4647.3} {"step": 25462, "train_loss": 3.108269691467285, "lr": 6.542954742341912e-05, "tps": 358726, "wall": 4651.8} {"step": 25463, "train_loss": 3.1599831581115723, "lr": 6.541973102826336e-05, "tps": 358387, "wall": 4656.4} {"step": 25464, "train_loss": 3.121110200881958, "lr": 6.540991638420127e-05, "tps": 358050, "wall": 4661.0} {"step": 25465, "train_loss": 3.1876401901245117, "lr": 6.540010349134403e-05, "tps": 357696, "wall": 4665.8} {"step": 25466, "train_loss": 3.1986446380615234, "lr": 6.53902923498027e-05, "tps": 357338, "wall": 4670.7} {"step": 25467, "train_loss": 3.200470209121704, "lr": 6.538048295968857e-05, "tps": 356986, "wall": 4675.5} {"step": 25468, "train_loss": 3.175416946411133, "lr": 6.537067532111269e-05, "tps": 356634, "wall": 4680.2} {"step": 25469, "train_loss": 3.2181732654571533, "lr": 6.536086943418614e-05, "tps": 356281, "wall": 4685.1} {"step": 25470, "train_loss": 3.1489925384521484, "lr": 6.535106529902006e-05, "tps": 355924, "wall": 4690.0} {"step": 25471, "train_loss": 3.2466514110565186, "lr": 6.534126291572548e-05, "tps": 355574, "wall": 4694.7} {"step": 25472, "train_loss": 3.0895562171936035, "lr": 6.53314622844134e-05, "tps": 355229, "wall": 4699.5} {"step": 25473, "train_loss": 3.2336812019348145, "lr": 6.532166340519492e-05, "tps": 354869, "wall": 4704.4} {"step": 25474, "train_loss": 3.172227382659912, "lr": 6.5311866278181e-05, "tps": 354506, "wall": 4709.4} {"step": 25475, "train_loss": 3.1678240299224854, "lr": 6.530207090348258e-05, "tps": 354155, "wall": 4714.3} {"step": 25476, "train_loss": 3.1594552993774414, "lr": 6.529227728121073e-05, "tps": 353809, "wall": 4719.1} {"step": 25477, "train_loss": 3.223048686981201, "lr": 6.528248541147633e-05, "tps": 353462, "wall": 4723.9} {"step": 25478, "train_loss": 3.1390278339385986, "lr": 6.527269529439027e-05, "tps": 353110, "wall": 4728.8} {"step": 25479, "train_loss": 3.212216377258301, "lr": 6.52629069300635e-05, "tps": 352757, "wall": 4733.7} {"step": 25480, "train_loss": 3.1583681106567383, "lr": 6.52531203186069e-05, "tps": 352427, "wall": 4738.3} {"step": 25481, "train_loss": 3.2125661373138428, "lr": 6.524333546013131e-05, "tps": 352096, "wall": 4743.0} {"step": 25482, "train_loss": 3.0942986011505127, "lr": 6.523355235474761e-05, "tps": 351769, "wall": 4747.6} {"step": 25483, "train_loss": 3.2031683921813965, "lr": 6.522377100256656e-05, "tps": 351443, "wall": 4752.2} {"step": 25484, "train_loss": 3.2069997787475586, "lr": 6.521399140369904e-05, "tps": 351119, "wall": 4756.7} {"step": 25485, "train_loss": 3.2074575424194336, "lr": 6.520421355825582e-05, "tps": 350793, "wall": 4761.3} {"step": 25486, "train_loss": 3.0871965885162354, "lr": 6.51944374663476e-05, "tps": 350468, "wall": 4766.0} {"step": 25487, "train_loss": 3.0521774291992188, "lr": 6.518466312808519e-05, "tps": 350145, "wall": 4770.5} {"step": 25488, "train_loss": 3.1782476902008057, "lr": 6.51748905435793e-05, "tps": 349822, "wall": 4775.1} {"step": 25489, "train_loss": 3.2413434982299805, "lr": 6.516511971294059e-05, "tps": 349498, "wall": 4779.7} {"step": 25490, "train_loss": 3.166917324066162, "lr": 6.51553506362798e-05, "tps": 349177, "wall": 4784.3} {"step": 25491, "train_loss": 3.1905858516693115, "lr": 6.51455833137076e-05, "tps": 348853, "wall": 4789.0} {"step": 25492, "train_loss": 3.221031665802002, "lr": 6.513581774533457e-05, "tps": 348535, "wall": 4793.5} {"step": 25493, "train_loss": 3.1967241764068604, "lr": 6.51260539312714e-05, "tps": 348217, "wall": 4798.1} {"step": 25494, "train_loss": 3.201345443725586, "lr": 6.511629187162866e-05, "tps": 347899, "wall": 4802.7} {"step": 25495, "train_loss": 3.1779348850250244, "lr": 6.510653156651694e-05, "tps": 347580, "wall": 4807.2} {"step": 25496, "train_loss": 3.1103553771972656, "lr": 6.509677301604682e-05, "tps": 347258, "wall": 4811.9} {"step": 25497, "train_loss": 3.198357582092285, "lr": 6.508701622032884e-05, "tps": 346938, "wall": 4816.5} {"step": 25498, "train_loss": 3.107301712036133, "lr": 6.507726117947349e-05, "tps": 346623, "wall": 4821.1} {"step": 25499, "train_loss": 3.1146538257598877, "lr": 6.506750789359134e-05, "tps": 346311, "wall": 4825.6} {"step": 25500, "train_loss": 3.1903772354125977, "lr": 6.505775636279282e-05, "tps": 345998, "wall": 4830.2} {"step": 25501, "train_loss": 3.131875991821289, "lr": 6.504800658718843e-05, "tps": 345672, "wall": 4834.9} {"step": 25502, "train_loss": 3.2334136962890625, "lr": 6.503825856688861e-05, "tps": 345359, "wall": 4839.5} {"step": 25503, "train_loss": 3.176316261291504, "lr": 6.502851230200376e-05, "tps": 345049, "wall": 4844.0} {"step": 25504, "train_loss": 3.1712751388549805, "lr": 6.501876779264432e-05, "tps": 344740, "wall": 4848.6} {"step": 25505, "train_loss": 3.024160385131836, "lr": 6.500902503892069e-05, "tps": 344423, "wall": 4853.2} {"step": 25506, "train_loss": 3.1526594161987305, "lr": 6.499928404094316e-05, "tps": 344108, "wall": 4857.9} {"step": 25507, "train_loss": 3.234982490539551, "lr": 6.498954479882214e-05, "tps": 343793, "wall": 4862.5} {"step": 25508, "train_loss": 3.318268299102783, "lr": 6.497980731266797e-05, "tps": 343482, "wall": 4867.1} {"step": 25509, "train_loss": 3.1349315643310547, "lr": 6.49700715825909e-05, "tps": 343172, "wall": 4871.7} {"step": 25510, "train_loss": 3.1994595527648926, "lr": 6.496033760870125e-05, "tps": 342863, "wall": 4876.3} {"step": 25511, "train_loss": 3.275940418243408, "lr": 6.49506053911093e-05, "tps": 342559, "wall": 4880.8} {"step": 25512, "train_loss": 3.219529151916504, "lr": 6.494087492992526e-05, "tps": 342256, "wall": 4885.3} {"step": 25513, "train_loss": 3.1378026008605957, "lr": 6.493114622525939e-05, "tps": 341949, "wall": 4889.9} {"step": 25514, "train_loss": 3.208421230316162, "lr": 6.49214192772219e-05, "tps": 341638, "wall": 4894.5} {"step": 25515, "train_loss": 3.229355812072754, "lr": 6.491169408592291e-05, "tps": 341306, "wall": 4899.5} {"step": 25516, "train_loss": 3.21836256980896, "lr": 6.490197065147269e-05, "tps": 340981, "wall": 4904.3} {"step": 25517, "train_loss": 3.2443161010742188, "lr": 6.489224897398128e-05, "tps": 340656, "wall": 4909.2} {"step": 25518, "train_loss": 3.1495232582092285, "lr": 6.488252905355893e-05, "tps": 340332, "wall": 4914.1} {"step": 25519, "train_loss": 3.19411039352417, "lr": 6.487281089031567e-05, "tps": 340012, "wall": 4918.9} {"step": 25520, "train_loss": 3.2153220176696777, "lr": 6.486309448436156e-05, "tps": 339687, "wall": 4923.8} {"step": 25521, "train_loss": 3.2552714347839355, "lr": 6.485337983580674e-05, "tps": 339363, "wall": 4928.7} {"step": 25522, "train_loss": 3.269365072250366, "lr": 6.484366694476125e-05, "tps": 339059, "wall": 4933.3} {"step": 25523, "train_loss": 3.1135241985321045, "lr": 6.483395581133505e-05, "tps": 338759, "wall": 4937.8} {"step": 25524, "train_loss": 3.271122694015503, "lr": 6.48242464356382e-05, "tps": 338454, "wall": 4942.5} {"step": 25525, "train_loss": 3.0646536350250244, "lr": 6.481453881778071e-05, "tps": 338150, "wall": 4947.1} {"step": 25526, "train_loss": 3.2095894813537598, "lr": 6.480483295787247e-05, "tps": 337845, "wall": 4951.8} {"step": 25501, "train_loss": 3.0701308250427246, "lr": 6.504800658718843e-05, "tps": 377437475, "wall": 4.4} {"step": 25502, "train_loss": 3.09199857711792, "lr": 6.503825856688861e-05, "tps": 199915178, "wall": 8.4} {"step": 25503, "train_loss": 3.102029800415039, "lr": 6.502851230200376e-05, "tps": 135059444, "wall": 12.4} {"step": 25504, "train_loss": 3.1562578678131104, "lr": 6.501876779264432e-05, "tps": 100652729, "wall": 16.6} {"step": 25505, "train_loss": 3.046208381652832, "lr": 6.500902503892069e-05, "tps": 79970775, "wall": 20.9} {"step": 25506, "train_loss": 3.0536367893218994, "lr": 6.499928404094316e-05, "tps": 66066490, "wall": 25.3} {"step": 25507, "train_loss": 3.0756607055664062, "lr": 6.498954479882214e-05, "tps": 56485703, "wall": 29.6} {"step": 25508, "train_loss": 3.157334089279175, "lr": 6.497980731266797e-05, "tps": 49306636, "wall": 33.9} {"step": 25509, "train_loss": 3.129457950592041, "lr": 6.49700715825909e-05, "tps": 43713364, "wall": 38.2} {"step": 25510, "train_loss": 3.161862373352051, "lr": 6.496033760870125e-05, "tps": 39273600, "wall": 42.6} {"step": 25511, "train_loss": 3.060063362121582, "lr": 6.49506053911093e-05, "tps": 35642083, "wall": 46.9} {"step": 25512, "train_loss": 3.1296119689941406, "lr": 6.494087492992526e-05, "tps": 32620589, "wall": 51.3} {"step": 25513, "train_loss": 3.020439624786377, "lr": 6.493114622525939e-05, "tps": 30030521, "wall": 55.7} {"step": 25514, "train_loss": 3.065746307373047, "lr": 6.49214192772219e-05, "tps": 27808061, "wall": 60.1} {"step": 25515, "train_loss": 3.231647253036499, "lr": 6.491169408592291e-05, "tps": 25905714, "wall": 64.6} {"step": 25516, "train_loss": 3.1327011585235596, "lr": 6.490197065147269e-05, "tps": 24200246, "wall": 69.1} {"step": 25517, "train_loss": 3.0565125942230225, "lr": 6.489224897398128e-05, "tps": 22735529, "wall": 73.6} {"step": 25518, "train_loss": 3.158579111099243, "lr": 6.488252905355893e-05, "tps": 21391420, "wall": 78.2} {"step": 25519, "train_loss": 3.1274707317352295, "lr": 6.487281089031567e-05, "tps": 20189799, "wall": 82.8} {"step": 25520, "train_loss": 3.106353282928467, "lr": 6.486309448436156e-05, "tps": 19123364, "wall": 87.5} {"step": 25521, "train_loss": 3.193451404571533, "lr": 6.485337983580674e-05, "tps": 18171315, "wall": 92.0} {"step": 25522, "train_loss": 3.1759557723999023, "lr": 6.484366694476125e-05, "tps": 17301927, "wall": 96.7} {"step": 25523, "train_loss": 3.0884482860565186, "lr": 6.483395581133505e-05, "tps": 16508968, "wall": 101.3} {"step": 25524, "train_loss": 3.0500328540802, "lr": 6.48242464356382e-05, "tps": 15787823, "wall": 106.0} {"step": 25525, "train_loss": 3.0771985054016113, "lr": 6.481453881778071e-05, "tps": 15133327, "wall": 110.5} {"step": 25526, "train_loss": 2.9705119132995605, "lr": 6.480483295787247e-05, "tps": 14528504, "wall": 115.1} {"step": 25527, "train_loss": 3.0820086002349854, "lr": 6.479512885602353e-05, "tps": 13966521, "wall": 119.8} {"step": 25528, "train_loss": 3.1995418071746826, "lr": 6.478542651234375e-05, "tps": 13452092, "wall": 124.4} {"step": 25529, "train_loss": 3.090555429458618, "lr": 6.477572592694304e-05, "tps": 12980421, "wall": 128.9} {"step": 25530, "train_loss": 3.1174676418304443, "lr": 6.476602709993133e-05, "tps": 12531479, "wall": 133.5} {"step": 25531, "train_loss": 3.078930139541626, "lr": 6.475633003141846e-05, "tps": 12110951, "wall": 138.2} {"step": 25532, "train_loss": 3.131831169128418, "lr": 6.474663472151425e-05, "tps": 11721488, "wall": 142.8} {"step": 25533, "train_loss": 3.127051830291748, "lr": 6.473694117032857e-05, "tps": 11357781, "wall": 147.3} {"step": 25534, "train_loss": 2.994100332260132, "lr": 6.472724937797125e-05, "tps": 11012129, "wall": 152.0} {"step": 25535, "train_loss": 3.14444637298584, "lr": 6.471755934455201e-05, "tps": 10686464, "wall": 156.6} {"step": 25536, "train_loss": 3.0985283851623535, "lr": 6.470787107018068e-05, "tps": 10379476, "wall": 161.2} {"step": 25537, "train_loss": 3.1486496925354004, "lr": 6.469818455496697e-05, "tps": 10090397, "wall": 165.9} {"step": 25538, "train_loss": 3.093848705291748, "lr": 6.468849979902067e-05, "tps": 9816827, "wall": 170.5} {"step": 25539, "train_loss": 3.0415399074554443, "lr": 6.467881680245142e-05, "tps": 9557678, "wall": 175.1} {"step": 25540, "train_loss": 3.0744056701660156, "lr": 6.466913556536892e-05, "tps": 9312639, "wall": 179.7} {"step": 25541, "train_loss": 3.068307876586914, "lr": 6.465945608788288e-05, "tps": 9079615, "wall": 184.4} {"step": 25542, "train_loss": 3.159360408782959, "lr": 6.464977837010293e-05, "tps": 8858291, "wall": 189.0} {"step": 25543, "train_loss": 2.990619659423828, "lr": 6.46401024121387e-05, "tps": 8645926, "wall": 193.6} {"step": 25544, "train_loss": 3.1747419834136963, "lr": 6.463042821409977e-05, "tps": 8444099, "wall": 198.3} {"step": 25545, "train_loss": 3.023693323135376, "lr": 6.462075577609573e-05, "tps": 8255865, "wall": 202.8} {"step": 25546, "train_loss": 3.181943655014038, "lr": 6.461108509823622e-05, "tps": 8076945, "wall": 207.3} {"step": 25547, "train_loss": 2.966526746749878, "lr": 6.460141618063076e-05, "tps": 7908069, "wall": 211.7} {"step": 25548, "train_loss": 3.130790948867798, "lr": 6.459174902338881e-05, "tps": 7746216, "wall": 216.2} {"step": 25549, "train_loss": 3.193635940551758, "lr": 6.458208362661996e-05, "tps": 7589651, "wall": 220.6} {"step": 25550, "train_loss": 3.114901065826416, "lr": 6.457241999043371e-05, "tps": 7431964, "wall": 225.3} {"step": 25551, "train_loss": 3.0129458904266357, "lr": 6.456275811493942e-05, "tps": 7282144, "wall": 230.0} {"step": 25552, "train_loss": 3.128589630126953, "lr": 6.455309800024667e-05, "tps": 7137282, "wall": 234.6} {"step": 25553, "train_loss": 3.153477430343628, "lr": 6.45434396464648e-05, "tps": 6997673, "wall": 239.3} {"step": 25554, "train_loss": 3.1037676334381104, "lr": 6.453378305370327e-05, "tps": 6864189, "wall": 244.0} {"step": 25555, "train_loss": 3.0687453746795654, "lr": 6.452412822207148e-05, "tps": 6736420, "wall": 248.6} {"step": 25556, "train_loss": 3.0364279747009277, "lr": 6.451447515167876e-05, "tps": 6612807, "wall": 253.3} {"step": 25557, "train_loss": 3.132859230041504, "lr": 6.450482384263446e-05, "tps": 6493643, "wall": 257.9} {"step": 25558, "train_loss": 3.1268038749694824, "lr": 6.449517429504794e-05, "tps": 6378585, "wall": 262.6} {"step": 25559, "train_loss": 3.1169989109039307, "lr": 6.448552650902852e-05, "tps": 6267688, "wall": 267.3} {"step": 25560, "train_loss": 3.2218856811523438, "lr": 6.447588048468541e-05, "tps": 6160762, "wall": 271.9} {"step": 25561, "train_loss": 3.142861843109131, "lr": 6.446623622212802e-05, "tps": 6056956, "wall": 276.6} {"step": 25562, "train_loss": 3.096668243408203, "lr": 6.445659372146545e-05, "tps": 5956658, "wall": 281.2} {"step": 25563, "train_loss": 3.1634793281555176, "lr": 6.444695298280703e-05, "tps": 5862295, "wall": 285.8} {"step": 25564, "train_loss": 3.092761516571045, "lr": 6.443731400626196e-05, "tps": 5773501, "wall": 290.2} {"step": 25565, "train_loss": 3.1067261695861816, "lr": 6.442767679193937e-05, "tps": 5687074, "wall": 294.6} {"step": 25566, "train_loss": 3.164551258087158, "lr": 6.44180413399485e-05, "tps": 5602546, "wall": 299.1} {"step": 25567, "train_loss": 3.2085697650909424, "lr": 6.44084076503985e-05, "tps": 5521452, "wall": 303.5} {"step": 25568, "train_loss": 3.090481758117676, "lr": 6.43987757233984e-05, "tps": 5442805, "wall": 307.9} {"step": 25569, "train_loss": 3.0033178329467773, "lr": 6.438914555905747e-05, "tps": 5366185, "wall": 312.3} {"step": 25570, "train_loss": 3.211635112762451, "lr": 6.437951715748468e-05, "tps": 5291562, "wall": 316.7} {"step": 25571, "train_loss": 3.1200027465820312, "lr": 6.436989051878911e-05, "tps": 5219371, "wall": 321.1} {"step": 25572, "train_loss": 3.0975756645202637, "lr": 6.43602656430799e-05, "tps": 5148846, "wall": 325.5} {"step": 25573, "train_loss": 3.134305953979492, "lr": 6.435064253046601e-05, "tps": 5080143, "wall": 329.9} {"step": 25574, "train_loss": 3.0475056171417236, "lr": 6.43410211810564e-05, "tps": 5013196, "wall": 334.3} {"step": 25575, "train_loss": 3.1063425540924072, "lr": 6.433140159496019e-05, "tps": 4948245, "wall": 338.7} {"step": 25576, "train_loss": 3.15313982963562, "lr": 6.432178377228629e-05, "tps": 4884859, "wall": 343.1} {"step": 25577, "train_loss": 3.123682975769043, "lr": 6.431216771314357e-05, "tps": 4822898, "wall": 347.6} {"step": 25578, "train_loss": 3.123138189315796, "lr": 6.43025534176411e-05, "tps": 4762677, "wall": 352.0} {"step": 25579, "train_loss": 3.2134451866149902, "lr": 6.429294088588768e-05, "tps": 4703774, "wall": 356.4} {"step": 25580, "train_loss": 3.061309814453125, "lr": 6.42833301179923e-05, "tps": 4645719, "wall": 360.9} {"step": 25581, "train_loss": 3.1423473358154297, "lr": 6.427372111406375e-05, "tps": 4589503, "wall": 365.3} {"step": 25582, "train_loss": 3.0965383052825928, "lr": 6.426411387421092e-05, "tps": 4534762, "wall": 369.7} {"step": 25583, "train_loss": 3.0690717697143555, "lr": 6.425450839854264e-05, "tps": 4481302, "wall": 374.1} {"step": 25584, "train_loss": 3.10776424407959, "lr": 6.424490468716771e-05, "tps": 4429049, "wall": 378.6} {"step": 25585, "train_loss": 3.1657896041870117, "lr": 6.423530274019492e-05, "tps": 4378013, "wall": 383.0} {"step": 25586, "train_loss": 3.116504192352295, "lr": 6.422570255773308e-05, "tps": 4328100, "wall": 387.4} {"step": 25587, "train_loss": 3.100822687149048, "lr": 6.421610413989087e-05, "tps": 4278983, "wall": 391.9} {"step": 25588, "train_loss": 3.1179187297821045, "lr": 6.420650748677706e-05, "tps": 4231376, "wall": 396.3} {"step": 25589, "train_loss": 3.11494517326355, "lr": 6.419691259850038e-05, "tps": 4184862, "wall": 400.7} {"step": 25590, "train_loss": 3.09588885307312, "lr": 6.41873194751695e-05, "tps": 4139136, "wall": 405.2} {"step": 25591, "train_loss": 3.026151180267334, "lr": 6.417772811689306e-05, "tps": 4094274, "wall": 409.6} {"step": 25592, "train_loss": 3.1616311073303223, "lr": 6.416813852377978e-05, "tps": 4050500, "wall": 414.1} {"step": 25593, "train_loss": 3.1344876289367676, "lr": 6.415855069593829e-05, "tps": 4007115, "wall": 418.6} {"step": 25594, "train_loss": 3.144810676574707, "lr": 6.414896463347711e-05, "tps": 3965395, "wall": 423.0} {"step": 25595, "train_loss": 3.065290689468384, "lr": 6.413938033650493e-05, "tps": 3924433, "wall": 427.4} {"step": 25596, "train_loss": 3.113436222076416, "lr": 6.412979780513022e-05, "tps": 3884285, "wall": 431.9} {"step": 25597, "train_loss": 3.1025075912475586, "lr": 6.412021703946166e-05, "tps": 3844623, "wall": 436.3} {"step": 25598, "train_loss": 3.15755033493042, "lr": 6.411063803960769e-05, "tps": 3806258, "wall": 440.8} {"step": 25599, "train_loss": 3.182722806930542, "lr": 6.410106080567682e-05, "tps": 3768388, "wall": 445.2} {"step": 25600, "train_loss": 3.103536367416382, "lr": 6.409148533777762e-05, "tps": 3731298, "wall": 449.7} {"step": 25601, "train_loss": 2.984309673309326, "lr": 6.408191163601849e-05, "tps": 3694973, "wall": 454.1} {"step": 25602, "train_loss": 3.028573751449585, "lr": 6.407233970050785e-05, "tps": 3659427, "wall": 458.5} {"step": 25603, "train_loss": 3.0460567474365234, "lr": 6.406276953135425e-05, "tps": 3624398, "wall": 463.0} {"step": 25604, "train_loss": 3.013509511947632, "lr": 6.405320112866603e-05, "tps": 3590069, "wall": 467.4} {"step": 25605, "train_loss": 3.067694664001465, "lr": 6.404363449255151e-05, "tps": 3556445, "wall": 471.9} {"step": 25606, "train_loss": 3.1395416259765625, "lr": 6.403406962311922e-05, "tps": 3523332, "wall": 476.3} {"step": 25607, "train_loss": 3.0299997329711914, "lr": 6.40245065204774e-05, "tps": 3490593, "wall": 480.8} {"step": 25608, "train_loss": 3.188906669616699, "lr": 6.401494518473438e-05, "tps": 3458712, "wall": 485.2} {"step": 25609, "train_loss": 3.073190212249756, "lr": 6.400538561599853e-05, "tps": 3427559, "wall": 489.7} {"step": 25610, "train_loss": 3.0786380767822266, "lr": 6.399582781437812e-05, "tps": 3396988, "wall": 494.1} {"step": 25611, "train_loss": 3.068251132965088, "lr": 6.398627177998137e-05, "tps": 3366921, "wall": 498.5} {"step": 25612, "train_loss": 3.087226390838623, "lr": 6.39767175129166e-05, "tps": 3337364, "wall": 503.0} {"step": 25613, "train_loss": 3.0980281829833984, "lr": 6.396716501329203e-05, "tps": 3308312, "wall": 507.4} {"step": 25614, "train_loss": 3.072251796722412, "lr": 6.395761428121582e-05, "tps": 3279749, "wall": 511.8} {"step": 25615, "train_loss": 3.0986506938934326, "lr": 6.394806531679621e-05, "tps": 3251555, "wall": 516.3} {"step": 25616, "train_loss": 3.103090286254883, "lr": 6.393851812014134e-05, "tps": 3223980, "wall": 520.7} {"step": 25617, "train_loss": 3.1009161472320557, "lr": 6.392897269135943e-05, "tps": 3196844, "wall": 525.2} {"step": 25618, "train_loss": 3.0483226776123047, "lr": 6.391942903055855e-05, "tps": 3170168, "wall": 529.6} {"step": 25619, "train_loss": 3.172403573989868, "lr": 6.390988713784677e-05, "tps": 3143882, "wall": 534.1} {"step": 25620, "train_loss": 3.164799213409424, "lr": 6.390034701333228e-05, "tps": 3117529, "wall": 538.6} {"step": 25621, "train_loss": 3.087291955947876, "lr": 6.38908086571231e-05, "tps": 3092335, "wall": 543.0} {"step": 25622, "train_loss": 3.134730815887451, "lr": 6.388127206932727e-05, "tps": 3067364, "wall": 547.5} {"step": 25623, "train_loss": 3.09377384185791, "lr": 6.387173725005285e-05, "tps": 3042788, "wall": 551.9} {"step": 25624, "train_loss": 3.0696511268615723, "lr": 6.386220419940784e-05, "tps": 3018519, "wall": 556.4} {"step": 25625, "train_loss": 3.0989010334014893, "lr": 6.385267291750019e-05, "tps": 2994751, "wall": 560.8} {"step": 25626, "train_loss": 3.0456762313842773, "lr": 6.384314340443796e-05, "tps": 2971283, "wall": 565.2} {"step": 25627, "train_loss": 3.1447744369506836, "lr": 6.383361566032903e-05, "tps": 2948189, "wall": 569.7} {"step": 25628, "train_loss": 3.123047113418579, "lr": 6.382408968528133e-05, "tps": 2925505, "wall": 574.1} {"step": 25629, "train_loss": 3.086385726928711, "lr": 6.381456547940281e-05, "tps": 2902839, "wall": 578.6} {"step": 25630, "train_loss": 3.1295721530914307, "lr": 6.380504304280135e-05, "tps": 2880671, "wall": 583.1} {"step": 25631, "train_loss": 3.089245319366455, "lr": 6.379552237558477e-05, "tps": 2859014, "wall": 587.6} {"step": 25632, "train_loss": 3.171912908554077, "lr": 6.378600347786101e-05, "tps": 2837701, "wall": 592.0} {"step": 25633, "train_loss": 3.0016589164733887, "lr": 6.377648634973782e-05, "tps": 2816704, "wall": 596.4} {"step": 25634, "train_loss": 3.0055580139160156, "lr": 6.376697099132307e-05, "tps": 2795796, "wall": 600.9} {"step": 25635, "train_loss": 2.9816720485687256, "lr": 6.375745740272452e-05, "tps": 2775390, "wall": 605.3} {"step": 25636, "train_loss": 3.2231338024139404, "lr": 6.374794558404993e-05, "tps": 2755323, "wall": 609.8} {"step": 25637, "train_loss": 3.126383066177368, "lr": 6.373843553540709e-05, "tps": 2735449, "wall": 614.2} {"step": 25638, "train_loss": 3.016481637954712, "lr": 6.372892725690369e-05, "tps": 2715956, "wall": 618.7} {"step": 25639, "train_loss": 3.2181057929992676, "lr": 6.371942074864743e-05, "tps": 2696706, "wall": 623.1} {"step": 25640, "train_loss": 3.0106682777404785, "lr": 6.370991601074608e-05, "tps": 2677745, "wall": 627.5} {"step": 25641, "train_loss": 3.1116812229156494, "lr": 6.370041304330726e-05, "tps": 2659046, "wall": 632.0} {"step": 25642, "train_loss": 3.0834150314331055, "lr": 6.369091184643853e-05, "tps": 2640580, "wall": 636.4} {"step": 25643, "train_loss": 3.1669247150421143, "lr": 6.36814124202477e-05, "tps": 2622388, "wall": 640.9} {"step": 25644, "train_loss": 3.217268466949463, "lr": 6.367191476484228e-05, "tps": 2604390, "wall": 645.3} {"step": 25645, "train_loss": 3.1182966232299805, "lr": 6.366241888032981e-05, "tps": 2586654, "wall": 649.8} {"step": 25646, "train_loss": 3.0321972370147705, "lr": 6.365292476681794e-05, "tps": 2569166, "wall": 654.2} {"step": 25647, "train_loss": 3.0847043991088867, "lr": 6.364343242441422e-05, "tps": 2551696, "wall": 658.7} {"step": 25648, "train_loss": 3.118837356567383, "lr": 6.363394185322613e-05, "tps": 2534752, "wall": 663.2} {"step": 25649, "train_loss": 3.129546642303467, "lr": 6.362445305336122e-05, "tps": 2517944, "wall": 667.6} {"step": 25650, "train_loss": 2.9921727180480957, "lr": 6.361496602492693e-05, "tps": 2501361, "wall": 672.1} {"step": 25651, "train_loss": 3.07886004447937, "lr": 6.360548076803081e-05, "tps": 2484991, "wall": 676.5} {"step": 25652, "train_loss": 3.1124496459960938, "lr": 6.359599728278026e-05, "tps": 2468905, "wall": 680.9} {"step": 25653, "train_loss": 3.164285659790039, "lr": 6.358651556928268e-05, "tps": 2452970, "wall": 685.4} {"step": 25654, "train_loss": 3.101274251937866, "lr": 6.357703562764555e-05, "tps": 2437266, "wall": 689.8} {"step": 25655, "train_loss": 3.037714958190918, "lr": 6.356755745797622e-05, "tps": 2421744, "wall": 694.3} {"step": 25656, "train_loss": 3.0934481620788574, "lr": 6.355808106038203e-05, "tps": 2406467, "wall": 698.7} {"step": 25657, "train_loss": 3.0634539127349854, "lr": 6.35486064349704e-05, "tps": 2391319, "wall": 703.2} {"step": 25658, "train_loss": 3.1573853492736816, "lr": 6.353913358184862e-05, "tps": 2376375, "wall": 707.6} {"step": 25659, "train_loss": 3.061953067779541, "lr": 6.352966250112396e-05, "tps": 2361627, "wall": 712.1} {"step": 25660, "train_loss": 3.11357045173645, "lr": 6.352019319290376e-05, "tps": 2347037, "wall": 716.5} {"step": 25661, "train_loss": 3.240859270095825, "lr": 6.351072565729533e-05, "tps": 2332494, "wall": 721.0} {"step": 25662, "train_loss": 3.0152440071105957, "lr": 6.350125989440579e-05, "tps": 2318289, "wall": 725.5} {"step": 25663, "train_loss": 3.1231071949005127, "lr": 6.349179590434248e-05, "tps": 2304288, "wall": 729.9} {"step": 25664, "train_loss": 3.03629469871521, "lr": 6.348233368721259e-05, "tps": 2290422, "wall": 734.4} {"step": 25665, "train_loss": 3.0852534770965576, "lr": 6.347287324312326e-05, "tps": 2276738, "wall": 738.8} {"step": 25666, "train_loss": 3.2183704376220703, "lr": 6.34634145721817e-05, "tps": 2263182, "wall": 743.3} {"step": 25667, "train_loss": 2.990178346633911, "lr": 6.345395767449506e-05, "tps": 2249825, "wall": 747.7} {"step": 25668, "train_loss": 2.976907730102539, "lr": 6.344450255017042e-05, "tps": 2236600, "wall": 752.1} {"step": 25669, "train_loss": 3.022357940673828, "lr": 6.343504919931496e-05, "tps": 2223553, "wall": 756.6} {"step": 25670, "train_loss": 3.1170012950897217, "lr": 6.34255976220357e-05, "tps": 2210625, "wall": 761.0} {"step": 25671, "train_loss": 3.13248348236084, "lr": 6.341614781843978e-05, "tps": 2197886, "wall": 765.5} {"step": 25672, "train_loss": 3.1722207069396973, "lr": 6.340669978863421e-05, "tps": 2185281, "wall": 769.9} {"step": 25673, "train_loss": 2.9898314476013184, "lr": 6.339725353272599e-05, "tps": 2172819, "wall": 774.4} {"step": 25674, "train_loss": 3.098743200302124, "lr": 6.338780905082215e-05, "tps": 2160364, "wall": 778.9} {"step": 25675, "train_loss": 3.2252557277679443, "lr": 6.337836634302971e-05, "tps": 2148209, "wall": 783.3} {"step": 25676, "train_loss": 3.076587677001953, "lr": 6.336892540945558e-05, "tps": 2136179, "wall": 787.7} {"step": 25677, "train_loss": 3.1074323654174805, "lr": 6.335948625020675e-05, "tps": 2124259, "wall": 792.2} {"step": 25678, "train_loss": 3.08097505569458, "lr": 6.335004886539015e-05, "tps": 2112493, "wall": 796.6} {"step": 25679, "train_loss": 3.0810201168060303, "lr": 6.334061325511265e-05, "tps": 2100869, "wall": 801.1} {"step": 25680, "train_loss": 3.022674798965454, "lr": 6.333117941948116e-05, "tps": 2089373, "wall": 805.5} {"step": 25681, "train_loss": 3.184826374053955, "lr": 6.332174735860256e-05, "tps": 2078009, "wall": 810.0} {"step": 25682, "train_loss": 3.031676769256592, "lr": 6.331231707258366e-05, "tps": 2066756, "wall": 814.4} {"step": 25683, "train_loss": 3.15873384475708, "lr": 6.330288856153132e-05, "tps": 2055627, "wall": 818.8} {"step": 25684, "train_loss": 3.1125006675720215, "lr": 6.329346182555235e-05, "tps": 2044600, "wall": 823.3} {"step": 25685, "train_loss": 3.1402599811553955, "lr": 6.328403686475348e-05, "tps": 2033696, "wall": 827.7} {"step": 25686, "train_loss": 3.1798832416534424, "lr": 6.327461367924157e-05, "tps": 2022882, "wall": 832.2} {"step": 25687, "train_loss": 3.1333751678466797, "lr": 6.326519226912327e-05, "tps": 2012179, "wall": 836.6} {"step": 25688, "train_loss": 3.150552272796631, "lr": 6.325577263450537e-05, "tps": 2001497, "wall": 841.1} {"step": 25689, "train_loss": 3.1000890731811523, "lr": 6.324635477549457e-05, "tps": 1991029, "wall": 845.6} {"step": 25690, "train_loss": 2.987194776535034, "lr": 6.323693869219753e-05, "tps": 1980676, "wall": 850.1} {"step": 25691, "train_loss": 3.2022836208343506, "lr": 6.322752438472093e-05, "tps": 1970440, "wall": 854.5} {"step": 25692, "train_loss": 3.0203447341918945, "lr": 6.321811185317144e-05, "tps": 1960320, "wall": 858.9} {"step": 25693, "train_loss": 2.9863858222961426, "lr": 6.32087010976556e-05, "tps": 1950285, "wall": 863.4} {"step": 25694, "train_loss": 3.075235605239868, "lr": 6.319929211828013e-05, "tps": 1940388, "wall": 867.8} {"step": 25695, "train_loss": 3.0956711769104004, "lr": 6.318988491515157e-05, "tps": 1930559, "wall": 872.3} {"step": 25696, "train_loss": 3.1537749767303467, "lr": 6.318047948837641e-05, "tps": 1920798, "wall": 876.8} {"step": 25697, "train_loss": 3.008678436279297, "lr": 6.317107583806132e-05, "tps": 1911182, "wall": 881.2} {"step": 25698, "train_loss": 3.075772762298584, "lr": 6.316167396431279e-05, "tps": 1901662, "wall": 885.7} {"step": 25699, "train_loss": 3.162233352661133, "lr": 6.31522738672372e-05, "tps": 1892234, "wall": 890.1} {"step": 25700, "train_loss": 3.156374931335449, "lr": 6.314287554694125e-05, "tps": 1882903, "wall": 894.5} {"step": 25701, "train_loss": 3.1654865741729736, "lr": 6.313347900353124e-05, "tps": 1873545, "wall": 899.0} {"step": 25702, "train_loss": 3.1178481578826904, "lr": 6.312408423711365e-05, "tps": 1864387, "wall": 903.5} {"step": 25703, "train_loss": 3.1029133796691895, "lr": 6.311469124779493e-05, "tps": 1855318, "wall": 908.0} {"step": 25704, "train_loss": 3.0306878089904785, "lr": 6.310530003568147e-05, "tps": 1846321, "wall": 912.4} {"step": 25705, "train_loss": 3.050630569458008, "lr": 6.30959106008797e-05, "tps": 1837407, "wall": 916.9} {"step": 25706, "train_loss": 3.1180615425109863, "lr": 6.308652294349592e-05, "tps": 1828589, "wall": 921.3} {"step": 25707, "train_loss": 3.070861339569092, "lr": 6.307713706363647e-05, "tps": 1819864, "wall": 925.8} {"step": 25708, "train_loss": 3.0015511512756348, "lr": 6.306775296140773e-05, "tps": 1811244, "wall": 930.2} {"step": 25709, "train_loss": 3.104750871658325, "lr": 6.305837063691599e-05, "tps": 1802654, "wall": 934.7} {"step": 25710, "train_loss": 3.0153095722198486, "lr": 6.304899009026751e-05, "tps": 1794186, "wall": 939.1} {"step": 25711, "train_loss": 3.0530030727386475, "lr": 6.303961132156857e-05, "tps": 1785797, "wall": 943.6} {"step": 25712, "train_loss": 3.0306034088134766, "lr": 6.303023433092534e-05, "tps": 1777478, "wall": 948.0} {"step": 25713, "train_loss": 3.1002111434936523, "lr": 6.302085911844417e-05, "tps": 1769231, "wall": 952.5} {"step": 25714, "train_loss": 3.094738721847534, "lr": 6.301148568423119e-05, "tps": 1761066, "wall": 957.0} {"step": 25715, "train_loss": 3.1583523750305176, "lr": 6.300211402839257e-05, "tps": 1752925, "wall": 961.4} {"step": 25716, "train_loss": 3.1214945316314697, "lr": 6.299274415103452e-05, "tps": 1744912, "wall": 965.9} {"step": 25717, "train_loss": 3.0608325004577637, "lr": 6.298337605226314e-05, "tps": 1736965, "wall": 970.3} {"step": 25718, "train_loss": 3.059244394302368, "lr": 6.297400973218456e-05, "tps": 1729095, "wall": 974.8} {"step": 25719, "train_loss": 3.055687427520752, "lr": 6.296464519090492e-05, "tps": 1721302, "wall": 979.3} {"step": 25720, "train_loss": 3.1497721672058105, "lr": 6.295528242853027e-05, "tps": 1713593, "wall": 983.7} {"step": 25721, "train_loss": 3.1120107173919678, "lr": 6.294592144516666e-05, "tps": 1705928, "wall": 988.2} {"step": 25722, "train_loss": 3.170635223388672, "lr": 6.293656224092017e-05, "tps": 1698359, "wall": 992.6} {"step": 25723, "train_loss": 3.094259262084961, "lr": 6.292720481589682e-05, "tps": 1690839, "wall": 997.0} {"step": 25724, "train_loss": 3.1178669929504395, "lr": 6.291784917020252e-05, "tps": 1683386, "wall": 1001.5} {"step": 25725, "train_loss": 3.1824915409088135, "lr": 6.290849530394338e-05, "tps": 1676000, "wall": 1006.0} {"step": 25726, "train_loss": 3.0756301879882812, "lr": 6.289914321722529e-05, "tps": 1668659, "wall": 1010.4} {"step": 25727, "train_loss": 2.9875946044921875, "lr": 6.288979291015417e-05, "tps": 1661404, "wall": 1014.9} {"step": 25728, "train_loss": 3.1196179389953613, "lr": 6.288044438283602e-05, "tps": 1654103, "wall": 1019.4} {"step": 25729, "train_loss": 3.156850576400757, "lr": 6.287109763537666e-05, "tps": 1646998, "wall": 1023.8} {"step": 25730, "train_loss": 3.0207200050354004, "lr": 6.286175266788206e-05, "tps": 1639917, "wall": 1028.3} {"step": 25731, "train_loss": 3.071784019470215, "lr": 6.285240948045799e-05, "tps": 1632900, "wall": 1032.7} {"step": 25732, "train_loss": 3.0276522636413574, "lr": 6.284306807321033e-05, "tps": 1625956, "wall": 1037.2} {"step": 25733, "train_loss": 3.0907392501831055, "lr": 6.283372844624489e-05, "tps": 1619075, "wall": 1041.6} {"step": 25734, "train_loss": 3.1733622550964355, "lr": 6.282439059966751e-05, "tps": 1612245, "wall": 1046.1} {"step": 25735, "train_loss": 3.060892343521118, "lr": 6.28150545335839e-05, "tps": 1605476, "wall": 1050.6} {"step": 25736, "train_loss": 3.0579822063446045, "lr": 6.280572024809987e-05, "tps": 1598755, "wall": 1055.0} {"step": 25737, "train_loss": 3.125222682952881, "lr": 6.279638774332116e-05, "tps": 1592099, "wall": 1059.5} {"step": 25738, "train_loss": 3.1491262912750244, "lr": 6.278705701935343e-05, "tps": 1585467, "wall": 1063.9} {"step": 25739, "train_loss": 3.0595803260803223, "lr": 6.277772807630247e-05, "tps": 1578927, "wall": 1068.4} {"step": 25740, "train_loss": 3.1351466178894043, "lr": 6.276840091427391e-05, "tps": 1572452, "wall": 1072.8} {"step": 25741, "train_loss": 3.0553579330444336, "lr": 6.275907553337335e-05, "tps": 1565944, "wall": 1077.3} {"step": 25742, "train_loss": 3.0941193103790283, "lr": 6.274975193370656e-05, "tps": 1559536, "wall": 1081.8} {"step": 25743, "train_loss": 3.1005024909973145, "lr": 6.274043011537906e-05, "tps": 1553186, "wall": 1086.3} {"step": 25744, "train_loss": 3.0781421661376953, "lr": 6.273111007849645e-05, "tps": 1546925, "wall": 1090.7} {"step": 25745, "train_loss": 3.1323745250701904, "lr": 6.27217918231644e-05, "tps": 1540693, "wall": 1095.1} {"step": 25746, "train_loss": 3.0923004150390625, "lr": 6.271247534948836e-05, "tps": 1534504, "wall": 1099.6} {"step": 25747, "train_loss": 3.1307570934295654, "lr": 6.270316065757387e-05, "tps": 1528381, "wall": 1104.1} {"step": 25748, "train_loss": 3.038754463195801, "lr": 6.269384774752655e-05, "tps": 1522299, "wall": 1108.5} {"step": 25749, "train_loss": 3.147676467895508, "lr": 6.268453661945178e-05, "tps": 1516267, "wall": 1113.0} {"step": 25750, "train_loss": 3.1259727478027344, "lr": 6.267522727345513e-05, "tps": 1510302, "wall": 1117.4} {"step": 25751, "train_loss": 3.0460662841796875, "lr": 6.266591970964202e-05, "tps": 1504364, "wall": 1121.9} {"step": 25752, "train_loss": 3.0180978775024414, "lr": 6.265661392811783e-05, "tps": 1498461, "wall": 1126.3} {"step": 25753, "train_loss": 3.080446481704712, "lr": 6.264730992898808e-05, "tps": 1492622, "wall": 1130.8} {"step": 25754, "train_loss": 3.1585710048675537, "lr": 6.263800771235813e-05, "tps": 1486814, "wall": 1135.2} {"step": 25755, "train_loss": 3.143505334854126, "lr": 6.262870727833327e-05, "tps": 1480997, "wall": 1139.7} {"step": 25756, "train_loss": 3.1825003623962402, "lr": 6.261940862701899e-05, "tps": 1475286, "wall": 1144.2} {"step": 25757, "train_loss": 3.044675588607788, "lr": 6.261011175852057e-05, "tps": 1469627, "wall": 1148.6} {"step": 25758, "train_loss": 3.1118812561035156, "lr": 6.260081667294325e-05, "tps": 1464003, "wall": 1153.1} {"step": 25759, "train_loss": 3.15653920173645, "lr": 6.259152337039245e-05, "tps": 1458429, "wall": 1157.6} {"step": 25760, "train_loss": 2.955592632293701, "lr": 6.25822318509734e-05, "tps": 1452895, "wall": 1162.0} {"step": 25761, "train_loss": 3.059825897216797, "lr": 6.257294211479127e-05, "tps": 1447404, "wall": 1166.5} {"step": 25762, "train_loss": 3.131875514984131, "lr": 6.256365416195145e-05, "tps": 1441955, "wall": 1170.9} {"step": 25763, "train_loss": 3.1986641883850098, "lr": 6.255436799255904e-05, "tps": 1436545, "wall": 1175.4} {"step": 25764, "train_loss": 3.1328258514404297, "lr": 6.254508360671925e-05, "tps": 1431173, "wall": 1179.8} {"step": 25765, "train_loss": 2.9520556926727295, "lr": 6.25358010045373e-05, "tps": 1425840, "wall": 1184.3} {"step": 25766, "train_loss": 3.0144474506378174, "lr": 6.252652018611828e-05, "tps": 1420522, "wall": 1188.8} {"step": 25767, "train_loss": 3.0729641914367676, "lr": 6.25172411515674e-05, "tps": 1415311, "wall": 1193.2} {"step": 25768, "train_loss": 3.1506521701812744, "lr": 6.250796390098972e-05, "tps": 1410005, "wall": 1197.7} {"step": 25769, "train_loss": 3.0757806301116943, "lr": 6.24986884344903e-05, "tps": 1404873, "wall": 1202.1} {"step": 25770, "train_loss": 3.1311755180358887, "lr": 6.248941475217431e-05, "tps": 1399746, "wall": 1206.6} {"step": 25771, "train_loss": 3.0918188095092773, "lr": 6.248014285414676e-05, "tps": 1394652, "wall": 1211.0} {"step": 25772, "train_loss": 3.117600917816162, "lr": 6.247087274051263e-05, "tps": 1389557, "wall": 1215.5} {"step": 25773, "train_loss": 3.0610647201538086, "lr": 6.246160441137702e-05, "tps": 1384569, "wall": 1220.0} {"step": 25774, "train_loss": 3.2181992530822754, "lr": 6.245233786684486e-05, "tps": 1379579, "wall": 1224.4} {"step": 25775, "train_loss": 3.0793051719665527, "lr": 6.244307310702111e-05, "tps": 1374640, "wall": 1228.9} {"step": 25776, "train_loss": 3.089693546295166, "lr": 6.243381013201078e-05, "tps": 1369727, "wall": 1233.3} {"step": 25777, "train_loss": 3.1168911457061768, "lr": 6.242454894191879e-05, "tps": 1364854, "wall": 1237.8} {"step": 25778, "train_loss": 3.1186864376068115, "lr": 6.241528953684999e-05, "tps": 1360014, "wall": 1242.2} {"step": 25779, "train_loss": 3.140065908432007, "lr": 6.240603191690934e-05, "tps": 1355216, "wall": 1246.7} {"step": 25780, "train_loss": 3.164121150970459, "lr": 6.239677608220171e-05, "tps": 1350431, "wall": 1251.1} {"step": 25781, "train_loss": 3.062556266784668, "lr": 6.238752203283186e-05, "tps": 1345692, "wall": 1255.6} {"step": 25782, "train_loss": 3.0911660194396973, "lr": 6.237826976890476e-05, "tps": 1340930, "wall": 1260.1} {"step": 25783, "train_loss": 3.0551047325134277, "lr": 6.236901929052508e-05, "tps": 1336260, "wall": 1264.6} {"step": 25784, "train_loss": 3.1309337615966797, "lr": 6.235977059779773e-05, "tps": 1331617, "wall": 1269.0} {"step": 25785, "train_loss": 3.0911879539489746, "lr": 6.235052369082742e-05, "tps": 1327016, "wall": 1273.5} {"step": 25786, "train_loss": 3.1528480052948, "lr": 6.234127856971888e-05, "tps": 1322447, "wall": 1277.9} {"step": 25787, "train_loss": 3.0902810096740723, "lr": 6.23320352345769e-05, "tps": 1317904, "wall": 1282.4} {"step": 25788, "train_loss": 3.0920894145965576, "lr": 6.232279368550613e-05, "tps": 1313378, "wall": 1286.8} {"step": 25789, "train_loss": 3.03322696685791, "lr": 6.231355392261128e-05, "tps": 1308852, "wall": 1291.3} {"step": 25790, "train_loss": 3.1077609062194824, "lr": 6.230431594599704e-05, "tps": 1304408, "wall": 1295.8} {"step": 25791, "train_loss": 3.2053682804107666, "lr": 6.229507975576804e-05, "tps": 1299975, "wall": 1300.3} {"step": 25792, "train_loss": 3.0716559886932373, "lr": 6.228584535202887e-05, "tps": 1295586, "wall": 1304.7} {"step": 25793, "train_loss": 3.1143040657043457, "lr": 6.227661273488423e-05, "tps": 1291201, "wall": 1309.2} {"step": 25794, "train_loss": 3.1044607162475586, "lr": 6.226738190443863e-05, "tps": 1286853, "wall": 1313.7} {"step": 25795, "train_loss": 3.0868687629699707, "lr": 6.225815286079664e-05, "tps": 1282477, "wall": 1318.2} {"step": 25796, "train_loss": 3.104372024536133, "lr": 6.224892560406287e-05, "tps": 1278233, "wall": 1322.6} {"step": 25797, "train_loss": 3.126716136932373, "lr": 6.223970013434179e-05, "tps": 1273983, "wall": 1327.1} {"step": 25798, "train_loss": 3.1724345684051514, "lr": 6.223047645173789e-05, "tps": 1269774, "wall": 1331.5} {"step": 25799, "train_loss": 3.180534839630127, "lr": 6.222125455635573e-05, "tps": 1265582, "wall": 1336.0} {"step": 25800, "train_loss": 3.004525661468506, "lr": 6.221203444829973e-05, "tps": 1261418, "wall": 1340.5} {"step": 25801, "train_loss": 3.1726200580596924, "lr": 6.22028161276743e-05, "tps": 1257288, "wall": 1344.9} {"step": 25802, "train_loss": 3.0960052013397217, "lr": 6.219359959458394e-05, "tps": 1253180, "wall": 1349.4} {"step": 25803, "train_loss": 3.0907557010650635, "lr": 6.218438484913299e-05, "tps": 1249106, "wall": 1353.8} {"step": 25804, "train_loss": 3.0501174926757812, "lr": 6.21751718914259e-05, "tps": 1245048, "wall": 1358.3} {"step": 25805, "train_loss": 3.0631840229034424, "lr": 6.216596072156701e-05, "tps": 1241035, "wall": 1362.8} {"step": 25806, "train_loss": 3.0524628162384033, "lr": 6.215675133966062e-05, "tps": 1237035, "wall": 1367.2} {"step": 25807, "train_loss": 3.0621252059936523, "lr": 6.214754374581111e-05, "tps": 1233060, "wall": 1371.7} {"step": 25808, "train_loss": 3.087135076522827, "lr": 6.213833794012278e-05, "tps": 1229111, "wall": 1376.1} {"step": 25809, "train_loss": 3.053384780883789, "lr": 6.212913392269985e-05, "tps": 1225154, "wall": 1380.6} {"step": 25810, "train_loss": 2.9959545135498047, "lr": 6.211993169364666e-05, "tps": 1221253, "wall": 1385.1} {"step": 25811, "train_loss": 3.113523244857788, "lr": 6.211073125306744e-05, "tps": 1217388, "wall": 1389.5} {"step": 25812, "train_loss": 3.129469394683838, "lr": 6.210153260106635e-05, "tps": 1213552, "wall": 1394.0} {"step": 25813, "train_loss": 3.1706833839416504, "lr": 6.20923357377477e-05, "tps": 1209740, "wall": 1398.4} {"step": 25814, "train_loss": 3.1657772064208984, "lr": 6.208314066321561e-05, "tps": 1205944, "wall": 1402.9} {"step": 25815, "train_loss": 3.135108232498169, "lr": 6.207394737757419e-05, "tps": 1202174, "wall": 1407.3} {"step": 25816, "train_loss": 3.0308005809783936, "lr": 6.206475588092768e-05, "tps": 1198437, "wall": 1411.8} {"step": 25817, "train_loss": 3.0830326080322266, "lr": 6.205556617338017e-05, "tps": 1194707, "wall": 1416.3} {"step": 25818, "train_loss": 3.048588275909424, "lr": 6.20463782550357e-05, "tps": 1191011, "wall": 1420.7} {"step": 25819, "train_loss": 3.080409526824951, "lr": 6.203719212599845e-05, "tps": 1187340, "wall": 1425.2} {"step": 25820, "train_loss": 3.024282455444336, "lr": 6.20280077863724e-05, "tps": 1183657, "wall": 1429.6} {"step": 25821, "train_loss": 3.1612906455993652, "lr": 6.201882523626165e-05, "tps": 1180038, "wall": 1434.1} {"step": 25822, "train_loss": 3.1045713424682617, "lr": 6.20096444757702e-05, "tps": 1176373, "wall": 1438.6} {"step": 25823, "train_loss": 3.0609922409057617, "lr": 6.200046550500199e-05, "tps": 1172810, "wall": 1443.0} {"step": 25824, "train_loss": 3.0065670013427734, "lr": 6.199128832406112e-05, "tps": 1169252, "wall": 1447.5} {"step": 25825, "train_loss": 3.0728516578674316, "lr": 6.198211293305146e-05, "tps": 1165716, "wall": 1451.9} {"step": 25826, "train_loss": 3.1319289207458496, "lr": 6.197293933207695e-05, "tps": 1162200, "wall": 1456.4} {"step": 25827, "train_loss": 3.2119882106781006, "lr": 6.196376752124157e-05, "tps": 1158705, "wall": 1460.8} {"step": 25828, "train_loss": 3.0616111755371094, "lr": 6.195459750064916e-05, "tps": 1155228, "wall": 1465.3} {"step": 25829, "train_loss": 3.0366532802581787, "lr": 6.194542927040361e-05, "tps": 1151772, "wall": 1469.7} {"step": 25830, "train_loss": 3.0674335956573486, "lr": 6.193626283060882e-05, "tps": 1148328, "wall": 1474.2} {"step": 25831, "train_loss": 3.1783382892608643, "lr": 6.192709818136859e-05, "tps": 1144915, "wall": 1478.6} {"step": 25832, "train_loss": 3.046454668045044, "lr": 6.191793532278671e-05, "tps": 1141516, "wall": 1483.1} {"step": 25833, "train_loss": 3.072553873062134, "lr": 6.190877425496704e-05, "tps": 1138144, "wall": 1487.6} {"step": 25834, "train_loss": 3.0383176803588867, "lr": 6.189961497801335e-05, "tps": 1134781, "wall": 1492.0} {"step": 25835, "train_loss": 3.191234588623047, "lr": 6.18904574920293e-05, "tps": 1131440, "wall": 1496.5} {"step": 25836, "train_loss": 3.088697910308838, "lr": 6.188130179711876e-05, "tps": 1128093, "wall": 1501.0} {"step": 25837, "train_loss": 3.139293670654297, "lr": 6.187214789338534e-05, "tps": 1124798, "wall": 1505.4} {"step": 25838, "train_loss": 3.133540630340576, "lr": 6.186299578093283e-05, "tps": 1121523, "wall": 1509.9} {"step": 25839, "train_loss": 3.0620408058166504, "lr": 6.185384545986486e-05, "tps": 1118248, "wall": 1514.4} {"step": 25840, "train_loss": 3.059861660003662, "lr": 6.184469693028505e-05, "tps": 1115020, "wall": 1518.8} {"step": 25841, "train_loss": 3.0797805786132812, "lr": 6.183555019229711e-05, "tps": 1111795, "wall": 1523.3} {"step": 25842, "train_loss": 3.3476200103759766, "lr": 6.18264052460046e-05, "tps": 1108593, "wall": 1527.7} {"step": 25843, "train_loss": 3.0971555709838867, "lr": 6.181726209151109e-05, "tps": 1105412, "wall": 1532.2} {"step": 25844, "train_loss": 3.105940103530884, "lr": 6.180812072892023e-05, "tps": 1102250, "wall": 1536.7} {"step": 25845, "train_loss": 3.053999185562134, "lr": 6.179898115833556e-05, "tps": 1099099, "wall": 1541.1} {"step": 25846, "train_loss": 3.0956029891967773, "lr": 6.178984337986054e-05, "tps": 1095971, "wall": 1545.6} {"step": 25847, "train_loss": 3.1530070304870605, "lr": 6.178070739359874e-05, "tps": 1092853, "wall": 1550.0} {"step": 25848, "train_loss": 3.0538532733917236, "lr": 6.177157319965369e-05, "tps": 1089764, "wall": 1554.5} {"step": 25849, "train_loss": 3.0975663661956787, "lr": 6.176244079812873e-05, "tps": 1086647, "wall": 1559.0} {"step": 25850, "train_loss": 3.03637433052063, "lr": 6.175331018912749e-05, "tps": 1083591, "wall": 1563.5} {"step": 25851, "train_loss": 3.1747026443481445, "lr": 6.174418137275331e-05, "tps": 1080549, "wall": 1567.9} {"step": 25852, "train_loss": 3.075854539871216, "lr": 6.173505434910954e-05, "tps": 1077522, "wall": 1572.4} {"step": 25853, "train_loss": 3.1631181240081787, "lr": 6.172592911829968e-05, "tps": 1074513, "wall": 1576.9} {"step": 25854, "train_loss": 3.1297571659088135, "lr": 6.171680568042708e-05, "tps": 1071522, "wall": 1581.3} {"step": 25855, "train_loss": 3.180856943130493, "lr": 6.170768403559501e-05, "tps": 1068546, "wall": 1585.8} {"step": 25856, "train_loss": 3.028989791870117, "lr": 6.16985641839069e-05, "tps": 1065591, "wall": 1590.3} {"step": 25857, "train_loss": 3.090925693511963, "lr": 6.168944612546598e-05, "tps": 1062649, "wall": 1594.7} {"step": 25858, "train_loss": 3.1068215370178223, "lr": 6.168032986037562e-05, "tps": 1059725, "wall": 1599.2} {"step": 25859, "train_loss": 3.083756446838379, "lr": 6.167121538873906e-05, "tps": 1056810, "wall": 1603.7} {"step": 25860, "train_loss": 3.0838711261749268, "lr": 6.166210271065947e-05, "tps": 1053904, "wall": 1608.1} {"step": 25861, "train_loss": 3.0750315189361572, "lr": 6.165299182624021e-05, "tps": 1051026, "wall": 1612.6} {"step": 25862, "train_loss": 3.142921209335327, "lr": 6.164388273558441e-05, "tps": 1048163, "wall": 1617.1} {"step": 25863, "train_loss": 3.0222647190093994, "lr": 6.163477543879525e-05, "tps": 1045290, "wall": 1621.6} {"step": 25864, "train_loss": 3.055598735809326, "lr": 6.162566993597594e-05, "tps": 1042454, "wall": 1626.1} {"step": 25865, "train_loss": 3.1371240615844727, "lr": 6.161656622722961e-05, "tps": 1039642, "wall": 1630.5} {"step": 25866, "train_loss": 3.0405986309051514, "lr": 6.160746431265937e-05, "tps": 1036841, "wall": 1635.0} {"step": 25867, "train_loss": 3.198965072631836, "lr": 6.159836419236835e-05, "tps": 1034053, "wall": 1639.5} {"step": 25868, "train_loss": 2.9326751232147217, "lr": 6.158926586645965e-05, "tps": 1031283, "wall": 1643.9} {"step": 25869, "train_loss": 3.033595323562622, "lr": 6.158016933503628e-05, "tps": 1028528, "wall": 1648.4} {"step": 25870, "train_loss": 2.970263957977295, "lr": 6.157107459820138e-05, "tps": 1025790, "wall": 1652.9} {"step": 25871, "train_loss": 3.074233293533325, "lr": 6.156198165605786e-05, "tps": 1023070, "wall": 1657.3} {"step": 25872, "train_loss": 2.9673304557800293, "lr": 6.15528905087088e-05, "tps": 1020363, "wall": 1661.8} {"step": 25873, "train_loss": 3.1154041290283203, "lr": 6.154380115625718e-05, "tps": 1017668, "wall": 1666.2} {"step": 25874, "train_loss": 2.9852843284606934, "lr": 6.153471359880591e-05, "tps": 1014984, "wall": 1670.7} {"step": 25875, "train_loss": 3.012444496154785, "lr": 6.152562783645804e-05, "tps": 1012314, "wall": 1675.2} {"step": 25876, "train_loss": 3.1595048904418945, "lr": 6.151654386931643e-05, "tps": 1009632, "wall": 1679.7} {"step": 25877, "train_loss": 3.128416061401367, "lr": 6.150746169748392e-05, "tps": 1006994, "wall": 1684.2} {"step": 25878, "train_loss": 3.1683578491210938, "lr": 6.14983813210635e-05, "tps": 1004371, "wall": 1688.6} {"step": 25879, "train_loss": 3.1110267639160156, "lr": 6.148930274015802e-05, "tps": 1001761, "wall": 1693.1} {"step": 25880, "train_loss": 3.192786455154419, "lr": 6.148022595487028e-05, "tps": 999164, "wall": 1697.6} {"step": 25881, "train_loss": 2.991525173187256, "lr": 6.147115096530309e-05, "tps": 996578, "wall": 1702.0} {"step": 25882, "train_loss": 3.1042375564575195, "lr": 6.146207777155928e-05, "tps": 994005, "wall": 1706.5} {"step": 25883, "train_loss": 3.1215314865112305, "lr": 6.145300637374165e-05, "tps": 991450, "wall": 1711.0} {"step": 25884, "train_loss": 3.1220691204071045, "lr": 6.144393677195292e-05, "tps": 988906, "wall": 1715.4} {"step": 25885, "train_loss": 3.0317742824554443, "lr": 6.143486896629583e-05, "tps": 986376, "wall": 1719.9} {"step": 25886, "train_loss": 3.098619222640991, "lr": 6.142580295687317e-05, "tps": 983861, "wall": 1724.4} {"step": 25887, "train_loss": 3.073324680328369, "lr": 6.141673874378759e-05, "tps": 981358, "wall": 1728.8} {"step": 25888, "train_loss": 3.0897507667541504, "lr": 6.140767632714173e-05, "tps": 978864, "wall": 1733.3} {"step": 25889, "train_loss": 3.0274691581726074, "lr": 6.139861570703833e-05, "tps": 976339, "wall": 1737.8} {"step": 25890, "train_loss": 3.152648687362671, "lr": 6.138955688357999e-05, "tps": 973890, "wall": 1742.3} {"step": 25891, "train_loss": 3.158473491668701, "lr": 6.13804998568693e-05, "tps": 971440, "wall": 1746.7} {"step": 25892, "train_loss": 3.1251845359802246, "lr": 6.137144462700894e-05, "tps": 969000, "wall": 1751.2} {"step": 25893, "train_loss": 3.037571668624878, "lr": 6.13623911941014e-05, "tps": 966573, "wall": 1755.7} {"step": 25894, "train_loss": 3.0898373126983643, "lr": 6.135333955824927e-05, "tps": 964156, "wall": 1760.1} {"step": 25895, "train_loss": 3.1616623401641846, "lr": 6.134428971955511e-05, "tps": 961753, "wall": 1764.6} {"step": 25896, "train_loss": 3.0676116943359375, "lr": 6.133524167812143e-05, "tps": 959357, "wall": 1769.1} {"step": 25897, "train_loss": 3.133587121963501, "lr": 6.132619543405067e-05, "tps": 956977, "wall": 1773.6} {"step": 25898, "train_loss": 3.1179399490356445, "lr": 6.131715098744539e-05, "tps": 954609, "wall": 1778.0} {"step": 25899, "train_loss": 3.132293701171875, "lr": 6.130810833840798e-05, "tps": 952250, "wall": 1782.5} {"step": 25900, "train_loss": 3.01869535446167, "lr": 6.129906748704092e-05, "tps": 949901, "wall": 1787.0} {"step": 25901, "train_loss": 3.097381591796875, "lr": 6.129002843344663e-05, "tps": 947567, "wall": 1791.4} {"step": 25902, "train_loss": 3.1060078144073486, "lr": 6.128099117772744e-05, "tps": 945243, "wall": 1795.9} {"step": 25903, "train_loss": 3.146148681640625, "lr": 6.127195571998582e-05, "tps": 942911, "wall": 1800.4} {"step": 25904, "train_loss": 3.173262596130371, "lr": 6.126292206032407e-05, "tps": 940617, "wall": 1804.9} {"step": 25905, "train_loss": 3.0818889141082764, "lr": 6.125389019884447e-05, "tps": 938334, "wall": 1809.4} {"step": 25906, "train_loss": 3.152810573577881, "lr": 6.124486013564944e-05, "tps": 936061, "wall": 1813.8} {"step": 25907, "train_loss": 3.0430378913879395, "lr": 6.12358318708412e-05, "tps": 933801, "wall": 1818.3} {"step": 25908, "train_loss": 3.1404812335968018, "lr": 6.122680540452202e-05, "tps": 931550, "wall": 1822.7} {"step": 25909, "train_loss": 3.1475419998168945, "lr": 6.121778073679425e-05, "tps": 929311, "wall": 1827.2} {"step": 25910, "train_loss": 3.0865325927734375, "lr": 6.120875786776e-05, "tps": 927084, "wall": 1831.7} {"step": 25911, "train_loss": 3.0739102363586426, "lr": 6.119973679752154e-05, "tps": 924861, "wall": 1836.1} {"step": 25912, "train_loss": 3.009352207183838, "lr": 6.119071752618105e-05, "tps": 922650, "wall": 1840.6} {"step": 25913, "train_loss": 3.0603785514831543, "lr": 6.118170005384071e-05, "tps": 920453, "wall": 1845.1} {"step": 25914, "train_loss": 3.077873706817627, "lr": 6.117268438060265e-05, "tps": 918269, "wall": 1849.5} {"step": 25915, "train_loss": 3.2037014961242676, "lr": 6.116367050656902e-05, "tps": 916095, "wall": 1854.0} {"step": 25916, "train_loss": 3.1409378051757812, "lr": 6.115465843184192e-05, "tps": 913890, "wall": 1858.5} {"step": 25917, "train_loss": 3.023883819580078, "lr": 6.114564815652346e-05, "tps": 911746, "wall": 1863.0} {"step": 25918, "train_loss": 3.0152597427368164, "lr": 6.11366396807157e-05, "tps": 909598, "wall": 1867.4} {"step": 25919, "train_loss": 3.1285738945007324, "lr": 6.112763300452063e-05, "tps": 907463, "wall": 1871.9} {"step": 25920, "train_loss": 3.0570688247680664, "lr": 6.111862812804036e-05, "tps": 905339, "wall": 1876.4} {"step": 25921, "train_loss": 3.076899528503418, "lr": 6.110962505137691e-05, "tps": 903228, "wall": 1880.8} {"step": 25922, "train_loss": 3.114753246307373, "lr": 6.110062377463213e-05, "tps": 901123, "wall": 1885.3} {"step": 25923, "train_loss": 3.0866150856018066, "lr": 6.109162429790813e-05, "tps": 899025, "wall": 1889.8} {"step": 25924, "train_loss": 3.142451524734497, "lr": 6.108262662130684e-05, "tps": 896937, "wall": 1894.2} {"step": 25925, "train_loss": 2.9930663108825684, "lr": 6.10736307449301e-05, "tps": 894865, "wall": 1898.7} {"step": 25926, "train_loss": 3.09647274017334, "lr": 6.10646366688799e-05, "tps": 892792, "wall": 1903.2} {"step": 25927, "train_loss": 3.1971683502197266, "lr": 6.105564439325808e-05, "tps": 890743, "wall": 1907.6} {"step": 25928, "train_loss": 3.1545662879943848, "lr": 6.104665391816651e-05, "tps": 888692, "wall": 1912.1} {"step": 25929, "train_loss": 3.1393661499023438, "lr": 6.103766524370705e-05, "tps": 886653, "wall": 1916.6} {"step": 25930, "train_loss": 3.1389434337615967, "lr": 6.102867836998154e-05, "tps": 884602, "wall": 1921.1} {"step": 25931, "train_loss": 3.090907335281372, "lr": 6.101969329709172e-05, "tps": 882590, "wall": 1925.6} {"step": 25932, "train_loss": 3.073451519012451, "lr": 6.101071002513946e-05, "tps": 880583, "wall": 1930.0} {"step": 25933, "train_loss": 3.1352925300598145, "lr": 6.100172855422647e-05, "tps": 878588, "wall": 1934.5} {"step": 25934, "train_loss": 3.186706066131592, "lr": 6.099274888445445e-05, "tps": 876600, "wall": 1938.9} {"step": 25935, "train_loss": 3.183821201324463, "lr": 6.098377101592523e-05, "tps": 874621, "wall": 1943.4} {"step": 25936, "train_loss": 3.1080708503723145, "lr": 6.097479494874041e-05, "tps": 872650, "wall": 1947.9} {"step": 25937, "train_loss": 3.165647506713867, "lr": 6.0965820683001764e-05, "tps": 870689, "wall": 1952.3} {"step": 25938, "train_loss": 3.144702434539795, "lr": 6.095684821881087e-05, "tps": 868737, "wall": 1956.8} {"step": 25939, "train_loss": 3.0772573947906494, "lr": 6.0947877556269396e-05, "tps": 866790, "wall": 1961.3} {"step": 25940, "train_loss": 3.026370048522949, "lr": 6.0938908695479e-05, "tps": 864853, "wall": 1965.7} {"step": 25941, "train_loss": 3.1225476264953613, "lr": 6.092994163654127e-05, "tps": 862916, "wall": 1970.2} {"step": 25942, "train_loss": 3.0097124576568604, "lr": 6.0920976379557716e-05, "tps": 861009, "wall": 1974.7} {"step": 25943, "train_loss": 3.106581687927246, "lr": 6.0912012924629956e-05, "tps": 859078, "wall": 1979.2} {"step": 25944, "train_loss": 3.108161449432373, "lr": 6.090305127185956e-05, "tps": 857180, "wall": 1983.6} {"step": 25945, "train_loss": 3.0601253509521484, "lr": 6.0894091421347946e-05, "tps": 855290, "wall": 1988.1} {"step": 25946, "train_loss": 3.106637716293335, "lr": 6.088513337319672e-05, "tps": 853408, "wall": 1992.6} {"step": 25947, "train_loss": 3.1019861698150635, "lr": 6.087617712750731e-05, "tps": 851519, "wall": 1997.1} {"step": 25948, "train_loss": 3.1717493534088135, "lr": 6.086722268438113e-05, "tps": 849655, "wall": 2001.5} {"step": 25949, "train_loss": 3.144451379776001, "lr": 6.0858270043919706e-05, "tps": 847797, "wall": 2006.0} {"step": 25950, "train_loss": 3.0743117332458496, "lr": 6.08493192062244e-05, "tps": 845946, "wall": 2010.4} {"step": 25951, "train_loss": 3.1971421241760254, "lr": 6.08403701713966e-05, "tps": 844102, "wall": 2014.9} {"step": 25952, "train_loss": 3.147991895675659, "lr": 6.0831422939537695e-05, "tps": 842268, "wall": 2019.4} {"step": 25953, "train_loss": 3.1244571208953857, "lr": 6.082247751074904e-05, "tps": 840443, "wall": 2023.8} {"step": 25954, "train_loss": 3.11970591545105, "lr": 6.081353388513199e-05, "tps": 838628, "wall": 2028.3} {"step": 25955, "train_loss": 3.231210708618164, "lr": 6.0804592062787844e-05, "tps": 836820, "wall": 2032.8} {"step": 25956, "train_loss": 3.124701738357544, "lr": 6.079565204381786e-05, "tps": 835007, "wall": 2037.2} {"step": 25957, "train_loss": 3.1279945373535156, "lr": 6.078671382832338e-05, "tps": 833207, "wall": 2041.7} {"step": 25958, "train_loss": 3.0440962314605713, "lr": 6.077777741640562e-05, "tps": 831418, "wall": 2046.2} {"step": 25959, "train_loss": 3.0443196296691895, "lr": 6.076884280816577e-05, "tps": 829641, "wall": 2050.7} {"step": 25960, "train_loss": 3.043499231338501, "lr": 6.07599100037051e-05, "tps": 827871, "wall": 2055.1} {"step": 25961, "train_loss": 3.044066905975342, "lr": 6.075097900312482e-05, "tps": 826110, "wall": 2059.6} {"step": 25962, "train_loss": 3.0329642295837402, "lr": 6.0742049806526005e-05, "tps": 824349, "wall": 2064.1} {"step": 25963, "train_loss": 3.066600799560547, "lr": 6.0733122414009914e-05, "tps": 822602, "wall": 2068.5} {"step": 25964, "train_loss": 2.985806465148926, "lr": 6.072419682567761e-05, "tps": 820864, "wall": 2073.0} {"step": 25965, "train_loss": 3.1079280376434326, "lr": 6.07152730416302e-05, "tps": 819135, "wall": 2077.4} {"step": 25966, "train_loss": 3.1181087493896484, "lr": 6.0706351061968834e-05, "tps": 817412, "wall": 2081.9} {"step": 25967, "train_loss": 3.0578231811523438, "lr": 6.0697430886794525e-05, "tps": 815698, "wall": 2086.4} {"step": 25968, "train_loss": 3.1312432289123535, "lr": 6.068851251620832e-05, "tps": 813980, "wall": 2090.8} {"step": 25969, "train_loss": 3.104156017303467, "lr": 6.067959595031128e-05, "tps": 812283, "wall": 2095.3} {"step": 25970, "train_loss": 3.083651542663574, "lr": 6.067068118920437e-05, "tps": 810568, "wall": 2099.8} {"step": 25971, "train_loss": 3.047661304473877, "lr": 6.066176823298866e-05, "tps": 808879, "wall": 2104.3} {"step": 25972, "train_loss": 3.1533374786376953, "lr": 6.0652857081765025e-05, "tps": 807194, "wall": 2108.7} {"step": 25973, "train_loss": 3.084928035736084, "lr": 6.064394773563442e-05, "tps": 805521, "wall": 2113.2} {"step": 25974, "train_loss": 3.090531826019287, "lr": 6.063504019469784e-05, "tps": 803849, "wall": 2117.7} {"step": 25975, "train_loss": 3.0741233825683594, "lr": 6.062613445905615e-05, "tps": 802190, "wall": 2122.1} {"step": 25976, "train_loss": 3.1397948265075684, "lr": 6.0617230528810186e-05, "tps": 800537, "wall": 2126.6} {"step": 25977, "train_loss": 3.134030342102051, "lr": 6.060832840406089e-05, "tps": 798892, "wall": 2131.1} {"step": 25978, "train_loss": 3.048307180404663, "lr": 6.059942808490906e-05, "tps": 797253, "wall": 2135.5} {"step": 25979, "train_loss": 3.139298915863037, "lr": 6.0590529571455536e-05, "tps": 795621, "wall": 2140.0} {"step": 25980, "train_loss": 3.0877742767333984, "lr": 6.0581632863801107e-05, "tps": 793996, "wall": 2144.5} {"step": 25981, "train_loss": 3.0727765560150146, "lr": 6.05727379620466e-05, "tps": 792375, "wall": 2148.9} {"step": 25982, "train_loss": 3.028040885925293, "lr": 6.05638448662927e-05, "tps": 790762, "wall": 2153.4} {"step": 25983, "train_loss": 3.215404510498047, "lr": 6.0554953576640214e-05, "tps": 789126, "wall": 2157.9} {"step": 25984, "train_loss": 3.086460590362549, "lr": 6.054606409318985e-05, "tps": 787537, "wall": 2162.4} {"step": 25985, "train_loss": 2.993391513824463, "lr": 6.053717641604225e-05, "tps": 785941, "wall": 2166.9} {"step": 25986, "train_loss": 3.078746795654297, "lr": 6.0528290545298196e-05, "tps": 784355, "wall": 2171.3} {"step": 25987, "train_loss": 3.134801149368286, "lr": 6.051940648105829e-05, "tps": 782776, "wall": 2175.8} {"step": 25988, "train_loss": 3.138625144958496, "lr": 6.051052422342313e-05, "tps": 781205, "wall": 2180.2} {"step": 25989, "train_loss": 3.1724085807800293, "lr": 6.050164377249341e-05, "tps": 779640, "wall": 2184.7} {"step": 25990, "train_loss": 3.087472438812256, "lr": 6.0492765128369675e-05, "tps": 778075, "wall": 2189.2} {"step": 25991, "train_loss": 3.1513352394104004, "lr": 6.048388829115256e-05, "tps": 776515, "wall": 2193.7} {"step": 25992, "train_loss": 3.079897880554199, "lr": 6.047501326094259e-05, "tps": 774968, "wall": 2198.1} {"step": 25993, "train_loss": 3.088599681854248, "lr": 6.046614003784026e-05, "tps": 773432, "wall": 2202.6} {"step": 25994, "train_loss": 3.152956485748291, "lr": 6.045726862194616e-05, "tps": 771902, "wall": 2207.0} {"step": 25995, "train_loss": 3.0787456035614014, "lr": 6.0448399013360765e-05, "tps": 770373, "wall": 2211.5} {"step": 25996, "train_loss": 3.123354196548462, "lr": 6.04395312121845e-05, "tps": 768855, "wall": 2215.9} {"step": 25997, "train_loss": 3.098665237426758, "lr": 6.0430665218517866e-05, "tps": 767327, "wall": 2220.4} {"step": 25998, "train_loss": 3.039717197418213, "lr": 6.042180103246131e-05, "tps": 765817, "wall": 2224.9} {"step": 25999, "train_loss": 3.1138062477111816, "lr": 6.041293865411519e-05, "tps": 764311, "wall": 2229.4} {"step": 26000, "train_loss": 3.1020548343658447, "lr": 6.040407808357996e-05, "tps": 762814, "wall": 2233.8, "val_loss_monitor": 3.339243261694542} {"step": 26001, "train_loss": 3.170443296432495, "lr": 6.0395219320955975e-05, "tps": 751292, "wall": 2268.2} {"step": 26002, "train_loss": 3.0861902236938477, "lr": 6.0386362366343563e-05, "tps": 749832, "wall": 2272.7} {"step": 26003, "train_loss": 2.993947744369507, "lr": 6.037750721984308e-05, "tps": 748380, "wall": 2277.2} {"step": 26004, "train_loss": 3.1017258167266846, "lr": 6.036865388155485e-05, "tps": 746924, "wall": 2281.7} {"step": 26005, "train_loss": 3.1408729553222656, "lr": 6.035980235157909e-05, "tps": 745485, "wall": 2286.2} {"step": 26006, "train_loss": 3.039865493774414, "lr": 6.0350952630016154e-05, "tps": 744053, "wall": 2290.7} {"step": 26007, "train_loss": 3.0055289268493652, "lr": 6.034210471696625e-05, "tps": 742628, "wall": 2295.2} {"step": 26008, "train_loss": 2.915443181991577, "lr": 6.033325861252967e-05, "tps": 741209, "wall": 2299.7} {"step": 26009, "train_loss": 3.1447644233703613, "lr": 6.0324414316806544e-05, "tps": 739792, "wall": 2304.1} {"step": 26010, "train_loss": 3.1163578033447266, "lr": 6.0315571829897074e-05, "tps": 738382, "wall": 2308.6} {"step": 26011, "train_loss": 3.0024166107177734, "lr": 6.030673115190146e-05, "tps": 736977, "wall": 2313.1} {"step": 26012, "train_loss": 3.056664228439331, "lr": 6.0297892282919855e-05, "tps": 735581, "wall": 2317.6} {"step": 26013, "train_loss": 3.252139091491699, "lr": 6.0289055223052326e-05, "tps": 734191, "wall": 2322.1} {"step": 26014, "train_loss": 3.0934829711914062, "lr": 6.0280219972399046e-05, "tps": 732800, "wall": 2326.6} {"step": 26015, "train_loss": 3.1038875579833984, "lr": 6.0271386531060095e-05, "tps": 731415, "wall": 2331.1} {"step": 26016, "train_loss": 3.2095632553100586, "lr": 6.026255489913547e-05, "tps": 730044, "wall": 2335.5} {"step": 26017, "train_loss": 3.105069637298584, "lr": 6.02537250767253e-05, "tps": 728661, "wall": 2340.1} {"step": 26018, "train_loss": 3.1264491081237793, "lr": 6.0244897063929576e-05, "tps": 727297, "wall": 2344.5} {"step": 26019, "train_loss": 3.102105140686035, "lr": 6.0236070860848246e-05, "tps": 725938, "wall": 2349.0} {"step": 26020, "train_loss": 3.0499165058135986, "lr": 6.022724646758141e-05, "tps": 724586, "wall": 2353.5} {"step": 26021, "train_loss": 3.1063854694366455, "lr": 6.021842388422896e-05, "tps": 723238, "wall": 2358.0} {"step": 26022, "train_loss": 3.0664572715759277, "lr": 6.020960311089081e-05, "tps": 721890, "wall": 2362.5} {"step": 26023, "train_loss": 3.1566085815429688, "lr": 6.0200784147666965e-05, "tps": 720551, "wall": 2366.9} {"step": 26024, "train_loss": 3.1136603355407715, "lr": 6.0191966994657254e-05, "tps": 719221, "wall": 2371.4} {"step": 26025, "train_loss": 3.0342607498168945, "lr": 6.01831516519616e-05, "tps": 717895, "wall": 2375.9} {"step": 26026, "train_loss": 3.0155527591705322, "lr": 6.0174338119679855e-05, "tps": 716572, "wall": 2380.4} {"step": 26027, "train_loss": 3.1279234886169434, "lr": 6.016552639791184e-05, "tps": 715255, "wall": 2384.8} {"step": 26028, "train_loss": 3.0061957836151123, "lr": 6.01567164867574e-05, "tps": 713938, "wall": 2389.3} {"step": 26029, "train_loss": 2.997917413711548, "lr": 6.014790838631632e-05, "tps": 712629, "wall": 2393.8} {"step": 26030, "train_loss": 3.1403725147247314, "lr": 6.013910209668837e-05, "tps": 711306, "wall": 2398.4} {"step": 26031, "train_loss": 3.0626840591430664, "lr": 6.013029761797333e-05, "tps": 710018, "wall": 2402.8} {"step": 26032, "train_loss": 3.1023716926574707, "lr": 6.012149495027094e-05, "tps": 708729, "wall": 2407.3} {"step": 26033, "train_loss": 3.162039279937744, "lr": 6.0112694093680877e-05, "tps": 707444, "wall": 2411.7} {"step": 26034, "train_loss": 3.0702216625213623, "lr": 6.0103895048302886e-05, "tps": 706163, "wall": 2416.2} {"step": 26035, "train_loss": 3.1346421241760254, "lr": 6.0095097814236636e-05, "tps": 704886, "wall": 2420.7} {"step": 26036, "train_loss": 3.1067566871643066, "lr": 6.008630239158172e-05, "tps": 703614, "wall": 2425.1} {"step": 26037, "train_loss": 3.153444290161133, "lr": 6.0077508780437866e-05, "tps": 702346, "wall": 2429.6} {"step": 26038, "train_loss": 3.025932550430298, "lr": 6.006871698090463e-05, "tps": 701086, "wall": 2434.1} {"step": 26039, "train_loss": 3.153385639190674, "lr": 6.0059926993081595e-05, "tps": 699831, "wall": 2438.5} {"step": 26040, "train_loss": 3.1748874187469482, "lr": 6.005113881706841e-05, "tps": 698577, "wall": 2443.0} {"step": 26041, "train_loss": 3.0140695571899414, "lr": 6.0042352452964545e-05, "tps": 697331, "wall": 2447.5} {"step": 26042, "train_loss": 3.0558817386627197, "lr": 6.003356790086956e-05, "tps": 696084, "wall": 2451.9} {"step": 26043, "train_loss": 3.1450531482696533, "lr": 6.0024785160883e-05, "tps": 694846, "wall": 2456.4} {"step": 26044, "train_loss": 3.070873498916626, "lr": 6.001600423310428e-05, "tps": 693600, "wall": 2460.9} {"step": 26045, "train_loss": 3.1361546516418457, "lr": 6.000722511763296e-05, "tps": 692372, "wall": 2465.4} {"step": 26046, "train_loss": 3.1792449951171875, "lr": 5.999844781456845e-05, "tps": 691150, "wall": 2469.8} {"step": 26047, "train_loss": 3.108959674835205, "lr": 5.998967232401015e-05, "tps": 689921, "wall": 2474.3} {"step": 26048, "train_loss": 3.0775880813598633, "lr": 5.998089864605755e-05, "tps": 688709, "wall": 2478.8} {"step": 26049, "train_loss": 2.9960360527038574, "lr": 5.9972126780809945e-05, "tps": 687496, "wall": 2483.2} {"step": 26050, "train_loss": 3.032118558883667, "lr": 5.996335672836676e-05, "tps": 686292, "wall": 2487.7} {"step": 26051, "train_loss": 3.063981533050537, "lr": 5.9954588488827346e-05, "tps": 685091, "wall": 2492.1} {"step": 26052, "train_loss": 3.1307575702667236, "lr": 5.994582206229096e-05, "tps": 683892, "wall": 2496.6} {"step": 26053, "train_loss": 3.092494010925293, "lr": 5.993705744885699e-05, "tps": 682698, "wall": 2501.1} {"step": 26054, "train_loss": 3.0455050468444824, "lr": 5.9928294648624706e-05, "tps": 681510, "wall": 2505.5} {"step": 26055, "train_loss": 3.0955257415771484, "lr": 5.9919533661693314e-05, "tps": 680325, "wall": 2510.0} {"step": 26056, "train_loss": 3.1346325874328613, "lr": 5.991077448816215e-05, "tps": 679144, "wall": 2514.4} {"step": 26057, "train_loss": 3.010239601135254, "lr": 5.9902017128130386e-05, "tps": 677949, "wall": 2519.0} {"step": 26058, "train_loss": 2.9529013633728027, "lr": 5.989326158169721e-05, "tps": 676780, "wall": 2523.4} {"step": 26059, "train_loss": 3.107365608215332, "lr": 5.9884507848961856e-05, "tps": 675610, "wall": 2527.9} {"step": 26060, "train_loss": 3.001408815383911, "lr": 5.987575593002346e-05, "tps": 674447, "wall": 2532.3} {"step": 26061, "train_loss": 3.115993022918701, "lr": 5.9867005824981124e-05, "tps": 673286, "wall": 2536.8} {"step": 26062, "train_loss": 3.0758392810821533, "lr": 5.985825753393406e-05, "tps": 672128, "wall": 2541.3} {"step": 26063, "train_loss": 3.04203462600708, "lr": 5.98495110569813e-05, "tps": 670979, "wall": 2545.7} {"step": 26064, "train_loss": 3.1309573650360107, "lr": 5.984076639422191e-05, "tps": 669832, "wall": 2550.2} {"step": 26065, "train_loss": 3.0800118446350098, "lr": 5.9832023545755026e-05, "tps": 668689, "wall": 2554.6} {"step": 26066, "train_loss": 2.9858767986297607, "lr": 5.9823282511679604e-05, "tps": 667550, "wall": 2559.1} {"step": 26067, "train_loss": 2.9591336250305176, "lr": 5.981454329209473e-05, "tps": 666415, "wall": 2563.6} {"step": 26068, "train_loss": 3.1846799850463867, "lr": 5.9805805887099384e-05, "tps": 665283, "wall": 2568.0} {"step": 26069, "train_loss": 3.0289411544799805, "lr": 5.979707029679251e-05, "tps": 664154, "wall": 2572.5} {"step": 26070, "train_loss": 3.179868698120117, "lr": 5.978833652127311e-05, "tps": 663032, "wall": 2576.9} {"step": 26071, "train_loss": 2.984281539916992, "lr": 5.9779604560640114e-05, "tps": 661904, "wall": 2581.4} {"step": 26072, "train_loss": 3.0104334354400635, "lr": 5.9770874414992384e-05, "tps": 660789, "wall": 2585.9} {"step": 26073, "train_loss": 2.9747214317321777, "lr": 5.976214608442889e-05, "tps": 659677, "wall": 2590.3} {"step": 26074, "train_loss": 3.1759326457977295, "lr": 5.975341956904847e-05, "tps": 658569, "wall": 2594.8} {"step": 26075, "train_loss": 3.092824935913086, "lr": 5.974469486894996e-05, "tps": 657467, "wall": 2599.2} {"step": 26076, "train_loss": 3.0579400062561035, "lr": 5.973597198423224e-05, "tps": 656369, "wall": 2603.7} {"step": 26077, "train_loss": 3.1447134017944336, "lr": 5.9727250914994104e-05, "tps": 655275, "wall": 2608.1} {"step": 26078, "train_loss": 2.989708662033081, "lr": 5.97185316613343e-05, "tps": 654182, "wall": 2612.6} {"step": 26079, "train_loss": 3.0947556495666504, "lr": 5.970981422335169e-05, "tps": 653093, "wall": 2617.1} {"step": 26080, "train_loss": 3.1227080821990967, "lr": 5.9701098601144966e-05, "tps": 652010, "wall": 2621.5} {"step": 26081, "train_loss": 3.117053270339966, "lr": 5.9692384794812825e-05, "tps": 650924, "wall": 2626.0} {"step": 26082, "train_loss": 3.2138357162475586, "lr": 5.968367280445406e-05, "tps": 649847, "wall": 2630.4} {"step": 26083, "train_loss": 3.0676918029785156, "lr": 5.967496263016734e-05, "tps": 648771, "wall": 2634.9} {"step": 26084, "train_loss": 3.1854794025421143, "lr": 5.966625427205126e-05, "tps": 647685, "wall": 2639.4} {"step": 26085, "train_loss": 3.051865816116333, "lr": 5.965754773020458e-05, "tps": 646622, "wall": 2643.8} {"step": 26086, "train_loss": 3.0505447387695312, "lr": 5.9648843004725815e-05, "tps": 645558, "wall": 2648.3} {"step": 26087, "train_loss": 3.128535032272339, "lr": 5.964014009571368e-05, "tps": 644498, "wall": 2652.8} {"step": 26088, "train_loss": 2.979262590408325, "lr": 5.963143900326671e-05, "tps": 643442, "wall": 2657.2} {"step": 26089, "train_loss": 3.073176860809326, "lr": 5.962273972748344e-05, "tps": 642392, "wall": 2661.7} {"step": 26090, "train_loss": 3.0867724418640137, "lr": 5.96140422684625e-05, "tps": 641344, "wall": 2666.1} {"step": 26091, "train_loss": 2.9710285663604736, "lr": 5.960534662630237e-05, "tps": 640300, "wall": 2670.6} {"step": 26092, "train_loss": 3.0991578102111816, "lr": 5.959665280110148e-05, "tps": 639258, "wall": 2675.0} {"step": 26093, "train_loss": 2.998614549636841, "lr": 5.958796079295844e-05, "tps": 638219, "wall": 2679.5} {"step": 26094, "train_loss": 3.1848716735839844, "lr": 5.957927060197166e-05, "tps": 637185, "wall": 2683.9} {"step": 26095, "train_loss": 3.106588363647461, "lr": 5.957058222823956e-05, "tps": 636154, "wall": 2688.4} {"step": 26096, "train_loss": 3.054960012435913, "lr": 5.956189567186059e-05, "tps": 635123, "wall": 2692.8} {"step": 26097, "train_loss": 3.0143914222717285, "lr": 5.9553210932933166e-05, "tps": 634095, "wall": 2697.3} {"step": 26098, "train_loss": 3.1279938220977783, "lr": 5.95445280115556e-05, "tps": 633066, "wall": 2701.8} {"step": 26099, "train_loss": 3.1687119007110596, "lr": 5.953584690782633e-05, "tps": 632049, "wall": 2706.3} {"step": 26100, "train_loss": 2.9815402030944824, "lr": 5.952716762184369e-05, "tps": 631033, "wall": 2710.7} {"step": 26101, "train_loss": 3.19528865814209, "lr": 5.951849015370594e-05, "tps": 630017, "wall": 2715.2} {"step": 26102, "train_loss": 3.119448661804199, "lr": 5.9509814503511426e-05, "tps": 629008, "wall": 2719.7} {"step": 26103, "train_loss": 3.1518661975860596, "lr": 5.9501140671358403e-05, "tps": 628002, "wall": 2724.1} {"step": 26104, "train_loss": 2.9929122924804688, "lr": 5.9492468657345176e-05, "tps": 626999, "wall": 2728.6} {"step": 26105, "train_loss": 3.081488847732544, "lr": 5.9483798461569926e-05, "tps": 626000, "wall": 2733.0} {"step": 26106, "train_loss": 3.090369462966919, "lr": 5.947513008413088e-05, "tps": 625005, "wall": 2737.5} {"step": 26107, "train_loss": 3.0842814445495605, "lr": 5.9466463525126284e-05, "tps": 624014, "wall": 2741.9} {"step": 26108, "train_loss": 3.041201114654541, "lr": 5.945779878465424e-05, "tps": 623025, "wall": 2746.4} {"step": 26109, "train_loss": 3.1857712268829346, "lr": 5.944913586281292e-05, "tps": 622039, "wall": 2750.9} {"step": 26110, "train_loss": 2.943542242050171, "lr": 5.944047475970051e-05, "tps": 621055, "wall": 2755.3} {"step": 26111, "train_loss": 3.0380146503448486, "lr": 5.94318154754151e-05, "tps": 620066, "wall": 2759.8} {"step": 26112, "train_loss": 3.0713367462158203, "lr": 5.942315801005474e-05, "tps": 619089, "wall": 2764.3} {"step": 26113, "train_loss": 3.1029906272888184, "lr": 5.941450236371754e-05, "tps": 618115, "wall": 2768.7} {"step": 26114, "train_loss": 3.1404740810394287, "lr": 5.940584853650155e-05, "tps": 617142, "wall": 2773.2} {"step": 26115, "train_loss": 3.0587568283081055, "lr": 5.9397196528504774e-05, "tps": 616171, "wall": 2777.7} {"step": 26116, "train_loss": 3.1675376892089844, "lr": 5.9388546339825276e-05, "tps": 615207, "wall": 2782.2} {"step": 26117, "train_loss": 3.115583896636963, "lr": 5.9379897970561016e-05, "tps": 614245, "wall": 2786.6} {"step": 26118, "train_loss": 3.075244903564453, "lr": 5.937125142080992e-05, "tps": 613287, "wall": 2791.1} {"step": 26119, "train_loss": 3.1016972064971924, "lr": 5.936260669067002e-05, "tps": 612325, "wall": 2795.6} {"step": 26120, "train_loss": 3.103395462036133, "lr": 5.9353963780239155e-05, "tps": 611373, "wall": 2800.0} {"step": 26121, "train_loss": 3.1498122215270996, "lr": 5.9345322689615326e-05, "tps": 610425, "wall": 2804.5} {"step": 26122, "train_loss": 3.102506637573242, "lr": 5.9336683418896354e-05, "tps": 609479, "wall": 2808.9} {"step": 26123, "train_loss": 3.060800552368164, "lr": 5.9328045968180114e-05, "tps": 608536, "wall": 2813.4} {"step": 26124, "train_loss": 3.0423498153686523, "lr": 5.931941033756448e-05, "tps": 607581, "wall": 2817.9} {"step": 26125, "train_loss": 3.051422357559204, "lr": 5.931077652714727e-05, "tps": 606649, "wall": 2822.4} {"step": 26126, "train_loss": 3.137010097503662, "lr": 5.930214453702623e-05, "tps": 605715, "wall": 2826.8} {"step": 26127, "train_loss": 2.9908223152160645, "lr": 5.929351436729923e-05, "tps": 604783, "wall": 2831.3} {"step": 26128, "train_loss": 3.1699020862579346, "lr": 5.9284886018064e-05, "tps": 603857, "wall": 2835.8} {"step": 26129, "train_loss": 3.0806050300598145, "lr": 5.927625948941822e-05, "tps": 602932, "wall": 2840.2} {"step": 26130, "train_loss": 3.1101436614990234, "lr": 5.9267634781459723e-05, "tps": 602010, "wall": 2844.7} {"step": 26131, "train_loss": 3.1481852531433105, "lr": 5.925901189428616e-05, "tps": 601092, "wall": 2849.1} {"step": 26132, "train_loss": 3.087533950805664, "lr": 5.925039082799515e-05, "tps": 600174, "wall": 2853.6} {"step": 26133, "train_loss": 3.0575883388519287, "lr": 5.924177158268447e-05, "tps": 599264, "wall": 2858.0} {"step": 26134, "train_loss": 3.068908214569092, "lr": 5.923315415845168e-05, "tps": 598353, "wall": 2862.5} {"step": 26135, "train_loss": 3.0913567543029785, "lr": 5.922453855539437e-05, "tps": 597446, "wall": 2866.9} {"step": 26136, "train_loss": 3.178196668624878, "lr": 5.921592477361024e-05, "tps": 596538, "wall": 2871.4} {"step": 26137, "train_loss": 3.093838930130005, "lr": 5.9207312813196804e-05, "tps": 595639, "wall": 2875.9} {"step": 26138, "train_loss": 3.1297271251678467, "lr": 5.919870267425161e-05, "tps": 594727, "wall": 2880.4} {"step": 26139, "train_loss": 3.059563636779785, "lr": 5.919009435687222e-05, "tps": 593831, "wall": 2884.8} {"step": 26140, "train_loss": 3.2248384952545166, "lr": 5.918148786115612e-05, "tps": 592936, "wall": 2889.3} {"step": 26141, "train_loss": 3.0274219512939453, "lr": 5.9172883187200845e-05, "tps": 592046, "wall": 2893.8} {"step": 26142, "train_loss": 2.959975242614746, "lr": 5.916428033510386e-05, "tps": 591159, "wall": 2898.2} {"step": 26143, "train_loss": 3.1160049438476562, "lr": 5.9155679304962574e-05, "tps": 590274, "wall": 2902.7} {"step": 26144, "train_loss": 3.143772602081299, "lr": 5.9147080096874494e-05, "tps": 589388, "wall": 2907.1} {"step": 26145, "train_loss": 3.069511651992798, "lr": 5.9138482710937006e-05, "tps": 588507, "wall": 2911.6} {"step": 26146, "train_loss": 3.084406852722168, "lr": 5.912988714724743e-05, "tps": 587628, "wall": 2916.1} {"step": 26147, "train_loss": 3.0470633506774902, "lr": 5.912129340590322e-05, "tps": 586754, "wall": 2920.5} {"step": 26148, "train_loss": 3.165816307067871, "lr": 5.9112701487001746e-05, "tps": 585882, "wall": 2925.0} {"step": 26149, "train_loss": 3.1184611320495605, "lr": 5.910411139064022e-05, "tps": 585016, "wall": 2929.4} {"step": 26150, "train_loss": 3.0255823135375977, "lr": 5.9095523116916066e-05, "tps": 584150, "wall": 2933.9} {"step": 26151, "train_loss": 3.126845121383667, "lr": 5.908693666592654e-05, "tps": 583271, "wall": 2938.4} {"step": 26152, "train_loss": 3.0946664810180664, "lr": 5.907835203776887e-05, "tps": 582415, "wall": 2942.9} {"step": 26153, "train_loss": 3.1207118034362793, "lr": 5.906976923254035e-05, "tps": 581558, "wall": 2947.3} {"step": 26154, "train_loss": 3.168640613555908, "lr": 5.906118825033819e-05, "tps": 580700, "wall": 2951.8} {"step": 26155, "train_loss": 3.1401891708374023, "lr": 5.905260909125959e-05, "tps": 579846, "wall": 2956.2} {"step": 26156, "train_loss": 3.1471166610717773, "lr": 5.9044031755401754e-05, "tps": 578998, "wall": 2960.7} {"step": 26157, "train_loss": 3.133542537689209, "lr": 5.9035456242861795e-05, "tps": 578152, "wall": 2965.1} {"step": 26158, "train_loss": 3.026597023010254, "lr": 5.902688255373694e-05, "tps": 577308, "wall": 2969.6} {"step": 26159, "train_loss": 3.116875648498535, "lr": 5.901831068812429e-05, "tps": 576468, "wall": 2974.0} {"step": 26160, "train_loss": 3.0160365104675293, "lr": 5.900974064612085e-05, "tps": 575629, "wall": 2978.5} {"step": 26161, "train_loss": 3.049330234527588, "lr": 5.900117242782382e-05, "tps": 574791, "wall": 2982.9} {"step": 26162, "train_loss": 3.0923712253570557, "lr": 5.899260603333024e-05, "tps": 573956, "wall": 2987.4} {"step": 26163, "train_loss": 3.046637773513794, "lr": 5.898404146273708e-05, "tps": 573122, "wall": 2991.8} {"step": 26164, "train_loss": 3.0841455459594727, "lr": 5.897547871614144e-05, "tps": 572295, "wall": 2996.3} {"step": 26165, "train_loss": 3.083159923553467, "lr": 5.89669177936403e-05, "tps": 571460, "wall": 3000.8} {"step": 26166, "train_loss": 3.0664632320404053, "lr": 5.895835869533059e-05, "tps": 570634, "wall": 3005.2} {"step": 26167, "train_loss": 3.1281018257141113, "lr": 5.8949801421309335e-05, "tps": 569812, "wall": 3009.7} {"step": 26168, "train_loss": 3.200028419494629, "lr": 5.894124597167344e-05, "tps": 568993, "wall": 3014.1} {"step": 26169, "train_loss": 3.0686702728271484, "lr": 5.8932692346519814e-05, "tps": 568177, "wall": 3018.6} {"step": 26170, "train_loss": 3.040806293487549, "lr": 5.892414054594536e-05, "tps": 567362, "wall": 3023.0} {"step": 26171, "train_loss": 3.111520528793335, "lr": 5.891559057004696e-05, "tps": 566549, "wall": 3027.5} {"step": 26172, "train_loss": 3.076298236846924, "lr": 5.890704241892147e-05, "tps": 565740, "wall": 3031.9} {"step": 26173, "train_loss": 3.0478413105010986, "lr": 5.889849609266571e-05, "tps": 564930, "wall": 3036.4} {"step": 26174, "train_loss": 3.112379789352417, "lr": 5.888995159137652e-05, "tps": 564122, "wall": 3040.8} {"step": 26175, "train_loss": 3.0873119831085205, "lr": 5.8881408915150636e-05, "tps": 563319, "wall": 3045.3} {"step": 26176, "train_loss": 3.089796781539917, "lr": 5.8872868064084916e-05, "tps": 562516, "wall": 3049.8} {"step": 26177, "train_loss": 3.043268918991089, "lr": 5.8864329038276014e-05, "tps": 561716, "wall": 3054.2} {"step": 26178, "train_loss": 3.054016351699829, "lr": 5.885579183782074e-05, "tps": 560907, "wall": 3058.7} {"step": 26179, "train_loss": 3.1637003421783447, "lr": 5.884725646281578e-05, "tps": 560117, "wall": 3063.2} {"step": 26180, "train_loss": 3.064873218536377, "lr": 5.883872291335777e-05, "tps": 559326, "wall": 3067.6} {"step": 26181, "train_loss": 3.201411008834839, "lr": 5.883019118954348e-05, "tps": 558534, "wall": 3072.1} {"step": 26182, "train_loss": 3.1404755115509033, "lr": 5.882166129146951e-05, "tps": 557747, "wall": 3076.5} {"step": 26183, "train_loss": 3.027318239212036, "lr": 5.881313321923242e-05, "tps": 556961, "wall": 3081.0} {"step": 26184, "train_loss": 2.981987714767456, "lr": 5.880460697292893e-05, "tps": 556179, "wall": 3085.4} {"step": 26185, "train_loss": 3.1121692657470703, "lr": 5.879608255265557e-05, "tps": 555392, "wall": 3089.9} {"step": 26186, "train_loss": 3.1298060417175293, "lr": 5.878755995850887e-05, "tps": 554616, "wall": 3094.4} {"step": 26187, "train_loss": 3.157331943511963, "lr": 5.877903919058545e-05, "tps": 553840, "wall": 3098.8} {"step": 26188, "train_loss": 3.1316967010498047, "lr": 5.877052024898179e-05, "tps": 553065, "wall": 3103.3} {"step": 26189, "train_loss": 3.0342695713043213, "lr": 5.876200313379436e-05, "tps": 552281, "wall": 3107.8} {"step": 26190, "train_loss": 3.126437187194824, "lr": 5.8753487845119714e-05, "tps": 551507, "wall": 3112.3} {"step": 26191, "train_loss": 3.001676559448242, "lr": 5.874497438305431e-05, "tps": 550739, "wall": 3116.8} {"step": 26192, "train_loss": 3.1513671875, "lr": 5.873646274769449e-05, "tps": 549966, "wall": 3121.3} {"step": 26193, "train_loss": 3.078000068664551, "lr": 5.872795293913681e-05, "tps": 549205, "wall": 3125.7} {"step": 26194, "train_loss": 3.101212501525879, "lr": 5.8719444957477545e-05, "tps": 548444, "wall": 3130.2} {"step": 26195, "train_loss": 3.076080322265625, "lr": 5.871093880281316e-05, "tps": 547685, "wall": 3134.6} {"step": 26196, "train_loss": 3.138781785964966, "lr": 5.870243447524001e-05, "tps": 546930, "wall": 3139.1} {"step": 26197, "train_loss": 3.065861701965332, "lr": 5.8693931974854375e-05, "tps": 546177, "wall": 3143.5} {"step": 26198, "train_loss": 3.0104825496673584, "lr": 5.8685431301752625e-05, "tps": 545425, "wall": 3148.0} {"step": 26199, "train_loss": 3.122962236404419, "lr": 5.867693245603104e-05, "tps": 544675, "wall": 3152.4} {"step": 26200, "train_loss": 3.111776351928711, "lr": 5.866843543778585e-05, "tps": 543929, "wall": 3156.9} {"step": 26201, "train_loss": 3.1222829818725586, "lr": 5.8659940247113385e-05, "tps": 543183, "wall": 3161.3} {"step": 26202, "train_loss": 3.1227128505706787, "lr": 5.865144688410986e-05, "tps": 542438, "wall": 3165.8} {"step": 26203, "train_loss": 3.155696392059326, "lr": 5.864295534887144e-05, "tps": 541695, "wall": 3170.2} {"step": 26204, "train_loss": 3.0640320777893066, "lr": 5.8634465641494385e-05, "tps": 540956, "wall": 3174.7} {"step": 26205, "train_loss": 3.0790886878967285, "lr": 5.8625977762074826e-05, "tps": 540209, "wall": 3179.2} {"step": 26206, "train_loss": 3.1805458068847656, "lr": 5.861749171070887e-05, "tps": 539475, "wall": 3183.7} {"step": 26207, "train_loss": 3.05155086517334, "lr": 5.8609007487492764e-05, "tps": 538743, "wall": 3188.1} {"step": 26208, "train_loss": 3.1444058418273926, "lr": 5.860052509252254e-05, "tps": 538012, "wall": 3192.6} {"step": 26209, "train_loss": 2.987027168273926, "lr": 5.8592044525894254e-05, "tps": 537284, "wall": 3197.0} {"step": 26210, "train_loss": 3.132286548614502, "lr": 5.858356578770407e-05, "tps": 536559, "wall": 3201.4} {"step": 26211, "train_loss": 3.0979228019714355, "lr": 5.8575088878047955e-05, "tps": 535833, "wall": 3205.9} {"step": 26212, "train_loss": 3.11112642288208, "lr": 5.8566613797021986e-05, "tps": 535110, "wall": 3210.4} {"step": 26213, "train_loss": 3.041677713394165, "lr": 5.855814054472214e-05, "tps": 534392, "wall": 3214.8} {"step": 26214, "train_loss": 3.119508743286133, "lr": 5.85496691212444e-05, "tps": 533672, "wall": 3219.2} {"step": 26215, "train_loss": 3.198042631149292, "lr": 5.8541199526684767e-05, "tps": 532953, "wall": 3223.7} {"step": 26216, "train_loss": 3.168130397796631, "lr": 5.853273176113919e-05, "tps": 532238, "wall": 3228.2} {"step": 26217, "train_loss": 3.0419297218322754, "lr": 5.852426582470351e-05, "tps": 531521, "wall": 3232.6} {"step": 26218, "train_loss": 3.1253232955932617, "lr": 5.8515801717473704e-05, "tps": 530811, "wall": 3237.1} {"step": 26219, "train_loss": 3.018911361694336, "lr": 5.850733943954559e-05, "tps": 530095, "wall": 3241.6} {"step": 26220, "train_loss": 3.094235420227051, "lr": 5.8498878991015114e-05, "tps": 529387, "wall": 3246.1} {"step": 26221, "train_loss": 3.1153435707092285, "lr": 5.849042037197808e-05, "tps": 528682, "wall": 3250.5} {"step": 26222, "train_loss": 3.1191139221191406, "lr": 5.8481963582530266e-05, "tps": 527978, "wall": 3255.0} {"step": 26223, "train_loss": 3.068802833557129, "lr": 5.847350862276753e-05, "tps": 527277, "wall": 3259.4} {"step": 26224, "train_loss": 3.12463116645813, "lr": 5.8465055492785636e-05, "tps": 526577, "wall": 3263.9} {"step": 26225, "train_loss": 3.077571392059326, "lr": 5.84566041926803e-05, "tps": 525878, "wall": 3268.3} {"step": 26226, "train_loss": 3.1315970420837402, "lr": 5.844815472254731e-05, "tps": 525184, "wall": 3272.8} {"step": 26227, "train_loss": 3.1289355754852295, "lr": 5.843970708248239e-05, "tps": 524491, "wall": 3277.2} {"step": 26228, "train_loss": 3.0844688415527344, "lr": 5.843126127258116e-05, "tps": 523799, "wall": 3281.7} {"step": 26229, "train_loss": 3.1328611373901367, "lr": 5.842281729293937e-05, "tps": 523109, "wall": 3286.1} {"step": 26230, "train_loss": 3.098905086517334, "lr": 5.8414375143652654e-05, "tps": 522421, "wall": 3290.6} {"step": 26231, "train_loss": 3.030078887939453, "lr": 5.84059348248166e-05, "tps": 521734, "wall": 3295.0} {"step": 26232, "train_loss": 3.100525379180908, "lr": 5.83974963365269e-05, "tps": 521040, "wall": 3299.6} {"step": 26233, "train_loss": 3.0585415363311768, "lr": 5.8389059678879087e-05, "tps": 520358, "wall": 3304.0} {"step": 26234, "train_loss": 3.1108200550079346, "lr": 5.838062485196874e-05, "tps": 519678, "wall": 3308.5} {"step": 26235, "train_loss": 3.0999748706817627, "lr": 5.837219185589143e-05, "tps": 518998, "wall": 3312.9} {"step": 26236, "train_loss": 3.1495232582092285, "lr": 5.836376069074265e-05, "tps": 518322, "wall": 3317.4} {"step": 26237, "train_loss": 3.100581645965576, "lr": 5.835533135661797e-05, "tps": 517648, "wall": 3321.8} {"step": 26238, "train_loss": 3.0673105716705322, "lr": 5.8346903853612845e-05, "tps": 516974, "wall": 3326.3} {"step": 26239, "train_loss": 3.1004583835601807, "lr": 5.83384781818227e-05, "tps": 516301, "wall": 3330.7} {"step": 26240, "train_loss": 3.136232614517212, "lr": 5.8330054341343056e-05, "tps": 515631, "wall": 3335.2} {"step": 26241, "train_loss": 2.9718222618103027, "lr": 5.8321632332269295e-05, "tps": 514962, "wall": 3339.6} {"step": 26242, "train_loss": 3.0806350708007812, "lr": 5.831321215469678e-05, "tps": 514294, "wall": 3344.1} {"step": 26243, "train_loss": 3.1302757263183594, "lr": 5.8304793808721016e-05, "tps": 513630, "wall": 3348.6} {"step": 26244, "train_loss": 3.0844523906707764, "lr": 5.8296377294437275e-05, "tps": 512964, "wall": 3353.0} {"step": 26245, "train_loss": 3.1660988330841064, "lr": 5.828796261194088e-05, "tps": 512300, "wall": 3357.5} {"step": 26246, "train_loss": 3.0023279190063477, "lr": 5.827954976132724e-05, "tps": 511639, "wall": 3362.0} {"step": 26247, "train_loss": 3.0809006690979004, "lr": 5.827113874269161e-05, "tps": 510981, "wall": 3366.4} {"step": 26248, "train_loss": 3.2334542274475098, "lr": 5.8262729556129225e-05, "tps": 510326, "wall": 3370.9} {"step": 26249, "train_loss": 3.091244697570801, "lr": 5.8254322201735434e-05, "tps": 509672, "wall": 3375.3} {"step": 26250, "train_loss": 3.0717086791992188, "lr": 5.824591667960543e-05, "tps": 509019, "wall": 3379.8} {"step": 26251, "train_loss": 3.1312255859375, "lr": 5.8237512989834387e-05, "tps": 508368, "wall": 3384.3} {"step": 26252, "train_loss": 3.003204345703125, "lr": 5.822911113251759e-05, "tps": 507717, "wall": 3388.7} {"step": 26253, "train_loss": 3.0370707511901855, "lr": 5.8220711107750146e-05, "tps": 507069, "wall": 3393.2} {"step": 26254, "train_loss": 3.0436127185821533, "lr": 5.8212312915627266e-05, "tps": 506423, "wall": 3397.6} {"step": 26255, "train_loss": 2.966449499130249, "lr": 5.8203916556244054e-05, "tps": 505779, "wall": 3402.1} {"step": 26256, "train_loss": 3.2023510932922363, "lr": 5.8195522029695595e-05, "tps": 505137, "wall": 3406.6} {"step": 26257, "train_loss": 3.068057060241699, "lr": 5.818712933607706e-05, "tps": 504497, "wall": 3411.0} {"step": 26258, "train_loss": 3.0644173622131348, "lr": 5.817873847548347e-05, "tps": 503858, "wall": 3415.5} {"step": 26259, "train_loss": 3.126157283782959, "lr": 5.817034944800984e-05, "tps": 503214, "wall": 3420.0} {"step": 26260, "train_loss": 3.0597996711730957, "lr": 5.8161962253751304e-05, "tps": 502578, "wall": 3424.4} {"step": 26261, "train_loss": 3.095349073410034, "lr": 5.81535768928028e-05, "tps": 501940, "wall": 3428.9} {"step": 26262, "train_loss": 3.1583468914031982, "lr": 5.81451933652593e-05, "tps": 501308, "wall": 3433.4} {"step": 26263, "train_loss": 3.1532950401306152, "lr": 5.813681167121583e-05, "tps": 500677, "wall": 3437.8} {"step": 26264, "train_loss": 2.980180025100708, "lr": 5.812843181076733e-05, "tps": 500047, "wall": 3442.3} {"step": 26265, "train_loss": 3.025729179382324, "lr": 5.812005378400868e-05, "tps": 499421, "wall": 3446.7} {"step": 26266, "train_loss": 3.11246919631958, "lr": 5.811167759103483e-05, "tps": 498796, "wall": 3451.2} {"step": 26267, "train_loss": 3.07387113571167, "lr": 5.810330323194068e-05, "tps": 498173, "wall": 3455.6} {"step": 26268, "train_loss": 3.068363904953003, "lr": 5.809493070682103e-05, "tps": 497550, "wall": 3460.1} {"step": 26269, "train_loss": 3.124624013900757, "lr": 5.808656001577079e-05, "tps": 496930, "wall": 3464.5} {"step": 26270, "train_loss": 3.0543878078460693, "lr": 5.807819115888475e-05, "tps": 496311, "wall": 3469.0} {"step": 26271, "train_loss": 3.0929670333862305, "lr": 5.8069824136257714e-05, "tps": 495691, "wall": 3473.5} {"step": 26272, "train_loss": 3.1298723220825195, "lr": 5.806145894798448e-05, "tps": 495068, "wall": 3478.0} {"step": 26273, "train_loss": 3.0921833515167236, "lr": 5.805309559415978e-05, "tps": 494456, "wall": 3482.4} {"step": 26274, "train_loss": 3.00056791305542, "lr": 5.804473407487839e-05, "tps": 493842, "wall": 3486.9} {"step": 26275, "train_loss": 3.1265077590942383, "lr": 5.803637439023504e-05, "tps": 493231, "wall": 3491.3} {"step": 26276, "train_loss": 3.2043027877807617, "lr": 5.8028016540324334e-05, "tps": 492622, "wall": 3495.8} {"step": 26277, "train_loss": 3.1339168548583984, "lr": 5.801966052524109e-05, "tps": 492012, "wall": 3500.2} {"step": 26278, "train_loss": 3.16310453414917, "lr": 5.8011306345079875e-05, "tps": 491406, "wall": 3504.7} {"step": 26279, "train_loss": 3.0222136974334717, "lr": 5.800295399993531e-05, "tps": 490801, "wall": 3509.1} {"step": 26280, "train_loss": 2.990687608718872, "lr": 5.799460348990209e-05, "tps": 490197, "wall": 3513.6} {"step": 26281, "train_loss": 3.052532434463501, "lr": 5.7986254815074745e-05, "tps": 489597, "wall": 3518.0} {"step": 26282, "train_loss": 3.118603229522705, "lr": 5.797790797554786e-05, "tps": 488996, "wall": 3522.5} {"step": 26283, "train_loss": 3.0226552486419678, "lr": 5.7969562971416026e-05, "tps": 488398, "wall": 3526.9} {"step": 26284, "train_loss": 3.1405467987060547, "lr": 5.796121980277375e-05, "tps": 487800, "wall": 3531.4} {"step": 26285, "train_loss": 3.038694381713867, "lr": 5.79528784697155e-05, "tps": 487204, "wall": 3535.8} {"step": 26286, "train_loss": 3.2701783180236816, "lr": 5.794453897233584e-05, "tps": 486604, "wall": 3540.3} {"step": 26287, "train_loss": 3.061978578567505, "lr": 5.793620131072923e-05, "tps": 486011, "wall": 3544.8} {"step": 26288, "train_loss": 3.1616930961608887, "lr": 5.792786548499004e-05, "tps": 485419, "wall": 3549.3} {"step": 26289, "train_loss": 3.1317901611328125, "lr": 5.791953149521281e-05, "tps": 484829, "wall": 3553.7} {"step": 26290, "train_loss": 3.1360268592834473, "lr": 5.791119934149185e-05, "tps": 484238, "wall": 3558.2} {"step": 26291, "train_loss": 3.152899980545044, "lr": 5.7902869023921646e-05, "tps": 483651, "wall": 3562.6} {"step": 26292, "train_loss": 3.1354918479919434, "lr": 5.789454054259649e-05, "tps": 483067, "wall": 3567.1} {"step": 26293, "train_loss": 3.0885472297668457, "lr": 5.788621389761072e-05, "tps": 482483, "wall": 3571.5} {"step": 26294, "train_loss": 3.1221675872802734, "lr": 5.787788908905873e-05, "tps": 481901, "wall": 3576.0} {"step": 26295, "train_loss": 3.138695240020752, "lr": 5.786956611703478e-05, "tps": 481320, "wall": 3580.4} {"step": 26296, "train_loss": 3.0390431880950928, "lr": 5.786124498163311e-05, "tps": 480742, "wall": 3584.9} {"step": 26297, "train_loss": 3.220191717147827, "lr": 5.785292568294809e-05, "tps": 480163, "wall": 3589.3} {"step": 26298, "train_loss": 3.0765554904937744, "lr": 5.784460822107387e-05, "tps": 479586, "wall": 3593.8} {"step": 26299, "train_loss": 3.1475906372070312, "lr": 5.7836292596104667e-05, "tps": 479002, "wall": 3598.3} {"step": 26300, "train_loss": 3.0062990188598633, "lr": 5.782797880813478e-05, "tps": 478433, "wall": 3602.7} {"step": 26301, "train_loss": 3.17336368560791, "lr": 5.7819666857258293e-05, "tps": 477861, "wall": 3607.2} {"step": 26302, "train_loss": 3.1017050743103027, "lr": 5.781135674356937e-05, "tps": 477291, "wall": 3611.6} {"step": 26303, "train_loss": 3.149503469467163, "lr": 5.780304846716221e-05, "tps": 476721, "wall": 3616.1} {"step": 26304, "train_loss": 3.160275936126709, "lr": 5.779474202813089e-05, "tps": 476153, "wall": 3620.5} {"step": 26305, "train_loss": 3.075646162033081, "lr": 5.778643742656946e-05, "tps": 475586, "wall": 3625.0} {"step": 26306, "train_loss": 3.1151933670043945, "lr": 5.7778134662572104e-05, "tps": 475019, "wall": 3629.4} {"step": 26307, "train_loss": 3.050126314163208, "lr": 5.776983373623276e-05, "tps": 474457, "wall": 3633.9} {"step": 26308, "train_loss": 3.0802841186523438, "lr": 5.776153464764556e-05, "tps": 473895, "wall": 3638.3} {"step": 26309, "train_loss": 3.076730966567993, "lr": 5.7753237396904456e-05, "tps": 473336, "wall": 3642.8} {"step": 26310, "train_loss": 3.145824432373047, "lr": 5.7744941984103426e-05, "tps": 472777, "wall": 3647.2} {"step": 26311, "train_loss": 3.0732338428497314, "lr": 5.7736648409336515e-05, "tps": 472220, "wall": 3651.6} {"step": 26312, "train_loss": 3.030277729034424, "lr": 5.7728356672697616e-05, "tps": 471661, "wall": 3656.1} {"step": 26313, "train_loss": 2.991889238357544, "lr": 5.7720066774280654e-05, "tps": 471099, "wall": 3660.6} {"step": 26314, "train_loss": 3.059077739715576, "lr": 5.771177871417959e-05, "tps": 470543, "wall": 3665.1} {"step": 26315, "train_loss": 3.117825984954834, "lr": 5.7703492492488265e-05, "tps": 469991, "wall": 3669.5} {"step": 26316, "train_loss": 3.088552474975586, "lr": 5.769520810930051e-05, "tps": 469440, "wall": 3674.0} {"step": 26317, "train_loss": 3.1073756217956543, "lr": 5.768692556471028e-05, "tps": 468890, "wall": 3678.4} {"step": 26318, "train_loss": 3.0965425968170166, "lr": 5.7678644858811314e-05, "tps": 468339, "wall": 3682.9} {"step": 26319, "train_loss": 3.1497859954833984, "lr": 5.767036599169743e-05, "tps": 467789, "wall": 3687.4} {"step": 26320, "train_loss": 3.0982511043548584, "lr": 5.766208896346245e-05, "tps": 467243, "wall": 3691.8} {"step": 26321, "train_loss": 3.1336541175842285, "lr": 5.76538137742001e-05, "tps": 466694, "wall": 3696.3} {"step": 26322, "train_loss": 3.1867899894714355, "lr": 5.76455404240041e-05, "tps": 466150, "wall": 3700.7} {"step": 26323, "train_loss": 3.14322566986084, "lr": 5.763726891296823e-05, "tps": 465606, "wall": 3705.2} {"step": 26324, "train_loss": 3.251225471496582, "lr": 5.762899924118618e-05, "tps": 465064, "wall": 3709.7} {"step": 26325, "train_loss": 3.1360878944396973, "lr": 5.762073140875155e-05, "tps": 464522, "wall": 3714.1} {"step": 26326, "train_loss": 3.008821487426758, "lr": 5.761246541575811e-05, "tps": 463976, "wall": 3718.6} {"step": 26327, "train_loss": 3.02097749710083, "lr": 5.7604201262299415e-05, "tps": 463441, "wall": 3723.1} {"step": 26328, "train_loss": 3.1273841857910156, "lr": 5.759593894846914e-05, "tps": 462906, "wall": 3727.5} {"step": 26329, "train_loss": 3.2012836933135986, "lr": 5.758767847436085e-05, "tps": 462371, "wall": 3732.0} {"step": 26330, "train_loss": 3.1212058067321777, "lr": 5.757941984006809e-05, "tps": 461837, "wall": 3736.4} {"step": 26331, "train_loss": 3.1358485221862793, "lr": 5.7571163045684506e-05, "tps": 461306, "wall": 3740.9} {"step": 26332, "train_loss": 3.0539400577545166, "lr": 5.7562908091303544e-05, "tps": 460775, "wall": 3745.3} {"step": 26333, "train_loss": 3.086839437484741, "lr": 5.755465497701874e-05, "tps": 460246, "wall": 3749.8} {"step": 26334, "train_loss": 3.1756772994995117, "lr": 5.754640370292361e-05, "tps": 459716, "wall": 3754.3} {"step": 26335, "train_loss": 3.085439443588257, "lr": 5.75381542691116e-05, "tps": 459184, "wall": 3758.7} {"step": 26336, "train_loss": 3.0986740589141846, "lr": 5.752990667567615e-05, "tps": 458658, "wall": 3763.2} {"step": 26337, "train_loss": 3.0514256954193115, "lr": 5.752166092271074e-05, "tps": 458133, "wall": 3767.6} {"step": 26338, "train_loss": 3.0964138507843018, "lr": 5.7513417010308734e-05, "tps": 457610, "wall": 3772.1} {"step": 26339, "train_loss": 3.2358641624450684, "lr": 5.750517493856351e-05, "tps": 457087, "wall": 3776.6} {"step": 26340, "train_loss": 3.1385231018066406, "lr": 5.7496934707568486e-05, "tps": 456559, "wall": 3781.1} {"step": 26341, "train_loss": 3.148125410079956, "lr": 5.748869631741696e-05, "tps": 456039, "wall": 3785.5} {"step": 26342, "train_loss": 3.012758493423462, "lr": 5.748045976820227e-05, "tps": 455521, "wall": 3790.0} {"step": 26343, "train_loss": 2.9975697994232178, "lr": 5.747222506001773e-05, "tps": 455002, "wall": 3794.4} {"step": 26344, "train_loss": 3.095871686935425, "lr": 5.7463992192956594e-05, "tps": 454486, "wall": 3798.9} {"step": 26345, "train_loss": 3.027287721633911, "lr": 5.7455761167112167e-05, "tps": 453972, "wall": 3803.3} {"step": 26346, "train_loss": 3.0416641235351562, "lr": 5.744753198257769e-05, "tps": 453459, "wall": 3807.8} {"step": 26347, "train_loss": 3.13505220413208, "lr": 5.7439304639446336e-05, "tps": 452946, "wall": 3812.2} {"step": 26348, "train_loss": 3.1333491802215576, "lr": 5.743107913781136e-05, "tps": 452433, "wall": 3816.7} {"step": 26349, "train_loss": 3.097778558731079, "lr": 5.7422855477765904e-05, "tps": 451922, "wall": 3821.2} {"step": 26350, "train_loss": 3.1352314949035645, "lr": 5.74146336594031e-05, "tps": 451413, "wall": 3825.6} {"step": 26351, "train_loss": 3.0397021770477295, "lr": 5.740641368281617e-05, "tps": 450905, "wall": 3830.1} {"step": 26352, "train_loss": 3.1123626232147217, "lr": 5.739819554809816e-05, "tps": 450398, "wall": 3834.5} {"step": 26353, "train_loss": 3.1596381664276123, "lr": 5.7389979255342195e-05, "tps": 449886, "wall": 3839.1} {"step": 26354, "train_loss": 3.197826862335205, "lr": 5.738176480464135e-05, "tps": 449382, "wall": 3843.5} {"step": 26355, "train_loss": 3.1092755794525146, "lr": 5.737355219608867e-05, "tps": 448878, "wall": 3848.0} {"step": 26356, "train_loss": 3.095392942428589, "lr": 5.7365341429777155e-05, "tps": 448374, "wall": 3852.4} {"step": 26357, "train_loss": 3.2084879875183105, "lr": 5.7357132505799884e-05, "tps": 447876, "wall": 3856.9} {"step": 26358, "train_loss": 3.143916130065918, "lr": 5.734892542424982e-05, "tps": 447377, "wall": 3861.3} {"step": 26359, "train_loss": 3.1863787174224854, "lr": 5.73407201852199e-05, "tps": 446879, "wall": 3865.8} {"step": 26360, "train_loss": 3.149069309234619, "lr": 5.7332516788803116e-05, "tps": 446382, "wall": 3870.2} {"step": 26361, "train_loss": 3.0996971130371094, "lr": 5.7324315235092365e-05, "tps": 445887, "wall": 3874.7} {"step": 26362, "train_loss": 3.0405097007751465, "lr": 5.73161155241806e-05, "tps": 445392, "wall": 3879.1} {"step": 26363, "train_loss": 3.1163558959960938, "lr": 5.730791765616068e-05, "tps": 444898, "wall": 3883.6} {"step": 26364, "train_loss": 3.1781396865844727, "lr": 5.729972163112542e-05, "tps": 444406, "wall": 3888.0} {"step": 26365, "train_loss": 3.073126792907715, "lr": 5.729152744916777e-05, "tps": 443916, "wall": 3892.5} {"step": 26366, "train_loss": 3.1987481117248535, "lr": 5.7283335110380485e-05, "tps": 443426, "wall": 3896.9} {"step": 26367, "train_loss": 3.058812379837036, "lr": 5.727514461485638e-05, "tps": 442932, "wall": 3901.4} {"step": 26368, "train_loss": 3.1067965030670166, "lr": 5.726695596268824e-05, "tps": 442443, "wall": 3905.8} {"step": 26369, "train_loss": 3.121553659439087, "lr": 5.725876915396884e-05, "tps": 441956, "wall": 3910.3} {"step": 26370, "train_loss": 3.0909337997436523, "lr": 5.725058418879087e-05, "tps": 441471, "wall": 3914.7} {"step": 26371, "train_loss": 3.101400136947632, "lr": 5.724240106724712e-05, "tps": 440987, "wall": 3919.2} {"step": 26372, "train_loss": 3.0915589332580566, "lr": 5.7234219789430255e-05, "tps": 440504, "wall": 3923.6} {"step": 26373, "train_loss": 3.0656774044036865, "lr": 5.722604035543292e-05, "tps": 440022, "wall": 3928.1} {"step": 26374, "train_loss": 3.1699867248535156, "lr": 5.721786276534785e-05, "tps": 439541, "wall": 3932.5} {"step": 26375, "train_loss": 3.101628303527832, "lr": 5.7209687019267635e-05, "tps": 439060, "wall": 3937.0} {"step": 26376, "train_loss": 3.1423161029815674, "lr": 5.7201513117284844e-05, "tps": 438581, "wall": 3941.4} {"step": 26377, "train_loss": 3.0619723796844482, "lr": 5.719334105949216e-05, "tps": 438102, "wall": 3945.9} {"step": 26378, "train_loss": 3.113684892654419, "lr": 5.718517084598212e-05, "tps": 437625, "wall": 3950.4} {"step": 26379, "train_loss": 2.9666621685028076, "lr": 5.717700247684723e-05, "tps": 437148, "wall": 3954.8} {"step": 26380, "train_loss": 3.049100399017334, "lr": 5.71688359521801e-05, "tps": 436667, "wall": 3959.3} {"step": 26381, "train_loss": 3.129897356033325, "lr": 5.716067127207321e-05, "tps": 436193, "wall": 3963.8} {"step": 26382, "train_loss": 2.9827842712402344, "lr": 5.715250843661904e-05, "tps": 435720, "wall": 3968.2} {"step": 26383, "train_loss": 3.1509881019592285, "lr": 5.714434744591005e-05, "tps": 435248, "wall": 3972.7} {"step": 26384, "train_loss": 3.106968879699707, "lr": 5.71361883000387e-05, "tps": 434778, "wall": 3977.1} {"step": 26385, "train_loss": 3.1150197982788086, "lr": 5.7128030999097474e-05, "tps": 434310, "wall": 3981.6} {"step": 26386, "train_loss": 3.082125186920166, "lr": 5.711987554317866e-05, "tps": 433841, "wall": 3986.0} {"step": 26387, "train_loss": 3.1505348682403564, "lr": 5.711172193237473e-05, "tps": 433366, "wall": 3990.5} {"step": 26388, "train_loss": 3.040304183959961, "lr": 5.7103570166778054e-05, "tps": 432902, "wall": 3995.0} {"step": 26389, "train_loss": 3.0293307304382324, "lr": 5.709542024648088e-05, "tps": 432435, "wall": 3999.4} {"step": 26390, "train_loss": 3.10330867767334, "lr": 5.708727217157566e-05, "tps": 431970, "wall": 4003.9} {"step": 26391, "train_loss": 3.280080795288086, "lr": 5.7079125942154634e-05, "tps": 431506, "wall": 4008.3} {"step": 26392, "train_loss": 3.0439720153808594, "lr": 5.7070981558310035e-05, "tps": 431044, "wall": 4012.8} {"step": 26393, "train_loss": 3.059476613998413, "lr": 5.706283902013421e-05, "tps": 430582, "wall": 4017.3} {"step": 26394, "train_loss": 3.1283485889434814, "lr": 5.705469832771935e-05, "tps": 430117, "wall": 4021.7} {"step": 26395, "train_loss": 3.0350983142852783, "lr": 5.7046559481157647e-05, "tps": 429655, "wall": 4026.2} {"step": 26396, "train_loss": 3.200207233428955, "lr": 5.703842248054139e-05, "tps": 429199, "wall": 4030.7} {"step": 26397, "train_loss": 3.2260470390319824, "lr": 5.7030287325962686e-05, "tps": 428742, "wall": 4035.1} {"step": 26398, "train_loss": 3.0796799659729004, "lr": 5.702215401751367e-05, "tps": 428285, "wall": 4039.6} {"step": 26399, "train_loss": 3.1182870864868164, "lr": 5.7014022555286537e-05, "tps": 427830, "wall": 4044.0} {"step": 26400, "train_loss": 3.1276967525482178, "lr": 5.700589293937338e-05, "tps": 427376, "wall": 4048.5} {"step": 26401, "train_loss": 3.1375105381011963, "lr": 5.699776516986626e-05, "tps": 426922, "wall": 4052.9} {"step": 26402, "train_loss": 3.174746513366699, "lr": 5.69896392468573e-05, "tps": 426471, "wall": 4057.4} {"step": 26403, "train_loss": 3.131108522415161, "lr": 5.6981515170438524e-05, "tps": 426019, "wall": 4061.8} {"step": 26404, "train_loss": 3.1513822078704834, "lr": 5.697339294070192e-05, "tps": 425568, "wall": 4066.3} {"step": 26405, "train_loss": 3.113010883331299, "lr": 5.696527255773959e-05, "tps": 425119, "wall": 4070.7} {"step": 26406, "train_loss": 3.0753672122955322, "lr": 5.6957154021643445e-05, "tps": 424666, "wall": 4075.2} {"step": 26407, "train_loss": 3.050454616546631, "lr": 5.6949037332505495e-05, "tps": 424214, "wall": 4079.7} {"step": 26408, "train_loss": 3.07027530670166, "lr": 5.694092249041769e-05, "tps": 423768, "wall": 4084.2} {"step": 26409, "train_loss": 3.1066856384277344, "lr": 5.69328094954719e-05, "tps": 423322, "wall": 4088.6} {"step": 26410, "train_loss": 3.076716184616089, "lr": 5.6924698347760065e-05, "tps": 422877, "wall": 4093.1} {"step": 26411, "train_loss": 3.0502891540527344, "lr": 5.691658904737411e-05, "tps": 422433, "wall": 4097.5} {"step": 26412, "train_loss": 3.0741968154907227, "lr": 5.690848159440579e-05, "tps": 421991, "wall": 4102.0} {"step": 26413, "train_loss": 3.133821964263916, "lr": 5.690037598894708e-05, "tps": 421550, "wall": 4106.4} {"step": 26414, "train_loss": 3.142552375793457, "lr": 5.6892272231089725e-05, "tps": 421109, "wall": 4110.9} {"step": 26415, "train_loss": 3.071660041809082, "lr": 5.688417032092549e-05, "tps": 420669, "wall": 4115.3} {"step": 26416, "train_loss": 3.092926263809204, "lr": 5.687607025854623e-05, "tps": 420231, "wall": 4119.8} {"step": 26417, "train_loss": 3.0762834548950195, "lr": 5.6867972044043696e-05, "tps": 419793, "wall": 4124.2} {"step": 26418, "train_loss": 3.1616339683532715, "lr": 5.685987567750954e-05, "tps": 419357, "wall": 4128.7} {"step": 26419, "train_loss": 3.0143747329711914, "lr": 5.685178115903559e-05, "tps": 418921, "wall": 4133.1} {"step": 26420, "train_loss": 3.069634199142456, "lr": 5.6843688488713473e-05, "tps": 418482, "wall": 4137.6} {"step": 26421, "train_loss": 3.0977070331573486, "lr": 5.6835597666634845e-05, "tps": 418047, "wall": 4142.1} {"step": 26422, "train_loss": 3.0458977222442627, "lr": 5.682750869289144e-05, "tps": 417613, "wall": 4146.6} {"step": 26423, "train_loss": 3.0650928020477295, "lr": 5.681942156757481e-05, "tps": 417181, "wall": 4151.0} {"step": 26424, "train_loss": 3.125474691390991, "lr": 5.681133629077663e-05, "tps": 416749, "wall": 4155.5} {"step": 26425, "train_loss": 3.1704375743865967, "lr": 5.6803252862588464e-05, "tps": 416319, "wall": 4159.9} {"step": 26426, "train_loss": 3.0890555381774902, "lr": 5.6795171283101845e-05, "tps": 415890, "wall": 4164.4} {"step": 26427, "train_loss": 3.170344352722168, "lr": 5.678709155240838e-05, "tps": 415461, "wall": 4168.8} {"step": 26428, "train_loss": 3.0025081634521484, "lr": 5.677901367059957e-05, "tps": 415033, "wall": 4173.3} {"step": 26429, "train_loss": 3.1145167350769043, "lr": 5.677093763776689e-05, "tps": 414607, "wall": 4177.7} {"step": 26430, "train_loss": 3.114353656768799, "lr": 5.6762863454001905e-05, "tps": 414181, "wall": 4182.2} {"step": 26431, "train_loss": 3.056702136993408, "lr": 5.6754791119396026e-05, "tps": 413755, "wall": 4186.6} {"step": 26432, "train_loss": 3.0746467113494873, "lr": 5.674672063404068e-05, "tps": 413331, "wall": 4191.1} {"step": 26433, "train_loss": 3.153031826019287, "lr": 5.6738651998027336e-05, "tps": 412909, "wall": 4195.5} {"step": 26434, "train_loss": 3.068197727203369, "lr": 5.673058521144738e-05, "tps": 412479, "wall": 4200.1} {"step": 26435, "train_loss": 3.015138864517212, "lr": 5.6722520274392155e-05, "tps": 412058, "wall": 4204.5} {"step": 26436, "train_loss": 3.1611199378967285, "lr": 5.671445718695306e-05, "tps": 411637, "wall": 4209.0} {"step": 26437, "train_loss": 3.177532196044922, "lr": 5.670639594922147e-05, "tps": 411218, "wall": 4213.4} {"step": 26438, "train_loss": 3.0327529907226562, "lr": 5.66983365612886e-05, "tps": 410799, "wall": 4217.9} {"step": 26439, "train_loss": 3.2586758136749268, "lr": 5.669027902324586e-05, "tps": 410382, "wall": 4222.3} {"step": 26440, "train_loss": 3.1371288299560547, "lr": 5.668222333518442e-05, "tps": 409964, "wall": 4226.8} {"step": 26441, "train_loss": 3.0727498531341553, "lr": 5.667416949719565e-05, "tps": 409548, "wall": 4231.2} {"step": 26442, "train_loss": 3.0941686630249023, "lr": 5.6666117509370706e-05, "tps": 409134, "wall": 4235.7} {"step": 26443, "train_loss": 3.069699764251709, "lr": 5.6658067371800784e-05, "tps": 408719, "wall": 4240.2} {"step": 26444, "train_loss": 3.146354913711548, "lr": 5.665001908457714e-05, "tps": 408307, "wall": 4244.6} {"step": 26445, "train_loss": 3.1596245765686035, "lr": 5.6641972647790944e-05, "tps": 407894, "wall": 4249.1} {"step": 26446, "train_loss": 3.1403822898864746, "lr": 5.663392806153326e-05, "tps": 407483, "wall": 4253.5} {"step": 26447, "train_loss": 3.0630767345428467, "lr": 5.6625885325895325e-05, "tps": 407065, "wall": 4258.0} {"step": 26448, "train_loss": 3.223682403564453, "lr": 5.6617844440968184e-05, "tps": 406657, "wall": 4262.5} {"step": 26449, "train_loss": 3.123861074447632, "lr": 5.6609805406842896e-05, "tps": 406247, "wall": 4266.9} {"step": 26450, "train_loss": 3.114642381668091, "lr": 5.660176822361063e-05, "tps": 405839, "wall": 4271.4} {"step": 26451, "train_loss": 3.146906852722168, "lr": 5.659373289136237e-05, "tps": 405432, "wall": 4275.8} {"step": 26452, "train_loss": 3.055953025817871, "lr": 5.658569941018911e-05, "tps": 405025, "wall": 4280.3} {"step": 26453, "train_loss": 3.1073966026306152, "lr": 5.657766778018192e-05, "tps": 404620, "wall": 4284.7} {"step": 26454, "train_loss": 3.1213231086730957, "lr": 5.656963800143175e-05, "tps": 404216, "wall": 4289.2} {"step": 26455, "train_loss": 3.0148637294769287, "lr": 5.6561610074029526e-05, "tps": 403812, "wall": 4293.6} {"step": 26456, "train_loss": 3.021160125732422, "lr": 5.655358399806626e-05, "tps": 403409, "wall": 4298.1} {"step": 26457, "train_loss": 3.036954402923584, "lr": 5.654555977363283e-05, "tps": 403006, "wall": 4302.5} {"step": 26458, "train_loss": 3.1730806827545166, "lr": 5.653753740082012e-05, "tps": 402606, "wall": 4307.0} {"step": 26459, "train_loss": 3.019275188446045, "lr": 5.652951687971906e-05, "tps": 402206, "wall": 4311.4} {"step": 26460, "train_loss": 3.0573501586914062, "lr": 5.6521498210420445e-05, "tps": 401806, "wall": 4315.9} {"step": 26461, "train_loss": 2.9788711071014404, "lr": 5.6513481393015164e-05, "tps": 401403, "wall": 4320.4} {"step": 26462, "train_loss": 3.0219004154205322, "lr": 5.6505466427594026e-05, "tps": 401004, "wall": 4324.8} {"step": 26463, "train_loss": 3.0733566284179688, "lr": 5.6497453314247764e-05, "tps": 400607, "wall": 4329.3} {"step": 26464, "train_loss": 3.0360355377197266, "lr": 5.6489442053067234e-05, "tps": 400210, "wall": 4333.7} {"step": 26465, "train_loss": 3.1039772033691406, "lr": 5.648143264414315e-05, "tps": 399813, "wall": 4338.2} {"step": 26466, "train_loss": 3.10966420173645, "lr": 5.64734250875662e-05, "tps": 399417, "wall": 4342.7} {"step": 26467, "train_loss": 3.112100601196289, "lr": 5.6465419383427185e-05, "tps": 399023, "wall": 4347.1} {"step": 26468, "train_loss": 3.083446741104126, "lr": 5.645741553181674e-05, "tps": 398630, "wall": 4351.6} {"step": 26469, "train_loss": 3.123621940612793, "lr": 5.644941353282551e-05, "tps": 398238, "wall": 4356.0} {"step": 26470, "train_loss": 3.0594582557678223, "lr": 5.64414133865442e-05, "tps": 397846, "wall": 4360.5} {"step": 26471, "train_loss": 3.1544041633605957, "lr": 5.643341509306341e-05, "tps": 397456, "wall": 4364.9} {"step": 26472, "train_loss": 3.004316568374634, "lr": 5.642541865247371e-05, "tps": 397064, "wall": 4369.4} {"step": 26473, "train_loss": 3.143782377243042, "lr": 5.641742406486574e-05, "tps": 396676, "wall": 4373.8} {"step": 26474, "train_loss": 3.082918405532837, "lr": 5.640943133033006e-05, "tps": 396280, "wall": 4378.4} {"step": 26475, "train_loss": 3.0795915126800537, "lr": 5.640144044895714e-05, "tps": 395895, "wall": 4382.8} {"step": 26476, "train_loss": 3.062298536300659, "lr": 5.6393451420837594e-05, "tps": 395508, "wall": 4387.3} {"step": 26477, "train_loss": 3.137814998626709, "lr": 5.638546424606185e-05, "tps": 395122, "wall": 4391.7} {"step": 26478, "train_loss": 3.050693988800049, "lr": 5.637747892472044e-05, "tps": 394733, "wall": 4396.2} {"step": 26479, "train_loss": 3.120208501815796, "lr": 5.636949545690381e-05, "tps": 394350, "wall": 4400.6} {"step": 26480, "train_loss": 3.0653815269470215, "lr": 5.636151384270236e-05, "tps": 393967, "wall": 4405.1} {"step": 26481, "train_loss": 3.1216461658477783, "lr": 5.635353408220656e-05, "tps": 393584, "wall": 4409.5} {"step": 26482, "train_loss": 3.006291389465332, "lr": 5.634555617550678e-05, "tps": 393201, "wall": 4414.0} {"step": 26483, "train_loss": 3.107992172241211, "lr": 5.6337580122693366e-05, "tps": 392820, "wall": 4418.4} {"step": 26484, "train_loss": 3.121889591217041, "lr": 5.632960592385672e-05, "tps": 392440, "wall": 4422.9} {"step": 26485, "train_loss": 3.1172008514404297, "lr": 5.6321633579087176e-05, "tps": 392059, "wall": 4427.4} {"step": 26486, "train_loss": 2.9995980262756348, "lr": 5.6313663088474944e-05, "tps": 391681, "wall": 4431.8} {"step": 26487, "train_loss": 2.9666547775268555, "lr": 5.630569445211047e-05, "tps": 391301, "wall": 4436.3} {"step": 26488, "train_loss": 3.0923314094543457, "lr": 5.6297727670083924e-05, "tps": 390920, "wall": 4440.8} {"step": 26489, "train_loss": 3.155719518661499, "lr": 5.628976274248554e-05, "tps": 390541, "wall": 4445.2} {"step": 26490, "train_loss": 3.0720977783203125, "lr": 5.628179966940562e-05, "tps": 390165, "wall": 4449.7} {"step": 26491, "train_loss": 3.096126079559326, "lr": 5.627383845093435e-05, "tps": 389789, "wall": 4454.2} {"step": 26492, "train_loss": 3.1331324577331543, "lr": 5.626587908716181e-05, "tps": 389414, "wall": 4458.6} {"step": 26493, "train_loss": 3.1084883213043213, "lr": 5.6257921578178327e-05, "tps": 389040, "wall": 4463.1} {"step": 26494, "train_loss": 3.1124672889709473, "lr": 5.624996592407391e-05, "tps": 388666, "wall": 4467.5} {"step": 26495, "train_loss": 3.0918073654174805, "lr": 5.624201212493879e-05, "tps": 388294, "wall": 4472.0} {"step": 26496, "train_loss": 3.021510601043701, "lr": 5.623406018086299e-05, "tps": 387923, "wall": 4476.4} {"step": 26497, "train_loss": 3.1031031608581543, "lr": 5.622611009193661e-05, "tps": 387552, "wall": 4480.9} {"step": 26498, "train_loss": 3.0235819816589355, "lr": 5.621816185824974e-05, "tps": 387181, "wall": 4485.3} {"step": 26499, "train_loss": 3.0301411151885986, "lr": 5.621021547989239e-05, "tps": 386812, "wall": 4489.8} {"step": 26500, "train_loss": 3.0982506275177, "lr": 5.620227095695455e-05, "tps": 386441, "wall": 4494.3} {"step": 26501, "train_loss": 3.1416306495666504, "lr": 5.6194328289526285e-05, "tps": 386053, "wall": 4498.9} {"step": 26502, "train_loss": 3.243544101715088, "lr": 5.618638747769751e-05, "tps": 385686, "wall": 4503.4} {"step": 26503, "train_loss": 3.1857757568359375, "lr": 5.617844852155819e-05, "tps": 385319, "wall": 4507.9} {"step": 26504, "train_loss": 3.1827328205108643, "lr": 5.617051142119827e-05, "tps": 384952, "wall": 4512.3} {"step": 26505, "train_loss": 3.030667781829834, "lr": 5.616257617670769e-05, "tps": 384587, "wall": 4516.8} {"step": 26506, "train_loss": 3.1595702171325684, "lr": 5.615464278817626e-05, "tps": 384223, "wall": 4521.2} {"step": 26507, "train_loss": 3.2388875484466553, "lr": 5.614671125569395e-05, "tps": 383859, "wall": 4525.7} {"step": 26508, "train_loss": 3.331831455230713, "lr": 5.613878157935055e-05, "tps": 383495, "wall": 4530.2} {"step": 26509, "train_loss": 3.1406564712524414, "lr": 5.613085375923587e-05, "tps": 383133, "wall": 4534.6} {"step": 26510, "train_loss": 3.199272871017456, "lr": 5.612292779543976e-05, "tps": 382772, "wall": 4539.0} {"step": 26511, "train_loss": 3.2849159240722656, "lr": 5.6115003688052e-05, "tps": 382413, "wall": 4543.5} {"step": 26512, "train_loss": 3.2220067977905273, "lr": 5.61070814371623e-05, "tps": 382053, "wall": 4547.9} {"step": 26513, "train_loss": 3.140113353729248, "lr": 5.6099161042860504e-05, "tps": 381694, "wall": 4552.4} {"step": 26514, "train_loss": 3.215700149536133, "lr": 5.609124250523624e-05, "tps": 381335, "wall": 4556.8} {"step": 26515, "train_loss": 3.239955186843872, "lr": 5.6083325824379275e-05, "tps": 380973, "wall": 4561.4} {"step": 26516, "train_loss": 3.2227697372436523, "lr": 5.607541100037925e-05, "tps": 380616, "wall": 4565.8} {"step": 26517, "train_loss": 3.250983715057373, "lr": 5.6067498033325826e-05, "tps": 380259, "wall": 4570.3} {"step": 26518, "train_loss": 3.156667709350586, "lr": 5.6059586923308674e-05, "tps": 379903, "wall": 4574.7} {"step": 26519, "train_loss": 3.197403907775879, "lr": 5.605167767041739e-05, "tps": 379548, "wall": 4579.2} {"step": 26520, "train_loss": 3.2244415283203125, "lr": 5.6043770274741545e-05, "tps": 379194, "wall": 4583.6} {"step": 26521, "train_loss": 3.256274700164795, "lr": 5.603586473637077e-05, "tps": 378840, "wall": 4588.1} {"step": 26522, "train_loss": 3.278271436691284, "lr": 5.602796105539459e-05, "tps": 378487, "wall": 4592.5} {"step": 26523, "train_loss": 3.118746042251587, "lr": 5.60200592319025e-05, "tps": 378134, "wall": 4597.0} {"step": 26524, "train_loss": 3.2815444469451904, "lr": 5.601215926598409e-05, "tps": 377782, "wall": 4601.4} {"step": 26525, "train_loss": 3.0660338401794434, "lr": 5.60042611577288e-05, "tps": 377431, "wall": 4605.9} {"step": 26526, "train_loss": 3.2176613807678223, "lr": 5.599636490722608e-05, "tps": 377082, "wall": 4610.3} {"step": 26527, "train_loss": 3.1916987895965576, "lr": 5.598847051456546e-05, "tps": 376730, "wall": 4614.8} {"step": 26528, "train_loss": 3.1827569007873535, "lr": 5.598057797983631e-05, "tps": 376377, "wall": 4619.3} {"step": 26529, "train_loss": 3.2294905185699463, "lr": 5.597268730312801e-05, "tps": 376028, "wall": 4623.8} {"step": 26530, "train_loss": 3.2894201278686523, "lr": 5.596479848453001e-05, "tps": 375680, "wall": 4628.2} {"step": 26531, "train_loss": 3.174969434738159, "lr": 5.595691152413164e-05, "tps": 375332, "wall": 4632.7} {"step": 26532, "train_loss": 3.2112998962402344, "lr": 5.594902642202225e-05, "tps": 374986, "wall": 4637.1} {"step": 26533, "train_loss": 3.28476619720459, "lr": 5.594114317829119e-05, "tps": 374640, "wall": 4641.6} {"step": 26534, "train_loss": 3.138169288635254, "lr": 5.5933261793027694e-05, "tps": 374295, "wall": 4646.1} {"step": 26535, "train_loss": 3.24519681930542, "lr": 5.592538226632109e-05, "tps": 373950, "wall": 4650.5} {"step": 26536, "train_loss": 3.2403042316436768, "lr": 5.5917504598260664e-05, "tps": 373607, "wall": 4655.0} {"step": 26537, "train_loss": 3.2192978858947754, "lr": 5.5909628788935595e-05, "tps": 373264, "wall": 4659.4} {"step": 26538, "train_loss": 3.243018627166748, "lr": 5.590175483843514e-05, "tps": 372922, "wall": 4663.9} {"step": 26539, "train_loss": 3.1458802223205566, "lr": 5.589388274684848e-05, "tps": 372579, "wall": 4668.3} {"step": 26540, "train_loss": 3.1491599082946777, "lr": 5.5886012514264784e-05, "tps": 372238, "wall": 4672.8} {"step": 26541, "train_loss": 3.1742711067199707, "lr": 5.587814414077325e-05, "tps": 371897, "wall": 4677.2} {"step": 26542, "train_loss": 3.1084964275360107, "lr": 5.5870277626462955e-05, "tps": 371554, "wall": 4681.7} {"step": 26543, "train_loss": 3.2159323692321777, "lr": 5.586241297142303e-05, "tps": 371213, "wall": 4686.2} {"step": 26544, "train_loss": 3.1254091262817383, "lr": 5.585455017574257e-05, "tps": 370875, "wall": 4690.7} {"step": 26545, "train_loss": 3.157733917236328, "lr": 5.5846689239510667e-05, "tps": 370537, "wall": 4695.1} {"step": 26546, "train_loss": 3.068260908126831, "lr": 5.5838830162816314e-05, "tps": 370200, "wall": 4699.6} {"step": 26547, "train_loss": 3.2395200729370117, "lr": 5.5830972945748604e-05, "tps": 369862, "wall": 4704.0} {"step": 26548, "train_loss": 3.1654458045959473, "lr": 5.582311758839647e-05, "tps": 369525, "wall": 4708.5} {"step": 26549, "train_loss": 3.1938629150390625, "lr": 5.581526409084898e-05, "tps": 369190, "wall": 4713.0} {"step": 26550, "train_loss": 3.183152914047241, "lr": 5.580741245319508e-05, "tps": 368855, "wall": 4717.4} {"step": 26551, "train_loss": 3.222726345062256, "lr": 5.5799562675523646e-05, "tps": 368521, "wall": 4721.9} {"step": 26552, "train_loss": 3.186067819595337, "lr": 5.579171475792369e-05, "tps": 368187, "wall": 4726.3} {"step": 26553, "train_loss": 3.2385501861572266, "lr": 5.5783868700484056e-05, "tps": 367855, "wall": 4730.8} {"step": 26554, "train_loss": 3.286018133163452, "lr": 5.577602450329366e-05, "tps": 367520, "wall": 4735.3} {"step": 26555, "train_loss": 3.15313458442688, "lr": 5.576818216644134e-05, "tps": 367186, "wall": 4739.8} {"step": 26556, "train_loss": 3.220806360244751, "lr": 5.5760341690015896e-05, "tps": 366855, "wall": 4744.2} {"step": 26557, "train_loss": 3.204732894897461, "lr": 5.575250307410622e-05, "tps": 366525, "wall": 4748.7} {"step": 26558, "train_loss": 3.2552316188812256, "lr": 5.5744666318801065e-05, "tps": 366193, "wall": 4753.1} {"step": 26559, "train_loss": 3.2205753326416016, "lr": 5.573683142418922e-05, "tps": 365864, "wall": 4757.6} {"step": 26560, "train_loss": 3.171799421310425, "lr": 5.572899839035943e-05, "tps": 365535, "wall": 4762.1} {"step": 26561, "train_loss": 3.100132465362549, "lr": 5.572116721740045e-05, "tps": 365206, "wall": 4766.5} {"step": 26562, "train_loss": 3.181478261947632, "lr": 5.571333790540093e-05, "tps": 364879, "wall": 4771.0} {"step": 26563, "train_loss": 3.0633726119995117, "lr": 5.570551045444965e-05, "tps": 364553, "wall": 4775.4} {"step": 26564, "train_loss": 3.1506168842315674, "lr": 5.5697684864635224e-05, "tps": 364227, "wall": 4779.9} {"step": 26565, "train_loss": 3.202692747116089, "lr": 5.568986113604631e-05, "tps": 363901, "wall": 4784.3} {"step": 26566, "train_loss": 3.1729743480682373, "lr": 5.5682039268771536e-05, "tps": 363576, "wall": 4788.8} {"step": 26567, "train_loss": 3.1633341312408447, "lr": 5.5674219262899526e-05, "tps": 363252, "wall": 4793.3} {"step": 26568, "train_loss": 3.2568466663360596, "lr": 5.566640111851882e-05, "tps": 362925, "wall": 4797.8} {"step": 26569, "train_loss": 3.190732479095459, "lr": 5.565858483571804e-05, "tps": 362600, "wall": 4802.2} {"step": 26570, "train_loss": 3.12373423576355, "lr": 5.565077041458571e-05, "tps": 362278, "wall": 4806.7} {"step": 26571, "train_loss": 3.1802706718444824, "lr": 5.564295785521029e-05, "tps": 361955, "wall": 4811.2} {"step": 26572, "train_loss": 3.1652121543884277, "lr": 5.563514715768038e-05, "tps": 361633, "wall": 4815.6} {"step": 26573, "train_loss": 3.1635937690734863, "lr": 5.5627338322084386e-05, "tps": 361311, "wall": 4820.1} {"step": 26574, "train_loss": 3.188316822052002, "lr": 5.561953134851082e-05, "tps": 360991, "wall": 4824.5} {"step": 26575, "train_loss": 3.189331293106079, "lr": 5.561172623704811e-05, "tps": 360671, "wall": 4829.0} {"step": 26576, "train_loss": 3.1561009883880615, "lr": 5.560392298778463e-05, "tps": 360353, "wall": 4833.4} {"step": 26577, "train_loss": 3.2397820949554443, "lr": 5.55961216008088e-05, "tps": 360035, "wall": 4837.9} {"step": 26578, "train_loss": 3.212235450744629, "lr": 5.558832207620903e-05, "tps": 359716, "wall": 4842.4} {"step": 26579, "train_loss": 3.190728187561035, "lr": 5.55805244140736e-05, "tps": 359399, "wall": 4846.8} {"step": 26580, "train_loss": 3.1072511672973633, "lr": 5.557272861449092e-05, "tps": 359081, "wall": 4851.3} {"step": 26581, "train_loss": 3.1210179328918457, "lr": 5.5564934677549264e-05, "tps": 358763, "wall": 4855.8} {"step": 26582, "train_loss": 3.0511651039123535, "lr": 5.555714260333691e-05, "tps": 358444, "wall": 4860.3} {"step": 26583, "train_loss": 3.215134859085083, "lr": 5.554935239194216e-05, "tps": 358128, "wall": 4864.8} {"step": 26584, "train_loss": 3.221431255340576, "lr": 5.554156404345322e-05, "tps": 357813, "wall": 4869.2} {"step": 26585, "train_loss": 3.142629384994507, "lr": 5.553377755795832e-05, "tps": 357499, "wall": 4873.7} {"step": 26586, "train_loss": 3.209031581878662, "lr": 5.5525992935545744e-05, "tps": 357186, "wall": 4878.1} {"step": 26587, "train_loss": 3.2584476470947266, "lr": 5.5518210176303586e-05, "tps": 356873, "wall": 4882.6} {"step": 26588, "train_loss": 3.1404905319213867, "lr": 5.5510429280320034e-05, "tps": 356560, "wall": 4887.1} {"step": 26589, "train_loss": 3.193331480026245, "lr": 5.550265024768324e-05, "tps": 356245, "wall": 4891.6} {"step": 26590, "train_loss": 3.3028922080993652, "lr": 5.5494873078481345e-05, "tps": 355933, "wall": 4896.0} {"step": 26591, "train_loss": 3.156724214553833, "lr": 5.548709777280238e-05, "tps": 355622, "wall": 4900.5} {"step": 26592, "train_loss": 3.25246000289917, "lr": 5.5479324330734526e-05, "tps": 355311, "wall": 4905.0} {"step": 26593, "train_loss": 3.1713109016418457, "lr": 5.547155275236574e-05, "tps": 355002, "wall": 4909.4} {"step": 26594, "train_loss": 3.2280492782592773, "lr": 5.5463783037784143e-05, "tps": 354693, "wall": 4913.9} {"step": 26595, "train_loss": 3.2184853553771973, "lr": 5.54560151870777e-05, "tps": 354380, "wall": 4918.4} {"step": 26596, "train_loss": 3.1645233631134033, "lr": 5.54482492003344e-05, "tps": 354073, "wall": 4922.9} {"step": 26597, "train_loss": 3.1809797286987305, "lr": 5.5440485077642256e-05, "tps": 353766, "wall": 4927.3} {"step": 26598, "train_loss": 3.2699460983276367, "lr": 5.543272281908921e-05, "tps": 353459, "wall": 4931.8} {"step": 26599, "train_loss": 3.181483745574951, "lr": 5.542496242476314e-05, "tps": 353152, "wall": 4936.3} {"step": 26600, "train_loss": 3.218360424041748, "lr": 5.541720389475204e-05, "tps": 352846, "wall": 4940.7} {"step": 26601, "train_loss": 3.18046236038208, "lr": 5.540944722914375e-05, "tps": 352541, "wall": 4945.2} {"step": 26602, "train_loss": 3.0035977363586426, "lr": 5.5401692428026145e-05, "tps": 352237, "wall": 4949.7} {"step": 26603, "train_loss": 3.1404240131378174, "lr": 5.539393949148706e-05, "tps": 351932, "wall": 4954.1} {"step": 26604, "train_loss": 3.175553798675537, "lr": 5.538618841961436e-05, "tps": 351628, "wall": 4958.6} {"step": 26605, "train_loss": 3.2006664276123047, "lr": 5.5378439212495784e-05, "tps": 351325, "wall": 4963.1} {"step": 26606, "train_loss": 3.130296230316162, "lr": 5.537069187021917e-05, "tps": 351021, "wall": 4967.5} {"step": 26607, "train_loss": 3.1466426849365234, "lr": 5.5362946392872296e-05, "tps": 350718, "wall": 4972.0} {"step": 26608, "train_loss": 3.086168050765991, "lr": 5.535520278054281e-05, "tps": 350415, "wall": 4976.5} {"step": 26609, "train_loss": 3.1162540912628174, "lr": 5.534746103331855e-05, "tps": 350110, "wall": 4981.0} {"step": 26610, "train_loss": 3.1565704345703125, "lr": 5.533972115128712e-05, "tps": 349809, "wall": 4985.5} {"step": 26611, "train_loss": 3.1914801597595215, "lr": 5.533198313453628e-05, "tps": 349509, "wall": 4990.0} {"step": 26612, "train_loss": 3.1212942600250244, "lr": 5.532424698315363e-05, "tps": 349209, "wall": 4994.4} {"step": 26613, "train_loss": 3.128859043121338, "lr": 5.531651269722677e-05, "tps": 348910, "wall": 4998.9} {"step": 26614, "train_loss": 3.1381514072418213, "lr": 5.530878027684343e-05, "tps": 348612, "wall": 5003.4} {"step": 26615, "train_loss": 3.2381796836853027, "lr": 5.5301049722091114e-05, "tps": 348315, "wall": 5007.8} {"step": 26616, "train_loss": 3.28773832321167, "lr": 5.529332103305739e-05, "tps": 348017, "wall": 5012.3} {"step": 26617, "train_loss": 3.23583722114563, "lr": 5.528559420982986e-05, "tps": 347721, "wall": 5016.8} {"step": 26618, "train_loss": 3.160923957824707, "lr": 5.527786925249605e-05, "tps": 347424, "wall": 5021.2} {"step": 26619, "train_loss": 3.11662220954895, "lr": 5.527014616114339e-05, "tps": 347129, "wall": 5025.7} {"step": 26620, "train_loss": 3.137357473373413, "lr": 5.526242493585949e-05, "tps": 346834, "wall": 5030.2} {"step": 26621, "train_loss": 3.2422611713409424, "lr": 5.5254705576731715e-05, "tps": 346539, "wall": 5034.6} {"step": 26622, "train_loss": 3.219954490661621, "lr": 5.524698808384755e-05, "tps": 346240, "wall": 5039.2} {"step": 26623, "train_loss": 3.2746670246124268, "lr": 5.523927245729444e-05, "tps": 345947, "wall": 5043.6} {"step": 26624, "train_loss": 3.2114107608795166, "lr": 5.523155869715977e-05, "tps": 345654, "wall": 5048.1} {"step": 26625, "train_loss": 3.2952919006347656, "lr": 5.522384680353086e-05, "tps": 345361, "wall": 5052.6} {"step": 26626, "train_loss": 3.269746780395508, "lr": 5.5216136776495174e-05, "tps": 345067, "wall": 5057.1} {"step": 26627, "train_loss": 3.2327864170074463, "lr": 5.520842861613997e-05, "tps": 344777, "wall": 5061.5} {"step": 26628, "train_loss": 3.2078585624694824, "lr": 5.5200722322552635e-05, "tps": 344485, "wall": 5066.0} {"step": 26629, "train_loss": 3.1291213035583496, "lr": 5.5193017895820444e-05, "tps": 344195, "wall": 5070.4} {"step": 26630, "train_loss": 3.159256935119629, "lr": 5.518531533603062e-05, "tps": 343905, "wall": 5074.9} {"step": 26631, "train_loss": 3.1301069259643555, "lr": 5.5177614643270495e-05, "tps": 343615, "wall": 5079.4} {"step": 26632, "train_loss": 3.3572371006011963, "lr": 5.5169915817627246e-05, "tps": 343326, "wall": 5083.9} {"step": 26633, "train_loss": 3.1987385749816895, "lr": 5.516221885918811e-05, "tps": 343037, "wall": 5088.3} {"step": 26634, "train_loss": 3.201871395111084, "lr": 5.51545237680403e-05, "tps": 342748, "wall": 5092.8} {"step": 26635, "train_loss": 3.3116159439086914, "lr": 5.514683054427094e-05, "tps": 342459, "wall": 5097.3} {"step": 26636, "train_loss": 3.178633689880371, "lr": 5.513913918796719e-05, "tps": 342170, "wall": 5101.8} {"step": 26637, "train_loss": 3.213073253631592, "lr": 5.5131449699216244e-05, "tps": 341881, "wall": 5106.3} {"step": 26638, "train_loss": 3.216187000274658, "lr": 5.512376207810512e-05, "tps": 341596, "wall": 5110.7} {"step": 26639, "train_loss": 3.1082019805908203, "lr": 5.511607632472091e-05, "tps": 341310, "wall": 5115.2} {"step": 26640, "train_loss": 3.191452980041504, "lr": 5.510839243915076e-05, "tps": 341025, "wall": 5119.7} {"step": 26641, "train_loss": 3.1605584621429443, "lr": 5.510071042148165e-05, "tps": 340740, "wall": 5124.2} {"step": 26642, "train_loss": 3.2084295749664307, "lr": 5.509303027180057e-05, "tps": 340456, "wall": 5128.6} {"step": 26643, "train_loss": 3.1097240447998047, "lr": 5.50853519901946e-05, "tps": 340172, "wall": 5133.1} {"step": 26644, "train_loss": 3.1950843334198, "lr": 5.50776755767507e-05, "tps": 339890, "wall": 5137.6} {"step": 26645, "train_loss": 3.275367259979248, "lr": 5.5070001031555774e-05, "tps": 339607, "wall": 5142.0} {"step": 26646, "train_loss": 3.166045665740967, "lr": 5.5062328354696815e-05, "tps": 339325, "wall": 5146.5} {"step": 26647, "train_loss": 3.1797800064086914, "lr": 5.505465754626071e-05, "tps": 339044, "wall": 5151.0} {"step": 26648, "train_loss": 3.193906784057617, "lr": 5.504698860633439e-05, "tps": 338761, "wall": 5155.4} {"step": 26649, "train_loss": 3.280568838119507, "lr": 5.503932153500471e-05, "tps": 338478, "wall": 5160.0} {"step": 26650, "train_loss": 3.138784646987915, "lr": 5.503165633235849e-05, "tps": 338198, "wall": 5164.4} {"step": 26651, "train_loss": 3.182314872741699, "lr": 5.502399299848262e-05, "tps": 337918, "wall": 5168.9} {"step": 26652, "train_loss": 3.181581974029541, "lr": 5.501633153346391e-05, "tps": 337639, "wall": 5173.4} {"step": 26653, "train_loss": 3.221625804901123, "lr": 5.500867193738906e-05, "tps": 337361, "wall": 5177.8} {"step": 26654, "train_loss": 3.2180750370025635, "lr": 5.5001014210344914e-05, "tps": 337083, "wall": 5182.3} {"step": 26655, "train_loss": 3.2116522789001465, "lr": 5.499335835241822e-05, "tps": 336805, "wall": 5186.8} {"step": 26656, "train_loss": 3.1997828483581543, "lr": 5.4985704363695675e-05, "tps": 336528, "wall": 5191.2} {"step": 26657, "train_loss": 3.256895065307617, "lr": 5.4978052244264024e-05, "tps": 336251, "wall": 5195.7} {"step": 26658, "train_loss": 3.1868834495544434, "lr": 5.497040199420992e-05, "tps": 335975, "wall": 5200.2} {"step": 26659, "train_loss": 3.1002798080444336, "lr": 5.496275361362001e-05, "tps": 335699, "wall": 5204.6} {"step": 26660, "train_loss": 3.237159013748169, "lr": 5.495510710258096e-05, "tps": 335424, "wall": 5209.1} {"step": 26661, "train_loss": 3.153341770172119, "lr": 5.494746246117941e-05, "tps": 335149, "wall": 5213.6} {"step": 26662, "train_loss": 3.2780752182006836, "lr": 5.4939819689501906e-05, "tps": 334871, "wall": 5218.1} {"step": 26663, "train_loss": 3.17922306060791, "lr": 5.4932178787635055e-05, "tps": 334598, "wall": 5222.5} {"step": 26664, "train_loss": 3.202434778213501, "lr": 5.492453975566541e-05, "tps": 334324, "wall": 5227.0} {"step": 26665, "train_loss": 3.1970531940460205, "lr": 5.491690259367954e-05, "tps": 334051, "wall": 5231.5} {"step": 26666, "train_loss": 3.108520746231079, "lr": 5.490926730176392e-05, "tps": 333778, "wall": 5236.0} {"step": 26667, "train_loss": 3.1578943729400635, "lr": 5.490163388000501e-05, "tps": 333506, "wall": 5240.4} {"step": 26668, "train_loss": 3.1098756790161133, "lr": 5.489400232848936e-05, "tps": 333235, "wall": 5244.9} {"step": 26669, "train_loss": 3.174546003341675, "lr": 5.48863726473034e-05, "tps": 332964, "wall": 5249.3} {"step": 26670, "train_loss": 3.0617308616638184, "lr": 5.48787448365335e-05, "tps": 332694, "wall": 5253.8} {"step": 26671, "train_loss": 3.2208166122436523, "lr": 5.487111889626614e-05, "tps": 332424, "wall": 5258.3} {"step": 26672, "train_loss": 3.1263723373413086, "lr": 5.486349482658768e-05, "tps": 332154, "wall": 5262.7} {"step": 26673, "train_loss": 3.2282190322875977, "lr": 5.4855872627584445e-05, "tps": 331885, "wall": 5267.2} {"step": 26674, "train_loss": 3.239311695098877, "lr": 5.484825229934287e-05, "tps": 331617, "wall": 5271.7} {"step": 26675, "train_loss": 3.1477465629577637, "lr": 5.4840633841949206e-05, "tps": 331348, "wall": 5276.1} {"step": 26676, "train_loss": 3.1871337890625, "lr": 5.483301725548975e-05, "tps": 331078, "wall": 5280.6} {"step": 26677, "train_loss": 3.1651082038879395, "lr": 5.4825402540050864e-05, "tps": 330809, "wall": 5285.1} {"step": 26678, "train_loss": 3.1728885173797607, "lr": 5.4817789695718736e-05, "tps": 330542, "wall": 5289.6} {"step": 26679, "train_loss": 3.1452717781066895, "lr": 5.481017872257959e-05, "tps": 330276, "wall": 5294.1} {"step": 26680, "train_loss": 3.0924549102783203, "lr": 5.48025696207197e-05, "tps": 330010, "wall": 5298.5} {"step": 26681, "train_loss": 3.210519790649414, "lr": 5.4794962390225235e-05, "tps": 329745, "wall": 5303.0} {"step": 26682, "train_loss": 3.1232833862304688, "lr": 5.478735703118237e-05, "tps": 329480, "wall": 5307.4} {"step": 26683, "train_loss": 3.1813414096832275, "lr": 5.4779753543677284e-05, "tps": 329216, "wall": 5311.9} {"step": 26684, "train_loss": 3.096487045288086, "lr": 5.477215192779606e-05, "tps": 328952, "wall": 5316.4} {"step": 26685, "train_loss": 3.117055654525757, "lr": 5.4764552183624853e-05, "tps": 328687, "wall": 5320.8} {"step": 26686, "train_loss": 3.24522066116333, "lr": 5.475695431124974e-05, "tps": 328424, "wall": 5325.3} {"step": 26687, "train_loss": 3.1636931896209717, "lr": 5.474935831075677e-05, "tps": 328161, "wall": 5329.8} {"step": 26688, "train_loss": 3.080355167388916, "lr": 5.474176418223202e-05, "tps": 327899, "wall": 5334.2} {"step": 26689, "train_loss": 3.3113651275634766, "lr": 5.473417192576153e-05, "tps": 327633, "wall": 5338.8} {"step": 26690, "train_loss": 3.259517192840576, "lr": 5.4726581541431246e-05, "tps": 327373, "wall": 5343.2} {"step": 26691, "train_loss": 3.1649882793426514, "lr": 5.471899302932721e-05, "tps": 327111, "wall": 5347.7} {"step": 26692, "train_loss": 3.1113643646240234, "lr": 5.471140638953536e-05, "tps": 326850, "wall": 5352.2} {"step": 26693, "train_loss": 3.1685280799865723, "lr": 5.470382162214161e-05, "tps": 326588, "wall": 5356.6} {"step": 26694, "train_loss": 3.1998722553253174, "lr": 5.469623872723194e-05, "tps": 326330, "wall": 5361.1} {"step": 26695, "train_loss": 3.1985621452331543, "lr": 5.468865770489223e-05, "tps": 326071, "wall": 5365.5} {"step": 26696, "train_loss": 3.2185311317443848, "lr": 5.468107855520832e-05, "tps": 325813, "wall": 5370.0} {"step": 26697, "train_loss": 3.232332706451416, "lr": 5.4673501278266105e-05, "tps": 325555, "wall": 5374.5} {"step": 26698, "train_loss": 3.1374573707580566, "lr": 5.466592587415142e-05, "tps": 325297, "wall": 5378.9} {"step": 26699, "train_loss": 3.293353796005249, "lr": 5.465835234295007e-05, "tps": 325040, "wall": 5383.4} {"step": 26700, "train_loss": 3.250079870223999, "lr": 5.4650780684747845e-05, "tps": 324783, "wall": 5387.8} {"step": 26701, "train_loss": 3.3043971061706543, "lr": 5.4643210899630515e-05, "tps": 324526, "wall": 5392.3} {"step": 26702, "train_loss": 3.1558547019958496, "lr": 5.463564298768383e-05, "tps": 324270, "wall": 5396.8} {"step": 26703, "train_loss": 3.2185981273651123, "lr": 5.462807694899357e-05, "tps": 324011, "wall": 5401.3} {"step": 26704, "train_loss": 3.238348960876465, "lr": 5.462051278364535e-05, "tps": 323755, "wall": 5405.7} {"step": 26705, "train_loss": 3.2468650341033936, "lr": 5.461295049172494e-05, "tps": 323499, "wall": 5410.2} {"step": 26706, "train_loss": 3.214557647705078, "lr": 5.4605390073317976e-05, "tps": 323245, "wall": 5414.7} {"step": 26707, "train_loss": 3.160644769668579, "lr": 5.459783152851008e-05, "tps": 322991, "wall": 5419.1} {"step": 26708, "train_loss": 3.230419635772705, "lr": 5.4590274857386916e-05, "tps": 322738, "wall": 5423.6} {"step": 26709, "train_loss": 3.175954580307007, "lr": 5.4582720060034066e-05, "tps": 322484, "wall": 5428.1} {"step": 26710, "train_loss": 3.132960796356201, "lr": 5.457516713653708e-05, "tps": 322231, "wall": 5432.5} {"step": 26711, "train_loss": 3.1737518310546875, "lr": 5.456761608698159e-05, "tps": 321979, "wall": 5437.0} {"step": 26712, "train_loss": 3.1790058612823486, "lr": 5.456006691145309e-05, "tps": 321727, "wall": 5441.4} {"step": 26713, "train_loss": 3.205889940261841, "lr": 5.455251961003707e-05, "tps": 321476, "wall": 5445.9} {"step": 26714, "train_loss": 3.227442502975464, "lr": 5.4544974182819074e-05, "tps": 321225, "wall": 5450.4} {"step": 26715, "train_loss": 3.190308094024658, "lr": 5.453743062988459e-05, "tps": 320975, "wall": 5454.8} {"step": 26716, "train_loss": 3.1854114532470703, "lr": 5.4529888951318995e-05, "tps": 320721, "wall": 5459.3} {"step": 26717, "train_loss": 3.2242002487182617, "lr": 5.4522349147207806e-05, "tps": 320472, "wall": 5463.8} {"step": 26718, "train_loss": 3.232574939727783, "lr": 5.451481121763637e-05, "tps": 320222, "wall": 5468.2} {"step": 26719, "train_loss": 3.1356358528137207, "lr": 5.450727516269013e-05, "tps": 319974, "wall": 5472.7} {"step": 26720, "train_loss": 3.1560559272766113, "lr": 5.4499740982454426e-05, "tps": 319726, "wall": 5477.1} {"step": 26721, "train_loss": 3.1845786571502686, "lr": 5.449220867701459e-05, "tps": 319478, "wall": 5481.6} {"step": 26722, "train_loss": 3.1850662231445312, "lr": 5.4484678246456023e-05, "tps": 319231, "wall": 5486.0} {"step": 26723, "train_loss": 3.2315802574157715, "lr": 5.4477149690863926e-05, "tps": 318984, "wall": 5490.5} {"step": 26724, "train_loss": 3.2182862758636475, "lr": 5.4469623010323645e-05, "tps": 318737, "wall": 5495.0} {"step": 26725, "train_loss": 3.210452079772949, "lr": 5.446209820492044e-05, "tps": 318490, "wall": 5499.4} {"step": 26726, "train_loss": 3.187537670135498, "lr": 5.44545752747395e-05, "tps": 318244, "wall": 5503.9} {"step": 26727, "train_loss": 3.184959888458252, "lr": 5.444705421986612e-05, "tps": 317998, "wall": 5508.4} {"step": 26728, "train_loss": 3.405405044555664, "lr": 5.443953504038549e-05, "tps": 317753, "wall": 5512.8} {"step": 26729, "train_loss": 3.1360132694244385, "lr": 5.443201773638271e-05, "tps": 317506, "wall": 5517.3} {"step": 26730, "train_loss": 3.181856393814087, "lr": 5.4424502307943015e-05, "tps": 317261, "wall": 5521.8} {"step": 26731, "train_loss": 3.1306209564208984, "lr": 5.4416988755151534e-05, "tps": 317015, "wall": 5526.2} {"step": 26732, "train_loss": 3.164632797241211, "lr": 5.440947707809333e-05, "tps": 316772, "wall": 5530.7} {"step": 26733, "train_loss": 3.0614233016967773, "lr": 5.440196727685354e-05, "tps": 316528, "wall": 5535.2} {"step": 26734, "train_loss": 3.1628565788269043, "lr": 5.439445935151725e-05, "tps": 316285, "wall": 5539.6} {"step": 26735, "train_loss": 3.187887668609619, "lr": 5.438695330216943e-05, "tps": 316043, "wall": 5544.1} {"step": 26736, "train_loss": 3.2027931213378906, "lr": 5.4379449128895196e-05, "tps": 315800, "wall": 5548.5} {"step": 26737, "train_loss": 3.2253735065460205, "lr": 5.437194683177953e-05, "tps": 315558, "wall": 5553.0} {"step": 26738, "train_loss": 3.234471082687378, "lr": 5.436444641090739e-05, "tps": 315317, "wall": 5557.5} {"step": 26739, "train_loss": 3.1076672077178955, "lr": 5.4356947866363774e-05, "tps": 315076, "wall": 5561.9} {"step": 26740, "train_loss": 3.179572582244873, "lr": 5.4349451198233626e-05, "tps": 314835, "wall": 5566.4} {"step": 26741, "train_loss": 3.1730854511260986, "lr": 5.4341956406601804e-05, "tps": 314595, "wall": 5570.8} {"step": 26742, "train_loss": 3.2127435207366943, "lr": 5.43344634915533e-05, "tps": 314355, "wall": 5575.3} {"step": 26743, "train_loss": 3.211355447769165, "lr": 5.432697245317294e-05, "tps": 314113, "wall": 5579.8} {"step": 26744, "train_loss": 3.219561815261841, "lr": 5.431948329154564e-05, "tps": 313874, "wall": 5584.3} {"step": 26745, "train_loss": 3.183248996734619, "lr": 5.431199600675616e-05, "tps": 313635, "wall": 5588.7} {"step": 26746, "train_loss": 3.3216042518615723, "lr": 5.4304510598889335e-05, "tps": 313395, "wall": 5593.2} {"step": 26747, "train_loss": 3.320857048034668, "lr": 5.429702706803001e-05, "tps": 313158, "wall": 5597.7} {"step": 26748, "train_loss": 3.2891159057617188, "lr": 5.428954541426294e-05, "tps": 312920, "wall": 5602.1} {"step": 26749, "train_loss": 3.2332100868225098, "lr": 5.428206563767284e-05, "tps": 312683, "wall": 5606.6} {"step": 26750, "train_loss": 3.1431431770324707, "lr": 5.427458773834446e-05, "tps": 312446, "wall": 5611.0} {"step": 26751, "train_loss": 3.2523820400238037, "lr": 5.426711171636255e-05, "tps": 312210, "wall": 5615.5} {"step": 26752, "train_loss": 3.232705593109131, "lr": 5.4259637571811715e-05, "tps": 311974, "wall": 5620.0} {"step": 26753, "train_loss": 3.2068638801574707, "lr": 5.425216530477671e-05, "tps": 311738, "wall": 5624.4} {"step": 26754, "train_loss": 3.165299892425537, "lr": 5.4244694915342146e-05, "tps": 311503, "wall": 5628.9} {"step": 26755, "train_loss": 3.180718183517456, "lr": 5.42372264035926e-05, "tps": 311268, "wall": 5633.3} {"step": 26756, "train_loss": 3.124011278152466, "lr": 5.4229759769612775e-05, "tps": 311030, "wall": 5637.9} {"step": 26757, "train_loss": 3.1870036125183105, "lr": 5.422229501348719e-05, "tps": 310795, "wall": 5642.3} {"step": 26758, "train_loss": 3.118722438812256, "lr": 5.421483213530038e-05, "tps": 310561, "wall": 5646.8} {"step": 26759, "train_loss": 3.2577614784240723, "lr": 5.420737113513695e-05, "tps": 310327, "wall": 5651.3} {"step": 26760, "train_loss": 3.187325954437256, "lr": 5.4199912013081355e-05, "tps": 310093, "wall": 5655.7} {"step": 26761, "train_loss": 3.2050254344940186, "lr": 5.419245476921816e-05, "tps": 309860, "wall": 5660.2} {"step": 26762, "train_loss": 3.2334377765655518, "lr": 5.418499940363182e-05, "tps": 309628, "wall": 5664.7} {"step": 26763, "train_loss": 3.1305181980133057, "lr": 5.417754591640674e-05, "tps": 309395, "wall": 5669.1} {"step": 26764, "train_loss": 3.17071270942688, "lr": 5.417009430762742e-05, "tps": 309164, "wall": 5673.6} {"step": 26765, "train_loss": 3.0636565685272217, "lr": 5.416264457737823e-05, "tps": 308932, "wall": 5678.1} {"step": 26766, "train_loss": 3.188872814178467, "lr": 5.415519672574355e-05, "tps": 308701, "wall": 5682.5} {"step": 26767, "train_loss": 3.173731565475464, "lr": 5.414775075280782e-05, "tps": 308471, "wall": 5687.0} {"step": 26768, "train_loss": 3.039649724960327, "lr": 5.4140306658655324e-05, "tps": 308240, "wall": 5691.4} {"step": 26769, "train_loss": 3.0873560905456543, "lr": 5.413286444337039e-05, "tps": 308011, "wall": 5695.9} {"step": 26770, "train_loss": 3.274470806121826, "lr": 5.412542410703736e-05, "tps": 307779, "wall": 5700.4} {"step": 26771, "train_loss": 3.1220016479492188, "lr": 5.4117985649740486e-05, "tps": 307549, "wall": 5704.9} {"step": 26772, "train_loss": 3.190659999847412, "lr": 5.4110549071564056e-05, "tps": 307320, "wall": 5709.3} {"step": 26773, "train_loss": 3.2344698905944824, "lr": 5.410311437259229e-05, "tps": 307092, "wall": 5713.8} {"step": 26774, "train_loss": 3.224144458770752, "lr": 5.409568155290945e-05, "tps": 306864, "wall": 5718.2} {"step": 26775, "train_loss": 3.2115960121154785, "lr": 5.4088250612599644e-05, "tps": 306637, "wall": 5722.7} {"step": 26776, "train_loss": 3.260523796081543, "lr": 5.4080821551747155e-05, "tps": 306410, "wall": 5727.1} {"step": 26777, "train_loss": 3.207594633102417, "lr": 5.407339437043608e-05, "tps": 306184, "wall": 5731.6} {"step": 26778, "train_loss": 3.246906042098999, "lr": 5.406596906875059e-05, "tps": 305957, "wall": 5736.0} {"step": 26779, "train_loss": 3.1417436599731445, "lr": 5.405854564677476e-05, "tps": 305731, "wall": 5740.5} {"step": 26780, "train_loss": 3.281383514404297, "lr": 5.40511241045927e-05, "tps": 305505, "wall": 5745.0} {"step": 26781, "train_loss": 3.11548113822937, "lr": 5.40437044422885e-05, "tps": 305280, "wall": 5749.4} {"step": 26782, "train_loss": 3.139449119567871, "lr": 5.403628665994619e-05, "tps": 305054, "wall": 5753.9} {"step": 26783, "train_loss": 3.157933235168457, "lr": 5.402887075764979e-05, "tps": 304825, "wall": 5758.4} {"step": 26784, "train_loss": 3.2088942527770996, "lr": 5.4021456735483334e-05, "tps": 304601, "wall": 5762.9} {"step": 26785, "train_loss": 3.125399589538574, "lr": 5.401404459353081e-05, "tps": 304377, "wall": 5767.3} {"step": 26786, "train_loss": 3.198805332183838, "lr": 5.400663433187611e-05, "tps": 304153, "wall": 5771.8} {"step": 26787, "train_loss": 3.153414011001587, "lr": 5.3999225950603296e-05, "tps": 303930, "wall": 5776.3} {"step": 26788, "train_loss": 3.154189348220825, "lr": 5.399181944979623e-05, "tps": 303706, "wall": 5780.7} {"step": 26789, "train_loss": 3.2260847091674805, "lr": 5.398441482953878e-05, "tps": 303483, "wall": 5785.2} {"step": 26790, "train_loss": 3.221174716949463, "lr": 5.397701208991488e-05, "tps": 303260, "wall": 5789.7} {"step": 26791, "train_loss": 3.1730165481567383, "lr": 5.396961123100838e-05, "tps": 303036, "wall": 5794.1} {"step": 26792, "train_loss": 3.1328654289245605, "lr": 5.3962212252903055e-05, "tps": 302814, "wall": 5798.6} {"step": 26793, "train_loss": 3.1988821029663086, "lr": 5.395481515568283e-05, "tps": 302593, "wall": 5803.1} {"step": 26794, "train_loss": 3.1952762603759766, "lr": 5.3947419939431445e-05, "tps": 302372, "wall": 5807.5} {"step": 26795, "train_loss": 3.1452078819274902, "lr": 5.394002660423262e-05, "tps": 302152, "wall": 5812.0} {"step": 26796, "train_loss": 3.1837992668151855, "lr": 5.393263515017019e-05, "tps": 301930, "wall": 5816.5} {"step": 26797, "train_loss": 3.2032470703125, "lr": 5.3925245577327824e-05, "tps": 301708, "wall": 5821.0} {"step": 26798, "train_loss": 3.1600325107574463, "lr": 5.39178578857893e-05, "tps": 301489, "wall": 5825.4} {"step": 26799, "train_loss": 3.1186130046844482, "lr": 5.391047207563824e-05, "tps": 301269, "wall": 5829.9} {"step": 26800, "train_loss": 3.179028034210205, "lr": 5.3903088146958335e-05, "tps": 301050, "wall": 5834.3} {"step": 26801, "train_loss": 3.2546839714050293, "lr": 5.389570609983325e-05, "tps": 300831, "wall": 5838.8} {"step": 26802, "train_loss": 3.033158779144287, "lr": 5.388832593434662e-05, "tps": 300612, "wall": 5843.3} {"step": 26803, "train_loss": 3.191443681716919, "lr": 5.388094765058196e-05, "tps": 300394, "wall": 5847.7} {"step": 26804, "train_loss": 3.282301902770996, "lr": 5.3873571248622946e-05, "tps": 300177, "wall": 5852.2} {"step": 26805, "train_loss": 3.1690967082977295, "lr": 5.386619672855311e-05, "tps": 299960, "wall": 5856.6} {"step": 26806, "train_loss": 3.134294033050537, "lr": 5.385882409045594e-05, "tps": 299743, "wall": 5861.1} {"step": 26807, "train_loss": 3.2367806434631348, "lr": 5.385145333441505e-05, "tps": 299526, "wall": 5865.6} {"step": 26808, "train_loss": 3.213212251663208, "lr": 5.3844084460513875e-05, "tps": 299309, "wall": 5870.0} {"step": 26809, "train_loss": 3.146177291870117, "lr": 5.383671746883586e-05, "tps": 299094, "wall": 5874.5} {"step": 26810, "train_loss": 3.1721153259277344, "lr": 5.382935235946454e-05, "tps": 298874, "wall": 5879.0} {"step": 26811, "train_loss": 3.100879669189453, "lr": 5.3821989132483316e-05, "tps": 298659, "wall": 5883.5} {"step": 26812, "train_loss": 3.2369308471679688, "lr": 5.3814627787975545e-05, "tps": 298444, "wall": 5887.9} {"step": 26813, "train_loss": 3.1349172592163086, "lr": 5.3807268326024704e-05, "tps": 298229, "wall": 5892.4} {"step": 26814, "train_loss": 3.2063045501708984, "lr": 5.3799910746714086e-05, "tps": 298012, "wall": 5896.9} {"step": 26815, "train_loss": 3.2788710594177246, "lr": 5.379255505012709e-05, "tps": 297800, "wall": 5901.3} {"step": 26816, "train_loss": 3.129743814468384, "lr": 5.378520123634702e-05, "tps": 297586, "wall": 5905.8} {"step": 26817, "train_loss": 3.2656469345092773, "lr": 5.377784930545715e-05, "tps": 297372, "wall": 5910.2} {"step": 26818, "train_loss": 3.234544515609741, "lr": 5.377049925754084e-05, "tps": 297159, "wall": 5914.7} {"step": 26819, "train_loss": 3.11845064163208, "lr": 5.376315109268131e-05, "tps": 296946, "wall": 5919.2} {"step": 26820, "train_loss": 3.301008701324463, "lr": 5.375580481096176e-05, "tps": 296733, "wall": 5923.6} {"step": 26821, "train_loss": 3.205630302429199, "lr": 5.374846041246547e-05, "tps": 296521, "wall": 5928.1} {"step": 26822, "train_loss": 3.2431559562683105, "lr": 5.3741117897275614e-05, "tps": 296310, "wall": 5932.5} {"step": 26823, "train_loss": 3.2430992126464844, "lr": 5.3733777265475346e-05, "tps": 296098, "wall": 5937.0} {"step": 26824, "train_loss": 3.1388206481933594, "lr": 5.3726438517147894e-05, "tps": 295885, "wall": 5941.5} {"step": 26825, "train_loss": 3.2137084007263184, "lr": 5.3719101652376314e-05, "tps": 295674, "wall": 5946.0} {"step": 26826, "train_loss": 3.2646803855895996, "lr": 5.371176667124371e-05, "tps": 295464, "wall": 5950.4} {"step": 26827, "train_loss": 3.144294023513794, "lr": 5.370443357383327e-05, "tps": 295253, "wall": 5954.9} {"step": 26828, "train_loss": 3.1736135482788086, "lr": 5.369710236022798e-05, "tps": 295043, "wall": 5959.3} {"step": 26829, "train_loss": 3.3363585472106934, "lr": 5.368977303051088e-05, "tps": 294834, "wall": 5963.8} {"step": 26830, "train_loss": 3.159355401992798, "lr": 5.3682445584765075e-05, "tps": 294624, "wall": 5968.3} {"step": 26831, "train_loss": 3.2939846515655518, "lr": 5.367512002307351e-05, "tps": 294415, "wall": 5972.7} {"step": 26832, "train_loss": 3.254641532897949, "lr": 5.366779634551916e-05, "tps": 294207, "wall": 5977.2} {"step": 26833, "train_loss": 3.1669816970825195, "lr": 5.3660474552185035e-05, "tps": 293998, "wall": 5981.6} {"step": 26834, "train_loss": 3.1206164360046387, "lr": 5.3653154643154025e-05, "tps": 293790, "wall": 5986.1} {"step": 26835, "train_loss": 3.11688232421875, "lr": 5.3645836618509115e-05, "tps": 293582, "wall": 5990.6} {"step": 26836, "train_loss": 3.14237642288208, "lr": 5.363852047833315e-05, "tps": 293376, "wall": 5995.0} {"step": 26837, "train_loss": 3.205604076385498, "lr": 5.363120622270903e-05, "tps": 293166, "wall": 5999.5} {"step": 26838, "train_loss": 3.1397719383239746, "lr": 5.362389385171961e-05, "tps": 292959, "wall": 6004.0} {"step": 26839, "train_loss": 3.2282538414001465, "lr": 5.361658336544773e-05, "tps": 292753, "wall": 6008.4} {"step": 26840, "train_loss": 3.0499677658081055, "lr": 5.3609274763976146e-05, "tps": 292547, "wall": 6012.9} {"step": 26841, "train_loss": 3.1690797805786133, "lr": 5.360196804738775e-05, "tps": 292341, "wall": 6017.3} {"step": 26842, "train_loss": 3.2944796085357666, "lr": 5.359466321576524e-05, "tps": 292135, "wall": 6021.8} {"step": 26843, "train_loss": 3.2977490425109863, "lr": 5.3587360269191386e-05, "tps": 291930, "wall": 6026.3} {"step": 26844, "train_loss": 3.1106040477752686, "lr": 5.3580059207748925e-05, "tps": 291726, "wall": 6030.7} {"step": 26845, "train_loss": 3.1602301597595215, "lr": 5.357276003152056e-05, "tps": 291521, "wall": 6035.2} {"step": 26846, "train_loss": 3.180265426635742, "lr": 5.356546274058897e-05, "tps": 291316, "wall": 6039.6} {"step": 26847, "train_loss": 3.270908832550049, "lr": 5.355816733503682e-05, "tps": 291112, "wall": 6044.1} {"step": 26848, "train_loss": 3.1283559799194336, "lr": 5.3550873814946765e-05, "tps": 290908, "wall": 6048.5} {"step": 26849, "train_loss": 3.2400968074798584, "lr": 5.3543582180401386e-05, "tps": 290705, "wall": 6053.0} {"step": 26850, "train_loss": 3.126199722290039, "lr": 5.353629243148335e-05, "tps": 290501, "wall": 6057.5} {"step": 26851, "train_loss": 3.256619453430176, "lr": 5.352900456827516e-05, "tps": 290298, "wall": 6061.9} {"step": 26852, "train_loss": 3.256808280944824, "lr": 5.352171859085945e-05, "tps": 290095, "wall": 6066.4} {"step": 26853, "train_loss": 3.0650155544281006, "lr": 5.351443449931871e-05, "tps": 289893, "wall": 6070.9} {"step": 26854, "train_loss": 3.2979068756103516, "lr": 5.350715229373543e-05, "tps": 289691, "wall": 6075.3} {"step": 26855, "train_loss": 3.205409526824951, "lr": 5.349987197419218e-05, "tps": 289489, "wall": 6079.8} {"step": 26856, "train_loss": 3.143916606903076, "lr": 5.349259354077137e-05, "tps": 289287, "wall": 6084.3} {"step": 26857, "train_loss": 3.1394121646881104, "lr": 5.348531699355544e-05, "tps": 289086, "wall": 6088.7} {"step": 26858, "train_loss": 3.140503406524658, "lr": 5.34780423326269e-05, "tps": 288885, "wall": 6093.2} {"step": 26859, "train_loss": 3.180379867553711, "lr": 5.347076955806809e-05, "tps": 288686, "wall": 6097.6} {"step": 26860, "train_loss": 3.238434314727783, "lr": 5.3463498669961376e-05, "tps": 288485, "wall": 6102.1} {"step": 26861, "train_loss": 3.2121658325195312, "lr": 5.345622966838919e-05, "tps": 288286, "wall": 6106.5} {"step": 26862, "train_loss": 3.1667098999023438, "lr": 5.344896255343386e-05, "tps": 288086, "wall": 6111.0} {"step": 26863, "train_loss": 3.2089662551879883, "lr": 5.3441697325177655e-05, "tps": 287888, "wall": 6115.4} {"step": 26864, "train_loss": 3.133507013320923, "lr": 5.3434433983702935e-05, "tps": 287686, "wall": 6119.9} {"step": 26865, "train_loss": 3.1713197231292725, "lr": 5.3427172529091954e-05, "tps": 287487, "wall": 6124.4} {"step": 26866, "train_loss": 3.203085422515869, "lr": 5.341991296142697e-05, "tps": 287288, "wall": 6128.9} {"step": 26867, "train_loss": 3.1865992546081543, "lr": 5.3412655280790224e-05, "tps": 287090, "wall": 6133.3} {"step": 26868, "train_loss": 3.232330799102783, "lr": 5.340539948726391e-05, "tps": 286892, "wall": 6137.8} {"step": 26869, "train_loss": 3.233537435531616, "lr": 5.339814558093028e-05, "tps": 286694, "wall": 6142.3} {"step": 26870, "train_loss": 3.10884428024292, "lr": 5.339089356187147e-05, "tps": 286498, "wall": 6146.7} {"step": 26871, "train_loss": 3.137054681777954, "lr": 5.338364343016959e-05, "tps": 286300, "wall": 6151.2} {"step": 26872, "train_loss": 3.1383304595947266, "lr": 5.3376395185906845e-05, "tps": 286103, "wall": 6155.6} {"step": 26873, "train_loss": 3.190211057662964, "lr": 5.3369148829165304e-05, "tps": 285907, "wall": 6160.1} {"step": 26874, "train_loss": 3.2219252586364746, "lr": 5.336190436002705e-05, "tps": 285712, "wall": 6164.5} {"step": 26875, "train_loss": 3.2165818214416504, "lr": 5.335466177857418e-05, "tps": 285516, "wall": 6169.0} {"step": 26876, "train_loss": 3.149409532546997, "lr": 5.3347421084888715e-05, "tps": 285321, "wall": 6173.4} {"step": 26877, "train_loss": 3.1692233085632324, "lr": 5.3340182279052645e-05, "tps": 285123, "wall": 6177.9} {"step": 26878, "train_loss": 3.2047488689422607, "lr": 5.333294536114804e-05, "tps": 284929, "wall": 6182.4} {"step": 26879, "train_loss": 3.1580049991607666, "lr": 5.332571033125684e-05, "tps": 284734, "wall": 6186.9} {"step": 26880, "train_loss": 3.216737747192383, "lr": 5.3318477189460994e-05, "tps": 284539, "wall": 6191.3} {"step": 26881, "train_loss": 3.2280125617980957, "lr": 5.331124593584247e-05, "tps": 284346, "wall": 6195.8} {"step": 26882, "train_loss": 3.1497087478637695, "lr": 5.330401657048318e-05, "tps": 284152, "wall": 6200.2} {"step": 26883, "train_loss": 3.1929540634155273, "lr": 5.3296789093464974e-05, "tps": 283958, "wall": 6204.7} {"step": 26884, "train_loss": 3.1353931427001953, "lr": 5.32895635048698e-05, "tps": 283765, "wall": 6209.1} {"step": 26885, "train_loss": 3.2057502269744873, "lr": 5.328233980477946e-05, "tps": 283571, "wall": 6213.6} {"step": 26886, "train_loss": 3.2375736236572266, "lr": 5.327511799327577e-05, "tps": 283379, "wall": 6218.0} {"step": 26887, "train_loss": 3.3028149604797363, "lr": 5.326789807044058e-05, "tps": 283187, "wall": 6222.5} {"step": 26888, "train_loss": 3.155057430267334, "lr": 5.3260680036355645e-05, "tps": 282995, "wall": 6226.9} {"step": 26889, "train_loss": 3.297438383102417, "lr": 5.325346389110277e-05, "tps": 282803, "wall": 6231.4} {"step": 26890, "train_loss": 3.1887340545654297, "lr": 5.324624963476368e-05, "tps": 282612, "wall": 6235.9} {"step": 26891, "train_loss": 3.1758193969726562, "lr": 5.32390372674201e-05, "tps": 282419, "wall": 6240.3} {"step": 26892, "train_loss": 3.185182809829712, "lr": 5.3231826789153714e-05, "tps": 282228, "wall": 6244.8} {"step": 26893, "train_loss": 3.139880657196045, "lr": 5.3224618200046185e-05, "tps": 282037, "wall": 6249.3} {"step": 26894, "train_loss": 3.173880100250244, "lr": 5.321741150017925e-05, "tps": 281846, "wall": 6253.7} {"step": 26895, "train_loss": 3.2037453651428223, "lr": 5.321020668963448e-05, "tps": 281656, "wall": 6258.2} {"step": 26896, "train_loss": 3.257730484008789, "lr": 5.320300376849351e-05, "tps": 281466, "wall": 6262.6} {"step": 26897, "train_loss": 3.1812894344329834, "lr": 5.319580273683794e-05, "tps": 281276, "wall": 6267.1} {"step": 26898, "train_loss": 3.1503849029541016, "lr": 5.318860359474935e-05, "tps": 281087, "wall": 6271.5} {"step": 26899, "train_loss": 3.1610727310180664, "lr": 5.3181406342309245e-05, "tps": 280898, "wall": 6276.0} {"step": 26900, "train_loss": 3.2036960124969482, "lr": 5.3174210979599225e-05, "tps": 280709, "wall": 6280.5} {"step": 26901, "train_loss": 3.23588228225708, "lr": 5.316701750670079e-05, "tps": 280521, "wall": 6284.9} {"step": 26902, "train_loss": 3.1771931648254395, "lr": 5.315982592369536e-05, "tps": 280332, "wall": 6289.4} {"step": 26903, "train_loss": 3.229128837585449, "lr": 5.315263623066449e-05, "tps": 280144, "wall": 6293.8} {"step": 26904, "train_loss": 3.134308099746704, "lr": 5.3145448427689574e-05, "tps": 279953, "wall": 6298.4} {"step": 26905, "train_loss": 3.1548759937286377, "lr": 5.3138262514852e-05, "tps": 279767, "wall": 6302.8} {"step": 26906, "train_loss": 3.118410587310791, "lr": 5.3131078492233265e-05, "tps": 279579, "wall": 6307.3} {"step": 26907, "train_loss": 3.094709873199463, "lr": 5.3123896359914705e-05, "tps": 279392, "wall": 6311.7} {"step": 26908, "train_loss": 3.2889225482940674, "lr": 5.311671611797762e-05, "tps": 279205, "wall": 6316.2} {"step": 26909, "train_loss": 3.2090494632720947, "lr": 5.310953776650345e-05, "tps": 279019, "wall": 6320.6} {"step": 26910, "train_loss": 3.1700780391693115, "lr": 5.3102361305573426e-05, "tps": 278833, "wall": 6325.1} {"step": 26911, "train_loss": 3.2902822494506836, "lr": 5.309518673526891e-05, "tps": 278648, "wall": 6329.5} {"step": 26912, "train_loss": 3.2222111225128174, "lr": 5.308801405567116e-05, "tps": 278462, "wall": 6334.0} {"step": 26913, "train_loss": 3.110093832015991, "lr": 5.308084326686138e-05, "tps": 278277, "wall": 6338.4} {"step": 26914, "train_loss": 3.236021041870117, "lr": 5.307367436892088e-05, "tps": 278091, "wall": 6342.9} {"step": 26915, "train_loss": 3.1581172943115234, "lr": 5.306650736193082e-05, "tps": 277906, "wall": 6347.3} {"step": 26916, "train_loss": 3.1956191062927246, "lr": 5.305934224597237e-05, "tps": 277722, "wall": 6351.8} {"step": 26917, "train_loss": 3.159386157989502, "lr": 5.3052179021126746e-05, "tps": 277538, "wall": 6356.2} {"step": 26918, "train_loss": 3.2761878967285156, "lr": 5.3045017687475065e-05, "tps": 277351, "wall": 6360.7} {"step": 26919, "train_loss": 3.102510452270508, "lr": 5.303785824509842e-05, "tps": 277166, "wall": 6365.2} {"step": 26920, "train_loss": 3.1381211280822754, "lr": 5.3030700694077994e-05, "tps": 276983, "wall": 6369.7} {"step": 26921, "train_loss": 3.1740927696228027, "lr": 5.30235450344948e-05, "tps": 276800, "wall": 6374.1} {"step": 26922, "train_loss": 3.16512393951416, "lr": 5.301639126642992e-05, "tps": 276617, "wall": 6378.6} {"step": 26923, "train_loss": 3.1292717456817627, "lr": 5.30092393899644e-05, "tps": 276434, "wall": 6383.0} {"step": 26924, "train_loss": 3.1225061416625977, "lr": 5.3002089405179276e-05, "tps": 276251, "wall": 6387.5} {"step": 26925, "train_loss": 3.182985305786133, "lr": 5.2994941312155475e-05, "tps": 276069, "wall": 6392.0} {"step": 26926, "train_loss": 3.163076400756836, "lr": 5.2987795110974056e-05, "tps": 275887, "wall": 6396.4} {"step": 26927, "train_loss": 3.109806537628174, "lr": 5.29806508017159e-05, "tps": 275705, "wall": 6400.9} {"step": 26928, "train_loss": 3.2232184410095215, "lr": 5.2973508384461965e-05, "tps": 275524, "wall": 6405.3} {"step": 26929, "train_loss": 3.1522650718688965, "lr": 5.2966367859293185e-05, "tps": 275343, "wall": 6409.8} {"step": 26930, "train_loss": 3.2397725582122803, "lr": 5.295922922629037e-05, "tps": 275162, "wall": 6414.2} {"step": 26931, "train_loss": 3.174919605255127, "lr": 5.295209248553452e-05, "tps": 274978, "wall": 6418.7} {"step": 26932, "train_loss": 3.2420413494110107, "lr": 5.294495763710636e-05, "tps": 274799, "wall": 6423.2} {"step": 26933, "train_loss": 3.1758980751037598, "lr": 5.2937824681086764e-05, "tps": 274618, "wall": 6427.6} {"step": 26934, "train_loss": 3.2163748741149902, "lr": 5.2930693617556535e-05, "tps": 274438, "wall": 6432.1} {"step": 26935, "train_loss": 3.1888277530670166, "lr": 5.292356444659645e-05, "tps": 274258, "wall": 6436.6} {"step": 26936, "train_loss": 3.1758768558502197, "lr": 5.2916437168287234e-05, "tps": 274078, "wall": 6441.0} {"step": 26937, "train_loss": 3.1609768867492676, "lr": 5.2909311782709714e-05, "tps": 273899, "wall": 6445.5} {"step": 26938, "train_loss": 3.1551856994628906, "lr": 5.290218828994451e-05, "tps": 273720, "wall": 6449.9} {"step": 26939, "train_loss": 3.082451820373535, "lr": 5.2895066690072356e-05, "tps": 273541, "wall": 6454.4} {"step": 26940, "train_loss": 3.143503427505493, "lr": 5.288794698317394e-05, "tps": 273362, "wall": 6458.8} {"step": 26941, "train_loss": 2.9909420013427734, "lr": 5.2880829169329905e-05, "tps": 273184, "wall": 6463.3} {"step": 26942, "train_loss": 3.174546718597412, "lr": 5.287371324862085e-05, "tps": 273006, "wall": 6467.7} {"step": 26943, "train_loss": 3.179236888885498, "lr": 5.286659922112744e-05, "tps": 272828, "wall": 6472.2} {"step": 26944, "train_loss": 3.0642333030700684, "lr": 5.285948708693025e-05, "tps": 272651, "wall": 6476.7} {"step": 26945, "train_loss": 3.1980791091918945, "lr": 5.2852376846109786e-05, "tps": 272471, "wall": 6481.2} {"step": 26946, "train_loss": 3.1872451305389404, "lr": 5.284526849874666e-05, "tps": 272294, "wall": 6485.6} {"step": 26947, "train_loss": 3.21543025970459, "lr": 5.283816204492136e-05, "tps": 272117, "wall": 6490.1} {"step": 26948, "train_loss": 3.1941123008728027, "lr": 5.283105748471444e-05, "tps": 271941, "wall": 6494.5} {"step": 26949, "train_loss": 3.0023584365844727, "lr": 5.2823954818206344e-05, "tps": 271765, "wall": 6499.0} {"step": 26950, "train_loss": 3.1143274307250977, "lr": 5.281685404547749e-05, "tps": 271589, "wall": 6503.4} {"step": 26951, "train_loss": 3.184014320373535, "lr": 5.28097551666084e-05, "tps": 271413, "wall": 6507.9} {"step": 26952, "train_loss": 3.126255989074707, "lr": 5.280265818167944e-05, "tps": 271238, "wall": 6512.3} {"step": 26953, "train_loss": 3.1562888622283936, "lr": 5.279556309077096e-05, "tps": 271063, "wall": 6516.8} {"step": 26954, "train_loss": 2.9788198471069336, "lr": 5.2788469893963444e-05, "tps": 270888, "wall": 6521.2} {"step": 26955, "train_loss": 3.2397782802581787, "lr": 5.27813785913372e-05, "tps": 270713, "wall": 6525.7} {"step": 26956, "train_loss": 3.0832910537719727, "lr": 5.2774289182972504e-05, "tps": 270538, "wall": 6530.1} {"step": 26957, "train_loss": 3.1398799419403076, "lr": 5.2767201668949726e-05, "tps": 270364, "wall": 6534.6} {"step": 26958, "train_loss": 3.2679123878479004, "lr": 5.276011604934914e-05, "tps": 270187, "wall": 6539.1} {"step": 26959, "train_loss": 3.256033182144165, "lr": 5.275303232425097e-05, "tps": 270014, "wall": 6543.5} {"step": 26960, "train_loss": 3.2401862144470215, "lr": 5.274595049373554e-05, "tps": 269840, "wall": 6548.0} {"step": 26961, "train_loss": 3.1466522216796875, "lr": 5.2738870557883027e-05, "tps": 269666, "wall": 6552.5} {"step": 26962, "train_loss": 3.27010440826416, "lr": 5.273179251677363e-05, "tps": 269493, "wall": 6556.9} {"step": 26963, "train_loss": 3.1167235374450684, "lr": 5.2724716370487526e-05, "tps": 269321, "wall": 6561.4} {"step": 26964, "train_loss": 3.1096014976501465, "lr": 5.2717642119104874e-05, "tps": 269148, "wall": 6565.8} {"step": 26965, "train_loss": 3.1973681449890137, "lr": 5.2710569762705855e-05, "tps": 268976, "wall": 6570.3} {"step": 26966, "train_loss": 3.2238872051239014, "lr": 5.270349930137054e-05, "tps": 268804, "wall": 6574.7} {"step": 26967, "train_loss": 3.1750621795654297, "lr": 5.2696430735179016e-05, "tps": 268632, "wall": 6579.2} {"step": 26968, "train_loss": 3.2701668739318848, "lr": 5.26893640642114e-05, "tps": 268460, "wall": 6583.6} {"step": 26969, "train_loss": 3.2121224403381348, "lr": 5.268229928854772e-05, "tps": 268288, "wall": 6588.1} {"step": 26970, "train_loss": 3.114259719848633, "lr": 5.267523640826797e-05, "tps": 268117, "wall": 6592.5} {"step": 26971, "train_loss": 3.1107401847839355, "lr": 5.266817542345225e-05, "tps": 267946, "wall": 6597.0} {"step": 26972, "train_loss": 3.1821677684783936, "lr": 5.266111633418047e-05, "tps": 267774, "wall": 6601.5} {"step": 26973, "train_loss": 3.088578701019287, "lr": 5.265405914053259e-05, "tps": 267603, "wall": 6605.9} {"step": 26974, "train_loss": 3.2563772201538086, "lr": 5.264700384258859e-05, "tps": 267433, "wall": 6610.4} {"step": 26975, "train_loss": 3.267869710922241, "lr": 5.263995044042841e-05, "tps": 267263, "wall": 6614.8} {"step": 26976, "train_loss": 3.137773036956787, "lr": 5.2632898934131905e-05, "tps": 267093, "wall": 6619.3} {"step": 26977, "train_loss": 3.1521363258361816, "lr": 5.262584932377899e-05, "tps": 266923, "wall": 6623.7} {"step": 26978, "train_loss": 3.2775228023529053, "lr": 5.26188016094495e-05, "tps": 266754, "wall": 6628.2} {"step": 26979, "train_loss": 3.2357349395751953, "lr": 5.261175579122326e-05, "tps": 266585, "wall": 6632.6} {"step": 26980, "train_loss": 3.1377625465393066, "lr": 5.2604711869180126e-05, "tps": 266416, "wall": 6637.1} {"step": 26981, "train_loss": 3.146993398666382, "lr": 5.259766984339989e-05, "tps": 266248, "wall": 6641.5} {"step": 26982, "train_loss": 3.1330368518829346, "lr": 5.259062971396227e-05, "tps": 266080, "wall": 6646.0} {"step": 26983, "train_loss": 3.0864667892456055, "lr": 5.2583591480947094e-05, "tps": 265912, "wall": 6650.4} {"step": 26984, "train_loss": 3.0822319984436035, "lr": 5.257655514443398e-05, "tps": 265744, "wall": 6654.8} {"step": 26985, "train_loss": 3.1589651107788086, "lr": 5.2569520704502774e-05, "tps": 265574, "wall": 6659.4} {"step": 26986, "train_loss": 3.155921697616577, "lr": 5.256248816123308e-05, "tps": 265406, "wall": 6663.8} {"step": 26987, "train_loss": 3.078779458999634, "lr": 5.255545751470456e-05, "tps": 265238, "wall": 6668.3} {"step": 26988, "train_loss": 3.095717430114746, "lr": 5.25484287649969e-05, "tps": 265070, "wall": 6672.8} {"step": 26989, "train_loss": 3.1984853744506836, "lr": 5.2541401912189704e-05, "tps": 264901, "wall": 6677.3} {"step": 26990, "train_loss": 3.2208662033081055, "lr": 5.253437695636253e-05, "tps": 264735, "wall": 6681.7} {"step": 26991, "train_loss": 3.2015950679779053, "lr": 5.252735389759502e-05, "tps": 264569, "wall": 6686.1} {"step": 26992, "train_loss": 3.0599749088287354, "lr": 5.2520332735966714e-05, "tps": 264400, "wall": 6690.6} {"step": 26993, "train_loss": 3.2133636474609375, "lr": 5.25133134715571e-05, "tps": 264235, "wall": 6695.1} {"step": 26994, "train_loss": 3.0807113647460938, "lr": 5.250629610444576e-05, "tps": 264069, "wall": 6699.5} {"step": 26995, "train_loss": 3.2245237827301025, "lr": 5.2499280634712165e-05, "tps": 263903, "wall": 6704.0} {"step": 26996, "train_loss": 3.09281063079834, "lr": 5.249226706243575e-05, "tps": 263738, "wall": 6708.4} {"step": 26997, "train_loss": 3.123613119125366, "lr": 5.2485255387696034e-05, "tps": 263573, "wall": 6712.9} {"step": 26998, "train_loss": 3.1984238624572754, "lr": 5.2478245610572395e-05, "tps": 263408, "wall": 6717.4} {"step": 26999, "train_loss": 3.2025146484375, "lr": 5.247123773114422e-05, "tps": 263240, "wall": 6721.9} {"step": 27000, "train_loss": 3.0090103149414062, "lr": 5.246423174949097e-05, "tps": 263075, "wall": 6726.3, "val_loss_monitor": 3.3239706321528892} {"step": 27001, "train_loss": 3.1599440574645996, "lr": 5.245722766569193e-05, "tps": 261731, "wall": 6761.1} {"step": 27002, "train_loss": 3.1150503158569336, "lr": 5.2450225479826495e-05, "tps": 261566, "wall": 6765.7} {"step": 27003, "train_loss": 3.2325265407562256, "lr": 5.2443225191974e-05, "tps": 261403, "wall": 6770.1} {"step": 27004, "train_loss": 3.1587953567504883, "lr": 5.243622680221367e-05, "tps": 261241, "wall": 6774.6} {"step": 27005, "train_loss": 3.0722134113311768, "lr": 5.242923031062487e-05, "tps": 261076, "wall": 6779.1} {"step": 27006, "train_loss": 3.0652413368225098, "lr": 5.2422235717286795e-05, "tps": 260915, "wall": 6783.5} {"step": 27007, "train_loss": 3.168095111846924, "lr": 5.241524302227866e-05, "tps": 260754, "wall": 6788.0} {"step": 27008, "train_loss": 3.1741445064544678, "lr": 5.240825222567978e-05, "tps": 260592, "wall": 6792.4} {"step": 27009, "train_loss": 3.2115402221679688, "lr": 5.240126332756926e-05, "tps": 260431, "wall": 6796.9} {"step": 27010, "train_loss": 3.126832962036133, "lr": 5.2394276328026284e-05, "tps": 260271, "wall": 6801.3} {"step": 27011, "train_loss": 3.1703202724456787, "lr": 5.238729122713003e-05, "tps": 260111, "wall": 6805.8} {"step": 27012, "train_loss": 3.232710838317871, "lr": 5.2380308024959614e-05, "tps": 259950, "wall": 6810.2} {"step": 27013, "train_loss": 3.291185140609741, "lr": 5.237332672159411e-05, "tps": 259789, "wall": 6814.7} {"step": 27014, "train_loss": 3.1928038597106934, "lr": 5.236634731711265e-05, "tps": 259629, "wall": 6819.2} {"step": 27015, "train_loss": 3.2196803092956543, "lr": 5.235936981159428e-05, "tps": 259469, "wall": 6823.6} {"step": 27016, "train_loss": 3.1672489643096924, "lr": 5.2352394205118014e-05, "tps": 259309, "wall": 6828.1} {"step": 27017, "train_loss": 3.1851677894592285, "lr": 5.234542049776293e-05, "tps": 259150, "wall": 6832.5} {"step": 27018, "train_loss": 3.250912666320801, "lr": 5.233844868960794e-05, "tps": 258990, "wall": 6837.0} {"step": 27019, "train_loss": 3.0533571243286133, "lr": 5.233147878073213e-05, "tps": 258829, "wall": 6841.5} {"step": 27020, "train_loss": 3.2009966373443604, "lr": 5.232451077121439e-05, "tps": 258670, "wall": 6846.0} {"step": 27021, "train_loss": 3.247413158416748, "lr": 5.231754466113361e-05, "tps": 258511, "wall": 6850.4} {"step": 27022, "train_loss": 3.107004165649414, "lr": 5.231058045056883e-05, "tps": 258352, "wall": 6854.9} {"step": 27023, "train_loss": 3.1805412769317627, "lr": 5.230361813959883e-05, "tps": 258194, "wall": 6859.4} {"step": 27024, "train_loss": 3.224189043045044, "lr": 5.22966577283025e-05, "tps": 258036, "wall": 6863.8} {"step": 27025, "train_loss": 3.0748982429504395, "lr": 5.2289699216758725e-05, "tps": 257878, "wall": 6868.3} {"step": 27026, "train_loss": 3.0234475135803223, "lr": 5.228274260504633e-05, "tps": 257720, "wall": 6872.7} {"step": 27027, "train_loss": 3.089893102645874, "lr": 5.227578789324405e-05, "tps": 257563, "wall": 6877.2} {"step": 27028, "train_loss": 3.170858383178711, "lr": 5.2268835081430765e-05, "tps": 257406, "wall": 6881.6} {"step": 27029, "train_loss": 3.2964019775390625, "lr": 5.226188416968518e-05, "tps": 257249, "wall": 6886.1} {"step": 27030, "train_loss": 3.2276318073272705, "lr": 5.225493515808602e-05, "tps": 257092, "wall": 6890.5} {"step": 27031, "train_loss": 3.1932928562164307, "lr": 5.224798804671205e-05, "tps": 256936, "wall": 6895.0} {"step": 27032, "train_loss": 3.1401453018188477, "lr": 5.224104283564195e-05, "tps": 256777, "wall": 6899.5} {"step": 27033, "train_loss": 3.1660349369049072, "lr": 5.2234099524954374e-05, "tps": 256622, "wall": 6903.9} {"step": 27034, "train_loss": 3.1332573890686035, "lr": 5.2227158114728e-05, "tps": 256466, "wall": 6908.4} {"step": 27035, "train_loss": 3.231491804122925, "lr": 5.222021860504147e-05, "tps": 256310, "wall": 6912.8} {"step": 27036, "train_loss": 3.101626396179199, "lr": 5.2213280995973366e-05, "tps": 256154, "wall": 6917.3} {"step": 27037, "train_loss": 3.173727512359619, "lr": 5.22063452876023e-05, "tps": 256000, "wall": 6921.7} {"step": 27038, "train_loss": 3.1770997047424316, "lr": 5.219941148000681e-05, "tps": 255845, "wall": 6926.2} {"step": 27039, "train_loss": 3.154923915863037, "lr": 5.2192479573265496e-05, "tps": 255690, "wall": 6930.6} {"step": 27040, "train_loss": 3.09875226020813, "lr": 5.218554956745684e-05, "tps": 255534, "wall": 6935.1} {"step": 27041, "train_loss": 3.163794994354248, "lr": 5.2178621462659336e-05, "tps": 255381, "wall": 6939.5} {"step": 27042, "train_loss": 3.253765106201172, "lr": 5.217169525895154e-05, "tps": 255226, "wall": 6944.0} {"step": 27043, "train_loss": 3.1844472885131836, "lr": 5.2164770956411827e-05, "tps": 255072, "wall": 6948.4} {"step": 27044, "train_loss": 3.1455459594726562, "lr": 5.2157848555118636e-05, "tps": 254918, "wall": 6952.9} {"step": 27045, "train_loss": 3.1740682125091553, "lr": 5.215092805515047e-05, "tps": 254764, "wall": 6957.4} {"step": 27046, "train_loss": 3.124650478363037, "lr": 5.214400945658566e-05, "tps": 254609, "wall": 6961.9} {"step": 27047, "train_loss": 3.2144765853881836, "lr": 5.213709275950256e-05, "tps": 254454, "wall": 6966.3} {"step": 27048, "train_loss": 3.141380786895752, "lr": 5.213017796397959e-05, "tps": 254302, "wall": 6970.8} {"step": 27049, "train_loss": 3.2309062480926514, "lr": 5.212326507009504e-05, "tps": 254149, "wall": 6975.2} {"step": 27050, "train_loss": 3.2221739292144775, "lr": 5.2116354077927196e-05, "tps": 253996, "wall": 6979.7} {"step": 27051, "train_loss": 3.212277889251709, "lr": 5.21094449875544e-05, "tps": 253844, "wall": 6984.1} {"step": 27052, "train_loss": 3.1722378730773926, "lr": 5.210253779905492e-05, "tps": 253692, "wall": 6988.6} {"step": 27053, "train_loss": 3.213468551635742, "lr": 5.209563251250692e-05, "tps": 253539, "wall": 6993.0} {"step": 27054, "train_loss": 3.166386842727661, "lr": 5.20887291279887e-05, "tps": 253387, "wall": 6997.5} {"step": 27055, "train_loss": 3.221473217010498, "lr": 5.208182764557844e-05, "tps": 253236, "wall": 7001.9} {"step": 27056, "train_loss": 3.2637219429016113, "lr": 5.207492806535433e-05, "tps": 253084, "wall": 7006.4} {"step": 27057, "train_loss": 3.143307685852051, "lr": 5.206803038739453e-05, "tps": 252932, "wall": 7010.8} {"step": 27058, "train_loss": 3.1673166751861572, "lr": 5.206113461177713e-05, "tps": 252781, "wall": 7015.3} {"step": 27059, "train_loss": 3.239882230758667, "lr": 5.205424073858031e-05, "tps": 252628, "wall": 7019.8} {"step": 27060, "train_loss": 3.129502773284912, "lr": 5.204734876788217e-05, "tps": 252477, "wall": 7024.3} {"step": 27061, "train_loss": 3.082510471343994, "lr": 5.204045869976067e-05, "tps": 252326, "wall": 7028.7} {"step": 27062, "train_loss": 3.1680166721343994, "lr": 5.2033570534294005e-05, "tps": 252175, "wall": 7033.2} {"step": 27063, "train_loss": 3.118093252182007, "lr": 5.202668427156011e-05, "tps": 252026, "wall": 7037.6} {"step": 27064, "train_loss": 3.215545654296875, "lr": 5.2019799911637035e-05, "tps": 251876, "wall": 7042.1} {"step": 27065, "train_loss": 3.188350200653076, "lr": 5.201291745460275e-05, "tps": 251726, "wall": 7046.5} {"step": 27066, "train_loss": 3.096388578414917, "lr": 5.20060369005352e-05, "tps": 251576, "wall": 7051.0} {"step": 27067, "train_loss": 3.185457944869995, "lr": 5.199915824951239e-05, "tps": 251427, "wall": 7055.4} {"step": 27068, "train_loss": 3.195124864578247, "lr": 5.1992281501612195e-05, "tps": 251277, "wall": 7059.9} {"step": 27069, "train_loss": 3.2028915882110596, "lr": 5.198540665691248e-05, "tps": 251128, "wall": 7064.4} {"step": 27070, "train_loss": 3.1326205730438232, "lr": 5.197853371549122e-05, "tps": 250979, "wall": 7068.8} {"step": 27071, "train_loss": 3.2017316818237305, "lr": 5.1971662677426226e-05, "tps": 250830, "wall": 7073.3} {"step": 27072, "train_loss": 3.191807985305786, "lr": 5.1964793542795276e-05, "tps": 250681, "wall": 7077.7} {"step": 27073, "train_loss": 3.2101521492004395, "lr": 5.195792631167629e-05, "tps": 250532, "wall": 7082.2} {"step": 27074, "train_loss": 3.1878037452697754, "lr": 5.195106098414697e-05, "tps": 250384, "wall": 7086.7} {"step": 27075, "train_loss": 3.251969337463379, "lr": 5.1944197560285123e-05, "tps": 250236, "wall": 7091.1} {"step": 27076, "train_loss": 3.2494375705718994, "lr": 5.193733604016852e-05, "tps": 250088, "wall": 7095.5} {"step": 27077, "train_loss": 3.243213653564453, "lr": 5.193047642387485e-05, "tps": 249941, "wall": 7100.0} {"step": 27078, "train_loss": 3.198202610015869, "lr": 5.1923618711481826e-05, "tps": 249794, "wall": 7104.4} {"step": 27079, "train_loss": 3.1468019485473633, "lr": 5.191676290306717e-05, "tps": 249646, "wall": 7108.9} {"step": 27080, "train_loss": 3.2018561363220215, "lr": 5.1909908998708465e-05, "tps": 249499, "wall": 7113.4} {"step": 27081, "train_loss": 3.1601569652557373, "lr": 5.1903056998483455e-05, "tps": 249352, "wall": 7117.8} {"step": 27082, "train_loss": 3.1660869121551514, "lr": 5.189620690246971e-05, "tps": 249206, "wall": 7122.3} {"step": 27083, "train_loss": 3.173187732696533, "lr": 5.188935871074481e-05, "tps": 249059, "wall": 7126.7} {"step": 27084, "train_loss": 3.2453484535217285, "lr": 5.188251242338635e-05, "tps": 248912, "wall": 7131.2} {"step": 27085, "train_loss": 3.1975884437561035, "lr": 5.1875668040471906e-05, "tps": 248766, "wall": 7135.6} {"step": 27086, "train_loss": 3.1760025024414062, "lr": 5.1868825562078937e-05, "tps": 248618, "wall": 7140.2} {"step": 27087, "train_loss": 3.2959072589874268, "lr": 5.1861984988285065e-05, "tps": 248472, "wall": 7144.6} {"step": 27088, "train_loss": 3.1702003479003906, "lr": 5.185514631916769e-05, "tps": 248326, "wall": 7149.1} {"step": 27089, "train_loss": 3.126020908355713, "lr": 5.184830955480432e-05, "tps": 248180, "wall": 7153.5} {"step": 27090, "train_loss": 3.2271149158477783, "lr": 5.184147469527241e-05, "tps": 248035, "wall": 7158.0} {"step": 27091, "train_loss": 3.3019561767578125, "lr": 5.183464174064937e-05, "tps": 247890, "wall": 7162.4} {"step": 27092, "train_loss": 3.159515380859375, "lr": 5.182781069101257e-05, "tps": 247745, "wall": 7166.9} {"step": 27093, "train_loss": 3.196503162384033, "lr": 5.182098154643947e-05, "tps": 247601, "wall": 7171.3} {"step": 27094, "train_loss": 3.160501003265381, "lr": 5.181415430700739e-05, "tps": 247456, "wall": 7175.8} {"step": 27095, "train_loss": 3.1613388061523438, "lr": 5.180732897279362e-05, "tps": 247312, "wall": 7180.3} {"step": 27096, "train_loss": 3.1010243892669678, "lr": 5.180050554387558e-05, "tps": 247168, "wall": 7184.7} {"step": 27097, "train_loss": 3.1625239849090576, "lr": 5.179368402033048e-05, "tps": 247024, "wall": 7189.1} {"step": 27098, "train_loss": 3.2148220539093018, "lr": 5.1786864402235644e-05, "tps": 246880, "wall": 7193.6} {"step": 27099, "train_loss": 3.223832607269287, "lr": 5.1780046689668315e-05, "tps": 246734, "wall": 7198.1} {"step": 27100, "train_loss": 3.2728586196899414, "lr": 5.1773230882705695e-05, "tps": 246591, "wall": 7202.6} {"step": 27101, "train_loss": 3.1567392349243164, "lr": 5.1766416981425034e-05, "tps": 246448, "wall": 7207.0} {"step": 27102, "train_loss": 3.179410457611084, "lr": 5.17596049859035e-05, "tps": 246305, "wall": 7211.5} {"step": 27103, "train_loss": 3.116180181503296, "lr": 5.175279489621825e-05, "tps": 246162, "wall": 7215.9} {"step": 27104, "train_loss": 3.305122137069702, "lr": 5.1745986712446456e-05, "tps": 246020, "wall": 7220.4} {"step": 27105, "train_loss": 3.135634422302246, "lr": 5.1739180434665236e-05, "tps": 245877, "wall": 7224.8} {"step": 27106, "train_loss": 3.1572442054748535, "lr": 5.173237606295165e-05, "tps": 245735, "wall": 7229.3} {"step": 27107, "train_loss": 3.1473569869995117, "lr": 5.1725573597382825e-05, "tps": 245593, "wall": 7233.7} {"step": 27108, "train_loss": 3.2300002574920654, "lr": 5.171877303803584e-05, "tps": 245451, "wall": 7238.2} {"step": 27109, "train_loss": 3.1265709400177, "lr": 5.171197438498764e-05, "tps": 245309, "wall": 7242.6} {"step": 27110, "train_loss": 3.2379798889160156, "lr": 5.1705177638315326e-05, "tps": 245167, "wall": 7247.1} {"step": 27111, "train_loss": 3.1178321838378906, "lr": 5.169838279809588e-05, "tps": 245026, "wall": 7251.5} {"step": 27112, "train_loss": 3.1715548038482666, "lr": 5.169158986440623e-05, "tps": 244884, "wall": 7256.0} {"step": 27113, "train_loss": 3.178115129470825, "lr": 5.168479883732338e-05, "tps": 244741, "wall": 7260.5} {"step": 27114, "train_loss": 3.1618597507476807, "lr": 5.1678009716924235e-05, "tps": 244599, "wall": 7265.0} {"step": 27115, "train_loss": 3.130000114440918, "lr": 5.167122250328567e-05, "tps": 244458, "wall": 7269.4} {"step": 27116, "train_loss": 3.068580150604248, "lr": 5.166443719648464e-05, "tps": 244317, "wall": 7273.9} {"step": 27117, "train_loss": 3.113154888153076, "lr": 5.165765379659794e-05, "tps": 244176, "wall": 7278.4} {"step": 27118, "train_loss": 3.204075336456299, "lr": 5.165087230370246e-05, "tps": 244036, "wall": 7282.8} {"step": 27119, "train_loss": 3.18538236618042, "lr": 5.1644092717875006e-05, "tps": 243896, "wall": 7287.3} {"step": 27120, "train_loss": 3.252509117126465, "lr": 5.163731503919238e-05, "tps": 243756, "wall": 7291.7} {"step": 27121, "train_loss": 3.172473192214966, "lr": 5.1630539267731346e-05, "tps": 243617, "wall": 7296.2} {"step": 27122, "train_loss": 3.1285719871520996, "lr": 5.162376540356869e-05, "tps": 243477, "wall": 7300.6} {"step": 27123, "train_loss": 3.129178285598755, "lr": 5.1616993446781106e-05, "tps": 243338, "wall": 7305.0} {"step": 27124, "train_loss": 3.1125166416168213, "lr": 5.161022339744537e-05, "tps": 243198, "wall": 7309.5} {"step": 27125, "train_loss": 3.043950319290161, "lr": 5.160345525563811e-05, "tps": 243059, "wall": 7314.0} {"step": 27126, "train_loss": 3.1840262413024902, "lr": 5.1596689021435995e-05, "tps": 242918, "wall": 7318.5} {"step": 27127, "train_loss": 3.3005621433258057, "lr": 5.158992469491573e-05, "tps": 242780, "wall": 7322.9} {"step": 27128, "train_loss": 3.183448076248169, "lr": 5.1583162276153904e-05, "tps": 242641, "wall": 7327.4} {"step": 27129, "train_loss": 3.1897692680358887, "lr": 5.157640176522709e-05, "tps": 242503, "wall": 7331.8} {"step": 27130, "train_loss": 3.1257057189941406, "lr": 5.1569643162211945e-05, "tps": 242365, "wall": 7336.3} {"step": 27131, "train_loss": 3.2443647384643555, "lr": 5.156288646718501e-05, "tps": 242227, "wall": 7340.7} {"step": 27132, "train_loss": 3.23659610748291, "lr": 5.1556131680222755e-05, "tps": 242089, "wall": 7345.2} {"step": 27133, "train_loss": 3.1992363929748535, "lr": 5.154937880140182e-05, "tps": 241951, "wall": 7349.6} {"step": 27134, "train_loss": 3.152735710144043, "lr": 5.1542627830798576e-05, "tps": 241813, "wall": 7354.1} {"step": 27135, "train_loss": 3.2030816078186035, "lr": 5.153587876848956e-05, "tps": 241676, "wall": 7358.5} {"step": 27136, "train_loss": 2.9897329807281494, "lr": 5.1529131614551276e-05, "tps": 241539, "wall": 7363.0} {"step": 27137, "train_loss": 3.2353768348693848, "lr": 5.152238636906005e-05, "tps": 241402, "wall": 7367.4} {"step": 27138, "train_loss": 3.118683338165283, "lr": 5.1515643032092374e-05, "tps": 241265, "wall": 7371.9} {"step": 27139, "train_loss": 3.221649169921875, "lr": 5.150890160372461e-05, "tps": 241128, "wall": 7376.3} {"step": 27140, "train_loss": 3.1902408599853516, "lr": 5.150216208403309e-05, "tps": 240989, "wall": 7380.9} {"step": 27141, "train_loss": 3.162466287612915, "lr": 5.149542447309425e-05, "tps": 240853, "wall": 7385.3} {"step": 27142, "train_loss": 3.204530715942383, "lr": 5.148868877098433e-05, "tps": 240716, "wall": 7389.8} {"step": 27143, "train_loss": 3.181915521621704, "lr": 5.148195497777963e-05, "tps": 240580, "wall": 7394.2} {"step": 27144, "train_loss": 3.218527317047119, "lr": 5.147522309355651e-05, "tps": 240444, "wall": 7398.7} {"step": 27145, "train_loss": 3.2374231815338135, "lr": 5.146849311839116e-05, "tps": 240309, "wall": 7403.1} {"step": 27146, "train_loss": 3.1808717250823975, "lr": 5.146176505235981e-05, "tps": 240173, "wall": 7407.6} {"step": 27147, "train_loss": 3.115880012512207, "lr": 5.145503889553874e-05, "tps": 240038, "wall": 7412.0} {"step": 27148, "train_loss": 3.215337038040161, "lr": 5.144831464800409e-05, "tps": 239903, "wall": 7416.5} {"step": 27149, "train_loss": 3.1991798877716064, "lr": 5.1441592309832045e-05, "tps": 239767, "wall": 7420.9} {"step": 27150, "train_loss": 3.2626466751098633, "lr": 5.143487188109879e-05, "tps": 239632, "wall": 7425.4} {"step": 27151, "train_loss": 3.303562641143799, "lr": 5.142815336188038e-05, "tps": 239497, "wall": 7429.9} {"step": 27152, "train_loss": 3.1973397731781006, "lr": 5.1421436752253003e-05, "tps": 239363, "wall": 7434.3} {"step": 27153, "train_loss": 3.2235107421875, "lr": 5.141472205229272e-05, "tps": 239226, "wall": 7438.8} {"step": 27154, "train_loss": 3.199582576751709, "lr": 5.140800926207555e-05, "tps": 239092, "wall": 7443.3} {"step": 27155, "train_loss": 3.157245635986328, "lr": 5.14012983816776e-05, "tps": 238958, "wall": 7447.7} {"step": 27156, "train_loss": 3.1022579669952393, "lr": 5.139458941117485e-05, "tps": 238824, "wall": 7452.2} {"step": 27157, "train_loss": 3.0835933685302734, "lr": 5.1387882350643316e-05, "tps": 238690, "wall": 7456.6} {"step": 27158, "train_loss": 3.1272685527801514, "lr": 5.138117720015897e-05, "tps": 238556, "wall": 7461.1} {"step": 27159, "train_loss": 3.1801536083221436, "lr": 5.1374473959797787e-05, "tps": 238422, "wall": 7465.5} {"step": 27160, "train_loss": 3.1075093746185303, "lr": 5.136777262963565e-05, "tps": 238289, "wall": 7470.0} {"step": 27161, "train_loss": 3.230482816696167, "lr": 5.136107320974853e-05, "tps": 238156, "wall": 7474.4} {"step": 27162, "train_loss": 3.242776393890381, "lr": 5.135437570021231e-05, "tps": 238023, "wall": 7478.9} {"step": 27163, "train_loss": 3.2190418243408203, "lr": 5.134768010110281e-05, "tps": 237890, "wall": 7483.4} {"step": 27164, "train_loss": 3.1604115962982178, "lr": 5.134098641249594e-05, "tps": 237758, "wall": 7487.8} {"step": 27165, "train_loss": 3.2735724449157715, "lr": 5.133429463446752e-05, "tps": 237625, "wall": 7492.3} {"step": 27166, "train_loss": 3.191239833831787, "lr": 5.1327604767093275e-05, "tps": 237493, "wall": 7496.7} {"step": 27167, "train_loss": 3.0989537239074707, "lr": 5.13209168104491e-05, "tps": 237358, "wall": 7501.2} {"step": 27168, "train_loss": 3.2092373371124268, "lr": 5.1314230764610685e-05, "tps": 237226, "wall": 7505.7} {"step": 27169, "train_loss": 3.144662618637085, "lr": 5.130754662965378e-05, "tps": 237094, "wall": 7510.1} {"step": 27170, "train_loss": 3.2261228561401367, "lr": 5.1300864405654124e-05, "tps": 236962, "wall": 7514.6} {"step": 27171, "train_loss": 3.123966932296753, "lr": 5.1294184092687404e-05, "tps": 236831, "wall": 7519.0} {"step": 27172, "train_loss": 3.162227153778076, "lr": 5.12875056908293e-05, "tps": 236699, "wall": 7523.5} {"step": 27173, "train_loss": 3.126897096633911, "lr": 5.1280829200155456e-05, "tps": 236568, "wall": 7528.0} {"step": 27174, "train_loss": 3.1569855213165283, "lr": 5.127415462074149e-05, "tps": 236437, "wall": 7532.4} {"step": 27175, "train_loss": 3.1619367599487305, "lr": 5.126748195266303e-05, "tps": 236306, "wall": 7536.8} {"step": 27176, "train_loss": 3.2378499507904053, "lr": 5.1260811195995684e-05, "tps": 236175, "wall": 7541.3} {"step": 27177, "train_loss": 3.0751945972442627, "lr": 5.125414235081498e-05, "tps": 236045, "wall": 7545.7} {"step": 27178, "train_loss": 3.2187764644622803, "lr": 5.12474754171965e-05, "tps": 235914, "wall": 7550.2} {"step": 27179, "train_loss": 3.1337733268737793, "lr": 5.1240810395215734e-05, "tps": 235784, "wall": 7554.6} {"step": 27180, "train_loss": 3.040985107421875, "lr": 5.123414728494818e-05, "tps": 235651, "wall": 7559.2} {"step": 27181, "train_loss": 3.172791004180908, "lr": 5.1227486086469364e-05, "tps": 235522, "wall": 7563.6} {"step": 27182, "train_loss": 3.1909523010253906, "lr": 5.12208267998547e-05, "tps": 235392, "wall": 7568.1} {"step": 27183, "train_loss": 3.1831300258636475, "lr": 5.121416942517966e-05, "tps": 235261, "wall": 7572.5} {"step": 27184, "train_loss": 3.074983596801758, "lr": 5.1207513962519624e-05, "tps": 235132, "wall": 7577.0} {"step": 27185, "train_loss": 3.241295337677002, "lr": 5.1200860411950005e-05, "tps": 235003, "wall": 7581.4} {"step": 27186, "train_loss": 3.187305450439453, "lr": 5.119420877354617e-05, "tps": 234874, "wall": 7585.9} {"step": 27187, "train_loss": 3.2011771202087402, "lr": 5.118755904738348e-05, "tps": 234743, "wall": 7590.4} {"step": 27188, "train_loss": 3.18992280960083, "lr": 5.118091123353721e-05, "tps": 234614, "wall": 7594.8} {"step": 27189, "train_loss": 3.1906256675720215, "lr": 5.117426533208275e-05, "tps": 234485, "wall": 7599.3} {"step": 27190, "train_loss": 3.1824967861175537, "lr": 5.116762134309535e-05, "tps": 234357, "wall": 7603.7} {"step": 27191, "train_loss": 3.17832350730896, "lr": 5.1160979266650244e-05, "tps": 234228, "wall": 7608.2} {"step": 27192, "train_loss": 3.2160515785217285, "lr": 5.115433910282274e-05, "tps": 234100, "wall": 7612.6} {"step": 27193, "train_loss": 3.1611950397491455, "lr": 5.1147700851687995e-05, "tps": 233972, "wall": 7617.1} {"step": 27194, "train_loss": 3.1998276710510254, "lr": 5.114106451332119e-05, "tps": 233843, "wall": 7621.6} {"step": 27195, "train_loss": 3.2038204669952393, "lr": 5.11344300877976e-05, "tps": 233715, "wall": 7626.0} {"step": 27196, "train_loss": 3.1706247329711914, "lr": 5.1127797575192306e-05, "tps": 233587, "wall": 7630.5} {"step": 27197, "train_loss": 3.2370033264160156, "lr": 5.1121166975580424e-05, "tps": 233459, "wall": 7634.9} {"step": 27198, "train_loss": 3.2487940788269043, "lr": 5.111453828903714e-05, "tps": 233331, "wall": 7639.4} {"step": 27199, "train_loss": 3.1888742446899414, "lr": 5.1107911515637496e-05, "tps": 233204, "wall": 7643.8} {"step": 27200, "train_loss": 3.1706395149230957, "lr": 5.110128665545654e-05, "tps": 233077, "wall": 7648.3} {"step": 27201, "train_loss": 3.1372859477996826, "lr": 5.109466370856937e-05, "tps": 232950, "wall": 7652.7} {"step": 27202, "train_loss": 3.236797332763672, "lr": 5.1088042675050996e-05, "tps": 232823, "wall": 7657.2} {"step": 27203, "train_loss": 3.2134227752685547, "lr": 5.108142355497637e-05, "tps": 232696, "wall": 7661.7} {"step": 27204, "train_loss": 3.2868213653564453, "lr": 5.107480634842057e-05, "tps": 232569, "wall": 7666.1} {"step": 27205, "train_loss": 3.2187089920043945, "lr": 5.106819105545845e-05, "tps": 232443, "wall": 7670.6} {"step": 27206, "train_loss": 3.1859591007232666, "lr": 5.1061577676165026e-05, "tps": 232317, "wall": 7675.0} {"step": 27207, "train_loss": 3.1284401416778564, "lr": 5.1054966210615215e-05, "tps": 232188, "wall": 7679.5} {"step": 27208, "train_loss": 3.2612316608428955, "lr": 5.104835665888382e-05, "tps": 232063, "wall": 7684.0} {"step": 27209, "train_loss": 3.1128196716308594, "lr": 5.104174902104584e-05, "tps": 231938, "wall": 7688.4} {"step": 27210, "train_loss": 3.250460624694824, "lr": 5.103514329717606e-05, "tps": 231812, "wall": 7692.9} {"step": 27211, "train_loss": 3.195262908935547, "lr": 5.1028539487349305e-05, "tps": 231686, "wall": 7697.3} {"step": 27212, "train_loss": 3.234938621520996, "lr": 5.102193759164041e-05, "tps": 231561, "wall": 7701.8} {"step": 27213, "train_loss": 3.1717796325683594, "lr": 5.1015337610124134e-05, "tps": 231435, "wall": 7706.2} {"step": 27214, "train_loss": 3.2016239166259766, "lr": 5.100873954287524e-05, "tps": 231310, "wall": 7710.7} {"step": 27215, "train_loss": 3.111452341079712, "lr": 5.1002143389968516e-05, "tps": 231185, "wall": 7715.1} {"step": 27216, "train_loss": 3.125779628753662, "lr": 5.099554915147866e-05, "tps": 231060, "wall": 7719.6} {"step": 27217, "train_loss": 3.0649490356445312, "lr": 5.098895682748034e-05, "tps": 230935, "wall": 7724.0} {"step": 27218, "train_loss": 3.205374240875244, "lr": 5.098236641804827e-05, "tps": 230811, "wall": 7728.5} {"step": 27219, "train_loss": 3.1370184421539307, "lr": 5.0975777923257094e-05, "tps": 230686, "wall": 7732.9} {"step": 27220, "train_loss": 3.0396203994750977, "lr": 5.0969191343181445e-05, "tps": 230562, "wall": 7737.4} {"step": 27221, "train_loss": 3.132373809814453, "lr": 5.0962606677895953e-05, "tps": 230437, "wall": 7741.9} {"step": 27222, "train_loss": 3.2093639373779297, "lr": 5.095602392747519e-05, "tps": 230312, "wall": 7746.4} {"step": 27223, "train_loss": 3.076209545135498, "lr": 5.094944309199373e-05, "tps": 230189, "wall": 7750.8} {"step": 27224, "train_loss": 3.3123042583465576, "lr": 5.094286417152614e-05, "tps": 230065, "wall": 7755.3} {"step": 27225, "train_loss": 3.021054744720459, "lr": 5.0936287166146915e-05, "tps": 229941, "wall": 7759.7} {"step": 27226, "train_loss": 3.303537368774414, "lr": 5.092971207593058e-05, "tps": 229817, "wall": 7764.2} {"step": 27227, "train_loss": 3.177286386489868, "lr": 5.092313890095162e-05, "tps": 229694, "wall": 7768.6} {"step": 27228, "train_loss": 3.209934711456299, "lr": 5.091656764128449e-05, "tps": 229571, "wall": 7773.1} {"step": 27229, "train_loss": 3.140631914138794, "lr": 5.090999829700363e-05, "tps": 229448, "wall": 7777.5} {"step": 27230, "train_loss": 3.1319198608398438, "lr": 5.090343086818344e-05, "tps": 229326, "wall": 7782.0} {"step": 27231, "train_loss": 3.237156867980957, "lr": 5.0896865354898336e-05, "tps": 229203, "wall": 7786.4} {"step": 27232, "train_loss": 3.1931681632995605, "lr": 5.0890301757222714e-05, "tps": 229081, "wall": 7790.9} {"step": 27233, "train_loss": 3.2883105278015137, "lr": 5.0883740075230856e-05, "tps": 228958, "wall": 7795.3} {"step": 27234, "train_loss": 3.2189502716064453, "lr": 5.08771803089972e-05, "tps": 228833, "wall": 7799.9} {"step": 27235, "train_loss": 3.2088675498962402, "lr": 5.0870622458595964e-05, "tps": 228711, "wall": 7804.3} {"step": 27236, "train_loss": 3.17038631439209, "lr": 5.086406652410144e-05, "tps": 228589, "wall": 7808.8} {"step": 27237, "train_loss": 3.1799166202545166, "lr": 5.0857512505587954e-05, "tps": 228467, "wall": 7813.2} {"step": 27238, "train_loss": 3.181117534637451, "lr": 5.085096040312972e-05, "tps": 228345, "wall": 7817.7} {"step": 27239, "train_loss": 3.1712636947631836, "lr": 5.0844410216800934e-05, "tps": 228223, "wall": 7822.2} {"step": 27240, "train_loss": 3.2031967639923096, "lr": 5.083786194667583e-05, "tps": 228102, "wall": 7826.6} {"step": 27241, "train_loss": 3.144284725189209, "lr": 5.0831315592828585e-05, "tps": 227980, "wall": 7831.1} {"step": 27242, "train_loss": 3.177067756652832, "lr": 5.0824771155333316e-05, "tps": 227859, "wall": 7835.5} {"step": 27243, "train_loss": 3.180004358291626, "lr": 5.081822863426423e-05, "tps": 227738, "wall": 7840.0} {"step": 27244, "train_loss": 3.157362461090088, "lr": 5.0811688029695404e-05, "tps": 227617, "wall": 7844.4} {"step": 27245, "train_loss": 3.173346519470215, "lr": 5.080514934170091e-05, "tps": 227496, "wall": 7848.9} {"step": 27246, "train_loss": 3.058161735534668, "lr": 5.0798612570354844e-05, "tps": 227375, "wall": 7853.3} {"step": 27247, "train_loss": 3.21791672706604, "lr": 5.0792077715731255e-05, "tps": 227255, "wall": 7857.8} {"step": 27248, "train_loss": 3.0693418979644775, "lr": 5.0785544777904146e-05, "tps": 227133, "wall": 7862.3} {"step": 27249, "train_loss": 3.16092586517334, "lr": 5.0779013756947556e-05, "tps": 227013, "wall": 7866.7} {"step": 27250, "train_loss": 3.169294834136963, "lr": 5.0772484652935434e-05, "tps": 226892, "wall": 7871.2} {"step": 27251, "train_loss": 3.1272828578948975, "lr": 5.076595746594177e-05, "tps": 226773, "wall": 7875.7} {"step": 27252, "train_loss": 3.17519474029541, "lr": 5.0759432196040526e-05, "tps": 226653, "wall": 7880.1} {"step": 27253, "train_loss": 3.2073686122894287, "lr": 5.0752908843305537e-05, "tps": 226532, "wall": 7884.6} {"step": 27254, "train_loss": 3.343766689300537, "lr": 5.074638740781079e-05, "tps": 226413, "wall": 7889.0} {"step": 27255, "train_loss": 3.216646432876587, "lr": 5.073986788963012e-05, "tps": 226293, "wall": 7893.5} {"step": 27256, "train_loss": 3.128345012664795, "lr": 5.0733350288837355e-05, "tps": 226174, "wall": 7898.0} {"step": 27257, "train_loss": 3.169896364212036, "lr": 5.072683460550639e-05, "tps": 226055, "wall": 7902.4} {"step": 27258, "train_loss": 3.1549184322357178, "lr": 5.072032083971099e-05, "tps": 225936, "wall": 7906.9} {"step": 27259, "train_loss": 3.2266194820404053, "lr": 5.0713808991524934e-05, "tps": 225817, "wall": 7911.3} {"step": 27260, "train_loss": 3.1507205963134766, "lr": 5.070729906102203e-05, "tps": 225698, "wall": 7915.8} {"step": 27261, "train_loss": 3.259241819381714, "lr": 5.0700791048275995e-05, "tps": 225576, "wall": 7920.3} {"step": 27262, "train_loss": 3.1199231147766113, "lr": 5.069428495336055e-05, "tps": 225458, "wall": 7924.8} {"step": 27263, "train_loss": 3.1943116188049316, "lr": 5.068778077634943e-05, "tps": 225340, "wall": 7929.2} {"step": 27264, "train_loss": 3.168081283569336, "lr": 5.0681278517316264e-05, "tps": 225222, "wall": 7933.7} {"step": 27265, "train_loss": 3.1564550399780273, "lr": 5.0674778176334714e-05, "tps": 225104, "wall": 7938.1} {"step": 27266, "train_loss": 3.2451956272125244, "lr": 5.066827975347849e-05, "tps": 224986, "wall": 7942.6} {"step": 27267, "train_loss": 3.2203006744384766, "lr": 5.06617832488211e-05, "tps": 224868, "wall": 7947.0} {"step": 27268, "train_loss": 3.159991502761841, "lr": 5.065528866243624e-05, "tps": 224751, "wall": 7951.5} {"step": 27269, "train_loss": 3.2742834091186523, "lr": 5.064879599439741e-05, "tps": 224633, "wall": 7955.9} {"step": 27270, "train_loss": 3.197852611541748, "lr": 5.064230524477818e-05, "tps": 224515, "wall": 7960.4} {"step": 27271, "train_loss": 3.0458197593688965, "lr": 5.063581641365207e-05, "tps": 224398, "wall": 7964.8} {"step": 27272, "train_loss": 3.11500883102417, "lr": 5.062932950109263e-05, "tps": 224281, "wall": 7969.3} {"step": 27273, "train_loss": 3.2464396953582764, "lr": 5.062284450717324e-05, "tps": 224165, "wall": 7973.7} {"step": 27274, "train_loss": 3.1068413257598877, "lr": 5.061636143196748e-05, "tps": 224046, "wall": 7978.2} {"step": 27275, "train_loss": 3.2065649032592773, "lr": 5.060988027554876e-05, "tps": 223930, "wall": 7982.7} {"step": 27276, "train_loss": 3.085317850112915, "lr": 5.060340103799042e-05, "tps": 223813, "wall": 7987.1} {"step": 27277, "train_loss": 3.156914710998535, "lr": 5.059692371936597e-05, "tps": 223697, "wall": 7991.6} {"step": 27278, "train_loss": 3.17340087890625, "lr": 5.059044831974872e-05, "tps": 223580, "wall": 7996.0} {"step": 27279, "train_loss": 3.0902626514434814, "lr": 5.0583974839212e-05, "tps": 223464, "wall": 8000.5} {"step": 27280, "train_loss": 3.0859415531158447, "lr": 5.057750327782922e-05, "tps": 223348, "wall": 8004.9} {"step": 27281, "train_loss": 3.2502613067626953, "lr": 5.057103363567366e-05, "tps": 223232, "wall": 8009.4} {"step": 27282, "train_loss": 3.1847777366638184, "lr": 5.056456591281855e-05, "tps": 223116, "wall": 8013.8} {"step": 27283, "train_loss": 3.2928853034973145, "lr": 5.055810010933723e-05, "tps": 223000, "wall": 8018.3} {"step": 27284, "train_loss": 3.2105154991149902, "lr": 5.05516362253029e-05, "tps": 222885, "wall": 8022.7} {"step": 27285, "train_loss": 3.2059831619262695, "lr": 5.054517426078882e-05, "tps": 222769, "wall": 8027.2} {"step": 27286, "train_loss": 3.037755012512207, "lr": 5.0538714215868186e-05, "tps": 222654, "wall": 8031.7} {"step": 27287, "train_loss": 3.256491184234619, "lr": 5.0532256090614125e-05, "tps": 222538, "wall": 8036.1} {"step": 27288, "train_loss": 3.208051919937134, "lr": 5.052579988509987e-05, "tps": 222422, "wall": 8040.6} {"step": 27289, "train_loss": 3.2360129356384277, "lr": 5.0519345599398514e-05, "tps": 222307, "wall": 8045.1} {"step": 27290, "train_loss": 3.1394474506378174, "lr": 5.051289323358317e-05, "tps": 222193, "wall": 8049.5} {"step": 27291, "train_loss": 3.2143776416778564, "lr": 5.050644278772695e-05, "tps": 222078, "wall": 8053.9} {"step": 27292, "train_loss": 3.181474208831787, "lr": 5.049999426190293e-05, "tps": 221964, "wall": 8058.4} {"step": 27293, "train_loss": 3.137155771255493, "lr": 5.04935476561841e-05, "tps": 221849, "wall": 8062.8} {"step": 27294, "train_loss": 3.2139225006103516, "lr": 5.0487102970643574e-05, "tps": 221735, "wall": 8067.3} {"step": 27295, "train_loss": 3.2602250576019287, "lr": 5.0480660205354325e-05, "tps": 221621, "wall": 8071.7} {"step": 27296, "train_loss": 3.1421165466308594, "lr": 5.0474219360389274e-05, "tps": 221507, "wall": 8076.2} {"step": 27297, "train_loss": 3.1653053760528564, "lr": 5.0467780435821474e-05, "tps": 221393, "wall": 8080.6} {"step": 27298, "train_loss": 3.0735995769500732, "lr": 5.046134343172383e-05, "tps": 221279, "wall": 8085.1} {"step": 27299, "train_loss": 3.1396875381469727, "lr": 5.045490834816925e-05, "tps": 221166, "wall": 8089.5} {"step": 27300, "train_loss": 3.1028120517730713, "lr": 5.044847518523065e-05, "tps": 221052, "wall": 8094.0} {"step": 27301, "train_loss": 3.1392288208007812, "lr": 5.0442043942980896e-05, "tps": 220937, "wall": 8098.5} {"step": 27302, "train_loss": 3.219428539276123, "lr": 5.043561462149282e-05, "tps": 220824, "wall": 8102.9} {"step": 27303, "train_loss": 3.1117067337036133, "lr": 5.042918722083929e-05, "tps": 220710, "wall": 8107.4} {"step": 27304, "train_loss": 3.2143282890319824, "lr": 5.042276174109308e-05, "tps": 220597, "wall": 8111.9} {"step": 27305, "train_loss": 3.1517648696899414, "lr": 5.041633818232704e-05, "tps": 220484, "wall": 8116.3} {"step": 27306, "train_loss": 3.201848030090332, "lr": 5.040991654461388e-05, "tps": 220371, "wall": 8120.8} {"step": 27307, "train_loss": 3.2190234661102295, "lr": 5.040349682802633e-05, "tps": 220258, "wall": 8125.2} {"step": 27308, "train_loss": 3.0805790424346924, "lr": 5.0397079032637184e-05, "tps": 220146, "wall": 8129.7} {"step": 27309, "train_loss": 3.187687873840332, "lr": 5.039066315851908e-05, "tps": 220034, "wall": 8134.1} {"step": 27310, "train_loss": 3.131251811981201, "lr": 5.038424920574471e-05, "tps": 219921, "wall": 8138.6} {"step": 27311, "train_loss": 3.311023712158203, "lr": 5.0377837174386776e-05, "tps": 219809, "wall": 8143.0} {"step": 27312, "train_loss": 3.203540563583374, "lr": 5.0371427064517874e-05, "tps": 219697, "wall": 8147.5} {"step": 27313, "train_loss": 3.1109395027160645, "lr": 5.036501887621058e-05, "tps": 219585, "wall": 8151.9} {"step": 27314, "train_loss": 3.091524124145508, "lr": 5.035861260953757e-05, "tps": 219473, "wall": 8156.4} {"step": 27315, "train_loss": 3.195983409881592, "lr": 5.035220826457137e-05, "tps": 219360, "wall": 8160.9} {"step": 27316, "train_loss": 3.2430877685546875, "lr": 5.03458058413845e-05, "tps": 219248, "wall": 8165.4} {"step": 27317, "train_loss": 3.2600302696228027, "lr": 5.0339405340049564e-05, "tps": 219137, "wall": 8169.8} {"step": 27318, "train_loss": 3.2708630561828613, "lr": 5.0333006760639e-05, "tps": 219025, "wall": 8174.3} {"step": 27319, "train_loss": 3.1346631050109863, "lr": 5.0326610103225304e-05, "tps": 218914, "wall": 8178.7} {"step": 27320, "train_loss": 3.256223201751709, "lr": 5.032021536788095e-05, "tps": 218803, "wall": 8183.2} {"step": 27321, "train_loss": 3.218099355697632, "lr": 5.0313822554678366e-05, "tps": 218692, "wall": 8187.6} {"step": 27322, "train_loss": 3.163957118988037, "lr": 5.030743166369002e-05, "tps": 218581, "wall": 8192.1} {"step": 27323, "train_loss": 3.153690814971924, "lr": 5.030104269498826e-05, "tps": 218470, "wall": 8196.6} {"step": 27324, "train_loss": 3.1487226486206055, "lr": 5.0294655648645425e-05, "tps": 218359, "wall": 8201.0} {"step": 27325, "train_loss": 3.13642954826355, "lr": 5.028827052473397e-05, "tps": 218249, "wall": 8205.5} {"step": 27326, "train_loss": 3.2154886722564697, "lr": 5.028188732332615e-05, "tps": 218138, "wall": 8209.9} {"step": 27327, "train_loss": 3.1193974018096924, "lr": 5.027550604449426e-05, "tps": 218028, "wall": 8214.4} {"step": 27328, "train_loss": 3.0293149948120117, "lr": 5.0269126688310656e-05, "tps": 217915, "wall": 8218.9} {"step": 27329, "train_loss": 3.1587913036346436, "lr": 5.026274925484755e-05, "tps": 217806, "wall": 8223.4} {"step": 27330, "train_loss": 3.191941738128662, "lr": 5.0256373744177196e-05, "tps": 217695, "wall": 8227.8} {"step": 27331, "train_loss": 3.048107147216797, "lr": 5.0250000156371845e-05, "tps": 217586, "wall": 8232.3} {"step": 27332, "train_loss": 3.1893255710601807, "lr": 5.024362849150368e-05, "tps": 217475, "wall": 8236.8} {"step": 27333, "train_loss": 3.251253843307495, "lr": 5.023725874964483e-05, "tps": 217366, "wall": 8241.2} {"step": 27334, "train_loss": 3.204496383666992, "lr": 5.023089093086754e-05, "tps": 217256, "wall": 8245.7} {"step": 27335, "train_loss": 3.221022605895996, "lr": 5.02245250352439e-05, "tps": 217147, "wall": 8250.1} {"step": 27336, "train_loss": 3.2378852367401123, "lr": 5.0218161062846e-05, "tps": 217038, "wall": 8254.6} {"step": 27337, "train_loss": 3.145589828491211, "lr": 5.021179901374597e-05, "tps": 216929, "wall": 8259.0} {"step": 27338, "train_loss": 3.2635979652404785, "lr": 5.020543888801587e-05, "tps": 216820, "wall": 8263.5} {"step": 27339, "train_loss": 3.1221628189086914, "lr": 5.019908068572773e-05, "tps": 216710, "wall": 8267.9} {"step": 27340, "train_loss": 3.1208248138427734, "lr": 5.019272440695361e-05, "tps": 216601, "wall": 8272.4} {"step": 27341, "train_loss": 3.2185466289520264, "lr": 5.018637005176547e-05, "tps": 216493, "wall": 8276.9} {"step": 27342, "train_loss": 3.251298666000366, "lr": 5.018001762023534e-05, "tps": 216383, "wall": 8281.4} {"step": 27343, "train_loss": 3.1687045097351074, "lr": 5.0173667112435154e-05, "tps": 216274, "wall": 8285.8} {"step": 27344, "train_loss": 3.1282858848571777, "lr": 5.016731852843684e-05, "tps": 216166, "wall": 8290.3} {"step": 27345, "train_loss": 3.2507741451263428, "lr": 5.016097186831234e-05, "tps": 216058, "wall": 8294.7} {"step": 27346, "train_loss": 3.251809597015381, "lr": 5.0154627132133545e-05, "tps": 215950, "wall": 8299.2} {"step": 27347, "train_loss": 3.181213855743408, "lr": 5.0148284319972305e-05, "tps": 215842, "wall": 8303.6} {"step": 27348, "train_loss": 3.1776530742645264, "lr": 5.014194343190052e-05, "tps": 215734, "wall": 8308.1} {"step": 27349, "train_loss": 3.129016399383545, "lr": 5.013560446798996e-05, "tps": 215626, "wall": 8312.6} {"step": 27350, "train_loss": 3.1600542068481445, "lr": 5.012926742831245e-05, "tps": 215519, "wall": 8317.0} {"step": 27351, "train_loss": 3.216371536254883, "lr": 5.012293231293982e-05, "tps": 215411, "wall": 8321.5} {"step": 27352, "train_loss": 3.1555726528167725, "lr": 5.011659912194381e-05, "tps": 215303, "wall": 8325.9} {"step": 27353, "train_loss": 3.1971211433410645, "lr": 5.011026785539611e-05, "tps": 215196, "wall": 8330.4} {"step": 27354, "train_loss": 3.093890428543091, "lr": 5.010393851336852e-05, "tps": 215089, "wall": 8334.8} {"step": 27355, "train_loss": 3.237351417541504, "lr": 5.009761109593272e-05, "tps": 214981, "wall": 8339.3} {"step": 27356, "train_loss": 3.2712113857269287, "lr": 5.009128560316033e-05, "tps": 214874, "wall": 8343.8} {"step": 27357, "train_loss": 3.0548934936523438, "lr": 5.0084962035123084e-05, "tps": 214767, "wall": 8348.3} {"step": 27358, "train_loss": 3.115492820739746, "lr": 5.007864039189255e-05, "tps": 214660, "wall": 8352.7} {"step": 27359, "train_loss": 3.2488889694213867, "lr": 5.0072320673540406e-05, "tps": 214554, "wall": 8357.2} {"step": 27360, "train_loss": 3.0818610191345215, "lr": 5.006600288013818e-05, "tps": 214448, "wall": 8361.6} {"step": 27361, "train_loss": 3.2479729652404785, "lr": 5.005968701175746e-05, "tps": 214341, "wall": 8366.1} {"step": 27362, "train_loss": 3.181743621826172, "lr": 5.005337306846983e-05, "tps": 214235, "wall": 8370.5} {"step": 27363, "train_loss": 3.1776468753814697, "lr": 5.0047061050346775e-05, "tps": 214129, "wall": 8375.0} {"step": 27364, "train_loss": 3.1774168014526367, "lr": 5.004075095745979e-05, "tps": 214023, "wall": 8379.4} {"step": 27365, "train_loss": 3.144423246383667, "lr": 5.003444278988037e-05, "tps": 213917, "wall": 8383.9} {"step": 27366, "train_loss": 3.104585647583008, "lr": 5.002813654768001e-05, "tps": 213811, "wall": 8388.3} {"step": 27367, "train_loss": 3.1222386360168457, "lr": 5.002183223093008e-05, "tps": 213706, "wall": 8392.8} {"step": 27368, "train_loss": 3.212414264678955, "lr": 5.0015529839702035e-05, "tps": 213600, "wall": 8397.2} {"step": 27369, "train_loss": 3.103144884109497, "lr": 5.000922937406729e-05, "tps": 213493, "wall": 8401.7} {"step": 27370, "train_loss": 3.1662185192108154, "lr": 5.000293083409716e-05, "tps": 213388, "wall": 8406.2} {"step": 27371, "train_loss": 3.159083366394043, "lr": 4.999663421986305e-05, "tps": 213283, "wall": 8410.6} {"step": 27372, "train_loss": 3.0790200233459473, "lr": 4.999033953143627e-05, "tps": 213178, "wall": 8415.1} {"step": 27373, "train_loss": 3.1162807941436768, "lr": 4.998404676888809e-05, "tps": 213073, "wall": 8419.5} {"step": 27374, "train_loss": 3.1077687740325928, "lr": 4.997775593228984e-05, "tps": 212968, "wall": 8424.0} {"step": 27375, "train_loss": 3.236323833465576, "lr": 4.997146702171276e-05, "tps": 212864, "wall": 8428.4} {"step": 27376, "train_loss": 3.113543748855591, "lr": 4.996518003722811e-05, "tps": 212759, "wall": 8432.9} {"step": 27377, "train_loss": 3.2330689430236816, "lr": 4.995889497890712e-05, "tps": 212654, "wall": 8437.4} {"step": 27378, "train_loss": 3.2291717529296875, "lr": 4.995261184682092e-05, "tps": 212550, "wall": 8441.8} {"step": 27379, "train_loss": 3.187366247177124, "lr": 4.9946330641040764e-05, "tps": 212445, "wall": 8446.3} {"step": 27380, "train_loss": 3.1950464248657227, "lr": 4.994005136163778e-05, "tps": 212341, "wall": 8450.7} {"step": 27381, "train_loss": 3.3096728324890137, "lr": 4.993377400868308e-05, "tps": 212237, "wall": 8455.2} {"step": 27382, "train_loss": 3.146143913269043, "lr": 4.99274985822478e-05, "tps": 212131, "wall": 8459.7} {"step": 27383, "train_loss": 3.1992299556732178, "lr": 4.9921225082403005e-05, "tps": 212028, "wall": 8464.2} {"step": 27384, "train_loss": 3.1877875328063965, "lr": 4.9914953509219766e-05, "tps": 211924, "wall": 8468.6} {"step": 27385, "train_loss": 3.331709146499634, "lr": 4.990868386276916e-05, "tps": 211820, "wall": 8473.1} {"step": 27386, "train_loss": 3.1554105281829834, "lr": 4.990241614312216e-05, "tps": 211716, "wall": 8477.5} {"step": 27387, "train_loss": 3.208237648010254, "lr": 4.9896150350349796e-05, "tps": 211613, "wall": 8482.0} {"step": 27388, "train_loss": 3.239776611328125, "lr": 4.9889886484523066e-05, "tps": 211510, "wall": 8486.4} {"step": 27389, "train_loss": 3.1777400970458984, "lr": 4.9883624545712886e-05, "tps": 211405, "wall": 8490.9} {"step": 27390, "train_loss": 3.161027431488037, "lr": 4.9877364533990196e-05, "tps": 211302, "wall": 8495.4} {"step": 27391, "train_loss": 3.061182975769043, "lr": 4.987110644942596e-05, "tps": 211199, "wall": 8499.9} {"step": 27392, "train_loss": 3.219301223754883, "lr": 4.986485029209099e-05, "tps": 211095, "wall": 8504.4} {"step": 27393, "train_loss": 3.190890312194824, "lr": 4.985859606205623e-05, "tps": 210993, "wall": 8508.8} {"step": 27394, "train_loss": 3.2220590114593506, "lr": 4.985234375939251e-05, "tps": 210890, "wall": 8513.2} {"step": 27395, "train_loss": 3.1953940391540527, "lr": 4.984609338417062e-05, "tps": 210787, "wall": 8517.7} {"step": 27396, "train_loss": 3.3113012313842773, "lr": 4.983984493646139e-05, "tps": 210683, "wall": 8522.2} {"step": 27397, "train_loss": 3.202725410461426, "lr": 4.983359841633566e-05, "tps": 210581, "wall": 8526.7} {"step": 27398, "train_loss": 3.106584072113037, "lr": 4.982735382386406e-05, "tps": 210478, "wall": 8531.1} {"step": 27399, "train_loss": 3.257345676422119, "lr": 4.982111115911743e-05, "tps": 210376, "wall": 8535.6} {"step": 27400, "train_loss": 3.204772472381592, "lr": 4.981487042216643e-05, "tps": 210275, "wall": 8540.0} {"step": 27401, "train_loss": 3.0896353721618652, "lr": 4.9808631613081825e-05, "tps": 210173, "wall": 8544.5} {"step": 27402, "train_loss": 3.1649765968322754, "lr": 4.980239473193425e-05, "tps": 210071, "wall": 8548.9} {"step": 27403, "train_loss": 3.2646889686584473, "lr": 4.97961597787943e-05, "tps": 209969, "wall": 8553.4} {"step": 27404, "train_loss": 3.1395020484924316, "lr": 4.9789926753732716e-05, "tps": 209866, "wall": 8557.9} {"step": 27405, "train_loss": 3.165247917175293, "lr": 4.978369565682003e-05, "tps": 209765, "wall": 8562.3} {"step": 27406, "train_loss": 3.106668472290039, "lr": 4.9777466488126855e-05, "tps": 209664, "wall": 8566.8} {"step": 27407, "train_loss": 3.1723251342773438, "lr": 4.977123924772374e-05, "tps": 209562, "wall": 8571.2} {"step": 27408, "train_loss": 3.1694726943969727, "lr": 4.976501393568126e-05, "tps": 209461, "wall": 8575.7} {"step": 27409, "train_loss": 3.2643790245056152, "lr": 4.9758790552069866e-05, "tps": 209358, "wall": 8580.2} {"step": 27410, "train_loss": 3.1613595485687256, "lr": 4.9752569096960136e-05, "tps": 209258, "wall": 8584.7} {"step": 27411, "train_loss": 3.0956015586853027, "lr": 4.974634957042251e-05, "tps": 209157, "wall": 8589.1} {"step": 27412, "train_loss": 3.1669199466705322, "lr": 4.974013197252743e-05, "tps": 209056, "wall": 8593.6} {"step": 27413, "train_loss": 3.286893367767334, "lr": 4.973391630334536e-05, "tps": 208955, "wall": 8598.0} {"step": 27414, "train_loss": 3.1378769874572754, "lr": 4.9727702562946696e-05, "tps": 208854, "wall": 8602.5} {"step": 27415, "train_loss": 3.177304267883301, "lr": 4.972149075140182e-05, "tps": 208754, "wall": 8606.9} {"step": 27416, "train_loss": 3.125035285949707, "lr": 4.971528086878111e-05, "tps": 208654, "wall": 8611.4} {"step": 27417, "train_loss": 3.126032590866089, "lr": 4.970907291515491e-05, "tps": 208554, "wall": 8615.8} {"step": 27418, "train_loss": 3.1409614086151123, "lr": 4.970286689059356e-05, "tps": 208453, "wall": 8620.3} {"step": 27419, "train_loss": 3.0525903701782227, "lr": 4.969666279516735e-05, "tps": 208353, "wall": 8624.7} {"step": 27420, "train_loss": 3.17539381980896, "lr": 4.969046062894652e-05, "tps": 208253, "wall": 8629.2} {"step": 27421, "train_loss": 3.1710658073425293, "lr": 4.96842603920014e-05, "tps": 208153, "wall": 8633.7} {"step": 27422, "train_loss": 3.1848981380462646, "lr": 4.96780620844022e-05, "tps": 208052, "wall": 8638.2} {"step": 27423, "train_loss": 3.1456003189086914, "lr": 4.9671865706219085e-05, "tps": 207952, "wall": 8642.6} {"step": 27424, "train_loss": 3.113375663757324, "lr": 4.966567125752232e-05, "tps": 207853, "wall": 8647.1} {"step": 27425, "train_loss": 3.0657362937927246, "lr": 4.965947873838205e-05, "tps": 207753, "wall": 8651.5} {"step": 27426, "train_loss": 3.086141347885132, "lr": 4.96532881488684e-05, "tps": 207654, "wall": 8656.0} {"step": 27427, "train_loss": 3.1489293575286865, "lr": 4.9647099489051526e-05, "tps": 207555, "wall": 8660.5} {"step": 27428, "train_loss": 3.14935302734375, "lr": 4.964091275900155e-05, "tps": 207456, "wall": 8664.9} {"step": 27429, "train_loss": 3.213779926300049, "lr": 4.963472795878848e-05, "tps": 207357, "wall": 8669.4} {"step": 27430, "train_loss": 3.2501420974731445, "lr": 4.962854508848246e-05, "tps": 207258, "wall": 8673.8} {"step": 27431, "train_loss": 3.138662338256836, "lr": 4.962236414815352e-05, "tps": 207159, "wall": 8678.3} {"step": 27432, "train_loss": 3.1312761306762695, "lr": 4.961618513787161e-05, "tps": 207060, "wall": 8682.7} {"step": 27433, "train_loss": 3.1498303413391113, "lr": 4.961000805770679e-05, "tps": 206962, "wall": 8687.2} {"step": 27434, "train_loss": 3.2856404781341553, "lr": 4.960383290772903e-05, "tps": 206863, "wall": 8691.6} {"step": 27435, "train_loss": 3.2183384895324707, "lr": 4.9597659688008247e-05, "tps": 206765, "wall": 8696.1} {"step": 27436, "train_loss": 3.1353814601898193, "lr": 4.959148839861442e-05, "tps": 206665, "wall": 8700.6} {"step": 27437, "train_loss": 3.2357492446899414, "lr": 4.95853190396174e-05, "tps": 206567, "wall": 8705.0} {"step": 27438, "train_loss": 3.1884326934814453, "lr": 4.9579151611087116e-05, "tps": 206469, "wall": 8709.5} {"step": 27439, "train_loss": 3.2257485389709473, "lr": 4.957298611309344e-05, "tps": 206371, "wall": 8713.9} {"step": 27440, "train_loss": 3.2007384300231934, "lr": 4.956682254570617e-05, "tps": 206273, "wall": 8718.4} {"step": 27441, "train_loss": 3.0865731239318848, "lr": 4.9560660908995175e-05, "tps": 206175, "wall": 8722.9} {"step": 27442, "train_loss": 3.1496872901916504, "lr": 4.9554501203030244e-05, "tps": 206077, "wall": 8727.3} {"step": 27443, "train_loss": 3.1507091522216797, "lr": 4.95483434278811e-05, "tps": 205980, "wall": 8731.8} {"step": 27444, "train_loss": 3.1082634925842285, "lr": 4.9542187583617585e-05, "tps": 205882, "wall": 8736.2} {"step": 27445, "train_loss": 3.106616258621216, "lr": 4.953603367030939e-05, "tps": 205785, "wall": 8740.7} {"step": 27446, "train_loss": 3.142169952392578, "lr": 4.952988168802619e-05, "tps": 205688, "wall": 8745.1} {"step": 27447, "train_loss": 3.10677433013916, "lr": 4.952373163683776e-05, "tps": 205590, "wall": 8749.6} {"step": 27448, "train_loss": 3.2021169662475586, "lr": 4.951758351681369e-05, "tps": 205493, "wall": 8754.0} {"step": 27449, "train_loss": 3.1460325717926025, "lr": 4.9511437328023656e-05, "tps": 205395, "wall": 8758.5} {"step": 27450, "train_loss": 3.2257637977600098, "lr": 4.95052930705373e-05, "tps": 205298, "wall": 8763.0} {"step": 27451, "train_loss": 3.124713897705078, "lr": 4.949915074442421e-05, "tps": 205201, "wall": 8767.4} {"step": 27452, "train_loss": 3.2036097049713135, "lr": 4.949301034975394e-05, "tps": 205105, "wall": 8771.9} {"step": 27453, "train_loss": 3.056959629058838, "lr": 4.9486871886596084e-05, "tps": 205008, "wall": 8776.3} {"step": 27454, "train_loss": 3.1455821990966797, "lr": 4.9480735355020156e-05, "tps": 204912, "wall": 8780.8} {"step": 27455, "train_loss": 3.1229841709136963, "lr": 4.9474600755095716e-05, "tps": 204815, "wall": 8785.3} {"step": 27456, "train_loss": 3.1588876247406006, "lr": 4.9468468086892206e-05, "tps": 204719, "wall": 8789.7} {"step": 27457, "train_loss": 3.145806074142456, "lr": 4.9462337350479096e-05, "tps": 204622, "wall": 8794.2} {"step": 27458, "train_loss": 3.2027506828308105, "lr": 4.945620854592589e-05, "tps": 204526, "wall": 8798.6} {"step": 27459, "train_loss": 3.134672164916992, "lr": 4.945008167330196e-05, "tps": 204430, "wall": 8803.1} {"step": 27460, "train_loss": 3.1945242881774902, "lr": 4.944395673267672e-05, "tps": 204335, "wall": 8807.5} {"step": 27461, "train_loss": 3.175994873046875, "lr": 4.9437833724119596e-05, "tps": 204239, "wall": 8812.0} {"step": 27462, "train_loss": 3.273007869720459, "lr": 4.9431712647699914e-05, "tps": 204143, "wall": 8816.4} {"step": 27463, "train_loss": 3.113194465637207, "lr": 4.942559350348698e-05, "tps": 204046, "wall": 8820.9} {"step": 27464, "train_loss": 3.170498847961426, "lr": 4.941947629155018e-05, "tps": 203951, "wall": 8825.4} {"step": 27465, "train_loss": 3.1238155364990234, "lr": 4.941336101195879e-05, "tps": 203855, "wall": 8829.8} {"step": 27466, "train_loss": 3.19132137298584, "lr": 4.9407247664782044e-05, "tps": 203760, "wall": 8834.3} {"step": 27467, "train_loss": 3.2150380611419678, "lr": 4.940113625008925e-05, "tps": 203665, "wall": 8838.7} {"step": 27468, "train_loss": 3.0517756938934326, "lr": 4.939502676794962e-05, "tps": 203570, "wall": 8843.2} {"step": 27469, "train_loss": 3.163177967071533, "lr": 4.938891921843233e-05, "tps": 203474, "wall": 8847.6} {"step": 27470, "train_loss": 3.08502197265625, "lr": 4.938281360160663e-05, "tps": 203380, "wall": 8852.1} {"step": 27471, "train_loss": 3.231215000152588, "lr": 4.937670991754159e-05, "tps": 203285, "wall": 8856.6} {"step": 27472, "train_loss": 3.1092543601989746, "lr": 4.9370608166306476e-05, "tps": 203190, "wall": 8861.0} {"step": 27473, "train_loss": 3.284285068511963, "lr": 4.9364508347970317e-05, "tps": 203095, "wall": 8865.5} {"step": 27474, "train_loss": 3.1772146224975586, "lr": 4.9358410462602205e-05, "tps": 203000, "wall": 8869.9} {"step": 27475, "train_loss": 3.1739537715911865, "lr": 4.9352314510271286e-05, "tps": 202906, "wall": 8874.4} {"step": 27476, "train_loss": 3.1645169258117676, "lr": 4.93462204910466e-05, "tps": 202810, "wall": 8878.9} {"step": 27477, "train_loss": 3.102841377258301, "lr": 4.934012840499712e-05, "tps": 202716, "wall": 8883.4} {"step": 27478, "train_loss": 3.2581610679626465, "lr": 4.933403825219191e-05, "tps": 202621, "wall": 8887.8} {"step": 27479, "train_loss": 3.113651990890503, "lr": 4.932795003269997e-05, "tps": 202527, "wall": 8892.3} {"step": 27480, "train_loss": 3.188736915588379, "lr": 4.9321863746590207e-05, "tps": 202433, "wall": 8896.7} {"step": 27481, "train_loss": 3.120715618133545, "lr": 4.9315779393931634e-05, "tps": 202339, "wall": 8901.2} {"step": 27482, "train_loss": 3.1994004249572754, "lr": 4.930969697479314e-05, "tps": 202246, "wall": 8905.6} {"step": 27483, "train_loss": 3.146407127380371, "lr": 4.930361648924361e-05, "tps": 202152, "wall": 8910.1} {"step": 27484, "train_loss": 3.1301944255828857, "lr": 4.9297537937351984e-05, "tps": 202058, "wall": 8914.5} {"step": 27485, "train_loss": 3.104192018508911, "lr": 4.9291461319187074e-05, "tps": 201965, "wall": 8919.0} {"step": 27486, "train_loss": 3.2318215370178223, "lr": 4.92853866348177e-05, "tps": 201872, "wall": 8923.4} {"step": 27487, "train_loss": 3.2291550636291504, "lr": 4.927931388431272e-05, "tps": 201778, "wall": 8927.9} {"step": 27488, "train_loss": 3.246532440185547, "lr": 4.9273243067740917e-05, "tps": 201685, "wall": 8932.3} {"step": 27489, "train_loss": 3.214838981628418, "lr": 4.926717418517103e-05, "tps": 201592, "wall": 8936.8} {"step": 27490, "train_loss": 3.097254753112793, "lr": 4.926110723667184e-05, "tps": 201498, "wall": 8941.3} {"step": 27491, "train_loss": 3.210291862487793, "lr": 4.9255042222312054e-05, "tps": 201404, "wall": 8945.7} {"step": 27492, "train_loss": 3.120191812515259, "lr": 4.924897914216041e-05, "tps": 201312, "wall": 8950.2} {"step": 27493, "train_loss": 3.2096729278564453, "lr": 4.924291799628556e-05, "tps": 201219, "wall": 8954.7} {"step": 27494, "train_loss": 3.1361522674560547, "lr": 4.9236858784756166e-05, "tps": 201126, "wall": 8959.1} {"step": 27495, "train_loss": 3.1287896633148193, "lr": 4.923080150764088e-05, "tps": 201033, "wall": 8963.6} {"step": 27496, "train_loss": 3.2390079498291016, "lr": 4.922474616500832e-05, "tps": 200940, "wall": 8968.0} {"step": 27497, "train_loss": 3.102632522583008, "lr": 4.921869275692704e-05, "tps": 200848, "wall": 8972.5} {"step": 27498, "train_loss": 3.2690515518188477, "lr": 4.921264128346569e-05, "tps": 200755, "wall": 8977.0} {"step": 27499, "train_loss": 3.18442440032959, "lr": 4.920659174469277e-05, "tps": 200663, "wall": 8981.4} {"step": 27500, "train_loss": 3.198340654373169, "lr": 4.92005441406768e-05, "tps": 200571, "wall": 8985.9} {"step": 27501, "train_loss": 3.106149673461914, "lr": 4.9194498471486314e-05, "tps": 200475, "wall": 8990.5} {"step": 27502, "train_loss": 3.133892059326172, "lr": 4.918845473718981e-05, "tps": 200383, "wall": 8995.0} {"step": 27503, "train_loss": 3.0838003158569336, "lr": 4.9182412937855694e-05, "tps": 200290, "wall": 8999.5} {"step": 27504, "train_loss": 3.1945178508758545, "lr": 4.917637307355248e-05, "tps": 200198, "wall": 9003.9} {"step": 27505, "train_loss": 3.1260533332824707, "lr": 4.917033514434854e-05, "tps": 200107, "wall": 9008.3} {"step": 27506, "train_loss": 3.2756054401397705, "lr": 4.916429915031227e-05, "tps": 200015, "wall": 9012.8} {"step": 27507, "train_loss": 3.2613208293914795, "lr": 4.915826509151207e-05, "tps": 199923, "wall": 9017.3} {"step": 27508, "train_loss": 3.2103333473205566, "lr": 4.915223296801626e-05, "tps": 199832, "wall": 9021.7} {"step": 27509, "train_loss": 3.2111153602600098, "lr": 4.9146202779893246e-05, "tps": 199740, "wall": 9026.2} {"step": 27510, "train_loss": 3.09909987449646, "lr": 4.9140174527211294e-05, "tps": 199649, "wall": 9030.6} {"step": 27511, "train_loss": 3.216805934906006, "lr": 4.913414821003863e-05, "tps": 199558, "wall": 9035.1} {"step": 27512, "train_loss": 3.012376546859741, "lr": 4.912812382844363e-05, "tps": 199467, "wall": 9039.5} {"step": 27513, "train_loss": 3.186509609222412, "lr": 4.912210138249449e-05, "tps": 199375, "wall": 9044.0} {"step": 27514, "train_loss": 3.168182373046875, "lr": 4.9116080872259385e-05, "tps": 199285, "wall": 9048.5} {"step": 27515, "train_loss": 3.126729965209961, "lr": 4.9110062297806605e-05, "tps": 199194, "wall": 9052.9} {"step": 27516, "train_loss": 3.1186718940734863, "lr": 4.910404565920427e-05, "tps": 199103, "wall": 9057.4} {"step": 27517, "train_loss": 3.1282663345336914, "lr": 4.9098030956520526e-05, "tps": 199011, "wall": 9061.9} {"step": 27518, "train_loss": 3.1119558811187744, "lr": 4.9092018189823566e-05, "tps": 198921, "wall": 9066.3} {"step": 27519, "train_loss": 3.1960744857788086, "lr": 4.9086007359181465e-05, "tps": 198831, "wall": 9070.8} {"step": 27520, "train_loss": 3.199770927429199, "lr": 4.9079998464662304e-05, "tps": 198740, "wall": 9075.2} {"step": 27521, "train_loss": 3.343193769454956, "lr": 4.9073991506334165e-05, "tps": 198650, "wall": 9079.7} {"step": 27522, "train_loss": 3.1911678314208984, "lr": 4.906798648426513e-05, "tps": 198560, "wall": 9084.1} {"step": 27523, "train_loss": 3.313511610031128, "lr": 4.9061983398523146e-05, "tps": 198470, "wall": 9088.6} {"step": 27524, "train_loss": 3.2072277069091797, "lr": 4.905598224917629e-05, "tps": 198380, "wall": 9093.0} {"step": 27525, "train_loss": 3.2014529705047607, "lr": 4.90499830362925e-05, "tps": 198290, "wall": 9097.5} {"step": 27526, "train_loss": 3.2416248321533203, "lr": 4.904398575993977e-05, "tps": 198200, "wall": 9101.9} {"step": 27527, "train_loss": 3.128579616546631, "lr": 4.903799042018602e-05, "tps": 198110, "wall": 9106.4} {"step": 27528, "train_loss": 3.1566002368927, "lr": 4.9031997017099135e-05, "tps": 198021, "wall": 9110.8} {"step": 27529, "train_loss": 3.188007354736328, "lr": 4.9026005550747044e-05, "tps": 197931, "wall": 9115.3} {"step": 27530, "train_loss": 3.1690025329589844, "lr": 4.9020016021197635e-05, "tps": 197840, "wall": 9119.8} {"step": 27531, "train_loss": 3.1506245136260986, "lr": 4.90140284285187e-05, "tps": 197751, "wall": 9124.3} {"step": 27532, "train_loss": 3.312824249267578, "lr": 4.900804277277815e-05, "tps": 197661, "wall": 9128.7} {"step": 27533, "train_loss": 3.1867713928222656, "lr": 4.90020590540437e-05, "tps": 197572, "wall": 9133.2} {"step": 27534, "train_loss": 3.108876943588257, "lr": 4.899607727238318e-05, "tps": 197483, "wall": 9137.6} {"step": 27535, "train_loss": 3.1804585456848145, "lr": 4.8990097427864364e-05, "tps": 197394, "wall": 9142.1} {"step": 27536, "train_loss": 3.2178287506103516, "lr": 4.898411952055498e-05, "tps": 197305, "wall": 9146.5} {"step": 27537, "train_loss": 3.080629348754883, "lr": 4.897814355052272e-05, "tps": 197215, "wall": 9151.1} {"step": 27538, "train_loss": 3.190051555633545, "lr": 4.897216951783532e-05, "tps": 197126, "wall": 9155.5} {"step": 27539, "train_loss": 3.1785688400268555, "lr": 4.896619742256043e-05, "tps": 197037, "wall": 9160.0} {"step": 27540, "train_loss": 3.128243923187256, "lr": 4.8960227264765694e-05, "tps": 196949, "wall": 9164.4} {"step": 27541, "train_loss": 3.178922653198242, "lr": 4.895425904451877e-05, "tps": 196860, "wall": 9168.9} {"step": 27542, "train_loss": 3.109990358352661, "lr": 4.894829276188726e-05, "tps": 196772, "wall": 9173.3} {"step": 27543, "train_loss": 3.1880152225494385, "lr": 4.894232841693872e-05, "tps": 196683, "wall": 9177.8} {"step": 27544, "train_loss": 3.0894227027893066, "lr": 4.893636600974077e-05, "tps": 196594, "wall": 9182.3} {"step": 27545, "train_loss": 3.1870741844177246, "lr": 4.893040554036088e-05, "tps": 196506, "wall": 9186.7} {"step": 27546, "train_loss": 3.1837120056152344, "lr": 4.892444700886666e-05, "tps": 196418, "wall": 9191.2} {"step": 27547, "train_loss": 3.156363010406494, "lr": 4.8918490415325525e-05, "tps": 196330, "wall": 9195.6} {"step": 27548, "train_loss": 3.1703593730926514, "lr": 4.891253575980498e-05, "tps": 196241, "wall": 9200.1} {"step": 27549, "train_loss": 3.2057719230651855, "lr": 4.8906583042372515e-05, "tps": 196153, "wall": 9204.6} {"step": 27550, "train_loss": 3.1295206546783447, "lr": 4.890063226309551e-05, "tps": 196066, "wall": 9209.0} {"step": 27551, "train_loss": 3.276662588119507, "lr": 4.88946834220414e-05, "tps": 195978, "wall": 9213.5} {"step": 27552, "train_loss": 3.160609006881714, "lr": 4.8888736519277584e-05, "tps": 195891, "wall": 9217.9} {"step": 27553, "train_loss": 3.1420090198516846, "lr": 4.8882791554871424e-05, "tps": 195803, "wall": 9222.4} {"step": 27554, "train_loss": 3.215843915939331, "lr": 4.887684852889023e-05, "tps": 195716, "wall": 9226.8} {"step": 27555, "train_loss": 3.191258192062378, "lr": 4.8870907441401384e-05, "tps": 195629, "wall": 9231.3} {"step": 27556, "train_loss": 3.224411725997925, "lr": 4.886496829247216e-05, "tps": 195542, "wall": 9235.7} {"step": 27557, "train_loss": 3.0571892261505127, "lr": 4.8859031082169805e-05, "tps": 195454, "wall": 9240.2} {"step": 27558, "train_loss": 3.1620492935180664, "lr": 4.8853095810561614e-05, "tps": 195367, "wall": 9244.7} {"step": 27559, "train_loss": 3.2641918659210205, "lr": 4.884716247771483e-05, "tps": 195280, "wall": 9249.1} {"step": 27560, "train_loss": 3.1528491973876953, "lr": 4.884123108369663e-05, "tps": 195194, "wall": 9253.5} {"step": 27561, "train_loss": 3.279994249343872, "lr": 4.8835301628574225e-05, "tps": 195107, "wall": 9258.0} {"step": 27562, "train_loss": 3.094843864440918, "lr": 4.8829374112414776e-05, "tps": 195020, "wall": 9262.4} {"step": 27563, "train_loss": 3.2004435062408447, "lr": 4.882344853528544e-05, "tps": 194934, "wall": 9266.9} {"step": 27564, "train_loss": 3.1974120140075684, "lr": 4.881752489725337e-05, "tps": 194847, "wall": 9271.4} {"step": 27565, "train_loss": 3.0996387004852295, "lr": 4.881160319838559e-05, "tps": 194760, "wall": 9275.8} {"step": 27566, "train_loss": 3.254051685333252, "lr": 4.880568343874929e-05, "tps": 194674, "wall": 9280.3} {"step": 27567, "train_loss": 3.2077155113220215, "lr": 4.879976561841143e-05, "tps": 194588, "wall": 9284.7} {"step": 27568, "train_loss": 3.239107608795166, "lr": 4.879384973743911e-05, "tps": 194501, "wall": 9289.2} {"step": 27569, "train_loss": 3.133798360824585, "lr": 4.8787935795899306e-05, "tps": 194416, "wall": 9293.6} {"step": 27570, "train_loss": 3.2617712020874023, "lr": 4.878202379385901e-05, "tps": 194329, "wall": 9298.1} {"step": 27571, "train_loss": 3.2514429092407227, "lr": 4.877611373138523e-05, "tps": 194242, "wall": 9302.6} {"step": 27572, "train_loss": 3.179887294769287, "lr": 4.8770205608544895e-05, "tps": 194156, "wall": 9307.0} {"step": 27573, "train_loss": 3.1909711360931396, "lr": 4.876429942540491e-05, "tps": 194071, "wall": 9311.5} {"step": 27574, "train_loss": 3.2289633750915527, "lr": 4.875839518203225e-05, "tps": 193985, "wall": 9315.9} {"step": 27575, "train_loss": 3.1399240493774414, "lr": 4.8752492878493746e-05, "tps": 193899, "wall": 9320.4} {"step": 27576, "train_loss": 3.16683030128479, "lr": 4.874659251485623e-05, "tps": 193814, "wall": 9324.8} {"step": 27577, "train_loss": 3.1334469318389893, "lr": 4.874069409118661e-05, "tps": 193728, "wall": 9329.3} {"step": 27578, "train_loss": 3.3350882530212402, "lr": 4.873479760755167e-05, "tps": 193643, "wall": 9333.8} {"step": 27579, "train_loss": 3.1312179565429688, "lr": 4.8728903064018196e-05, "tps": 193557, "wall": 9338.2} {"step": 27580, "train_loss": 3.1321980953216553, "lr": 4.872301046065298e-05, "tps": 193472, "wall": 9342.7} {"step": 27581, "train_loss": 3.2075271606445312, "lr": 4.871711979752278e-05, "tps": 193387, "wall": 9347.1} {"step": 27582, "train_loss": 3.1320409774780273, "lr": 4.871123107469427e-05, "tps": 193302, "wall": 9351.6} {"step": 27583, "train_loss": 3.0952084064483643, "lr": 4.870534429223424e-05, "tps": 193217, "wall": 9356.0} {"step": 27584, "train_loss": 3.2306151390075684, "lr": 4.869945945020934e-05, "tps": 193131, "wall": 9360.5} {"step": 27585, "train_loss": 3.1618974208831787, "lr": 4.869357654868622e-05, "tps": 193046, "wall": 9365.0} {"step": 27586, "train_loss": 3.167550563812256, "lr": 4.8687695587731535e-05, "tps": 192961, "wall": 9369.4} {"step": 27587, "train_loss": 3.0672659873962402, "lr": 4.868181656741187e-05, "tps": 192877, "wall": 9373.9} {"step": 27588, "train_loss": 3.2381489276885986, "lr": 4.86759394877939e-05, "tps": 192792, "wall": 9378.3} {"step": 27589, "train_loss": 3.2880074977874756, "lr": 4.867006434894414e-05, "tps": 192708, "wall": 9382.8} {"step": 27590, "train_loss": 3.1589317321777344, "lr": 4.866419115092913e-05, "tps": 192623, "wall": 9387.2} {"step": 27591, "train_loss": 3.1483850479125977, "lr": 4.8658319893815485e-05, "tps": 192538, "wall": 9391.7} {"step": 27592, "train_loss": 3.2770915031433105, "lr": 4.8652450577669645e-05, "tps": 192454, "wall": 9396.2} {"step": 27593, "train_loss": 3.1609840393066406, "lr": 4.864658320255808e-05, "tps": 192370, "wall": 9400.6} {"step": 27594, "train_loss": 3.1997339725494385, "lr": 4.8640717768547325e-05, "tps": 192286, "wall": 9405.1} {"step": 27595, "train_loss": 3.2200498580932617, "lr": 4.863485427570379e-05, "tps": 192202, "wall": 9409.5} {"step": 27596, "train_loss": 3.2080078125, "lr": 4.8628992724093883e-05, "tps": 192118, "wall": 9414.0} {"step": 27597, "train_loss": 3.1608290672302246, "lr": 4.862313311378404e-05, "tps": 192033, "wall": 9418.5} {"step": 27598, "train_loss": 3.208470582962036, "lr": 4.86172754448406e-05, "tps": 191949, "wall": 9422.9} {"step": 27599, "train_loss": 3.1162877082824707, "lr": 4.8611419717329915e-05, "tps": 191865, "wall": 9427.4} {"step": 27600, "train_loss": 3.170927047729492, "lr": 4.860556593131837e-05, "tps": 191782, "wall": 9431.8} {"step": 27601, "train_loss": 3.1790406703948975, "lr": 4.859971408687224e-05, "tps": 191698, "wall": 9436.3} {"step": 27602, "train_loss": 3.2201547622680664, "lr": 4.85938641840578e-05, "tps": 191615, "wall": 9440.7} {"step": 27603, "train_loss": 3.193171501159668, "lr": 4.858801622294136e-05, "tps": 191531, "wall": 9445.2} {"step": 27604, "train_loss": 3.148916244506836, "lr": 4.8582170203589134e-05, "tps": 191448, "wall": 9449.6} {"step": 27605, "train_loss": 3.209969997406006, "lr": 4.8576326126067365e-05, "tps": 191365, "wall": 9454.1} {"step": 27606, "train_loss": 3.156285285949707, "lr": 4.857048399044226e-05, "tps": 191282, "wall": 9458.6} {"step": 27607, "train_loss": 3.069078207015991, "lr": 4.856464379677996e-05, "tps": 191198, "wall": 9463.0} {"step": 27608, "train_loss": 3.0948069095611572, "lr": 4.8558805545146665e-05, "tps": 191115, "wall": 9467.5} {"step": 27609, "train_loss": 3.210817813873291, "lr": 4.8552969235608505e-05, "tps": 191032, "wall": 9471.9} {"step": 27610, "train_loss": 3.216780662536621, "lr": 4.854713486823157e-05, "tps": 190950, "wall": 9476.4} {"step": 27611, "train_loss": 3.114562511444092, "lr": 4.854130244308196e-05, "tps": 190866, "wall": 9480.9} {"step": 27612, "train_loss": 3.173203468322754, "lr": 4.8535471960225786e-05, "tps": 190783, "wall": 9485.3} {"step": 27613, "train_loss": 3.203493118286133, "lr": 4.852964341972902e-05, "tps": 190700, "wall": 9489.8} {"step": 27614, "train_loss": 3.1414694786071777, "lr": 4.852381682165776e-05, "tps": 190618, "wall": 9494.2} {"step": 27615, "train_loss": 3.245666980743408, "lr": 4.8517992166077964e-05, "tps": 190535, "wall": 9498.7} {"step": 27616, "train_loss": 3.080690860748291, "lr": 4.8512169453055624e-05, "tps": 190453, "wall": 9503.2} {"step": 27617, "train_loss": 3.172482490539551, "lr": 4.850634868265672e-05, "tps": 190370, "wall": 9507.6} {"step": 27618, "train_loss": 3.3065743446350098, "lr": 4.8500529854947176e-05, "tps": 190288, "wall": 9512.1} {"step": 27619, "train_loss": 3.1151907444000244, "lr": 4.849471296999288e-05, "tps": 190206, "wall": 9516.5} {"step": 27620, "train_loss": 3.2456586360931396, "lr": 4.848889802785979e-05, "tps": 190123, "wall": 9521.0} {"step": 27621, "train_loss": 3.179025173187256, "lr": 4.848308502861371e-05, "tps": 190041, "wall": 9525.5} {"step": 27622, "train_loss": 3.069777488708496, "lr": 4.8477273972320555e-05, "tps": 189960, "wall": 9529.9} {"step": 27623, "train_loss": 3.1749608516693115, "lr": 4.8471464859046104e-05, "tps": 189878, "wall": 9534.3} {"step": 27624, "train_loss": 3.16984224319458, "lr": 4.846565768885616e-05, "tps": 189795, "wall": 9538.9} {"step": 27625, "train_loss": 3.185533046722412, "lr": 4.845985246181656e-05, "tps": 189713, "wall": 9543.3} {"step": 27626, "train_loss": 3.185214042663574, "lr": 4.845404917799301e-05, "tps": 189632, "wall": 9547.8} {"step": 27627, "train_loss": 3.1744539737701416, "lr": 4.844824783745128e-05, "tps": 189550, "wall": 9552.2} {"step": 27628, "train_loss": 3.1691036224365234, "lr": 4.8442448440257084e-05, "tps": 189468, "wall": 9556.7} {"step": 27629, "train_loss": 3.146091938018799, "lr": 4.84366509864761e-05, "tps": 189387, "wall": 9561.1} {"step": 27630, "train_loss": 3.2172350883483887, "lr": 4.843085547617401e-05, "tps": 189306, "wall": 9565.6} {"step": 27631, "train_loss": 3.245476722717285, "lr": 4.8425061909416495e-05, "tps": 189225, "wall": 9570.0} {"step": 27632, "train_loss": 3.1753344535827637, "lr": 4.841927028626915e-05, "tps": 189143, "wall": 9574.5} {"step": 27633, "train_loss": 3.0859556198120117, "lr": 4.841348060679758e-05, "tps": 189062, "wall": 9579.0} {"step": 27634, "train_loss": 3.1312925815582275, "lr": 4.8407692871067404e-05, "tps": 188981, "wall": 9583.4} {"step": 27635, "train_loss": 3.2057716846466064, "lr": 4.840190707914416e-05, "tps": 188900, "wall": 9587.9} {"step": 27636, "train_loss": 3.180257797241211, "lr": 4.839612323109338e-05, "tps": 188819, "wall": 9592.3} {"step": 27637, "train_loss": 3.2832016944885254, "lr": 4.839034132698061e-05, "tps": 188738, "wall": 9596.8} {"step": 27638, "train_loss": 3.261110305786133, "lr": 4.838456136687136e-05, "tps": 188657, "wall": 9601.3} {"step": 27639, "train_loss": 3.180574655532837, "lr": 4.837878335083104e-05, "tps": 188576, "wall": 9605.7} {"step": 27640, "train_loss": 3.1425654888153076, "lr": 4.837300727892518e-05, "tps": 188495, "wall": 9610.2} {"step": 27641, "train_loss": 3.116055965423584, "lr": 4.8367233151219156e-05, "tps": 188415, "wall": 9614.7} {"step": 27642, "train_loss": 3.1813340187072754, "lr": 4.836146096777841e-05, "tps": 188334, "wall": 9619.1} {"step": 27643, "train_loss": 3.1117053031921387, "lr": 4.835569072866835e-05, "tps": 188254, "wall": 9623.6} {"step": 27644, "train_loss": 3.232423782348633, "lr": 4.834992243395427e-05, "tps": 188174, "wall": 9628.0} {"step": 27645, "train_loss": 3.149611473083496, "lr": 4.834415608370155e-05, "tps": 188093, "wall": 9632.5} {"step": 27646, "train_loss": 3.2187843322753906, "lr": 4.8338391677975566e-05, "tps": 188013, "wall": 9636.9} {"step": 27647, "train_loss": 3.354459524154663, "lr": 4.83326292168415e-05, "tps": 187933, "wall": 9641.4} {"step": 27648, "train_loss": 3.222660541534424, "lr": 4.832686870036476e-05, "tps": 187853, "wall": 9645.8} {"step": 27649, "train_loss": 3.145616292953491, "lr": 4.8321110128610516e-05, "tps": 187774, "wall": 9650.3} {"step": 27650, "train_loss": 3.138896942138672, "lr": 4.8315353501644e-05, "tps": 187694, "wall": 9654.7} {"step": 27651, "train_loss": 3.092535972595215, "lr": 4.830959881953048e-05, "tps": 187613, "wall": 9659.3} {"step": 27652, "train_loss": 3.2479021549224854, "lr": 4.8303846082335115e-05, "tps": 187533, "wall": 9663.7} {"step": 27653, "train_loss": 3.187497615814209, "lr": 4.8298095290123025e-05, "tps": 187453, "wall": 9668.2} {"step": 27654, "train_loss": 3.241105079650879, "lr": 4.8292346442959455e-05, "tps": 187374, "wall": 9672.6} {"step": 27655, "train_loss": 3.1629014015197754, "lr": 4.828659954090945e-05, "tps": 187294, "wall": 9677.1} {"step": 27656, "train_loss": 3.2068262100219727, "lr": 4.828085458403813e-05, "tps": 187215, "wall": 9681.5} {"step": 27657, "train_loss": 3.1937525272369385, "lr": 4.827511157241059e-05, "tps": 187136, "wall": 9686.0} {"step": 27658, "train_loss": 3.102825164794922, "lr": 4.8269370506091846e-05, "tps": 187056, "wall": 9690.4} {"step": 27659, "train_loss": 3.2332286834716797, "lr": 4.826363138514699e-05, "tps": 186977, "wall": 9694.9} {"step": 27660, "train_loss": 3.167266607284546, "lr": 4.8257894209641015e-05, "tps": 186898, "wall": 9699.3} {"step": 27661, "train_loss": 3.2690577507019043, "lr": 4.8252158979638886e-05, "tps": 186819, "wall": 9703.8} {"step": 27662, "train_loss": 3.1677699089050293, "lr": 4.824642569520561e-05, "tps": 186740, "wall": 9708.2} {"step": 27663, "train_loss": 3.1849565505981445, "lr": 4.8240694356406125e-05, "tps": 186661, "wall": 9712.7} {"step": 27664, "train_loss": 3.1776235103607178, "lr": 4.823496496330531e-05, "tps": 186582, "wall": 9717.1} {"step": 27665, "train_loss": 3.190936326980591, "lr": 4.822923751596813e-05, "tps": 186503, "wall": 9721.6} {"step": 27666, "train_loss": 3.1970927715301514, "lr": 4.8223512014459424e-05, "tps": 186424, "wall": 9726.1} {"step": 27667, "train_loss": 3.1116743087768555, "lr": 4.821778845884407e-05, "tps": 186345, "wall": 9730.6} {"step": 27668, "train_loss": 3.1539220809936523, "lr": 4.821206684918691e-05, "tps": 186267, "wall": 9735.0} {"step": 27669, "train_loss": 3.1339454650878906, "lr": 4.820634718555275e-05, "tps": 186188, "wall": 9739.5} {"step": 27670, "train_loss": 3.0940709114074707, "lr": 4.8200629468006384e-05, "tps": 186110, "wall": 9743.9} {"step": 27671, "train_loss": 3.2343759536743164, "lr": 4.819491369661258e-05, "tps": 186032, "wall": 9748.4} {"step": 27672, "train_loss": 3.196293354034424, "lr": 4.8189199871436095e-05, "tps": 185954, "wall": 9752.8} {"step": 27673, "train_loss": 3.1324148178100586, "lr": 4.818348799254163e-05, "tps": 185875, "wall": 9757.3} {"step": 27674, "train_loss": 3.233825445175171, "lr": 4.8177778059993925e-05, "tps": 185797, "wall": 9761.7} {"step": 27675, "train_loss": 3.1062254905700684, "lr": 4.8172070073857624e-05, "tps": 185719, "wall": 9766.2} {"step": 27676, "train_loss": 3.2117090225219727, "lr": 4.816636403419743e-05, "tps": 185641, "wall": 9770.6} {"step": 27677, "train_loss": 3.2192068099975586, "lr": 4.8160659941077954e-05, "tps": 185563, "wall": 9775.1} {"step": 27678, "train_loss": 3.1429996490478516, "lr": 4.81549577945638e-05, "tps": 185485, "wall": 9779.6} {"step": 27679, "train_loss": 3.2184674739837646, "lr": 4.814925759471961e-05, "tps": 185406, "wall": 9784.1} {"step": 27680, "train_loss": 3.1743338108062744, "lr": 4.8143559341609925e-05, "tps": 185329, "wall": 9788.5} {"step": 27681, "train_loss": 3.0809338092803955, "lr": 4.813786303529928e-05, "tps": 185251, "wall": 9793.0} {"step": 27682, "train_loss": 3.172213554382324, "lr": 4.813216867585223e-05, "tps": 185173, "wall": 9797.5} {"step": 27683, "train_loss": 3.10329008102417, "lr": 4.8126476263333296e-05, "tps": 185096, "wall": 9801.9} {"step": 27684, "train_loss": 3.224644184112549, "lr": 4.812078579780689e-05, "tps": 185018, "wall": 9806.4} {"step": 27685, "train_loss": 3.243359088897705, "lr": 4.8115097279337535e-05, "tps": 184941, "wall": 9810.8} {"step": 27686, "train_loss": 3.208131790161133, "lr": 4.810941070798969e-05, "tps": 184864, "wall": 9815.3} {"step": 27687, "train_loss": 3.0830230712890625, "lr": 4.8103726083827696e-05, "tps": 184786, "wall": 9819.7} {"step": 27688, "train_loss": 3.184765338897705, "lr": 4.8098043406916e-05, "tps": 184709, "wall": 9824.2} {"step": 27689, "train_loss": 3.236400604248047, "lr": 4.8092362677318997e-05, "tps": 184632, "wall": 9828.6} {"step": 27690, "train_loss": 3.1921238899230957, "lr": 4.808668389510097e-05, "tps": 184556, "wall": 9833.1} {"step": 27691, "train_loss": 3.1650843620300293, "lr": 4.808100706032631e-05, "tps": 184479, "wall": 9837.5} {"step": 27692, "train_loss": 3.20751953125, "lr": 4.8075332173059305e-05, "tps": 184401, "wall": 9842.0} {"step": 27693, "train_loss": 3.2126760482788086, "lr": 4.806965923336423e-05, "tps": 184324, "wall": 9846.5} {"step": 27694, "train_loss": 3.207902431488037, "lr": 4.8063988241305355e-05, "tps": 184247, "wall": 9851.0} {"step": 27695, "train_loss": 3.1424503326416016, "lr": 4.805831919694693e-05, "tps": 184171, "wall": 9855.4} {"step": 27696, "train_loss": 3.1642651557922363, "lr": 4.8052652100353174e-05, "tps": 184094, "wall": 9859.9} {"step": 27697, "train_loss": 3.2296152114868164, "lr": 4.804698695158827e-05, "tps": 184017, "wall": 9864.3} {"step": 27698, "train_loss": 3.1240034103393555, "lr": 4.8041323750716383e-05, "tps": 183941, "wall": 9868.8} {"step": 27699, "train_loss": 3.2530388832092285, "lr": 4.8035662497801705e-05, "tps": 183864, "wall": 9873.3} {"step": 27700, "train_loss": 3.103868246078491, "lr": 4.803000319290835e-05, "tps": 183788, "wall": 9877.7} {"step": 27701, "train_loss": 3.154376983642578, "lr": 4.802434583610039e-05, "tps": 183712, "wall": 9882.2} {"step": 27702, "train_loss": 3.239886999130249, "lr": 4.801869042744197e-05, "tps": 183636, "wall": 9886.6} {"step": 27703, "train_loss": 3.2008845806121826, "lr": 4.801303696699714e-05, "tps": 183560, "wall": 9891.1} {"step": 27704, "train_loss": 3.1840527057647705, "lr": 4.8007385454829895e-05, "tps": 183484, "wall": 9895.5} {"step": 27705, "train_loss": 3.20592999458313, "lr": 4.800173589100433e-05, "tps": 183407, "wall": 9900.0} {"step": 27706, "train_loss": 3.1772637367248535, "lr": 4.799608827558439e-05, "tps": 183331, "wall": 9904.5} {"step": 27707, "train_loss": 3.1428887844085693, "lr": 4.7990442608634056e-05, "tps": 183256, "wall": 9908.9} {"step": 27708, "train_loss": 3.139435291290283, "lr": 4.7984798890217306e-05, "tps": 183180, "wall": 9913.4} {"step": 27709, "train_loss": 3.1721842288970947, "lr": 4.7979157120398075e-05, "tps": 183104, "wall": 9917.9} {"step": 27710, "train_loss": 3.153477907180786, "lr": 4.7973517299240224e-05, "tps": 183028, "wall": 9922.3} {"step": 27711, "train_loss": 3.146247625350952, "lr": 4.796787942680769e-05, "tps": 182952, "wall": 9926.8} {"step": 27712, "train_loss": 3.189838409423828, "lr": 4.7962243503164314e-05, "tps": 182877, "wall": 9931.2} {"step": 27713, "train_loss": 3.242309093475342, "lr": 4.795660952837398e-05, "tps": 182802, "wall": 9935.7} {"step": 27714, "train_loss": 3.111760139465332, "lr": 4.795097750250047e-05, "tps": 182726, "wall": 9940.1} {"step": 27715, "train_loss": 3.158947229385376, "lr": 4.794534742560758e-05, "tps": 182651, "wall": 9944.6} {"step": 27716, "train_loss": 3.2104384899139404, "lr": 4.7939719297759135e-05, "tps": 182576, "wall": 9949.1} {"step": 27717, "train_loss": 3.1431524753570557, "lr": 4.793409311901884e-05, "tps": 182501, "wall": 9953.5} {"step": 27718, "train_loss": 3.1903493404388428, "lr": 4.792846888945041e-05, "tps": 182426, "wall": 9958.0} {"step": 27719, "train_loss": 3.09847354888916, "lr": 4.7922846609117636e-05, "tps": 182350, "wall": 9962.5} {"step": 27720, "train_loss": 3.1433892250061035, "lr": 4.791722627808416e-05, "tps": 182275, "wall": 9966.9} {"step": 27721, "train_loss": 3.2612617015838623, "lr": 4.791160789641364e-05, "tps": 182200, "wall": 9971.4} {"step": 27722, "train_loss": 3.1073646545410156, "lr": 4.790599146416976e-05, "tps": 182125, "wall": 9975.8} {"step": 27723, "train_loss": 3.021880626678467, "lr": 4.790037698141611e-05, "tps": 182050, "wall": 9980.3} {"step": 27724, "train_loss": 3.1107754707336426, "lr": 4.789476444821627e-05, "tps": 181976, "wall": 9984.7} {"step": 27725, "train_loss": 3.1715354919433594, "lr": 4.7889153864633886e-05, "tps": 181901, "wall": 9989.2} {"step": 27726, "train_loss": 3.2159438133239746, "lr": 4.788354523073247e-05, "tps": 181827, "wall": 9993.6} {"step": 27727, "train_loss": 3.0918807983398438, "lr": 4.787793854657554e-05, "tps": 181752, "wall": 9998.1} {"step": 27728, "train_loss": 3.318187713623047, "lr": 4.787233381222666e-05, "tps": 181678, "wall": 10002.5} {"step": 27729, "train_loss": 3.150237560272217, "lr": 4.786673102774929e-05, "tps": 181604, "wall": 10007.0} {"step": 27730, "train_loss": 3.120877742767334, "lr": 4.7861130193206884e-05, "tps": 181529, "wall": 10011.5} {"step": 27731, "train_loss": 3.1216037273406982, "lr": 4.7855531308662934e-05, "tps": 181455, "wall": 10015.9} {"step": 27732, "train_loss": 3.0351548194885254, "lr": 4.784993437418081e-05, "tps": 181380, "wall": 10020.4} {"step": 27733, "train_loss": 3.035552978515625, "lr": 4.7844339389823975e-05, "tps": 181306, "wall": 10024.9} {"step": 27734, "train_loss": 3.236205816268921, "lr": 4.78387463556558e-05, "tps": 181232, "wall": 10029.3} {"step": 27735, "train_loss": 3.2260022163391113, "lr": 4.783315527173955e-05, "tps": 181158, "wall": 10033.8} {"step": 27736, "train_loss": 3.145249366760254, "lr": 4.782756613813867e-05, "tps": 181084, "wall": 10038.2} {"step": 27737, "train_loss": 3.242650270462036, "lr": 4.7821978954916414e-05, "tps": 181010, "wall": 10042.7} {"step": 27738, "train_loss": 3.2244744300842285, "lr": 4.781639372213612e-05, "tps": 180937, "wall": 10047.2} {"step": 27739, "train_loss": 3.2510969638824463, "lr": 4.781081043986103e-05, "tps": 180863, "wall": 10051.6} {"step": 27740, "train_loss": 3.2360544204711914, "lr": 4.7805229108154385e-05, "tps": 180789, "wall": 10056.1} {"step": 27741, "train_loss": 3.168663501739502, "lr": 4.779964972707942e-05, "tps": 180716, "wall": 10060.5} {"step": 27742, "train_loss": 3.18624210357666, "lr": 4.779407229669935e-05, "tps": 180642, "wall": 10065.0} {"step": 27743, "train_loss": 3.225865364074707, "lr": 4.778849681707732e-05, "tps": 180569, "wall": 10069.4} {"step": 27744, "train_loss": 3.205066680908203, "lr": 4.778292328827654e-05, "tps": 180496, "wall": 10073.9} {"step": 27745, "train_loss": 3.1111092567443848, "lr": 4.777735171036013e-05, "tps": 180422, "wall": 10078.4} {"step": 27746, "train_loss": 3.1533122062683105, "lr": 4.7771782083391166e-05, "tps": 180349, "wall": 10082.8} {"step": 27747, "train_loss": 3.2359864711761475, "lr": 4.776621440743279e-05, "tps": 180275, "wall": 10087.3} {"step": 27748, "train_loss": 3.156360387802124, "lr": 4.776064868254806e-05, "tps": 180202, "wall": 10091.7} {"step": 27749, "train_loss": 3.20396089553833, "lr": 4.775508490879998e-05, "tps": 180129, "wall": 10096.2} {"step": 27750, "train_loss": 3.1514410972595215, "lr": 4.774952308625166e-05, "tps": 180056, "wall": 10100.7} {"step": 27751, "train_loss": 3.2081265449523926, "lr": 4.774396321496606e-05, "tps": 179983, "wall": 10105.1} {"step": 27752, "train_loss": 3.0244569778442383, "lr": 4.7738405295006136e-05, "tps": 179910, "wall": 10109.6} {"step": 27753, "train_loss": 3.1263654232025146, "lr": 4.77328493264349e-05, "tps": 179837, "wall": 10114.0} {"step": 27754, "train_loss": 3.2393126487731934, "lr": 4.772729530931524e-05, "tps": 179765, "wall": 10118.5} {"step": 27755, "train_loss": 3.2431893348693848, "lr": 4.772174324371013e-05, "tps": 179692, "wall": 10122.9} {"step": 27756, "train_loss": 3.22463059425354, "lr": 4.771619312968242e-05, "tps": 179619, "wall": 10127.4} {"step": 27757, "train_loss": 3.075143575668335, "lr": 4.771064496729499e-05, "tps": 179547, "wall": 10131.9} {"step": 27758, "train_loss": 3.2304928302764893, "lr": 4.770509875661069e-05, "tps": 179474, "wall": 10136.3} {"step": 27759, "train_loss": 3.1905860900878906, "lr": 4.769955449769238e-05, "tps": 179401, "wall": 10140.8} {"step": 27760, "train_loss": 3.0454955101013184, "lr": 4.76940121906028e-05, "tps": 179329, "wall": 10145.3} {"step": 27761, "train_loss": 3.1428375244140625, "lr": 4.7688471835404794e-05, "tps": 179256, "wall": 10149.7} {"step": 27762, "train_loss": 3.1943931579589844, "lr": 4.7682933432161096e-05, "tps": 179184, "wall": 10154.2} {"step": 27763, "train_loss": 3.1864328384399414, "lr": 4.7677396980934444e-05, "tps": 179111, "wall": 10158.7} {"step": 27764, "train_loss": 3.2910730838775635, "lr": 4.7671862481787586e-05, "tps": 179040, "wall": 10163.1} {"step": 27765, "train_loss": 3.1898388862609863, "lr": 4.766632993478318e-05, "tps": 178968, "wall": 10167.6} {"step": 27766, "train_loss": 3.1222915649414062, "lr": 4.7660799339983894e-05, "tps": 178896, "wall": 10172.0} {"step": 27767, "train_loss": 3.1877200603485107, "lr": 4.7655270697452406e-05, "tps": 178824, "wall": 10176.5} {"step": 27768, "train_loss": 3.230515956878662, "lr": 4.764974400725134e-05, "tps": 178752, "wall": 10180.9} {"step": 27769, "train_loss": 3.1591737270355225, "lr": 4.764421926944329e-05, "tps": 178680, "wall": 10185.4} {"step": 27770, "train_loss": 3.2714309692382812, "lr": 4.763869648409086e-05, "tps": 178609, "wall": 10189.9} {"step": 27771, "train_loss": 3.2399744987487793, "lr": 4.763317565125661e-05, "tps": 178537, "wall": 10194.3} {"step": 27772, "train_loss": 3.1179375648498535, "lr": 4.762765677100303e-05, "tps": 178464, "wall": 10198.8} {"step": 27773, "train_loss": 3.1828460693359375, "lr": 4.7622139843392724e-05, "tps": 178394, "wall": 10203.2} {"step": 27774, "train_loss": 3.1980576515197754, "lr": 4.7616624868488115e-05, "tps": 178322, "wall": 10207.7} {"step": 27775, "train_loss": 3.1046462059020996, "lr": 4.761111184635171e-05, "tps": 178251, "wall": 10212.2} {"step": 27776, "train_loss": 3.107426404953003, "lr": 4.760560077704598e-05, "tps": 178179, "wall": 10216.6} {"step": 27777, "train_loss": 3.204926013946533, "lr": 4.760009166063329e-05, "tps": 178108, "wall": 10221.0} {"step": 27778, "train_loss": 3.092419147491455, "lr": 4.7594584497176115e-05, "tps": 178037, "wall": 10225.5} {"step": 27779, "train_loss": 3.2465505599975586, "lr": 4.758907928673682e-05, "tps": 177966, "wall": 10230.0} {"step": 27780, "train_loss": 3.1641573905944824, "lr": 4.758357602937774e-05, "tps": 177895, "wall": 10234.4} {"step": 27781, "train_loss": 3.1150898933410645, "lr": 4.757807472516125e-05, "tps": 177824, "wall": 10238.8} {"step": 27782, "train_loss": 3.1792550086975098, "lr": 4.7572575374149676e-05, "tps": 177753, "wall": 10243.3} {"step": 27783, "train_loss": 3.16408634185791, "lr": 4.756707797640525e-05, "tps": 177682, "wall": 10247.8} {"step": 27784, "train_loss": 3.1354823112487793, "lr": 4.7561582531990345e-05, "tps": 177611, "wall": 10252.2} {"step": 27785, "train_loss": 3.2439355850219727, "lr": 4.755608904096714e-05, "tps": 177541, "wall": 10256.7} {"step": 27786, "train_loss": 3.1984004974365234, "lr": 4.7550597503397864e-05, "tps": 177469, "wall": 10261.2} {"step": 27787, "train_loss": 3.118774652481079, "lr": 4.754510791934477e-05, "tps": 177399, "wall": 10265.6} {"step": 27788, "train_loss": 3.2156622409820557, "lr": 4.753962028887004e-05, "tps": 177328, "wall": 10270.1} {"step": 27789, "train_loss": 3.092722177505493, "lr": 4.753413461203578e-05, "tps": 177258, "wall": 10274.5} {"step": 27790, "train_loss": 3.0668139457702637, "lr": 4.752865088890421e-05, "tps": 177187, "wall": 10279.0} {"step": 27791, "train_loss": 3.115298271179199, "lr": 4.7523169119537384e-05, "tps": 177117, "wall": 10283.4} {"step": 27792, "train_loss": 3.2165889739990234, "lr": 4.7517689303997445e-05, "tps": 177046, "wall": 10287.9} {"step": 27793, "train_loss": 3.1519670486450195, "lr": 4.751221144234647e-05, "tps": 176976, "wall": 10292.4} {"step": 27794, "train_loss": 3.1786558628082275, "lr": 4.750673553464647e-05, "tps": 176905, "wall": 10296.9} {"step": 27795, "train_loss": 3.2067904472351074, "lr": 4.7501261580959514e-05, "tps": 176835, "wall": 10301.3} {"step": 27796, "train_loss": 3.1764180660247803, "lr": 4.749578958134761e-05, "tps": 176765, "wall": 10305.8} {"step": 27797, "train_loss": 3.211754322052002, "lr": 4.74903195358727e-05, "tps": 176695, "wall": 10310.2} {"step": 27798, "train_loss": 3.200221538543701, "lr": 4.74848514445968e-05, "tps": 176625, "wall": 10314.7} {"step": 27799, "train_loss": 3.219059467315674, "lr": 4.747938530758186e-05, "tps": 176554, "wall": 10319.2} {"step": 27800, "train_loss": 3.209078311920166, "lr": 4.7473921124889726e-05, "tps": 176484, "wall": 10323.7} {"step": 27801, "train_loss": 3.157571315765381, "lr": 4.746845889658238e-05, "tps": 176414, "wall": 10328.1} {"step": 27802, "train_loss": 3.083073139190674, "lr": 4.746299862272168e-05, "tps": 176344, "wall": 10332.6} {"step": 27803, "train_loss": 3.153054714202881, "lr": 4.745754030336942e-05, "tps": 176275, "wall": 10337.0} {"step": 27804, "train_loss": 3.116246223449707, "lr": 4.745208393858752e-05, "tps": 176205, "wall": 10341.5} {"step": 27805, "train_loss": 3.228912353515625, "lr": 4.744662952843774e-05, "tps": 176136, "wall": 10345.9} {"step": 27806, "train_loss": 3.1708412170410156, "lr": 4.744117707298185e-05, "tps": 176066, "wall": 10350.4} {"step": 27807, "train_loss": 3.18475604057312, "lr": 4.743572657228167e-05, "tps": 175997, "wall": 10354.8} {"step": 27808, "train_loss": 3.15516996383667, "lr": 4.7430278026398885e-05, "tps": 175928, "wall": 10359.3} {"step": 27809, "train_loss": 3.264216423034668, "lr": 4.7424831435395276e-05, "tps": 175859, "wall": 10363.7} {"step": 27810, "train_loss": 3.1215147972106934, "lr": 4.741938679933251e-05, "tps": 175789, "wall": 10368.2} {"step": 27811, "train_loss": 3.155968189239502, "lr": 4.7413944118272244e-05, "tps": 175720, "wall": 10372.6} {"step": 27812, "train_loss": 3.1334965229034424, "lr": 4.740850339227618e-05, "tps": 175651, "wall": 10377.1} {"step": 27813, "train_loss": 3.1770834922790527, "lr": 4.740306462140593e-05, "tps": 175581, "wall": 10381.6} {"step": 27814, "train_loss": 3.181617259979248, "lr": 4.739762780572307e-05, "tps": 175512, "wall": 10386.1} {"step": 27815, "train_loss": 3.1951563358306885, "lr": 4.739219294528924e-05, "tps": 175443, "wall": 10390.5} {"step": 27816, "train_loss": 3.2491259574890137, "lr": 4.738676004016599e-05, "tps": 175373, "wall": 10395.0} {"step": 27817, "train_loss": 3.1519668102264404, "lr": 4.738132909041484e-05, "tps": 175305, "wall": 10399.5} {"step": 27818, "train_loss": 3.2478787899017334, "lr": 4.737590009609735e-05, "tps": 175236, "wall": 10403.9} {"step": 27819, "train_loss": 3.2306225299835205, "lr": 4.7370473057275015e-05, "tps": 175167, "wall": 10408.4} {"step": 27820, "train_loss": 3.1014692783355713, "lr": 4.736504797400928e-05, "tps": 175098, "wall": 10412.9} {"step": 27821, "train_loss": 3.1329071521759033, "lr": 4.735962484636163e-05, "tps": 175029, "wall": 10417.3} {"step": 27822, "train_loss": 3.2246646881103516, "lr": 4.7354203674393494e-05, "tps": 174961, "wall": 10421.8} {"step": 27823, "train_loss": 3.1549172401428223, "lr": 4.7348784458166246e-05, "tps": 174893, "wall": 10426.2} {"step": 27824, "train_loss": 3.1822056770324707, "lr": 4.734336719774134e-05, "tps": 174825, "wall": 10430.7} {"step": 27825, "train_loss": 3.1690759658813477, "lr": 4.733795189318011e-05, "tps": 174756, "wall": 10435.1} {"step": 27826, "train_loss": 3.22178316116333, "lr": 4.7332538544543874e-05, "tps": 174687, "wall": 10439.6} {"step": 27827, "train_loss": 3.122581958770752, "lr": 4.732712715189402e-05, "tps": 174618, "wall": 10444.1} {"step": 27828, "train_loss": 3.1910181045532227, "lr": 4.732171771529178e-05, "tps": 174551, "wall": 10448.5} {"step": 27829, "train_loss": 3.251359701156616, "lr": 4.731631023479848e-05, "tps": 174483, "wall": 10453.0} {"step": 27830, "train_loss": 3.181004524230957, "lr": 4.7310904710475365e-05, "tps": 174414, "wall": 10457.4} {"step": 27831, "train_loss": 3.1235313415527344, "lr": 4.730550114238365e-05, "tps": 174347, "wall": 10461.9} {"step": 27832, "train_loss": 3.171363353729248, "lr": 4.730009953058458e-05, "tps": 174278, "wall": 10466.3} {"step": 27833, "train_loss": 3.145991563796997, "lr": 4.7294699875139307e-05, "tps": 174211, "wall": 10470.8} {"step": 27834, "train_loss": 3.126376152038574, "lr": 4.7289302176109005e-05, "tps": 174142, "wall": 10475.3} {"step": 27835, "train_loss": 3.099381446838379, "lr": 4.728390643355487e-05, "tps": 174075, "wall": 10479.7} {"step": 27836, "train_loss": 3.1457064151763916, "lr": 4.727851264753798e-05, "tps": 174007, "wall": 10484.2} {"step": 27837, "train_loss": 3.1932733058929443, "lr": 4.72731208181194e-05, "tps": 173939, "wall": 10488.6} {"step": 27838, "train_loss": 3.1680431365966797, "lr": 4.726773094536029e-05, "tps": 173872, "wall": 10493.1} {"step": 27839, "train_loss": 3.2068326473236084, "lr": 4.7262343029321666e-05, "tps": 173804, "wall": 10497.6} {"step": 27840, "train_loss": 3.2426228523254395, "lr": 4.7256957070064554e-05, "tps": 173736, "wall": 10502.0} {"step": 27841, "train_loss": 3.09429931640625, "lr": 4.725157306764998e-05, "tps": 173668, "wall": 10506.5} {"step": 27842, "train_loss": 3.127092123031616, "lr": 4.7246191022138945e-05, "tps": 173601, "wall": 10511.0} {"step": 27843, "train_loss": 3.1676530838012695, "lr": 4.724081093359237e-05, "tps": 173533, "wall": 10515.4} {"step": 27844, "train_loss": 3.228720188140869, "lr": 4.723543280207126e-05, "tps": 173466, "wall": 10519.9} {"step": 27845, "train_loss": 3.247481346130371, "lr": 4.723005662763651e-05, "tps": 173399, "wall": 10524.3} {"step": 27846, "train_loss": 3.1935110092163086, "lr": 4.7224682410349034e-05, "tps": 173332, "wall": 10528.8} {"step": 27847, "train_loss": 3.1038990020751953, "lr": 4.72193101502697e-05, "tps": 173265, "wall": 10533.3} {"step": 27848, "train_loss": 3.2338640689849854, "lr": 4.7213939847459356e-05, "tps": 173198, "wall": 10537.7} {"step": 27849, "train_loss": 3.1704788208007812, "lr": 4.7208571501978844e-05, "tps": 173131, "wall": 10542.2} {"step": 27850, "train_loss": 3.169942617416382, "lr": 4.7203205113889003e-05, "tps": 173064, "wall": 10546.6} {"step": 27851, "train_loss": 3.134072780609131, "lr": 4.719784068325058e-05, "tps": 172997, "wall": 10551.1} {"step": 27852, "train_loss": 3.2047371864318848, "lr": 4.71924782101244e-05, "tps": 172930, "wall": 10555.5} {"step": 27853, "train_loss": 3.109532356262207, "lr": 4.718711769457115e-05, "tps": 172863, "wall": 10560.0} {"step": 27854, "train_loss": 3.185016632080078, "lr": 4.7181759136651565e-05, "tps": 172796, "wall": 10564.5} {"step": 27855, "train_loss": 3.179171085357666, "lr": 4.717640253642641e-05, "tps": 172729, "wall": 10568.9} {"step": 27856, "train_loss": 3.187509775161743, "lr": 4.7171047893956284e-05, "tps": 172663, "wall": 10573.4} {"step": 27857, "train_loss": 3.118136405944824, "lr": 4.716569520930187e-05, "tps": 172596, "wall": 10577.9} {"step": 27858, "train_loss": 3.1852707862854004, "lr": 4.7160344482523835e-05, "tps": 172530, "wall": 10582.3} {"step": 27859, "train_loss": 3.0605573654174805, "lr": 4.715499571368275e-05, "tps": 172463, "wall": 10586.8} {"step": 27860, "train_loss": 3.273268222808838, "lr": 4.7149648902839216e-05, "tps": 172397, "wall": 10591.2} {"step": 27861, "train_loss": 3.085735321044922, "lr": 4.714430405005384e-05, "tps": 172330, "wall": 10595.7} {"step": 27862, "train_loss": 3.1333229541778564, "lr": 4.713896115538711e-05, "tps": 172264, "wall": 10600.2} {"step": 27863, "train_loss": 3.1146724224090576, "lr": 4.7133620218899585e-05, "tps": 172198, "wall": 10604.6} {"step": 27864, "train_loss": 3.207839250564575, "lr": 4.7128281240651786e-05, "tps": 172132, "wall": 10609.1} {"step": 27865, "train_loss": 3.143923759460449, "lr": 4.712294422070415e-05, "tps": 172066, "wall": 10613.5} {"step": 27866, "train_loss": 3.1678531169891357, "lr": 4.7117609159117154e-05, "tps": 172000, "wall": 10617.9} {"step": 27867, "train_loss": 3.2866275310516357, "lr": 4.711227605595123e-05, "tps": 171933, "wall": 10622.4} {"step": 27868, "train_loss": 3.176546573638916, "lr": 4.7106944911266805e-05, "tps": 171868, "wall": 10626.9} {"step": 27869, "train_loss": 3.0974130630493164, "lr": 4.710161572512427e-05, "tps": 171802, "wall": 10631.3} {"step": 27870, "train_loss": 3.09220552444458, "lr": 4.7096288497583974e-05, "tps": 171736, "wall": 10635.8} {"step": 27871, "train_loss": 3.248772144317627, "lr": 4.709096322870627e-05, "tps": 171670, "wall": 10640.3} {"step": 27872, "train_loss": 3.253695487976074, "lr": 4.7085639918551505e-05, "tps": 171605, "wall": 10644.7} {"step": 27873, "train_loss": 3.280672311782837, "lr": 4.708031856717996e-05, "tps": 171539, "wall": 10649.2} {"step": 27874, "train_loss": 3.0965216159820557, "lr": 4.70749991746519e-05, "tps": 171473, "wall": 10653.6} {"step": 27875, "train_loss": 3.23203182220459, "lr": 4.706968174102762e-05, "tps": 171408, "wall": 10658.1} {"step": 27876, "train_loss": 3.0831503868103027, "lr": 4.7064366266367355e-05, "tps": 171342, "wall": 10662.5} {"step": 27877, "train_loss": 3.1931662559509277, "lr": 4.705905275073129e-05, "tps": 171277, "wall": 10667.0} {"step": 27878, "train_loss": 3.2061047554016113, "lr": 4.705374119417964e-05, "tps": 171212, "wall": 10671.4} {"step": 27879, "train_loss": 3.108604907989502, "lr": 4.7048431596772557e-05, "tps": 171147, "wall": 10675.9} {"step": 27880, "train_loss": 3.196995735168457, "lr": 4.704312395857019e-05, "tps": 171081, "wall": 10680.4} {"step": 27881, "train_loss": 3.256227493286133, "lr": 4.7037818279632696e-05, "tps": 171015, "wall": 10684.8} {"step": 27882, "train_loss": 3.2620885372161865, "lr": 4.703251456002012e-05, "tps": 170950, "wall": 10689.3} {"step": 27883, "train_loss": 3.206775188446045, "lr": 4.70272127997926e-05, "tps": 170885, "wall": 10693.7} {"step": 27884, "train_loss": 3.247957706451416, "lr": 4.702191299901017e-05, "tps": 170820, "wall": 10698.2} {"step": 27885, "train_loss": 3.21262788772583, "lr": 4.701661515773286e-05, "tps": 170755, "wall": 10702.6} {"step": 27886, "train_loss": 3.244220733642578, "lr": 4.7011319276020696e-05, "tps": 170690, "wall": 10707.1} {"step": 27887, "train_loss": 3.1238603591918945, "lr": 4.700602535393367e-05, "tps": 170625, "wall": 10711.6} {"step": 27888, "train_loss": 3.165336847305298, "lr": 4.7000733391531726e-05, "tps": 170560, "wall": 10716.0} {"step": 27889, "train_loss": 3.171424388885498, "lr": 4.699544338887486e-05, "tps": 170496, "wall": 10720.5} {"step": 27890, "train_loss": 3.1880457401275635, "lr": 4.699015534602298e-05, "tps": 170430, "wall": 10725.0} {"step": 27891, "train_loss": 3.2477426528930664, "lr": 4.6984869263035944e-05, "tps": 170366, "wall": 10729.4} {"step": 27892, "train_loss": 3.3137640953063965, "lr": 4.69795851399737e-05, "tps": 170301, "wall": 10733.9} {"step": 27893, "train_loss": 3.1754393577575684, "lr": 4.697430297689606e-05, "tps": 170236, "wall": 10738.4} {"step": 27894, "train_loss": 3.0761122703552246, "lr": 4.696902277386287e-05, "tps": 170171, "wall": 10742.8} {"step": 27895, "train_loss": 3.2715353965759277, "lr": 4.696374453093396e-05, "tps": 170106, "wall": 10747.3} {"step": 27896, "train_loss": 3.1105949878692627, "lr": 4.695846824816913e-05, "tps": 170042, "wall": 10751.8} {"step": 27897, "train_loss": 3.183244228363037, "lr": 4.695319392562809e-05, "tps": 169977, "wall": 10756.3} {"step": 27898, "train_loss": 3.148221015930176, "lr": 4.694792156337067e-05, "tps": 169913, "wall": 10760.7} {"step": 27899, "train_loss": 3.0440657138824463, "lr": 4.6942651161456514e-05, "tps": 169849, "wall": 10765.2} {"step": 27900, "train_loss": 3.0943081378936768, "lr": 4.69373827199454e-05, "tps": 169784, "wall": 10769.6} {"step": 27901, "train_loss": 3.269920825958252, "lr": 4.6932116238897e-05, "tps": 169720, "wall": 10774.1} {"step": 27902, "train_loss": 3.198215961456299, "lr": 4.6926851718370905e-05, "tps": 169656, "wall": 10778.5} {"step": 27903, "train_loss": 3.199188709259033, "lr": 4.692158915842685e-05, "tps": 169592, "wall": 10783.0} {"step": 27904, "train_loss": 3.134746789932251, "lr": 4.6916328559124355e-05, "tps": 169528, "wall": 10787.4} {"step": 27905, "train_loss": 3.2926723957061768, "lr": 4.691106992052305e-05, "tps": 169464, "wall": 10791.9} {"step": 27906, "train_loss": 3.130854368209839, "lr": 4.690581324268253e-05, "tps": 169400, "wall": 10796.4} {"step": 27907, "train_loss": 3.2165427207946777, "lr": 4.6900558525662306e-05, "tps": 169336, "wall": 10800.9} {"step": 27908, "train_loss": 3.221986770629883, "lr": 4.6895305769521916e-05, "tps": 169271, "wall": 10805.4} {"step": 27909, "train_loss": 3.218076229095459, "lr": 4.68900549743209e-05, "tps": 169208, "wall": 10809.8} {"step": 27910, "train_loss": 3.1800613403320312, "lr": 4.688480614011866e-05, "tps": 169144, "wall": 10814.3} {"step": 27911, "train_loss": 3.1934196949005127, "lr": 4.6879559266974714e-05, "tps": 169081, "wall": 10818.7} {"step": 27912, "train_loss": 3.0633983612060547, "lr": 4.6874314354948524e-05, "tps": 169017, "wall": 10823.1} {"step": 27913, "train_loss": 3.0428638458251953, "lr": 4.686907140409941e-05, "tps": 168954, "wall": 10827.6} {"step": 27914, "train_loss": 3.1432998180389404, "lr": 4.686383041448685e-05, "tps": 168891, "wall": 10832.0} {"step": 27915, "train_loss": 3.2980422973632812, "lr": 4.68585913861702e-05, "tps": 168827, "wall": 10836.5} {"step": 27916, "train_loss": 3.2198896408081055, "lr": 4.685335431920877e-05, "tps": 168764, "wall": 10841.0} {"step": 27917, "train_loss": 3.18750262260437, "lr": 4.684811921366192e-05, "tps": 168701, "wall": 10845.4} {"step": 27918, "train_loss": 3.2037744522094727, "lr": 4.684288606958897e-05, "tps": 168637, "wall": 10849.9} {"step": 27919, "train_loss": 3.0849833488464355, "lr": 4.683765488704912e-05, "tps": 168574, "wall": 10854.3} {"step": 27920, "train_loss": 3.1144611835479736, "lr": 4.6832425666101706e-05, "tps": 168510, "wall": 10858.8} {"step": 27921, "train_loss": 3.1587376594543457, "lr": 4.682719840680597e-05, "tps": 168448, "wall": 10863.3} {"step": 27922, "train_loss": 3.249800205230713, "lr": 4.682197310922105e-05, "tps": 168385, "wall": 10867.7} {"step": 27923, "train_loss": 3.3407483100891113, "lr": 4.681674977340622e-05, "tps": 168321, "wall": 10872.2} {"step": 27924, "train_loss": 3.223409414291382, "lr": 4.68115283994206e-05, "tps": 168258, "wall": 10876.7} {"step": 27925, "train_loss": 3.166351079940796, "lr": 4.680630898732338e-05, "tps": 168195, "wall": 10881.1} {"step": 27926, "train_loss": 3.156050443649292, "lr": 4.6801091537173635e-05, "tps": 168133, "wall": 10885.6} {"step": 27927, "train_loss": 3.2501251697540283, "lr": 4.679587604903049e-05, "tps": 168070, "wall": 10890.0} {"step": 27928, "train_loss": 3.2408745288848877, "lr": 4.679066252295306e-05, "tps": 168007, "wall": 10894.5} {"step": 27929, "train_loss": 3.178555488586426, "lr": 4.6785450959000374e-05, "tps": 167945, "wall": 10898.9} {"step": 27930, "train_loss": 3.1157383918762207, "lr": 4.678024135723144e-05, "tps": 167882, "wall": 10903.4} {"step": 27931, "train_loss": 3.186847686767578, "lr": 4.677503371770533e-05, "tps": 167820, "wall": 10907.8} {"step": 27932, "train_loss": 3.1574606895446777, "lr": 4.676982804048101e-05, "tps": 167757, "wall": 10912.3} {"step": 27933, "train_loss": 3.2202906608581543, "lr": 4.676462432561744e-05, "tps": 167695, "wall": 10916.7} {"step": 27934, "train_loss": 3.14030122756958, "lr": 4.6759422573173574e-05, "tps": 167632, "wall": 10921.2} {"step": 27935, "train_loss": 3.2229623794555664, "lr": 4.6754222783208344e-05, "tps": 167569, "wall": 10925.7} {"step": 27936, "train_loss": 3.0433242321014404, "lr": 4.6749024955780656e-05, "tps": 167506, "wall": 10930.2} {"step": 27937, "train_loss": 3.159766912460327, "lr": 4.674382909094939e-05, "tps": 167444, "wall": 10934.6} {"step": 27938, "train_loss": 3.2307791709899902, "lr": 4.67386351887734e-05, "tps": 167382, "wall": 10939.1} {"step": 27939, "train_loss": 3.205031394958496, "lr": 4.67334432493115e-05, "tps": 167320, "wall": 10943.5} {"step": 27940, "train_loss": 3.128002405166626, "lr": 4.672825327262255e-05, "tps": 167258, "wall": 10948.0} {"step": 27941, "train_loss": 3.233884811401367, "lr": 4.67230652587653e-05, "tps": 167196, "wall": 10952.4} {"step": 27942, "train_loss": 3.164716958999634, "lr": 4.671787920779857e-05, "tps": 167134, "wall": 10956.9} {"step": 27943, "train_loss": 3.186800956726074, "lr": 4.671269511978107e-05, "tps": 167072, "wall": 10961.3} {"step": 27944, "train_loss": 3.254364490509033, "lr": 4.670751299477152e-05, "tps": 167010, "wall": 10965.8} {"step": 27945, "train_loss": 3.1129794120788574, "lr": 4.670233283282867e-05, "tps": 166948, "wall": 10970.3} {"step": 27946, "train_loss": 3.2203369140625, "lr": 4.669715463401113e-05, "tps": 166886, "wall": 10974.7} {"step": 27947, "train_loss": 3.1895432472229004, "lr": 4.669197839837761e-05, "tps": 166824, "wall": 10979.2} {"step": 27948, "train_loss": 3.2232959270477295, "lr": 4.668680412598674e-05, "tps": 166762, "wall": 10983.7} {"step": 27949, "train_loss": 3.2775557041168213, "lr": 4.668163181689715e-05, "tps": 166700, "wall": 10988.1} {"step": 27950, "train_loss": 3.088224411010742, "lr": 4.6676461471167375e-05, "tps": 166639, "wall": 10992.6} {"step": 27951, "train_loss": 3.19197940826416, "lr": 4.667129308885603e-05, "tps": 166577, "wall": 10997.0} {"step": 27952, "train_loss": 3.13250732421875, "lr": 4.6666126670021684e-05, "tps": 166516, "wall": 11001.5} {"step": 27953, "train_loss": 3.1802432537078857, "lr": 4.666096221472279e-05, "tps": 166455, "wall": 11005.9} {"step": 27954, "train_loss": 3.216222047805786, "lr": 4.6655799723017903e-05, "tps": 166393, "wall": 11010.4} {"step": 27955, "train_loss": 3.1269304752349854, "lr": 4.665063919496552e-05, "tps": 166332, "wall": 11014.9} {"step": 27956, "train_loss": 3.1826963424682617, "lr": 4.664548063062405e-05, "tps": 166270, "wall": 11019.3} {"step": 27957, "train_loss": 3.14668607711792, "lr": 4.664032403005197e-05, "tps": 166209, "wall": 11023.8} {"step": 27958, "train_loss": 3.260859489440918, "lr": 4.6635169393307666e-05, "tps": 166148, "wall": 11028.2} {"step": 27959, "train_loss": 3.294959545135498, "lr": 4.6630016720449534e-05, "tps": 166086, "wall": 11032.7} {"step": 27960, "train_loss": 3.093893527984619, "lr": 4.662486601153598e-05, "tps": 166025, "wall": 11037.2} {"step": 27961, "train_loss": 3.1624789237976074, "lr": 4.6619717266625274e-05, "tps": 165963, "wall": 11041.7} {"step": 27962, "train_loss": 3.129241466522217, "lr": 4.6614570485775825e-05, "tps": 165902, "wall": 11046.1} {"step": 27963, "train_loss": 3.0840952396392822, "lr": 4.660942566904591e-05, "tps": 165841, "wall": 11050.6} {"step": 27964, "train_loss": 3.2401275634765625, "lr": 4.6604282816493785e-05, "tps": 165780, "wall": 11055.0} {"step": 27965, "train_loss": 3.237710475921631, "lr": 4.659914192817774e-05, "tps": 165719, "wall": 11059.5} {"step": 27966, "train_loss": 3.182448387145996, "lr": 4.659400300415599e-05, "tps": 165659, "wall": 11063.9} {"step": 27967, "train_loss": 3.1399192810058594, "lr": 4.6588866044486744e-05, "tps": 165598, "wall": 11068.4} {"step": 27968, "train_loss": 3.174201011657715, "lr": 4.658373104922822e-05, "tps": 165537, "wall": 11072.9} {"step": 27969, "train_loss": 3.2337417602539062, "lr": 4.657859801843856e-05, "tps": 165477, "wall": 11077.3} {"step": 27970, "train_loss": 3.2518227100372314, "lr": 4.6573466952175903e-05, "tps": 165416, "wall": 11081.8} {"step": 27971, "train_loss": 3.266939163208008, "lr": 4.6568337850498444e-05, "tps": 165355, "wall": 11086.2} {"step": 27972, "train_loss": 3.2843165397644043, "lr": 4.656321071346421e-05, "tps": 165295, "wall": 11090.7} {"step": 27973, "train_loss": 3.1592745780944824, "lr": 4.6558085541131304e-05, "tps": 165234, "wall": 11095.1} {"step": 27974, "train_loss": 3.2312793731689453, "lr": 4.65529623335578e-05, "tps": 165173, "wall": 11099.7} {"step": 27975, "train_loss": 3.183345317840576, "lr": 4.6547841090801716e-05, "tps": 165113, "wall": 11104.1} {"step": 27976, "train_loss": 3.1901628971099854, "lr": 4.6542721812921055e-05, "tps": 165053, "wall": 11108.5} {"step": 27977, "train_loss": 3.2432384490966797, "lr": 4.6537604499973866e-05, "tps": 164992, "wall": 11113.0} {"step": 27978, "train_loss": 3.2700395584106445, "lr": 4.6532489152018025e-05, "tps": 164932, "wall": 11117.5} {"step": 27979, "train_loss": 3.1978964805603027, "lr": 4.6527375769111563e-05, "tps": 164871, "wall": 11121.9} {"step": 27980, "train_loss": 3.1339869499206543, "lr": 4.6522264351312385e-05, "tps": 164811, "wall": 11126.4} {"step": 27981, "train_loss": 3.23734188079834, "lr": 4.651715489867834e-05, "tps": 164751, "wall": 11130.9} {"step": 27982, "train_loss": 3.171724319458008, "lr": 4.651204741126739e-05, "tps": 164691, "wall": 11135.3} {"step": 27983, "train_loss": 3.1486377716064453, "lr": 4.650694188913735e-05, "tps": 164631, "wall": 11139.8} {"step": 27984, "train_loss": 3.0548949241638184, "lr": 4.6501838332346035e-05, "tps": 164571, "wall": 11144.3} {"step": 27985, "train_loss": 3.192262887954712, "lr": 4.649673674095128e-05, "tps": 164511, "wall": 11148.7} {"step": 27986, "train_loss": 3.2053370475769043, "lr": 4.649163711501091e-05, "tps": 164451, "wall": 11153.2} {"step": 27987, "train_loss": 3.1534180641174316, "lr": 4.6486539454582636e-05, "tps": 164391, "wall": 11157.6} {"step": 27988, "train_loss": 3.2349555492401123, "lr": 4.648144375972422e-05, "tps": 164331, "wall": 11162.1} {"step": 27989, "train_loss": 3.093146800994873, "lr": 4.6476350030493434e-05, "tps": 164271, "wall": 11166.6} {"step": 27990, "train_loss": 3.027453899383545, "lr": 4.64712582669479e-05, "tps": 164212, "wall": 11171.0} {"step": 27991, "train_loss": 3.158175468444824, "lr": 4.646616846914537e-05, "tps": 164152, "wall": 11175.5} {"step": 27992, "train_loss": 3.1344213485717773, "lr": 4.646108063714347e-05, "tps": 164093, "wall": 11179.9} {"step": 27993, "train_loss": 3.1732380390167236, "lr": 4.645599477099982e-05, "tps": 164033, "wall": 11184.4} {"step": 27994, "train_loss": 3.2147932052612305, "lr": 4.645091087077206e-05, "tps": 163973, "wall": 11188.8} {"step": 27995, "train_loss": 3.1368765830993652, "lr": 4.644582893651775e-05, "tps": 163914, "wall": 11193.3} {"step": 27996, "train_loss": 3.1310741901397705, "lr": 4.644074896829451e-05, "tps": 163854, "wall": 11197.8} {"step": 27997, "train_loss": 3.107546806335449, "lr": 4.643567096615985e-05, "tps": 163795, "wall": 11202.3} {"step": 27998, "train_loss": 3.1932895183563232, "lr": 4.643059493017127e-05, "tps": 163736, "wall": 11206.7} {"step": 27999, "train_loss": 3.1877474784851074, "lr": 4.6425520860386326e-05, "tps": 163676, "wall": 11211.2} {"step": 28000, "train_loss": 3.2150163650512695, "lr": 4.642044875686249e-05, "tps": 163617, "wall": 11215.6, "val_loss_monitor": 3.3154462926097388} {"step": 28001, "train_loss": 3.1227126121520996, "lr": 4.6415378619657154e-05, "tps": 163114, "wall": 11250.6} {"step": 28002, "train_loss": 3.2149479389190674, "lr": 4.6410310448827837e-05, "tps": 163055, "wall": 11255.1} {"step": 28003, "train_loss": 3.2052369117736816, "lr": 4.64052442444319e-05, "tps": 162995, "wall": 11259.6} {"step": 28004, "train_loss": 3.199977397918701, "lr": 4.640018000652675e-05, "tps": 162937, "wall": 11264.1} {"step": 28005, "train_loss": 3.1788582801818848, "lr": 4.639511773516974e-05, "tps": 162878, "wall": 11268.5} {"step": 28006, "train_loss": 3.233891248703003, "lr": 4.639005743041826e-05, "tps": 162819, "wall": 11273.0} {"step": 28007, "train_loss": 3.1520237922668457, "lr": 4.638499909232957e-05, "tps": 162761, "wall": 11277.4} {"step": 28008, "train_loss": 3.079049587249756, "lr": 4.6379942720961025e-05, "tps": 162702, "wall": 11281.9} {"step": 28009, "train_loss": 3.2627341747283936, "lr": 4.637488831636988e-05, "tps": 162644, "wall": 11286.4} {"step": 28010, "train_loss": 3.1796534061431885, "lr": 4.6369835878613365e-05, "tps": 162585, "wall": 11290.8} {"step": 28011, "train_loss": 3.0978639125823975, "lr": 4.6364785407748765e-05, "tps": 162527, "wall": 11295.3} {"step": 28012, "train_loss": 3.2141880989074707, "lr": 4.635973690383327e-05, "tps": 162469, "wall": 11299.7} {"step": 28013, "train_loss": 3.14481258392334, "lr": 4.635469036692405e-05, "tps": 162411, "wall": 11304.2} {"step": 28014, "train_loss": 3.0733931064605713, "lr": 4.634964579707832e-05, "tps": 162353, "wall": 11308.6} {"step": 28015, "train_loss": 3.1961894035339355, "lr": 4.6344603194353165e-05, "tps": 162295, "wall": 11313.1} {"step": 28016, "train_loss": 3.189145088195801, "lr": 4.6339562558805764e-05, "tps": 162237, "wall": 11317.5} {"step": 28017, "train_loss": 3.155060291290283, "lr": 4.6334523890493196e-05, "tps": 162178, "wall": 11322.0} {"step": 28018, "train_loss": 3.144179105758667, "lr": 4.6329487189472504e-05, "tps": 162120, "wall": 11326.5} {"step": 28019, "train_loss": 3.209022045135498, "lr": 4.632445245580082e-05, "tps": 162062, "wall": 11330.9} {"step": 28020, "train_loss": 3.156153678894043, "lr": 4.631941968953512e-05, "tps": 162004, "wall": 11335.4} {"step": 28021, "train_loss": 3.151386260986328, "lr": 4.63143888907324e-05, "tps": 161946, "wall": 11339.9} {"step": 28022, "train_loss": 3.2016706466674805, "lr": 4.6309360059449724e-05, "tps": 161888, "wall": 11344.3} {"step": 28023, "train_loss": 3.200615644454956, "lr": 4.6304333195743995e-05, "tps": 161830, "wall": 11348.8} {"step": 28024, "train_loss": 3.2169907093048096, "lr": 4.629930829967215e-05, "tps": 161772, "wall": 11353.3} {"step": 28025, "train_loss": 3.2244608402252197, "lr": 4.629428537129117e-05, "tps": 161714, "wall": 11357.7} {"step": 28026, "train_loss": 3.1536080837249756, "lr": 4.628926441065793e-05, "tps": 161657, "wall": 11362.2} {"step": 28027, "train_loss": 3.1685585975646973, "lr": 4.628424541782927e-05, "tps": 161599, "wall": 11366.6} {"step": 28028, "train_loss": 3.2302403450012207, "lr": 4.627922839286209e-05, "tps": 161541, "wall": 11371.1} {"step": 28029, "train_loss": 3.1240897178649902, "lr": 4.627421333581323e-05, "tps": 161484, "wall": 11375.6} {"step": 28030, "train_loss": 3.2459897994995117, "lr": 4.626920024673944e-05, "tps": 161426, "wall": 11380.0} {"step": 28031, "train_loss": 3.208926200866699, "lr": 4.6264189125697575e-05, "tps": 161369, "wall": 11384.5} {"step": 28032, "train_loss": 3.1791296005249023, "lr": 4.625917997274435e-05, "tps": 161311, "wall": 11388.9} {"step": 28033, "train_loss": 3.0852975845336914, "lr": 4.625417278793657e-05, "tps": 161254, "wall": 11393.4} {"step": 28034, "train_loss": 3.180582046508789, "lr": 4.6249167571330886e-05, "tps": 161197, "wall": 11397.8} {"step": 28035, "train_loss": 3.153392791748047, "lr": 4.624416432298404e-05, "tps": 161139, "wall": 11402.3} {"step": 28036, "train_loss": 3.1746058464050293, "lr": 4.623916304295271e-05, "tps": 161081, "wall": 11406.8} {"step": 28037, "train_loss": 3.213710308074951, "lr": 4.623416373129356e-05, "tps": 161024, "wall": 11411.3} {"step": 28038, "train_loss": 3.220763683319092, "lr": 4.622916638806315e-05, "tps": 160967, "wall": 11415.7} {"step": 28039, "train_loss": 3.080160617828369, "lr": 4.6224171013318195e-05, "tps": 160910, "wall": 11420.2} {"step": 28040, "train_loss": 3.1907479763031006, "lr": 4.621917760711522e-05, "tps": 160853, "wall": 11424.6} {"step": 28041, "train_loss": 3.038583993911743, "lr": 4.621418616951078e-05, "tps": 160796, "wall": 11429.1} {"step": 28042, "train_loss": 3.1891112327575684, "lr": 4.620919670056145e-05, "tps": 160740, "wall": 11433.5} {"step": 28043, "train_loss": 3.2639217376708984, "lr": 4.6204209200323765e-05, "tps": 160683, "wall": 11438.0} {"step": 28044, "train_loss": 3.22489595413208, "lr": 4.6199223668854165e-05, "tps": 160626, "wall": 11442.4} {"step": 28045, "train_loss": 3.2975924015045166, "lr": 4.619424010620919e-05, "tps": 160569, "wall": 11446.9} {"step": 28046, "train_loss": 3.095508098602295, "lr": 4.618925851244527e-05, "tps": 160512, "wall": 11451.3} {"step": 28047, "train_loss": 3.245936632156372, "lr": 4.6184278887618786e-05, "tps": 160456, "wall": 11455.8} {"step": 28048, "train_loss": 3.0983967781066895, "lr": 4.617930123178625e-05, "tps": 160398, "wall": 11460.3} {"step": 28049, "train_loss": 3.2653558254241943, "lr": 4.617432554500396e-05, "tps": 160342, "wall": 11464.8} {"step": 28050, "train_loss": 3.190042734146118, "lr": 4.616935182732832e-05, "tps": 160285, "wall": 11469.2} {"step": 28051, "train_loss": 3.1124777793884277, "lr": 4.616438007881568e-05, "tps": 160228, "wall": 11473.7} {"step": 28052, "train_loss": 3.24029541015625, "lr": 4.615941029952232e-05, "tps": 160172, "wall": 11478.1} {"step": 28053, "train_loss": 3.148597478866577, "lr": 4.615444248950459e-05, "tps": 160115, "wall": 11482.6} {"step": 28054, "train_loss": 3.2454428672790527, "lr": 4.614947664881874e-05, "tps": 160059, "wall": 11487.1} {"step": 28055, "train_loss": 3.2177481651306152, "lr": 4.614451277752099e-05, "tps": 160003, "wall": 11491.5} {"step": 28056, "train_loss": 3.1459383964538574, "lr": 4.613955087566764e-05, "tps": 159946, "wall": 11496.0} {"step": 28057, "train_loss": 3.1405529975891113, "lr": 4.613459094331487e-05, "tps": 159890, "wall": 11500.4} {"step": 28058, "train_loss": 3.126424789428711, "lr": 4.612963298051883e-05, "tps": 159834, "wall": 11504.9} {"step": 28059, "train_loss": 3.0708699226379395, "lr": 4.6124676987335725e-05, "tps": 159778, "wall": 11509.3} {"step": 28060, "train_loss": 3.1405177116394043, "lr": 4.611972296382169e-05, "tps": 159722, "wall": 11513.8} {"step": 28061, "train_loss": 3.1750922203063965, "lr": 4.611477091003284e-05, "tps": 159665, "wall": 11518.3} {"step": 28062, "train_loss": 3.2770540714263916, "lr": 4.610982082602527e-05, "tps": 159609, "wall": 11522.7} {"step": 28063, "train_loss": 3.1347923278808594, "lr": 4.610487271185507e-05, "tps": 159553, "wall": 11527.2} {"step": 28064, "train_loss": 3.1964504718780518, "lr": 4.609992656757823e-05, "tps": 159497, "wall": 11531.7} {"step": 28065, "train_loss": 3.203470230102539, "lr": 4.6094982393250884e-05, "tps": 159441, "wall": 11536.1} {"step": 28066, "train_loss": 3.199763059616089, "lr": 4.609004018892898e-05, "tps": 159385, "wall": 11540.6} {"step": 28067, "train_loss": 3.190776824951172, "lr": 4.608509995466848e-05, "tps": 159329, "wall": 11545.0} {"step": 28068, "train_loss": 3.2206621170043945, "lr": 4.6080161690525395e-05, "tps": 159273, "wall": 11549.5} {"step": 28069, "train_loss": 3.2294883728027344, "lr": 4.6075225396555636e-05, "tps": 159217, "wall": 11553.9} {"step": 28070, "train_loss": 3.1630635261535645, "lr": 4.6070291072815154e-05, "tps": 159162, "wall": 11558.4} {"step": 28071, "train_loss": 3.2119336128234863, "lr": 4.6065358719359806e-05, "tps": 159106, "wall": 11562.8} {"step": 28072, "train_loss": 3.065448522567749, "lr": 4.606042833624551e-05, "tps": 159050, "wall": 11567.3} {"step": 28073, "train_loss": 3.277345657348633, "lr": 4.6055499923528076e-05, "tps": 158995, "wall": 11571.8} {"step": 28074, "train_loss": 3.2088441848754883, "lr": 4.6050573481263326e-05, "tps": 158939, "wall": 11576.2} {"step": 28075, "train_loss": 3.136601448059082, "lr": 4.604564900950711e-05, "tps": 158883, "wall": 11580.7} {"step": 28076, "train_loss": 3.14456844329834, "lr": 4.604072650831521e-05, "tps": 158828, "wall": 11585.2} {"step": 28077, "train_loss": 3.1444272994995117, "lr": 4.603580597774334e-05, "tps": 158772, "wall": 11589.6} {"step": 28078, "train_loss": 3.1702117919921875, "lr": 4.603088741784729e-05, "tps": 158717, "wall": 11594.1} {"step": 28079, "train_loss": 3.1258413791656494, "lr": 4.602597082868275e-05, "tps": 158662, "wall": 11598.5} {"step": 28080, "train_loss": 3.1441457271575928, "lr": 4.602105621030543e-05, "tps": 158607, "wall": 11603.0} {"step": 28081, "train_loss": 3.1785974502563477, "lr": 4.6016143562771e-05, "tps": 158551, "wall": 11607.4} {"step": 28082, "train_loss": 3.2577695846557617, "lr": 4.601123288613512e-05, "tps": 158496, "wall": 11611.9} {"step": 28083, "train_loss": 3.2661895751953125, "lr": 4.600632418045336e-05, "tps": 158441, "wall": 11616.4} {"step": 28084, "train_loss": 3.213858127593994, "lr": 4.6001417445781415e-05, "tps": 158386, "wall": 11620.8} {"step": 28085, "train_loss": 3.1730546951293945, "lr": 4.599651268217481e-05, "tps": 158330, "wall": 11625.3} {"step": 28086, "train_loss": 3.1808032989501953, "lr": 4.599160988968911e-05, "tps": 158276, "wall": 11629.7} {"step": 28087, "train_loss": 3.072448253631592, "lr": 4.59867090683799e-05, "tps": 158221, "wall": 11634.2} {"step": 28088, "train_loss": 3.1843748092651367, "lr": 4.5981810218302645e-05, "tps": 158165, "wall": 11638.7} {"step": 28089, "train_loss": 3.1564478874206543, "lr": 4.597691333951285e-05, "tps": 158110, "wall": 11643.1} {"step": 28090, "train_loss": 3.2950143814086914, "lr": 4.597201843206601e-05, "tps": 158055, "wall": 11647.6} {"step": 28091, "train_loss": 3.205134391784668, "lr": 4.5967125496017565e-05, "tps": 158001, "wall": 11652.1} {"step": 28092, "train_loss": 3.1158926486968994, "lr": 4.596223453142291e-05, "tps": 157946, "wall": 11656.5} {"step": 28093, "train_loss": 3.2555465698242188, "lr": 4.5957345538337506e-05, "tps": 157891, "wall": 11661.0} {"step": 28094, "train_loss": 3.150475025177002, "lr": 4.595245851681668e-05, "tps": 157837, "wall": 11665.4} {"step": 28095, "train_loss": 3.1083762645721436, "lr": 4.594757346691585e-05, "tps": 157782, "wall": 11669.9} {"step": 28096, "train_loss": 3.182204008102417, "lr": 4.594269038869032e-05, "tps": 157727, "wall": 11674.3} {"step": 28097, "train_loss": 3.2545528411865234, "lr": 4.5937809282195366e-05, "tps": 157673, "wall": 11678.8} {"step": 28098, "train_loss": 3.2616219520568848, "lr": 4.593293014748637e-05, "tps": 157618, "wall": 11683.2} {"step": 28099, "train_loss": 3.206383466720581, "lr": 4.592805298461856e-05, "tps": 157564, "wall": 11687.7} {"step": 28100, "train_loss": 3.2482051849365234, "lr": 4.592317779364716e-05, "tps": 157510, "wall": 11692.1} {"step": 28101, "train_loss": 3.195504665374756, "lr": 4.5918304574627424e-05, "tps": 157455, "wall": 11696.6} {"step": 28102, "train_loss": 3.1540207862854004, "lr": 4.591343332761457e-05, "tps": 157400, "wall": 11701.1} {"step": 28103, "train_loss": 3.112107038497925, "lr": 4.5908564052663736e-05, "tps": 157346, "wall": 11705.5} {"step": 28104, "train_loss": 3.2537951469421387, "lr": 4.590369674983012e-05, "tps": 157292, "wall": 11710.0} {"step": 28105, "train_loss": 3.2268948554992676, "lr": 4.589883141916885e-05, "tps": 157237, "wall": 11714.5} {"step": 28106, "train_loss": 3.228917360305786, "lr": 4.589396806073502e-05, "tps": 157183, "wall": 11718.9} {"step": 28107, "train_loss": 3.1788735389709473, "lr": 4.588910667458376e-05, "tps": 157129, "wall": 11723.4} {"step": 28108, "train_loss": 3.2578072547912598, "lr": 4.58842472607701e-05, "tps": 157075, "wall": 11727.8} {"step": 28109, "train_loss": 3.117418050765991, "lr": 4.587938981934911e-05, "tps": 157021, "wall": 11732.3} {"step": 28110, "train_loss": 3.129838228225708, "lr": 4.5874534350375825e-05, "tps": 156967, "wall": 11736.7} {"step": 28111, "train_loss": 3.1703009605407715, "lr": 4.5869680853905214e-05, "tps": 156913, "wall": 11741.2} {"step": 28112, "train_loss": 3.1267852783203125, "lr": 4.5864829329992294e-05, "tps": 156859, "wall": 11745.7} {"step": 28113, "train_loss": 3.213641405105591, "lr": 4.585997977869202e-05, "tps": 156805, "wall": 11750.1} {"step": 28114, "train_loss": 3.1732802391052246, "lr": 4.585513220005927e-05, "tps": 156751, "wall": 11754.6} {"step": 28115, "train_loss": 3.185142755508423, "lr": 4.585028659414905e-05, "tps": 156695, "wall": 11759.1} {"step": 28116, "train_loss": 3.1238484382629395, "lr": 4.5845442961016194e-05, "tps": 156642, "wall": 11763.6} {"step": 28117, "train_loss": 3.115945816040039, "lr": 4.5840601300715554e-05, "tps": 156588, "wall": 11768.0} {"step": 28118, "train_loss": 3.1910033226013184, "lr": 4.5835761613302045e-05, "tps": 156535, "wall": 11772.5} {"step": 28119, "train_loss": 3.225184440612793, "lr": 4.583092389883043e-05, "tps": 156481, "wall": 11776.9} {"step": 28120, "train_loss": 3.3226399421691895, "lr": 4.582608815735552e-05, "tps": 156427, "wall": 11781.4} {"step": 28121, "train_loss": 3.131251335144043, "lr": 4.582125438893213e-05, "tps": 156374, "wall": 11785.8} {"step": 28122, "train_loss": 3.1367928981781006, "lr": 4.5816422593615e-05, "tps": 156320, "wall": 11790.3} {"step": 28123, "train_loss": 3.1333537101745605, "lr": 4.581159277145882e-05, "tps": 156267, "wall": 11794.7} {"step": 28124, "train_loss": 3.0866801738739014, "lr": 4.580676492251836e-05, "tps": 156213, "wall": 11799.2} {"step": 28125, "train_loss": 3.182028293609619, "lr": 4.5801939046848294e-05, "tps": 156160, "wall": 11803.7} {"step": 28126, "train_loss": 3.0775909423828125, "lr": 4.579711514450328e-05, "tps": 156107, "wall": 11808.1} {"step": 28127, "train_loss": 3.177412509918213, "lr": 4.579229321553799e-05, "tps": 156053, "wall": 11812.6} {"step": 28128, "train_loss": 3.1834518909454346, "lr": 4.578747326000699e-05, "tps": 156000, "wall": 11817.0} {"step": 28129, "train_loss": 3.1859846115112305, "lr": 4.578265527796494e-05, "tps": 155946, "wall": 11821.5} {"step": 28130, "train_loss": 3.142759323120117, "lr": 4.57778392694664e-05, "tps": 155893, "wall": 11826.0} {"step": 28131, "train_loss": 3.205443859100342, "lr": 4.577302523456591e-05, "tps": 155840, "wall": 11830.4} {"step": 28132, "train_loss": 3.1968472003936768, "lr": 4.576821317331804e-05, "tps": 155787, "wall": 11834.9} {"step": 28133, "train_loss": 3.116769313812256, "lr": 4.576340308577727e-05, "tps": 155733, "wall": 11839.4} {"step": 28134, "train_loss": 3.0860490798950195, "lr": 4.5758594971998065e-05, "tps": 155680, "wall": 11843.8} {"step": 28135, "train_loss": 3.2056851387023926, "lr": 4.575378883203494e-05, "tps": 155627, "wall": 11848.3} {"step": 28136, "train_loss": 3.0733962059020996, "lr": 4.574898466594233e-05, "tps": 155575, "wall": 11852.7} {"step": 28137, "train_loss": 3.2233543395996094, "lr": 4.574418247377463e-05, "tps": 155522, "wall": 11857.2} {"step": 28138, "train_loss": 3.1454384326934814, "lr": 4.573938225558628e-05, "tps": 155469, "wall": 11861.6} {"step": 28139, "train_loss": 3.2924964427948, "lr": 4.5734584011431635e-05, "tps": 155416, "wall": 11866.1} {"step": 28140, "train_loss": 3.0527915954589844, "lr": 4.5729787741365026e-05, "tps": 155363, "wall": 11870.5} {"step": 28141, "train_loss": 3.229854106903076, "lr": 4.5724993445440825e-05, "tps": 155310, "wall": 11875.0} {"step": 28142, "train_loss": 3.041476249694824, "lr": 4.572020112371333e-05, "tps": 155256, "wall": 11879.5} {"step": 28143, "train_loss": 3.0885090827941895, "lr": 4.571541077623682e-05, "tps": 155204, "wall": 11884.0} {"step": 28144, "train_loss": 3.1747775077819824, "lr": 4.571062240306557e-05, "tps": 155151, "wall": 11888.4} {"step": 28145, "train_loss": 3.140042543411255, "lr": 4.570583600425381e-05, "tps": 155099, "wall": 11892.9} {"step": 28146, "train_loss": 3.0843186378479004, "lr": 4.570105157985577e-05, "tps": 155046, "wall": 11897.3} {"step": 28147, "train_loss": 3.160006046295166, "lr": 4.569626912992566e-05, "tps": 154994, "wall": 11901.8} {"step": 28148, "train_loss": 3.1122426986694336, "lr": 4.569148865451763e-05, "tps": 154941, "wall": 11906.3} {"step": 28149, "train_loss": 3.1906590461730957, "lr": 4.568671015368584e-05, "tps": 154889, "wall": 11910.7} {"step": 28150, "train_loss": 3.159486770629883, "lr": 4.568193362748445e-05, "tps": 154836, "wall": 11915.1} {"step": 28151, "train_loss": 3.28060245513916, "lr": 4.5677159075967524e-05, "tps": 154784, "wall": 11919.6} {"step": 28152, "train_loss": 3.1324336528778076, "lr": 4.5672386499189186e-05, "tps": 154732, "wall": 11924.1} {"step": 28153, "train_loss": 3.0691099166870117, "lr": 4.566761589720347e-05, "tps": 154679, "wall": 11928.5} {"step": 28154, "train_loss": 3.1842880249023438, "lr": 4.5662847270064435e-05, "tps": 154627, "wall": 11933.0} {"step": 28155, "train_loss": 3.1258511543273926, "lr": 4.565808061782612e-05, "tps": 154575, "wall": 11937.4} {"step": 28156, "train_loss": 3.1546802520751953, "lr": 4.565331594054247e-05, "tps": 154522, "wall": 11941.9} {"step": 28157, "train_loss": 3.1378488540649414, "lr": 4.564855323826751e-05, "tps": 154470, "wall": 11946.4} {"step": 28158, "train_loss": 3.2549071311950684, "lr": 4.5643792511055163e-05, "tps": 154418, "wall": 11950.9} {"step": 28159, "train_loss": 3.1828300952911377, "lr": 4.563903375895938e-05, "tps": 154365, "wall": 11955.3} {"step": 28160, "train_loss": 3.1341280937194824, "lr": 4.563427698203403e-05, "tps": 154313, "wall": 11959.8} {"step": 28161, "train_loss": 3.181842803955078, "lr": 4.5629522180333044e-05, "tps": 154261, "wall": 11964.2} {"step": 28162, "train_loss": 3.175628900527954, "lr": 4.562476935391026e-05, "tps": 154209, "wall": 11968.7} {"step": 28163, "train_loss": 3.1242411136627197, "lr": 4.562001850281951e-05, "tps": 154157, "wall": 11973.2} {"step": 28164, "train_loss": 3.0945796966552734, "lr": 4.561526962711463e-05, "tps": 154106, "wall": 11977.6} {"step": 28165, "train_loss": 3.140575885772705, "lr": 4.5610522726849414e-05, "tps": 154054, "wall": 11982.1} {"step": 28166, "train_loss": 3.1791865825653076, "lr": 4.560577780207762e-05, "tps": 154002, "wall": 11986.5} {"step": 28167, "train_loss": 3.2387256622314453, "lr": 4.560103485285303e-05, "tps": 153950, "wall": 11991.0} {"step": 28168, "train_loss": 3.191319227218628, "lr": 4.5596293879229323e-05, "tps": 153899, "wall": 11995.4} {"step": 28169, "train_loss": 3.0874991416931152, "lr": 4.559155488126026e-05, "tps": 153846, "wall": 11999.9} {"step": 28170, "train_loss": 3.13930344581604, "lr": 4.558681785899949e-05, "tps": 153794, "wall": 12004.4} {"step": 28171, "train_loss": 3.2567644119262695, "lr": 4.5582082812500684e-05, "tps": 153742, "wall": 12008.9} {"step": 28172, "train_loss": 3.232219696044922, "lr": 4.557734974181748e-05, "tps": 153691, "wall": 12013.3} {"step": 28173, "train_loss": 3.257018566131592, "lr": 4.55726186470035e-05, "tps": 153639, "wall": 12017.8} {"step": 28174, "train_loss": 3.2867112159729004, "lr": 4.5567889528112315e-05, "tps": 153588, "wall": 12022.3} {"step": 28175, "train_loss": 3.206662654876709, "lr": 4.556316238519753e-05, "tps": 153536, "wall": 12026.7} {"step": 28176, "train_loss": 3.119202136993408, "lr": 4.5558437218312675e-05, "tps": 153485, "wall": 12031.2} {"step": 28177, "train_loss": 3.197291851043701, "lr": 4.5553714027511266e-05, "tps": 153433, "wall": 12035.6} {"step": 28178, "train_loss": 3.078064203262329, "lr": 4.554899281284685e-05, "tps": 153382, "wall": 12040.1} {"step": 28179, "train_loss": 3.176095724105835, "lr": 4.554427357437287e-05, "tps": 153331, "wall": 12044.6} {"step": 28180, "train_loss": 3.189523220062256, "lr": 4.5539556312142774e-05, "tps": 153279, "wall": 12049.0} {"step": 28181, "train_loss": 3.223644733428955, "lr": 4.553484102621006e-05, "tps": 153228, "wall": 12053.5} {"step": 28182, "train_loss": 3.198054552078247, "lr": 4.553012771662807e-05, "tps": 153177, "wall": 12057.9} {"step": 28183, "train_loss": 3.184741258621216, "lr": 4.552541638345025e-05, "tps": 153125, "wall": 12062.4} {"step": 28184, "train_loss": 3.237004518508911, "lr": 4.552070702672996e-05, "tps": 153073, "wall": 12066.9} {"step": 28185, "train_loss": 3.1659908294677734, "lr": 4.551599964652052e-05, "tps": 153022, "wall": 12071.4} {"step": 28186, "train_loss": 3.13466739654541, "lr": 4.551129424287528e-05, "tps": 152971, "wall": 12075.9} {"step": 28187, "train_loss": 3.079793930053711, "lr": 4.550659081584755e-05, "tps": 152919, "wall": 12080.4} {"step": 28188, "train_loss": 3.2567343711853027, "lr": 4.5501889365490585e-05, "tps": 152868, "wall": 12084.8} {"step": 28189, "train_loss": 3.202282190322876, "lr": 4.5497189891857685e-05, "tps": 152817, "wall": 12089.3} {"step": 28190, "train_loss": 3.2781834602355957, "lr": 4.549249239500202e-05, "tps": 152766, "wall": 12093.8} {"step": 28191, "train_loss": 3.2296433448791504, "lr": 4.548779687497686e-05, "tps": 152715, "wall": 12098.3} {"step": 28192, "train_loss": 3.2696876525878906, "lr": 4.548310333183538e-05, "tps": 152664, "wall": 12102.7} {"step": 28193, "train_loss": 3.2534704208374023, "lr": 4.5478411765630755e-05, "tps": 152613, "wall": 12107.2} {"step": 28194, "train_loss": 3.16790771484375, "lr": 4.54737221764161e-05, "tps": 152563, "wall": 12111.6} {"step": 28195, "train_loss": 3.2440989017486572, "lr": 4.546903456424459e-05, "tps": 152512, "wall": 12116.1} {"step": 28196, "train_loss": 3.2592508792877197, "lr": 4.546434892916929e-05, "tps": 152460, "wall": 12120.6} {"step": 28197, "train_loss": 3.104846477508545, "lr": 4.5459665271243266e-05, "tps": 152409, "wall": 12125.1} {"step": 28198, "train_loss": 3.174924373626709, "lr": 4.5454983590519615e-05, "tps": 152359, "wall": 12129.6} {"step": 28199, "train_loss": 3.2176575660705566, "lr": 4.545030388705136e-05, "tps": 152308, "wall": 12134.0} {"step": 28200, "train_loss": 3.186610221862793, "lr": 4.544562616089148e-05, "tps": 152257, "wall": 12138.6} {"step": 28201, "train_loss": 3.113128662109375, "lr": 4.5440950412093e-05, "tps": 152206, "wall": 12143.0} {"step": 28202, "train_loss": 3.159420967102051, "lr": 4.5436276640708886e-05, "tps": 152156, "wall": 12147.4} {"step": 28203, "train_loss": 3.1612353324890137, "lr": 4.543160484679206e-05, "tps": 152105, "wall": 12151.9} {"step": 28204, "train_loss": 3.194375514984131, "lr": 4.542693503039549e-05, "tps": 152055, "wall": 12156.4} {"step": 28205, "train_loss": 3.2009406089782715, "lr": 4.5422267191572e-05, "tps": 152004, "wall": 12160.9} {"step": 28206, "train_loss": 3.0945348739624023, "lr": 4.5417601330374535e-05, "tps": 151954, "wall": 12165.3} {"step": 28207, "train_loss": 3.2731237411499023, "lr": 4.541293744685593e-05, "tps": 151903, "wall": 12169.8} {"step": 28208, "train_loss": 3.1570279598236084, "lr": 4.5408275541069e-05, "tps": 151853, "wall": 12174.3} {"step": 28209, "train_loss": 3.161452054977417, "lr": 4.540361561306659e-05, "tps": 151802, "wall": 12178.8} {"step": 28210, "train_loss": 3.149993419647217, "lr": 4.5398957662901475e-05, "tps": 151752, "wall": 12183.2} {"step": 28211, "train_loss": 3.2176361083984375, "lr": 4.539430169062637e-05, "tps": 151702, "wall": 12187.7} {"step": 28212, "train_loss": 3.222957134246826, "lr": 4.5389647696294095e-05, "tps": 151652, "wall": 12192.2} {"step": 28213, "train_loss": 3.1770684719085693, "lr": 4.538499567995735e-05, "tps": 151601, "wall": 12196.6} {"step": 28214, "train_loss": 3.2018015384674072, "lr": 4.5380345641668786e-05, "tps": 151551, "wall": 12201.1} {"step": 28215, "train_loss": 3.089857578277588, "lr": 4.5375697581481124e-05, "tps": 151501, "wall": 12205.6} {"step": 28216, "train_loss": 3.1943016052246094, "lr": 4.5371051499447024e-05, "tps": 151451, "wall": 12210.0} {"step": 28217, "train_loss": 3.293036460876465, "lr": 4.536640739561906e-05, "tps": 151401, "wall": 12214.5} {"step": 28218, "train_loss": 3.2014451026916504, "lr": 4.536176527004992e-05, "tps": 151351, "wall": 12219.0} {"step": 28219, "train_loss": 3.1034345626831055, "lr": 4.535712512279213e-05, "tps": 151301, "wall": 12223.4} {"step": 28220, "train_loss": 3.17441463470459, "lr": 4.5352486953898275e-05, "tps": 151251, "wall": 12227.9} {"step": 28221, "train_loss": 3.099907875061035, "lr": 4.534785076342091e-05, "tps": 151201, "wall": 12232.4} {"step": 28222, "train_loss": 3.149399995803833, "lr": 4.534321655141254e-05, "tps": 151152, "wall": 12236.8} {"step": 28223, "train_loss": 3.2419705390930176, "lr": 4.533858431792565e-05, "tps": 151101, "wall": 12241.3} {"step": 28224, "train_loss": 3.186572551727295, "lr": 4.5333954063012743e-05, "tps": 151051, "wall": 12245.8} {"step": 28225, "train_loss": 3.187164783477783, "lr": 4.5329325786726216e-05, "tps": 151002, "wall": 12250.3} {"step": 28226, "train_loss": 3.1176352500915527, "lr": 4.532469948911858e-05, "tps": 150952, "wall": 12254.8} {"step": 28227, "train_loss": 3.1679368019104004, "lr": 4.5320075170242196e-05, "tps": 150902, "wall": 12259.2} {"step": 28228, "train_loss": 3.1552140712738037, "lr": 4.5315452830149404e-05, "tps": 150853, "wall": 12263.7} {"step": 28229, "train_loss": 3.087341070175171, "lr": 4.531083246889266e-05, "tps": 150803, "wall": 12268.1} {"step": 28230, "train_loss": 3.1560006141662598, "lr": 4.530621408652424e-05, "tps": 150754, "wall": 12272.6} {"step": 28231, "train_loss": 3.234955310821533, "lr": 4.5301597683096475e-05, "tps": 150704, "wall": 12277.1} {"step": 28232, "train_loss": 3.213597297668457, "lr": 4.529698325866166e-05, "tps": 150655, "wall": 12281.5} {"step": 28233, "train_loss": 3.2252941131591797, "lr": 4.529237081327209e-05, "tps": 150605, "wall": 12286.0} {"step": 28234, "train_loss": 3.168581485748291, "lr": 4.5287760346979967e-05, "tps": 150556, "wall": 12290.5} {"step": 28235, "train_loss": 3.184816837310791, "lr": 4.5283151859837544e-05, "tps": 150507, "wall": 12294.9} {"step": 28236, "train_loss": 3.1816844940185547, "lr": 4.527854535189705e-05, "tps": 150456, "wall": 12299.5} {"step": 28237, "train_loss": 3.1552155017852783, "lr": 4.527394082321064e-05, "tps": 150407, "wall": 12303.9} {"step": 28238, "train_loss": 3.107109546661377, "lr": 4.526933827383047e-05, "tps": 150358, "wall": 12308.4} {"step": 28239, "train_loss": 3.0952723026275635, "lr": 4.52647377038087e-05, "tps": 150309, "wall": 12312.9} {"step": 28240, "train_loss": 3.200662612915039, "lr": 4.526013911319745e-05, "tps": 150260, "wall": 12317.3} {"step": 28241, "train_loss": 3.262185573577881, "lr": 4.5255542502048804e-05, "tps": 150211, "wall": 12321.8} {"step": 28242, "train_loss": 3.2219409942626953, "lr": 4.525094787041478e-05, "tps": 150162, "wall": 12326.2} {"step": 28243, "train_loss": 3.204028606414795, "lr": 4.5246355218347514e-05, "tps": 150113, "wall": 12330.7} {"step": 28244, "train_loss": 3.2253050804138184, "lr": 4.524176454589896e-05, "tps": 150064, "wall": 12335.2} {"step": 28245, "train_loss": 3.118353843688965, "lr": 4.523717585312117e-05, "tps": 150015, "wall": 12339.6} {"step": 28246, "train_loss": 3.2300992012023926, "lr": 4.52325891400661e-05, "tps": 149965, "wall": 12344.1} {"step": 28247, "train_loss": 3.137755870819092, "lr": 4.5228004406785695e-05, "tps": 149916, "wall": 12348.6} {"step": 28248, "train_loss": 3.1638264656066895, "lr": 4.522342165333194e-05, "tps": 149868, "wall": 12353.0} {"step": 28249, "train_loss": 3.1203384399414062, "lr": 4.521884087975672e-05, "tps": 149819, "wall": 12357.5} {"step": 28250, "train_loss": 3.055420398712158, "lr": 4.5214262086111905e-05, "tps": 149769, "wall": 12362.0} {"step": 28251, "train_loss": 3.157778024673462, "lr": 4.52096852724494e-05, "tps": 149721, "wall": 12366.5} {"step": 28252, "train_loss": 3.1539077758789062, "lr": 4.5205110438821044e-05, "tps": 149672, "wall": 12371.0} {"step": 28253, "train_loss": 3.1609909534454346, "lr": 4.520053758527863e-05, "tps": 149623, "wall": 12375.4} {"step": 28254, "train_loss": 3.1043617725372314, "lr": 4.519596671187399e-05, "tps": 149574, "wall": 12379.9} {"step": 28255, "train_loss": 3.183025360107422, "lr": 4.5191397818658916e-05, "tps": 149525, "wall": 12384.4} {"step": 28256, "train_loss": 3.2420248985290527, "lr": 4.51868309056851e-05, "tps": 149477, "wall": 12388.9} {"step": 28257, "train_loss": 3.117459297180176, "lr": 4.5182265973004365e-05, "tps": 149428, "wall": 12393.3} {"step": 28258, "train_loss": 3.2387475967407227, "lr": 4.5177703020668364e-05, "tps": 149379, "wall": 12397.8} {"step": 28259, "train_loss": 3.182706356048584, "lr": 4.51731420487288e-05, "tps": 149331, "wall": 12402.3} {"step": 28260, "train_loss": 3.1145167350769043, "lr": 4.5168583057237343e-05, "tps": 149282, "wall": 12406.8} {"step": 28261, "train_loss": 3.181776523590088, "lr": 4.516402604624562e-05, "tps": 149234, "wall": 12411.2} {"step": 28262, "train_loss": 3.200434684753418, "lr": 4.515947101580529e-05, "tps": 149185, "wall": 12415.7} {"step": 28263, "train_loss": 3.059312343597412, "lr": 4.515491796596794e-05, "tps": 149136, "wall": 12420.2} {"step": 28264, "train_loss": 3.180467128753662, "lr": 4.51503668967851e-05, "tps": 149088, "wall": 12424.7} {"step": 28265, "train_loss": 3.2117109298706055, "lr": 4.514581780830839e-05, "tps": 149039, "wall": 12429.2} {"step": 28266, "train_loss": 3.1807053089141846, "lr": 4.514127070058932e-05, "tps": 148991, "wall": 12433.7} {"step": 28267, "train_loss": 3.216676950454712, "lr": 4.5136725573679355e-05, "tps": 148942, "wall": 12438.1} {"step": 28268, "train_loss": 3.1700708866119385, "lr": 4.513218242763008e-05, "tps": 148894, "wall": 12442.6} {"step": 28269, "train_loss": 3.1695404052734375, "lr": 4.5127641262492864e-05, "tps": 148846, "wall": 12447.1} {"step": 28270, "train_loss": 3.104752540588379, "lr": 4.512310207831919e-05, "tps": 148798, "wall": 12451.6} {"step": 28271, "train_loss": 3.3053128719329834, "lr": 4.5118564875160486e-05, "tps": 148749, "wall": 12456.0} {"step": 28272, "train_loss": 3.1004638671875, "lr": 4.511402965306816e-05, "tps": 148701, "wall": 12460.5} {"step": 28273, "train_loss": 3.1006298065185547, "lr": 4.510949641209351e-05, "tps": 148653, "wall": 12465.0} {"step": 28274, "train_loss": 3.126067638397217, "lr": 4.5104965152288e-05, "tps": 148605, "wall": 12469.5} {"step": 28275, "train_loss": 3.0962564945220947, "lr": 4.510043587370289e-05, "tps": 148556, "wall": 12474.0} {"step": 28276, "train_loss": 3.103902816772461, "lr": 4.509590857638949e-05, "tps": 148508, "wall": 12478.5} {"step": 28277, "train_loss": 3.194906234741211, "lr": 4.5091383260399124e-05, "tps": 148460, "wall": 12483.0} {"step": 28278, "train_loss": 3.1854045391082764, "lr": 4.508685992578301e-05, "tps": 148411, "wall": 12487.5} {"step": 28279, "train_loss": 3.1903672218322754, "lr": 4.508233857259243e-05, "tps": 148363, "wall": 12492.0} {"step": 28280, "train_loss": 3.082425832748413, "lr": 4.507781920087856e-05, "tps": 148315, "wall": 12496.5} {"step": 28281, "train_loss": 3.2161405086517334, "lr": 4.507330181069262e-05, "tps": 148268, "wall": 12500.9} {"step": 28282, "train_loss": 3.232544422149658, "lr": 4.506878640208581e-05, "tps": 148220, "wall": 12505.4} {"step": 28283, "train_loss": 3.0569918155670166, "lr": 4.5064272975109226e-05, "tps": 148172, "wall": 12509.9} {"step": 28284, "train_loss": 3.2209882736206055, "lr": 4.505976152981402e-05, "tps": 148124, "wall": 12514.4} {"step": 28285, "train_loss": 3.234818458557129, "lr": 4.5055252066251296e-05, "tps": 148076, "wall": 12518.9} {"step": 28286, "train_loss": 3.294158697128296, "lr": 4.5050744584472174e-05, "tps": 148028, "wall": 12523.4} {"step": 28287, "train_loss": 3.128769636154175, "lr": 4.504623908452764e-05, "tps": 147980, "wall": 12527.9} {"step": 28288, "train_loss": 3.274332284927368, "lr": 4.504173556646879e-05, "tps": 147933, "wall": 12532.3} {"step": 28289, "train_loss": 3.23952579498291, "lr": 4.503723403034663e-05, "tps": 147885, "wall": 12536.8} {"step": 28290, "train_loss": 3.0891261100769043, "lr": 4.503273447621215e-05, "tps": 147836, "wall": 12541.4} {"step": 28291, "train_loss": 3.0493907928466797, "lr": 4.5028236904116316e-05, "tps": 147789, "wall": 12545.9} {"step": 28292, "train_loss": 3.2232043743133545, "lr": 4.502374131411007e-05, "tps": 147741, "wall": 12550.4} {"step": 28293, "train_loss": 3.2425503730773926, "lr": 4.501924770624435e-05, "tps": 147693, "wall": 12554.9} {"step": 28294, "train_loss": 3.1853623390197754, "lr": 4.5014756080570066e-05, "tps": 147646, "wall": 12559.4} {"step": 28295, "train_loss": 3.14337420463562, "lr": 4.5010266437138104e-05, "tps": 147598, "wall": 12563.9} {"step": 28296, "train_loss": 3.1562304496765137, "lr": 4.500577877599928e-05, "tps": 147551, "wall": 12568.3} {"step": 28297, "train_loss": 3.1095471382141113, "lr": 4.500129309720448e-05, "tps": 147503, "wall": 12572.8} {"step": 28298, "train_loss": 3.1138625144958496, "lr": 4.49968094008045e-05, "tps": 147456, "wall": 12577.3} {"step": 28299, "train_loss": 3.1610569953918457, "lr": 4.4992327686850127e-05, "tps": 147408, "wall": 12581.8} {"step": 28300, "train_loss": 3.1899521350860596, "lr": 4.498784795539214e-05, "tps": 147361, "wall": 12586.3} {"step": 28301, "train_loss": 3.1521077156066895, "lr": 4.498337020648127e-05, "tps": 147314, "wall": 12590.8} {"step": 28302, "train_loss": 3.132091760635376, "lr": 4.497889444016825e-05, "tps": 147266, "wall": 12595.3} {"step": 28303, "train_loss": 3.0866384506225586, "lr": 4.4974420656503805e-05, "tps": 147218, "wall": 12599.8} {"step": 28304, "train_loss": 3.1394667625427246, "lr": 4.496994885553856e-05, "tps": 147171, "wall": 12604.3} {"step": 28305, "train_loss": 3.275996685028076, "lr": 4.496547903732323e-05, "tps": 147124, "wall": 12608.8} {"step": 28306, "train_loss": 3.056307077407837, "lr": 4.496101120190841e-05, "tps": 147077, "wall": 12613.3} {"step": 28307, "train_loss": 3.2182188034057617, "lr": 4.4956545349344704e-05, "tps": 147029, "wall": 12617.8} {"step": 28308, "train_loss": 3.054483413696289, "lr": 4.495208147968275e-05, "tps": 146982, "wall": 12622.3} {"step": 28309, "train_loss": 3.2172725200653076, "lr": 4.494761959297309e-05, "tps": 146935, "wall": 12626.8} {"step": 28310, "train_loss": 3.204300880432129, "lr": 4.4943159689266245e-05, "tps": 146888, "wall": 12631.3} {"step": 28311, "train_loss": 3.1493592262268066, "lr": 4.493870176861276e-05, "tps": 146841, "wall": 12635.8} {"step": 28312, "train_loss": 3.1719281673431396, "lr": 4.4934245831063134e-05, "tps": 146794, "wall": 12640.3} {"step": 28313, "train_loss": 3.2425761222839355, "lr": 4.492979187666784e-05, "tps": 146747, "wall": 12644.7} {"step": 28314, "train_loss": 3.287318229675293, "lr": 4.492533990547736e-05, "tps": 146700, "wall": 12649.2} {"step": 28315, "train_loss": 3.0821261405944824, "lr": 4.492088991754206e-05, "tps": 146653, "wall": 12653.7} {"step": 28316, "train_loss": 3.2140345573425293, "lr": 4.491644191291242e-05, "tps": 146606, "wall": 12658.2} {"step": 28317, "train_loss": 3.124516010284424, "lr": 4.49119958916388e-05, "tps": 146559, "wall": 12662.8} {"step": 28318, "train_loss": 3.2157652378082275, "lr": 4.490755185377154e-05, "tps": 146512, "wall": 12667.3} {"step": 28319, "train_loss": 3.187229633331299, "lr": 4.490310979936103e-05, "tps": 146465, "wall": 12671.8} {"step": 28320, "train_loss": 3.1729235649108887, "lr": 4.489866972845757e-05, "tps": 146418, "wall": 12676.3} {"step": 28321, "train_loss": 3.281627655029297, "lr": 4.4894231641111404e-05, "tps": 146372, "wall": 12680.7} {"step": 28322, "train_loss": 3.2106027603149414, "lr": 4.48897955373729e-05, "tps": 146325, "wall": 12685.2} {"step": 28323, "train_loss": 3.21297025680542, "lr": 4.488536141729227e-05, "tps": 146279, "wall": 12689.7} {"step": 28324, "train_loss": 3.1254658699035645, "lr": 4.4880929280919695e-05, "tps": 146232, "wall": 12694.2} {"step": 28325, "train_loss": 3.0971460342407227, "lr": 4.487649912830546e-05, "tps": 146186, "wall": 12698.7} {"step": 28326, "train_loss": 3.1829192638397217, "lr": 4.4872070959499724e-05, "tps": 146139, "wall": 12703.2} {"step": 28327, "train_loss": 3.181868314743042, "lr": 4.48676447745526e-05, "tps": 146093, "wall": 12707.7} {"step": 28328, "train_loss": 3.1405751705169678, "lr": 4.486322057351432e-05, "tps": 146046, "wall": 12712.1} {"step": 28329, "train_loss": 3.2332396507263184, "lr": 4.485879835643494e-05, "tps": 146000, "wall": 12716.6} {"step": 28330, "train_loss": 3.187971591949463, "lr": 4.485437812336455e-05, "tps": 145953, "wall": 12721.2} {"step": 28331, "train_loss": 3.191375255584717, "lr": 4.4849959874353236e-05, "tps": 145907, "wall": 12725.7} {"step": 28332, "train_loss": 3.204841136932373, "lr": 4.484554360945106e-05, "tps": 145861, "wall": 12730.1} {"step": 28333, "train_loss": 3.0890085697174072, "lr": 4.484112932870805e-05, "tps": 145814, "wall": 12734.6} {"step": 28334, "train_loss": 3.202188014984131, "lr": 4.483671703217421e-05, "tps": 145768, "wall": 12739.1} {"step": 28335, "train_loss": 3.250922441482544, "lr": 4.4832306719899486e-05, "tps": 145722, "wall": 12743.6} {"step": 28336, "train_loss": 3.2767341136932373, "lr": 4.48278983919339e-05, "tps": 145676, "wall": 12748.1} {"step": 28337, "train_loss": 3.1725594997406006, "lr": 4.482349204832735e-05, "tps": 145630, "wall": 12752.5} {"step": 28338, "train_loss": 3.168043613433838, "lr": 4.481908768912973e-05, "tps": 145584, "wall": 12757.0} {"step": 28339, "train_loss": 3.194516181945801, "lr": 4.4814685314391005e-05, "tps": 145538, "wall": 12761.5} {"step": 28340, "train_loss": 3.1894564628601074, "lr": 4.4810284924160986e-05, "tps": 145492, "wall": 12766.0} {"step": 28341, "train_loss": 3.1498074531555176, "lr": 4.4805886518489507e-05, "tps": 145446, "wall": 12770.5} {"step": 28342, "train_loss": 3.3211984634399414, "lr": 4.480149009742646e-05, "tps": 145400, "wall": 12775.0} {"step": 28343, "train_loss": 3.1221776008605957, "lr": 4.4797095661021623e-05, "tps": 145353, "wall": 12779.5} {"step": 28344, "train_loss": 3.1734132766723633, "lr": 4.4792703209324715e-05, "tps": 145308, "wall": 12784.0} {"step": 28345, "train_loss": 3.1384963989257812, "lr": 4.478831274238558e-05, "tps": 145262, "wall": 12788.5} {"step": 28346, "train_loss": 3.194732427597046, "lr": 4.478392426025392e-05, "tps": 145216, "wall": 12793.0} {"step": 28347, "train_loss": 3.175283193588257, "lr": 4.477953776297941e-05, "tps": 145170, "wall": 12797.5} {"step": 28348, "train_loss": 3.172863721847534, "lr": 4.477515325061181e-05, "tps": 145125, "wall": 12801.9} {"step": 28349, "train_loss": 3.199604034423828, "lr": 4.477077072320074e-05, "tps": 145079, "wall": 12806.4} {"step": 28350, "train_loss": 3.1486289501190186, "lr": 4.476639018079585e-05, "tps": 145033, "wall": 12810.9} {"step": 28351, "train_loss": 3.1738033294677734, "lr": 4.476201162344679e-05, "tps": 144987, "wall": 12815.4} {"step": 28352, "train_loss": 3.1817948818206787, "lr": 4.475763505120312e-05, "tps": 144942, "wall": 12819.9} {"step": 28353, "train_loss": 3.1568970680236816, "lr": 4.4753260464114466e-05, "tps": 144896, "wall": 12824.3} {"step": 28354, "train_loss": 3.168555974960327, "lr": 4.474888786223035e-05, "tps": 144851, "wall": 12828.8} {"step": 28355, "train_loss": 3.1321864128112793, "lr": 4.47445172456003e-05, "tps": 144805, "wall": 12833.3} {"step": 28356, "train_loss": 3.1625499725341797, "lr": 4.474014861427387e-05, "tps": 144760, "wall": 12837.8} {"step": 28357, "train_loss": 3.161447048187256, "lr": 4.47357819683005e-05, "tps": 144714, "wall": 12842.3} {"step": 28358, "train_loss": 3.1466622352600098, "lr": 4.4731417307729655e-05, "tps": 144669, "wall": 12846.8} {"step": 28359, "train_loss": 3.134805917739868, "lr": 4.472705463261081e-05, "tps": 144623, "wall": 12851.3} {"step": 28360, "train_loss": 3.1375393867492676, "lr": 4.47226939429934e-05, "tps": 144578, "wall": 12855.8} {"step": 28361, "train_loss": 3.2132363319396973, "lr": 4.4718335238926755e-05, "tps": 144532, "wall": 12860.3} {"step": 28362, "train_loss": 3.2273340225219727, "lr": 4.47139785204603e-05, "tps": 144487, "wall": 12864.8} {"step": 28363, "train_loss": 3.0670130252838135, "lr": 4.4709623787643394e-05, "tps": 144442, "wall": 12869.2} {"step": 28364, "train_loss": 3.194286584854126, "lr": 4.470527104052534e-05, "tps": 144397, "wall": 12873.7} {"step": 28365, "train_loss": 3.151817798614502, "lr": 4.4700920279155475e-05, "tps": 144351, "wall": 12878.2} {"step": 28366, "train_loss": 3.1584091186523438, "lr": 4.469657150358307e-05, "tps": 144306, "wall": 12882.7} {"step": 28367, "train_loss": 3.2218003273010254, "lr": 4.469222471385735e-05, "tps": 144261, "wall": 12887.2} {"step": 28368, "train_loss": 3.2382540702819824, "lr": 4.468787991002763e-05, "tps": 144216, "wall": 12891.7} {"step": 28369, "train_loss": 3.1100282669067383, "lr": 4.468353709214307e-05, "tps": 144171, "wall": 12896.1} {"step": 28370, "train_loss": 3.1313931941986084, "lr": 4.467919626025289e-05, "tps": 144125, "wall": 12900.7} {"step": 28371, "train_loss": 3.139634847640991, "lr": 4.4674857414406265e-05, "tps": 144080, "wall": 12905.2} {"step": 28372, "train_loss": 3.2510628700256348, "lr": 4.4670520554652326e-05, "tps": 144035, "wall": 12909.7} {"step": 28373, "train_loss": 3.1403517723083496, "lr": 4.466618568104024e-05, "tps": 143990, "wall": 12914.2} {"step": 28374, "train_loss": 3.1963212490081787, "lr": 4.4661852793619086e-05, "tps": 143945, "wall": 12918.7} {"step": 28375, "train_loss": 3.165159225463867, "lr": 4.4657521892437926e-05, "tps": 143900, "wall": 12923.2} {"step": 28376, "train_loss": 3.1212663650512695, "lr": 4.465319297754586e-05, "tps": 143855, "wall": 12927.6} {"step": 28377, "train_loss": 3.1103527545928955, "lr": 4.4648866048991924e-05, "tps": 143810, "wall": 12932.1} {"step": 28378, "train_loss": 3.184807062149048, "lr": 4.464454110682508e-05, "tps": 143766, "wall": 12936.6} {"step": 28379, "train_loss": 3.2673633098602295, "lr": 4.464021815109439e-05, "tps": 143721, "wall": 12941.1} {"step": 28380, "train_loss": 3.1157798767089844, "lr": 4.463589718184879e-05, "tps": 143676, "wall": 12945.6} {"step": 28381, "train_loss": 3.1737961769104004, "lr": 4.463157819913724e-05, "tps": 143631, "wall": 12950.1} {"step": 28382, "train_loss": 3.3215131759643555, "lr": 4.462726120300864e-05, "tps": 143587, "wall": 12954.6} {"step": 28383, "train_loss": 3.2141153812408447, "lr": 4.462294619351193e-05, "tps": 143541, "wall": 12959.1} {"step": 28384, "train_loss": 3.2062273025512695, "lr": 4.4618633170695953e-05, "tps": 143497, "wall": 12963.6} {"step": 28385, "train_loss": 3.1914353370666504, "lr": 4.461432213460962e-05, "tps": 143452, "wall": 12968.1} {"step": 28386, "train_loss": 3.1602702140808105, "lr": 4.461001308530171e-05, "tps": 143408, "wall": 12972.6} {"step": 28387, "train_loss": 3.1535186767578125, "lr": 4.460570602282106e-05, "tps": 143363, "wall": 12977.0} {"step": 28388, "train_loss": 3.1785459518432617, "lr": 4.460140094721648e-05, "tps": 143319, "wall": 12981.5} {"step": 28389, "train_loss": 3.2001116275787354, "lr": 4.45970978585367e-05, "tps": 143274, "wall": 12986.0} {"step": 28390, "train_loss": 3.1221089363098145, "lr": 4.4592796756830484e-05, "tps": 143229, "wall": 12990.6} {"step": 28391, "train_loss": 3.142024040222168, "lr": 4.4588497642146574e-05, "tps": 143185, "wall": 12995.0} {"step": 28392, "train_loss": 3.238530397415161, "lr": 4.458420051453364e-05, "tps": 143141, "wall": 12999.5} {"step": 28393, "train_loss": 3.2228522300720215, "lr": 4.457990537404037e-05, "tps": 143096, "wall": 13004.0} {"step": 28394, "train_loss": 3.204296827316284, "lr": 4.457561222071542e-05, "tps": 143052, "wall": 13008.5} {"step": 28395, "train_loss": 3.0773138999938965, "lr": 4.457132105460744e-05, "tps": 143008, "wall": 13013.0} {"step": 28396, "train_loss": 3.1430423259735107, "lr": 4.4567031875765017e-05, "tps": 142963, "wall": 13017.5} {"step": 28397, "train_loss": 3.1789937019348145, "lr": 4.456274468423675e-05, "tps": 142919, "wall": 13022.0} {"step": 28398, "train_loss": 3.2254390716552734, "lr": 4.455845948007118e-05, "tps": 142874, "wall": 13026.5} {"step": 28399, "train_loss": 3.1434857845306396, "lr": 4.4554176263316904e-05, "tps": 142830, "wall": 13031.0} {"step": 28400, "train_loss": 3.2367489337921143, "lr": 4.4549895034022405e-05, "tps": 142786, "wall": 13035.5} {"step": 28401, "train_loss": 3.1812238693237305, "lr": 4.454561579223617e-05, "tps": 142742, "wall": 13040.0} {"step": 28402, "train_loss": 3.2168145179748535, "lr": 4.45413385380067e-05, "tps": 142698, "wall": 13044.4} {"step": 28403, "train_loss": 3.176193952560425, "lr": 4.453706327138245e-05, "tps": 142654, "wall": 13048.9} {"step": 28404, "train_loss": 3.2130637168884277, "lr": 4.4532789992411826e-05, "tps": 142610, "wall": 13053.4} {"step": 28405, "train_loss": 3.1417746543884277, "lr": 4.452851870114325e-05, "tps": 142566, "wall": 13057.9} {"step": 28406, "train_loss": 3.1213467121124268, "lr": 4.452424939762509e-05, "tps": 142522, "wall": 13062.4} {"step": 28407, "train_loss": 3.2123448848724365, "lr": 4.451998208190577e-05, "tps": 142478, "wall": 13066.9} {"step": 28408, "train_loss": 3.170125961303711, "lr": 4.451571675403357e-05, "tps": 142434, "wall": 13071.4} {"step": 28409, "train_loss": 3.061156988143921, "lr": 4.451145341405682e-05, "tps": 142390, "wall": 13075.8} {"step": 28410, "train_loss": 3.2667465209960938, "lr": 4.4507192062023816e-05, "tps": 142346, "wall": 13080.4} {"step": 28411, "train_loss": 3.0921969413757324, "lr": 4.450293269798283e-05, "tps": 142302, "wall": 13084.9} {"step": 28412, "train_loss": 3.1400952339172363, "lr": 4.449867532198213e-05, "tps": 142258, "wall": 13089.4} {"step": 28413, "train_loss": 3.337413787841797, "lr": 4.4494419934069924e-05, "tps": 142214, "wall": 13093.9} {"step": 28414, "train_loss": 3.143331527709961, "lr": 4.44901665342944e-05, "tps": 142171, "wall": 13098.3} {"step": 28415, "train_loss": 3.117234706878662, "lr": 4.44859151227038e-05, "tps": 142127, "wall": 13102.8} {"step": 28416, "train_loss": 3.140864849090576, "lr": 4.448166569934623e-05, "tps": 142083, "wall": 13107.3} {"step": 28417, "train_loss": 3.211177349090576, "lr": 4.447741826426984e-05, "tps": 142040, "wall": 13111.8} {"step": 28418, "train_loss": 3.1733150482177734, "lr": 4.447317281752278e-05, "tps": 141996, "wall": 13116.3} {"step": 28419, "train_loss": 3.107816696166992, "lr": 4.446892935915309e-05, "tps": 141952, "wall": 13120.8} {"step": 28420, "train_loss": 3.141817808151245, "lr": 4.4464687889208865e-05, "tps": 141909, "wall": 13125.3} {"step": 28421, "train_loss": 3.0650150775909424, "lr": 4.4460448407738164e-05, "tps": 141866, "wall": 13129.7} {"step": 28422, "train_loss": 3.264425277709961, "lr": 4.4456210914788993e-05, "tps": 141822, "wall": 13134.2} {"step": 28423, "train_loss": 3.175159454345703, "lr": 4.445197541040935e-05, "tps": 141778, "wall": 13138.8} {"step": 28424, "train_loss": 3.214200496673584, "lr": 4.4447741894647255e-05, "tps": 141735, "wall": 13143.2} {"step": 28425, "train_loss": 3.0750064849853516, "lr": 4.444351036755062e-05, "tps": 141691, "wall": 13147.7} {"step": 28426, "train_loss": 3.2234811782836914, "lr": 4.443928082916739e-05, "tps": 141648, "wall": 13152.2} {"step": 28427, "train_loss": 3.167006492614746, "lr": 4.44350532795455e-05, "tps": 141605, "wall": 13156.7} {"step": 28428, "train_loss": 3.17712664604187, "lr": 4.443082771873283e-05, "tps": 141562, "wall": 13161.2} {"step": 28429, "train_loss": 3.2652649879455566, "lr": 4.4426604146777207e-05, "tps": 141518, "wall": 13165.7} {"step": 28430, "train_loss": 3.1995911598205566, "lr": 4.4422382563726536e-05, "tps": 141475, "wall": 13170.1} {"step": 28431, "train_loss": 3.176118850708008, "lr": 4.4418162969628604e-05, "tps": 141432, "wall": 13174.6} {"step": 28432, "train_loss": 3.1571011543273926, "lr": 4.4413945364531215e-05, "tps": 141389, "wall": 13179.1} {"step": 28433, "train_loss": 3.2017300128936768, "lr": 4.440972974848218e-05, "tps": 141346, "wall": 13183.6} {"step": 28434, "train_loss": 3.1899025440216064, "lr": 4.44055161215292e-05, "tps": 141302, "wall": 13188.1} {"step": 28435, "train_loss": 3.0748677253723145, "lr": 4.4401304483720034e-05, "tps": 141259, "wall": 13192.6} {"step": 28436, "train_loss": 3.131269931793213, "lr": 4.4397094835102426e-05, "tps": 141216, "wall": 13197.1} {"step": 28437, "train_loss": 3.150315284729004, "lr": 4.439288717572398e-05, "tps": 141173, "wall": 13201.6} {"step": 28438, "train_loss": 3.148843765258789, "lr": 4.438868150563242e-05, "tps": 141130, "wall": 13206.1} {"step": 28439, "train_loss": 3.1404829025268555, "lr": 4.438447782487539e-05, "tps": 141087, "wall": 13210.6} {"step": 28440, "train_loss": 3.2027482986450195, "lr": 4.4380276133500484e-05, "tps": 141044, "wall": 13215.1} {"step": 28441, "train_loss": 3.167208194732666, "lr": 4.437607643155532e-05, "tps": 141001, "wall": 13219.5} {"step": 28442, "train_loss": 3.161680221557617, "lr": 4.4371878719087476e-05, "tps": 140958, "wall": 13224.0} {"step": 28443, "train_loss": 3.126652717590332, "lr": 4.4367682996144454e-05, "tps": 140916, "wall": 13228.5} {"step": 28444, "train_loss": 3.222970962524414, "lr": 4.4363489262773865e-05, "tps": 140873, "wall": 13233.0} {"step": 28445, "train_loss": 3.143561363220215, "lr": 4.4359297519023144e-05, "tps": 140830, "wall": 13237.4} {"step": 28446, "train_loss": 3.2461013793945312, "lr": 4.435510776493979e-05, "tps": 140787, "wall": 13241.9} {"step": 28447, "train_loss": 3.1675243377685547, "lr": 4.435092000057131e-05, "tps": 140745, "wall": 13246.4} {"step": 28448, "train_loss": 3.103984832763672, "lr": 4.4346734225965087e-05, "tps": 140702, "wall": 13250.9} {"step": 28449, "train_loss": 3.1879944801330566, "lr": 4.434255044116858e-05, "tps": 140659, "wall": 13255.4} {"step": 28450, "train_loss": 3.1783530712127686, "lr": 4.433836864622915e-05, "tps": 140616, "wall": 13259.9} {"step": 28451, "train_loss": 3.140387535095215, "lr": 4.433418884119418e-05, "tps": 140573, "wall": 13264.4} {"step": 28452, "train_loss": 3.1882946491241455, "lr": 4.433001102611104e-05, "tps": 140531, "wall": 13268.9} {"step": 28453, "train_loss": 3.199540853500366, "lr": 4.4325835201027025e-05, "tps": 140488, "wall": 13273.4} {"step": 28454, "train_loss": 3.1965854167938232, "lr": 4.4321661365989444e-05, "tps": 140446, "wall": 13277.9} {"step": 28455, "train_loss": 3.12141489982605, "lr": 4.431748952104561e-05, "tps": 140403, "wall": 13282.4} {"step": 28456, "train_loss": 3.1478188037872314, "lr": 4.431331966624276e-05, "tps": 140361, "wall": 13286.8} {"step": 28457, "train_loss": 3.1122446060180664, "lr": 4.4309151801628104e-05, "tps": 140318, "wall": 13291.3} {"step": 28458, "train_loss": 3.1602885723114014, "lr": 4.430498592724889e-05, "tps": 140276, "wall": 13295.8} {"step": 28459, "train_loss": 3.2460641860961914, "lr": 4.4300822043152305e-05, "tps": 140234, "wall": 13300.3} {"step": 28460, "train_loss": 3.205357551574707, "lr": 4.4296660149385505e-05, "tps": 140191, "wall": 13304.8} {"step": 28461, "train_loss": 3.3032119274139404, "lr": 4.429250024599567e-05, "tps": 140149, "wall": 13309.3} {"step": 28462, "train_loss": 3.1768765449523926, "lr": 4.428834233302988e-05, "tps": 140106, "wall": 13313.8} {"step": 28463, "train_loss": 3.1214101314544678, "lr": 4.428418641053524e-05, "tps": 140064, "wall": 13318.3} {"step": 28464, "train_loss": 3.2102317810058594, "lr": 4.428003247855887e-05, "tps": 140021, "wall": 13322.8} {"step": 28465, "train_loss": 3.193410873413086, "lr": 4.4275880537147766e-05, "tps": 139979, "wall": 13327.3} {"step": 28466, "train_loss": 3.1526331901550293, "lr": 4.4271730586349024e-05, "tps": 139937, "wall": 13331.8} {"step": 28467, "train_loss": 3.133688449859619, "lr": 4.426758262620962e-05, "tps": 139895, "wall": 13336.3} {"step": 28468, "train_loss": 3.1838717460632324, "lr": 4.426343665677651e-05, "tps": 139852, "wall": 13340.8} {"step": 28469, "train_loss": 3.0987515449523926, "lr": 4.425929267809675e-05, "tps": 139810, "wall": 13345.2} {"step": 28470, "train_loss": 3.1796841621398926, "lr": 4.4255150690217204e-05, "tps": 139768, "wall": 13349.7} {"step": 28471, "train_loss": 3.1736292839050293, "lr": 4.4251010693184816e-05, "tps": 139726, "wall": 13354.2} {"step": 28472, "train_loss": 3.3075523376464844, "lr": 4.424687268704649e-05, "tps": 139684, "wall": 13358.7} {"step": 28473, "train_loss": 3.064052104949951, "lr": 4.42427366718491e-05, "tps": 139642, "wall": 13363.2} {"step": 28474, "train_loss": 3.1619997024536133, "lr": 4.423860264763951e-05, "tps": 139600, "wall": 13367.7} {"step": 28475, "train_loss": 3.300569772720337, "lr": 4.423447061446452e-05, "tps": 139558, "wall": 13372.2} {"step": 28476, "train_loss": 3.1285295486450195, "lr": 4.4230340572370966e-05, "tps": 139516, "wall": 13376.7} {"step": 28477, "train_loss": 3.198395252227783, "lr": 4.4226212521405604e-05, "tps": 139474, "wall": 13381.2} {"step": 28478, "train_loss": 3.116077184677124, "lr": 4.422208646161523e-05, "tps": 139432, "wall": 13385.7} {"step": 28479, "train_loss": 3.094092845916748, "lr": 4.421796239304657e-05, "tps": 139390, "wall": 13390.2} {"step": 28480, "train_loss": 3.188800573348999, "lr": 4.421384031574633e-05, "tps": 139348, "wall": 13394.7} {"step": 28481, "train_loss": 3.2422876358032227, "lr": 4.420972022976123e-05, "tps": 139307, "wall": 13399.2} {"step": 28482, "train_loss": 3.228109121322632, "lr": 4.420560213513795e-05, "tps": 139265, "wall": 13403.7} {"step": 28483, "train_loss": 3.170149087905884, "lr": 4.420148603192308e-05, "tps": 139223, "wall": 13408.1} {"step": 28484, "train_loss": 3.172656297683716, "lr": 4.419737192016331e-05, "tps": 139181, "wall": 13412.6} {"step": 28485, "train_loss": 3.1541898250579834, "lr": 4.41932597999052e-05, "tps": 139140, "wall": 13417.1} {"step": 28486, "train_loss": 3.2738466262817383, "lr": 4.4189149671195366e-05, "tps": 139098, "wall": 13421.6} {"step": 28487, "train_loss": 3.1797332763671875, "lr": 4.418504153408038e-05, "tps": 139056, "wall": 13426.1} {"step": 28488, "train_loss": 3.1826276779174805, "lr": 4.418093538860672e-05, "tps": 139015, "wall": 13430.6} {"step": 28489, "train_loss": 3.178833484649658, "lr": 4.417683123482096e-05, "tps": 138973, "wall": 13435.1} {"step": 28490, "train_loss": 3.1637778282165527, "lr": 4.417272907276955e-05, "tps": 138931, "wall": 13439.6} {"step": 28491, "train_loss": 3.2142558097839355, "lr": 4.416862890249897e-05, "tps": 138890, "wall": 13444.1} {"step": 28492, "train_loss": 3.2474122047424316, "lr": 4.4164530724055706e-05, "tps": 138848, "wall": 13448.6} {"step": 28493, "train_loss": 3.2193641662597656, "lr": 4.416043453748614e-05, "tps": 138807, "wall": 13453.1} {"step": 28494, "train_loss": 3.125429391860962, "lr": 4.4156340342836666e-05, "tps": 138765, "wall": 13457.6} {"step": 28495, "train_loss": 3.159639358520508, "lr": 4.415224814015369e-05, "tps": 138724, "wall": 13462.0} {"step": 28496, "train_loss": 3.1025638580322266, "lr": 4.414815792948357e-05, "tps": 138682, "wall": 13466.5} {"step": 28497, "train_loss": 3.0872421264648438, "lr": 4.414406971087261e-05, "tps": 138641, "wall": 13471.0} {"step": 28498, "train_loss": 3.0959415435791016, "lr": 4.4139983484367166e-05, "tps": 138600, "wall": 13475.5} {"step": 28499, "train_loss": 3.1681971549987793, "lr": 4.413589925001349e-05, "tps": 138559, "wall": 13480.0} {"step": 28500, "train_loss": 3.2070441246032715, "lr": 4.413181700785785e-05, "tps": 138517, "wall": 13484.5} {"step": 28501, "train_loss": 3.1907496452331543, "lr": 4.4127736757946534e-05, "tps": 138474, "wall": 13489.1} {"step": 28502, "train_loss": 3.1672794818878174, "lr": 4.412365850032568e-05, "tps": 138433, "wall": 13493.6} {"step": 28503, "train_loss": 3.085698127746582, "lr": 4.411958223504159e-05, "tps": 138392, "wall": 13498.1} {"step": 28504, "train_loss": 3.024918556213379, "lr": 4.4115507962140375e-05, "tps": 138350, "wall": 13502.6} {"step": 28505, "train_loss": 3.128838539123535, "lr": 4.411143568166818e-05, "tps": 138309, "wall": 13507.2} {"step": 28506, "train_loss": 3.139244794845581, "lr": 4.4107365393671174e-05, "tps": 138268, "wall": 13511.6} {"step": 28507, "train_loss": 3.2169899940490723, "lr": 4.410329709819545e-05, "tps": 138227, "wall": 13516.1} {"step": 28508, "train_loss": 3.0859665870666504, "lr": 4.409923079528706e-05, "tps": 138186, "wall": 13520.6} {"step": 28509, "train_loss": 3.234921455383301, "lr": 4.4095166484992144e-05, "tps": 138145, "wall": 13525.1} {"step": 28510, "train_loss": 3.1263654232025146, "lr": 4.409110416735669e-05, "tps": 138104, "wall": 13529.6} {"step": 28511, "train_loss": 3.122891426086426, "lr": 4.408704384242669e-05, "tps": 138063, "wall": 13534.1} {"step": 28512, "train_loss": 3.1218204498291016, "lr": 4.40829855102482e-05, "tps": 138022, "wall": 13538.6} {"step": 28513, "train_loss": 3.179647922515869, "lr": 4.407892917086717e-05, "tps": 137981, "wall": 13543.0} {"step": 28514, "train_loss": 3.126904010772705, "lr": 4.407487482432953e-05, "tps": 137940, "wall": 13547.5} {"step": 28515, "train_loss": 3.1394224166870117, "lr": 4.407082247068125e-05, "tps": 137900, "wall": 13552.0} {"step": 28516, "train_loss": 3.1391568183898926, "lr": 4.40667721099682e-05, "tps": 137859, "wall": 13556.5} {"step": 28517, "train_loss": 3.186403751373291, "lr": 4.406272374223625e-05, "tps": 137818, "wall": 13561.0} {"step": 28518, "train_loss": 3.210501194000244, "lr": 4.405867736753134e-05, "tps": 137777, "wall": 13565.5} {"step": 28519, "train_loss": 3.160459041595459, "lr": 4.4054632985899206e-05, "tps": 137736, "wall": 13570.0} {"step": 28520, "train_loss": 3.1409239768981934, "lr": 4.4050590597385714e-05, "tps": 137695, "wall": 13574.5} {"step": 28521, "train_loss": 3.269592523574829, "lr": 4.404655020203666e-05, "tps": 137655, "wall": 13579.0} {"step": 28522, "train_loss": 3.260211706161499, "lr": 4.404251179989779e-05, "tps": 137614, "wall": 13583.4} {"step": 28523, "train_loss": 3.136643648147583, "lr": 4.403847539101487e-05, "tps": 137574, "wall": 13587.9} {"step": 28524, "train_loss": 3.196871757507324, "lr": 4.4034440975433644e-05, "tps": 137533, "wall": 13592.4} {"step": 28525, "train_loss": 3.1351919174194336, "lr": 4.403040855319976e-05, "tps": 137493, "wall": 13596.9} {"step": 28526, "train_loss": 3.1722376346588135, "lr": 4.402637812435895e-05, "tps": 137452, "wall": 13601.4} {"step": 28527, "train_loss": 3.1861791610717773, "lr": 4.402234968895683e-05, "tps": 137411, "wall": 13605.9} {"step": 28528, "train_loss": 3.142538070678711, "lr": 4.4018323247039044e-05, "tps": 137371, "wall": 13610.4} {"step": 28529, "train_loss": 3.026240825653076, "lr": 4.401429879865124e-05, "tps": 137330, "wall": 13614.9} {"step": 28530, "train_loss": 3.094698429107666, "lr": 4.4010276343838966e-05, "tps": 137289, "wall": 13619.4} {"step": 28531, "train_loss": 3.1673877239227295, "lr": 4.40062558826478e-05, "tps": 137249, "wall": 13623.9} {"step": 28532, "train_loss": 3.139963150024414, "lr": 4.4002237415123304e-05, "tps": 137209, "wall": 13628.4} {"step": 28533, "train_loss": 3.140200138092041, "lr": 4.3998220941310984e-05, "tps": 137168, "wall": 13632.9} {"step": 28534, "train_loss": 3.2792394161224365, "lr": 4.399420646125631e-05, "tps": 137128, "wall": 13637.3} {"step": 28535, "train_loss": 3.210510492324829, "lr": 4.39901939750048e-05, "tps": 137088, "wall": 13641.8} {"step": 28536, "train_loss": 3.1326937675476074, "lr": 4.398618348260191e-05, "tps": 137048, "wall": 13646.3} {"step": 28537, "train_loss": 3.155047655105591, "lr": 4.398217498409305e-05, "tps": 137007, "wall": 13650.8} {"step": 28538, "train_loss": 3.152984142303467, "lr": 4.397816847952362e-05, "tps": 136967, "wall": 13655.3} {"step": 28539, "train_loss": 3.110306978225708, "lr": 4.397416396893902e-05, "tps": 136927, "wall": 13659.8} {"step": 28540, "train_loss": 3.2390999794006348, "lr": 4.397016145238463e-05, "tps": 136887, "wall": 13664.2} {"step": 28541, "train_loss": 3.255035638809204, "lr": 4.3966160929905766e-05, "tps": 136847, "wall": 13668.7} {"step": 28542, "train_loss": 3.21315336227417, "lr": 4.396216240154775e-05, "tps": 136807, "wall": 13673.2} {"step": 28543, "train_loss": 3.1612844467163086, "lr": 4.39581658673559e-05, "tps": 136766, "wall": 13677.7} {"step": 28544, "train_loss": 3.2176311016082764, "lr": 4.3954171327375457e-05, "tps": 136726, "wall": 13682.3} {"step": 28545, "train_loss": 3.1672680377960205, "lr": 4.3950178781651685e-05, "tps": 136686, "wall": 13686.8} {"step": 28546, "train_loss": 3.0501177310943604, "lr": 4.394618823022982e-05, "tps": 136646, "wall": 13691.3} {"step": 28547, "train_loss": 3.1213788986206055, "lr": 4.394219967315506e-05, "tps": 136605, "wall": 13695.8} {"step": 28548, "train_loss": 3.2125296592712402, "lr": 4.393821311047255e-05, "tps": 136565, "wall": 13700.3} {"step": 28549, "train_loss": 3.1393637657165527, "lr": 4.393422854222754e-05, "tps": 136525, "wall": 13704.8} {"step": 28550, "train_loss": 3.1395208835601807, "lr": 4.3930245968465086e-05, "tps": 136485, "wall": 13709.2} {"step": 28551, "train_loss": 3.2333123683929443, "lr": 4.392626538923031e-05, "tps": 136446, "wall": 13713.7} {"step": 28552, "train_loss": 3.103442668914795, "lr": 4.392228680456837e-05, "tps": 136406, "wall": 13718.2} {"step": 28553, "train_loss": 3.1929104328155518, "lr": 4.3918310214524284e-05, "tps": 136366, "wall": 13722.7} {"step": 28554, "train_loss": 3.244053602218628, "lr": 4.3914335619143066e-05, "tps": 136326, "wall": 13727.2} {"step": 28555, "train_loss": 3.1305949687957764, "lr": 4.391036301846982e-05, "tps": 136286, "wall": 13731.7} {"step": 28556, "train_loss": 3.1601433753967285, "lr": 4.390639241254949e-05, "tps": 136247, "wall": 13736.2} {"step": 28557, "train_loss": 3.1329641342163086, "lr": 4.390242380142708e-05, "tps": 136206, "wall": 13740.7} {"step": 28558, "train_loss": 3.1597518920898438, "lr": 4.389845718514754e-05, "tps": 136167, "wall": 13745.2} {"step": 28559, "train_loss": 3.2619922161102295, "lr": 4.389449256375578e-05, "tps": 136127, "wall": 13749.7} {"step": 28560, "train_loss": 3.117262363433838, "lr": 4.389052993729678e-05, "tps": 136087, "wall": 13754.2} {"step": 28561, "train_loss": 3.1590123176574707, "lr": 4.388656930581535e-05, "tps": 136048, "wall": 13758.6} {"step": 28562, "train_loss": 3.1924855709075928, "lr": 4.38826106693564e-05, "tps": 136008, "wall": 13763.1} {"step": 28563, "train_loss": 3.2328929901123047, "lr": 4.387865402796478e-05, "tps": 135969, "wall": 13767.6} {"step": 28564, "train_loss": 3.1235456466674805, "lr": 4.387469938168527e-05, "tps": 135929, "wall": 13772.1} {"step": 28565, "train_loss": 3.1639902591705322, "lr": 4.38707467305627e-05, "tps": 135890, "wall": 13776.6} {"step": 28566, "train_loss": 3.1337027549743652, "lr": 4.386679607464184e-05, "tps": 135850, "wall": 13781.1} {"step": 28567, "train_loss": 3.1850953102111816, "lr": 4.386284741396746e-05, "tps": 135811, "wall": 13785.6} {"step": 28568, "train_loss": 3.2680563926696777, "lr": 4.385890074858424e-05, "tps": 135771, "wall": 13790.1} {"step": 28569, "train_loss": 3.154515027999878, "lr": 4.3854956078536955e-05, "tps": 135732, "wall": 13794.5} {"step": 28570, "train_loss": 3.1131222248077393, "lr": 4.385101340387024e-05, "tps": 135692, "wall": 13799.1} {"step": 28571, "train_loss": 3.1637895107269287, "lr": 4.384707272462877e-05, "tps": 135653, "wall": 13803.6} {"step": 28572, "train_loss": 3.282705307006836, "lr": 4.384313404085722e-05, "tps": 135613, "wall": 13808.1} {"step": 28573, "train_loss": 3.1648476123809814, "lr": 4.3839197352600135e-05, "tps": 135574, "wall": 13812.5} {"step": 28574, "train_loss": 3.107191562652588, "lr": 4.383526265990218e-05, "tps": 135534, "wall": 13817.0} {"step": 28575, "train_loss": 3.106480598449707, "lr": 4.38313299628079e-05, "tps": 135495, "wall": 13821.5} {"step": 28576, "train_loss": 3.232375383377075, "lr": 4.382739926136183e-05, "tps": 135456, "wall": 13826.0} {"step": 28577, "train_loss": 3.1559739112854004, "lr": 4.3823470555608507e-05, "tps": 135417, "wall": 13830.5} {"step": 28578, "train_loss": 3.1854989528656006, "lr": 4.3819543845592483e-05, "tps": 135378, "wall": 13835.0} {"step": 28579, "train_loss": 3.2181971073150635, "lr": 4.381561913135816e-05, "tps": 135338, "wall": 13839.5} {"step": 28580, "train_loss": 3.131978988647461, "lr": 4.381169641295004e-05, "tps": 135299, "wall": 13844.0} {"step": 28581, "train_loss": 3.1241512298583984, "lr": 4.3807775690412546e-05, "tps": 135260, "wall": 13848.5} {"step": 28582, "train_loss": 3.245730400085449, "lr": 4.380385696379013e-05, "tps": 135221, "wall": 13852.9} {"step": 28583, "train_loss": 3.170881509780884, "lr": 4.3799940233127126e-05, "tps": 135182, "wall": 13857.4} {"step": 28584, "train_loss": 3.121243476867676, "lr": 4.379602549846793e-05, "tps": 135142, "wall": 13862.0} {"step": 28585, "train_loss": 3.2764010429382324, "lr": 4.3792112759856916e-05, "tps": 135103, "wall": 13866.5} {"step": 28586, "train_loss": 3.081768035888672, "lr": 4.378820201733836e-05, "tps": 135064, "wall": 13871.0} {"step": 28587, "train_loss": 3.194791316986084, "lr": 4.378429327095659e-05, "tps": 135025, "wall": 13875.5} {"step": 28588, "train_loss": 3.2142348289489746, "lr": 4.378038652075589e-05, "tps": 134986, "wall": 13880.0} {"step": 28589, "train_loss": 3.1746602058410645, "lr": 4.377648176678049e-05, "tps": 134947, "wall": 13884.4} {"step": 28590, "train_loss": 3.1108882427215576, "lr": 4.377257900907464e-05, "tps": 134908, "wall": 13888.9} {"step": 28591, "train_loss": 3.272536277770996, "lr": 4.376867824768255e-05, "tps": 134869, "wall": 13893.4} {"step": 28592, "train_loss": 3.136932134628296, "lr": 4.3764779482648414e-05, "tps": 134830, "wall": 13897.9} {"step": 28593, "train_loss": 3.2322330474853516, "lr": 4.376088271401638e-05, "tps": 134792, "wall": 13902.4} {"step": 28594, "train_loss": 3.1317830085754395, "lr": 4.375698794183061e-05, "tps": 134753, "wall": 13906.9} {"step": 28595, "train_loss": 3.1760637760162354, "lr": 4.3753095166135205e-05, "tps": 134714, "wall": 13911.4} {"step": 28596, "train_loss": 3.3291096687316895, "lr": 4.374920438697427e-05, "tps": 134675, "wall": 13915.9} {"step": 28597, "train_loss": 3.233245372772217, "lr": 4.37453156043919e-05, "tps": 134636, "wall": 13920.4} {"step": 28598, "train_loss": 3.1437458992004395, "lr": 4.374142881843212e-05, "tps": 134597, "wall": 13924.9} {"step": 28599, "train_loss": 3.1047425270080566, "lr": 4.373754402913896e-05, "tps": 134559, "wall": 13929.4} {"step": 28600, "train_loss": 3.1803183555603027, "lr": 4.373366123655645e-05, "tps": 134520, "wall": 13933.9} {"step": 28601, "train_loss": 3.193237781524658, "lr": 4.372978044072856e-05, "tps": 134481, "wall": 13938.4} {"step": 28602, "train_loss": 3.08512806892395, "lr": 4.372590164169925e-05, "tps": 134443, "wall": 13942.9} {"step": 28603, "train_loss": 3.192598581314087, "lr": 4.372202483951248e-05, "tps": 134404, "wall": 13947.4} {"step": 28604, "train_loss": 3.091796636581421, "lr": 4.3718150034212116e-05, "tps": 134366, "wall": 13951.8} {"step": 28605, "train_loss": 3.144827127456665, "lr": 4.371427722584212e-05, "tps": 134327, "wall": 13956.3} {"step": 28606, "train_loss": 3.1125102043151855, "lr": 4.3710406414446306e-05, "tps": 134289, "wall": 13960.8} {"step": 28607, "train_loss": 3.1508307456970215, "lr": 4.3706537600068545e-05, "tps": 134250, "wall": 13965.3} {"step": 28608, "train_loss": 3.096651792526245, "lr": 4.3702670782752656e-05, "tps": 134212, "wall": 13969.8} {"step": 28609, "train_loss": 3.1894984245300293, "lr": 4.3698805962542474e-05, "tps": 134174, "wall": 13974.3} {"step": 28610, "train_loss": 3.2358124256134033, "lr": 4.3694943139481734e-05, "tps": 134135, "wall": 13978.8} {"step": 28611, "train_loss": 3.224691152572632, "lr": 4.369108231361423e-05, "tps": 134097, "wall": 13983.3} {"step": 28612, "train_loss": 3.1548001766204834, "lr": 4.36872234849837e-05, "tps": 134058, "wall": 13987.8} {"step": 28613, "train_loss": 3.1087520122528076, "lr": 4.368336665363381e-05, "tps": 134020, "wall": 13992.3} {"step": 28614, "train_loss": 3.0987954139709473, "lr": 4.367951181960828e-05, "tps": 133981, "wall": 13996.8} {"step": 28615, "train_loss": 3.1706416606903076, "lr": 4.3675658982950806e-05, "tps": 133943, "wall": 14001.3} {"step": 28616, "train_loss": 3.191234827041626, "lr": 4.367180814370499e-05, "tps": 133905, "wall": 14005.8} {"step": 28617, "train_loss": 3.1456708908081055, "lr": 4.3667959301914476e-05, "tps": 133866, "wall": 14010.3} {"step": 28618, "train_loss": 3.150465488433838, "lr": 4.366411245762284e-05, "tps": 133828, "wall": 14014.7} {"step": 28619, "train_loss": 3.043858289718628, "lr": 4.3660267610873686e-05, "tps": 133790, "wall": 14019.2} {"step": 28620, "train_loss": 3.04733943939209, "lr": 4.3656424761710576e-05, "tps": 133752, "wall": 14023.7} {"step": 28621, "train_loss": 3.0928492546081543, "lr": 4.3652583910177e-05, "tps": 133714, "wall": 14028.2} {"step": 28622, "train_loss": 3.2267403602600098, "lr": 4.364874505631653e-05, "tps": 133676, "wall": 14032.7} {"step": 28623, "train_loss": 3.159067153930664, "lr": 4.36449082001726e-05, "tps": 133638, "wall": 14037.2} {"step": 28624, "train_loss": 3.205686569213867, "lr": 4.364107334178868e-05, "tps": 133599, "wall": 14041.7} {"step": 28625, "train_loss": 3.0939245223999023, "lr": 4.363724048120822e-05, "tps": 133561, "wall": 14046.2} {"step": 28626, "train_loss": 3.2641825675964355, "lr": 4.3633409618474665e-05, "tps": 133523, "wall": 14050.7} {"step": 28627, "train_loss": 3.1475367546081543, "lr": 4.362958075363136e-05, "tps": 133485, "wall": 14055.2} {"step": 28628, "train_loss": 3.2988176345825195, "lr": 4.362575388672172e-05, "tps": 133447, "wall": 14059.6} {"step": 28629, "train_loss": 3.18009352684021, "lr": 4.3621929017789084e-05, "tps": 133410, "wall": 14064.1} {"step": 28630, "train_loss": 3.2613186836242676, "lr": 4.361810614687675e-05, "tps": 133372, "wall": 14068.6} {"step": 28631, "train_loss": 3.2648532390594482, "lr": 4.36142852740281e-05, "tps": 133334, "wall": 14073.1} {"step": 28632, "train_loss": 3.1187667846679688, "lr": 4.361046639928634e-05, "tps": 133296, "wall": 14077.6} {"step": 28633, "train_loss": 3.1686997413635254, "lr": 4.360664952269475e-05, "tps": 133258, "wall": 14082.1} {"step": 28634, "train_loss": 3.1386818885803223, "lr": 4.3602834644296596e-05, "tps": 133220, "wall": 14086.6} {"step": 28635, "train_loss": 3.186145305633545, "lr": 4.359902176413506e-05, "tps": 133182, "wall": 14091.1} {"step": 28636, "train_loss": 3.241180419921875, "lr": 4.3595210882253356e-05, "tps": 133144, "wall": 14095.6} {"step": 28637, "train_loss": 3.2159268856048584, "lr": 4.359140199869466e-05, "tps": 133106, "wall": 14100.1} {"step": 28638, "train_loss": 3.1366097927093506, "lr": 4.358759511350208e-05, "tps": 133069, "wall": 14104.6} {"step": 28639, "train_loss": 3.216886043548584, "lr": 4.358379022671878e-05, "tps": 133031, "wall": 14109.1} {"step": 28640, "train_loss": 3.2184174060821533, "lr": 4.357998733838786e-05, "tps": 132993, "wall": 14113.6} {"step": 28641, "train_loss": 3.0680148601531982, "lr": 4.357618644855237e-05, "tps": 132955, "wall": 14118.1} {"step": 28642, "train_loss": 3.1681017875671387, "lr": 4.357238755725539e-05, "tps": 132918, "wall": 14122.6} {"step": 28643, "train_loss": 3.19332218170166, "lr": 4.356859066453994e-05, "tps": 132880, "wall": 14127.0} {"step": 28644, "train_loss": 3.100665807723999, "lr": 4.3564795770449046e-05, "tps": 132843, "wall": 14131.5} {"step": 28645, "train_loss": 3.1889235973358154, "lr": 4.356100287502569e-05, "tps": 132805, "wall": 14136.0} {"step": 28646, "train_loss": 3.2061965465545654, "lr": 4.355721197831285e-05, "tps": 132768, "wall": 14140.5} {"step": 28647, "train_loss": 3.2014245986938477, "lr": 4.3553423080353427e-05, "tps": 132730, "wall": 14145.0} {"step": 28648, "train_loss": 3.288958787918091, "lr": 4.35496361811904e-05, "tps": 132693, "wall": 14149.5} {"step": 28649, "train_loss": 3.139070510864258, "lr": 4.3545851280866644e-05, "tps": 132655, "wall": 14154.0} {"step": 28650, "train_loss": 3.1360743045806885, "lr": 4.354206837942501e-05, "tps": 132618, "wall": 14158.5} {"step": 28651, "train_loss": 3.0626232624053955, "lr": 4.35382874769084e-05, "tps": 132580, "wall": 14163.0} {"step": 28652, "train_loss": 3.0809924602508545, "lr": 4.353450857335958e-05, "tps": 132543, "wall": 14167.5} {"step": 28653, "train_loss": 3.1944446563720703, "lr": 4.3530731668821414e-05, "tps": 132505, "wall": 14172.0} {"step": 28654, "train_loss": 3.178447723388672, "lr": 4.352695676333668e-05, "tps": 132468, "wall": 14176.4} {"step": 28655, "train_loss": 3.1401851177215576, "lr": 4.352318385694809e-05, "tps": 132431, "wall": 14180.9} {"step": 28656, "train_loss": 3.1822264194488525, "lr": 4.351941294969845e-05, "tps": 132394, "wall": 14185.4} {"step": 28657, "train_loss": 3.0574097633361816, "lr": 4.351564404163044e-05, "tps": 132356, "wall": 14189.9} {"step": 28658, "train_loss": 3.243393898010254, "lr": 4.351187713278675e-05, "tps": 132319, "wall": 14194.4} {"step": 28659, "train_loss": 3.256403684616089, "lr": 4.350811222321009e-05, "tps": 132282, "wall": 14198.9} {"step": 28660, "train_loss": 3.310210943222046, "lr": 4.350434931294307e-05, "tps": 132245, "wall": 14203.4} {"step": 28661, "train_loss": 3.101320266723633, "lr": 4.3500588402028314e-05, "tps": 132208, "wall": 14207.8} {"step": 28662, "train_loss": 3.274808883666992, "lr": 4.3496829490508465e-05, "tps": 132171, "wall": 14212.3} {"step": 28663, "train_loss": 3.30881929397583, "lr": 4.3493072578426076e-05, "tps": 132133, "wall": 14216.8} {"step": 28664, "train_loss": 3.2106642723083496, "lr": 4.348931766582369e-05, "tps": 132096, "wall": 14221.4} {"step": 28665, "train_loss": 3.1591598987579346, "lr": 4.3485564752743886e-05, "tps": 132059, "wall": 14225.9} {"step": 28666, "train_loss": 3.158545970916748, "lr": 4.3481813839229134e-05, "tps": 132021, "wall": 14230.4} {"step": 28667, "train_loss": 3.130293846130371, "lr": 4.347806492532195e-05, "tps": 131984, "wall": 14234.8} {"step": 28668, "train_loss": 3.092961311340332, "lr": 4.34743180110648e-05, "tps": 131948, "wall": 14239.3} {"step": 28669, "train_loss": 3.1755709648132324, "lr": 4.3470573096500136e-05, "tps": 131911, "wall": 14243.8} {"step": 28670, "train_loss": 3.241039514541626, "lr": 4.3466830181670336e-05, "tps": 131874, "wall": 14248.3} {"step": 28671, "train_loss": 3.1088643074035645, "lr": 4.346308926661787e-05, "tps": 131837, "wall": 14252.8} {"step": 28672, "train_loss": 3.16291880607605, "lr": 4.345935035138506e-05, "tps": 131800, "wall": 14257.3} {"step": 28673, "train_loss": 3.211639404296875, "lr": 4.345561343601428e-05, "tps": 131763, "wall": 14261.8} {"step": 28674, "train_loss": 3.068725347518921, "lr": 4.3451878520547875e-05, "tps": 131726, "wall": 14266.2} {"step": 28675, "train_loss": 3.2249932289123535, "lr": 4.3448145605028124e-05, "tps": 131689, "wall": 14270.7} {"step": 28676, "train_loss": 3.1915433406829834, "lr": 4.344441468949735e-05, "tps": 131653, "wall": 14275.2} {"step": 28677, "train_loss": 3.166372776031494, "lr": 4.344068577399781e-05, "tps": 131615, "wall": 14279.8} {"step": 28678, "train_loss": 3.189417839050293, "lr": 4.3436958858571694e-05, "tps": 131578, "wall": 14284.3} {"step": 28679, "train_loss": 3.143436908721924, "lr": 4.343323394326128e-05, "tps": 131542, "wall": 14288.7} {"step": 28680, "train_loss": 3.225041389465332, "lr": 4.342951102810875e-05, "tps": 131505, "wall": 14293.2} {"step": 28681, "train_loss": 3.203730583190918, "lr": 4.342579011315624e-05, "tps": 131468, "wall": 14297.7} {"step": 28682, "train_loss": 3.060004234313965, "lr": 4.342207119844598e-05, "tps": 131431, "wall": 14302.2} {"step": 28683, "train_loss": 3.175576686859131, "lr": 4.341835428402001e-05, "tps": 131395, "wall": 14306.7} {"step": 28684, "train_loss": 3.170567750930786, "lr": 4.3414639369920494e-05, "tps": 131358, "wall": 14311.2} {"step": 28685, "train_loss": 3.1992995738983154, "lr": 4.341092645618949e-05, "tps": 131321, "wall": 14315.7} {"step": 28686, "train_loss": 3.228456497192383, "lr": 4.3407215542869075e-05, "tps": 131285, "wall": 14320.2} {"step": 28687, "train_loss": 3.179027795791626, "lr": 4.340350663000127e-05, "tps": 131248, "wall": 14324.7} {"step": 28688, "train_loss": 3.078547477722168, "lr": 4.3399799717628086e-05, "tps": 131212, "wall": 14329.2} {"step": 28689, "train_loss": 3.1893115043640137, "lr": 4.339609480579153e-05, "tps": 131175, "wall": 14333.7} {"step": 28690, "train_loss": 3.1445112228393555, "lr": 4.339239189453357e-05, "tps": 131139, "wall": 14338.1} {"step": 28691, "train_loss": 3.2239270210266113, "lr": 4.338869098389616e-05, "tps": 131102, "wall": 14342.7} {"step": 28692, "train_loss": 3.1357882022857666, "lr": 4.3384992073921186e-05, "tps": 131065, "wall": 14347.2} {"step": 28693, "train_loss": 3.141495704650879, "lr": 4.338129516465059e-05, "tps": 131029, "wall": 14351.7} {"step": 28694, "train_loss": 3.0833303928375244, "lr": 4.337760025612625e-05, "tps": 130992, "wall": 14356.2} {"step": 28695, "train_loss": 3.0857033729553223, "lr": 4.3373907348390005e-05, "tps": 130956, "wall": 14360.7} {"step": 28696, "train_loss": 3.2366349697113037, "lr": 4.337021644148367e-05, "tps": 130920, "wall": 14365.1} {"step": 28697, "train_loss": 3.2825114727020264, "lr": 4.336652753544912e-05, "tps": 130883, "wall": 14369.6} {"step": 28698, "train_loss": 3.203341007232666, "lr": 4.336284063032806e-05, "tps": 130847, "wall": 14374.1} {"step": 28699, "train_loss": 3.1054952144622803, "lr": 4.3359155726162315e-05, "tps": 130811, "wall": 14378.6} {"step": 28700, "train_loss": 3.160277843475342, "lr": 4.335547282299362e-05, "tps": 130774, "wall": 14383.1} {"step": 28701, "train_loss": 3.1216979026794434, "lr": 4.335179192086366e-05, "tps": 130738, "wall": 14387.6} {"step": 28702, "train_loss": 3.2099437713623047, "lr": 4.334811301981418e-05, "tps": 130702, "wall": 14392.1} {"step": 28703, "train_loss": 3.108520030975342, "lr": 4.334443611988683e-05, "tps": 130666, "wall": 14396.6} {"step": 28704, "train_loss": 3.154522180557251, "lr": 4.334076122112324e-05, "tps": 130629, "wall": 14401.1} {"step": 28705, "train_loss": 3.2258360385894775, "lr": 4.3337088323565084e-05, "tps": 130593, "wall": 14405.6} {"step": 28706, "train_loss": 3.2049312591552734, "lr": 4.333341742725394e-05, "tps": 130557, "wall": 14410.1} {"step": 28707, "train_loss": 3.1692631244659424, "lr": 4.332974853223143e-05, "tps": 130521, "wall": 14414.6} {"step": 28708, "train_loss": 3.2135863304138184, "lr": 4.332608163853906e-05, "tps": 130485, "wall": 14419.1} {"step": 28709, "train_loss": 3.1829495429992676, "lr": 4.332241674621838e-05, "tps": 130449, "wall": 14423.5} {"step": 28710, "train_loss": 3.0936312675476074, "lr": 4.3318753855310954e-05, "tps": 130413, "wall": 14428.0} {"step": 28711, "train_loss": 3.227736473083496, "lr": 4.3315092965858225e-05, "tps": 130377, "wall": 14432.5} {"step": 28712, "train_loss": 3.181877613067627, "lr": 4.3311434077901694e-05, "tps": 130341, "wall": 14437.0} {"step": 28713, "train_loss": 3.0544955730438232, "lr": 4.330777719148278e-05, "tps": 130305, "wall": 14441.5} {"step": 28714, "train_loss": 3.2484867572784424, "lr": 4.330412230664294e-05, "tps": 130269, "wall": 14446.0} {"step": 28715, "train_loss": 3.0913825035095215, "lr": 4.330046942342355e-05, "tps": 130233, "wall": 14450.4} {"step": 28716, "train_loss": 3.187991142272949, "lr": 4.3296818541866e-05, "tps": 130197, "wall": 14454.9} {"step": 28717, "train_loss": 3.2588319778442383, "lr": 4.3293169662011674e-05, "tps": 130161, "wall": 14459.5} {"step": 28718, "train_loss": 3.0866265296936035, "lr": 4.328952278390186e-05, "tps": 130125, "wall": 14463.9} {"step": 28719, "train_loss": 3.1572651863098145, "lr": 4.3285877907577895e-05, "tps": 130089, "wall": 14468.4} {"step": 28720, "train_loss": 3.176999568939209, "lr": 4.328223503308106e-05, "tps": 130053, "wall": 14472.9} {"step": 28721, "train_loss": 3.2187538146972656, "lr": 4.327859416045264e-05, "tps": 130018, "wall": 14477.4} {"step": 28722, "train_loss": 3.276949167251587, "lr": 4.3274955289733845e-05, "tps": 129982, "wall": 14481.9} {"step": 28723, "train_loss": 3.1624560356140137, "lr": 4.3271318420965945e-05, "tps": 129946, "wall": 14486.4} {"step": 28724, "train_loss": 3.213789939880371, "lr": 4.3267683554190075e-05, "tps": 129910, "wall": 14490.9} {"step": 28725, "train_loss": 3.1154918670654297, "lr": 4.326405068944748e-05, "tps": 129875, "wall": 14495.4} {"step": 28726, "train_loss": 3.157414674758911, "lr": 4.326041982677926e-05, "tps": 129839, "wall": 14499.8} {"step": 28727, "train_loss": 3.169253349304199, "lr": 4.325679096622657e-05, "tps": 129803, "wall": 14504.3} {"step": 28728, "train_loss": 3.159134864807129, "lr": 4.3253164107830536e-05, "tps": 129768, "wall": 14508.8} {"step": 28729, "train_loss": 3.274723529815674, "lr": 4.324953925163218e-05, "tps": 129732, "wall": 14513.3} {"step": 28730, "train_loss": 3.189865827560425, "lr": 4.324591639767265e-05, "tps": 129696, "wall": 14517.8} {"step": 28731, "train_loss": 3.1088294982910156, "lr": 4.32422955459929e-05, "tps": 129660, "wall": 14522.3} {"step": 28732, "train_loss": 3.1440882682800293, "lr": 4.3238676696634e-05, "tps": 129625, "wall": 14526.8} {"step": 28733, "train_loss": 3.181382656097412, "lr": 4.323505984963694e-05, "tps": 129589, "wall": 14531.3} {"step": 28734, "train_loss": 3.2197072505950928, "lr": 4.32314450050427e-05, "tps": 129554, "wall": 14535.8} {"step": 28735, "train_loss": 3.22023868560791, "lr": 4.3227832162892195e-05, "tps": 129518, "wall": 14540.3} {"step": 28736, "train_loss": 3.173330068588257, "lr": 4.3224221323226366e-05, "tps": 129483, "wall": 14544.8} {"step": 28737, "train_loss": 3.1610047817230225, "lr": 4.3220612486086144e-05, "tps": 129447, "wall": 14549.3} {"step": 28738, "train_loss": 3.2962660789489746, "lr": 4.3217005651512356e-05, "tps": 129412, "wall": 14553.8} {"step": 28739, "train_loss": 3.141331672668457, "lr": 4.3213400819545924e-05, "tps": 129377, "wall": 14558.3} {"step": 28740, "train_loss": 3.191351890563965, "lr": 4.320979799022764e-05, "tps": 129341, "wall": 14562.7} {"step": 28741, "train_loss": 3.1123974323272705, "lr": 4.320619716359831e-05, "tps": 129306, "wall": 14567.2} {"step": 28742, "train_loss": 3.06471848487854, "lr": 4.320259833969876e-05, "tps": 129271, "wall": 14571.7} {"step": 28743, "train_loss": 3.147369384765625, "lr": 4.3199001518569725e-05, "tps": 129235, "wall": 14576.2} {"step": 28744, "train_loss": 3.1043105125427246, "lr": 4.319540670025199e-05, "tps": 129200, "wall": 14580.7} {"step": 28745, "train_loss": 3.1433115005493164, "lr": 4.3191813884786254e-05, "tps": 129164, "wall": 14585.2} {"step": 28746, "train_loss": 3.04396390914917, "lr": 4.318822307221321e-05, "tps": 129129, "wall": 14589.7} {"step": 28747, "train_loss": 3.084320068359375, "lr": 4.318463426257352e-05, "tps": 129094, "wall": 14594.2} {"step": 28748, "train_loss": 3.135739326477051, "lr": 4.318104745590789e-05, "tps": 129059, "wall": 14598.7} {"step": 28749, "train_loss": 3.110996723175049, "lr": 4.317746265225688e-05, "tps": 129024, "wall": 14603.2} {"step": 28750, "train_loss": 3.1635019779205322, "lr": 4.3173879851661175e-05, "tps": 128988, "wall": 14607.7} {"step": 28751, "train_loss": 3.1619882583618164, "lr": 4.31702990541613e-05, "tps": 128953, "wall": 14612.2} {"step": 28752, "train_loss": 3.1273744106292725, "lr": 4.316672025979787e-05, "tps": 128918, "wall": 14616.7} {"step": 28753, "train_loss": 3.1050291061401367, "lr": 4.3163143468611374e-05, "tps": 128883, "wall": 14621.1} {"step": 28754, "train_loss": 3.28413724899292, "lr": 4.3159568680642356e-05, "tps": 128848, "wall": 14625.6} {"step": 28755, "train_loss": 3.1973118782043457, "lr": 4.315599589593133e-05, "tps": 128813, "wall": 14630.1} {"step": 28756, "train_loss": 3.1509647369384766, "lr": 4.315242511451874e-05, "tps": 128778, "wall": 14634.6} {"step": 28757, "train_loss": 3.17305588722229, "lr": 4.314885633644504e-05, "tps": 128742, "wall": 14639.2} {"step": 28758, "train_loss": 3.2132534980773926, "lr": 4.314528956175068e-05, "tps": 128707, "wall": 14643.7} {"step": 28759, "train_loss": 3.194357395172119, "lr": 4.3141724790476035e-05, "tps": 128672, "wall": 14648.2} {"step": 28760, "train_loss": 3.1906535625457764, "lr": 4.313816202266149e-05, "tps": 128637, "wall": 14652.7} {"step": 28761, "train_loss": 3.101656675338745, "lr": 4.313460125834742e-05, "tps": 128602, "wall": 14657.1} {"step": 28762, "train_loss": 3.28173565864563, "lr": 4.313104249757417e-05, "tps": 128567, "wall": 14661.6} {"step": 28763, "train_loss": 3.2446370124816895, "lr": 4.312748574038202e-05, "tps": 128532, "wall": 14666.1} {"step": 28764, "train_loss": 3.1023471355438232, "lr": 4.31239309868113e-05, "tps": 128497, "wall": 14670.6} {"step": 28765, "train_loss": 3.2027666568756104, "lr": 4.312037823690226e-05, "tps": 128463, "wall": 14675.1} {"step": 28766, "train_loss": 3.228471517562866, "lr": 4.3116827490695125e-05, "tps": 128428, "wall": 14679.6} {"step": 28767, "train_loss": 3.1485724449157715, "lr": 4.311327874823014e-05, "tps": 128393, "wall": 14684.1} {"step": 28768, "train_loss": 3.1379756927490234, "lr": 4.310973200954749e-05, "tps": 128358, "wall": 14688.6} {"step": 28769, "train_loss": 3.269500732421875, "lr": 4.3106187274687386e-05, "tps": 128324, "wall": 14693.0} {"step": 28770, "train_loss": 3.219558000564575, "lr": 4.310264454368996e-05, "tps": 128289, "wall": 14697.5} {"step": 28771, "train_loss": 3.227656364440918, "lr": 4.3099103816595344e-05, "tps": 128254, "wall": 14702.1} {"step": 28772, "train_loss": 3.1333234310150146, "lr": 4.309556509344366e-05, "tps": 128219, "wall": 14706.6} {"step": 28773, "train_loss": 3.1594576835632324, "lr": 4.309202837427498e-05, "tps": 128184, "wall": 14711.1} {"step": 28774, "train_loss": 3.171360969543457, "lr": 4.308849365912937e-05, "tps": 128150, "wall": 14715.5} {"step": 28775, "train_loss": 3.161806583404541, "lr": 4.308496094804686e-05, "tps": 128115, "wall": 14720.0} {"step": 28776, "train_loss": 3.1707773208618164, "lr": 4.3081430241067514e-05, "tps": 128081, "wall": 14724.5} {"step": 28777, "train_loss": 3.1652255058288574, "lr": 4.307790153823127e-05, "tps": 128046, "wall": 14729.0} {"step": 28778, "train_loss": 3.1383814811706543, "lr": 4.307437483957813e-05, "tps": 128011, "wall": 14733.5} {"step": 28779, "train_loss": 3.164034366607666, "lr": 4.307085014514807e-05, "tps": 127977, "wall": 14738.0} {"step": 28780, "train_loss": 3.19706654548645, "lr": 4.306732745498096e-05, "tps": 127942, "wall": 14742.5} {"step": 28781, "train_loss": 3.2172980308532715, "lr": 4.306380676911676e-05, "tps": 127908, "wall": 14747.0} {"step": 28782, "train_loss": 3.089829921722412, "lr": 4.306028808759532e-05, "tps": 127873, "wall": 14751.4} {"step": 28783, "train_loss": 3.2089104652404785, "lr": 4.305677141045649e-05, "tps": 127839, "wall": 14755.9} {"step": 28784, "train_loss": 3.141287326812744, "lr": 4.305325673774015e-05, "tps": 127804, "wall": 14760.5} {"step": 28785, "train_loss": 3.2894651889801025, "lr": 4.304974406948608e-05, "tps": 127770, "wall": 14764.9} {"step": 28786, "train_loss": 3.1847331523895264, "lr": 4.304623340573409e-05, "tps": 127735, "wall": 14769.4} {"step": 28787, "train_loss": 3.225283622741699, "lr": 4.304272474652394e-05, "tps": 127701, "wall": 14773.9} {"step": 28788, "train_loss": 3.15081787109375, "lr": 4.303921809189537e-05, "tps": 127666, "wall": 14778.4} {"step": 28789, "train_loss": 3.1597206592559814, "lr": 4.303571344188813e-05, "tps": 127632, "wall": 14782.9} {"step": 28790, "train_loss": 3.2586476802825928, "lr": 4.303221079654188e-05, "tps": 127598, "wall": 14787.4} {"step": 28791, "train_loss": 3.097010612487793, "lr": 4.302871015589632e-05, "tps": 127563, "wall": 14791.9} {"step": 28792, "train_loss": 3.3538408279418945, "lr": 4.302521151999112e-05, "tps": 127529, "wall": 14796.4} {"step": 28793, "train_loss": 3.1331119537353516, "lr": 4.302171488886589e-05, "tps": 127495, "wall": 14800.9} {"step": 28794, "train_loss": 3.156558036804199, "lr": 4.3018220262560246e-05, "tps": 127460, "wall": 14805.4} {"step": 28795, "train_loss": 3.0611841678619385, "lr": 4.301472764111379e-05, "tps": 127426, "wall": 14809.9} {"step": 28796, "train_loss": 3.089181423187256, "lr": 4.3011237024566056e-05, "tps": 127392, "wall": 14814.4} {"step": 28797, "train_loss": 3.1461310386657715, "lr": 4.3007748412956605e-05, "tps": 127358, "wall": 14818.9} {"step": 28798, "train_loss": 3.193474292755127, "lr": 4.300426180632498e-05, "tps": 127323, "wall": 14823.4} {"step": 28799, "train_loss": 3.1640806198120117, "lr": 4.3000777204710625e-05, "tps": 127289, "wall": 14827.9} {"step": 28800, "train_loss": 3.052002429962158, "lr": 4.299729460815305e-05, "tps": 127255, "wall": 14832.4} {"step": 28801, "train_loss": 3.108976125717163, "lr": 4.2993814016691706e-05, "tps": 127221, "wall": 14836.9} {"step": 28802, "train_loss": 3.1302971839904785, "lr": 4.299033543036601e-05, "tps": 127187, "wall": 14841.3} {"step": 28803, "train_loss": 3.142695426940918, "lr": 4.298685884921535e-05, "tps": 127153, "wall": 14845.8} {"step": 28804, "train_loss": 3.163323402404785, "lr": 4.298338427327916e-05, "tps": 127119, "wall": 14850.3} {"step": 28805, "train_loss": 3.1830947399139404, "lr": 4.297991170259673e-05, "tps": 127085, "wall": 14854.8} {"step": 28806, "train_loss": 3.139888286590576, "lr": 4.297644113720748e-05, "tps": 127051, "wall": 14859.3} {"step": 28807, "train_loss": 3.0749268531799316, "lr": 4.2972972577150666e-05, "tps": 127017, "wall": 14863.8} {"step": 28808, "train_loss": 3.2330942153930664, "lr": 4.2969506022465576e-05, "tps": 126983, "wall": 14868.2} {"step": 28809, "train_loss": 3.1421122550964355, "lr": 4.296604147319151e-05, "tps": 126949, "wall": 14872.7} {"step": 28810, "train_loss": 3.190783739089966, "lr": 4.296257892936773e-05, "tps": 126916, "wall": 14877.2} {"step": 28811, "train_loss": 3.335298776626587, "lr": 4.2959118391033407e-05, "tps": 126881, "wall": 14881.7} {"step": 28812, "train_loss": 3.1040198802948, "lr": 4.295565985822776e-05, "tps": 126847, "wall": 14886.2} {"step": 28813, "train_loss": 3.183454990386963, "lr": 4.295220333099e-05, "tps": 126814, "wall": 14890.7} {"step": 28814, "train_loss": 3.2229204177856445, "lr": 4.294874880935923e-05, "tps": 126780, "wall": 14895.2} {"step": 28815, "train_loss": 3.158761978149414, "lr": 4.294529629337465e-05, "tps": 126746, "wall": 14899.7} {"step": 28816, "train_loss": 3.1864638328552246, "lr": 4.2941845783075305e-05, "tps": 126712, "wall": 14904.2} {"step": 28817, "train_loss": 3.122230291366577, "lr": 4.293839727850033e-05, "tps": 126678, "wall": 14908.7} {"step": 28818, "train_loss": 3.1494688987731934, "lr": 4.2934950779688744e-05, "tps": 126645, "wall": 14913.2} {"step": 28819, "train_loss": 3.1391279697418213, "lr": 4.293150628667964e-05, "tps": 126611, "wall": 14917.7} {"step": 28820, "train_loss": 3.3079094886779785, "lr": 4.292806379951197e-05, "tps": 126577, "wall": 14922.2} {"step": 28821, "train_loss": 3.256087303161621, "lr": 4.292462331822483e-05, "tps": 126543, "wall": 14926.7} {"step": 28822, "train_loss": 3.140308380126953, "lr": 4.2921184842857096e-05, "tps": 126510, "wall": 14931.2} {"step": 28823, "train_loss": 3.114717483520508, "lr": 4.291774837344776e-05, "tps": 126476, "wall": 14935.6} {"step": 28824, "train_loss": 3.2088708877563477, "lr": 4.291431391003577e-05, "tps": 126442, "wall": 14940.2} {"step": 28825, "train_loss": 3.2243590354919434, "lr": 4.291088145266001e-05, "tps": 126408, "wall": 14944.7} {"step": 28826, "train_loss": 3.172966480255127, "lr": 4.290745100135936e-05, "tps": 126375, "wall": 14949.2} {"step": 28827, "train_loss": 3.0812931060791016, "lr": 4.29040225561727e-05, "tps": 126341, "wall": 14953.7} {"step": 28828, "train_loss": 3.2712655067443848, "lr": 4.290059611713883e-05, "tps": 126308, "wall": 14958.2} {"step": 28829, "train_loss": 3.1011390686035156, "lr": 4.28971716842966e-05, "tps": 126274, "wall": 14962.6} {"step": 28830, "train_loss": 3.20371675491333, "lr": 4.289374925768479e-05, "tps": 126241, "wall": 14967.1} {"step": 28831, "train_loss": 3.199552297592163, "lr": 4.2890328837342147e-05, "tps": 126207, "wall": 14971.6} {"step": 28832, "train_loss": 3.1779251098632812, "lr": 4.288691042330747e-05, "tps": 126174, "wall": 14976.1} {"step": 28833, "train_loss": 3.089323043823242, "lr": 4.288349401561946e-05, "tps": 126140, "wall": 14980.6} {"step": 28834, "train_loss": 3.176492691040039, "lr": 4.288007961431676e-05, "tps": 126107, "wall": 14985.1} {"step": 28835, "train_loss": 3.222689628601074, "lr": 4.287666721943816e-05, "tps": 126073, "wall": 14989.6} {"step": 28836, "train_loss": 3.0900392532348633, "lr": 4.287325683102223e-05, "tps": 126040, "wall": 14994.1} {"step": 28837, "train_loss": 3.085531234741211, "lr": 4.286984844910762e-05, "tps": 126007, "wall": 14998.6} {"step": 28838, "train_loss": 3.246298313140869, "lr": 4.286644207373298e-05, "tps": 125973, "wall": 15003.1} {"step": 28839, "train_loss": 3.1871023178100586, "lr": 4.286303770493683e-05, "tps": 125939, "wall": 15007.6} {"step": 28840, "train_loss": 3.1159255504608154, "lr": 4.285963534275779e-05, "tps": 125906, "wall": 15012.1} {"step": 28841, "train_loss": 3.173017978668213, "lr": 4.285623498723438e-05, "tps": 125873, "wall": 15016.6} {"step": 28842, "train_loss": 3.1856424808502197, "lr": 4.2852836638405116e-05, "tps": 125840, "wall": 15021.1} {"step": 28843, "train_loss": 3.1530659198760986, "lr": 4.2849440296308516e-05, "tps": 125806, "wall": 15025.6} {"step": 28844, "train_loss": 3.259401321411133, "lr": 4.284604596098304e-05, "tps": 125773, "wall": 15030.0} {"step": 28845, "train_loss": 3.234978675842285, "lr": 4.284265363246713e-05, "tps": 125740, "wall": 15034.5} {"step": 28846, "train_loss": 3.059607982635498, "lr": 4.2839263310799245e-05, "tps": 125707, "wall": 15039.0} {"step": 28847, "train_loss": 3.1835384368896484, "lr": 4.283587499601776e-05, "tps": 125674, "wall": 15043.5} {"step": 28848, "train_loss": 3.15010142326355, "lr": 4.283248868816105e-05, "tps": 125641, "wall": 15048.0} {"step": 28849, "train_loss": 3.184863805770874, "lr": 4.2829104387267506e-05, "tps": 125607, "wall": 15052.5} {"step": 28850, "train_loss": 3.199732780456543, "lr": 4.282572209337546e-05, "tps": 125574, "wall": 15057.0} {"step": 28851, "train_loss": 3.283424139022827, "lr": 4.2822341806523194e-05, "tps": 125541, "wall": 15061.5} {"step": 28852, "train_loss": 3.1739251613616943, "lr": 4.2818963526749044e-05, "tps": 125508, "wall": 15066.0} {"step": 28853, "train_loss": 3.1398673057556152, "lr": 4.281558725409126e-05, "tps": 125475, "wall": 15070.5} {"step": 28854, "train_loss": 3.1950061321258545, "lr": 4.2812212988588066e-05, "tps": 125442, "wall": 15075.0} {"step": 28855, "train_loss": 3.216005325317383, "lr": 4.280884073027775e-05, "tps": 125408, "wall": 15079.5} {"step": 28856, "train_loss": 3.118854522705078, "lr": 4.2805470479198454e-05, "tps": 125376, "wall": 15084.0} {"step": 28857, "train_loss": 3.0707499980926514, "lr": 4.2802102235388356e-05, "tps": 125343, "wall": 15088.5} {"step": 28858, "train_loss": 3.3178138732910156, "lr": 4.279873599888565e-05, "tps": 125310, "wall": 15093.0} {"step": 28859, "train_loss": 3.1160850524902344, "lr": 4.279537176972843e-05, "tps": 125277, "wall": 15097.5} {"step": 28860, "train_loss": 3.1776301860809326, "lr": 4.279200954795486e-05, "tps": 125244, "wall": 15102.0} {"step": 28861, "train_loss": 3.1604626178741455, "lr": 4.278864933360297e-05, "tps": 125211, "wall": 15106.5} {"step": 28862, "train_loss": 3.174955129623413, "lr": 4.2785291126710844e-05, "tps": 125178, "wall": 15110.9} {"step": 28863, "train_loss": 3.163606882095337, "lr": 4.2781934927316543e-05, "tps": 125145, "wall": 15115.4} {"step": 28864, "train_loss": 3.179236888885498, "lr": 4.2778580735458064e-05, "tps": 125112, "wall": 15120.0} {"step": 28865, "train_loss": 3.043910503387451, "lr": 4.2775228551173385e-05, "tps": 125079, "wall": 15124.5} {"step": 28866, "train_loss": 3.118722677230835, "lr": 4.277187837450053e-05, "tps": 125046, "wall": 15129.0} {"step": 28867, "train_loss": 3.1373510360717773, "lr": 4.276853020547744e-05, "tps": 125013, "wall": 15133.5} {"step": 28868, "train_loss": 3.1453537940979004, "lr": 4.276518404414198e-05, "tps": 124981, "wall": 15138.0} {"step": 28869, "train_loss": 3.1139328479766846, "lr": 4.276183989053215e-05, "tps": 124948, "wall": 15142.4} {"step": 28870, "train_loss": 3.2341713905334473, "lr": 4.275849774468578e-05, "tps": 124915, "wall": 15146.9} {"step": 28871, "train_loss": 3.1773641109466553, "lr": 4.27551576066407e-05, "tps": 124883, "wall": 15151.4} {"step": 28872, "train_loss": 3.145739793777466, "lr": 4.2751819476434814e-05, "tps": 124850, "wall": 15155.9} {"step": 28873, "train_loss": 3.1766586303710938, "lr": 4.27484833541059e-05, "tps": 124817, "wall": 15160.4} {"step": 28874, "train_loss": 3.1924638748168945, "lr": 4.274514923969174e-05, "tps": 124785, "wall": 15164.9} {"step": 28875, "train_loss": 3.161708116531372, "lr": 4.2741817133230156e-05, "tps": 124752, "wall": 15169.4} {"step": 28876, "train_loss": 3.1290836334228516, "lr": 4.273848703475882e-05, "tps": 124719, "wall": 15173.9} {"step": 28877, "train_loss": 3.186628818511963, "lr": 4.27351589443155e-05, "tps": 124687, "wall": 15178.3} {"step": 28878, "train_loss": 3.2002573013305664, "lr": 4.2731832861937905e-05, "tps": 124654, "wall": 15182.9} {"step": 28879, "train_loss": 3.059110641479492, "lr": 4.272850878766369e-05, "tps": 124622, "wall": 15187.4} {"step": 28880, "train_loss": 3.0815653800964355, "lr": 4.272518672153053e-05, "tps": 124589, "wall": 15191.9} {"step": 28881, "train_loss": 3.081298351287842, "lr": 4.272186666357603e-05, "tps": 124556, "wall": 15196.3} {"step": 28882, "train_loss": 3.1884188652038574, "lr": 4.27185486138378e-05, "tps": 124524, "wall": 15200.8} {"step": 28883, "train_loss": 3.186553955078125, "lr": 4.271523257235346e-05, "tps": 124492, "wall": 15205.3} {"step": 28884, "train_loss": 3.241074800491333, "lr": 4.271191853916057e-05, "tps": 124459, "wall": 15209.8} {"step": 28885, "train_loss": 3.1399192810058594, "lr": 4.270860651429662e-05, "tps": 124427, "wall": 15214.3} {"step": 28886, "train_loss": 3.1058754920959473, "lr": 4.270529649779921e-05, "tps": 124395, "wall": 15218.8} {"step": 28887, "train_loss": 3.088559150695801, "lr": 4.270198848970578e-05, "tps": 124362, "wall": 15223.2} {"step": 28888, "train_loss": 3.2642619609832764, "lr": 4.26986824900538e-05, "tps": 124330, "wall": 15227.7} {"step": 28889, "train_loss": 3.068688154220581, "lr": 4.2695378498880753e-05, "tps": 124298, "wall": 15232.2} {"step": 28890, "train_loss": 3.267526149749756, "lr": 4.269207651622403e-05, "tps": 124265, "wall": 15236.7} {"step": 28891, "train_loss": 3.194756031036377, "lr": 4.2688776542121074e-05, "tps": 124232, "wall": 15241.3} {"step": 28892, "train_loss": 3.1571707725524902, "lr": 4.268547857660925e-05, "tps": 124200, "wall": 15245.8} {"step": 28893, "train_loss": 3.209298849105835, "lr": 4.268218261972589e-05, "tps": 124168, "wall": 15250.2} {"step": 28894, "train_loss": 3.064361095428467, "lr": 4.2678888671508404e-05, "tps": 124136, "wall": 15254.7} {"step": 28895, "train_loss": 3.1347360610961914, "lr": 4.267559673199404e-05, "tps": 124103, "wall": 15259.3} {"step": 28896, "train_loss": 3.174022912979126, "lr": 4.267230680122009e-05, "tps": 124071, "wall": 15263.7} {"step": 28897, "train_loss": 3.1845767498016357, "lr": 4.266901887922387e-05, "tps": 124039, "wall": 15268.2} {"step": 28898, "train_loss": 3.146101236343384, "lr": 4.2665732966042575e-05, "tps": 124007, "wall": 15272.7} {"step": 28899, "train_loss": 3.132396697998047, "lr": 4.266244906171345e-05, "tps": 123974, "wall": 15277.2} {"step": 28900, "train_loss": 3.1911392211914062, "lr": 4.265916716627372e-05, "tps": 123942, "wall": 15281.7} {"step": 28901, "train_loss": 3.1965603828430176, "lr": 4.265588727976054e-05, "tps": 123910, "wall": 15286.2} {"step": 28902, "train_loss": 3.213775157928467, "lr": 4.2652609402211024e-05, "tps": 123878, "wall": 15290.7} {"step": 28903, "train_loss": 3.1770434379577637, "lr": 4.2649333533662384e-05, "tps": 123846, "wall": 15295.2} {"step": 28904, "train_loss": 3.132272720336914, "lr": 4.264605967415167e-05, "tps": 123813, "wall": 15299.7} {"step": 28905, "train_loss": 3.1686689853668213, "lr": 4.264278782371597e-05, "tps": 123781, "wall": 15304.2} {"step": 28906, "train_loss": 3.2219767570495605, "lr": 4.263951798239239e-05, "tps": 123749, "wall": 15308.7} {"step": 28907, "train_loss": 3.220271587371826, "lr": 4.2636250150217946e-05, "tps": 123717, "wall": 15313.2} {"step": 28908, "train_loss": 3.0767078399658203, "lr": 4.263298432722962e-05, "tps": 123685, "wall": 15317.7} {"step": 28909, "train_loss": 3.1544671058654785, "lr": 4.262972051346449e-05, "tps": 123653, "wall": 15322.2} {"step": 28910, "train_loss": 3.151761054992676, "lr": 4.262645870895946e-05, "tps": 123621, "wall": 15326.7} {"step": 28911, "train_loss": 3.1334304809570312, "lr": 4.262319891375149e-05, "tps": 123589, "wall": 15331.2} {"step": 28912, "train_loss": 3.214667320251465, "lr": 4.261994112787755e-05, "tps": 123557, "wall": 15335.7} {"step": 28913, "train_loss": 3.216827869415283, "lr": 4.261668535137449e-05, "tps": 123526, "wall": 15340.1} {"step": 28914, "train_loss": 3.2445385456085205, "lr": 4.261343158427921e-05, "tps": 123494, "wall": 15344.6} {"step": 28915, "train_loss": 3.0831170082092285, "lr": 4.2610179826628605e-05, "tps": 123462, "wall": 15349.1} {"step": 28916, "train_loss": 3.1016788482666016, "lr": 4.260693007845944e-05, "tps": 123430, "wall": 15353.6} {"step": 28917, "train_loss": 3.1524832248687744, "lr": 4.26036823398086e-05, "tps": 123398, "wall": 15358.1} {"step": 28918, "train_loss": 3.280423641204834, "lr": 4.260043661071281e-05, "tps": 123366, "wall": 15362.6} {"step": 28919, "train_loss": 3.0848183631896973, "lr": 4.25971928912089e-05, "tps": 123334, "wall": 15367.1} {"step": 28920, "train_loss": 3.1560137271881104, "lr": 4.259395118133358e-05, "tps": 123302, "wall": 15371.6} {"step": 28921, "train_loss": 3.1973330974578857, "lr": 4.2590711481123566e-05, "tps": 123271, "wall": 15376.1} {"step": 28922, "train_loss": 3.0897905826568604, "lr": 4.2587473790615584e-05, "tps": 123239, "wall": 15380.6} {"step": 28923, "train_loss": 3.182896852493286, "lr": 4.258423810984631e-05, "tps": 123207, "wall": 15385.1} {"step": 28924, "train_loss": 3.31363582611084, "lr": 4.258100443885235e-05, "tps": 123176, "wall": 15389.6} {"step": 28925, "train_loss": 3.0522139072418213, "lr": 4.2577772777670376e-05, "tps": 123144, "wall": 15394.1} {"step": 28926, "train_loss": 3.08603572845459, "lr": 4.2574543126337005e-05, "tps": 123112, "wall": 15398.6} {"step": 28927, "train_loss": 3.2051260471343994, "lr": 4.25713154848888e-05, "tps": 123081, "wall": 15403.0} {"step": 28928, "train_loss": 3.1226611137390137, "lr": 4.256808985336233e-05, "tps": 123049, "wall": 15407.5} {"step": 28929, "train_loss": 3.1408934593200684, "lr": 4.256486623179415e-05, "tps": 123017, "wall": 15412.0} {"step": 28930, "train_loss": 3.1763367652893066, "lr": 4.2561644620220756e-05, "tps": 122986, "wall": 15416.5} {"step": 28931, "train_loss": 3.09390926361084, "lr": 4.2558425018678646e-05, "tps": 122954, "wall": 15421.1} {"step": 28932, "train_loss": 3.1442060470581055, "lr": 4.255520742720431e-05, "tps": 122922, "wall": 15425.6} {"step": 28933, "train_loss": 3.209381103515625, "lr": 4.255199184583417e-05, "tps": 122891, "wall": 15430.0} {"step": 28934, "train_loss": 3.136199712753296, "lr": 4.2548778274604674e-05, "tps": 122859, "wall": 15434.5} {"step": 28935, "train_loss": 3.12150239944458, "lr": 4.254556671355222e-05, "tps": 122828, "wall": 15439.0} {"step": 28936, "train_loss": 3.290841817855835, "lr": 4.2542357162713176e-05, "tps": 122796, "wall": 15443.5} {"step": 28937, "train_loss": 3.169292449951172, "lr": 4.253914962212392e-05, "tps": 122765, "wall": 15448.0} {"step": 28938, "train_loss": 3.14959979057312, "lr": 4.2535944091820764e-05, "tps": 122734, "wall": 15452.5} {"step": 28939, "train_loss": 3.2013144493103027, "lr": 4.253274057184006e-05, "tps": 122702, "wall": 15457.0} {"step": 28940, "train_loss": 3.0162036418914795, "lr": 4.2529539062218046e-05, "tps": 122671, "wall": 15461.5} {"step": 28941, "train_loss": 3.1847147941589355, "lr": 4.252633956299103e-05, "tps": 122639, "wall": 15466.0} {"step": 28942, "train_loss": 3.17547869682312, "lr": 4.2523142074195235e-05, "tps": 122608, "wall": 15470.4} {"step": 28943, "train_loss": 3.139829397201538, "lr": 4.251994659586689e-05, "tps": 122577, "wall": 15474.9} {"step": 28944, "train_loss": 3.1123011112213135, "lr": 4.2516753128042194e-05, "tps": 122545, "wall": 15479.5} {"step": 28945, "train_loss": 3.1552252769470215, "lr": 4.2513561670757306e-05, "tps": 122514, "wall": 15484.0} {"step": 28946, "train_loss": 3.155409336090088, "lr": 4.251037222404841e-05, "tps": 122482, "wall": 15488.4} {"step": 28947, "train_loss": 3.2021896839141846, "lr": 4.25071847879516e-05, "tps": 122451, "wall": 15493.0} {"step": 28948, "train_loss": 3.187352180480957, "lr": 4.2503999362503026e-05, "tps": 122420, "wall": 15497.4} {"step": 28949, "train_loss": 3.152606964111328, "lr": 4.250081594773875e-05, "tps": 122389, "wall": 15501.9} {"step": 28950, "train_loss": 3.142026901245117, "lr": 4.24976345436948e-05, "tps": 122357, "wall": 15506.4} {"step": 28951, "train_loss": 3.1627798080444336, "lr": 4.249445515040728e-05, "tps": 122326, "wall": 15510.9} {"step": 28952, "train_loss": 3.126864194869995, "lr": 4.249127776791217e-05, "tps": 122295, "wall": 15515.4} {"step": 28953, "train_loss": 3.092322826385498, "lr": 4.248810239624546e-05, "tps": 122264, "wall": 15519.9} {"step": 28954, "train_loss": 3.195427417755127, "lr": 4.248492903544313e-05, "tps": 122233, "wall": 15524.4} {"step": 28955, "train_loss": 3.1468091011047363, "lr": 4.248175768554112e-05, "tps": 122202, "wall": 15528.9} {"step": 28956, "train_loss": 3.270158290863037, "lr": 4.2478588346575386e-05, "tps": 122171, "wall": 15533.3} {"step": 28957, "train_loss": 3.169316053390503, "lr": 4.247542101858179e-05, "tps": 122140, "wall": 15537.8} {"step": 28958, "train_loss": 3.071908473968506, "lr": 4.247225570159623e-05, "tps": 122108, "wall": 15542.4} {"step": 28959, "train_loss": 3.208761692047119, "lr": 4.246909239565458e-05, "tps": 122077, "wall": 15546.8} {"step": 28960, "train_loss": 3.078444480895996, "lr": 4.246593110079263e-05, "tps": 122046, "wall": 15551.3} {"step": 28961, "train_loss": 3.19685697555542, "lr": 4.246277181704622e-05, "tps": 122015, "wall": 15555.8} {"step": 28962, "train_loss": 3.1667299270629883, "lr": 4.2459614544451156e-05, "tps": 121984, "wall": 15560.3} {"step": 28963, "train_loss": 3.1413278579711914, "lr": 4.2456459283043165e-05, "tps": 121953, "wall": 15564.8} {"step": 28964, "train_loss": 3.1681132316589355, "lr": 4.2453306032858006e-05, "tps": 121922, "wall": 15569.3} {"step": 28965, "train_loss": 3.137901782989502, "lr": 4.245015479393142e-05, "tps": 121891, "wall": 15573.8} {"step": 28966, "train_loss": 3.1448144912719727, "lr": 4.244700556629907e-05, "tps": 121860, "wall": 15578.3} {"step": 28967, "train_loss": 3.2367734909057617, "lr": 4.2443858349996643e-05, "tps": 121829, "wall": 15582.8} {"step": 28968, "train_loss": 3.205817699432373, "lr": 4.244071314505981e-05, "tps": 121799, "wall": 15587.2} {"step": 28969, "train_loss": 3.1852974891662598, "lr": 4.243756995152418e-05, "tps": 121768, "wall": 15591.7} {"step": 28970, "train_loss": 3.2901809215545654, "lr": 4.243442876942535e-05, "tps": 121737, "wall": 15596.2} {"step": 28971, "train_loss": 3.1477789878845215, "lr": 4.243128959879892e-05, "tps": 121706, "wall": 15600.7} {"step": 28972, "train_loss": 3.245236873626709, "lr": 4.242815243968046e-05, "tps": 121675, "wall": 15605.2} {"step": 28973, "train_loss": 3.194143772125244, "lr": 4.242501729210549e-05, "tps": 121644, "wall": 15609.7} {"step": 28974, "train_loss": 3.2270913124084473, "lr": 4.2421884156109545e-05, "tps": 121614, "wall": 15614.2} {"step": 28975, "train_loss": 3.119361400604248, "lr": 4.241875303172807e-05, "tps": 121583, "wall": 15618.7} {"step": 28976, "train_loss": 3.2274329662323, "lr": 4.2415623918996586e-05, "tps": 121552, "wall": 15623.1} {"step": 28977, "train_loss": 3.108816146850586, "lr": 4.2412496817950535e-05, "tps": 121522, "wall": 15627.6} {"step": 28978, "train_loss": 3.234422206878662, "lr": 4.2409371728625305e-05, "tps": 121491, "wall": 15632.1} {"step": 28979, "train_loss": 3.185861349105835, "lr": 4.240624865105632e-05, "tps": 121460, "wall": 15636.6} {"step": 28980, "train_loss": 3.258627414703369, "lr": 4.240312758527898e-05, "tps": 121430, "wall": 15641.1} {"step": 28981, "train_loss": 3.1884915828704834, "lr": 4.2400008531328605e-05, "tps": 121399, "wall": 15645.5} {"step": 28982, "train_loss": 3.2483575344085693, "lr": 4.239689148924054e-05, "tps": 121369, "wall": 15650.0} {"step": 28983, "train_loss": 3.188147783279419, "lr": 4.239377645905009e-05, "tps": 121338, "wall": 15654.5} {"step": 28984, "train_loss": 3.122709035873413, "lr": 4.239066344079256e-05, "tps": 121308, "wall": 15659.0} {"step": 28985, "train_loss": 3.1401748657226562, "lr": 4.23875524345032e-05, "tps": 121277, "wall": 15663.5} {"step": 28986, "train_loss": 3.1661839485168457, "lr": 4.238444344021726e-05, "tps": 121246, "wall": 15668.0} {"step": 28987, "train_loss": 3.181838035583496, "lr": 4.238133645796994e-05, "tps": 121216, "wall": 15672.4} {"step": 28988, "train_loss": 3.150038242340088, "lr": 4.237823148779647e-05, "tps": 121185, "wall": 15676.9} {"step": 28989, "train_loss": 3.174100875854492, "lr": 4.237512852973197e-05, "tps": 121155, "wall": 15681.4} {"step": 28990, "train_loss": 3.0772407054901123, "lr": 4.237202758381165e-05, "tps": 121125, "wall": 15685.8} {"step": 28991, "train_loss": 3.1821300983428955, "lr": 4.236892865007061e-05, "tps": 121094, "wall": 15690.4} {"step": 28992, "train_loss": 3.22369384765625, "lr": 4.2365831728543946e-05, "tps": 121064, "wall": 15694.8} {"step": 28993, "train_loss": 3.32089900970459, "lr": 4.236273681926675e-05, "tps": 121034, "wall": 15699.3} {"step": 28994, "train_loss": 3.216686248779297, "lr": 4.2359643922274096e-05, "tps": 121004, "wall": 15703.7} {"step": 28995, "train_loss": 3.1506142616271973, "lr": 4.235655303760099e-05, "tps": 120973, "wall": 15708.2} {"step": 28996, "train_loss": 3.1955349445343018, "lr": 4.235346416528246e-05, "tps": 120943, "wall": 15712.7} {"step": 28997, "train_loss": 3.053593873977661, "lr": 4.235037730535351e-05, "tps": 120913, "wall": 15717.1} {"step": 28998, "train_loss": 3.2389538288116455, "lr": 4.234729245784909e-05, "tps": 120882, "wall": 15721.6} {"step": 28999, "train_loss": 3.055730104446411, "lr": 4.234420962280415e-05, "tps": 120852, "wall": 15726.1} {"step": 29000, "train_loss": 3.207110643386841, "lr": 4.234112880025364e-05, "tps": 120822, "wall": 15730.6, "val_loss_monitor": 3.3105007599173697} {"step": 29001, "train_loss": 3.2257978916168213, "lr": 4.2338049990232386e-05, "tps": 120560, "wall": 15765.4} {"step": 29002, "train_loss": 3.1736197471618652, "lr": 4.2334973192775354e-05, "tps": 120529, "wall": 15769.9} {"step": 29003, "train_loss": 3.186703681945801, "lr": 4.233189840791735e-05, "tps": 120499, "wall": 15774.4} {"step": 29004, "train_loss": 3.1374504566192627, "lr": 4.232882563569318e-05, "tps": 120469, "wall": 15778.9} {"step": 29005, "train_loss": 3.0878093242645264, "lr": 4.2325754876137726e-05, "tps": 120439, "wall": 15783.4} {"step": 29006, "train_loss": 3.1486892700195312, "lr": 4.232268612928572e-05, "tps": 120409, "wall": 15787.8} {"step": 29007, "train_loss": 3.282064914703369, "lr": 4.2319619395171925e-05, "tps": 120379, "wall": 15792.3} {"step": 29008, "train_loss": 3.0924763679504395, "lr": 4.2316554673831116e-05, "tps": 120349, "wall": 15796.8} {"step": 29009, "train_loss": 3.1184051036834717, "lr": 4.231349196529797e-05, "tps": 120319, "wall": 15801.2} {"step": 29010, "train_loss": 3.0960533618927, "lr": 4.23104312696072e-05, "tps": 120290, "wall": 15805.7} {"step": 29011, "train_loss": 3.0789272785186768, "lr": 4.230737258679349e-05, "tps": 120260, "wall": 15810.1} {"step": 29012, "train_loss": 3.090837001800537, "lr": 4.2304315916891456e-05, "tps": 120230, "wall": 15814.6} {"step": 29013, "train_loss": 3.1860737800598145, "lr": 4.230126125993575e-05, "tps": 120200, "wall": 15819.0} {"step": 29014, "train_loss": 3.2022087574005127, "lr": 4.2298208615961e-05, "tps": 120170, "wall": 15823.5} {"step": 29015, "train_loss": 3.129634141921997, "lr": 4.229515798500173e-05, "tps": 120141, "wall": 15828.0} {"step": 29016, "train_loss": 3.185368061065674, "lr": 4.229210936709254e-05, "tps": 120111, "wall": 15832.4} {"step": 29017, "train_loss": 3.0842058658599854, "lr": 4.228906276226793e-05, "tps": 120081, "wall": 15836.9} {"step": 29018, "train_loss": 3.2019271850585938, "lr": 4.228601817056243e-05, "tps": 120051, "wall": 15841.4} {"step": 29019, "train_loss": 3.1977734565734863, "lr": 4.2282975592010544e-05, "tps": 120022, "wall": 15845.9} {"step": 29020, "train_loss": 3.1229121685028076, "lr": 4.227993502664672e-05, "tps": 119992, "wall": 15850.4} {"step": 29021, "train_loss": 3.169936180114746, "lr": 4.2276896474505395e-05, "tps": 119962, "wall": 15854.8} {"step": 29022, "train_loss": 3.163374423980713, "lr": 4.2273859935621016e-05, "tps": 119933, "wall": 15859.3} {"step": 29023, "train_loss": 3.1920955181121826, "lr": 4.227082541002797e-05, "tps": 119903, "wall": 15863.7} {"step": 29024, "train_loss": 3.2386844158172607, "lr": 4.226779289776062e-05, "tps": 119873, "wall": 15868.2} {"step": 29025, "train_loss": 3.170313835144043, "lr": 4.226476239885332e-05, "tps": 119844, "wall": 15872.6} {"step": 29026, "train_loss": 3.156802177429199, "lr": 4.226173391334041e-05, "tps": 119814, "wall": 15877.1} {"step": 29027, "train_loss": 3.14819073677063, "lr": 4.2258707441256205e-05, "tps": 119785, "wall": 15881.6} {"step": 29028, "train_loss": 3.290609121322632, "lr": 4.2255682982634974e-05, "tps": 119756, "wall": 15886.0} {"step": 29029, "train_loss": 3.217942237854004, "lr": 4.225266053751098e-05, "tps": 119726, "wall": 15890.5} {"step": 29030, "train_loss": 3.1595888137817383, "lr": 4.224964010591846e-05, "tps": 119697, "wall": 15894.9} {"step": 29031, "train_loss": 3.068276882171631, "lr": 4.224662168789164e-05, "tps": 119666, "wall": 15899.5} {"step": 29032, "train_loss": 3.227754831314087, "lr": 4.224360528346468e-05, "tps": 119637, "wall": 15903.9} {"step": 29033, "train_loss": 3.0935466289520264, "lr": 4.2240590892671804e-05, "tps": 119608, "wall": 15908.4} {"step": 29034, "train_loss": 3.12363338470459, "lr": 4.2237578515547135e-05, "tps": 119578, "wall": 15912.9} {"step": 29035, "train_loss": 3.058939218521118, "lr": 4.2234568152124776e-05, "tps": 119549, "wall": 15917.3} {"step": 29036, "train_loss": 3.1388587951660156, "lr": 4.2231559802438857e-05, "tps": 119519, "wall": 15921.8} {"step": 29037, "train_loss": 3.2179579734802246, "lr": 4.222855346652345e-05, "tps": 119490, "wall": 15926.2} {"step": 29038, "train_loss": 3.2317051887512207, "lr": 4.2225549144412577e-05, "tps": 119461, "wall": 15930.7} {"step": 29039, "train_loss": 3.191103458404541, "lr": 4.2222546836140344e-05, "tps": 119431, "wall": 15935.2} {"step": 29040, "train_loss": 3.3053336143493652, "lr": 4.2219546541740694e-05, "tps": 119402, "wall": 15939.6} {"step": 29041, "train_loss": 3.2551493644714355, "lr": 4.221654826124764e-05, "tps": 119373, "wall": 15944.1} {"step": 29042, "train_loss": 3.1800386905670166, "lr": 4.221355199469513e-05, "tps": 119343, "wall": 15948.5} {"step": 29043, "train_loss": 3.1709320545196533, "lr": 4.2210557742117144e-05, "tps": 119314, "wall": 15953.0} {"step": 29044, "train_loss": 3.145747661590576, "lr": 4.2207565503547565e-05, "tps": 119285, "wall": 15957.5} {"step": 29045, "train_loss": 3.115147590637207, "lr": 4.2204575279020314e-05, "tps": 119255, "wall": 15962.0} {"step": 29046, "train_loss": 3.1293282508850098, "lr": 4.220158706856923e-05, "tps": 119226, "wall": 15966.4} {"step": 29047, "train_loss": 3.1674370765686035, "lr": 4.219860087222821e-05, "tps": 119197, "wall": 15970.9} {"step": 29048, "train_loss": 3.0069046020507812, "lr": 4.219561669003106e-05, "tps": 119168, "wall": 15975.4} {"step": 29049, "train_loss": 3.16180419921875, "lr": 4.219263452201157e-05, "tps": 119138, "wall": 15979.9} {"step": 29050, "train_loss": 3.0255589485168457, "lr": 4.218965436820354e-05, "tps": 119109, "wall": 15984.3} {"step": 29051, "train_loss": 3.2629120349884033, "lr": 4.218667622864072e-05, "tps": 119080, "wall": 15988.8} {"step": 29052, "train_loss": 3.1770851612091064, "lr": 4.2183700103356865e-05, "tps": 119051, "wall": 15993.2} {"step": 29053, "train_loss": 3.1642990112304688, "lr": 4.218072599238567e-05, "tps": 119022, "wall": 15997.7} {"step": 29054, "train_loss": 3.1628801822662354, "lr": 4.217775389576082e-05, "tps": 118993, "wall": 16002.2} {"step": 29055, "train_loss": 3.2041404247283936, "lr": 4.217478381351599e-05, "tps": 118964, "wall": 16006.6} {"step": 29056, "train_loss": 3.138615131378174, "lr": 4.217181574568486e-05, "tps": 118935, "wall": 16011.1} {"step": 29057, "train_loss": 3.1449992656707764, "lr": 4.2168849692300996e-05, "tps": 118906, "wall": 16015.5} {"step": 29058, "train_loss": 3.1354215145111084, "lr": 4.216588565339802e-05, "tps": 118876, "wall": 16020.1} {"step": 29059, "train_loss": 3.168879508972168, "lr": 4.216292362900953e-05, "tps": 118847, "wall": 16024.5} {"step": 29060, "train_loss": 3.162808895111084, "lr": 4.215996361916906e-05, "tps": 118818, "wall": 16029.0} {"step": 29061, "train_loss": 3.2287192344665527, "lr": 4.215700562391012e-05, "tps": 118789, "wall": 16033.4} {"step": 29062, "train_loss": 3.1746506690979004, "lr": 4.215404964326626e-05, "tps": 118760, "wall": 16037.9} {"step": 29063, "train_loss": 3.184891700744629, "lr": 4.215109567727093e-05, "tps": 118731, "wall": 16042.3} {"step": 29064, "train_loss": 3.1925113201141357, "lr": 4.2148143725957626e-05, "tps": 118703, "wall": 16046.8} {"step": 29065, "train_loss": 3.108961343765259, "lr": 4.214519378935979e-05, "tps": 118674, "wall": 16051.2} {"step": 29066, "train_loss": 3.207373857498169, "lr": 4.2142245867510776e-05, "tps": 118645, "wall": 16055.7} {"step": 29067, "train_loss": 3.1316843032836914, "lr": 4.213929996044405e-05, "tps": 118616, "wall": 16060.1} {"step": 29068, "train_loss": 3.105125904083252, "lr": 4.213635606819296e-05, "tps": 118587, "wall": 16064.6} {"step": 29069, "train_loss": 3.2577054500579834, "lr": 4.2133414190790835e-05, "tps": 118559, "wall": 16069.0} {"step": 29070, "train_loss": 3.111773729324341, "lr": 4.213047432827103e-05, "tps": 118530, "wall": 16073.5} {"step": 29071, "train_loss": 3.1160101890563965, "lr": 4.212753648066684e-05, "tps": 118501, "wall": 16078.0} {"step": 29072, "train_loss": 3.150101661682129, "lr": 4.212460064801152e-05, "tps": 118472, "wall": 16082.5} {"step": 29073, "train_loss": 3.1307625770568848, "lr": 4.2121666830338355e-05, "tps": 118443, "wall": 16086.9} {"step": 29074, "train_loss": 3.07660174369812, "lr": 4.211873502768057e-05, "tps": 118414, "wall": 16091.4} {"step": 29075, "train_loss": 3.253452777862549, "lr": 4.211580524007137e-05, "tps": 118386, "wall": 16095.8} {"step": 29076, "train_loss": 3.134287118911743, "lr": 4.211287746754398e-05, "tps": 118357, "wall": 16100.3} {"step": 29077, "train_loss": 3.080244541168213, "lr": 4.210995171013151e-05, "tps": 118328, "wall": 16104.8} {"step": 29078, "train_loss": 3.1124532222747803, "lr": 4.210702796786714e-05, "tps": 118299, "wall": 16109.2} {"step": 29079, "train_loss": 3.238473892211914, "lr": 4.210410624078397e-05, "tps": 118271, "wall": 16113.7} {"step": 29080, "train_loss": 3.0396220684051514, "lr": 4.210118652891511e-05, "tps": 118242, "wall": 16118.2} {"step": 29081, "train_loss": 3.1320242881774902, "lr": 4.209826883229365e-05, "tps": 118213, "wall": 16122.6} {"step": 29082, "train_loss": 3.1481924057006836, "lr": 4.209535315095262e-05, "tps": 118185, "wall": 16127.1} {"step": 29083, "train_loss": 3.069094181060791, "lr": 4.209243948492505e-05, "tps": 118156, "wall": 16131.6} {"step": 29084, "train_loss": 3.1665725708007812, "lr": 4.2089527834243974e-05, "tps": 118127, "wall": 16136.0} {"step": 29085, "train_loss": 3.123875141143799, "lr": 4.208661819894232e-05, "tps": 118098, "wall": 16140.5} {"step": 29086, "train_loss": 3.112694263458252, "lr": 4.208371057905308e-05, "tps": 118070, "wall": 16145.0} {"step": 29087, "train_loss": 3.1707568168640137, "lr": 4.208080497460921e-05, "tps": 118041, "wall": 16149.5} {"step": 29088, "train_loss": 3.1279408931732178, "lr": 4.2077901385643586e-05, "tps": 118013, "wall": 16153.9} {"step": 29089, "train_loss": 3.219372272491455, "lr": 4.207499981218914e-05, "tps": 117984, "wall": 16158.4} {"step": 29090, "train_loss": 3.0842678546905518, "lr": 4.207210025427871e-05, "tps": 117956, "wall": 16162.9} {"step": 29091, "train_loss": 3.1541624069213867, "lr": 4.206920271194516e-05, "tps": 117927, "wall": 16167.3} {"step": 29092, "train_loss": 3.2180657386779785, "lr": 4.206630718522129e-05, "tps": 117899, "wall": 16171.8} {"step": 29093, "train_loss": 3.1473946571350098, "lr": 4.206341367413995e-05, "tps": 117870, "wall": 16176.3} {"step": 29094, "train_loss": 3.2036478519439697, "lr": 4.206052217873386e-05, "tps": 117842, "wall": 16180.7} {"step": 29095, "train_loss": 3.1772170066833496, "lr": 4.2057632699035816e-05, "tps": 117813, "wall": 16185.2} {"step": 29096, "train_loss": 3.13704252243042, "lr": 4.2054745235078516e-05, "tps": 117785, "wall": 16189.6} {"step": 29097, "train_loss": 3.1733365058898926, "lr": 4.205185978689471e-05, "tps": 117756, "wall": 16194.1} {"step": 29098, "train_loss": 3.167849063873291, "lr": 4.2048976354517046e-05, "tps": 117728, "wall": 16198.6} {"step": 29099, "train_loss": 3.167120933532715, "lr": 4.204609493797822e-05, "tps": 117699, "wall": 16203.0} {"step": 29100, "train_loss": 3.070796489715576, "lr": 4.2043215537310856e-05, "tps": 117671, "wall": 16207.5} {"step": 29101, "train_loss": 3.233346939086914, "lr": 4.2040338152547566e-05, "tps": 117643, "wall": 16212.0} {"step": 29102, "train_loss": 3.175565242767334, "lr": 4.203746278372096e-05, "tps": 117614, "wall": 16216.4} {"step": 29103, "train_loss": 3.109569549560547, "lr": 4.20345894308636e-05, "tps": 117586, "wall": 16220.9} {"step": 29104, "train_loss": 3.1881725788116455, "lr": 4.2031718094008035e-05, "tps": 117558, "wall": 16225.4} {"step": 29105, "train_loss": 3.095036268234253, "lr": 4.20288487731868e-05, "tps": 117530, "wall": 16229.8} {"step": 29106, "train_loss": 3.1502628326416016, "lr": 4.202598146843238e-05, "tps": 117501, "wall": 16234.3} {"step": 29107, "train_loss": 3.057432174682617, "lr": 4.2023116179777286e-05, "tps": 117473, "wall": 16238.7} {"step": 29108, "train_loss": 3.2322239875793457, "lr": 4.202025290725395e-05, "tps": 117445, "wall": 16243.2} {"step": 29109, "train_loss": 3.1365082263946533, "lr": 4.201739165089482e-05, "tps": 117417, "wall": 16247.7} {"step": 29110, "train_loss": 3.2374768257141113, "lr": 4.201453241073233e-05, "tps": 117388, "wall": 16252.1} {"step": 29111, "train_loss": 3.1464223861694336, "lr": 4.201167518679882e-05, "tps": 117360, "wall": 16256.6} {"step": 29112, "train_loss": 3.1867589950561523, "lr": 4.200881997912669e-05, "tps": 117332, "wall": 16261.1} {"step": 29113, "train_loss": 3.1375741958618164, "lr": 4.200596678774827e-05, "tps": 117304, "wall": 16265.5} {"step": 29114, "train_loss": 3.1435766220092773, "lr": 4.2003115612695894e-05, "tps": 117275, "wall": 16270.0} {"step": 29115, "train_loss": 3.131208658218384, "lr": 4.200026645400186e-05, "tps": 117247, "wall": 16274.5} {"step": 29116, "train_loss": 3.1942880153656006, "lr": 4.199741931169842e-05, "tps": 117219, "wall": 16278.9} {"step": 29117, "train_loss": 3.1737122535705566, "lr": 4.199457418581785e-05, "tps": 117191, "wall": 16283.4} {"step": 29118, "train_loss": 3.135343313217163, "lr": 4.199173107639238e-05, "tps": 117163, "wall": 16287.9} {"step": 29119, "train_loss": 3.2183032035827637, "lr": 4.198888998345421e-05, "tps": 117135, "wall": 16292.3} {"step": 29120, "train_loss": 3.2386388778686523, "lr": 4.198605090703551e-05, "tps": 117107, "wall": 16296.8} {"step": 29121, "train_loss": 3.000875473022461, "lr": 4.1983213847168476e-05, "tps": 117079, "wall": 16301.3} {"step": 29122, "train_loss": 3.134626865386963, "lr": 4.1980378803885226e-05, "tps": 117051, "wall": 16305.7} {"step": 29123, "train_loss": 3.076812744140625, "lr": 4.197754577721786e-05, "tps": 117023, "wall": 16310.2} {"step": 29124, "train_loss": 3.245236873626709, "lr": 4.1974714767198494e-05, "tps": 116995, "wall": 16314.7} {"step": 29125, "train_loss": 3.158463954925537, "lr": 4.197188577385919e-05, "tps": 116966, "wall": 16319.2} {"step": 29126, "train_loss": 3.157297134399414, "lr": 4.1969058797232e-05, "tps": 116939, "wall": 16323.6} {"step": 29127, "train_loss": 3.1877565383911133, "lr": 4.1966233837348937e-05, "tps": 116911, "wall": 16328.1} {"step": 29128, "train_loss": 3.195387363433838, "lr": 4.1963410894242e-05, "tps": 116883, "wall": 16332.5} {"step": 29129, "train_loss": 3.1546356678009033, "lr": 4.196058996794319e-05, "tps": 116855, "wall": 16337.0} {"step": 29130, "train_loss": 3.113067150115967, "lr": 4.1957771058484454e-05, "tps": 116827, "wall": 16341.5} {"step": 29131, "train_loss": 3.183971881866455, "lr": 4.1954954165897706e-05, "tps": 116799, "wall": 16345.9} {"step": 29132, "train_loss": 3.111335039138794, "lr": 4.195213929021487e-05, "tps": 116771, "wall": 16350.4} {"step": 29133, "train_loss": 3.06483793258667, "lr": 4.194932643146784e-05, "tps": 116743, "wall": 16354.8} {"step": 29134, "train_loss": 3.097368001937866, "lr": 4.1946515589688464e-05, "tps": 116715, "wall": 16359.3} {"step": 29135, "train_loss": 3.185764789581299, "lr": 4.19437067649086e-05, "tps": 116688, "wall": 16363.8} {"step": 29136, "train_loss": 3.0995254516601562, "lr": 4.194089995716006e-05, "tps": 116660, "wall": 16368.2} {"step": 29137, "train_loss": 3.115739583969116, "lr": 4.193809516647461e-05, "tps": 116632, "wall": 16372.7} {"step": 29138, "train_loss": 3.109395980834961, "lr": 4.193529239288407e-05, "tps": 116604, "wall": 16377.1} {"step": 29139, "train_loss": 3.1624083518981934, "lr": 4.1932491636420184e-05, "tps": 116576, "wall": 16381.6} {"step": 29140, "train_loss": 3.2253832817077637, "lr": 4.1929692897114655e-05, "tps": 116549, "wall": 16386.1} {"step": 29141, "train_loss": 3.179861068725586, "lr": 4.1926896174999205e-05, "tps": 116521, "wall": 16390.6} {"step": 29142, "train_loss": 3.18373703956604, "lr": 4.19241014701055e-05, "tps": 116493, "wall": 16395.0} {"step": 29143, "train_loss": 3.2298338413238525, "lr": 4.192130878246522e-05, "tps": 116465, "wall": 16399.5} {"step": 29144, "train_loss": 3.1484570503234863, "lr": 4.191851811210997e-05, "tps": 116438, "wall": 16403.9} {"step": 29145, "train_loss": 3.1844356060028076, "lr": 4.191572945907138e-05, "tps": 116410, "wall": 16408.4} {"step": 29146, "train_loss": 3.259279251098633, "lr": 4.191294282338107e-05, "tps": 116383, "wall": 16412.8} {"step": 29147, "train_loss": 3.1832168102264404, "lr": 4.191015820507055e-05, "tps": 116355, "wall": 16417.3} {"step": 29148, "train_loss": 3.209991931915283, "lr": 4.190737560417139e-05, "tps": 116327, "wall": 16421.8} {"step": 29149, "train_loss": 3.1786646842956543, "lr": 4.1904595020715124e-05, "tps": 116300, "wall": 16426.2} {"step": 29150, "train_loss": 3.278730869293213, "lr": 4.190181645473325e-05, "tps": 116272, "wall": 16430.7} {"step": 29151, "train_loss": 3.20751690864563, "lr": 4.189903990625721e-05, "tps": 116245, "wall": 16435.1} {"step": 29152, "train_loss": 3.2355637550354004, "lr": 4.1896265375318515e-05, "tps": 116216, "wall": 16439.7} {"step": 29153, "train_loss": 3.225116729736328, "lr": 4.1893492861948546e-05, "tps": 116189, "wall": 16444.1} {"step": 29154, "train_loss": 3.1175100803375244, "lr": 4.189072236617871e-05, "tps": 116162, "wall": 16448.6} {"step": 29155, "train_loss": 3.285243511199951, "lr": 4.188795388804041e-05, "tps": 116134, "wall": 16453.0} {"step": 29156, "train_loss": 3.1575927734375, "lr": 4.188518742756503e-05, "tps": 116107, "wall": 16457.5} {"step": 29157, "train_loss": 3.1201281547546387, "lr": 4.1882422984783867e-05, "tps": 116079, "wall": 16462.0} {"step": 29158, "train_loss": 3.100557327270508, "lr": 4.187966055972824e-05, "tps": 116052, "wall": 16466.4} {"step": 29159, "train_loss": 3.1860127449035645, "lr": 4.187690015242946e-05, "tps": 116024, "wall": 16470.9} {"step": 29160, "train_loss": 3.110048294067383, "lr": 4.187414176291879e-05, "tps": 115997, "wall": 16475.3} {"step": 29161, "train_loss": 3.1191341876983643, "lr": 4.18713853912275e-05, "tps": 115970, "wall": 16479.8} {"step": 29162, "train_loss": 3.1380648612976074, "lr": 4.186863103738676e-05, "tps": 115942, "wall": 16484.2} {"step": 29163, "train_loss": 3.062826633453369, "lr": 4.186587870142783e-05, "tps": 115915, "wall": 16488.7} {"step": 29164, "train_loss": 3.177835464477539, "lr": 4.186312838338187e-05, "tps": 115887, "wall": 16493.2} {"step": 29165, "train_loss": 3.1983065605163574, "lr": 4.186038008327999e-05, "tps": 115860, "wall": 16497.6} {"step": 29166, "train_loss": 3.292888641357422, "lr": 4.18576338011534e-05, "tps": 115832, "wall": 16502.1} {"step": 29167, "train_loss": 3.0615806579589844, "lr": 4.1854889537033154e-05, "tps": 115805, "wall": 16506.6} {"step": 29168, "train_loss": 3.109161138534546, "lr": 4.185214729095034e-05, "tps": 115778, "wall": 16511.0} {"step": 29169, "train_loss": 3.173602342605591, "lr": 4.1849407062936064e-05, "tps": 115750, "wall": 16515.5} {"step": 29170, "train_loss": 3.246337890625, "lr": 4.1846668853021354e-05, "tps": 115723, "wall": 16520.0} {"step": 29171, "train_loss": 3.1787309646606445, "lr": 4.184393266123719e-05, "tps": 115696, "wall": 16524.4} {"step": 29172, "train_loss": 3.119129180908203, "lr": 4.18411984876146e-05, "tps": 115669, "wall": 16528.9} {"step": 29173, "train_loss": 3.1473388671875, "lr": 4.183846633218456e-05, "tps": 115641, "wall": 16533.4} {"step": 29174, "train_loss": 3.1792430877685547, "lr": 4.1835736194978014e-05, "tps": 115614, "wall": 16537.8} {"step": 29175, "train_loss": 3.1318535804748535, "lr": 4.183300807602587e-05, "tps": 115587, "wall": 16542.3} {"step": 29176, "train_loss": 3.1656904220581055, "lr": 4.183028197535906e-05, "tps": 115560, "wall": 16546.7} {"step": 29177, "train_loss": 3.2963385581970215, "lr": 4.1827557893008454e-05, "tps": 115533, "wall": 16551.2} {"step": 29178, "train_loss": 3.180365562438965, "lr": 4.182483582900493e-05, "tps": 115505, "wall": 16555.7} {"step": 29179, "train_loss": 3.198103189468384, "lr": 4.182211578337927e-05, "tps": 115478, "wall": 16560.2} {"step": 29180, "train_loss": 3.140307903289795, "lr": 4.181939775616234e-05, "tps": 115451, "wall": 16564.6} {"step": 29181, "train_loss": 3.1073620319366455, "lr": 4.181668174738492e-05, "tps": 115423, "wall": 16569.1} {"step": 29182, "train_loss": 3.1806650161743164, "lr": 4.181396775707774e-05, "tps": 115396, "wall": 16573.6} {"step": 29183, "train_loss": 3.113360643386841, "lr": 4.18112557852716e-05, "tps": 115369, "wall": 16578.0} {"step": 29184, "train_loss": 3.1098668575286865, "lr": 4.18085458319972e-05, "tps": 115342, "wall": 16582.5} {"step": 29185, "train_loss": 3.085536479949951, "lr": 4.1805837897285216e-05, "tps": 115315, "wall": 16587.0} {"step": 29186, "train_loss": 3.1310548782348633, "lr": 4.1803131981166345e-05, "tps": 115288, "wall": 16591.5} {"step": 29187, "train_loss": 3.070992946624756, "lr": 4.180042808367124e-05, "tps": 115261, "wall": 16595.9} {"step": 29188, "train_loss": 3.077016830444336, "lr": 4.1797726204830496e-05, "tps": 115234, "wall": 16600.4} {"step": 29189, "train_loss": 3.1033830642700195, "lr": 4.179502634467479e-05, "tps": 115207, "wall": 16604.8} {"step": 29190, "train_loss": 3.265523672103882, "lr": 4.179232850323465e-05, "tps": 115180, "wall": 16609.3} {"step": 29191, "train_loss": 3.174952983856201, "lr": 4.178963268054065e-05, "tps": 115153, "wall": 16613.8} {"step": 29192, "train_loss": 3.2080559730529785, "lr": 4.178693887662334e-05, "tps": 115126, "wall": 16618.2} {"step": 29193, "train_loss": 3.148613691329956, "lr": 4.178424709151323e-05, "tps": 115098, "wall": 16622.7} {"step": 29194, "train_loss": 3.1740803718566895, "lr": 4.17815573252408e-05, "tps": 115072, "wall": 16627.2} {"step": 29195, "train_loss": 3.0812277793884277, "lr": 4.177886957783652e-05, "tps": 115045, "wall": 16631.6} {"step": 29196, "train_loss": 3.0912327766418457, "lr": 4.177618384933087e-05, "tps": 115018, "wall": 16636.1} {"step": 29197, "train_loss": 3.118966579437256, "lr": 4.177350013975424e-05, "tps": 114991, "wall": 16640.6} {"step": 29198, "train_loss": 3.145798921585083, "lr": 4.177081844913705e-05, "tps": 114964, "wall": 16645.0} {"step": 29199, "train_loss": 3.227027416229248, "lr": 4.176813877750966e-05, "tps": 114937, "wall": 16649.5} {"step": 29200, "train_loss": 3.1702115535736084, "lr": 4.176546112490244e-05, "tps": 114910, "wall": 16653.9} {"step": 29201, "train_loss": 3.208434581756592, "lr": 4.1762785491345725e-05, "tps": 114883, "wall": 16658.4} {"step": 29202, "train_loss": 3.0843544006347656, "lr": 4.176011187686979e-05, "tps": 114856, "wall": 16662.9} {"step": 29203, "train_loss": 3.2639036178588867, "lr": 4.1757440281505e-05, "tps": 114829, "wall": 16667.4} {"step": 29204, "train_loss": 3.172231435775757, "lr": 4.1754770705281536e-05, "tps": 114803, "wall": 16671.8} {"step": 29205, "train_loss": 3.0237245559692383, "lr": 4.175210314822967e-05, "tps": 114776, "wall": 16676.3} {"step": 29206, "train_loss": 3.0989060401916504, "lr": 4.1749437610379645e-05, "tps": 114749, "wall": 16680.8} {"step": 29207, "train_loss": 3.131701707839966, "lr": 4.174677409176162e-05, "tps": 114722, "wall": 16685.3} {"step": 29208, "train_loss": 3.172778606414795, "lr": 4.1744112592405775e-05, "tps": 114695, "wall": 16689.8} {"step": 29209, "train_loss": 3.078557252883911, "lr": 4.174145311234226e-05, "tps": 114668, "wall": 16694.2} {"step": 29210, "train_loss": 3.2307605743408203, "lr": 4.1738795651601244e-05, "tps": 114642, "wall": 16698.7} {"step": 29211, "train_loss": 3.059715509414673, "lr": 4.173614021021275e-05, "tps": 114615, "wall": 16703.1} {"step": 29212, "train_loss": 3.0811002254486084, "lr": 4.1733486788206934e-05, "tps": 114588, "wall": 16707.6} {"step": 29213, "train_loss": 3.139483690261841, "lr": 4.173083538561381e-05, "tps": 114562, "wall": 16712.1} {"step": 29214, "train_loss": 3.098966121673584, "lr": 4.172818600246343e-05, "tps": 114535, "wall": 16716.5} {"step": 29215, "train_loss": 3.1496424674987793, "lr": 4.172553863878581e-05, "tps": 114508, "wall": 16721.0} {"step": 29216, "train_loss": 3.1301915645599365, "lr": 4.1722893294610914e-05, "tps": 114482, "wall": 16725.5} {"step": 29217, "train_loss": 3.2151308059692383, "lr": 4.172024996996874e-05, "tps": 114455, "wall": 16729.9} {"step": 29218, "train_loss": 3.2024385929107666, "lr": 4.171760866488923e-05, "tps": 114428, "wall": 16734.4} {"step": 29219, "train_loss": 3.1136202812194824, "lr": 4.171496937940229e-05, "tps": 114402, "wall": 16738.8} {"step": 29220, "train_loss": 3.161418914794922, "lr": 4.171233211353782e-05, "tps": 114375, "wall": 16743.4} {"step": 29221, "train_loss": 3.203575611114502, "lr": 4.1709696867325696e-05, "tps": 114348, "wall": 16747.8} {"step": 29222, "train_loss": 3.215790271759033, "lr": 4.170706364079575e-05, "tps": 114322, "wall": 16752.3} {"step": 29223, "train_loss": 3.2538394927978516, "lr": 4.170443243397787e-05, "tps": 114295, "wall": 16756.7} {"step": 29224, "train_loss": 3.2176432609558105, "lr": 4.1701803246901786e-05, "tps": 114269, "wall": 16761.2} {"step": 29225, "train_loss": 3.131330728530884, "lr": 4.169917607959735e-05, "tps": 114242, "wall": 16765.6} {"step": 29226, "train_loss": 3.210843324661255, "lr": 4.169655093209429e-05, "tps": 114216, "wall": 16770.1} {"step": 29227, "train_loss": 3.1387364864349365, "lr": 4.1693927804422336e-05, "tps": 114189, "wall": 16774.6} {"step": 29228, "train_loss": 3.1223907470703125, "lr": 4.169130669661122e-05, "tps": 114163, "wall": 16779.0} {"step": 29229, "train_loss": 3.321443796157837, "lr": 4.168868760869062e-05, "tps": 114136, "wall": 16783.5} {"step": 29230, "train_loss": 3.165811538696289, "lr": 4.1686070540690206e-05, "tps": 114110, "wall": 16787.9} {"step": 29231, "train_loss": 3.3013572692871094, "lr": 4.1683455492639666e-05, "tps": 114084, "wall": 16792.4} {"step": 29232, "train_loss": 3.2839102745056152, "lr": 4.1680842464568566e-05, "tps": 114057, "wall": 16796.9} {"step": 29233, "train_loss": 3.175732135772705, "lr": 4.1678231456506525e-05, "tps": 114030, "wall": 16801.4} {"step": 29234, "train_loss": 3.0781540870666504, "lr": 4.167562246848315e-05, "tps": 114004, "wall": 16805.9} {"step": 29235, "train_loss": 3.2268104553222656, "lr": 4.167301550052794e-05, "tps": 113978, "wall": 16810.3} {"step": 29236, "train_loss": 3.094350814819336, "lr": 4.167041055267047e-05, "tps": 113951, "wall": 16814.8} {"step": 29237, "train_loss": 3.0763516426086426, "lr": 4.166780762494024e-05, "tps": 113925, "wall": 16819.3} {"step": 29238, "train_loss": 3.193124771118164, "lr": 4.166520671736672e-05, "tps": 113899, "wall": 16823.7} {"step": 29239, "train_loss": 3.1464438438415527, "lr": 4.166260782997939e-05, "tps": 113872, "wall": 16828.2} {"step": 29240, "train_loss": 3.1442489624023438, "lr": 4.166001096280771e-05, "tps": 113846, "wall": 16832.7} {"step": 29241, "train_loss": 3.117447853088379, "lr": 4.165741611588106e-05, "tps": 113820, "wall": 16837.1} {"step": 29242, "train_loss": 3.1872763633728027, "lr": 4.165482328922884e-05, "tps": 113793, "wall": 16841.6} {"step": 29243, "train_loss": 3.194584846496582, "lr": 4.165223248288042e-05, "tps": 113767, "wall": 16846.0} {"step": 29244, "train_loss": 3.1604397296905518, "lr": 4.1649643696865186e-05, "tps": 113741, "wall": 16850.5} {"step": 29245, "train_loss": 3.1416611671447754, "lr": 4.1647056931212426e-05, "tps": 113715, "wall": 16855.0} {"step": 29246, "train_loss": 3.1183063983917236, "lr": 4.164447218595144e-05, "tps": 113688, "wall": 16859.5} {"step": 29247, "train_loss": 3.2871103286743164, "lr": 4.164188946111155e-05, "tps": 113662, "wall": 16863.9} {"step": 29248, "train_loss": 3.0766642093658447, "lr": 4.1639308756721964e-05, "tps": 113636, "wall": 16868.4} {"step": 29249, "train_loss": 3.1166093349456787, "lr": 4.163673007281194e-05, "tps": 113610, "wall": 16872.9} {"step": 29250, "train_loss": 3.125580310821533, "lr": 4.163415340941069e-05, "tps": 113583, "wall": 16877.3} {"step": 29251, "train_loss": 3.214657783508301, "lr": 4.1631578766547405e-05, "tps": 113557, "wall": 16881.8} {"step": 29252, "train_loss": 3.1843533515930176, "lr": 4.1629006144251256e-05, "tps": 113531, "wall": 16886.3} {"step": 29253, "train_loss": 3.0582990646362305, "lr": 4.162643554255135e-05, "tps": 113505, "wall": 16890.7} {"step": 29254, "train_loss": 3.1674556732177734, "lr": 4.162386696147683e-05, "tps": 113479, "wall": 16895.2} {"step": 29255, "train_loss": 3.164547920227051, "lr": 4.16213004010568e-05, "tps": 113453, "wall": 16899.7} {"step": 29256, "train_loss": 3.104335308074951, "lr": 4.161873586132035e-05, "tps": 113427, "wall": 16904.1} {"step": 29257, "train_loss": 3.153360366821289, "lr": 4.161617334229649e-05, "tps": 113401, "wall": 16908.6} {"step": 29258, "train_loss": 3.1110196113586426, "lr": 4.1613612844014275e-05, "tps": 113375, "wall": 16913.1} {"step": 29259, "train_loss": 3.1513688564300537, "lr": 4.1611054366502706e-05, "tps": 113349, "wall": 16917.5} {"step": 29260, "train_loss": 3.149960517883301, "lr": 4.160849790979077e-05, "tps": 113322, "wall": 16922.0} {"step": 29261, "train_loss": 3.124903678894043, "lr": 4.1605943473907404e-05, "tps": 113296, "wall": 16926.5} {"step": 29262, "train_loss": 3.0932400226593018, "lr": 4.160339105888157e-05, "tps": 113270, "wall": 16930.9} {"step": 29263, "train_loss": 3.072909355163574, "lr": 4.160084066474217e-05, "tps": 113244, "wall": 16935.4} {"step": 29264, "train_loss": 3.1484487056732178, "lr": 4.159829229151811e-05, "tps": 113218, "wall": 16939.8} {"step": 29265, "train_loss": 3.186227798461914, "lr": 4.159574593923824e-05, "tps": 113192, "wall": 16944.3} {"step": 29266, "train_loss": 3.0621886253356934, "lr": 4.15932016079314e-05, "tps": 113167, "wall": 16948.8} {"step": 29267, "train_loss": 3.0980796813964844, "lr": 4.159065929762642e-05, "tps": 113141, "wall": 16953.2} {"step": 29268, "train_loss": 3.2844040393829346, "lr": 4.1588119008352125e-05, "tps": 113115, "wall": 16957.7} {"step": 29269, "train_loss": 3.1430294513702393, "lr": 4.1585580740137277e-05, "tps": 113089, "wall": 16962.1} {"step": 29270, "train_loss": 3.165555000305176, "lr": 4.15830444930106e-05, "tps": 113063, "wall": 16966.6} {"step": 29271, "train_loss": 3.128067970275879, "lr": 4.158051026700086e-05, "tps": 113037, "wall": 16971.1} {"step": 29272, "train_loss": 3.00984787940979, "lr": 4.1577978062136745e-05, "tps": 113011, "wall": 16975.5} {"step": 29273, "train_loss": 3.1156935691833496, "lr": 4.157544787844692e-05, "tps": 112985, "wall": 16980.0} {"step": 29274, "train_loss": 3.137624740600586, "lr": 4.157291971596012e-05, "tps": 112960, "wall": 16984.5} {"step": 29275, "train_loss": 3.1076111793518066, "lr": 4.15703935747049e-05, "tps": 112934, "wall": 16988.9} {"step": 29276, "train_loss": 3.219961404800415, "lr": 4.156786945470995e-05, "tps": 112908, "wall": 16993.4} {"step": 29277, "train_loss": 3.177292823791504, "lr": 4.15653473560038e-05, "tps": 112882, "wall": 16997.8} {"step": 29278, "train_loss": 3.174929141998291, "lr": 4.156282727861506e-05, "tps": 112856, "wall": 17002.3} {"step": 29279, "train_loss": 3.2213945388793945, "lr": 4.156030922257228e-05, "tps": 112831, "wall": 17006.8} {"step": 29280, "train_loss": 3.142174005508423, "lr": 4.155779318790395e-05, "tps": 112805, "wall": 17011.2} {"step": 29281, "train_loss": 3.087942600250244, "lr": 4.1555279174638584e-05, "tps": 112779, "wall": 17015.7} {"step": 29282, "train_loss": 3.1502490043640137, "lr": 4.15527671828047e-05, "tps": 112754, "wall": 17020.2} {"step": 29283, "train_loss": 3.1974611282348633, "lr": 4.1550257212430696e-05, "tps": 112728, "wall": 17024.6} {"step": 29284, "train_loss": 3.047607421875, "lr": 4.1547749263545055e-05, "tps": 112702, "wall": 17029.1} {"step": 29285, "train_loss": 3.1915807723999023, "lr": 4.154524333617614e-05, "tps": 112677, "wall": 17033.5} {"step": 29286, "train_loss": 3.0758183002471924, "lr": 4.1542739430352387e-05, "tps": 112651, "wall": 17038.0} {"step": 29287, "train_loss": 3.137942314147949, "lr": 4.154023754610211e-05, "tps": 112625, "wall": 17042.5} {"step": 29288, "train_loss": 3.2531018257141113, "lr": 4.15377376834537e-05, "tps": 112599, "wall": 17046.9} {"step": 29289, "train_loss": 3.188516616821289, "lr": 4.1535239842435444e-05, "tps": 112574, "wall": 17051.4} {"step": 29290, "train_loss": 3.152985095977783, "lr": 4.1532744023075634e-05, "tps": 112548, "wall": 17055.9} {"step": 29291, "train_loss": 3.101269006729126, "lr": 4.153025022540257e-05, "tps": 112523, "wall": 17060.3} {"step": 29292, "train_loss": 3.1158974170684814, "lr": 4.152775844944449e-05, "tps": 112497, "wall": 17064.8} {"step": 29293, "train_loss": 3.1500091552734375, "lr": 4.1525268695229606e-05, "tps": 112471, "wall": 17069.3} {"step": 29294, "train_loss": 3.2059340476989746, "lr": 4.1522780962786146e-05, "tps": 112446, "wall": 17073.7} {"step": 29295, "train_loss": 3.207782745361328, "lr": 4.152029525214226e-05, "tps": 112420, "wall": 17078.2} {"step": 29296, "train_loss": 3.1037776470184326, "lr": 4.1517811563326134e-05, "tps": 112395, "wall": 17082.6} {"step": 29297, "train_loss": 3.093806028366089, "lr": 4.15153298963659e-05, "tps": 112369, "wall": 17087.1} {"step": 29298, "train_loss": 3.0843727588653564, "lr": 4.1512850251289654e-05, "tps": 112344, "wall": 17091.6} {"step": 29299, "train_loss": 3.0946006774902344, "lr": 4.15103726281255e-05, "tps": 112318, "wall": 17096.0} {"step": 29300, "train_loss": 3.1886353492736816, "lr": 4.1507897026901503e-05, "tps": 112292, "wall": 17100.5} {"step": 29301, "train_loss": 3.1556224822998047, "lr": 4.15054234476457e-05, "tps": 112267, "wall": 17105.0} {"step": 29302, "train_loss": 3.1396584510803223, "lr": 4.1502951890386125e-05, "tps": 112242, "wall": 17109.5} {"step": 29303, "train_loss": 3.1256072521209717, "lr": 4.150048235515078e-05, "tps": 112216, "wall": 17113.9} {"step": 29304, "train_loss": 3.162691116333008, "lr": 4.14980148419676e-05, "tps": 112191, "wall": 17118.4} {"step": 29305, "train_loss": 3.046442985534668, "lr": 4.1495549350864584e-05, "tps": 112165, "wall": 17122.8} {"step": 29306, "train_loss": 3.117769956588745, "lr": 4.1493085881869633e-05, "tps": 112140, "wall": 17127.3} {"step": 29307, "train_loss": 3.072683334350586, "lr": 4.149062443501065e-05, "tps": 112114, "wall": 17131.8} {"step": 29308, "train_loss": 3.176692008972168, "lr": 4.148816501031555e-05, "tps": 112089, "wall": 17136.3} {"step": 29309, "train_loss": 3.147373676300049, "lr": 4.148570760781216e-05, "tps": 112064, "wall": 17140.7} {"step": 29310, "train_loss": 3.2325973510742188, "lr": 4.148325222752835e-05, "tps": 112038, "wall": 17145.2} {"step": 29311, "train_loss": 3.1579840183258057, "lr": 4.14807988694919e-05, "tps": 112013, "wall": 17149.6} {"step": 29312, "train_loss": 3.210052967071533, "lr": 4.1478347533730626e-05, "tps": 111988, "wall": 17154.1} {"step": 29313, "train_loss": 3.1728694438934326, "lr": 4.1475898220272295e-05, "tps": 111963, "wall": 17158.5} {"step": 29314, "train_loss": 3.1700243949890137, "lr": 4.1473450929144645e-05, "tps": 111937, "wall": 17163.1} {"step": 29315, "train_loss": 3.251513957977295, "lr": 4.147100566037538e-05, "tps": 111912, "wall": 17167.5} {"step": 29316, "train_loss": 3.0876412391662598, "lr": 4.1468562413992246e-05, "tps": 111886, "wall": 17172.0} {"step": 29317, "train_loss": 3.1269545555114746, "lr": 4.1466121190022894e-05, "tps": 111861, "wall": 17176.4} {"step": 29318, "train_loss": 3.173057794570923, "lr": 4.146368198849495e-05, "tps": 111836, "wall": 17180.9} {"step": 29319, "train_loss": 3.2509994506835938, "lr": 4.1461244809436105e-05, "tps": 111811, "wall": 17185.4} {"step": 29320, "train_loss": 3.159116744995117, "lr": 4.145880965287393e-05, "tps": 111786, "wall": 17189.8} {"step": 29321, "train_loss": 3.215064764022827, "lr": 4.145637651883602e-05, "tps": 111760, "wall": 17194.3} {"step": 29322, "train_loss": 3.1522440910339355, "lr": 4.145394540734994e-05, "tps": 111735, "wall": 17198.8} {"step": 29323, "train_loss": 3.1745777130126953, "lr": 4.145151631844322e-05, "tps": 111710, "wall": 17203.3} {"step": 29324, "train_loss": 3.156898260116577, "lr": 4.144908925214336e-05, "tps": 111685, "wall": 17207.7} {"step": 29325, "train_loss": 3.223104953765869, "lr": 4.14466642084779e-05, "tps": 111659, "wall": 17212.2} {"step": 29326, "train_loss": 3.2000715732574463, "lr": 4.144424118747429e-05, "tps": 111634, "wall": 17216.6} {"step": 29327, "train_loss": 3.084327220916748, "lr": 4.144182018915996e-05, "tps": 111609, "wall": 17221.1} {"step": 29328, "train_loss": 3.253939151763916, "lr": 4.1439401213562374e-05, "tps": 111584, "wall": 17225.6} {"step": 29329, "train_loss": 3.308043956756592, "lr": 4.1436984260708894e-05, "tps": 111559, "wall": 17230.0} {"step": 29330, "train_loss": 3.2309978008270264, "lr": 4.143456933062691e-05, "tps": 111534, "wall": 17234.5} {"step": 29331, "train_loss": 3.0543346405029297, "lr": 4.143215642334381e-05, "tps": 111509, "wall": 17239.0} {"step": 29332, "train_loss": 3.1873488426208496, "lr": 4.142974553888688e-05, "tps": 111484, "wall": 17243.4} {"step": 29333, "train_loss": 3.1816282272338867, "lr": 4.142733667728345e-05, "tps": 111458, "wall": 17247.9} {"step": 29334, "train_loss": 3.178791046142578, "lr": 4.1424929838560825e-05, "tps": 111433, "wall": 17252.4} {"step": 29335, "train_loss": 3.098242998123169, "lr": 4.1422525022746264e-05, "tps": 111409, "wall": 17256.8} {"step": 29336, "train_loss": 3.125157356262207, "lr": 4.142012222986698e-05, "tps": 111383, "wall": 17261.3} {"step": 29337, "train_loss": 3.191504955291748, "lr": 4.141772145995024e-05, "tps": 111359, "wall": 17265.7} {"step": 29338, "train_loss": 3.1982204914093018, "lr": 4.141532271302316e-05, "tps": 111334, "wall": 17270.2} {"step": 29339, "train_loss": 3.1963515281677246, "lr": 4.141292598911301e-05, "tps": 111309, "wall": 17274.7} {"step": 29340, "train_loss": 3.156777858734131, "lr": 4.141053128824688e-05, "tps": 111283, "wall": 17279.2} {"step": 29341, "train_loss": 3.1428518295288086, "lr": 4.140813861045193e-05, "tps": 111258, "wall": 17283.6} {"step": 29342, "train_loss": 3.202615976333618, "lr": 4.140574795575523e-05, "tps": 111234, "wall": 17288.1} {"step": 29343, "train_loss": 3.142617702484131, "lr": 4.140335932418389e-05, "tps": 111209, "wall": 17292.5} {"step": 29344, "train_loss": 3.0977277755737305, "lr": 4.140097271576494e-05, "tps": 111184, "wall": 17297.0} {"step": 29345, "train_loss": 3.2096943855285645, "lr": 4.1398588130525454e-05, "tps": 111159, "wall": 17301.5} {"step": 29346, "train_loss": 3.177654504776001, "lr": 4.1396205568492406e-05, "tps": 111134, "wall": 17305.9} {"step": 29347, "train_loss": 3.2364044189453125, "lr": 4.1393825029692826e-05, "tps": 111109, "wall": 17310.4} {"step": 29348, "train_loss": 3.1438493728637695, "lr": 4.139144651415364e-05, "tps": 111084, "wall": 17314.9} {"step": 29349, "train_loss": 3.0703134536743164, "lr": 4.138907002190181e-05, "tps": 111059, "wall": 17319.3} {"step": 29350, "train_loss": 3.02639102935791, "lr": 4.138669555296426e-05, "tps": 111034, "wall": 17323.8} {"step": 29351, "train_loss": 3.0848376750946045, "lr": 4.13843231073679e-05, "tps": 111010, "wall": 17328.2} {"step": 29352, "train_loss": 3.119215726852417, "lr": 4.1381952685139574e-05, "tps": 110985, "wall": 17332.7} {"step": 29353, "train_loss": 3.1963582038879395, "lr": 4.1379584286306144e-05, "tps": 110960, "wall": 17337.2} {"step": 29354, "train_loss": 3.2416296005249023, "lr": 4.137721791089446e-05, "tps": 110935, "wall": 17341.7} {"step": 29355, "train_loss": 3.2332725524902344, "lr": 4.1374853558931306e-05, "tps": 110910, "wall": 17346.2} {"step": 29356, "train_loss": 3.1892220973968506, "lr": 4.13724912304435e-05, "tps": 110885, "wall": 17350.6} {"step": 29357, "train_loss": 3.2413909435272217, "lr": 4.1370130925457764e-05, "tps": 110861, "wall": 17355.1} {"step": 29358, "train_loss": 3.2025389671325684, "lr": 4.136777264400082e-05, "tps": 110836, "wall": 17359.6} {"step": 29359, "train_loss": 3.139317512512207, "lr": 4.1365416386099456e-05, "tps": 110811, "wall": 17364.0} {"step": 29360, "train_loss": 3.1493582725524902, "lr": 4.136306215178029e-05, "tps": 110787, "wall": 17368.5} {"step": 29361, "train_loss": 3.1117160320281982, "lr": 4.136070994107003e-05, "tps": 110762, "wall": 17372.9} {"step": 29362, "train_loss": 3.151987075805664, "lr": 4.1358359753995304e-05, "tps": 110737, "wall": 17377.4} {"step": 29363, "train_loss": 3.187458038330078, "lr": 4.135601159058275e-05, "tps": 110713, "wall": 17381.9} {"step": 29364, "train_loss": 3.1357831954956055, "lr": 4.1353665450858956e-05, "tps": 110688, "wall": 17386.3} {"step": 29365, "train_loss": 3.128371477127075, "lr": 4.135132133485051e-05, "tps": 110663, "wall": 17390.8} {"step": 29366, "train_loss": 3.181626319885254, "lr": 4.1348979242583964e-05, "tps": 110639, "wall": 17395.2} {"step": 29367, "train_loss": 3.124204635620117, "lr": 4.1346639174085825e-05, "tps": 110614, "wall": 17399.8} {"step": 29368, "train_loss": 3.1881356239318848, "lr": 4.134430112938264e-05, "tps": 110589, "wall": 17404.2} {"step": 29369, "train_loss": 3.2309908866882324, "lr": 4.134196510850087e-05, "tps": 110565, "wall": 17408.7} {"step": 29370, "train_loss": 3.158371925354004, "lr": 4.1339631111467006e-05, "tps": 110540, "wall": 17413.2} {"step": 29371, "train_loss": 3.1674818992614746, "lr": 4.1337299138307455e-05, "tps": 110515, "wall": 17417.6} {"step": 29372, "train_loss": 3.1812081336975098, "lr": 4.133496918904863e-05, "tps": 110491, "wall": 17422.1} {"step": 29373, "train_loss": 3.197606325149536, "lr": 4.133264126371694e-05, "tps": 110467, "wall": 17426.5} {"step": 29374, "train_loss": 3.111636161804199, "lr": 4.133031536233877e-05, "tps": 110442, "wall": 17431.0} {"step": 29375, "train_loss": 3.1298952102661133, "lr": 4.1327991484940454e-05, "tps": 110417, "wall": 17435.4} {"step": 29376, "train_loss": 3.1626992225646973, "lr": 4.1325669631548306e-05, "tps": 110393, "wall": 17439.9} {"step": 29377, "train_loss": 3.1735429763793945, "lr": 4.132334980218866e-05, "tps": 110369, "wall": 17444.4} {"step": 29378, "train_loss": 3.0475544929504395, "lr": 4.1321031996887744e-05, "tps": 110344, "wall": 17448.8} {"step": 29379, "train_loss": 3.2085204124450684, "lr": 4.131871621567185e-05, "tps": 110320, "wall": 17453.3} {"step": 29380, "train_loss": 3.1898133754730225, "lr": 4.131640245856723e-05, "tps": 110295, "wall": 17457.7} {"step": 29381, "train_loss": 3.2063839435577393, "lr": 4.131409072560003e-05, "tps": 110270, "wall": 17462.2} {"step": 29382, "train_loss": 3.231541633605957, "lr": 4.1311781016796515e-05, "tps": 110246, "wall": 17466.7} {"step": 29383, "train_loss": 3.140559673309326, "lr": 4.1309473332182775e-05, "tps": 110222, "wall": 17471.2} {"step": 29384, "train_loss": 3.163989782333374, "lr": 4.130716767178501e-05, "tps": 110197, "wall": 17475.6} {"step": 29385, "train_loss": 3.1686630249023438, "lr": 4.130486403562932e-05, "tps": 110173, "wall": 17480.1} {"step": 29386, "train_loss": 3.1268296241760254, "lr": 4.13025624237418e-05, "tps": 110149, "wall": 17484.5} {"step": 29387, "train_loss": 3.0545759201049805, "lr": 4.130026283614851e-05, "tps": 110124, "wall": 17489.0} {"step": 29388, "train_loss": 3.1487715244293213, "lr": 4.1297965272875514e-05, "tps": 110100, "wall": 17493.5} {"step": 29389, "train_loss": 3.2792716026306152, "lr": 4.129566973394882e-05, "tps": 110075, "wall": 17498.0} {"step": 29390, "train_loss": 3.1879186630249023, "lr": 4.129337621939446e-05, "tps": 110051, "wall": 17502.4} {"step": 29391, "train_loss": 3.203582525253296, "lr": 4.129108472923842e-05, "tps": 110027, "wall": 17506.9} {"step": 29392, "train_loss": 3.1843957901000977, "lr": 4.128879526350662e-05, "tps": 110002, "wall": 17511.4} {"step": 29393, "train_loss": 3.1581578254699707, "lr": 4.128650782222501e-05, "tps": 109978, "wall": 17515.8} {"step": 29394, "train_loss": 3.142303466796875, "lr": 4.128422240541953e-05, "tps": 109953, "wall": 17520.4} {"step": 29395, "train_loss": 3.1100587844848633, "lr": 4.1281939013116e-05, "tps": 109929, "wall": 17524.8} {"step": 29396, "train_loss": 3.240601062774658, "lr": 4.1279657645340375e-05, "tps": 109905, "wall": 17529.3} {"step": 29397, "train_loss": 3.182947874069214, "lr": 4.127737830211847e-05, "tps": 109881, "wall": 17533.7} {"step": 29398, "train_loss": 3.141672134399414, "lr": 4.1275100983476044e-05, "tps": 109857, "wall": 17538.2} {"step": 29399, "train_loss": 3.1326873302459717, "lr": 4.127282568943899e-05, "tps": 109832, "wall": 17542.7} {"step": 29400, "train_loss": 3.169435501098633, "lr": 4.127055242003301e-05, "tps": 109808, "wall": 17547.1} {"step": 29401, "train_loss": 3.1116294860839844, "lr": 4.1268281175283874e-05, "tps": 109784, "wall": 17551.6} {"step": 29402, "train_loss": 3.148650646209717, "lr": 4.126601195521734e-05, "tps": 109760, "wall": 17556.0} {"step": 29403, "train_loss": 2.967621088027954, "lr": 4.126374475985907e-05, "tps": 109736, "wall": 17560.5} {"step": 29404, "train_loss": 3.1232380867004395, "lr": 4.12614795892348e-05, "tps": 109712, "wall": 17564.9} {"step": 29405, "train_loss": 3.1423850059509277, "lr": 4.125921644337012e-05, "tps": 109687, "wall": 17569.4} {"step": 29406, "train_loss": 3.1804463863372803, "lr": 4.1256955322290736e-05, "tps": 109663, "wall": 17573.8} {"step": 29407, "train_loss": 3.1456081867218018, "lr": 4.125469622602222e-05, "tps": 109639, "wall": 17578.3} {"step": 29408, "train_loss": 3.1039838790893555, "lr": 4.1252439154590186e-05, "tps": 109615, "wall": 17582.8} {"step": 29409, "train_loss": 3.308837890625, "lr": 4.125018410802017e-05, "tps": 109591, "wall": 17587.3} {"step": 29410, "train_loss": 3.153748035430908, "lr": 4.124793108633775e-05, "tps": 109567, "wall": 17591.7} {"step": 29411, "train_loss": 3.2369384765625, "lr": 4.124568008956845e-05, "tps": 109542, "wall": 17596.3} {"step": 29412, "train_loss": 3.204155921936035, "lr": 4.1243431117737726e-05, "tps": 109518, "wall": 17600.7} {"step": 29413, "train_loss": 3.170889377593994, "lr": 4.124118417087112e-05, "tps": 109494, "wall": 17605.2} {"step": 29414, "train_loss": 3.116257667541504, "lr": 4.1238939248994025e-05, "tps": 109470, "wall": 17609.6} {"step": 29415, "train_loss": 3.134065628051758, "lr": 4.1236696352131905e-05, "tps": 109446, "wall": 17614.1} {"step": 29416, "train_loss": 3.169001579284668, "lr": 4.1234455480310165e-05, "tps": 109422, "wall": 17618.5} {"step": 29417, "train_loss": 3.311513662338257, "lr": 4.1232216633554155e-05, "tps": 109399, "wall": 17623.0} {"step": 29418, "train_loss": 3.1553237438201904, "lr": 4.1229979811889306e-05, "tps": 109374, "wall": 17627.5} {"step": 29419, "train_loss": 3.223764419555664, "lr": 4.122774501534089e-05, "tps": 109351, "wall": 17631.9} {"step": 29420, "train_loss": 3.1273608207702637, "lr": 4.122551224393427e-05, "tps": 109327, "wall": 17636.4} {"step": 29421, "train_loss": 3.241666316986084, "lr": 4.122328149769472e-05, "tps": 109302, "wall": 17640.9} {"step": 29422, "train_loss": 3.2392847537994385, "lr": 4.1221052776647504e-05, "tps": 109278, "wall": 17645.4} {"step": 29423, "train_loss": 3.225844383239746, "lr": 4.121882608081786e-05, "tps": 109255, "wall": 17649.8} {"step": 29424, "train_loss": 3.0770857334136963, "lr": 4.121660141023103e-05, "tps": 109231, "wall": 17654.3} {"step": 29425, "train_loss": 3.1814041137695312, "lr": 4.121437876491222e-05, "tps": 109207, "wall": 17658.7} {"step": 29426, "train_loss": 3.2732534408569336, "lr": 4.1212158144886595e-05, "tps": 109183, "wall": 17663.2} {"step": 29427, "train_loss": 3.210693836212158, "lr": 4.1209939550179314e-05, "tps": 109159, "wall": 17667.7} {"step": 29428, "train_loss": 3.0275285243988037, "lr": 4.120772298081551e-05, "tps": 109135, "wall": 17672.1} {"step": 29429, "train_loss": 3.0996994972229004, "lr": 4.120550843682029e-05, "tps": 109111, "wall": 17676.6} {"step": 29430, "train_loss": 3.2536139488220215, "lr": 4.120329591821874e-05, "tps": 109088, "wall": 17681.0} {"step": 29431, "train_loss": 3.197237730026245, "lr": 4.120108542503595e-05, "tps": 109064, "wall": 17685.5} {"step": 29432, "train_loss": 3.122036933898926, "lr": 4.1198876957296915e-05, "tps": 109040, "wall": 17690.0} {"step": 29433, "train_loss": 3.114132881164551, "lr": 4.1196670515026684e-05, "tps": 109016, "wall": 17694.4} {"step": 29434, "train_loss": 3.1829264163970947, "lr": 4.1194466098250225e-05, "tps": 108992, "wall": 17698.9} {"step": 29435, "train_loss": 3.0699172019958496, "lr": 4.119226370699254e-05, "tps": 108968, "wall": 17703.4} {"step": 29436, "train_loss": 3.1941001415252686, "lr": 4.119006334127857e-05, "tps": 108945, "wall": 17707.8} {"step": 29437, "train_loss": 3.123490810394287, "lr": 4.118786500113323e-05, "tps": 108921, "wall": 17712.3} {"step": 29438, "train_loss": 3.04386830329895, "lr": 4.118566868658144e-05, "tps": 108897, "wall": 17716.8} {"step": 29439, "train_loss": 3.222740888595581, "lr": 4.1183474397648066e-05, "tps": 108873, "wall": 17721.2} {"step": 29440, "train_loss": 3.113203525543213, "lr": 4.118128213435795e-05, "tps": 108850, "wall": 17725.7} {"step": 29441, "train_loss": 3.1914775371551514, "lr": 4.1179091896735955e-05, "tps": 108826, "wall": 17730.2} {"step": 29442, "train_loss": 3.040553569793701, "lr": 4.117690368480688e-05, "tps": 108802, "wall": 17734.6} {"step": 29443, "train_loss": 3.0957305431365967, "lr": 4.117471749859552e-05, "tps": 108779, "wall": 17739.1} {"step": 29444, "train_loss": 3.1204442977905273, "lr": 4.117253333812663e-05, "tps": 108755, "wall": 17743.6} {"step": 29445, "train_loss": 3.0767831802368164, "lr": 4.117035120342496e-05, "tps": 108731, "wall": 17748.0} {"step": 29446, "train_loss": 3.122732639312744, "lr": 4.116817109451522e-05, "tps": 108708, "wall": 17752.5} {"step": 29447, "train_loss": 3.1033589839935303, "lr": 4.116599301142211e-05, "tps": 108684, "wall": 17756.9} {"step": 29448, "train_loss": 3.1062238216400146, "lr": 4.11638169541703e-05, "tps": 108660, "wall": 17761.4} {"step": 29449, "train_loss": 3.1725869178771973, "lr": 4.116164292278446e-05, "tps": 108637, "wall": 17765.9} {"step": 29450, "train_loss": 3.2217202186584473, "lr": 4.11594709172892e-05, "tps": 108613, "wall": 17770.4} {"step": 29451, "train_loss": 3.2103335857391357, "lr": 4.1157300937709145e-05, "tps": 108589, "wall": 17774.8} {"step": 29452, "train_loss": 3.1056759357452393, "lr": 4.1155132984068834e-05, "tps": 108566, "wall": 17779.3} {"step": 29453, "train_loss": 3.1968202590942383, "lr": 4.1152967056392886e-05, "tps": 108542, "wall": 17783.7} {"step": 29454, "train_loss": 3.1052708625793457, "lr": 4.1150803154705764e-05, "tps": 108519, "wall": 17788.2} {"step": 29455, "train_loss": 3.196845531463623, "lr": 4.114864127903203e-05, "tps": 108495, "wall": 17792.6} {"step": 29456, "train_loss": 3.158599376678467, "lr": 4.114648142939619e-05, "tps": 108472, "wall": 17797.1} {"step": 29457, "train_loss": 3.110391855239868, "lr": 4.1144323605822644e-05, "tps": 108448, "wall": 17801.6} {"step": 29458, "train_loss": 3.208831310272217, "lr": 4.11421678083359e-05, "tps": 108425, "wall": 17806.0} {"step": 29459, "train_loss": 3.112602710723877, "lr": 4.114001403696035e-05, "tps": 108401, "wall": 17810.5} {"step": 29460, "train_loss": 3.1682279109954834, "lr": 4.1137862291720384e-05, "tps": 108378, "wall": 17814.9} {"step": 29461, "train_loss": 3.040984630584717, "lr": 4.113571257264042e-05, "tps": 108354, "wall": 17819.5} {"step": 29462, "train_loss": 3.073617458343506, "lr": 4.1133564879744753e-05, "tps": 108331, "wall": 17823.9} {"step": 29463, "train_loss": 3.18325138092041, "lr": 4.113141921305775e-05, "tps": 108307, "wall": 17828.4} {"step": 29464, "train_loss": 3.178476333618164, "lr": 4.112927557260372e-05, "tps": 108284, "wall": 17832.8} {"step": 29465, "train_loss": 3.2510101795196533, "lr": 4.11271339584069e-05, "tps": 108261, "wall": 17837.3} {"step": 29466, "train_loss": 3.214529037475586, "lr": 4.112499437049162e-05, "tps": 108237, "wall": 17841.7} {"step": 29467, "train_loss": 3.04628849029541, "lr": 4.112285680888207e-05, "tps": 108214, "wall": 17846.2} {"step": 29468, "train_loss": 3.0916452407836914, "lr": 4.1120721273602455e-05, "tps": 108190, "wall": 17850.7} {"step": 29469, "train_loss": 3.080540180206299, "lr": 4.1118587764677005e-05, "tps": 108167, "wall": 17855.1} {"step": 29470, "train_loss": 3.1966867446899414, "lr": 4.111645628212986e-05, "tps": 108144, "wall": 17859.6} {"step": 29471, "train_loss": 3.1521921157836914, "lr": 4.1114326825985186e-05, "tps": 108120, "wall": 17864.0} {"step": 29472, "train_loss": 3.183683395385742, "lr": 4.111219939626709e-05, "tps": 108097, "wall": 17868.5} {"step": 29473, "train_loss": 3.236736297607422, "lr": 4.1110073992999686e-05, "tps": 108074, "wall": 17873.0} {"step": 29474, "train_loss": 3.0934836864471436, "lr": 4.110795061620703e-05, "tps": 108051, "wall": 17877.4} {"step": 29475, "train_loss": 3.075753688812256, "lr": 4.110582926591319e-05, "tps": 108027, "wall": 17881.9} {"step": 29476, "train_loss": 3.2808451652526855, "lr": 4.1103709942142186e-05, "tps": 108004, "wall": 17886.4} {"step": 29477, "train_loss": 3.1427621841430664, "lr": 4.110159264491804e-05, "tps": 107980, "wall": 17890.9} {"step": 29478, "train_loss": 3.183161497116089, "lr": 4.109947737426475e-05, "tps": 107957, "wall": 17895.3} {"step": 29479, "train_loss": 3.2556166648864746, "lr": 4.109736413020622e-05, "tps": 107934, "wall": 17899.8} {"step": 29480, "train_loss": 3.1417605876922607, "lr": 4.109525291276645e-05, "tps": 107911, "wall": 17904.2} {"step": 29481, "train_loss": 3.0698795318603516, "lr": 4.109314372196936e-05, "tps": 107887, "wall": 17908.7} {"step": 29482, "train_loss": 3.205343246459961, "lr": 4.109103655783878e-05, "tps": 107864, "wall": 17913.1} {"step": 29483, "train_loss": 3.1115293502807617, "lr": 4.1088931420398624e-05, "tps": 107841, "wall": 17917.6} {"step": 29484, "train_loss": 3.204209327697754, "lr": 4.1086828309672736e-05, "tps": 107818, "wall": 17922.1} {"step": 29485, "train_loss": 3.0817344188690186, "lr": 4.108472722568492e-05, "tps": 107795, "wall": 17926.5} {"step": 29486, "train_loss": 3.203442096710205, "lr": 4.1082628168459026e-05, "tps": 107772, "wall": 17931.0} {"step": 29487, "train_loss": 3.0818917751312256, "lr": 4.108053113801877e-05, "tps": 107748, "wall": 17935.4} {"step": 29488, "train_loss": 3.1459882259368896, "lr": 4.107843613438795e-05, "tps": 107725, "wall": 17940.0} {"step": 29489, "train_loss": 3.197183609008789, "lr": 4.107634315759028e-05, "tps": 107702, "wall": 17944.4} {"step": 29490, "train_loss": 3.221484661102295, "lr": 4.1074252207649486e-05, "tps": 107679, "wall": 17948.9} {"step": 29491, "train_loss": 3.203037738800049, "lr": 4.107216328458922e-05, "tps": 107656, "wall": 17953.3} {"step": 29492, "train_loss": 3.1521081924438477, "lr": 4.10700763884332e-05, "tps": 107633, "wall": 17957.8} {"step": 29493, "train_loss": 3.060638904571533, "lr": 4.1067991519205016e-05, "tps": 107610, "wall": 17962.2} {"step": 29494, "train_loss": 3.153386354446411, "lr": 4.1065908676928285e-05, "tps": 107587, "wall": 17966.7} {"step": 29495, "train_loss": 3.190413236618042, "lr": 4.1063827861626646e-05, "tps": 107564, "wall": 17971.2} {"step": 29496, "train_loss": 3.1467695236206055, "lr": 4.106174907332363e-05, "tps": 107540, "wall": 17975.6} {"step": 29497, "train_loss": 3.124797821044922, "lr": 4.1059672312042824e-05, "tps": 107517, "wall": 17980.1} {"step": 29498, "train_loss": 3.209617853164673, "lr": 4.105759757780771e-05, "tps": 107494, "wall": 17984.5} {"step": 29499, "train_loss": 3.177503824234009, "lr": 4.105552487064181e-05, "tps": 107471, "wall": 17989.0} {"step": 29500, "train_loss": 3.1163625717163086, "lr": 4.105345419056863e-05, "tps": 107448, "wall": 17993.5} {"step": 29501, "train_loss": 3.0975894927978516, "lr": 4.105138553761159e-05, "tps": 107425, "wall": 17998.1} {"step": 29502, "train_loss": 3.3790011405944824, "lr": 4.1049318911794114e-05, "tps": 107401, "wall": 18002.6} {"step": 29503, "train_loss": 3.033000946044922, "lr": 4.1047254313139654e-05, "tps": 107378, "wall": 18007.0} {"step": 29504, "train_loss": 3.207622766494751, "lr": 4.1045191741671576e-05, "tps": 107355, "wall": 18011.5} {"step": 29505, "train_loss": 3.1574814319610596, "lr": 4.104313119741325e-05, "tps": 107332, "wall": 18016.0} {"step": 29506, "train_loss": 3.1495919227600098, "lr": 4.1041072680388016e-05, "tps": 107309, "wall": 18020.4} {"step": 29507, "train_loss": 3.085872173309326, "lr": 4.103901619061918e-05, "tps": 107286, "wall": 18024.9} {"step": 29508, "train_loss": 3.1606216430664062, "lr": 4.1036961728130054e-05, "tps": 107264, "wall": 18029.4} {"step": 29509, "train_loss": 3.229443073272705, "lr": 4.1034909292943926e-05, "tps": 107241, "wall": 18033.8} {"step": 29510, "train_loss": 3.173293113708496, "lr": 4.1032858885084e-05, "tps": 107218, "wall": 18038.3} {"step": 29511, "train_loss": 3.1434764862060547, "lr": 4.103081050457355e-05, "tps": 107195, "wall": 18042.7} {"step": 29512, "train_loss": 3.281360387802124, "lr": 4.102876415143575e-05, "tps": 107172, "wall": 18047.2} {"step": 29513, "train_loss": 3.103370189666748, "lr": 4.1026719825693805e-05, "tps": 107149, "wall": 18051.7} {"step": 29514, "train_loss": 3.1458418369293213, "lr": 4.102467752737085e-05, "tps": 107126, "wall": 18056.1} {"step": 29515, "train_loss": 3.1496927738189697, "lr": 4.1022637256490023e-05, "tps": 107103, "wall": 18060.6} {"step": 29516, "train_loss": 3.1975598335266113, "lr": 4.102059901307446e-05, "tps": 107081, "wall": 18065.1} {"step": 29517, "train_loss": 3.152456045150757, "lr": 4.101856279714722e-05, "tps": 107058, "wall": 18069.5} {"step": 29518, "train_loss": 3.1952133178710938, "lr": 4.1016528608731394e-05, "tps": 107035, "wall": 18074.0} {"step": 29519, "train_loss": 3.242422580718994, "lr": 4.101449644785e-05, "tps": 107012, "wall": 18078.5} {"step": 29520, "train_loss": 3.162619113922119, "lr": 4.1012466314526096e-05, "tps": 106989, "wall": 18082.9} {"step": 29521, "train_loss": 3.1089329719543457, "lr": 4.1010438208782624e-05, "tps": 106967, "wall": 18087.4} {"step": 29522, "train_loss": 3.150662899017334, "lr": 4.1008412130642626e-05, "tps": 106944, "wall": 18091.8} {"step": 29523, "train_loss": 3.1298787593841553, "lr": 4.100638808012899e-05, "tps": 106921, "wall": 18096.3} {"step": 29524, "train_loss": 3.0562589168548584, "lr": 4.100436605726469e-05, "tps": 106898, "wall": 18100.8} {"step": 29525, "train_loss": 3.1975769996643066, "lr": 4.100234606207261e-05, "tps": 106876, "wall": 18105.2} {"step": 29526, "train_loss": 3.2111172676086426, "lr": 4.1000328094575644e-05, "tps": 106853, "wall": 18109.7} {"step": 29527, "train_loss": 3.1058967113494873, "lr": 4.0998312154796636e-05, "tps": 106830, "wall": 18114.1} {"step": 29528, "train_loss": 3.258620023727417, "lr": 4.0996298242758444e-05, "tps": 106808, "wall": 18118.6} {"step": 29529, "train_loss": 3.2281270027160645, "lr": 4.099428635848387e-05, "tps": 106784, "wall": 18123.2} {"step": 29530, "train_loss": 3.2158992290496826, "lr": 4.099227650199569e-05, "tps": 106762, "wall": 18127.6} {"step": 29531, "train_loss": 3.1531758308410645, "lr": 4.099026867331669e-05, "tps": 106739, "wall": 18132.1} {"step": 29532, "train_loss": 3.1970248222351074, "lr": 4.0988262872469616e-05, "tps": 106716, "wall": 18136.5} {"step": 29533, "train_loss": 3.032912492752075, "lr": 4.098625909947717e-05, "tps": 106694, "wall": 18141.0} {"step": 29534, "train_loss": 3.2070367336273193, "lr": 4.098425735436208e-05, "tps": 106671, "wall": 18145.4} {"step": 29535, "train_loss": 3.2459824085235596, "lr": 4.0982257637147e-05, "tps": 106649, "wall": 18149.9} {"step": 29536, "train_loss": 3.181130886077881, "lr": 4.0980259947854594e-05, "tps": 106626, "wall": 18154.4} {"step": 29537, "train_loss": 3.1495065689086914, "lr": 4.097826428650747e-05, "tps": 106604, "wall": 18158.8} {"step": 29538, "train_loss": 3.133035182952881, "lr": 4.097627065312829e-05, "tps": 106581, "wall": 18163.3} {"step": 29539, "train_loss": 3.151489734649658, "lr": 4.0974279047739564e-05, "tps": 106558, "wall": 18167.8} {"step": 29540, "train_loss": 3.1636786460876465, "lr": 4.097228947036392e-05, "tps": 106536, "wall": 18172.2} {"step": 29541, "train_loss": 3.125941514968872, "lr": 4.097030192102387e-05, "tps": 106513, "wall": 18176.7} {"step": 29542, "train_loss": 3.1555521488189697, "lr": 4.0968316399741894e-05, "tps": 106490, "wall": 18181.2} {"step": 29543, "train_loss": 3.118478298187256, "lr": 4.096633290654053e-05, "tps": 106468, "wall": 18185.6} {"step": 29544, "train_loss": 3.091907024383545, "lr": 4.0964351441442235e-05, "tps": 106445, "wall": 18190.1} {"step": 29545, "train_loss": 3.2039449214935303, "lr": 4.096237200446944e-05, "tps": 106423, "wall": 18194.6} {"step": 29546, "train_loss": 3.1451821327209473, "lr": 4.09603945956446e-05, "tps": 106400, "wall": 18199.0} {"step": 29547, "train_loss": 3.193244218826294, "lr": 4.0958419214990084e-05, "tps": 106378, "wall": 18203.5} {"step": 29548, "train_loss": 3.208158254623413, "lr": 4.095644586252829e-05, "tps": 106355, "wall": 18207.9} {"step": 29549, "train_loss": 3.2796764373779297, "lr": 4.095447453828155e-05, "tps": 106333, "wall": 18212.4} {"step": 29550, "train_loss": 3.111649990081787, "lr": 4.0952505242272204e-05, "tps": 106311, "wall": 18216.9} {"step": 29551, "train_loss": 3.0732839107513428, "lr": 4.095053797452258e-05, "tps": 106288, "wall": 18221.3} {"step": 29552, "train_loss": 3.1529886722564697, "lr": 4.094857273505496e-05, "tps": 106265, "wall": 18225.9} {"step": 29553, "train_loss": 3.125821352005005, "lr": 4.094660952389157e-05, "tps": 106242, "wall": 18230.4} {"step": 29554, "train_loss": 3.1314549446105957, "lr": 4.094464834105468e-05, "tps": 106220, "wall": 18234.9} {"step": 29555, "train_loss": 3.1679627895355225, "lr": 4.094268918656652e-05, "tps": 106197, "wall": 18239.4} {"step": 29556, "train_loss": 3.1835854053497314, "lr": 4.0940732060449225e-05, "tps": 106175, "wall": 18243.9} {"step": 29557, "train_loss": 3.1435132026672363, "lr": 4.093877696272503e-05, "tps": 106152, "wall": 18248.3} {"step": 29558, "train_loss": 3.1925625801086426, "lr": 4.093682389341607e-05, "tps": 106130, "wall": 18252.8} {"step": 29559, "train_loss": 3.143918037414551, "lr": 4.093487285254443e-05, "tps": 106108, "wall": 18257.2} {"step": 29560, "train_loss": 3.0674800872802734, "lr": 4.093292384013225e-05, "tps": 106086, "wall": 18261.7} {"step": 29561, "train_loss": 3.265075206756592, "lr": 4.093097685620159e-05, "tps": 106063, "wall": 18266.1} {"step": 29562, "train_loss": 3.1423392295837402, "lr": 4.092903190077452e-05, "tps": 106041, "wall": 18270.6} {"step": 29563, "train_loss": 3.0648608207702637, "lr": 4.092708897387305e-05, "tps": 106019, "wall": 18275.0} {"step": 29564, "train_loss": 3.1732711791992188, "lr": 4.092514807551922e-05, "tps": 105996, "wall": 18279.5} {"step": 29565, "train_loss": 3.210916519165039, "lr": 4.092320920573499e-05, "tps": 105974, "wall": 18284.0} {"step": 29566, "train_loss": 3.0443434715270996, "lr": 4.092127236454234e-05, "tps": 105952, "wall": 18288.4} {"step": 29567, "train_loss": 3.2400765419006348, "lr": 4.0919337551963214e-05, "tps": 105930, "wall": 18292.9} {"step": 29568, "train_loss": 3.1191787719726562, "lr": 4.09174047680195e-05, "tps": 105908, "wall": 18297.3} {"step": 29569, "train_loss": 3.17777156829834, "lr": 4.091547401273311e-05, "tps": 105885, "wall": 18301.8} {"step": 29570, "train_loss": 3.169241428375244, "lr": 4.091354528612592e-05, "tps": 105863, "wall": 18306.3} {"step": 29571, "train_loss": 3.104562759399414, "lr": 4.09116185882198e-05, "tps": 105841, "wall": 18310.7} {"step": 29572, "train_loss": 3.064638614654541, "lr": 4.0909693919036535e-05, "tps": 105819, "wall": 18315.2} {"step": 29573, "train_loss": 3.2433042526245117, "lr": 4.090777127859796e-05, "tps": 105796, "wall": 18319.6} {"step": 29574, "train_loss": 2.9977223873138428, "lr": 4.090585066692584e-05, "tps": 105774, "wall": 18324.1} {"step": 29575, "train_loss": 3.1685450077056885, "lr": 4.090393208404191e-05, "tps": 105752, "wall": 18328.5} {"step": 29576, "train_loss": 3.1017889976501465, "lr": 4.090201552996795e-05, "tps": 105730, "wall": 18333.0} {"step": 29577, "train_loss": 3.1600635051727295, "lr": 4.0900101004725625e-05, "tps": 105708, "wall": 18337.5} {"step": 29578, "train_loss": 3.135814666748047, "lr": 4.0898188508336674e-05, "tps": 105686, "wall": 18341.9} {"step": 29579, "train_loss": 3.189697265625, "lr": 4.08962780408227e-05, "tps": 105664, "wall": 18346.4} {"step": 29580, "train_loss": 3.1259992122650146, "lr": 4.089436960220541e-05, "tps": 105642, "wall": 18350.8} {"step": 29581, "train_loss": 3.150343179702759, "lr": 4.0892463192506364e-05, "tps": 105620, "wall": 18355.3} {"step": 29582, "train_loss": 3.1736900806427, "lr": 4.089055881174719e-05, "tps": 105597, "wall": 18359.8} {"step": 29583, "train_loss": 3.153226852416992, "lr": 4.088865645994947e-05, "tps": 105575, "wall": 18364.2} {"step": 29584, "train_loss": 3.206918239593506, "lr": 4.088675613713474e-05, "tps": 105553, "wall": 18368.7} {"step": 29585, "train_loss": 3.0875210762023926, "lr": 4.0884857843324496e-05, "tps": 105531, "wall": 18373.2} {"step": 29586, "train_loss": 3.0799059867858887, "lr": 4.08829615785403e-05, "tps": 105509, "wall": 18377.6} {"step": 29587, "train_loss": 3.127958059310913, "lr": 4.088106734280359e-05, "tps": 105487, "wall": 18382.1} {"step": 29588, "train_loss": 3.089449167251587, "lr": 4.087917513613586e-05, "tps": 105465, "wall": 18386.6} {"step": 29589, "train_loss": 3.1279845237731934, "lr": 4.08772849585585e-05, "tps": 105442, "wall": 18391.1} {"step": 29590, "train_loss": 3.155815362930298, "lr": 4.087539681009297e-05, "tps": 105421, "wall": 18395.5} {"step": 29591, "train_loss": 3.10538911819458, "lr": 4.087351069076063e-05, "tps": 105399, "wall": 18400.0} {"step": 29592, "train_loss": 2.956897020339966, "lr": 4.087162660058284e-05, "tps": 105377, "wall": 18404.5} {"step": 29593, "train_loss": 3.1694211959838867, "lr": 4.086974453958095e-05, "tps": 105355, "wall": 18408.9} {"step": 29594, "train_loss": 3.1434760093688965, "lr": 4.086786450777629e-05, "tps": 105333, "wall": 18413.4} {"step": 29595, "train_loss": 3.099400043487549, "lr": 4.0865986505190175e-05, "tps": 105311, "wall": 18417.8} {"step": 29596, "train_loss": 3.1814701557159424, "lr": 4.0864110531843824e-05, "tps": 105288, "wall": 18422.4} {"step": 29597, "train_loss": 3.03334641456604, "lr": 4.086223658775854e-05, "tps": 105266, "wall": 18426.8} {"step": 29598, "train_loss": 3.219780921936035, "lr": 4.0860364672955514e-05, "tps": 105245, "wall": 18431.3} {"step": 29599, "train_loss": 3.097601890563965, "lr": 4.0858494787455976e-05, "tps": 105223, "wall": 18435.7} {"step": 29600, "train_loss": 3.115852117538452, "lr": 4.08566269312811e-05, "tps": 105201, "wall": 18440.2} {"step": 29601, "train_loss": 3.1261491775512695, "lr": 4.0854761104452065e-05, "tps": 105179, "wall": 18444.6} {"step": 29602, "train_loss": 3.263775110244751, "lr": 4.085289730698996e-05, "tps": 105157, "wall": 18449.1} {"step": 29603, "train_loss": 3.0861144065856934, "lr": 4.085103553891595e-05, "tps": 105135, "wall": 18453.6} {"step": 29604, "train_loss": 3.1556897163391113, "lr": 4.084917580025109e-05, "tps": 105113, "wall": 18458.0} {"step": 29605, "train_loss": 3.1216094493865967, "lr": 4.084731809101645e-05, "tps": 105092, "wall": 18462.5} {"step": 29606, "train_loss": 3.139967679977417, "lr": 4.084546241123309e-05, "tps": 105070, "wall": 18466.9} {"step": 29607, "train_loss": 3.1296889781951904, "lr": 4.0843608760922024e-05, "tps": 105048, "wall": 18471.4} {"step": 29608, "train_loss": 3.275071144104004, "lr": 4.084175714010425e-05, "tps": 105026, "wall": 18475.8} {"step": 29609, "train_loss": 3.123807668685913, "lr": 4.083990754880074e-05, "tps": 105004, "wall": 18480.4} {"step": 29610, "train_loss": 3.2648627758026123, "lr": 4.083805998703244e-05, "tps": 104982, "wall": 18484.8} {"step": 29611, "train_loss": 3.1799116134643555, "lr": 4.083621445482031e-05, "tps": 104960, "wall": 18489.3} {"step": 29612, "train_loss": 3.1550662517547607, "lr": 4.083437095218522e-05, "tps": 104939, "wall": 18493.7} {"step": 29613, "train_loss": 3.189282178878784, "lr": 4.0832529479148085e-05, "tps": 104917, "wall": 18498.2} {"step": 29614, "train_loss": 3.073474645614624, "lr": 4.083069003572974e-05, "tps": 104895, "wall": 18502.6} {"step": 29615, "train_loss": 3.1209659576416016, "lr": 4.082885262195101e-05, "tps": 104873, "wall": 18507.1} {"step": 29616, "train_loss": 3.1484875679016113, "lr": 4.0827017237832764e-05, "tps": 104852, "wall": 18511.6} {"step": 29617, "train_loss": 3.2440905570983887, "lr": 4.082518388339574e-05, "tps": 104830, "wall": 18516.0} {"step": 29618, "train_loss": 3.154754638671875, "lr": 4.0823352558660745e-05, "tps": 104808, "wall": 18520.5} {"step": 29619, "train_loss": 3.0628533363342285, "lr": 4.0821523263648476e-05, "tps": 104787, "wall": 18524.9} {"step": 29620, "train_loss": 3.0690016746520996, "lr": 4.081969599837973e-05, "tps": 104765, "wall": 18529.4} {"step": 29621, "train_loss": 3.2108936309814453, "lr": 4.081787076287511e-05, "tps": 104743, "wall": 18533.8} {"step": 29622, "train_loss": 3.166482925415039, "lr": 4.081604755715537e-05, "tps": 104722, "wall": 18538.3} {"step": 29623, "train_loss": 3.1174333095550537, "lr": 4.081422638124113e-05, "tps": 104700, "wall": 18542.8} {"step": 29624, "train_loss": 3.179483652114868, "lr": 4.0812407235153024e-05, "tps": 104678, "wall": 18547.2} {"step": 29625, "train_loss": 3.161836624145508, "lr": 4.081059011891169e-05, "tps": 104657, "wall": 18551.7} {"step": 29626, "train_loss": 3.147918701171875, "lr": 4.080877503253767e-05, "tps": 104635, "wall": 18556.2} {"step": 29627, "train_loss": 3.187680721282959, "lr": 4.0806961976051526e-05, "tps": 104613, "wall": 18560.6} {"step": 29628, "train_loss": 3.1442153453826904, "lr": 4.080515094947383e-05, "tps": 104592, "wall": 18565.1} {"step": 29629, "train_loss": 3.2887115478515625, "lr": 4.0803341952825047e-05, "tps": 104570, "wall": 18569.5} {"step": 29630, "train_loss": 3.2034895420074463, "lr": 4.080153498612573e-05, "tps": 104549, "wall": 18574.0} {"step": 29631, "train_loss": 3.2206363677978516, "lr": 4.0799730049396316e-05, "tps": 104527, "wall": 18578.5} {"step": 29632, "train_loss": 3.0812883377075195, "lr": 4.079792714265724e-05, "tps": 104506, "wall": 18582.9} {"step": 29633, "train_loss": 3.19348406791687, "lr": 4.079612626592896e-05, "tps": 104484, "wall": 18587.4} {"step": 29634, "train_loss": 3.1751675605773926, "lr": 4.079432741923184e-05, "tps": 104463, "wall": 18591.8} {"step": 29635, "train_loss": 3.1468465328216553, "lr": 4.079253060258629e-05, "tps": 104441, "wall": 18596.3} {"step": 29636, "train_loss": 3.2416799068450928, "lr": 4.079073581601263e-05, "tps": 104419, "wall": 18600.8} {"step": 29637, "train_loss": 3.122504949569702, "lr": 4.078894305953121e-05, "tps": 104398, "wall": 18605.3} {"step": 29638, "train_loss": 3.1843137741088867, "lr": 4.078715233316235e-05, "tps": 104376, "wall": 18609.7} {"step": 29639, "train_loss": 3.1976513862609863, "lr": 4.078536363692632e-05, "tps": 104355, "wall": 18614.2} {"step": 29640, "train_loss": 3.1728920936584473, "lr": 4.07835769708434e-05, "tps": 104333, "wall": 18618.7} {"step": 29641, "train_loss": 3.199981212615967, "lr": 4.078179233493379e-05, "tps": 104312, "wall": 18623.1} {"step": 29642, "train_loss": 3.244633197784424, "lr": 4.078000972921775e-05, "tps": 104290, "wall": 18627.6} {"step": 29643, "train_loss": 3.1576499938964844, "lr": 4.077822915371545e-05, "tps": 104269, "wall": 18632.0} {"step": 29644, "train_loss": 3.185018301010132, "lr": 4.077645060844705e-05, "tps": 104247, "wall": 18636.5} {"step": 29645, "train_loss": 3.18514347076416, "lr": 4.077467409343273e-05, "tps": 104226, "wall": 18641.0} {"step": 29646, "train_loss": 3.092254638671875, "lr": 4.07728996086926e-05, "tps": 104204, "wall": 18645.4} {"step": 29647, "train_loss": 3.1030654907226562, "lr": 4.0771127154246753e-05, "tps": 104183, "wall": 18649.9} {"step": 29648, "train_loss": 3.253922462463379, "lr": 4.076935673011527e-05, "tps": 104162, "wall": 18654.4} {"step": 29649, "train_loss": 3.1034791469573975, "lr": 4.076758833631822e-05, "tps": 104140, "wall": 18658.8} {"step": 29650, "train_loss": 3.2240679264068604, "lr": 4.076582197287562e-05, "tps": 104119, "wall": 18663.3} {"step": 29651, "train_loss": 3.1426825523376465, "lr": 4.07640576398075e-05, "tps": 104097, "wall": 18667.8} {"step": 29652, "train_loss": 3.1379003524780273, "lr": 4.076229533713381e-05, "tps": 104076, "wall": 18672.2} {"step": 29653, "train_loss": 3.022927761077881, "lr": 4.076053506487456e-05, "tps": 104054, "wall": 18676.7} {"step": 29654, "train_loss": 3.154644012451172, "lr": 4.075877682304964e-05, "tps": 104033, "wall": 18681.2} {"step": 29655, "train_loss": 3.1908140182495117, "lr": 4.075702061167899e-05, "tps": 104012, "wall": 18685.6} {"step": 29656, "train_loss": 3.129507064819336, "lr": 4.075526643078253e-05, "tps": 103991, "wall": 18690.1} {"step": 29657, "train_loss": 3.0581302642822266, "lr": 4.07535142803801e-05, "tps": 103969, "wall": 18694.5} {"step": 29658, "train_loss": 3.202308177947998, "lr": 4.0751764160491554e-05, "tps": 103948, "wall": 18699.0} {"step": 29659, "train_loss": 3.219456911087036, "lr": 4.075001607113672e-05, "tps": 103927, "wall": 18703.4} {"step": 29660, "train_loss": 3.1879234313964844, "lr": 4.07482700123354e-05, "tps": 103906, "wall": 18707.9} {"step": 29661, "train_loss": 3.135772228240967, "lr": 4.074652598410739e-05, "tps": 103884, "wall": 18712.4} {"step": 29662, "train_loss": 3.1549267768859863, "lr": 4.07447839864724e-05, "tps": 103863, "wall": 18716.8} {"step": 29663, "train_loss": 3.091730833053589, "lr": 4.074304401945022e-05, "tps": 103841, "wall": 18721.3} {"step": 29664, "train_loss": 3.1677258014678955, "lr": 4.0741306083060524e-05, "tps": 103820, "wall": 18725.8} {"step": 29665, "train_loss": 3.2151670455932617, "lr": 4.073957017732303e-05, "tps": 103799, "wall": 18730.3} {"step": 29666, "train_loss": 3.071831703186035, "lr": 4.073783630225736e-05, "tps": 103778, "wall": 18734.7} {"step": 29667, "train_loss": 3.1487770080566406, "lr": 4.073610445788317e-05, "tps": 103756, "wall": 18739.2} {"step": 29668, "train_loss": 3.047215461730957, "lr": 4.073437464422013e-05, "tps": 103735, "wall": 18743.6} {"step": 29669, "train_loss": 3.1882622241973877, "lr": 4.0732646861287735e-05, "tps": 103714, "wall": 18748.1} {"step": 29670, "train_loss": 3.1165335178375244, "lr": 4.073092110910566e-05, "tps": 103693, "wall": 18752.6} {"step": 29671, "train_loss": 3.1581921577453613, "lr": 4.07291973876934e-05, "tps": 103672, "wall": 18757.0} {"step": 29672, "train_loss": 3.0762135982513428, "lr": 4.0727475697070464e-05, "tps": 103651, "wall": 18761.5} {"step": 29673, "train_loss": 3.1596126556396484, "lr": 4.072575603725642e-05, "tps": 103630, "wall": 18765.9} {"step": 29674, "train_loss": 3.093862295150757, "lr": 4.072403840827069e-05, "tps": 103608, "wall": 18770.4} {"step": 29675, "train_loss": 3.128063678741455, "lr": 4.072232281013274e-05, "tps": 103587, "wall": 18774.9} {"step": 29676, "train_loss": 3.16623592376709, "lr": 4.072060924286205e-05, "tps": 103566, "wall": 18779.4} {"step": 29677, "train_loss": 3.1419498920440674, "lr": 4.0718897706477966e-05, "tps": 103545, "wall": 18783.8} {"step": 29678, "train_loss": 3.1010632514953613, "lr": 4.071718820099991e-05, "tps": 103524, "wall": 18788.3} {"step": 29679, "train_loss": 3.1468470096588135, "lr": 4.071548072644726e-05, "tps": 103503, "wall": 18792.7} {"step": 29680, "train_loss": 3.1486175060272217, "lr": 4.0713775282839346e-05, "tps": 103482, "wall": 18797.2} {"step": 29681, "train_loss": 3.153352737426758, "lr": 4.071207187019547e-05, "tps": 103461, "wall": 18801.6} {"step": 29682, "train_loss": 3.2002460956573486, "lr": 4.0710370488534947e-05, "tps": 103440, "wall": 18806.1} {"step": 29683, "train_loss": 3.0864617824554443, "lr": 4.070867113787704e-05, "tps": 103419, "wall": 18810.6} {"step": 29684, "train_loss": 3.157118797302246, "lr": 4.070697381824102e-05, "tps": 103397, "wall": 18815.0} {"step": 29685, "train_loss": 3.1277520656585693, "lr": 4.0705278529646095e-05, "tps": 103377, "wall": 18819.5} {"step": 29686, "train_loss": 3.173372268676758, "lr": 4.070358527211147e-05, "tps": 103355, "wall": 18823.9} {"step": 29687, "train_loss": 3.2008423805236816, "lr": 4.070189404565633e-05, "tps": 103334, "wall": 18828.4} {"step": 29688, "train_loss": 3.182650566101074, "lr": 4.0700204850299856e-05, "tps": 103313, "wall": 18832.9} {"step": 29689, "train_loss": 3.136751174926758, "lr": 4.0698517686061136e-05, "tps": 103293, "wall": 18837.3} {"step": 29690, "train_loss": 3.1618173122406006, "lr": 4.069683255295932e-05, "tps": 103271, "wall": 18841.8} {"step": 29691, "train_loss": 3.0903444290161133, "lr": 4.0695149451013484e-05, "tps": 103250, "wall": 18846.3} {"step": 29692, "train_loss": 3.1462202072143555, "lr": 4.069346838024268e-05, "tps": 103229, "wall": 18850.7} {"step": 29693, "train_loss": 3.1355345249176025, "lr": 4.0691789340665984e-05, "tps": 103209, "wall": 18855.2} {"step": 29694, "train_loss": 3.1800265312194824, "lr": 4.069011233230239e-05, "tps": 103187, "wall": 18859.7} {"step": 29695, "train_loss": 3.2017359733581543, "lr": 4.068843735517092e-05, "tps": 103167, "wall": 18864.1} {"step": 29696, "train_loss": 3.150845766067505, "lr": 4.068676440929051e-05, "tps": 103146, "wall": 18868.6} {"step": 29697, "train_loss": 3.1790363788604736, "lr": 4.068509349468015e-05, "tps": 103125, "wall": 18873.1} {"step": 29698, "train_loss": 3.1376843452453613, "lr": 4.068342461135873e-05, "tps": 103104, "wall": 18877.5} {"step": 29699, "train_loss": 3.231076240539551, "lr": 4.06817577593452e-05, "tps": 103083, "wall": 18882.0} {"step": 29700, "train_loss": 3.1364665031433105, "lr": 4.068009293865841e-05, "tps": 103062, "wall": 18886.4} {"step": 29701, "train_loss": 3.2325005531311035, "lr": 4.067843014931724e-05, "tps": 103041, "wall": 18890.9} {"step": 29702, "train_loss": 3.228328227996826, "lr": 4.0676769391340496e-05, "tps": 103020, "wall": 18895.4} {"step": 29703, "train_loss": 3.1257026195526123, "lr": 4.067511066474702e-05, "tps": 102999, "wall": 18899.9} {"step": 29704, "train_loss": 3.136476516723633, "lr": 4.0673453969555586e-05, "tps": 102978, "wall": 18904.3} {"step": 29705, "train_loss": 3.1501541137695312, "lr": 4.067179930578496e-05, "tps": 102958, "wall": 18908.8} {"step": 29706, "train_loss": 3.2056713104248047, "lr": 4.06701466734539e-05, "tps": 102937, "wall": 18913.2} {"step": 29707, "train_loss": 3.1379451751708984, "lr": 4.0668496072581116e-05, "tps": 102916, "wall": 18917.7} {"step": 29708, "train_loss": 3.1251676082611084, "lr": 4.066684750318533e-05, "tps": 102895, "wall": 18922.1} {"step": 29709, "train_loss": 3.207048177719116, "lr": 4.0665200965285176e-05, "tps": 102875, "wall": 18926.6} {"step": 29710, "train_loss": 3.197767972946167, "lr": 4.066355645889933e-05, "tps": 102854, "wall": 18931.0} {"step": 29711, "train_loss": 3.153418779373169, "lr": 4.066191398404642e-05, "tps": 102833, "wall": 18935.5} {"step": 29712, "train_loss": 3.2207765579223633, "lr": 4.066027354074506e-05, "tps": 102812, "wall": 18939.9} {"step": 29713, "train_loss": 3.109203815460205, "lr": 4.0658635129013824e-05, "tps": 102792, "wall": 18944.4} {"step": 29714, "train_loss": 3.1163034439086914, "lr": 4.065699874887127e-05, "tps": 102771, "wall": 18948.9} {"step": 29715, "train_loss": 3.1840341091156006, "lr": 4.0655364400335925e-05, "tps": 102750, "wall": 18953.3} {"step": 29716, "train_loss": 3.156644105911255, "lr": 4.065373208342633e-05, "tps": 102729, "wall": 18957.8} {"step": 29717, "train_loss": 3.2827529907226562, "lr": 4.065210179816094e-05, "tps": 102708, "wall": 18962.3} {"step": 29718, "train_loss": 3.1273303031921387, "lr": 4.0650473544558254e-05, "tps": 102688, "wall": 18966.8} {"step": 29719, "train_loss": 3.168084144592285, "lr": 4.0648847322636704e-05, "tps": 102667, "wall": 18971.2} {"step": 29720, "train_loss": 3.0771963596343994, "lr": 4.064722313241471e-05, "tps": 102646, "wall": 18975.7} {"step": 29721, "train_loss": 3.13657283782959, "lr": 4.064560097391069e-05, "tps": 102626, "wall": 18980.1} {"step": 29722, "train_loss": 3.218701124191284, "lr": 4.0643980847143005e-05, "tps": 102605, "wall": 18984.6} {"step": 29723, "train_loss": 3.1977076530456543, "lr": 4.0642362752129985e-05, "tps": 102585, "wall": 18989.1} {"step": 29724, "train_loss": 3.0865211486816406, "lr": 4.0640746688889996e-05, "tps": 102564, "wall": 18993.5} {"step": 29725, "train_loss": 3.098997116088867, "lr": 4.063913265744135e-05, "tps": 102543, "wall": 18998.0} {"step": 29726, "train_loss": 3.1730990409851074, "lr": 4.063752065780229e-05, "tps": 102523, "wall": 19002.4} {"step": 29727, "train_loss": 3.191906213760376, "lr": 4.063591068999111e-05, "tps": 102502, "wall": 19006.9} {"step": 29728, "train_loss": 3.1926610469818115, "lr": 4.063430275402603e-05, "tps": 102482, "wall": 19011.3} {"step": 29729, "train_loss": 3.1509461402893066, "lr": 4.063269684992527e-05, "tps": 102461, "wall": 19015.8} {"step": 29730, "train_loss": 3.031120777130127, "lr": 4.0631092977707034e-05, "tps": 102440, "wall": 19020.3} {"step": 29731, "train_loss": 3.189307689666748, "lr": 4.0629491137389466e-05, "tps": 102420, "wall": 19024.7} {"step": 29732, "train_loss": 3.096575975418091, "lr": 4.062789132899073e-05, "tps": 102399, "wall": 19029.2} {"step": 29733, "train_loss": 3.1546356678009033, "lr": 4.062629355252895e-05, "tps": 102379, "wall": 19033.7} {"step": 29734, "train_loss": 3.143315315246582, "lr": 4.062469780802224e-05, "tps": 102358, "wall": 19038.1} {"step": 29735, "train_loss": 3.1560168266296387, "lr": 4.062310409548864e-05, "tps": 102337, "wall": 19042.6} {"step": 29736, "train_loss": 3.104217529296875, "lr": 4.062151241494621e-05, "tps": 102317, "wall": 19047.0} {"step": 29737, "train_loss": 3.1749796867370605, "lr": 4.0619922766413e-05, "tps": 102297, "wall": 19051.5} {"step": 29738, "train_loss": 3.2053937911987305, "lr": 4.0618335149907e-05, "tps": 102276, "wall": 19055.9} {"step": 29739, "train_loss": 3.1453609466552734, "lr": 4.0616749565446216e-05, "tps": 102256, "wall": 19060.4} {"step": 29740, "train_loss": 3.1457369327545166, "lr": 4.061516601304861e-05, "tps": 102235, "wall": 19064.8} {"step": 29741, "train_loss": 3.182119607925415, "lr": 4.061358449273208e-05, "tps": 102215, "wall": 19069.3} {"step": 29742, "train_loss": 3.086026430130005, "lr": 4.061200500451458e-05, "tps": 102194, "wall": 19073.8} {"step": 29743, "train_loss": 3.1835238933563232, "lr": 4.0610427548413996e-05, "tps": 102174, "wall": 19078.2} {"step": 29744, "train_loss": 3.1323161125183105, "lr": 4.0608852124448194e-05, "tps": 102153, "wall": 19082.7} {"step": 29745, "train_loss": 3.1954166889190674, "lr": 4.0607278732635015e-05, "tps": 102132, "wall": 19087.2} {"step": 29746, "train_loss": 3.0624492168426514, "lr": 4.060570737299229e-05, "tps": 102112, "wall": 19091.7} {"step": 29747, "train_loss": 3.172175884246826, "lr": 4.060413804553782e-05, "tps": 102092, "wall": 19096.1} {"step": 29748, "train_loss": 3.129894733428955, "lr": 4.060257075028938e-05, "tps": 102071, "wall": 19100.6} {"step": 29749, "train_loss": 3.1242244243621826, "lr": 4.060100548726471e-05, "tps": 102051, "wall": 19105.1} {"step": 29750, "train_loss": 3.1443982124328613, "lr": 4.059944225648157e-05, "tps": 102030, "wall": 19109.5} {"step": 29751, "train_loss": 3.0621414184570312, "lr": 4.059788105795765e-05, "tps": 102010, "wall": 19114.0} {"step": 29752, "train_loss": 3.2094407081604004, "lr": 4.0596321891710636e-05, "tps": 101990, "wall": 19118.5} {"step": 29753, "train_loss": 3.1805531978607178, "lr": 4.0594764757758197e-05, "tps": 101969, "wall": 19122.9} {"step": 29754, "train_loss": 3.202528238296509, "lr": 4.0593209656117956e-05, "tps": 101949, "wall": 19127.4} {"step": 29755, "train_loss": 3.0902395248413086, "lr": 4.0591656586807566e-05, "tps": 101929, "wall": 19131.8} {"step": 29756, "train_loss": 3.18221116065979, "lr": 4.059010554984458e-05, "tps": 101908, "wall": 19136.3} {"step": 29757, "train_loss": 3.1574056148529053, "lr": 4.0588556545246586e-05, "tps": 101888, "wall": 19140.8} {"step": 29758, "train_loss": 3.1570258140563965, "lr": 4.058700957303112e-05, "tps": 101867, "wall": 19145.3} {"step": 29759, "train_loss": 3.2390084266662598, "lr": 4.0585464633215744e-05, "tps": 101847, "wall": 19149.7} {"step": 29760, "train_loss": 3.2309980392456055, "lr": 4.05839217258179e-05, "tps": 101827, "wall": 19154.2} {"step": 29761, "train_loss": 3.141514301300049, "lr": 4.058238085085511e-05, "tps": 101806, "wall": 19158.7} {"step": 29762, "train_loss": 3.15743088722229, "lr": 4.058084200834482e-05, "tps": 101786, "wall": 19163.2} {"step": 29763, "train_loss": 3.1262731552124023, "lr": 4.057930519830445e-05, "tps": 101766, "wall": 19167.6} {"step": 29764, "train_loss": 3.0432212352752686, "lr": 4.057777042075142e-05, "tps": 101745, "wall": 19172.1} {"step": 29765, "train_loss": 3.070239543914795, "lr": 4.057623767570312e-05, "tps": 101725, "wall": 19176.5} {"step": 29766, "train_loss": 3.232869863510132, "lr": 4.057470696317689e-05, "tps": 101705, "wall": 19181.0} {"step": 29767, "train_loss": 3.2774102687835693, "lr": 4.05731782831901e-05, "tps": 101685, "wall": 19185.5} {"step": 29768, "train_loss": 3.0859975814819336, "lr": 4.0571651635760036e-05, "tps": 101664, "wall": 19189.9} {"step": 29769, "train_loss": 3.1022629737854004, "lr": 4.0570127020904035e-05, "tps": 101644, "wall": 19194.4} {"step": 29770, "train_loss": 3.0109314918518066, "lr": 4.0568604438639326e-05, "tps": 101624, "wall": 19198.9} {"step": 29771, "train_loss": 3.1543362140655518, "lr": 4.056708388898318e-05, "tps": 101603, "wall": 19203.4} {"step": 29772, "train_loss": 3.192348003387451, "lr": 4.056556537195282e-05, "tps": 101583, "wall": 19207.8} {"step": 29773, "train_loss": 3.141923427581787, "lr": 4.056404888756544e-05, "tps": 101563, "wall": 19212.3} {"step": 29774, "train_loss": 3.133676290512085, "lr": 4.05625344358382e-05, "tps": 101543, "wall": 19216.8} {"step": 29775, "train_loss": 3.1745810508728027, "lr": 4.0561022016788295e-05, "tps": 101523, "wall": 19221.2} {"step": 29776, "train_loss": 3.1031367778778076, "lr": 4.0559511630432854e-05, "tps": 101502, "wall": 19225.7} {"step": 29777, "train_loss": 3.1826436519622803, "lr": 4.055800327678894e-05, "tps": 101482, "wall": 19230.2} {"step": 29778, "train_loss": 3.222670078277588, "lr": 4.05564969558737e-05, "tps": 101462, "wall": 19234.6} {"step": 29779, "train_loss": 3.1027023792266846, "lr": 4.055499266770415e-05, "tps": 101442, "wall": 19239.1} {"step": 29780, "train_loss": 3.1726582050323486, "lr": 4.055349041229736e-05, "tps": 101422, "wall": 19243.5} {"step": 29781, "train_loss": 3.1782150268554688, "lr": 4.0551990189670335e-05, "tps": 101402, "wall": 19248.0} {"step": 29782, "train_loss": 3.1706840991973877, "lr": 4.0550491999840076e-05, "tps": 101382, "wall": 19252.5} {"step": 29783, "train_loss": 3.176311492919922, "lr": 4.054899584282356e-05, "tps": 101362, "wall": 19256.9} {"step": 29784, "train_loss": 3.0528271198272705, "lr": 4.054750171863773e-05, "tps": 101341, "wall": 19261.5} {"step": 29785, "train_loss": 3.0834157466888428, "lr": 4.054600962729948e-05, "tps": 101321, "wall": 19265.9} {"step": 29786, "train_loss": 3.1692652702331543, "lr": 4.054451956882577e-05, "tps": 101301, "wall": 19270.4} {"step": 29787, "train_loss": 3.265387535095215, "lr": 4.0543031543233453e-05, "tps": 101281, "wall": 19274.9} {"step": 29788, "train_loss": 3.146414279937744, "lr": 4.054154555053936e-05, "tps": 101261, "wall": 19279.4} {"step": 29789, "train_loss": 3.138601541519165, "lr": 4.054006159076036e-05, "tps": 101241, "wall": 19283.8} {"step": 29790, "train_loss": 3.0950965881347656, "lr": 4.053857966391324e-05, "tps": 101221, "wall": 19288.3} {"step": 29791, "train_loss": 3.206717014312744, "lr": 4.0537099770014815e-05, "tps": 101200, "wall": 19292.8} {"step": 29792, "train_loss": 3.211055040359497, "lr": 4.053562190908182e-05, "tps": 101180, "wall": 19297.3} {"step": 29793, "train_loss": 3.072338342666626, "lr": 4.053414608113102e-05, "tps": 101160, "wall": 19301.7} {"step": 29794, "train_loss": 3.1453495025634766, "lr": 4.0532672286179116e-05, "tps": 101140, "wall": 19306.2} {"step": 29795, "train_loss": 3.2127935886383057, "lr": 4.0531200524242795e-05, "tps": 101120, "wall": 19310.7} {"step": 29796, "train_loss": 3.2533388137817383, "lr": 4.052973079533878e-05, "tps": 101100, "wall": 19315.1} {"step": 29797, "train_loss": 3.1585636138916016, "lr": 4.052826309948364e-05, "tps": 101080, "wall": 19319.7} {"step": 29798, "train_loss": 3.1347579956054688, "lr": 4.052679743669407e-05, "tps": 101060, "wall": 19324.1} {"step": 29799, "train_loss": 3.1707725524902344, "lr": 4.052533380698664e-05, "tps": 101040, "wall": 19328.6} {"step": 29800, "train_loss": 3.114806652069092, "lr": 4.0523872210377956e-05, "tps": 101020, "wall": 19333.0} {"step": 29801, "train_loss": 3.180454730987549, "lr": 4.052241264688455e-05, "tps": 101000, "wall": 19337.5} {"step": 29802, "train_loss": 3.2090463638305664, "lr": 4.0520955116522945e-05, "tps": 100980, "wall": 19342.0} {"step": 29803, "train_loss": 3.224820613861084, "lr": 4.051949961930969e-05, "tps": 100960, "wall": 19346.5} {"step": 29804, "train_loss": 3.1049678325653076, "lr": 4.0518046155261234e-05, "tps": 100941, "wall": 19350.9} {"step": 29805, "train_loss": 3.1457109451293945, "lr": 4.051659472439408e-05, "tps": 100921, "wall": 19355.4} {"step": 29806, "train_loss": 3.184884786605835, "lr": 4.0515145326724634e-05, "tps": 100901, "wall": 19359.8} {"step": 29807, "train_loss": 3.1451125144958496, "lr": 4.051369796226935e-05, "tps": 100881, "wall": 19364.3} {"step": 29808, "train_loss": 3.207909107208252, "lr": 4.0512252631044584e-05, "tps": 100861, "wall": 19368.8} {"step": 29809, "train_loss": 3.230027675628662, "lr": 4.0510809333066755e-05, "tps": 100841, "wall": 19373.2} {"step": 29810, "train_loss": 3.105756998062134, "lr": 4.050936806835218e-05, "tps": 100821, "wall": 19377.7} {"step": 29811, "train_loss": 3.211240530014038, "lr": 4.050792883691719e-05, "tps": 100801, "wall": 19382.2} {"step": 29812, "train_loss": 3.1627771854400635, "lr": 4.050649163877809e-05, "tps": 100782, "wall": 19386.6} {"step": 29813, "train_loss": 3.1720752716064453, "lr": 4.050505647395115e-05, "tps": 100762, "wall": 19391.1} {"step": 29814, "train_loss": 3.2222728729248047, "lr": 4.0503623342452655e-05, "tps": 100742, "wall": 19395.6} {"step": 29815, "train_loss": 3.182753562927246, "lr": 4.0502192244298835e-05, "tps": 100722, "wall": 19400.0} {"step": 29816, "train_loss": 3.1128735542297363, "lr": 4.0500763179505874e-05, "tps": 100702, "wall": 19404.5} {"step": 29817, "train_loss": 3.2421183586120605, "lr": 4.049933614809e-05, "tps": 100683, "wall": 19409.0} {"step": 29818, "train_loss": 3.1881701946258545, "lr": 4.049791115006734e-05, "tps": 100663, "wall": 19413.4} {"step": 29819, "train_loss": 3.1252095699310303, "lr": 4.049648818545406e-05, "tps": 100643, "wall": 19417.9} {"step": 29820, "train_loss": 3.175877571105957, "lr": 4.049506725426627e-05, "tps": 100623, "wall": 19422.4} {"step": 29821, "train_loss": 3.2029194831848145, "lr": 4.049364835652007e-05, "tps": 100603, "wall": 19426.9} {"step": 29822, "train_loss": 3.1834375858306885, "lr": 4.049223149223154e-05, "tps": 100584, "wall": 19431.3} {"step": 29823, "train_loss": 3.2240750789642334, "lr": 4.049081666141671e-05, "tps": 100564, "wall": 19435.8} {"step": 29824, "train_loss": 3.1828479766845703, "lr": 4.0489403864091615e-05, "tps": 100544, "wall": 19440.3} {"step": 29825, "train_loss": 3.1168196201324463, "lr": 4.048799310027228e-05, "tps": 100524, "wall": 19444.8} {"step": 29826, "train_loss": 3.0741732120513916, "lr": 4.048658436997466e-05, "tps": 100504, "wall": 19449.2} {"step": 29827, "train_loss": 3.2068543434143066, "lr": 4.0485177673214726e-05, "tps": 100485, "wall": 19453.7} {"step": 29828, "train_loss": 3.1977291107177734, "lr": 4.048377301000841e-05, "tps": 100465, "wall": 19458.2} {"step": 29829, "train_loss": 3.1548972129821777, "lr": 4.048237038037164e-05, "tps": 100445, "wall": 19462.6} {"step": 29830, "train_loss": 3.0489206314086914, "lr": 4.048096978432028e-05, "tps": 100426, "wall": 19467.1} {"step": 29831, "train_loss": 3.125155210494995, "lr": 4.047957122187021e-05, "tps": 100406, "wall": 19471.6} {"step": 29832, "train_loss": 3.224424362182617, "lr": 4.047817469303725e-05, "tps": 100386, "wall": 19476.0} {"step": 29833, "train_loss": 3.1485884189605713, "lr": 4.047678019783726e-05, "tps": 100367, "wall": 19480.5} {"step": 29834, "train_loss": 3.209378480911255, "lr": 4.0475387736286e-05, "tps": 100347, "wall": 19485.0} {"step": 29835, "train_loss": 3.274481773376465, "lr": 4.047399730839927e-05, "tps": 100327, "wall": 19489.4} {"step": 29836, "train_loss": 3.1913676261901855, "lr": 4.0472608914192805e-05, "tps": 100308, "wall": 19493.9} {"step": 29837, "train_loss": 3.0815200805664062, "lr": 4.047122255368235e-05, "tps": 100288, "wall": 19498.4} {"step": 29838, "train_loss": 3.158313512802124, "lr": 4.04698382268836e-05, "tps": 100268, "wall": 19502.9} {"step": 29839, "train_loss": 3.1673049926757812, "lr": 4.0468455933812216e-05, "tps": 100249, "wall": 19507.3} {"step": 29840, "train_loss": 3.136996030807495, "lr": 4.046707567448388e-05, "tps": 100229, "wall": 19511.8} {"step": 29841, "train_loss": 3.0857701301574707, "lr": 4.0465697448914234e-05, "tps": 100209, "wall": 19516.4} {"step": 29842, "train_loss": 3.1112804412841797, "lr": 4.046432125711887e-05, "tps": 100189, "wall": 19521.0} {"step": 29843, "train_loss": 3.1251673698425293, "lr": 4.046294709911341e-05, "tps": 100168, "wall": 19525.6} {"step": 29844, "train_loss": 3.0703957080841064, "lr": 4.046157497491337e-05, "tps": 100148, "wall": 19530.3} {"step": 29845, "train_loss": 3.1807329654693604, "lr": 4.0460204884534335e-05, "tps": 100127, "wall": 19534.9} {"step": 29846, "train_loss": 3.1570863723754883, "lr": 4.045883682799181e-05, "tps": 100106, "wall": 19539.7} {"step": 29847, "train_loss": 3.0595955848693848, "lr": 4.045747080530131e-05, "tps": 100086, "wall": 19544.4} {"step": 29848, "train_loss": 3.008924961090088, "lr": 4.045610681647826e-05, "tps": 100065, "wall": 19549.1} {"step": 29849, "train_loss": 3.057888984680176, "lr": 4.045474486153817e-05, "tps": 100044, "wall": 19553.8} {"step": 29850, "train_loss": 3.14302396774292, "lr": 4.045338494049643e-05, "tps": 100023, "wall": 19558.6} {"step": 29851, "train_loss": 3.1983349323272705, "lr": 4.0452027053368475e-05, "tps": 100002, "wall": 19563.3} {"step": 29852, "train_loss": 3.1327342987060547, "lr": 4.045067120016966e-05, "tps": 99981, "wall": 19568.1} {"step": 29853, "train_loss": 3.0808987617492676, "lr": 4.044931738091534e-05, "tps": 99960, "wall": 19572.8} {"step": 29854, "train_loss": 3.20021390914917, "lr": 4.04479655956209e-05, "tps": 99939, "wall": 19577.6} {"step": 29855, "train_loss": 3.1915690898895264, "lr": 4.0446615844301586e-05, "tps": 99918, "wall": 19582.4} {"step": 29856, "train_loss": 3.197523593902588, "lr": 4.044526812697275e-05, "tps": 99897, "wall": 19587.2} {"step": 29857, "train_loss": 3.059441089630127, "lr": 4.0443922443649614e-05, "tps": 99876, "wall": 19591.9} {"step": 29858, "train_loss": 3.1152191162109375, "lr": 4.044257879434743e-05, "tps": 99855, "wall": 19596.7} {"step": 29859, "train_loss": 3.122659206390381, "lr": 4.044123717908145e-05, "tps": 99834, "wall": 19601.4} {"step": 29860, "train_loss": 3.1892309188842773, "lr": 4.043989759786684e-05, "tps": 99813, "wall": 19606.2} {"step": 29861, "train_loss": 3.2194554805755615, "lr": 4.0438560050718774e-05, "tps": 99792, "wall": 19611.0} {"step": 29862, "train_loss": 3.1881039142608643, "lr": 4.043722453765242e-05, "tps": 99771, "wall": 19615.8} {"step": 29863, "train_loss": 3.171705722808838, "lr": 4.0435891058682896e-05, "tps": 99750, "wall": 19620.6} {"step": 29864, "train_loss": 3.234558582305908, "lr": 4.043455961382533e-05, "tps": 99729, "wall": 19625.4} {"step": 29865, "train_loss": 3.1046504974365234, "lr": 4.043323020309477e-05, "tps": 99708, "wall": 19630.1} {"step": 29866, "train_loss": 3.0489375591278076, "lr": 4.043190282650631e-05, "tps": 99688, "wall": 19634.9} {"step": 29867, "train_loss": 3.109013080596924, "lr": 4.043057748407494e-05, "tps": 99666, "wall": 19639.7} {"step": 29868, "train_loss": 3.1183602809906006, "lr": 4.042925417581573e-05, "tps": 99646, "wall": 19644.5} {"step": 29869, "train_loss": 3.1436514854431152, "lr": 4.042793290174364e-05, "tps": 99625, "wall": 19649.3} {"step": 29870, "train_loss": 3.1206214427948, "lr": 4.042661366187364e-05, "tps": 99604, "wall": 19654.0} {"step": 29871, "train_loss": 3.1543920040130615, "lr": 4.042529645622066e-05, "tps": 99583, "wall": 19658.8} {"step": 29872, "train_loss": 3.1427202224731445, "lr": 4.0423981284799635e-05, "tps": 99562, "wall": 19663.6} {"step": 29873, "train_loss": 3.197822093963623, "lr": 4.042266814762548e-05, "tps": 99541, "wall": 19668.3} {"step": 29874, "train_loss": 3.083683967590332, "lr": 4.042135704471306e-05, "tps": 99520, "wall": 19673.1} {"step": 29875, "train_loss": 3.0336244106292725, "lr": 4.042004797607721e-05, "tps": 99500, "wall": 19677.9} {"step": 29876, "train_loss": 3.1298258304595947, "lr": 4.041874094173277e-05, "tps": 99478, "wall": 19682.7} {"step": 29877, "train_loss": 2.948481559753418, "lr": 4.041743594169456e-05, "tps": 99458, "wall": 19687.5} {"step": 29878, "train_loss": 3.1413443088531494, "lr": 4.041613297597734e-05, "tps": 99437, "wall": 19692.3} {"step": 29879, "train_loss": 3.159501552581787, "lr": 4.041483204459588e-05, "tps": 99416, "wall": 19697.1} {"step": 29880, "train_loss": 3.089114189147949, "lr": 4.041353314756493e-05, "tps": 99395, "wall": 19701.8} {"step": 29881, "train_loss": 3.252821207046509, "lr": 4.041223628489919e-05, "tps": 99375, "wall": 19706.6} {"step": 29882, "train_loss": 3.240121364593506, "lr": 4.041094145661334e-05, "tps": 99354, "wall": 19711.4} {"step": 29883, "train_loss": 3.1422715187072754, "lr": 4.040964866272208e-05, "tps": 99333, "wall": 19716.2} {"step": 29884, "train_loss": 3.2459635734558105, "lr": 4.040835790324002e-05, "tps": 99312, "wall": 19720.9} {"step": 29885, "train_loss": 3.052264928817749, "lr": 4.040706917818179e-05, "tps": 99292, "wall": 19725.7} {"step": 29886, "train_loss": 3.09771728515625, "lr": 4.040578248756203e-05, "tps": 99271, "wall": 19730.5} {"step": 29887, "train_loss": 3.088348388671875, "lr": 4.0404497831395236e-05, "tps": 99250, "wall": 19735.3} {"step": 29888, "train_loss": 3.1976237297058105, "lr": 4.040321520969603e-05, "tps": 99229, "wall": 19740.2} {"step": 29889, "train_loss": 3.0864949226379395, "lr": 4.040193462247892e-05, "tps": 99208, "wall": 19744.9} {"step": 29890, "train_loss": 3.2427754402160645, "lr": 4.040065606975841e-05, "tps": 99188, "wall": 19749.7} {"step": 29891, "train_loss": 3.1190428733825684, "lr": 4.039937955154899e-05, "tps": 99167, "wall": 19754.5} {"step": 29892, "train_loss": 3.1550087928771973, "lr": 4.03981050678651e-05, "tps": 99146, "wall": 19759.3} {"step": 29893, "train_loss": 3.0345282554626465, "lr": 4.039683261872121e-05, "tps": 99125, "wall": 19764.1} {"step": 29894, "train_loss": 3.133878231048584, "lr": 4.03955622041317e-05, "tps": 99105, "wall": 19768.9} {"step": 29895, "train_loss": 3.2374181747436523, "lr": 4.039429382411099e-05, "tps": 99084, "wall": 19773.7} {"step": 29896, "train_loss": 3.1029207706451416, "lr": 4.039302747867344e-05, "tps": 99063, "wall": 19778.4} {"step": 29897, "train_loss": 3.125297784805298, "lr": 4.039176316783337e-05, "tps": 99043, "wall": 19783.2} {"step": 29898, "train_loss": 3.2372636795043945, "lr": 4.0390500891605134e-05, "tps": 99022, "wall": 19788.0} {"step": 29899, "train_loss": 3.166245937347412, "lr": 4.038924065000302e-05, "tps": 99001, "wall": 19792.8} {"step": 29900, "train_loss": 3.1245508193969727, "lr": 4.038798244304132e-05, "tps": 98981, "wall": 19797.6} {"step": 29901, "train_loss": 3.1739025115966797, "lr": 4.038672627073425e-05, "tps": 98960, "wall": 19802.5} {"step": 29902, "train_loss": 3.113860607147217, "lr": 4.038547213309607e-05, "tps": 98939, "wall": 19807.3} {"step": 29903, "train_loss": 3.16324782371521, "lr": 4.038422003014097e-05, "tps": 98918, "wall": 19812.1} {"step": 29904, "train_loss": 3.1260080337524414, "lr": 4.038296996188316e-05, "tps": 98898, "wall": 19816.9} {"step": 29905, "train_loss": 3.1896133422851562, "lr": 4.038172192833677e-05, "tps": 98877, "wall": 19821.7} {"step": 29906, "train_loss": 3.0298688411712646, "lr": 4.0380475929515954e-05, "tps": 98856, "wall": 19826.5} {"step": 29907, "train_loss": 3.1400742530822754, "lr": 4.037923196543483e-05, "tps": 98836, "wall": 19831.3} {"step": 29908, "train_loss": 3.2261533737182617, "lr": 4.0377990036107474e-05, "tps": 98815, "wall": 19836.1} {"step": 29909, "train_loss": 3.1353654861450195, "lr": 4.0376750141547966e-05, "tps": 98794, "wall": 19840.9} {"step": 29910, "train_loss": 3.0998263359069824, "lr": 4.037551228177037e-05, "tps": 98774, "wall": 19845.7} {"step": 29911, "train_loss": 3.2226181030273438, "lr": 4.037427645678866e-05, "tps": 98753, "wall": 19850.5} {"step": 29912, "train_loss": 3.247657299041748, "lr": 4.037304266661689e-05, "tps": 98733, "wall": 19855.3} {"step": 29913, "train_loss": 3.221921682357788, "lr": 4.037181091126899e-05, "tps": 98712, "wall": 19860.2} {"step": 29914, "train_loss": 3.2206032276153564, "lr": 4.0370581190758925e-05, "tps": 98691, "wall": 19865.0} {"step": 29915, "train_loss": 3.2670023441314697, "lr": 4.036935350510065e-05, "tps": 98670, "wall": 19869.9} {"step": 29916, "train_loss": 3.1755123138427734, "lr": 4.036812785430806e-05, "tps": 98650, "wall": 19874.7} {"step": 29917, "train_loss": 3.2599387168884277, "lr": 4.036690423839502e-05, "tps": 98629, "wall": 19879.5} {"step": 29918, "train_loss": 3.1242926120758057, "lr": 4.036568265737542e-05, "tps": 98608, "wall": 19884.3} {"step": 29919, "train_loss": 3.2351651191711426, "lr": 4.036446311126309e-05, "tps": 98588, "wall": 19889.1} {"step": 29920, "train_loss": 3.155693531036377, "lr": 4.036324560007184e-05, "tps": 98567, "wall": 19893.9} {"step": 29921, "train_loss": 3.099489212036133, "lr": 4.036203012381546e-05, "tps": 98547, "wall": 19898.8} {"step": 29922, "train_loss": 3.2890260219573975, "lr": 4.0360816682507706e-05, "tps": 98526, "wall": 19903.6} {"step": 29923, "train_loss": 3.1077752113342285, "lr": 4.0359605276162346e-05, "tps": 98506, "wall": 19908.4} {"step": 29924, "train_loss": 3.1510446071624756, "lr": 4.03583959047931e-05, "tps": 98485, "wall": 19913.2} {"step": 29925, "train_loss": 3.147714138031006, "lr": 4.0357188568413664e-05, "tps": 98465, "wall": 19918.0} {"step": 29926, "train_loss": 3.1680097579956055, "lr": 4.03559832670377e-05, "tps": 98444, "wall": 19922.9} {"step": 29927, "train_loss": 3.053633689880371, "lr": 4.0354780000678894e-05, "tps": 98423, "wall": 19927.8} {"step": 29928, "train_loss": 3.2182464599609375, "lr": 4.0353578769350864e-05, "tps": 98402, "wall": 19932.6} {"step": 29929, "train_loss": 3.162959098815918, "lr": 4.035237957306719e-05, "tps": 98382, "wall": 19937.5} {"step": 29930, "train_loss": 3.0743048191070557, "lr": 4.03511824118415e-05, "tps": 98361, "wall": 19942.3} {"step": 29931, "train_loss": 3.16867733001709, "lr": 4.0349987285687316e-05, "tps": 98341, "wall": 19947.2} {"step": 29932, "train_loss": 3.1296119689941406, "lr": 4.034879419461822e-05, "tps": 98320, "wall": 19952.0} {"step": 29933, "train_loss": 3.138324022293091, "lr": 4.034760313864767e-05, "tps": 98299, "wall": 19956.8} {"step": 29934, "train_loss": 3.1738667488098145, "lr": 4.034641411778921e-05, "tps": 98279, "wall": 19961.7} {"step": 29935, "train_loss": 3.122373580932617, "lr": 4.034522713205629e-05, "tps": 98258, "wall": 19966.5} {"step": 29936, "train_loss": 3.170243263244629, "lr": 4.034404218146234e-05, "tps": 98238, "wall": 19971.3} {"step": 29937, "train_loss": 3.1702282428741455, "lr": 4.034285926602082e-05, "tps": 98217, "wall": 19976.2} {"step": 29938, "train_loss": 3.1951818466186523, "lr": 4.03416783857451e-05, "tps": 98197, "wall": 19981.0} {"step": 29939, "train_loss": 3.1622886657714844, "lr": 4.034049954064858e-05, "tps": 98176, "wall": 19985.9} {"step": 29940, "train_loss": 2.9942445755004883, "lr": 4.0339322730744575e-05, "tps": 98156, "wall": 19990.7} {"step": 29941, "train_loss": 3.1842989921569824, "lr": 4.0338147956046455e-05, "tps": 98135, "wall": 19995.5} {"step": 29942, "train_loss": 3.1065480709075928, "lr": 4.033697521656753e-05, "tps": 98115, "wall": 20000.4} {"step": 29943, "train_loss": 3.1652674674987793, "lr": 4.033580451232104e-05, "tps": 98094, "wall": 20005.2} {"step": 29944, "train_loss": 3.225034236907959, "lr": 4.033463584332029e-05, "tps": 98074, "wall": 20010.1} {"step": 29945, "train_loss": 3.160264015197754, "lr": 4.0333469209578514e-05, "tps": 98053, "wall": 20014.9} {"step": 29946, "train_loss": 3.2002346515655518, "lr": 4.033230461110892e-05, "tps": 98033, "wall": 20019.7} {"step": 29947, "train_loss": 3.204547882080078, "lr": 4.0331142047924676e-05, "tps": 98013, "wall": 20024.6} {"step": 29948, "train_loss": 3.1081790924072266, "lr": 4.0329981520038985e-05, "tps": 97992, "wall": 20029.4} {"step": 29949, "train_loss": 3.19335675239563, "lr": 4.0328823027465e-05, "tps": 97972, "wall": 20034.2} {"step": 29950, "train_loss": 3.1094236373901367, "lr": 4.032766657021581e-05, "tps": 97952, "wall": 20039.1} {"step": 29951, "train_loss": 3.16453218460083, "lr": 4.032651214830453e-05, "tps": 97931, "wall": 20044.0} {"step": 29952, "train_loss": 3.1391444206237793, "lr": 4.032535976174425e-05, "tps": 97911, "wall": 20048.8} {"step": 29953, "train_loss": 3.276918411254883, "lr": 4.032420941054801e-05, "tps": 97890, "wall": 20053.6} {"step": 29954, "train_loss": 3.10880446434021, "lr": 4.032306109472886e-05, "tps": 97870, "wall": 20058.5} {"step": 29955, "train_loss": 3.132338285446167, "lr": 4.032191481429978e-05, "tps": 97850, "wall": 20063.3} {"step": 29956, "train_loss": 3.044968605041504, "lr": 4.032077056927377e-05, "tps": 97829, "wall": 20068.2} {"step": 29957, "train_loss": 3.094125747680664, "lr": 4.03196283596638e-05, "tps": 97809, "wall": 20073.0} {"step": 29958, "train_loss": 3.1403391361236572, "lr": 4.031848818548279e-05, "tps": 97789, "wall": 20077.8} {"step": 29959, "train_loss": 3.140817165374756, "lr": 4.0317350046743674e-05, "tps": 97768, "wall": 20082.7} {"step": 29960, "train_loss": 3.1395483016967773, "lr": 4.031621394345932e-05, "tps": 97748, "wall": 20087.5} {"step": 29961, "train_loss": 3.1115710735321045, "lr": 4.031507987564263e-05, "tps": 97728, "wall": 20092.4} {"step": 29962, "train_loss": 3.116896152496338, "lr": 4.031394784330644e-05, "tps": 97707, "wall": 20097.2} {"step": 29963, "train_loss": 3.1378211975097656, "lr": 4.031281784646356e-05, "tps": 97687, "wall": 20102.1} {"step": 29964, "train_loss": 3.117184638977051, "lr": 4.031168988512681e-05, "tps": 97666, "wall": 20107.0} {"step": 29965, "train_loss": 3.168992757797241, "lr": 4.031056395930895e-05, "tps": 97646, "wall": 20111.8} {"step": 29966, "train_loss": 3.1109793186187744, "lr": 4.030944006902275e-05, "tps": 97626, "wall": 20116.7} {"step": 29967, "train_loss": 3.190589427947998, "lr": 4.030831821428093e-05, "tps": 97606, "wall": 20121.5} {"step": 29968, "train_loss": 3.186959743499756, "lr": 4.030719839509621e-05, "tps": 97586, "wall": 20126.3} {"step": 29969, "train_loss": 3.233067512512207, "lr": 4.030608061148124e-05, "tps": 97566, "wall": 20131.1} {"step": 29970, "train_loss": 3.1154298782348633, "lr": 4.030496486344873e-05, "tps": 97545, "wall": 20136.0} {"step": 29971, "train_loss": 3.0510144233703613, "lr": 4.03038511510113e-05, "tps": 97525, "wall": 20140.8} {"step": 29972, "train_loss": 3.272135019302368, "lr": 4.030273947418157e-05, "tps": 97505, "wall": 20145.6} {"step": 29973, "train_loss": 3.245063304901123, "lr": 4.030162983297213e-05, "tps": 97485, "wall": 20150.5} {"step": 29974, "train_loss": 3.062954902648926, "lr": 4.030052222739554e-05, "tps": 97465, "wall": 20155.3} {"step": 29975, "train_loss": 3.1246869564056396, "lr": 4.029941665746436e-05, "tps": 97444, "wall": 20160.2} {"step": 29976, "train_loss": 3.1928629875183105, "lr": 4.029831312319111e-05, "tps": 97424, "wall": 20165.0} {"step": 29977, "train_loss": 3.10452938079834, "lr": 4.029721162458828e-05, "tps": 97404, "wall": 20169.9} {"step": 29978, "train_loss": 3.0867698192596436, "lr": 4.0296112161668376e-05, "tps": 97384, "wall": 20174.7} {"step": 29979, "train_loss": 3.083102226257324, "lr": 4.029501473444383e-05, "tps": 97364, "wall": 20179.5} {"step": 29980, "train_loss": 3.0596654415130615, "lr": 4.029391934292707e-05, "tps": 97344, "wall": 20184.4} {"step": 29981, "train_loss": 3.105563163757324, "lr": 4.029282598713051e-05, "tps": 97324, "wall": 20189.2} {"step": 29982, "train_loss": 3.1825647354125977, "lr": 4.029173466706655e-05, "tps": 97303, "wall": 20194.1} {"step": 29983, "train_loss": 3.088874101638794, "lr": 4.029064538274755e-05, "tps": 97283, "wall": 20198.9} {"step": 29984, "train_loss": 3.188823699951172, "lr": 4.028955813418583e-05, "tps": 97263, "wall": 20203.8} {"step": 29985, "train_loss": 3.100918769836426, "lr": 4.0288472921393715e-05, "tps": 97243, "wall": 20208.6} {"step": 29986, "train_loss": 3.1936280727386475, "lr": 4.028738974438349e-05, "tps": 97223, "wall": 20213.4} {"step": 29987, "train_loss": 3.2299675941467285, "lr": 4.028630860316746e-05, "tps": 97203, "wall": 20218.3} {"step": 29988, "train_loss": 3.184000015258789, "lr": 4.0285229497757845e-05, "tps": 97183, "wall": 20223.2} {"step": 29989, "train_loss": 3.2397069931030273, "lr": 4.028415242816685e-05, "tps": 97163, "wall": 20228.0} {"step": 29990, "train_loss": 3.164158344268799, "lr": 4.028307739440672e-05, "tps": 97143, "wall": 20232.8} {"step": 29991, "train_loss": 2.991229295730591, "lr": 4.028200439648963e-05, "tps": 97123, "wall": 20237.7} {"step": 29992, "train_loss": 3.152291774749756, "lr": 4.028093343442767e-05, "tps": 97103, "wall": 20242.5} {"step": 29993, "train_loss": 3.0916950702667236, "lr": 4.027986450823306e-05, "tps": 97083, "wall": 20247.3} {"step": 29994, "train_loss": 3.220592737197876, "lr": 4.027879761791784e-05, "tps": 97063, "wall": 20252.1} {"step": 29995, "train_loss": 3.1237692832946777, "lr": 4.027773276349414e-05, "tps": 97043, "wall": 20257.0} {"step": 29996, "train_loss": 3.0802667140960693, "lr": 4.0276669944974014e-05, "tps": 97024, "wall": 20261.8} {"step": 29997, "train_loss": 3.0957629680633545, "lr": 4.0275609162369476e-05, "tps": 97004, "wall": 20266.6} {"step": 29998, "train_loss": 3.2587649822235107, "lr": 4.0274550415692544e-05, "tps": 96984, "wall": 20271.5} {"step": 29999, "train_loss": 3.096442699432373, "lr": 4.027349370495525e-05, "tps": 96964, "wall": 20276.3} {"step": 30000, "train_loss": 3.172236442565918, "lr": 4.027243903016954e-05, "tps": 96944, "wall": 20281.2, "val_loss_monitor": 3.30842036088145, "val_loss_full": 3.3264877908496473} {"step": 30001, "train_loss": 3.2333364486694336, "lr": 4.027138639134738e-05, "tps": 96369, "wall": 20402.8} {"step": 30002, "train_loss": 3.157244920730591, "lr": 4.0270335788500655e-05, "tps": 96348, "wall": 20407.9} {"step": 30003, "train_loss": 3.233698844909668, "lr": 4.02692872216413e-05, "tps": 96328, "wall": 20412.9} {"step": 30004, "train_loss": 3.1866841316223145, "lr": 4.026824069078117e-05, "tps": 96308, "wall": 20417.9} {"step": 30005, "train_loss": 3.2639851570129395, "lr": 4.026719619593215e-05, "tps": 96288, "wall": 20422.8} {"step": 30006, "train_loss": 3.1255369186401367, "lr": 4.026615373710603e-05, "tps": 96268, "wall": 20427.7} {"step": 30007, "train_loss": 3.161530017852783, "lr": 4.026511331431467e-05, "tps": 96248, "wall": 20432.6} {"step": 30008, "train_loss": 3.122870445251465, "lr": 4.0264074927569824e-05, "tps": 96228, "wall": 20437.5} {"step": 30009, "train_loss": 3.0903854370117188, "lr": 4.0263038576883255e-05, "tps": 96208, "wall": 20442.3} {"step": 30010, "train_loss": 3.1705410480499268, "lr": 4.026200426226672e-05, "tps": 96189, "wall": 20447.2} {"step": 30011, "train_loss": 3.2084195613861084, "lr": 4.026097198373191e-05, "tps": 96169, "wall": 20452.0} {"step": 30012, "train_loss": 3.2063488960266113, "lr": 4.025994174129053e-05, "tps": 96150, "wall": 20456.9} {"step": 30013, "train_loss": 3.1183507442474365, "lr": 4.025891353495426e-05, "tps": 96130, "wall": 20461.8} {"step": 30014, "train_loss": 3.189260482788086, "lr": 4.0257887364734756e-05, "tps": 96110, "wall": 20466.7} {"step": 30015, "train_loss": 3.2282485961914062, "lr": 4.025686323064361e-05, "tps": 96091, "wall": 20471.5} {"step": 30016, "train_loss": 3.167595863342285, "lr": 4.025584113269245e-05, "tps": 96071, "wall": 20476.4} {"step": 30017, "train_loss": 3.138914108276367, "lr": 4.0254821070892846e-05, "tps": 96051, "wall": 20481.2} {"step": 30018, "train_loss": 3.2172064781188965, "lr": 4.025380304525633e-05, "tps": 96032, "wall": 20486.1} {"step": 30019, "train_loss": 3.1426150798797607, "lr": 4.0252787055794494e-05, "tps": 96012, "wall": 20490.9} {"step": 30020, "train_loss": 3.0680668354034424, "lr": 4.025177310251879e-05, "tps": 95993, "wall": 20495.7} {"step": 30021, "train_loss": 3.216207265853882, "lr": 4.0250761185440724e-05, "tps": 95974, "wall": 20500.5} {"step": 30022, "train_loss": 3.1736104488372803, "lr": 4.024975130457177e-05, "tps": 95954, "wall": 20505.4} {"step": 30023, "train_loss": 3.16715669631958, "lr": 4.024874345992333e-05, "tps": 95935, "wall": 20510.2} {"step": 30024, "train_loss": 3.1799063682556152, "lr": 4.0247737651506876e-05, "tps": 95915, "wall": 20515.1} {"step": 30025, "train_loss": 3.1803112030029297, "lr": 4.024673387933378e-05, "tps": 95896, "wall": 20520.0} {"step": 30026, "train_loss": 3.1443238258361816, "lr": 4.0245732143415384e-05, "tps": 95876, "wall": 20524.8} {"step": 30027, "train_loss": 3.1476070880889893, "lr": 4.024473244376307e-05, "tps": 95857, "wall": 20529.6} {"step": 30028, "train_loss": 3.233081102371216, "lr": 4.024373478038815e-05, "tps": 95838, "wall": 20534.4} {"step": 30029, "train_loss": 3.2282614707946777, "lr": 4.024273915330193e-05, "tps": 95818, "wall": 20539.3} {"step": 30030, "train_loss": 3.1049461364746094, "lr": 4.0241745562515686e-05, "tps": 95799, "wall": 20544.1} {"step": 30031, "train_loss": 3.167527914047241, "lr": 4.024075400804066e-05, "tps": 95780, "wall": 20548.9} {"step": 30032, "train_loss": 3.2347116470336914, "lr": 4.023976448988811e-05, "tps": 95760, "wall": 20553.7} {"step": 30033, "train_loss": 3.1318302154541016, "lr": 4.023877700806923e-05, "tps": 95741, "wall": 20558.6} {"step": 30034, "train_loss": 3.141465187072754, "lr": 4.023779156259521e-05, "tps": 95722, "wall": 20563.4} {"step": 30035, "train_loss": 3.2148940563201904, "lr": 4.023680815347721e-05, "tps": 95702, "wall": 20568.2} {"step": 30036, "train_loss": 3.0836830139160156, "lr": 4.0235826780726364e-05, "tps": 95683, "wall": 20573.0} {"step": 30037, "train_loss": 3.1236062049865723, "lr": 4.023484744435383e-05, "tps": 95664, "wall": 20577.9} {"step": 30038, "train_loss": 3.1451051235198975, "lr": 4.0233870144370626e-05, "tps": 95644, "wall": 20582.8} {"step": 30039, "train_loss": 3.2045960426330566, "lr": 4.02328948807879e-05, "tps": 95625, "wall": 20587.6} {"step": 30040, "train_loss": 3.1850779056549072, "lr": 4.023192165361665e-05, "tps": 95606, "wall": 20592.4} {"step": 30041, "train_loss": 3.1480953693389893, "lr": 4.023095046286792e-05, "tps": 95587, "wall": 20597.3} {"step": 30042, "train_loss": 3.16017746925354, "lr": 4.02299813085527e-05, "tps": 95567, "wall": 20602.1} {"step": 30043, "train_loss": 3.089297294616699, "lr": 4.0229014190682e-05, "tps": 95548, "wall": 20606.9} {"step": 30044, "train_loss": 3.163455009460449, "lr": 4.022804910926673e-05, "tps": 95529, "wall": 20611.8} {"step": 30045, "train_loss": 3.1403777599334717, "lr": 4.022708606431784e-05, "tps": 95510, "wall": 20616.6} {"step": 30046, "train_loss": 3.1125919818878174, "lr": 4.0226125055846264e-05, "tps": 95490, "wall": 20621.4} {"step": 30047, "train_loss": 3.142457962036133, "lr": 4.0225166083862865e-05, "tps": 95471, "wall": 20626.3} {"step": 30048, "train_loss": 3.164660692214966, "lr": 4.0224209148378514e-05, "tps": 95452, "wall": 20631.1} {"step": 30049, "train_loss": 3.085946559906006, "lr": 4.022325424940403e-05, "tps": 95433, "wall": 20635.9} {"step": 30050, "train_loss": 3.1820905208587646, "lr": 4.022230138695026e-05, "tps": 95413, "wall": 20640.8} {"step": 30051, "train_loss": 3.1639440059661865, "lr": 4.022135056102798e-05, "tps": 95394, "wall": 20645.6} {"step": 30052, "train_loss": 3.2290232181549072, "lr": 4.022040177164798e-05, "tps": 95375, "wall": 20650.5} {"step": 30053, "train_loss": 3.0747528076171875, "lr": 4.0219455018820984e-05, "tps": 95356, "wall": 20655.3} {"step": 30054, "train_loss": 3.1267693042755127, "lr": 4.0218510302557724e-05, "tps": 95337, "wall": 20660.1} {"step": 30055, "train_loss": 3.1674840450286865, "lr": 4.021756762286891e-05, "tps": 95318, "wall": 20665.0} {"step": 30056, "train_loss": 3.127788543701172, "lr": 4.021662697976523e-05, "tps": 95299, "wall": 20669.8} {"step": 30057, "train_loss": 3.196721076965332, "lr": 4.021568837325729e-05, "tps": 95280, "wall": 20674.6} {"step": 30058, "train_loss": 3.2413158416748047, "lr": 4.02147518033558e-05, "tps": 95260, "wall": 20679.5} {"step": 30059, "train_loss": 3.0894875526428223, "lr": 4.0213817270071296e-05, "tps": 95241, "wall": 20684.3} {"step": 30060, "train_loss": 3.129115581512451, "lr": 4.0212884773414405e-05, "tps": 95222, "wall": 20689.1} {"step": 30061, "train_loss": 3.1161437034606934, "lr": 4.0211954313395693e-05, "tps": 95203, "wall": 20694.0} {"step": 30062, "train_loss": 3.0822391510009766, "lr": 4.021102589002567e-05, "tps": 95184, "wall": 20698.8} {"step": 30063, "train_loss": 3.1928465366363525, "lr": 4.021009950331489e-05, "tps": 95165, "wall": 20703.7} {"step": 30064, "train_loss": 3.157193899154663, "lr": 4.020917515327382e-05, "tps": 95146, "wall": 20708.6} {"step": 30065, "train_loss": 3.1802008152008057, "lr": 4.020825283991295e-05, "tps": 95127, "wall": 20713.4} {"step": 30066, "train_loss": 3.264315605163574, "lr": 4.020733256324271e-05, "tps": 95108, "wall": 20718.2} {"step": 30067, "train_loss": 3.1678454875946045, "lr": 4.020641432327352e-05, "tps": 95088, "wall": 20723.1} {"step": 30068, "train_loss": 3.1288247108459473, "lr": 4.020549812001582e-05, "tps": 95070, "wall": 20727.9} {"step": 30069, "train_loss": 3.134719133377075, "lr": 4.020458395347995e-05, "tps": 95051, "wall": 20732.7} {"step": 30070, "train_loss": 3.186948776245117, "lr": 4.020367182367629e-05, "tps": 95032, "wall": 20737.6} {"step": 30071, "train_loss": 3.147183656692505, "lr": 4.0202761730615154e-05, "tps": 95013, "wall": 20742.4} {"step": 30072, "train_loss": 3.0754456520080566, "lr": 4.0201853674306866e-05, "tps": 94994, "wall": 20747.2} {"step": 30073, "train_loss": 3.2397403717041016, "lr": 4.02009476547617e-05, "tps": 94975, "wall": 20752.1} {"step": 30074, "train_loss": 3.129882574081421, "lr": 4.0200043671989915e-05, "tps": 94956, "wall": 20756.9} {"step": 30075, "train_loss": 3.0894529819488525, "lr": 4.019914172600178e-05, "tps": 94936, "wall": 20761.8} {"step": 30076, "train_loss": 3.201622486114502, "lr": 4.01982418168075e-05, "tps": 94917, "wall": 20766.6} {"step": 30077, "train_loss": 3.1232755184173584, "lr": 4.019734394441724e-05, "tps": 94899, "wall": 20771.5} {"step": 30078, "train_loss": 3.142737627029419, "lr": 4.0196448108841225e-05, "tps": 94880, "wall": 20776.3} {"step": 30079, "train_loss": 3.130795478820801, "lr": 4.019555431008955e-05, "tps": 94861, "wall": 20781.2} {"step": 30080, "train_loss": 3.230842351913452, "lr": 4.019466254817236e-05, "tps": 94842, "wall": 20786.0} {"step": 30081, "train_loss": 3.2432425022125244, "lr": 4.0193772823099785e-05, "tps": 94823, "wall": 20790.8} {"step": 30082, "train_loss": 3.112072706222534, "lr": 4.019288513488185e-05, "tps": 94804, "wall": 20795.7} {"step": 30083, "train_loss": 3.116319417953491, "lr": 4.019199948352866e-05, "tps": 94785, "wall": 20800.5} {"step": 30084, "train_loss": 3.1575779914855957, "lr": 4.019111586905021e-05, "tps": 94766, "wall": 20805.3} {"step": 30085, "train_loss": 3.1529626846313477, "lr": 4.019023429145655e-05, "tps": 94747, "wall": 20810.1} {"step": 30086, "train_loss": 3.0719122886657715, "lr": 4.018935475075764e-05, "tps": 94728, "wall": 20815.0} {"step": 30087, "train_loss": 3.116455554962158, "lr": 4.018847724696343e-05, "tps": 94709, "wall": 20819.9} {"step": 30088, "train_loss": 3.0009734630584717, "lr": 4.0187601780083874e-05, "tps": 94691, "wall": 20824.7} {"step": 30089, "train_loss": 3.2196922302246094, "lr": 4.018672835012891e-05, "tps": 94672, "wall": 20829.5} {"step": 30090, "train_loss": 3.1312808990478516, "lr": 4.018585695710841e-05, "tps": 94653, "wall": 20834.3} {"step": 30091, "train_loss": 3.152055263519287, "lr": 4.0184987601032245e-05, "tps": 94634, "wall": 20839.2} {"step": 30092, "train_loss": 3.243317127227783, "lr": 4.0184120281910266e-05, "tps": 94615, "wall": 20844.0} {"step": 30093, "train_loss": 3.173858404159546, "lr": 4.0183254999752316e-05, "tps": 94596, "wall": 20848.9} {"step": 30094, "train_loss": 3.0927839279174805, "lr": 4.018239175456816e-05, "tps": 94578, "wall": 20853.7} {"step": 30095, "train_loss": 3.1406850814819336, "lr": 4.018153054636761e-05, "tps": 94559, "wall": 20858.5} {"step": 30096, "train_loss": 3.194960117340088, "lr": 4.018067137516043e-05, "tps": 94540, "wall": 20863.4} {"step": 30097, "train_loss": 3.1417980194091797, "lr": 4.01798142409563e-05, "tps": 94521, "wall": 20868.2} {"step": 30098, "train_loss": 3.1108407974243164, "lr": 4.017895914376498e-05, "tps": 94503, "wall": 20873.0} {"step": 30099, "train_loss": 3.0661184787750244, "lr": 4.017810608359614e-05, "tps": 94484, "wall": 20877.9} {"step": 30100, "train_loss": 3.1207773685455322, "lr": 4.017725506045944e-05, "tps": 94465, "wall": 20882.8} {"step": 30101, "train_loss": 3.1811275482177734, "lr": 4.017640607436451e-05, "tps": 94446, "wall": 20887.6} {"step": 30102, "train_loss": 3.154247283935547, "lr": 4.0175559125320994e-05, "tps": 94427, "wall": 20892.4} {"step": 30103, "train_loss": 3.1533591747283936, "lr": 4.017471421333845e-05, "tps": 94409, "wall": 20897.3} {"step": 30104, "train_loss": 3.127370595932007, "lr": 4.017387133842651e-05, "tps": 94390, "wall": 20902.1} {"step": 30105, "train_loss": 3.0529026985168457, "lr": 4.017303050059465e-05, "tps": 94371, "wall": 20906.9} {"step": 30106, "train_loss": 3.1989834308624268, "lr": 4.0172191699852445e-05, "tps": 94353, "wall": 20911.8} {"step": 30107, "train_loss": 3.1706109046936035, "lr": 4.017135493620939e-05, "tps": 94334, "wall": 20916.6} {"step": 30108, "train_loss": 3.22749662399292, "lr": 4.0170520209674935e-05, "tps": 94316, "wall": 20921.4} {"step": 30109, "train_loss": 3.051060199737549, "lr": 4.016968752025856e-05, "tps": 94297, "wall": 20926.2} {"step": 30110, "train_loss": 3.1009135246276855, "lr": 4.0168856867969705e-05, "tps": 94278, "wall": 20931.1} {"step": 30111, "train_loss": 3.1249988079071045, "lr": 4.0168028252817755e-05, "tps": 94260, "wall": 20935.9} {"step": 30112, "train_loss": 3.175647735595703, "lr": 4.016720167481213e-05, "tps": 94241, "wall": 20940.8} {"step": 30113, "train_loss": 3.194047451019287, "lr": 4.016637713396215e-05, "tps": 94222, "wall": 20945.6} {"step": 30114, "train_loss": 3.23053240776062, "lr": 4.016555463027719e-05, "tps": 94204, "wall": 20950.4} {"step": 30115, "train_loss": 3.0632758140563965, "lr": 4.016473416376654e-05, "tps": 94185, "wall": 20955.3} {"step": 30116, "train_loss": 3.24967622756958, "lr": 4.0163915734439525e-05, "tps": 94166, "wall": 20960.1} {"step": 30117, "train_loss": 3.140413761138916, "lr": 4.0163099342305413e-05, "tps": 94148, "wall": 20964.9} {"step": 30118, "train_loss": 3.1328485012054443, "lr": 4.016228498737343e-05, "tps": 94129, "wall": 20969.8} {"step": 30119, "train_loss": 3.16302752494812, "lr": 4.01614726696528e-05, "tps": 94111, "wall": 20974.6} {"step": 30120, "train_loss": 3.1744441986083984, "lr": 4.016066238915274e-05, "tps": 94092, "wall": 20979.4} {"step": 30121, "train_loss": 3.225456714630127, "lr": 4.015985414588245e-05, "tps": 94074, "wall": 20984.2} {"step": 30122, "train_loss": 3.142399311065674, "lr": 4.0159047939851036e-05, "tps": 94055, "wall": 20989.1} {"step": 30123, "train_loss": 3.0869498252868652, "lr": 4.0158243771067647e-05, "tps": 94037, "wall": 20993.9} {"step": 30124, "train_loss": 3.1602795124053955, "lr": 4.0157441639541434e-05, "tps": 94018, "wall": 20998.7} {"step": 30125, "train_loss": 3.1670687198638916, "lr": 4.0156641545281424e-05, "tps": 93999, "wall": 21003.6} {"step": 30126, "train_loss": 3.1653847694396973, "lr": 4.015584348829673e-05, "tps": 93981, "wall": 21008.4} {"step": 30127, "train_loss": 3.1696767807006836, "lr": 4.015504746859635e-05, "tps": 93962, "wall": 21013.3} {"step": 30128, "train_loss": 3.2367663383483887, "lr": 4.015425348618933e-05, "tps": 93944, "wall": 21018.1} {"step": 30129, "train_loss": 3.1674559116363525, "lr": 4.015346154108468e-05, "tps": 93925, "wall": 21023.0} {"step": 30130, "train_loss": 3.262587547302246, "lr": 4.0152671633291325e-05, "tps": 93907, "wall": 21027.8} {"step": 30131, "train_loss": 3.2684242725372314, "lr": 4.015188376281822e-05, "tps": 93888, "wall": 21032.6} {"step": 30132, "train_loss": 3.2579610347747803, "lr": 4.015109792967433e-05, "tps": 93870, "wall": 21037.4} {"step": 30133, "train_loss": 3.145629644393921, "lr": 4.015031413386853e-05, "tps": 93852, "wall": 21042.3} {"step": 30134, "train_loss": 3.0691609382629395, "lr": 4.014953237540968e-05, "tps": 93833, "wall": 21047.1} {"step": 30135, "train_loss": 3.1543819904327393, "lr": 4.014875265430667e-05, "tps": 93815, "wall": 21051.9} {"step": 30136, "train_loss": 3.0748753547668457, "lr": 4.014797497056832e-05, "tps": 93796, "wall": 21056.8} {"step": 30137, "train_loss": 3.148362636566162, "lr": 4.014719932420345e-05, "tps": 93778, "wall": 21061.6} {"step": 30138, "train_loss": 3.2136473655700684, "lr": 4.014642571522081e-05, "tps": 93759, "wall": 21066.5} {"step": 30139, "train_loss": 3.1677441596984863, "lr": 4.014565414362922e-05, "tps": 93741, "wall": 21071.3} {"step": 30140, "train_loss": 3.0873160362243652, "lr": 4.014488460943737e-05, "tps": 93723, "wall": 21076.1} {"step": 30141, "train_loss": 3.1941535472869873, "lr": 4.0144117112654e-05, "tps": 93704, "wall": 21080.9} {"step": 30142, "train_loss": 3.206467866897583, "lr": 4.0143351653287806e-05, "tps": 93686, "wall": 21085.8} {"step": 30143, "train_loss": 3.116516590118408, "lr": 4.0142588231347444e-05, "tps": 93667, "wall": 21090.7} {"step": 30144, "train_loss": 3.1182475090026855, "lr": 4.0141826846841586e-05, "tps": 93649, "wall": 21095.5} {"step": 30145, "train_loss": 3.1954755783081055, "lr": 4.014106749977883e-05, "tps": 93631, "wall": 21100.3} {"step": 30146, "train_loss": 3.116161823272705, "lr": 4.0140310190167814e-05, "tps": 93612, "wall": 21105.2} {"step": 30147, "train_loss": 3.2362475395202637, "lr": 4.013955491801708e-05, "tps": 93594, "wall": 21110.0} {"step": 30148, "train_loss": 3.122448682785034, "lr": 4.01388016833352e-05, "tps": 93576, "wall": 21114.8} {"step": 30149, "train_loss": 3.127594470977783, "lr": 4.0138050486130705e-05, "tps": 93557, "wall": 21119.7} {"step": 30150, "train_loss": 3.225316047668457, "lr": 4.0137301326412104e-05, "tps": 93539, "wall": 21124.6} {"step": 30151, "train_loss": 3.2409825325012207, "lr": 4.0136554204187875e-05, "tps": 93520, "wall": 21129.4} {"step": 30152, "train_loss": 3.1805129051208496, "lr": 4.01358091194665e-05, "tps": 93502, "wall": 21134.2} {"step": 30153, "train_loss": 3.281024694442749, "lr": 4.013506607225642e-05, "tps": 93484, "wall": 21139.0} {"step": 30154, "train_loss": 3.1419057846069336, "lr": 4.013432506256602e-05, "tps": 93466, "wall": 21143.9} {"step": 30155, "train_loss": 3.179969549179077, "lr": 4.0133586090403725e-05, "tps": 93448, "wall": 21148.7} {"step": 30156, "train_loss": 3.201848030090332, "lr": 4.01328491557779e-05, "tps": 93429, "wall": 21153.5} {"step": 30157, "train_loss": 3.179365634918213, "lr": 4.013211425869689e-05, "tps": 93411, "wall": 21158.3} {"step": 30158, "train_loss": 3.207425117492676, "lr": 4.0131381399169035e-05, "tps": 93393, "wall": 21163.2} {"step": 30159, "train_loss": 3.2238240242004395, "lr": 4.013065057720259e-05, "tps": 93375, "wall": 21168.0} {"step": 30160, "train_loss": 3.157174825668335, "lr": 4.012992179280587e-05, "tps": 93357, "wall": 21172.8} {"step": 30161, "train_loss": 3.1803197860717773, "lr": 4.012919504598715e-05, "tps": 93338, "wall": 21177.7} {"step": 30162, "train_loss": 3.259054183959961, "lr": 4.012847033675462e-05, "tps": 93320, "wall": 21182.6} {"step": 30163, "train_loss": 3.0641708374023438, "lr": 4.0127747665116536e-05, "tps": 93302, "wall": 21187.4} {"step": 30164, "train_loss": 3.14382266998291, "lr": 4.012702703108103e-05, "tps": 93283, "wall": 21192.2} {"step": 30165, "train_loss": 3.0882325172424316, "lr": 4.012630843465631e-05, "tps": 93265, "wall": 21197.1} {"step": 30166, "train_loss": 3.191225528717041, "lr": 4.0125591875850495e-05, "tps": 93247, "wall": 21201.9} {"step": 30167, "train_loss": 3.1680822372436523, "lr": 4.012487735467169e-05, "tps": 93229, "wall": 21206.7} {"step": 30168, "train_loss": 3.1886682510375977, "lr": 4.0124164871128025e-05, "tps": 93211, "wall": 21211.6} {"step": 30169, "train_loss": 3.193554639816284, "lr": 4.012345442522754e-05, "tps": 93193, "wall": 21216.4} {"step": 30170, "train_loss": 3.19091534614563, "lr": 4.0122746016978295e-05, "tps": 93175, "wall": 21221.2} {"step": 30171, "train_loss": 3.1993460655212402, "lr": 4.012203964638832e-05, "tps": 93156, "wall": 21226.0} {"step": 30172, "train_loss": 3.1797566413879395, "lr": 4.012133531346561e-05, "tps": 93138, "wall": 21230.9} {"step": 30173, "train_loss": 3.15478253364563, "lr": 4.0120633018218154e-05, "tps": 93120, "wall": 21235.7} {"step": 30174, "train_loss": 3.078629970550537, "lr": 4.011993276065388e-05, "tps": 93102, "wall": 21240.6} {"step": 30175, "train_loss": 3.0831456184387207, "lr": 4.0119234540780745e-05, "tps": 93084, "wall": 21245.5} {"step": 30176, "train_loss": 3.1180436611175537, "lr": 4.011853835860665e-05, "tps": 93065, "wall": 21250.3} {"step": 30177, "train_loss": 3.227660894393921, "lr": 4.011784421413951e-05, "tps": 93047, "wall": 21255.1} {"step": 30178, "train_loss": 3.078122854232788, "lr": 4.011715210738713e-05, "tps": 93029, "wall": 21260.0} {"step": 30179, "train_loss": 3.0812034606933594, "lr": 4.0116462038357396e-05, "tps": 93011, "wall": 21264.8} {"step": 30180, "train_loss": 3.104372024536133, "lr": 4.0115774007058104e-05, "tps": 92993, "wall": 21269.7} {"step": 30181, "train_loss": 3.0468950271606445, "lr": 4.011508801349707e-05, "tps": 92975, "wall": 21274.5} {"step": 30182, "train_loss": 3.1197991371154785, "lr": 4.011440405768202e-05, "tps": 92957, "wall": 21279.3} {"step": 30183, "train_loss": 3.229879379272461, "lr": 4.0113722139620766e-05, "tps": 92939, "wall": 21284.2} {"step": 30184, "train_loss": 3.250560998916626, "lr": 4.011304225932099e-05, "tps": 92921, "wall": 21289.0} {"step": 30185, "train_loss": 3.1598191261291504, "lr": 4.01123644167904e-05, "tps": 92903, "wall": 21293.8} {"step": 30186, "train_loss": 3.118623733520508, "lr": 4.0111688612036685e-05, "tps": 92885, "wall": 21298.6} {"step": 30187, "train_loss": 3.201486587524414, "lr": 4.0111014845067466e-05, "tps": 92867, "wall": 21303.5} {"step": 30188, "train_loss": 3.160059928894043, "lr": 4.011034311589042e-05, "tps": 92849, "wall": 21308.3} {"step": 30189, "train_loss": 3.175710678100586, "lr": 4.010967342451315e-05, "tps": 92831, "wall": 21313.1} {"step": 30190, "train_loss": 3.172790050506592, "lr": 4.010900577094322e-05, "tps": 92813, "wall": 21317.9} {"step": 30191, "train_loss": 3.2184927463531494, "lr": 4.0108340155188206e-05, "tps": 92795, "wall": 21322.7} {"step": 30192, "train_loss": 3.143157720565796, "lr": 4.010767657725567e-05, "tps": 92778, "wall": 21327.6} {"step": 30193, "train_loss": 3.0458459854125977, "lr": 4.010701503715307e-05, "tps": 92760, "wall": 21332.4} {"step": 30194, "train_loss": 3.0990946292877197, "lr": 4.010635553488795e-05, "tps": 92742, "wall": 21337.2} {"step": 30195, "train_loss": 3.2541537284851074, "lr": 4.010569807046776e-05, "tps": 92724, "wall": 21342.0} {"step": 30196, "train_loss": 3.0253472328186035, "lr": 4.0105042643899964e-05, "tps": 92706, "wall": 21346.8} {"step": 30197, "train_loss": 3.097208023071289, "lr": 4.0104389255191964e-05, "tps": 92688, "wall": 21351.6} {"step": 30198, "train_loss": 3.2198691368103027, "lr": 4.01037379043512e-05, "tps": 92671, "wall": 21356.4} {"step": 30199, "train_loss": 3.168989896774292, "lr": 4.0103088591385007e-05, "tps": 92653, "wall": 21361.3} {"step": 30200, "train_loss": 3.1962318420410156, "lr": 4.0102441316300754e-05, "tps": 92635, "wall": 21366.1} {"step": 30201, "train_loss": 3.1145291328430176, "lr": 4.010179607910578e-05, "tps": 92617, "wall": 21370.9} {"step": 30202, "train_loss": 3.148709774017334, "lr": 4.01011528798074e-05, "tps": 92599, "wall": 21375.7} {"step": 30203, "train_loss": 3.1705760955810547, "lr": 4.01005117184129e-05, "tps": 92582, "wall": 21380.5} {"step": 30204, "train_loss": 3.0822041034698486, "lr": 4.009987259492953e-05, "tps": 92564, "wall": 21385.3} {"step": 30205, "train_loss": 3.071786642074585, "lr": 4.009923550936452e-05, "tps": 92546, "wall": 21390.1} {"step": 30206, "train_loss": 3.1047487258911133, "lr": 4.009860046172513e-05, "tps": 92528, "wall": 21394.9} {"step": 30207, "train_loss": 3.173720359802246, "lr": 4.00979674520185e-05, "tps": 92511, "wall": 21399.7} {"step": 30208, "train_loss": 3.132584571838379, "lr": 4.009733648025184e-05, "tps": 92493, "wall": 21404.4} {"step": 30209, "train_loss": 3.1356325149536133, "lr": 4.0096707546432275e-05, "tps": 92476, "wall": 21409.2} {"step": 30210, "train_loss": 3.2312822341918945, "lr": 4.009608065056696e-05, "tps": 92458, "wall": 21414.0} {"step": 30211, "train_loss": 3.0719857215881348, "lr": 4.009545579266296e-05, "tps": 92441, "wall": 21418.8} {"step": 30212, "train_loss": 3.1042044162750244, "lr": 4.0094832972727373e-05, "tps": 92423, "wall": 21423.6} {"step": 30213, "train_loss": 3.1870627403259277, "lr": 4.009421219076724e-05, "tps": 92405, "wall": 21428.4} {"step": 30214, "train_loss": 3.1287455558776855, "lr": 4.0093593446789625e-05, "tps": 92388, "wall": 21433.2} {"step": 30215, "train_loss": 3.235978603363037, "lr": 4.009297674080151e-05, "tps": 92370, "wall": 21438.0} {"step": 30216, "train_loss": 3.2235536575317383, "lr": 4.009236207280988e-05, "tps": 92352, "wall": 21442.7} {"step": 30217, "train_loss": 3.113229274749756, "lr": 4.0091749442821705e-05, "tps": 92335, "wall": 21447.5} {"step": 30218, "train_loss": 3.068399667739868, "lr": 4.009113885084392e-05, "tps": 92318, "wall": 21452.3} {"step": 30219, "train_loss": 3.1699435710906982, "lr": 4.009053029688346e-05, "tps": 92300, "wall": 21457.1} {"step": 30220, "train_loss": 3.1911325454711914, "lr": 4.00899237809472e-05, "tps": 92283, "wall": 21461.8} {"step": 30221, "train_loss": 3.1323914527893066, "lr": 4.0089319303042016e-05, "tps": 92265, "wall": 21466.6} {"step": 30222, "train_loss": 3.143779754638672, "lr": 4.0088716863174764e-05, "tps": 92248, "wall": 21471.3} {"step": 30223, "train_loss": 3.2162528038024902, "lr": 4.008811646135224e-05, "tps": 92230, "wall": 21476.1} {"step": 30224, "train_loss": 3.218113660812378, "lr": 4.008751809758129e-05, "tps": 92213, "wall": 21481.0} {"step": 30225, "train_loss": 3.09932541847229, "lr": 4.008692177186866e-05, "tps": 92195, "wall": 21485.7} {"step": 30226, "train_loss": 3.0592217445373535, "lr": 4.0086327484221106e-05, "tps": 92178, "wall": 21490.5} {"step": 30227, "train_loss": 3.150644063949585, "lr": 4.008573523464537e-05, "tps": 92160, "wall": 21495.3} {"step": 30228, "train_loss": 3.1464486122131348, "lr": 4.0085145023148174e-05, "tps": 92143, "wall": 21500.1} {"step": 30229, "train_loss": 3.133415937423706, "lr": 4.008455684973615e-05, "tps": 92125, "wall": 21504.9} {"step": 30230, "train_loss": 3.1964759826660156, "lr": 4.008397071441604e-05, "tps": 92108, "wall": 21509.6} {"step": 30231, "train_loss": 3.150662899017334, "lr": 4.008338661719443e-05, "tps": 92091, "wall": 21514.4} {"step": 30232, "train_loss": 3.2793805599212646, "lr": 4.008280455807794e-05, "tps": 92073, "wall": 21519.2} {"step": 30233, "train_loss": 3.1527469158172607, "lr": 4.008222453707318e-05, "tps": 92056, "wall": 21523.9} {"step": 30234, "train_loss": 3.145174741744995, "lr": 4.008164655418673e-05, "tps": 92039, "wall": 21528.7} {"step": 30235, "train_loss": 3.207339286804199, "lr": 4.0081070609425104e-05, "tps": 92021, "wall": 21533.4} {"step": 30236, "train_loss": 3.1894586086273193, "lr": 4.008049670279484e-05, "tps": 92004, "wall": 21538.2} {"step": 30237, "train_loss": 3.276637077331543, "lr": 4.007992483430244e-05, "tps": 91987, "wall": 21543.0} {"step": 30238, "train_loss": 3.1032755374908447, "lr": 4.0079355003954395e-05, "tps": 91969, "wall": 21547.8} {"step": 30239, "train_loss": 3.166522264480591, "lr": 4.007878721175716e-05, "tps": 91952, "wall": 21552.5} {"step": 30240, "train_loss": 3.139704465866089, "lr": 4.007822145771714e-05, "tps": 91935, "wall": 21557.3} {"step": 30241, "train_loss": 3.2735819816589355, "lr": 4.0077657741840766e-05, "tps": 91917, "wall": 21562.1} {"step": 30242, "train_loss": 3.216341972351074, "lr": 4.007709606413442e-05, "tps": 91900, "wall": 21566.8} {"step": 30243, "train_loss": 3.243122100830078, "lr": 4.0076536424604464e-05, "tps": 91883, "wall": 21571.5} {"step": 30244, "train_loss": 3.1267521381378174, "lr": 4.007597882325722e-05, "tps": 91866, "wall": 21576.3} {"step": 30245, "train_loss": 3.1010401248931885, "lr": 4.0075423260099046e-05, "tps": 91849, "wall": 21581.0} {"step": 30246, "train_loss": 3.1498537063598633, "lr": 4.00748697351362e-05, "tps": 91831, "wall": 21585.8} {"step": 30247, "train_loss": 3.004775047302246, "lr": 4.007431824837496e-05, "tps": 91814, "wall": 21590.5} {"step": 30248, "train_loss": 3.1721041202545166, "lr": 4.007376879982159e-05, "tps": 91797, "wall": 21595.3} {"step": 30249, "train_loss": 3.183987617492676, "lr": 4.007322138948229e-05, "tps": 91780, "wall": 21600.1} {"step": 30250, "train_loss": 3.0799059867858887, "lr": 4.007267601736329e-05, "tps": 91763, "wall": 21604.8} {"step": 30251, "train_loss": 3.1665802001953125, "lr": 4.007213268347073e-05, "tps": 91746, "wall": 21609.5} {"step": 30252, "train_loss": 3.189467430114746, "lr": 4.007159138781079e-05, "tps": 91729, "wall": 21614.3} {"step": 30253, "train_loss": 3.1595683097839355, "lr": 4.0071052130389594e-05, "tps": 91712, "wall": 21619.0} {"step": 30254, "train_loss": 3.092560052871704, "lr": 4.007051491121325e-05, "tps": 91695, "wall": 21623.7} {"step": 30255, "train_loss": 3.0593864917755127, "lr": 4.0069979730287857e-05, "tps": 91678, "wall": 21628.5} {"step": 30256, "train_loss": 3.131345748901367, "lr": 4.006944658761946e-05, "tps": 91661, "wall": 21633.2} {"step": 30257, "train_loss": 3.1539037227630615, "lr": 4.006891548321411e-05, "tps": 91644, "wall": 21637.9} {"step": 30258, "train_loss": 3.189074993133545, "lr": 4.006838641707782e-05, "tps": 91627, "wall": 21642.7} {"step": 30259, "train_loss": 3.108299970626831, "lr": 4.006785938921657e-05, "tps": 91610, "wall": 21647.4} {"step": 30260, "train_loss": 3.1869871616363525, "lr": 4.0067334399636367e-05, "tps": 91593, "wall": 21652.1} {"step": 30261, "train_loss": 3.255258083343506, "lr": 4.0066811448343115e-05, "tps": 91576, "wall": 21656.9} {"step": 30262, "train_loss": 3.2034010887145996, "lr": 4.006629053534276e-05, "tps": 91558, "wall": 21661.6} {"step": 30263, "train_loss": 3.128811836242676, "lr": 4.006577166064122e-05, "tps": 91542, "wall": 21666.3} {"step": 30264, "train_loss": 3.1115856170654297, "lr": 4.006525482424434e-05, "tps": 91525, "wall": 21671.0} {"step": 30265, "train_loss": 3.2443575859069824, "lr": 4.0064740026157975e-05, "tps": 91508, "wall": 21675.8} {"step": 30266, "train_loss": 3.0856223106384277, "lr": 4.0064227266387995e-05, "tps": 91491, "wall": 21680.5} {"step": 30267, "train_loss": 3.1686527729034424, "lr": 4.006371654494016e-05, "tps": 91474, "wall": 21685.2} {"step": 30268, "train_loss": 3.1894736289978027, "lr": 4.006320786182027e-05, "tps": 91457, "wall": 21689.9} {"step": 30269, "train_loss": 3.218560218811035, "lr": 4.006270121703413e-05, "tps": 91440, "wall": 21694.6} {"step": 30270, "train_loss": 3.18472957611084, "lr": 4.006219661058742e-05, "tps": 91423, "wall": 21699.3} {"step": 30271, "train_loss": 3.086408853530884, "lr": 4.0061694042485885e-05, "tps": 91407, "wall": 21704.1} {"step": 30272, "train_loss": 3.074089765548706, "lr": 4.0061193512735216e-05, "tps": 91390, "wall": 21708.8} {"step": 30273, "train_loss": 3.089871406555176, "lr": 4.006069502134108e-05, "tps": 91373, "wall": 21713.5} {"step": 30274, "train_loss": 3.195647716522217, "lr": 4.0060198568309134e-05, "tps": 91356, "wall": 21718.2} {"step": 30275, "train_loss": 3.148874521255493, "lr": 4.005970415364498e-05, "tps": 91339, "wall": 21722.9} {"step": 30276, "train_loss": 3.139911651611328, "lr": 4.005921177735424e-05, "tps": 91322, "wall": 21727.7} {"step": 30277, "train_loss": 3.104051351547241, "lr": 4.005872143944249e-05, "tps": 91306, "wall": 21732.4} {"step": 30278, "train_loss": 3.133303165435791, "lr": 4.005823313991526e-05, "tps": 91289, "wall": 21737.1} {"step": 30279, "train_loss": 3.1859488487243652, "lr": 4.005774687877812e-05, "tps": 91272, "wall": 21741.8} {"step": 30280, "train_loss": 3.0439248085021973, "lr": 4.0057262656036534e-05, "tps": 91256, "wall": 21746.5} {"step": 30281, "train_loss": 3.184612274169922, "lr": 4.0056780471696044e-05, "tps": 91239, "wall": 21751.2} {"step": 30282, "train_loss": 3.148794651031494, "lr": 4.005630032576205e-05, "tps": 91222, "wall": 21755.9} {"step": 30283, "train_loss": 3.155637741088867, "lr": 4.0055822218240035e-05, "tps": 91205, "wall": 21760.6} {"step": 30284, "train_loss": 3.361574172973633, "lr": 4.00553461491354e-05, "tps": 91189, "wall": 21765.3} {"step": 30285, "train_loss": 3.180826187133789, "lr": 4.005487211845354e-05, "tps": 91172, "wall": 21770.0} {"step": 30286, "train_loss": 3.1572132110595703, "lr": 4.005440012619981e-05, "tps": 91155, "wall": 21774.7} {"step": 30287, "train_loss": 3.1090750694274902, "lr": 4.0053930172379595e-05, "tps": 91139, "wall": 21779.4} {"step": 30288, "train_loss": 3.280366897583008, "lr": 4.005346225699817e-05, "tps": 91122, "wall": 21784.1} {"step": 30289, "train_loss": 3.123690128326416, "lr": 4.0052996380060864e-05, "tps": 91105, "wall": 21788.8} {"step": 30290, "train_loss": 3.0338335037231445, "lr": 4.005253254157296e-05, "tps": 91089, "wall": 21793.5} {"step": 30291, "train_loss": 3.033444404602051, "lr": 4.00520707415397e-05, "tps": 91072, "wall": 21798.2} {"step": 30292, "train_loss": 3.0874199867248535, "lr": 4.005161097996632e-05, "tps": 91055, "wall": 21802.9} {"step": 30293, "train_loss": 3.109787940979004, "lr": 4.0051153256858e-05, "tps": 91039, "wall": 21807.6} {"step": 30294, "train_loss": 3.0231082439422607, "lr": 4.005069757221998e-05, "tps": 91022, "wall": 21812.3} {"step": 30295, "train_loss": 3.1417999267578125, "lr": 4.005024392605738e-05, "tps": 91006, "wall": 21817.0} {"step": 30296, "train_loss": 3.276279926300049, "lr": 4.0049792318375353e-05, "tps": 90989, "wall": 21821.6} {"step": 30297, "train_loss": 3.172240972518921, "lr": 4.004934274917902e-05, "tps": 90973, "wall": 21826.3} {"step": 30298, "train_loss": 3.0959386825561523, "lr": 4.004889521847347e-05, "tps": 90956, "wall": 21831.0} {"step": 30299, "train_loss": 3.165832042694092, "lr": 4.004844972626377e-05, "tps": 90940, "wall": 21835.7} {"step": 30300, "train_loss": 3.0663793087005615, "lr": 4.004800627255496e-05, "tps": 90923, "wall": 21840.4} {"step": 30301, "train_loss": 3.1388068199157715, "lr": 4.0047564857352066e-05, "tps": 90907, "wall": 21845.1} {"step": 30302, "train_loss": 3.2398521900177, "lr": 4.0047125480660094e-05, "tps": 90890, "wall": 21849.8} {"step": 30303, "train_loss": 3.061815023422241, "lr": 4.004668814248404e-05, "tps": 90874, "wall": 21854.5} {"step": 30304, "train_loss": 3.1503777503967285, "lr": 4.0046252842828816e-05, "tps": 90857, "wall": 21859.2} {"step": 30305, "train_loss": 3.161783456802368, "lr": 4.004581958169938e-05, "tps": 90841, "wall": 21863.8} {"step": 30306, "train_loss": 3.088371515274048, "lr": 4.0045388359100636e-05, "tps": 90824, "wall": 21868.5} {"step": 30307, "train_loss": 3.1025378704071045, "lr": 4.004495917503747e-05, "tps": 90808, "wall": 21873.2} {"step": 30308, "train_loss": 3.1626861095428467, "lr": 4.0044532029514734e-05, "tps": 90791, "wall": 21877.9} {"step": 30309, "train_loss": 3.160691499710083, "lr": 4.0044106922537276e-05, "tps": 90775, "wall": 21882.5} {"step": 30310, "train_loss": 3.076526165008545, "lr": 4.0043683854109925e-05, "tps": 90758, "wall": 21887.2} {"step": 30311, "train_loss": 3.132781982421875, "lr": 4.004326282423744e-05, "tps": 90742, "wall": 21891.9} {"step": 30312, "train_loss": 3.1919355392456055, "lr": 4.004284383292464e-05, "tps": 90726, "wall": 21896.6} {"step": 30313, "train_loss": 3.1895787715911865, "lr": 4.004242688017621e-05, "tps": 90709, "wall": 21901.3} {"step": 30314, "train_loss": 3.0952377319335938, "lr": 4.004201196599691e-05, "tps": 90693, "wall": 21906.0} {"step": 30315, "train_loss": 3.1839046478271484, "lr": 4.004159909039143e-05, "tps": 90676, "wall": 21910.7} {"step": 30316, "train_loss": 3.1820809841156006, "lr": 4.004118825336447e-05, "tps": 90660, "wall": 21915.3} {"step": 30317, "train_loss": 3.224325180053711, "lr": 4.0040779454920654e-05, "tps": 90644, "wall": 21920.0} {"step": 30318, "train_loss": 3.2165040969848633, "lr": 4.004037269506462e-05, "tps": 90627, "wall": 21924.6} {"step": 30319, "train_loss": 3.0526528358459473, "lr": 4.0039967973800975e-05, "tps": 90611, "wall": 21929.3} {"step": 30320, "train_loss": 2.9650230407714844, "lr": 4.0039565291134324e-05, "tps": 90595, "wall": 21934.0} {"step": 30321, "train_loss": 3.1789000034332275, "lr": 4.00391646470692e-05, "tps": 90578, "wall": 21938.7} {"step": 30322, "train_loss": 3.082324504852295, "lr": 4.003876604161016e-05, "tps": 90562, "wall": 21943.3} {"step": 30323, "train_loss": 3.168388843536377, "lr": 4.00383694747617e-05, "tps": 90546, "wall": 21948.0} {"step": 30324, "train_loss": 3.0795578956604004, "lr": 4.003797494652836e-05, "tps": 90530, "wall": 21952.7} {"step": 30325, "train_loss": 3.2358450889587402, "lr": 4.0037582456914544e-05, "tps": 90514, "wall": 21957.3} {"step": 30326, "train_loss": 3.0679662227630615, "lr": 4.0037192005924746e-05, "tps": 90497, "wall": 21962.0} {"step": 30327, "train_loss": 3.1040258407592773, "lr": 4.0036803593563356e-05, "tps": 90481, "wall": 21966.7} {"step": 30328, "train_loss": 3.077894687652588, "lr": 4.00364172198348e-05, "tps": 90465, "wall": 21971.3} {"step": 30329, "train_loss": 3.154994249343872, "lr": 4.0036032884743445e-05, "tps": 90448, "wall": 21976.0} {"step": 30330, "train_loss": 3.1843972206115723, "lr": 4.003565058829365e-05, "tps": 90432, "wall": 21980.7} {"step": 30331, "train_loss": 3.1356515884399414, "lr": 4.003527033048975e-05, "tps": 90416, "wall": 21985.3} {"step": 30332, "train_loss": 3.164926052093506, "lr": 4.003489211133603e-05, "tps": 90400, "wall": 21990.0} {"step": 30333, "train_loss": 3.0566112995147705, "lr": 4.00345159308368e-05, "tps": 90384, "wall": 21994.6} {"step": 30334, "train_loss": 3.0884337425231934, "lr": 4.003414178899629e-05, "tps": 90368, "wall": 21999.3} {"step": 30335, "train_loss": 3.1952450275421143, "lr": 4.003376968581878e-05, "tps": 90351, "wall": 22004.0} {"step": 30336, "train_loss": 3.072122097015381, "lr": 4.0033399621308444e-05, "tps": 90335, "wall": 22008.6} {"step": 30337, "train_loss": 3.222054958343506, "lr": 4.00330315954695e-05, "tps": 90319, "wall": 22013.3} {"step": 30338, "train_loss": 3.1532833576202393, "lr": 4.003266560830611e-05, "tps": 90303, "wall": 22017.9} {"step": 30339, "train_loss": 3.0231833457946777, "lr": 4.003230165982241e-05, "tps": 90287, "wall": 22022.6} {"step": 30340, "train_loss": 3.211117744445801, "lr": 4.003193975002255e-05, "tps": 90271, "wall": 22027.3} {"step": 30341, "train_loss": 3.124095916748047, "lr": 4.003157987891062e-05, "tps": 90255, "wall": 22031.9} {"step": 30342, "train_loss": 3.1401233673095703, "lr": 4.003122204649066e-05, "tps": 90238, "wall": 22036.6} {"step": 30343, "train_loss": 3.234283924102783, "lr": 4.003086625276678e-05, "tps": 90222, "wall": 22041.2} {"step": 30344, "train_loss": 3.1952624320983887, "lr": 4.003051249774297e-05, "tps": 90206, "wall": 22045.9} {"step": 30345, "train_loss": 3.023287534713745, "lr": 4.003016078142325e-05, "tps": 90190, "wall": 22050.5} {"step": 30346, "train_loss": 3.2098238468170166, "lr": 4.002981110381161e-05, "tps": 90174, "wall": 22055.2} {"step": 30347, "train_loss": 3.06740665435791, "lr": 4.0029463464912e-05, "tps": 90158, "wall": 22059.8} {"step": 30348, "train_loss": 3.139832019805908, "lr": 4.002911786472837e-05, "tps": 90142, "wall": 22064.4} {"step": 30349, "train_loss": 3.115260601043701, "lr": 4.002877430326463e-05, "tps": 90126, "wall": 22069.1} {"step": 30350, "train_loss": 3.1563351154327393, "lr": 4.0028432780524664e-05, "tps": 90110, "wall": 22073.7} {"step": 30351, "train_loss": 3.076002597808838, "lr": 4.0028093296512345e-05, "tps": 90094, "wall": 22078.4} {"step": 30352, "train_loss": 3.0291318893432617, "lr": 4.002775585123153e-05, "tps": 90078, "wall": 22083.1} {"step": 30353, "train_loss": 3.044731855392456, "lr": 4.0027420444686026e-05, "tps": 90062, "wall": 22087.7} {"step": 30354, "train_loss": 3.2073001861572266, "lr": 4.002708707687965e-05, "tps": 90046, "wall": 22092.3} {"step": 30355, "train_loss": 3.1650447845458984, "lr": 4.002675574781616e-05, "tps": 90030, "wall": 22097.0} {"step": 30356, "train_loss": 3.312389850616455, "lr": 4.0026426457499325e-05, "tps": 90014, "wall": 22101.6} {"step": 30357, "train_loss": 3.0528712272644043, "lr": 4.002609920593286e-05, "tps": 89999, "wall": 22106.2} {"step": 30358, "train_loss": 3.2095541954040527, "lr": 4.002577399312049e-05, "tps": 89983, "wall": 22110.9} {"step": 30359, "train_loss": 3.1991682052612305, "lr": 4.0025450819065866e-05, "tps": 89967, "wall": 22115.5} {"step": 30360, "train_loss": 3.053785800933838, "lr": 4.002512968377269e-05, "tps": 89951, "wall": 22120.1} {"step": 30361, "train_loss": 3.085814952850342, "lr": 4.0024810587244565e-05, "tps": 89935, "wall": 22124.8} {"step": 30362, "train_loss": 3.173462390899658, "lr": 4.0024493529485144e-05, "tps": 89919, "wall": 22129.4} {"step": 30363, "train_loss": 3.087653160095215, "lr": 4.0024178510497984e-05, "tps": 89903, "wall": 22134.0} {"step": 30364, "train_loss": 3.1330180168151855, "lr": 4.0023865530286676e-05, "tps": 89888, "wall": 22138.6} {"step": 30365, "train_loss": 3.110410690307617, "lr": 4.002355458885476e-05, "tps": 89872, "wall": 22143.3} {"step": 30366, "train_loss": 3.2184951305389404, "lr": 4.0023245686205734e-05, "tps": 89856, "wall": 22147.9} {"step": 30367, "train_loss": 3.133845329284668, "lr": 4.002293882234311e-05, "tps": 89840, "wall": 22152.5} {"step": 30368, "train_loss": 3.191304922103882, "lr": 4.002263399727041e-05, "tps": 89824, "wall": 22157.1} {"step": 30369, "train_loss": 3.109677791595459, "lr": 4.002233121099102e-05, "tps": 89809, "wall": 22161.7} {"step": 30370, "train_loss": 3.2045202255249023, "lr": 4.00220304635084e-05, "tps": 89793, "wall": 22166.4} {"step": 30371, "train_loss": 3.2051379680633545, "lr": 4.002173175482597e-05, "tps": 89777, "wall": 22171.0} {"step": 30372, "train_loss": 3.141021728515625, "lr": 4.002143508494709e-05, "tps": 89761, "wall": 22175.6} {"step": 30373, "train_loss": 3.145029067993164, "lr": 4.0021140453875135e-05, "tps": 89748, "wall": 22179.7} {"step": 30374, "train_loss": 3.1080803871154785, "lr": 4.002084786161343e-05, "tps": 89733, "wall": 22184.1} {"step": 30375, "train_loss": 3.2311015129089355, "lr": 4.002055730816529e-05, "tps": 89718, "wall": 22188.6} {"step": 30376, "train_loss": 3.1732187271118164, "lr": 4.002026879353403e-05, "tps": 89703, "wall": 22193.1} {"step": 30377, "train_loss": 3.171180248260498, "lr": 4.0019982317722896e-05, "tps": 89687, "wall": 22197.6} {"step": 30378, "train_loss": 3.0896196365356445, "lr": 4.001969788073513e-05, "tps": 89672, "wall": 22202.1} {"step": 30379, "train_loss": 3.1402740478515625, "lr": 4.0019415482573975e-05, "tps": 89656, "wall": 22206.7} {"step": 30380, "train_loss": 3.0169334411621094, "lr": 4.001913512324262e-05, "tps": 89641, "wall": 22211.3} {"step": 30381, "train_loss": 3.1360020637512207, "lr": 4.0018856802744234e-05, "tps": 89625, "wall": 22215.8} {"step": 30382, "train_loss": 3.2533931732177734, "lr": 4.0018580521081986e-05, "tps": 89610, "wall": 22220.4} {"step": 30383, "train_loss": 3.102907657623291, "lr": 4.0018306278258976e-05, "tps": 89594, "wall": 22225.0} {"step": 30384, "train_loss": 3.176624298095703, "lr": 4.001803407427834e-05, "tps": 89579, "wall": 22229.6} {"step": 30385, "train_loss": 3.1118383407592773, "lr": 4.0017763909143136e-05, "tps": 89563, "wall": 22234.2} {"step": 30386, "train_loss": 3.1448330879211426, "lr": 4.001749578285646e-05, "tps": 89547, "wall": 22238.8} {"step": 30387, "train_loss": 3.1560254096984863, "lr": 4.001722969542132e-05, "tps": 89532, "wall": 22243.5} {"step": 30388, "train_loss": 3.146592140197754, "lr": 4.001696564684074e-05, "tps": 89516, "wall": 22248.1} {"step": 30389, "train_loss": 3.128286361694336, "lr": 4.0016703637117706e-05, "tps": 89500, "wall": 22252.7} {"step": 30390, "train_loss": 3.2671380043029785, "lr": 4.001644366625521e-05, "tps": 89485, "wall": 22257.3} {"step": 30391, "train_loss": 3.111649990081787, "lr": 4.0016185734256145e-05, "tps": 89469, "wall": 22262.0} {"step": 30392, "train_loss": 3.1937668323516846, "lr": 4.001592984112348e-05, "tps": 89453, "wall": 22266.6} {"step": 30393, "train_loss": 3.1675047874450684, "lr": 4.001567598686009e-05, "tps": 89438, "wall": 22271.2} {"step": 30394, "train_loss": 3.098848819732666, "lr": 4.001542417146887e-05, "tps": 89422, "wall": 22275.9} {"step": 30395, "train_loss": 3.189934015274048, "lr": 4.001517439495266e-05, "tps": 89406, "wall": 22280.5} {"step": 30396, "train_loss": 3.198599338531494, "lr": 4.00149266573143e-05, "tps": 89391, "wall": 22285.1} {"step": 30397, "train_loss": 3.1664037704467773, "lr": 4.001468095855658e-05, "tps": 89375, "wall": 22289.8} {"step": 30398, "train_loss": 3.26334285736084, "lr": 4.0014437298682285e-05, "tps": 89360, "wall": 22294.4} {"step": 30399, "train_loss": 3.112276315689087, "lr": 4.001419567769418e-05, "tps": 89344, "wall": 22299.0} {"step": 30400, "train_loss": 3.129948616027832, "lr": 4.001395609559502e-05, "tps": 89328, "wall": 22303.7} {"step": 30401, "train_loss": 3.159940242767334, "lr": 4.0013718552387504e-05, "tps": 89313, "wall": 22308.3} {"step": 30402, "train_loss": 3.181335926055908, "lr": 4.001348304807431e-05, "tps": 89297, "wall": 22312.9} {"step": 30403, "train_loss": 3.151623487472534, "lr": 4.001324958265811e-05, "tps": 89282, "wall": 22317.6} {"step": 30404, "train_loss": 3.156548500061035, "lr": 4.001301815614156e-05, "tps": 89266, "wall": 22322.2} {"step": 30405, "train_loss": 3.1862196922302246, "lr": 4.0012788768527275e-05, "tps": 89250, "wall": 22326.9} {"step": 30406, "train_loss": 3.1878743171691895, "lr": 4.001256141981788e-05, "tps": 89235, "wall": 22331.5} {"step": 30407, "train_loss": 3.058105945587158, "lr": 4.00123361100159e-05, "tps": 89219, "wall": 22336.1} {"step": 30408, "train_loss": 3.155367612838745, "lr": 4.0012112839123925e-05, "tps": 89204, "wall": 22340.7} {"step": 30409, "train_loss": 3.101654529571533, "lr": 4.0011891607144466e-05, "tps": 89188, "wall": 22345.4} {"step": 30410, "train_loss": 3.0894534587860107, "lr": 4.001167241408003e-05, "tps": 89172, "wall": 22350.0} {"step": 30411, "train_loss": 3.2096590995788574, "lr": 4.0011455259933126e-05, "tps": 89157, "wall": 22354.6} {"step": 30412, "train_loss": 3.2179160118103027, "lr": 4.001124014470618e-05, "tps": 89141, "wall": 22359.2} {"step": 30413, "train_loss": 3.142209053039551, "lr": 4.001102706840166e-05, "tps": 89126, "wall": 22363.8} {"step": 30414, "train_loss": 3.1366753578186035, "lr": 4.001081603102195e-05, "tps": 89111, "wall": 22368.5} {"step": 30415, "train_loss": 3.1248087882995605, "lr": 4.001060703256944e-05, "tps": 89095, "wall": 22373.1} {"step": 30416, "train_loss": 3.0792486667633057, "lr": 4.001040007304652e-05, "tps": 89081, "wall": 22377.2} {"step": 30417, "train_loss": 3.130218505859375, "lr": 4.001019515245553e-05, "tps": 89067, "wall": 22381.7} {"step": 30418, "train_loss": 3.1701583862304688, "lr": 4.000999227079879e-05, "tps": 89052, "wall": 22386.1} {"step": 30419, "train_loss": 3.16139554977417, "lr": 4.00097914280786e-05, "tps": 89037, "wall": 22390.6} {"step": 30420, "train_loss": 3.1436517238616943, "lr": 4.000959262429722e-05, "tps": 89022, "wall": 22395.1} {"step": 30421, "train_loss": 3.092423677444458, "lr": 4.00093958594569e-05, "tps": 89007, "wall": 22399.6} {"step": 30422, "train_loss": 3.1469268798828125, "lr": 4.000920113355989e-05, "tps": 88992, "wall": 22404.2} {"step": 30423, "train_loss": 3.2571277618408203, "lr": 4.00090084466084e-05, "tps": 88977, "wall": 22408.8} {"step": 30424, "train_loss": 3.203425407409668, "lr": 4.000881779860459e-05, "tps": 88961, "wall": 22413.3} {"step": 30425, "train_loss": 3.1298317909240723, "lr": 4.000862918955062e-05, "tps": 88946, "wall": 22417.9} {"step": 30426, "train_loss": 3.262428045272827, "lr": 4.000844261944865e-05, "tps": 88931, "wall": 22422.5} {"step": 30427, "train_loss": 3.2730579376220703, "lr": 4.0008258088300765e-05, "tps": 88915, "wall": 22427.1} {"step": 30428, "train_loss": 3.2009119987487793, "lr": 4.000807559610909e-05, "tps": 88900, "wall": 22431.7} {"step": 30429, "train_loss": 3.269392967224121, "lr": 4.0007895142875654e-05, "tps": 88885, "wall": 22436.3} {"step": 30430, "train_loss": 3.1611509323120117, "lr": 4.000771672860254e-05, "tps": 88869, "wall": 22441.0} {"step": 30431, "train_loss": 3.121539354324341, "lr": 4.0007540353291725e-05, "tps": 88854, "wall": 22445.6} {"step": 30432, "train_loss": 3.20759916305542, "lr": 4.000736601694524e-05, "tps": 88839, "wall": 22450.2} {"step": 30433, "train_loss": 3.0715322494506836, "lr": 4.000719371956506e-05, "tps": 88823, "wall": 22454.9} {"step": 30434, "train_loss": 3.2178518772125244, "lr": 4.000702346115311e-05, "tps": 88808, "wall": 22459.5} {"step": 30435, "train_loss": 3.16579270362854, "lr": 4.0006855241711336e-05, "tps": 88792, "wall": 22464.1} {"step": 30436, "train_loss": 3.1293997764587402, "lr": 4.000668906124165e-05, "tps": 88777, "wall": 22468.7} {"step": 30437, "train_loss": 3.1259021759033203, "lr": 4.000652491974594e-05, "tps": 88762, "wall": 22473.3} {"step": 30438, "train_loss": 3.0755796432495117, "lr": 4.000636281722603e-05, "tps": 88747, "wall": 22477.9} {"step": 30439, "train_loss": 3.180997371673584, "lr": 4.0006202753683786e-05, "tps": 88731, "wall": 22482.6} {"step": 30440, "train_loss": 3.108870506286621, "lr": 4.000604472912103e-05, "tps": 88716, "wall": 22487.2} {"step": 30441, "train_loss": 3.151409149169922, "lr": 4.0005888743539524e-05, "tps": 88700, "wall": 22491.8} {"step": 30442, "train_loss": 3.072321653366089, "lr": 4.0005734796941054e-05, "tps": 88685, "wall": 22496.4} {"step": 30443, "train_loss": 3.166106700897217, "lr": 4.000558288932734e-05, "tps": 88670, "wall": 22501.1} {"step": 30444, "train_loss": 3.1642062664031982, "lr": 4.0005433020700156e-05, "tps": 88656, "wall": 22505.3} {"step": 30445, "train_loss": 3.180354118347168, "lr": 4.000528519106112e-05, "tps": 88642, "wall": 22509.7} {"step": 30446, "train_loss": 3.2409772872924805, "lr": 4.000513940041199e-05, "tps": 88627, "wall": 22514.2} {"step": 30447, "train_loss": 3.2348074913024902, "lr": 4.000499564875435e-05, "tps": 88612, "wall": 22518.7} {"step": 30448, "train_loss": 3.1803390979766846, "lr": 4.000485393608987e-05, "tps": 88597, "wall": 22523.2} {"step": 30449, "train_loss": 3.1119742393493652, "lr": 4.000471426242014e-05, "tps": 88582, "wall": 22527.7} {"step": 30450, "train_loss": 3.1289191246032715, "lr": 4.000457662774676e-05, "tps": 88567, "wall": 22532.3} {"step": 30451, "train_loss": 3.1709680557250977, "lr": 4.0004441032071254e-05, "tps": 88552, "wall": 22536.9} {"step": 30452, "train_loss": 2.9537854194641113, "lr": 4.000430747539517e-05, "tps": 88537, "wall": 22541.4} {"step": 30453, "train_loss": 3.1271047592163086, "lr": 4.0004175957720045e-05, "tps": 88522, "wall": 22546.0} {"step": 30454, "train_loss": 3.2145888805389404, "lr": 4.000404647904736e-05, "tps": 88507, "wall": 22550.6} {"step": 30455, "train_loss": 3.135934829711914, "lr": 4.0003919039378565e-05, "tps": 88492, "wall": 22555.2} {"step": 30456, "train_loss": 3.113964557647705, "lr": 4.000379363871509e-05, "tps": 88476, "wall": 22559.9} {"step": 30457, "train_loss": 3.0484819412231445, "lr": 4.00036702770584e-05, "tps": 88461, "wall": 22564.5} {"step": 30458, "train_loss": 3.1025495529174805, "lr": 4.000354895440987e-05, "tps": 88446, "wall": 22569.1} {"step": 30459, "train_loss": 3.176226854324341, "lr": 4.000342967077089e-05, "tps": 88431, "wall": 22573.7} {"step": 30460, "train_loss": 3.1919708251953125, "lr": 4.000331242614278e-05, "tps": 88417, "wall": 22578.1} {"step": 30461, "train_loss": 3.127553939819336, "lr": 4.000319722052687e-05, "tps": 88402, "wall": 22582.5} {"step": 30462, "train_loss": 3.220214366912842, "lr": 4.000308405392451e-05, "tps": 88388, "wall": 22587.0} {"step": 30463, "train_loss": 3.183025360107422, "lr": 4.0002972926336935e-05, "tps": 88373, "wall": 22591.4} {"step": 30464, "train_loss": 3.117899179458618, "lr": 4.000286383776541e-05, "tps": 88358, "wall": 22596.0} {"step": 30465, "train_loss": 3.1394882202148438, "lr": 4.0002756788211194e-05, "tps": 88344, "wall": 22600.5} {"step": 30466, "train_loss": 3.115450382232666, "lr": 4.0002651777675486e-05, "tps": 88329, "wall": 22605.1} {"step": 30467, "train_loss": 3.176152229309082, "lr": 4.0002548806159474e-05, "tps": 88314, "wall": 22609.7} {"step": 30468, "train_loss": 3.1478400230407715, "lr": 4.000244787366433e-05, "tps": 88299, "wall": 22614.2} {"step": 30469, "train_loss": 3.1470444202423096, "lr": 4.00023489801912e-05, "tps": 88283, "wall": 22618.9} {"step": 30470, "train_loss": 3.1895625591278076, "lr": 4.000225212574118e-05, "tps": 88268, "wall": 22623.5} {"step": 30471, "train_loss": 3.129870891571045, "lr": 4.0002157310315416e-05, "tps": 88253, "wall": 22628.2} {"step": 30472, "train_loss": 3.212466239929199, "lr": 4.000206453391493e-05, "tps": 88238, "wall": 22632.8} {"step": 30473, "train_loss": 3.2370803356170654, "lr": 4.000197379654079e-05, "tps": 88223, "wall": 22637.4} {"step": 30474, "train_loss": 3.116682767868042, "lr": 4.000188509819402e-05, "tps": 88207, "wall": 22642.1} {"step": 30475, "train_loss": 3.1515092849731445, "lr": 4.000179843887566e-05, "tps": 88192, "wall": 22646.7} {"step": 30476, "train_loss": 3.11446475982666, "lr": 4.000171381858665e-05, "tps": 88177, "wall": 22651.3} {"step": 30477, "train_loss": 3.0125322341918945, "lr": 4.000163123732798e-05, "tps": 88162, "wall": 22656.0} {"step": 30478, "train_loss": 3.0440304279327393, "lr": 4.0001550695100556e-05, "tps": 88147, "wall": 22660.7} {"step": 30479, "train_loss": 3.155843734741211, "lr": 4.000147219190531e-05, "tps": 88131, "wall": 22665.3} {"step": 30480, "train_loss": 3.0866451263427734, "lr": 4.000139572774311e-05, "tps": 88116, "wall": 22669.9} {"step": 30481, "train_loss": 3.1642181873321533, "lr": 4.000132130261485e-05, "tps": 88101, "wall": 22674.6} {"step": 30482, "train_loss": 3.1720614433288574, "lr": 4.0001248916521345e-05, "tps": 88086, "wall": 22679.2} {"step": 30483, "train_loss": 3.1447999477386475, "lr": 4.000117856946345e-05, "tps": 88071, "wall": 22683.9} {"step": 30484, "train_loss": 3.239764451980591, "lr": 4.000111026144193e-05, "tps": 88056, "wall": 22688.5} {"step": 30485, "train_loss": 3.1857519149780273, "lr": 4.0001043992457564e-05, "tps": 88041, "wall": 22693.2} {"step": 30486, "train_loss": 3.2468149662017822, "lr": 4.000097976251113e-05, "tps": 88025, "wall": 22697.8} {"step": 30487, "train_loss": 3.1416354179382324, "lr": 4.0000917571603323e-05, "tps": 88010, "wall": 22702.4} {"step": 30488, "train_loss": 3.257589817047119, "lr": 4.000085741973485e-05, "tps": 87995, "wall": 22707.1} {"step": 30489, "train_loss": 3.1535487174987793, "lr": 4.0000799306906426e-05, "tps": 87981, "wall": 22711.4} {"step": 30490, "train_loss": 3.135324001312256, "lr": 4.0000743233118675e-05, "tps": 87967, "wall": 22715.8} {"step": 30491, "train_loss": 3.125823497772217, "lr": 4.000068919837224e-05, "tps": 87953, "wall": 22720.2} {"step": 30492, "train_loss": 3.193599224090576, "lr": 4.0000637202667736e-05, "tps": 87938, "wall": 22724.7} {"step": 30493, "train_loss": 3.085672378540039, "lr": 4.0000587246005746e-05, "tps": 87924, "wall": 22729.3} {"step": 30494, "train_loss": 2.9890360832214355, "lr": 4.000053932838683e-05, "tps": 87909, "wall": 22733.8} {"step": 30495, "train_loss": 3.078216552734375, "lr": 4.000049344981158e-05, "tps": 87894, "wall": 22738.4} {"step": 30496, "train_loss": 3.2275824546813965, "lr": 4.000044961028045e-05, "tps": 87879, "wall": 22743.0} {"step": 30497, "train_loss": 3.2380409240722656, "lr": 4.000040780979396e-05, "tps": 87864, "wall": 22747.6} {"step": 30498, "train_loss": 3.058859348297119, "lr": 4.00003680483526e-05, "tps": 87850, "wall": 22752.2} {"step": 30499, "train_loss": 3.174373149871826, "lr": 4.000033032595682e-05, "tps": 87835, "wall": 22756.8} {"step": 30500, "train_loss": 3.1788291931152344, "lr": 4.0000294642607015e-05, "tps": 87820, "wall": 22761.4} {"step": 30501, "train_loss": 3.226623773574829, "lr": 4.0000260998303614e-05, "tps": 87804, "wall": 22766.3} {"step": 30502, "train_loss": 3.1527156829833984, "lr": 4.0000229393047e-05, "tps": 87789, "wall": 22770.9} {"step": 30503, "train_loss": 3.2121691703796387, "lr": 4.000019982683752e-05, "tps": 87774, "wall": 22775.6} {"step": 30504, "train_loss": 3.100571870803833, "lr": 4.0000172299675534e-05, "tps": 87759, "wall": 22780.2} {"step": 30505, "train_loss": 3.232628583908081, "lr": 4.000014681156131e-05, "tps": 87744, "wall": 22784.9} {"step": 30506, "train_loss": 3.214550495147705, "lr": 4.000012336249516e-05, "tps": 87729, "wall": 22789.5} {"step": 30507, "train_loss": 3.081352472305298, "lr": 4.000010195247737e-05, "tps": 87714, "wall": 22794.2} {"step": 30508, "train_loss": 3.1702957153320312, "lr": 4.0000082581508157e-05, "tps": 87698, "wall": 22798.9} {"step": 30509, "train_loss": 3.0794405937194824, "lr": 4.000006524958774e-05, "tps": 87683, "wall": 22803.6} {"step": 30510, "train_loss": 3.180427074432373, "lr": 4.0000049956716305e-05, "tps": 87668, "wall": 22808.3} {"step": 30511, "train_loss": 3.1675515174865723, "lr": 4.0000036702894064e-05, "tps": 87653, "wall": 22812.9} {"step": 30512, "train_loss": 3.199305295944214, "lr": 4.000002548812116e-05, "tps": 87638, "wall": 22817.6} {"step": 30513, "train_loss": 3.176884889602661, "lr": 4.000001631239768e-05, "tps": 87623, "wall": 22822.2} {"step": 30514, "train_loss": 3.133312225341797, "lr": 4.000000917572376e-05, "tps": 87608, "wall": 22826.9} {"step": 30515, "train_loss": 3.076563835144043, "lr": 4.000000407809946e-05, "tps": 87593, "wall": 22831.6} {"step": 30516, "train_loss": 3.1102583408355713, "lr": 4.000000101952487e-05, "tps": 87578, "wall": 22836.3}